Wiktionary
siwiktionary
https://si.wiktionary.org/wiki/%E0%B7%80%E0%B7%92%E0%B6%9A%E0%B7%8A%E0%B7%82%E0%B6%B1%E0%B6%BB%E0%B7%92:%E0%B6%B8%E0%B7%94%E0%B6%BD%E0%B7%8A_%E0%B6%B4%E0%B7%92%E0%B6%A7%E0%B7%94%E0%B7%80
MediaWiki 1.47.0-wmf.3
case-sensitive
මාධ්යය
විශේෂ
සාකච්ඡාව
පරිශීලක
පරිශීලක සාකච්ඡාව
වික්ෂනරි
වික්ෂනරි සාකච්ඡාව
ගොනුව
ගොනුව සාකච්ඡාව
මාධ්යවිකි
මාධ්යවිකි සාකච්ඡාව
සැකිල්ල
සැකිලි සාකච්ඡාව
උදවු
උදවු සාකච්ඡාව
ප්රවර්ගය
ප්රවර්ග සාකච්ඡාව
TimedText
TimedText talk
Module
Module talk
Event
Event talk
Module:languages/data/3/z
828
6246
234884
220375
2026-03-03T16:38:42Z
en>Thadh
0
Undid revision [[Special:Diff/89740565|89740565]] by [[Special:Contributions/Thadh|Thadh]] ([[User talk:Thadh|talk]])
234884
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy accessor for `char` from [[Module:string utilities]]: nothing is
-- required until the first call, since the data below may never need it.
local function u(...)
	-- On first use, fetch the real function and rebind the local `u` to it, so
	-- later calls go straight to `char` without passing through this stub.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["zaa"] = {
"Sierra de Juárez Zapotec",
12953989,
"omq-zap",
"Latn",
}
m["zab"] = {
"San Juan Guelavía Zapotec",
5614751,
"omq-zpc",
"Latn",
}
m["zac"] = {
"Ocotlán Zapotec",
7076643,
"omq-zap",
"Latn",
}
m["zad"] = {
"Cajonos Zapotec",
5017997,
"omq-zpc",
"Latn",
}
m["zae"] = {
"Yareni Zapotec",
12645368,
"omq-zap",
"Latn",
}
m["zaf"] = {
"Ayoquesco Zapotec",
4831570,
"omq-zpc",
"Latn",
}
m["zag"] = {
"Zaghawa",
37007,
"ssa-sah",
"Latn", -- also Beria
}
m["zah"] = {
"Zangwal",
3441387,
"cdc-wst",
"Latn",
}
m["zai"] = {
"Isthmus Zapotec",
56728,
"omq-zpc",
"Latn",
}
m["zaj"] = {
"Zaramo",
8066599,
"bnt-ruv",
"Latn",
}
m["zak"] = {
"Zanaki",
8066018,
"bnt-lok",
"Latn",
}
m["zal"] = {
"Zauzou",
3616358,
"tbq-nus",
"Latn, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["zam"] = {
"Central Mahuatlán Zapotec",
13541830,
"omq-zap",
"Latn",
}
m["zao"] = {
"Ozolotepec Zapotec",
7116610,
"omq-zap",
"Latn",
}
m["zap"] = {
"Zapotec",
13214,
"omq-zap",
"Latn",
}
m["zaq"] = {
"Aloápam Zapotec",
4734726,
"omq-zap",
"Latn",
}
m["zar"] = {
"Rincón Zapotec",
7334628,
"omq-zap",
"Latn",
}
m["zas"] = {
"Santo Domingo Albarradas Zapotec",
4709425,
"omq-zap",
"Latn",
}
m["zat"] = {
"Tabaa Zapotec",
7672849,
"omq-zap",
"Latn",
}
m["zau"] = {
"Zangskari",
771203,
"sit-lab",
"Tibt",
ancestors = "lbj",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["zav"] = {
"Yatzachi Zapotec",
8050301,
"omq-zpc",
"Latn",
}
m["zaw"] = {
"Mitla Zapotec",
3053288,
"omq-zpc",
"Latn",
}
m["zax"] = {
"Xadani Zapotec",
8042823,
"omq-zap",
"Latn",
}
m["zay"] = {
"Zayse-Zergulla",
673895,
"omv-eom",
"Latn",
}
m["zaz"] = {
"Zari",
3914398,
"cdc-wst",
"Latn",
}
m["zbt"] = {
"Batui",
16839143,
"poz-slb",
"Latn",
}
m["zca"] = {
"Coatecas Altas Zapotec",
5138603,
"omq-zap",
"Latn",
}
m["zdj"] = {
"Ngazidja Comorian",
3114653,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
-- Zealandic: besides the four positional fields, this entry sets an ancestor
-- code and a pattern-based sort_key.
m["zea"] = {
"Zealandic",
237409,
"gmw-frk",
"Latn",
ancestors = "dum",
sort_key = {
-- The pattern matches a whole term that starts with an apostrophe directly
-- followed by one of the lowercase letters a/e/i/o/u/y; the replacement
-- re-emits the captured remainder with the apostrophe moved to the end.
-- NOTE(review): presumably applied as a gsub-style substitution by the
-- consumer of `from`/`to` -- confirm in the language module.
from = {"^'([aeiouy].*)$"},
to = {"%1'"}
}
}
m["zeg"] = {
"Zenag",
12953345,
"poz-ocw",
"Latn",
}
m["zen"] = {
"Zenaga",
37005,
"ber",
"Latn",
}
m["zga"] = {
"Kinga",
11005332,
"bnt-bki",
"Latn",
}
m["zgh"] = {
"Moroccan Amazigh",
7598268,
"ber",
"Tfng",
translit = "Tfng-translit",
}
m["zgr"] = {
"Magori",
3277370,
"poz-ocw",
"Latn",
}
m["zhb"] = {
"Zhaba",
56334,
"sit-qia",
}
m["zhi"] = {
"Zhire",
3914910,
"nic-plc",
"Latn",
}
m["zhn"] = {
"Nong Zhuang",
7049385,
"tai-cen",
"Latn",
sort_key = {remove_diacritics = "%p"},
}
m["zhw"] = {
"Zhoa",
8070885,
"nic-rnw",
"Latn",
}
m["zia"] = {
"Zia",
3038636,
"ngf-nbi",
"Latn",
}
m["zib"] = {
"Zimbabwe Sign Language",
8072097,
"sgn",
}
m["zik"] = {
"Zimakani",
56740,
"paa-boa",
"Latn",
}
m["zil"] = {
"Zialo",
36991,
"dmn-msw",
"Latn",
}
m["zim"] = {
"Mesme",
56282,
"cdc-mas",
"Latn",
}
m["zin"] = {
"Zinza",
8072460,
"bnt-haj",
"Latn",
}
m["zir"] = {
"Ziriya",
3913943,
"nic-jer",
"Latn",
}
m["ziw"] = {
"Zigula",
37010,
"bnt-seu",
"Latn",
}
m["ziz"] = {
"Zizilivakan",
56300,
"cdc-cbm",
"Latn",
}
m["zka"] = {
"Kaimbulawa",
6348011,
"poz-mun",
"Latn",
}
m["zkb"] = {
"Koibal",
949259,
"syd",
"Latn, Cyrl",
}
m["zkd"] = {
"Kadu (Myanmar)", -- The name is duplicated with Kadu languages in Africa.
54324451,
"sit-luu",
"Latn", -- and also unencoded Kadu script
}
m["zkg"] = {
"Goguryeo",
706327,
"qfa-kor",
"Hani",
sort_key = "Hani-sortkey",
}
m["zkh"] = {
"Khorezmian Turkic",
25502,
"trk-kar",
"Arab",
ancestors = "xqa",
}
m["zkk"] = {
"Karankawa",
3192947,
"qfa-unc", -- extinct Texas coast language; fairly poorly attested, nearby languages poorly attested; maybe an isolate
"Latn",
}
m["zko"] = {
"Kott",
34163,
"qfa-yko",
"Latn, Cyrl",
}
m["zkp"] = {
"São Paulo Kaingáng",
7665661,
"sai-jee",
"Latn",
}
m["zkr"] = {
"Zakhring",
56996,
"sit-mdz",
"Latn, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["zkt"] = {
"Khitan",
1064482,
"qfa-xgx",
"Kitl, Kits, Hani",
translit = {Kits = "zkt-translit"},
sort_key = {Hani = "Hani-sortkey"},
}
m["zku"] = {
"Kaurna",
6378899,
"aus-psw",
"Latn",
}
m["zkv"] = {
"Krevinian",
6436902,
"urj-fin",
"Latn",
ancestors = "vot",
}
m["zkz"] = {
"Khazar",
1067986,
"trk-ogr",
"Orkh",
-- Orkh translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["zma"] = {
"Manda (Australia)",
18650060,
"aus-dal",
"Latn",
}
m["zmb"] = {
"Zimba",
8071960,
"bnt-lgb",
"Latn",
}
m["zmc"] = {
"Margany",
10577017,
"aus-pam",
"Latn",
}
m["zmd"] = {
"Maridan",
10577273,
"aus-dal",
"Latn",
}
-- Mangerr: the third positional slot (which other entries in this module fill
-- with a code string such as "aus-dal") is deliberately left empty.
m["zme"] = {
"Mangerr",
10576387,
nil, -- explicit placeholder so that "Latn" stays in the fourth position
"Latn",
}
m["zmf"] = {
"Mfinu",
35915,
"bnt-tek",
"Latn",
}
m["zmg"] = {
"Marti Ke",
10577823,
"aus-dal",
"Latn",
}
m["zmh"] = {
"Makolkol",
12636052,
"paa-bai",
"Latn",
}
m["zmi"] = {
"Negeri Sembilan Malay",
3915909,
"poz-mly",
"Latn",
}
m["zmj"] = {
"Maridjabin",
10577274,
"aus-dal",
"Latn",
}
m["zmk"] = {
"Mandandanyi",
10576338,
"aus-pam",
"Latn",
}
m["zml"] = {
"Madngele",
10575155,
"aus-dal",
"Latn",
}
m["zmm"] = {
"Marimanindji",
10577424,
"aus-dal",
"Latn",
}
m["zmn"] = {
"Mbangwe",
35928,
"bnt-kel",
"Latn",
}
m["zmo"] = {
"Molo",
15974357,
"sdv-eje",
"Latn",
}
m["zmp"] = {
"Mbuun",
106249400,
"bnt",
"Latn",
}
m["zmq"] = {
"Mituku",
6883590,
"bnt-mbe",
"Latn",
}
m["zmr"] = {
"Maranungku",
6772792,
"aus-dal",
"Latn",
}
m["zms"] = {
"Mbesa",
6799676,
"bnt-ske",
"Latn",
}
m["zmt"] = {
"Maringarr",
10577443,
"aus-dal",
"Latn",
}
m["zmu"] = {
"Muruwari",
3915442,
"aus-pam",
"Latn",
}
m["zmv"] = {
"Mbariman-Gudhinma",
3915672,
"aus-pmn",
"Latn",
}
m["zmw"] = {
"Mbo (Congo)",
6799710,
"bnt-nya",
"Latn",
}
m["zmx"] = {
"Bomitaba",
35063,
"bnt-ngn",
"Latn",
}
m["zmy"] = {
"Mariyedi",
10577501,
"aus-dal",
"Latn",
}
m["zmz"] = {
"Mbandja",
3915310,
"bad",
"Latn",
}
m["zna"] = {
"Zan Gula",
863726,
"alv-bua",
"Latn",
}
m["zne"] = {
"Zande",
35015,
"znd",
"Latn",
}
m["zng"] = {
"Mang",
720192,
"mkh-mng",
"Latn",
}
m["znk"] = {
"Manangkari",
6746906,
"aus-wdj",
"Latn",
}
m["zns"] = {
"Mangas",
3438780,
"cdc-wst",
"Latn",
}
m["zoc"] = {
"Copainalá Zoque",
12954017,
"nai-miz",
"Latn",
}
m["zoh"] = {
"Chimalapa Zoque",
5099289,
"nai-miz",
"Latn",
}
-- Zou: adds a strip_diacritics rule on top of the four positional fields.
m["zom"] = {
"Zou",
37011,
"tbq-kuk",
"Latn",
-- The removal set is the concatenation of five entries of m_langdata.chars.
-- NOTE(review): presumably the combining circumflex, acute, grave, double acute
-- and double grave -- confirm the values in [[Module:languages/data]].
strip_diacritics = {remove_diacritics = c.circ .. c.acute .. c.grave .. c.dacute .. c.dgrave},
}
m["zoo"] = {
"Asunción Mixtepec Zapotec",
4811888,
"omq-zap",
"Latn",
}
m["zoq"] = {
"Tabasco Zoque",
323325,
"nai-miz",
"Latn",
}
m["zor"] = {
"Rayón Zoque",
12954015,
"nai-miz",
"Latn",
}
m["zos"] = {
"Francisco León Zoque",
12954011,
"nai-miz",
"Latn",
}
m["zpa"] = {
"Lachiguiri Zapotec",
6468403,
"omq-zap",
"Latn",
}
m["zpb"] = {
"Yautepec Zapotec",
7413392,
"omq-zap",
"Latn",
}
m["zpc"] = {
"Choapan Zapotec",
5103425,
"omq-zap",
"Latn",
}
m["zpd"] = {
"Southeastern Ixtlán Zapotec",
8050392,
"omq-zap",
"Latn",
}
m["zpe"] = {
"Petapa Zapotec",
7171675,
"omq-zap",
"Latn",
}
m["zpf"] = {
"San Pedro Quiatoni Zapotec",
7271640,
"omq-zpc",
"Latn",
}
m["zpg"] = {
"Guevea de Humboldt Zapotec",
13459953,
"omq-zap",
"Latn",
}
m["zph"] = {
"Totomachapan Zapotec",
7828390,
"omq-zap",
"Latn",
}
m["zpi"] = {
"Santa María Quiegolani Zapotec",
7271823,
"omq-zpc",
"Latn",
}
m["zpj"] = {
"Quiavicuzas Zapotec",
7271642,
"omq-zap",
"Latn",
}
m["zpk"] = {
"Tlacolulita Zapotec",
7810685,
"omq-zpc",
"Latn",
}
m["zpl"] = {
"Lachixío Zapotec",
6468420,
"omq-zap",
"Latn",
}
m["zpm"] = {
"Mixtepec Zapotec",
7414598,
"omq-zpc",
"Latn",
}
m["zpn"] = {
"Santa Inés Yatzechi Zapotec",
8050300,
"omq-zap",
"Latn",
}
m["zpo"] = {
"Amatlán Zapotec",
4740613,
"omq-zpc",
"Latn",
}
m["zpp"] = {
"El Alto Zapotec",
5350733,
"omq-zap",
"Latn",
}
m["zpq"] = {
"Zoogocho Zapotec",
8074100,
"omq-zpc",
"Latn",
}
m["zpr"] = {
"Santiago Xanica Zapotec",
8042924,
"omq-zap",
"Latn",
}
m["zps"] = {
"Coatlán Zapotec",
7420514,
"omq-zap",
"Latn",
}
m["zpt"] = {
"San Vicente Coatlán Zapotec",
13541831,
"omq-zap",
"Latn",
}
m["zpu"] = {
"Yalálag Zapotec",
8047534,
"omq-zpc",
"Latn",
}
m["zpv"] = {
"Chichicapan Zapotec",
5096050,
"omq-zap",
"Latn",
}
m["zpw"] = {
"Zaniza Zapotec",
8066220,
"omq-zpc",
"Latn",
}
m["zpx"] = {
"San Baltazar Loxicha Zapotec",
7413390,
"omq-zap",
"Latn",
}
m["zpy"] = {
"Mazaltepec Zapotec",
6798223,
"omq-zap",
"Latn",
}
m["zpz"] = {
"Texmelucan Zapotec",
7708357,
"omq-zpc",
"Latn",
}
m["zra"] = {
"Gaya",
5528695,
"qfa-kor",
"Hani",
sort_key = "Hani-sortkey",
}
m["zrg"] = {
"Mirgan",
6873206,
"inc-eas",
}
m["zrn"] = {
"Zirenkel",
3441365,
"cdc-est",
"Latn",
}
m["zro"] = {
"Záparo",
10206,
"sai-zap",
"Latn",
}
m["zrs"] = {
"Mairasi",
3038645,
"paa-mai",
"Latn",
}
m["zsa"] = {
"Sarasira",
57333197,
"poz-ocw",
}
m["zsk"] = { -- attested?
"Kaskean",
6374586,
}
m["zsl"] = {
"Zambian Sign Language",
8065713,
"sgn",
}
m["zsr"] = {
"Southern Rincon Zapotec",
12954000,
"omq-zpc",
"Latn",
}
m["zsu"] = {
"Sukurum",
57333741,
"poz-ocw",
}
m["zte"] = {
"Elotepec Zapotec",
5367223,
"omq-zap",
"Latn",
}
m["ztg"] = {
"Xanaguía Zapotec",
8042887,
"omq-zpc",
"Latn",
}
m["ztl"] = {
"Lapaguía-Guivini Zapotec",
6488084,
"omq-zap",
"Latn",
}
m["ztm"] = {
"San Agustín Mixtepec Zapotec",
7413220,
"omq-zap",
"Latn",
}
m["ztn"] = {
"Santa Catarina Albarradas Zapotec",
7419277,
"omq-zap",
"Latn",
}
m["ztp"] = {
"Loxicha Zapotec",
6694268,
"omq-zap",
"Latn",
}
m["ztq"] = {
"Quioquitani-Quierí Zapotec",
3574818,
"omq-zpc",
"Latn",
}
m["zts"] = {
"Tilquiapan Zapotec",
7802959,
"omq-zpc",
"Latn",
}
m["ztt"] = {
"Tejalapan Zapotec",
13510225,
"omq-zap",
"Latn",
}
m["ztu"] = {
"San Pablo Güilá Zapotec",
5626813,
"omq-zap",
"Latn",
}
m["ztx"] = {
"Zaachila Zapotec",
8063390,
"omq-zap",
"Latn",
}
m["zty"] = {
"Yatee Zapotec",
3574815,
"omq-zpc",
"Latn",
}
m["zua"] = {
"Zeem",
3450131,
"cdc-wst",
"Latn",
}
m["zuh"] = {
"Tokano",
7813481,
"ngf-gah",
"Latn",
}
m["zum"] = {
"Kumzari",
36158,
"ira-swi",
"Arab",
ancestors = "pal",
}
m["zun"] = {
"Zuni",
10188,
"qfa-iso",
"Latn",
}
m["zuy"] = {
"Zumaya",
56626,
"cdc-mas",
"Latn",
}
m["zwa"] = {
"Zay",
10195,
"sem-eth",
"Ethi",
}
m["zyp"] = {
"Zyphe",
57004,
"tbq-kuk",
"Latn",
}
m["zza"] = {
"Zazaki",
10199,
"ira-zgr",
"Latn",
dotted_dotless_i = true,
sort_key = "zza-sortkey",
wikimedia_codes = "diq",
}
m["zzj"] = {
"Zuojiang Zhuang",
13848149,
"tai-cen",
"Latn",
sort_key = {remove_diacritics = "%p"},
}
return require("Module:languages").finalizeData(m, "language")
iprbne0zsebhn4gs15vhe8q01btiaj3
234885
234884
2026-05-24T09:45:10Z
Lee
19
[[:en:Module:languages/data/3/z]] වෙතින් එක් සංශෝධනයක්
234884
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy accessor for `char` from [[Module:string utilities]]: nothing is
-- required until the first call, since the data below may never need it.
local function u(...)
	-- On first use, fetch the real function and rebind the local `u` to it, so
	-- later calls go straight to `char` without passing through this stub.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["zaa"] = {
"Sierra de Juárez Zapotec",
12953989,
"omq-zap",
"Latn",
}
m["zab"] = {
"San Juan Guelavía Zapotec",
5614751,
"omq-zpc",
"Latn",
}
m["zac"] = {
"Ocotlán Zapotec",
7076643,
"omq-zap",
"Latn",
}
m["zad"] = {
"Cajonos Zapotec",
5017997,
"omq-zpc",
"Latn",
}
m["zae"] = {
"Yareni Zapotec",
12645368,
"omq-zap",
"Latn",
}
m["zaf"] = {
"Ayoquesco Zapotec",
4831570,
"omq-zpc",
"Latn",
}
m["zag"] = {
"Zaghawa",
37007,
"ssa-sah",
"Latn", -- also Beria
}
m["zah"] = {
"Zangwal",
3441387,
"cdc-wst",
"Latn",
}
m["zai"] = {
"Isthmus Zapotec",
56728,
"omq-zpc",
"Latn",
}
m["zaj"] = {
"Zaramo",
8066599,
"bnt-ruv",
"Latn",
}
m["zak"] = {
"Zanaki",
8066018,
"bnt-lok",
"Latn",
}
m["zal"] = {
"Zauzou",
3616358,
"tbq-nus",
"Latn, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["zam"] = {
"Central Mahuatlán Zapotec",
13541830,
"omq-zap",
"Latn",
}
m["zao"] = {
"Ozolotepec Zapotec",
7116610,
"omq-zap",
"Latn",
}
m["zap"] = {
"Zapotec",
13214,
"omq-zap",
"Latn",
}
m["zaq"] = {
"Aloápam Zapotec",
4734726,
"omq-zap",
"Latn",
}
m["zar"] = {
"Rincón Zapotec",
7334628,
"omq-zap",
"Latn",
}
m["zas"] = {
"Santo Domingo Albarradas Zapotec",
4709425,
"omq-zap",
"Latn",
}
m["zat"] = {
"Tabaa Zapotec",
7672849,
"omq-zap",
"Latn",
}
m["zau"] = {
"Zangskari",
771203,
"sit-lab",
"Tibt",
ancestors = "lbj",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["zav"] = {
"Yatzachi Zapotec",
8050301,
"omq-zpc",
"Latn",
}
m["zaw"] = {
"Mitla Zapotec",
3053288,
"omq-zpc",
"Latn",
}
m["zax"] = {
"Xadani Zapotec",
8042823,
"omq-zap",
"Latn",
}
m["zay"] = {
"Zayse-Zergulla",
673895,
"omv-eom",
"Latn",
}
m["zaz"] = {
"Zari",
3914398,
"cdc-wst",
"Latn",
}
m["zbt"] = {
"Batui",
16839143,
"poz-slb",
"Latn",
}
m["zca"] = {
"Coatecas Altas Zapotec",
5138603,
"omq-zap",
"Latn",
}
m["zdj"] = {
"Ngazidja Comorian",
3114653,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
-- Zealandic: besides the four positional fields, this entry sets an ancestor
-- code and a pattern-based sort_key.
m["zea"] = {
"Zealandic",
237409,
"gmw-frk",
"Latn",
ancestors = "dum",
sort_key = {
-- The pattern matches a whole term that starts with an apostrophe directly
-- followed by one of the lowercase letters a/e/i/o/u/y; the replacement
-- re-emits the captured remainder with the apostrophe moved to the end.
-- NOTE(review): presumably applied as a gsub-style substitution by the
-- consumer of `from`/`to` -- confirm in the language module.
from = {"^'([aeiouy].*)$"},
to = {"%1'"}
}
}
m["zeg"] = {
"Zenag",
12953345,
"poz-ocw",
"Latn",
}
m["zen"] = {
"Zenaga",
37005,
"ber",
"Latn",
}
m["zga"] = {
"Kinga",
11005332,
"bnt-bki",
"Latn",
}
m["zgh"] = {
"Moroccan Amazigh",
7598268,
"ber",
"Tfng",
translit = "Tfng-translit",
}
m["zgr"] = {
"Magori",
3277370,
"poz-ocw",
"Latn",
}
m["zhb"] = {
"Zhaba",
56334,
"sit-qia",
}
m["zhi"] = {
"Zhire",
3914910,
"nic-plc",
"Latn",
}
m["zhn"] = {
"Nong Zhuang",
7049385,
"tai-cen",
"Latn",
sort_key = {remove_diacritics = "%p"},
}
m["zhw"] = {
"Zhoa",
8070885,
"nic-rnw",
"Latn",
}
m["zia"] = {
"Zia",
3038636,
"ngf-nbi",
"Latn",
}
m["zib"] = {
"Zimbabwe Sign Language",
8072097,
"sgn",
}
m["zik"] = {
"Zimakani",
56740,
"paa-boa",
"Latn",
}
m["zil"] = {
"Zialo",
36991,
"dmn-msw",
"Latn",
}
m["zim"] = {
"Mesme",
56282,
"cdc-mas",
"Latn",
}
m["zin"] = {
"Zinza",
8072460,
"bnt-haj",
"Latn",
}
m["zir"] = {
"Ziriya",
3913943,
"nic-jer",
"Latn",
}
m["ziw"] = {
"Zigula",
37010,
"bnt-seu",
"Latn",
}
m["ziz"] = {
"Zizilivakan",
56300,
"cdc-cbm",
"Latn",
}
m["zka"] = {
"Kaimbulawa",
6348011,
"poz-mun",
"Latn",
}
m["zkb"] = {
"Koibal",
949259,
"syd",
"Latn, Cyrl",
}
m["zkd"] = {
"Kadu (Myanmar)", -- The name is duplicated with Kadu languages in Africa.
54324451,
"sit-luu",
"Latn", -- and also unencoded Kadu script
}
m["zkg"] = {
"Goguryeo",
706327,
"qfa-kor",
"Hani",
sort_key = "Hani-sortkey",
}
m["zkh"] = {
"Khorezmian Turkic",
25502,
"trk-kar",
"Arab",
ancestors = "xqa",
}
m["zkk"] = {
"Karankawa",
3192947,
"qfa-unc", -- extinct Texas coast language; fairly poorly attested, nearby languages poorly attested; maybe an isolate
"Latn",
}
m["zko"] = {
"Kott",
34163,
"qfa-yko",
"Latn, Cyrl",
}
m["zkp"] = {
"São Paulo Kaingáng",
7665661,
"sai-jee",
"Latn",
}
m["zkr"] = {
"Zakhring",
56996,
"sit-mdz",
"Latn, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["zkt"] = {
"Khitan",
1064482,
"qfa-xgx",
"Kitl, Kits, Hani",
translit = {Kits = "zkt-translit"},
sort_key = {Hani = "Hani-sortkey"},
}
m["zku"] = {
"Kaurna",
6378899,
"aus-psw",
"Latn",
}
m["zkv"] = {
"Krevinian",
6436902,
"urj-fin",
"Latn",
ancestors = "vot",
}
m["zkz"] = {
"Khazar",
1067986,
"trk-ogr",
"Orkh",
-- Orkh translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["zma"] = {
"Manda (Australia)",
18650060,
"aus-dal",
"Latn",
}
m["zmb"] = {
"Zimba",
8071960,
"bnt-lgb",
"Latn",
}
m["zmc"] = {
"Margany",
10577017,
"aus-pam",
"Latn",
}
m["zmd"] = {
"Maridan",
10577273,
"aus-dal",
"Latn",
}
-- Mangerr: the third positional slot (which other entries in this module fill
-- with a code string such as "aus-dal") is deliberately left empty.
m["zme"] = {
"Mangerr",
10576387,
nil, -- explicit placeholder so that "Latn" stays in the fourth position
"Latn",
}
m["zmf"] = {
"Mfinu",
35915,
"bnt-tek",
"Latn",
}
m["zmg"] = {
"Marti Ke",
10577823,
"aus-dal",
"Latn",
}
m["zmh"] = {
"Makolkol",
12636052,
"paa-bai",
"Latn",
}
m["zmi"] = {
"Negeri Sembilan Malay",
3915909,
"poz-mly",
"Latn",
}
m["zmj"] = {
"Maridjabin",
10577274,
"aus-dal",
"Latn",
}
m["zmk"] = {
"Mandandanyi",
10576338,
"aus-pam",
"Latn",
}
m["zml"] = {
"Madngele",
10575155,
"aus-dal",
"Latn",
}
m["zmm"] = {
"Marimanindji",
10577424,
"aus-dal",
"Latn",
}
m["zmn"] = {
"Mbangwe",
35928,
"bnt-kel",
"Latn",
}
m["zmo"] = {
"Molo",
15974357,
"sdv-eje",
"Latn",
}
m["zmp"] = {
"Mbuun",
106249400,
"bnt",
"Latn",
}
m["zmq"] = {
"Mituku",
6883590,
"bnt-mbe",
"Latn",
}
m["zmr"] = {
"Maranungku",
6772792,
"aus-dal",
"Latn",
}
m["zms"] = {
"Mbesa",
6799676,
"bnt-ske",
"Latn",
}
m["zmt"] = {
"Maringarr",
10577443,
"aus-dal",
"Latn",
}
m["zmu"] = {
"Muruwari",
3915442,
"aus-pam",
"Latn",
}
m["zmv"] = {
"Mbariman-Gudhinma",
3915672,
"aus-pmn",
"Latn",
}
m["zmw"] = {
"Mbo (Congo)",
6799710,
"bnt-nya",
"Latn",
}
m["zmx"] = {
"Bomitaba",
35063,
"bnt-ngn",
"Latn",
}
m["zmy"] = {
"Mariyedi",
10577501,
"aus-dal",
"Latn",
}
m["zmz"] = {
"Mbandja",
3915310,
"bad",
"Latn",
}
m["zna"] = {
"Zan Gula",
863726,
"alv-bua",
"Latn",
}
m["zne"] = {
"Zande",
35015,
"znd",
"Latn",
}
m["zng"] = {
"Mang",
720192,
"mkh-mng",
"Latn",
}
m["znk"] = {
"Manangkari",
6746906,
"aus-wdj",
"Latn",
}
m["zns"] = {
"Mangas",
3438780,
"cdc-wst",
"Latn",
}
m["zoc"] = {
"Copainalá Zoque",
12954017,
"nai-miz",
"Latn",
}
m["zoh"] = {
"Chimalapa Zoque",
5099289,
"nai-miz",
"Latn",
}
-- Zou: adds a strip_diacritics rule on top of the four positional fields.
m["zom"] = {
"Zou",
37011,
"tbq-kuk",
"Latn",
-- The removal set is the concatenation of five entries of m_langdata.chars.
-- NOTE(review): presumably the combining circumflex, acute, grave, double acute
-- and double grave -- confirm the values in [[Module:languages/data]].
strip_diacritics = {remove_diacritics = c.circ .. c.acute .. c.grave .. c.dacute .. c.dgrave},
}
m["zoo"] = {
"Asunción Mixtepec Zapotec",
4811888,
"omq-zap",
"Latn",
}
m["zoq"] = {
"Tabasco Zoque",
323325,
"nai-miz",
"Latn",
}
m["zor"] = {
"Rayón Zoque",
12954015,
"nai-miz",
"Latn",
}
m["zos"] = {
"Francisco León Zoque",
12954011,
"nai-miz",
"Latn",
}
m["zpa"] = {
"Lachiguiri Zapotec",
6468403,
"omq-zap",
"Latn",
}
m["zpb"] = {
"Yautepec Zapotec",
7413392,
"omq-zap",
"Latn",
}
m["zpc"] = {
"Choapan Zapotec",
5103425,
"omq-zap",
"Latn",
}
m["zpd"] = {
"Southeastern Ixtlán Zapotec",
8050392,
"omq-zap",
"Latn",
}
m["zpe"] = {
"Petapa Zapotec",
7171675,
"omq-zap",
"Latn",
}
m["zpf"] = {
"San Pedro Quiatoni Zapotec",
7271640,
"omq-zpc",
"Latn",
}
m["zpg"] = {
"Guevea de Humboldt Zapotec",
13459953,
"omq-zap",
"Latn",
}
m["zph"] = {
"Totomachapan Zapotec",
7828390,
"omq-zap",
"Latn",
}
m["zpi"] = {
"Santa María Quiegolani Zapotec",
7271823,
"omq-zpc",
"Latn",
}
m["zpj"] = {
"Quiavicuzas Zapotec",
7271642,
"omq-zap",
"Latn",
}
m["zpk"] = {
"Tlacolulita Zapotec",
7810685,
"omq-zpc",
"Latn",
}
m["zpl"] = {
"Lachixío Zapotec",
6468420,
"omq-zap",
"Latn",
}
m["zpm"] = {
"Mixtepec Zapotec",
7414598,
"omq-zpc",
"Latn",
}
m["zpn"] = {
"Santa Inés Yatzechi Zapotec",
8050300,
"omq-zap",
"Latn",
}
m["zpo"] = {
"Amatlán Zapotec",
4740613,
"omq-zpc",
"Latn",
}
m["zpp"] = {
"El Alto Zapotec",
5350733,
"omq-zap",
"Latn",
}
m["zpq"] = {
"Zoogocho Zapotec",
8074100,
"omq-zpc",
"Latn",
}
m["zpr"] = {
"Santiago Xanica Zapotec",
8042924,
"omq-zap",
"Latn",
}
m["zps"] = {
"Coatlán Zapotec",
7420514,
"omq-zap",
"Latn",
}
m["zpt"] = {
"San Vicente Coatlán Zapotec",
13541831,
"omq-zap",
"Latn",
}
m["zpu"] = {
"Yalálag Zapotec",
8047534,
"omq-zpc",
"Latn",
}
m["zpv"] = {
"Chichicapan Zapotec",
5096050,
"omq-zap",
"Latn",
}
m["zpw"] = {
"Zaniza Zapotec",
8066220,
"omq-zpc",
"Latn",
}
m["zpx"] = {
"San Baltazar Loxicha Zapotec",
7413390,
"omq-zap",
"Latn",
}
m["zpy"] = {
"Mazaltepec Zapotec",
6798223,
"omq-zap",
"Latn",
}
m["zpz"] = {
"Texmelucan Zapotec",
7708357,
"omq-zpc",
"Latn",
}
m["zra"] = {
"Gaya",
5528695,
"qfa-kor",
"Hani",
sort_key = "Hani-sortkey",
}
m["zrg"] = {
"Mirgan",
6873206,
"inc-eas",
}
m["zrn"] = {
"Zirenkel",
3441365,
"cdc-est",
"Latn",
}
m["zro"] = {
"Záparo",
10206,
"sai-zap",
"Latn",
}
m["zrs"] = {
"Mairasi",
3038645,
"paa-mai",
"Latn",
}
m["zsa"] = {
"Sarasira",
57333197,
"poz-ocw",
}
m["zsk"] = { -- attested?
"Kaskean",
6374586,
}
m["zsl"] = {
"Zambian Sign Language",
8065713,
"sgn",
}
m["zsr"] = {
"Southern Rincon Zapotec",
12954000,
"omq-zpc",
"Latn",
}
m["zsu"] = {
"Sukurum",
57333741,
"poz-ocw",
}
m["zte"] = {
"Elotepec Zapotec",
5367223,
"omq-zap",
"Latn",
}
m["ztg"] = {
"Xanaguía Zapotec",
8042887,
"omq-zpc",
"Latn",
}
m["ztl"] = {
"Lapaguía-Guivini Zapotec",
6488084,
"omq-zap",
"Latn",
}
m["ztm"] = {
"San Agustín Mixtepec Zapotec",
7413220,
"omq-zap",
"Latn",
}
m["ztn"] = {
"Santa Catarina Albarradas Zapotec",
7419277,
"omq-zap",
"Latn",
}
m["ztp"] = {
"Loxicha Zapotec",
6694268,
"omq-zap",
"Latn",
}
m["ztq"] = {
"Quioquitani-Quierí Zapotec",
3574818,
"omq-zpc",
"Latn",
}
m["zts"] = {
"Tilquiapan Zapotec",
7802959,
"omq-zpc",
"Latn",
}
m["ztt"] = {
"Tejalapan Zapotec",
13510225,
"omq-zap",
"Latn",
}
m["ztu"] = {
"San Pablo Güilá Zapotec",
5626813,
"omq-zap",
"Latn",
}
m["ztx"] = {
"Zaachila Zapotec",
8063390,
"omq-zap",
"Latn",
}
m["zty"] = {
"Yatee Zapotec",
3574815,
"omq-zpc",
"Latn",
}
m["zua"] = {
"Zeem",
3450131,
"cdc-wst",
"Latn",
}
m["zuh"] = {
"Tokano",
7813481,
"ngf-gah",
"Latn",
}
m["zum"] = {
"Kumzari",
36158,
"ira-swi",
"Arab",
ancestors = "pal",
}
m["zun"] = {
"Zuni",
10188,
"qfa-iso",
"Latn",
}
m["zuy"] = {
"Zumaya",
56626,
"cdc-mas",
"Latn",
}
m["zwa"] = {
"Zay",
10195,
"sem-eth",
"Ethi",
}
m["zyp"] = {
"Zyphe",
57004,
"tbq-kuk",
"Latn",
}
m["zza"] = {
"Zazaki",
10199,
"ira-zgr",
"Latn",
dotted_dotless_i = true,
sort_key = "zza-sortkey",
wikimedia_codes = "diq",
}
m["zzj"] = {
"Zuojiang Zhuang",
13848149,
"tai-cen",
"Latn",
sort_key = {remove_diacritics = "%p"},
}
return require("Module:languages").finalizeData(m, "language")
iprbne0zsebhn4gs15vhe8q01btiaj3
Module:languages/data/3/w
828
6254
234882
220382
2026-02-03T03:32:53Z
en>WingerBot
0
various renamess per [[Wiktionary:Language_treatment_requests#the_many_Mari_languages]], [[Wiktionary:Language_treatment_requests#Baïnounk_Gubëeher:_one_of_these_things_is_not_like_the_others]] and [[Wiktionary:Language_treatment_requests#Lots_of_name_changes]] (manually assisted)
234882
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy accessor for `char` from [[Module:string utilities]]: nothing is
-- required until the first call, since the data below may never need it.
local function u(...)
	-- On first use, fetch the real function and rebind the local `u` to it, so
	-- later calls go straight to `char` without passing through this stub.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["waa"] = {
"Walla Walla",
12953960,
"nai-shp",
"Latn",
ancestors = "nai-spt",
}
m["wab"] = {
"Wab",
11222271,
"poz-ocw",
"Latn",
}
m["wac"] = {
"Wasco-Wishram",
12645081,
"nai-ckn",
"Latn",
}
m["wad"] = {
"Wandamen",
2806128,
"poz-hce",
"Latn",
}
m["waf"] = {
"Wakoná",
7961205,
}
m["wag"] = {
"Wa'ema",
12953264,
"poz-ocw",
"Latn",
}
m["wah"] = {
"Watubela",
7975070,
"poz-cma",
"Latn",
}
m["waj"] = {
"Waffa",
3565058,
"ngf-tai",
"Latn",
}
m["wal"] = {
"Wolaytta",
36943,
"omv-nom",
"Latn, Ethi",
}
m["wam"] = {
"Massachusett",
56519,
"alg-eas",
"Latn",
}
m["wan"] = {
"Wan",
3913272,
"dmn-nbe",
}
m["wao"] = {
"Wappo",
56530,
"nai-ykn",
"Latn",
}
m["wap"] = {
"Wapishana",
3450493,
"awd",
"Latn",
}
m["waq"] = {
"Wageman",
3436843,
"aus-gun",
"Latn",
}
-- Waray-Waray: carries per-script settings (all keyed by "Latn") in addition
-- to the four positional fields.
m["war"] = {
"Waray-Waray",
34279,
"phi",
"Latn",
-- For Latn, the removal set is c.grave, c.acute and c.circ (from
-- m_langdata.chars) concatenated together.
strip_diacritics = {Latn = {remove_diacritics = c.grave .. c.acute .. c.circ}},
standard_chars = {
Latn = "AaBbKkDdEeGgHhIiLlMmNnOoPpRrSsTtUuWwYy",
-- Unkeyed, so this value is stored at index 1 next to the Latn string.
-- NOTE(review): presumably characters accepted regardless of script -- confirm
-- against the consumer of standard_chars.
c.punc
},
sort_key = {
Latn = "tl-sortkey",
},
}
m["was"] = {
"Washo",
34198,
"qfa-iso",
"Latn",
}
m["wat"] = {
"Kaninuwa",
12952565,
"poz-ocw",
"Latn",
}
m["wau"] = {
"Wauja",
3450522,
"awd",
"Latn",
}
m["wav"] = {
"Waka",
3913394,
"alv-mye",
}
m["waw"] = {
"Waiwai",
56632,
"sai-prk",
"Latn",
}
m["wax"] = {
"Watam",
3566597,
"paa-ott",
"Latn",
}
m["way"] = {
"Wayana",
5908753,
"sai-gui",
"Latn",
}
m["waz"] = {
"Wampur",
7966957,
"poz-ocw",
"Latn",
}
m["wba"] = {
"Warao",
36946,
"qfa-iso",
"Latn",
}
m["wbb"] = {
"Wabo",
7958701,
"poz-hce",
"Latn",
}
m["wbe"] = {
"Waritai",
7969453,
"paa-clp",
"Latn",
}
m["wbf"] = {
"Wara",
3914052,
"alv-wan",
}
m["wbh"] = {
"Wanda",
7967153,
"bnt-mwi",
}
m["wbi"] = {
"Wanji",
3376818,
"bnt-bki",
"Latn",
}
m["wbj"] = {
"Alagwa",
56621,
"cus-sou",
"Latn",
}
m["wbk"] = {
"Waigali",
34196,
"nur-sou",
"Latn",
}
m["wbl"] = {
"Wakhi",
34208,
"xsc-skw",
"Cyrl, Latn, Arab",
translit = {Cyrl = "tg-translit"},
}
m["wbm"] = {
"Wa",
12644869,
"mkh-pal",
}
m["wbp"] = {
"Warlpiri",
1639998,
"aus-pam",
"Latn",
}
m["wbq"] = {
"Waddar",
6708569,
"dra-tel",
}
m["wbr"] = {
"Wagdi",
7959490,
"inc-bhi",
"Deva",
}
m["wbt"] = {
"Wanman",
7967989,
}
m["wbv"] = {
"Wajarri",
3913856,
"aus-psw",
"Latn",
}
m["wbw"] = {
"Woi",
8029092,
"poz-hce",
"Latn",
}
m["wca"] = {
"Yanomam",
7960056,
"sai-ynm",
"Latn",
}
m["wci"] = {
"Waci Gbe",
36987,
"alv-gbe",
}
m["wdd"] = {
"Wandji",
36976,
"bnt-nze",
}
m["wdg"] = {
"Wadaginam",
7958930,
"ngf-sad",
"Latn",
}
m["wdj"] = {
"Wadjiginy",
7959489,
}
m["wdt"] = {
"Wendat",
3567223,
"iro-nor",
"Latn",
ancestors = "iro-ohu",
}
m["wdu"] = {
"Wadjigu",
10719025,
}
m["wdy"] = {
"Wadjabangayi",
63313681,
}
m["wea"] = {
"Wewaw",
15895870,
}
m["wec"] = {
"Wè Western",
11159067,
"kro-wee",
}
m["wed"] = {
"Wedau",
12953294,
"poz-ocw",
"Latn",
}
m["weh"] = {
"Weh",
7979690,
"nic-rnw",
}
m["wei"] = {
"Kiunum",
7983230,
"paa-tir",
"Latn",
}
m["wem"] = {
"Weme Gbe",
18379970,
"alv-gbe",
}
m["weo"] = {
"Wemale",
7982165,
"poz-cma",
}
m["wer"] = {
"Weri",
11732752,
"paa-kun",
"Latn",
}
m["wes"] = {
"Cameroon Pidgin",
35541,
"crp",
"Latn",
ancestors = "en",
}
m["wet"] = {
"Perai",
12953035,
"poz-tim",
}
m["weu"] = {
"Welaung",
7980503,
"tbq-kuk",
}
m["wew"] = {
"Weyewa",
4314526,
"poz-cet",
"Latn",
}
m["wfg"] = {
"Yafi",
8074520,
"paa-epw",
"Latn",
}
m["wga"] = {
"Wagaya",
7959487,
"aus-pam",
"Latn",
}
m["wgb"] = {
"Wagawaga",
7959485,
"poz-ocw",
"Latn",
}
m["wgg"] = {
"Wangganguru",
7967859,
"aus-kar",
"Latn",
}
m["wgi"] = {
"Wahgi", -- not to be confused with North Wahgi
3565122,
"ngf-wah",
"Latn",
}
m["wgo"] = {
"Waigeo",
7959937,
"poz-hce",
"Latn",
}
m["wgu"] = {
"Wirangu",
2092286,
"aus-pam",
"Latn",
}
m["wgy"] = {
"Warrgamay",
3915942,
"aus-pam",
"Latn",
}
m["wha"] = {
"Manusela",
3287127,
"poz-cma",
"Latn",
}
m["whg"] = {
"North Wahgi",
12953273,
"ngf-wah",
"Latn",
}
m["whk"] = {
"Wahau Kenyah",
7959737,
"poz-swa",
"Latn",
}
m["whu"] = {
"Wahau Kayan",
12473397,
}
m["wib"] = {
"Southern Toussian",
11158982,
"alv-sav",
}
m["wic"] = {
"Wichita",
56513,
"cdd",
"Latn",
}
m["wie"] = {
"Wik-Epa",
10720035,
"aus-pmn",
"Latn",
}
m["wif"] = {
"Wik-Keyangan",
10720037,
"aus-pmn",
"Latn",
}
m["wig"] = {
"Wik-Ngathana",
3915695,
"aus-pmn",
"Latn",
}
m["wih"] = {
"Wik-Me'anha",
10720039,
"aus-pmn",
"Latn",
}
m["wii"] = {
"Minidien",
6865237,
"paa-wap",
"Latn",
}
m["wij"] = {
"Wik-Iiyanh",
10720036,
"aus-pmn",
"Latn",
}
m["wik"] = {
"Wikalkan",
7999800,
"aus-pmn",
"Latn",
}
m["wil"] = {
"Wilawila",
10720050,
"aus-wor",
"Latn",
}
m["wim"] = {
"Wik-Mungkan",
2092246,
"aus-pmn",
"Latn",
}
m["win"] = {
"Winnebago",
1957108,
"sio-msv",
"Latn",
}
m["wir"] = {
"Wiraféd",
12953970,
"tup-gua",
"Latn",
}
m["wiu"] = {
"Wiru",
8027044,
"qfa-dis", -- Papuan; isolate in Glottolog; grouped with Teberan by Usher (2020)
"Latn",
}
m["wiv"] = {
"Muduapa",
3121040,
"poz-ocw",
"Latn",
}
m["wiy"] = {
"Wiyot",
36937,
"aql",
"Latn",
}
m["wja"] = {
"Waja",
3914415,
"alv-wjk",
}
m["wji"] = {
"Warji",
3440381,
"cdc-wst",
"Latn",
}
m["wka"] = {
"Kw'adza",
3807652,
"cus-sou",
}
m["wkb"] = {
"Kumbaran",
16878146,
"dra-sdo",
}
m["wkd"] = {
"Mo",
7960881,
"poz-ocw",
"Latn",
}
m["wkl"] = {
"Kalanadi",
6350515,
"dra-mal",
}
m["wku"] = {
"Kunduvadi",
6444383,
"dra-mal",
}
m["wkw"] = {
"Wakawaka",
10719110,
"aus-pam",
"Latn",
}
m["wky"] = {
"Wangkayutyuru",
33060533,
"aus-kar",
"Latn",
}
m["wla"] = {
"Walio",
7961958,
"paa-wal",
"Latn",
}
m["wlc"] = {
"Mwali Comorian",
3319155,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["wle"] = {
"Wolane",
12645275,
"sem-eth",
"Ethi",
}
m["wlg"] = {
"Kunbarlang",
5618523,
"aus-gun",
"Latn",
}
m["wli"] = {
"Waioli",
7960241,
"paa-sah",
"Latn",
}
m["wlk"] = {
"Wailaki",
20832,
"ath-pco",
"Latn",
}
m["wll"] = {
"Wali (Sudan)",
30597440,
"nub-hil",
}
-- Middle Welsh: sets an ancestor code, a character replacement table and a
-- named sort key on top of the four positional fields.
m["wlm"] = {
"Middle Welsh",
2487263,
"cel-brw",
"Latn",
ancestors = "owl",
strip_diacritics = {
-- Two lists of equal length.
-- NOTE(review): presumably paired by index (Ð -> D, ð -> d) -- confirm against
-- the consumer of `from`/`to`.
from = {"Ð", "ð"},
to = {"D", "d"}
},
sort_key = "wlm-sortkey",
}
m["wlo"] = {
"Wolio",
1185114,
"poz-wot",
"Latn, Arab",
}
m["wlr"] = {
"Wailapa",
7960062,
"poz-vnn",
"Latn",
}
m["wls"] = {
"Wallisian",
36979,
"poz-pnp",
"Latn",
}
m["wlu"] = {
"Wuliwuli",
8039208,
}
m["wlv"] = {
"Wichí Lhamtés Vejoz",
13526867,
"sai-wic",
"Latn",
}
m["wlw"] = {
"Walak",
7961258,
"ngf-gvd",
"Latn",
}
m["wlx"] = {
"Wali (Ghana)",
36895,
"nic-mre",
"Latn",
}
m["wly"] = {
"Waling",
7961957,
"sit-kic",
ancestors = "bap",
}
m["wmb"] = {
"Wambaya",
2083197,
"aus-mir",
"Latn",
}
m["wmc"] = {
"Wamas",
7966909,
"ngf-nwh",
"Latn",
}
m["wmd"] = {
"Mamaindé",
3284890,
"sai-nmk",
"Latn",
}
m["wme"] = {
"Wambule",
56785,
"sit-kiw",
"Latn",
}
m["wmh"] = {
"Waima'a",
7960132,
"poz-tim",
"Latn",
}
m["wmi"] = {
"Wamin",
7966934,
}
m["wmm"] = {
"Maiwa (Indonesia)",
6737226,
"poz",
"Latn",
}
m["wmn"] = {
"Waamwang",
7958575,
"poz-cln",
"Latn",
}
m["wmo"] = {
"Wam",
8030620,
"paa-trr",
"Latn",
}
m["wms"] = {
"Wambon",
7966922,
"ngf-dum",
"Latn",
}
m["wmt"] = {
"Walmajarri",
2232696,
"aus-pam",
"Latn",
}
m["wmw"] = {
"Mwani",
3042206,
"bnt-swh",
"Latn",
}
m["wmx"] = {
"Womo",
8031646,
"paa-shi",
"Latn",
}
m["wnb"] = {
"Mokati",
7967057,
"ngf-tib",
"Latn",
}
m["wnc"] = {
"Wantoat",
7968184,
"ngf-waa",
"Latn",
}
m["wnd"] = {
"Wandarang",
3913767,
"aus-arn",
"Latn",
}
m["wne"] = {
"Waneci",
7967334,
"ira-pat",
"ps-Arab",
}
m["wng"] = {
"Wanggom",
11732736,
"ngf-nde",
"Latn",
}
m["wni"] = {
"Ndzwani Comorian",
2850262,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["wnk"] = {
"Wanukaka",
2370136,
"poz",
"Latn",
}
m["wnm"] = {
"Wanggamala",
7967860,
"aus-kar",
"Latn",
}
m["wno"] = {
"Wano",
3566166,
"ngf-dan",
"Latn",
}
m["wnp"] = {
"Wanap",
7967060,
"paa-wpa",
"Latn",
}
m["wnu"] = {
"Usan",
7901709,
"ngf-num",
"Latn",
}
m["wnw"] = {
"Wintu",
56754,
"nai-wtq",
"Latn",
}
m["wny"] = {
"Wanyi",
7968201,
"aus-gar",
"Latn",
}
m["woa"] = {
"Tyaraity",
10706951,
}
m["wob"] = {
"Wobé",
3915363,
"kro-wee",
}
m["woc"] = {
"Wogeo",
8029061,
"poz-ocw",
"Latn",
}
m["wod"] = {
"Wolani",
8029704,
"ngf-pan",
"Latn",
}
m["woe"] = {
"Woleaian",
34037,
"poz-mic",
"Latn, Wole",
}
m["wog"] = {
"Wogamusin",
56991,
"paa-sep",
"Latn",
}
m["woi"] = {
"Kamang",
8029096,
"paa-alp",
"Latn",
}
m["wok"] = {
"Longto",
35795,
"alv-dur",
"Latn",
}
m["wom"] = {
"Perema",
3913378,
"alv-lek",
"Latn",
}
m["won"] = {
"Wongo",
8032058,
"bnt-bsh",
"Latn",
}
m["woo"] = {
"Manombai",
6751253,
"poz",
"Latn",
}
m["wor"] = {
"Woria",
8034514,
"paa-egb",
"Latn",
}
m["wos"] = {
"Hanga Hundi",
6450232,
"paa-nnd",
"Latn",
}
m["wow"] = {
"Wawonii",
3566780,
"poz-btk",
"Latn",
}
m["woy"] = {
"Weyto",
3915918,
"qfa-unc", -- speculated to have been Agaw
}
m["wpc"] = {
"Wirö",
12953684,
nil,
"Latn",
}
m["wra"] = {
"Warapu",
56739,
"paa-sko",
"Latn",
}
m["wrb"] = {
"Warluwara",
3913761,
"aus-pam",
"Latn",
}
m["wrg"] = {
"Warungu",
7970854,
"aus-pam",
"Latn",
}
m["wrh"] = {
"Wiradjuri",
3913840,
"aus-cww",
"Latn",
}
m["wri"] = {
"Wariyangga",
10719289,
"aus-psw",
"Latn",
}
m["wrk"] = {
"Garawa",
2524022,
"aus-gar",
"Latn",
}
m["wrl"] = {
"Warlmanpa",
3913823,
"aus-pam",
"Latn",
}
m["wrm"] = {
"Warumungu",
1764544,
"aus-pam",
"Latn",
}
m["wrn"] = {
"Warnang",
36971,
"alv-hei",
}
m["wro"] = {
"Worora",
3504106,
"aus-wor",
"Latn",
}
m["wrp"] = {
"Waropen",
7969851,
"poz-hce",
"Latn",
}
m["wrr"] = {
"Wardaman",
3913842,
"aus-yng",
"Latn",
}
m["wrs"] = {
"Waris",
3502610,
"paa-war",
"Latn",
}
m["wru"] = {
"Waru",
3566463,
}
m["wrv"] = {
"Waruna",
7971078,
"ngf-gsu",
"Latn",
}
m["wrw"] = {
"Gugu Warra",
5615286,
}
m["wrx"] = {
"Wae Rana",
7959375,
}
m["wrz"] = {
"Warray",
7969971,
"aus-gun",
"Latn",
}
m["wsa"] = {
"Warembori",
56459,
nil,
"Latn",
}
m["wsi"] = {
"Wusi",
8039349,
"poz-vnn",
"Latn",
}
m["wsk"] = {
"Waskia",
7972683,
"ngf-kow",
"Latn",
}
m["wsr"] = {
"Owenia",
7114727,
"ngf-gau",
"Latn",
}
-- "wss" Wasa is treated as "ak" Akan, see [[WT:LT]]
m["wsu"] = {
"Wasu",
7972892,
}
m["wsv"] = {
"Wotapuri-Katarqalai",
3877569,
"inc-koh",
}
m["wtf"] = {
"Watiwa",
35316,
"ngf-eva",
"Latn",
}
m["wth"] = {
"Wathaurong",
7974656,
"aus-pam",
"Latn",
}
m["wti"] = {
"Berta",
33178,
"qfa-iso", -- may be ssa
"Latn",
}
m["wtk"] = {
"Watakataui",
7972975,
"paa-sep",
"Latn",
}
m["wtm"] = {
"Mewati",
2605943,
"raj",
"Deva",
translit = "hi-translit",
}
m["wtw"] = {
"Wotu",
12473488,
"poz-wot",
"Latn",
}
m["wua"] = {
"Wikngenchera",
10720045,
"aus-pmn",
"Latn",
}
m["wub"] = {
"Wunambal",
3913805,
"aus-wor",
"Latn",
}
m["wud"] = {
"Wudu",
36972,
"alv-gbe",
"Latn",
}
m["wuh"] = {
"Wutunhua",
1012917,
"qfa-mix",
"Latn",
ancestors = "cmn, bo, peh",
}
m["wul"] = {
"Silimo",
11732514,
"ngf-ngn",
"Latn",
}
m["wum"] = {
"Wumbvu",
36891,
"bnt-kel",
"Latn",
}
m["wun"] = {
"Bungu",
4997686,
"bnt-mby",
"Latn",
}
m["wur"] = {
"Wurrugu",
8039305,
"aus-wdj",
"Latn",
}
m["wut"] = {
"Wutung",
56743,
"paa-isk",
"Latn",
}
m["wuu"] = {
"Wu",
34290,
"zhx",
"Hants",
ancestors = "ltc",
generate_forms = "zh-generateforms",
translit = "zh-translit",
sort_key = "Hani-sortkey",
}
m["wuv"] = {
"Wuvulu-Aua",
3062746,
"poz-aay",
"Latn",
}
m["wux"] = {
"Wulna",
13591670,
}
m["wuy"] = {
"Wauyai",
12953295,
"poz-hce",
"Latn",
}
m["wwa"] = {
"Waama",
7958576,
"nic-eov",
"Latn",
}
m["wwo"] = {
"Dorig",
3037047,
"poz-vnn",
"Latn",
}
m["wwr"] = {
"Warrwa",
7970852,
}
m["www"] = {
"Wawa",
36889,
"nic-mmb",
"Latn",
}
m["wxa"] = {
"Waxiang",
2252191,
"zhx",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["wxw"] = {
"Wardandi",
61999705,
}
m["wya"] = {
"Wyandot",
1185119,
"iro-nor",
"Latn",
}
m["wyb"] = {
"Ngiyambaa",
3913825,
"aus-cww",
"Latn",
}
m["wyi"] = {
"Woiwurrung",
8029099,
"aus-pam",
"Latn",
}
m["wym"] = {
"Vilamovian",
56485,
"gmw-hgm",
"Latn",
ancestors = "gmh",
strip_diacritics = {remove_diacritics = c.dotabove},
}
m["wyr"] = {
"Wayoró",
2875044,
"tup",
}
m["wyy"] = {
"Western Fijian",
3062751,
"poz-pcc",
"Latn",
}
return require("Module:languages").finalizeData(m, "language")
cfhpbn3sajoez0tfffvnbp4os4648vf
234883
234882
2026-05-24T09:44:40Z
Lee
19
[[:en:Module:languages/data/3/w]] වෙතින් එක් සංශෝධනයක්
234882
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Loaded on demand, as it may not be needed (depending on the data).
local function u(...)
	-- First call only: load the real `char` function and rebind the local `u`
	-- to it, so later calls go straight to the implementation and never
	-- re-enter this wrapper.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["waa"] = {
"Walla Walla",
12953960,
"nai-shp",
"Latn",
ancestors = "nai-spt",
}
m["wab"] = {
"Wab",
11222271,
"poz-ocw",
"Latn",
}
m["wac"] = {
"Wasco-Wishram",
12645081,
"nai-ckn",
"Latn",
}
m["wad"] = {
"Wandamen",
2806128,
"poz-hce",
"Latn",
}
m["waf"] = {
"Wakoná",
7961205,
}
m["wag"] = {
"Wa'ema",
12953264,
"poz-ocw",
"Latn",
}
m["wah"] = {
"Watubela",
7975070,
"poz-cma",
"Latn",
}
m["waj"] = {
"Waffa",
3565058,
"ngf-tai",
"Latn",
}
m["wal"] = {
"Wolaytta",
36943,
"omv-nom",
"Latn, Ethi",
}
m["wam"] = {
"Massachusett",
56519,
"alg-eas",
"Latn",
}
m["wan"] = {
"Wan",
3913272,
"dmn-nbe",
}
m["wao"] = {
"Wappo",
56530,
"nai-ykn",
"Latn",
}
m["wap"] = {
"Wapishana",
3450493,
"awd",
"Latn",
}
m["waq"] = {
"Wageman",
3436843,
"aus-gun",
"Latn",
}
-- Waray-Waray. The four unkeyed values are the positional fields of the record;
-- the keyed tables below hold settings keyed by script code ("Latn").
m["war"] = {
"Waray-Waray",
34279,
"phi",
"Latn",
-- String built by joining three entries of `c` (m_langdata.chars).
strip_diacritics = {Latn = {remove_diacritics = c.grave .. c.acute .. c.circ}},
standard_chars = {
Latn = "AaBbKkDdEeGgHhIiLlMmNnOoPpRrSsTtUuWwYy",
-- Unkeyed entry: it is stored at index 1 of this table, next to the "Latn" key.
-- NOTE(review): presumably applies regardless of script — confirm in Module:languages.
c.punc
},
sort_key = {
Latn = "tl-sortkey",
},
}
m["was"] = {
"Washo",
34198,
"qfa-iso",
"Latn",
}
m["wat"] = {
"Kaninuwa",
12952565,
"poz-ocw",
"Latn",
}
m["wau"] = {
"Wauja",
3450522,
"awd",
"Latn",
}
m["wav"] = {
"Waka",
3913394,
"alv-mye",
}
m["waw"] = {
"Waiwai",
56632,
"sai-prk",
"Latn",
}
m["wax"] = {
"Watam",
3566597,
"paa-ott",
"Latn",
}
m["way"] = {
"Wayana",
5908753,
"sai-gui",
"Latn",
}
m["waz"] = {
"Wampur",
7966957,
"poz-ocw",
"Latn",
}
m["wba"] = {
"Warao",
36946,
"qfa-iso",
"Latn",
}
m["wbb"] = {
"Wabo",
7958701,
"poz-hce",
"Latn",
}
m["wbe"] = {
"Waritai",
7969453,
"paa-clp",
"Latn",
}
m["wbf"] = {
"Wara",
3914052,
"alv-wan",
}
m["wbh"] = {
"Wanda",
7967153,
"bnt-mwi",
}
m["wbi"] = {
"Wanji",
3376818,
"bnt-bki",
"Latn",
}
m["wbj"] = {
"Alagwa",
56621,
"cus-sou",
"Latn",
}
m["wbk"] = {
"Waigali",
34196,
"nur-sou",
"Latn",
}
m["wbl"] = {
"Wakhi",
34208,
"xsc-skw",
"Cyrl, Latn, Arab",
translit = {Cyrl = "tg-translit"},
}
m["wbm"] = {
"Wa",
12644869,
"mkh-pal",
}
m["wbp"] = {
"Warlpiri",
1639998,
"aus-pam",
"Latn",
}
m["wbq"] = {
"Waddar",
6708569,
"dra-tel",
}
m["wbr"] = {
"Wagdi",
7959490,
"inc-bhi",
"Deva",
}
m["wbt"] = {
"Wanman",
7967989,
}
m["wbv"] = {
"Wajarri",
3913856,
"aus-psw",
"Latn",
}
m["wbw"] = {
"Woi",
8029092,
"poz-hce",
"Latn",
}
m["wca"] = {
"Yanomam",
7960056,
"sai-ynm",
"Latn",
}
m["wci"] = {
"Waci Gbe",
36987,
"alv-gbe",
}
m["wdd"] = {
"Wandji",
36976,
"bnt-nze",
}
m["wdg"] = {
"Wadaginam",
7958930,
"ngf-sad",
"Latn",
}
m["wdj"] = {
"Wadjiginy",
7959489,
}
m["wdt"] = {
"Wendat",
3567223,
"iro-nor",
"Latn",
ancestors = "iro-ohu",
}
m["wdu"] = {
"Wadjigu",
10719025,
}
m["wdy"] = {
"Wadjabangayi",
63313681,
}
m["wea"] = {
"Wewaw",
15895870,
}
m["wec"] = {
"Wè Western",
11159067,
"kro-wee",
}
m["wed"] = {
"Wedau",
12953294,
"poz-ocw",
"Latn",
}
m["weh"] = {
"Weh",
7979690,
"nic-rnw",
}
m["wei"] = {
"Kiunum",
7983230,
"paa-tir",
"Latn",
}
m["wem"] = {
"Weme Gbe",
18379970,
"alv-gbe",
}
m["weo"] = {
"Wemale",
7982165,
"poz-cma",
}
m["wer"] = {
"Weri",
11732752,
"paa-kun",
"Latn",
}
m["wes"] = {
"Cameroon Pidgin",
35541,
"crp",
"Latn",
ancestors = "en",
}
m["wet"] = {
"Perai",
12953035,
"poz-tim",
}
m["weu"] = {
"Welaung",
7980503,
"tbq-kuk",
}
m["wew"] = {
"Weyewa",
4314526,
"poz-cet",
"Latn",
}
m["wfg"] = {
"Yafi",
8074520,
"paa-epw",
"Latn",
}
m["wga"] = {
"Wagaya",
7959487,
"aus-pam",
"Latn",
}
m["wgb"] = {
"Wagawaga",
7959485,
"poz-ocw",
"Latn",
}
m["wgg"] = {
"Wangganguru",
7967859,
"aus-kar",
"Latn",
}
m["wgi"] = {
"Wahgi", -- not to be confused with North Wahgi
3565122,
"ngf-wah",
"Latn",
}
m["wgo"] = {
"Waigeo",
7959937,
"poz-hce",
"Latn",
}
m["wgu"] = {
"Wirangu",
2092286,
"aus-pam",
"Latn",
}
m["wgy"] = {
"Warrgamay",
3915942,
"aus-pam",
"Latn",
}
m["wha"] = {
"Manusela",
3287127,
"poz-cma",
"Latn",
}
m["whg"] = {
"North Wahgi",
12953273,
"ngf-wah",
"Latn",
}
m["whk"] = {
"Wahau Kenyah",
7959737,
"poz-swa",
"Latn",
}
m["whu"] = {
"Wahau Kayan",
12473397,
}
m["wib"] = {
"Southern Toussian",
11158982,
"alv-sav",
}
m["wic"] = {
"Wichita",
56513,
"cdd",
"Latn",
}
m["wie"] = {
"Wik-Epa",
10720035,
"aus-pmn",
"Latn",
}
m["wif"] = {
"Wik-Keyangan",
10720037,
"aus-pmn",
"Latn",
}
m["wig"] = {
"Wik-Ngathana",
3915695,
"aus-pmn",
"Latn",
}
m["wih"] = {
"Wik-Me'anha",
10720039,
"aus-pmn",
"Latn",
}
m["wii"] = {
"Minidien",
6865237,
"paa-wap",
"Latn",
}
m["wij"] = {
"Wik-Iiyanh",
10720036,
"aus-pmn",
"Latn",
}
m["wik"] = {
"Wikalkan",
7999800,
"aus-pmn",
"Latn",
}
m["wil"] = {
"Wilawila",
10720050,
"aus-wor",
"Latn",
}
m["wim"] = {
"Wik-Mungkan",
2092246,
"aus-pmn",
"Latn",
}
m["win"] = {
"Winnebago",
1957108,
"sio-msv",
"Latn",
}
m["wir"] = {
"Wiraféd",
12953970,
"tup-gua",
"Latn",
}
m["wiu"] = {
"Wiru",
8027044,
"qfa-dis", -- Papuan; isolate in Glottolog; grouped with Teberan by Usher (2020)
"Latn",
}
m["wiv"] = {
"Muduapa",
3121040,
"poz-ocw",
"Latn",
}
m["wiy"] = {
"Wiyot",
36937,
"aql",
"Latn",
}
m["wja"] = {
"Waja",
3914415,
"alv-wjk",
}
m["wji"] = {
"Warji",
3440381,
"cdc-wst",
"Latn",
}
m["wka"] = {
"Kw'adza",
3807652,
"cus-sou",
}
m["wkb"] = {
"Kumbaran",
16878146,
"dra-sdo",
}
m["wkd"] = {
"Mo",
7960881,
"poz-ocw",
"Latn",
}
m["wkl"] = {
"Kalanadi",
6350515,
"dra-mal",
}
m["wku"] = {
"Kunduvadi",
6444383,
"dra-mal",
}
m["wkw"] = {
"Wakawaka",
10719110,
"aus-pam",
"Latn",
}
m["wky"] = {
"Wangkayutyuru",
33060533,
"aus-kar",
"Latn",
}
m["wla"] = {
"Walio",
7961958,
"paa-wal",
"Latn",
}
m["wlc"] = {
"Mwali Comorian",
3319155,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["wle"] = {
"Wolane",
12645275,
"sem-eth",
"Ethi",
}
m["wlg"] = {
"Kunbarlang",
5618523,
"aus-gun",
"Latn",
}
m["wli"] = {
"Waioli",
7960241,
"paa-sah",
"Latn",
}
m["wlk"] = {
"Wailaki",
20832,
"ath-pco",
"Latn",
}
m["wll"] = {
"Wali (Sudan)",
30597440,
"nub-hil",
}
-- Middle Welsh. Unkeyed values are the positional fields of the record;
-- keyed values are optional settings.
m["wlm"] = {
"Middle Welsh",
2487263,
"cel-brw",
"Latn",
ancestors = "owl",
strip_diacritics = {
-- Parallel lists: each `from` entry is paired with the `to` entry at the
-- same index (Ð with D, ð with d).
from = {"Ð", "ð"},
to = {"D", "d"}
},
sort_key = "wlm-sortkey",
}
m["wlo"] = {
"Wolio",
1185114,
"poz-wot",
"Latn, Arab",
}
m["wlr"] = {
"Wailapa",
7960062,
"poz-vnn",
"Latn",
}
m["wls"] = {
"Wallisian",
36979,
"poz-pnp",
"Latn",
}
m["wlu"] = {
"Wuliwuli",
8039208,
}
m["wlv"] = {
"Wichí Lhamtés Vejoz",
13526867,
"sai-wic",
"Latn",
}
m["wlw"] = {
"Walak",
7961258,
"ngf-gvd",
"Latn",
}
m["wlx"] = {
"Wali (Ghana)",
36895,
"nic-mre",
"Latn",
}
m["wly"] = {
"Waling",
7961957,
"sit-kic",
ancestors = "bap",
}
m["wmb"] = {
"Wambaya",
2083197,
"aus-mir",
"Latn",
}
m["wmc"] = {
"Wamas",
7966909,
"ngf-nwh",
"Latn",
}
m["wmd"] = {
"Mamaindé",
3284890,
"sai-nmk",
"Latn",
}
m["wme"] = {
"Wambule",
56785,
"sit-kiw",
"Latn",
}
m["wmh"] = {
"Waima'a",
7960132,
"poz-tim",
"Latn",
}
m["wmi"] = {
"Wamin",
7966934,
}
m["wmm"] = {
"Maiwa (Indonesia)",
6737226,
"poz",
"Latn",
}
m["wmn"] = {
"Waamwang",
7958575,
"poz-cln",
"Latn",
}
m["wmo"] = {
"Wam",
8030620,
"paa-trr",
"Latn",
}
m["wms"] = {
"Wambon",
7966922,
"ngf-dum",
"Latn",
}
m["wmt"] = {
"Walmajarri",
2232696,
"aus-pam",
"Latn",
}
m["wmw"] = {
"Mwani",
3042206,
"bnt-swh",
"Latn",
}
m["wmx"] = {
"Womo",
8031646,
"paa-shi",
"Latn",
}
m["wnb"] = {
"Mokati",
7967057,
"ngf-tib",
"Latn",
}
m["wnc"] = {
"Wantoat",
7968184,
"ngf-waa",
"Latn",
}
m["wnd"] = {
"Wandarang",
3913767,
"aus-arn",
"Latn",
}
m["wne"] = {
"Waneci",
7967334,
"ira-pat",
"ps-Arab",
}
m["wng"] = {
"Wanggom",
11732736,
"ngf-nde",
"Latn",
}
m["wni"] = {
"Ndzwani Comorian",
2850262,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["wnk"] = {
"Wanukaka",
2370136,
"poz",
"Latn",
}
m["wnm"] = {
"Wanggamala",
7967860,
"aus-kar",
"Latn",
}
m["wno"] = {
"Wano",
3566166,
"ngf-dan",
"Latn",
}
m["wnp"] = {
"Wanap",
7967060,
"paa-wpa",
"Latn",
}
m["wnu"] = {
"Usan",
7901709,
"ngf-num",
"Latn",
}
m["wnw"] = {
"Wintu",
56754,
"nai-wtq",
"Latn",
}
m["wny"] = {
"Wanyi",
7968201,
"aus-gar",
"Latn",
}
m["woa"] = {
"Tyaraity",
10706951,
}
m["wob"] = {
"Wobé",
3915363,
"kro-wee",
}
m["woc"] = {
"Wogeo",
8029061,
"poz-ocw",
"Latn",
}
m["wod"] = {
"Wolani",
8029704,
"ngf-pan",
"Latn",
}
m["woe"] = {
"Woleaian",
34037,
"poz-mic",
"Latn, Wole",
}
m["wog"] = {
"Wogamusin",
56991,
"paa-sep",
"Latn",
}
m["woi"] = {
"Kamang",
8029096,
"paa-alp",
"Latn",
}
m["wok"] = {
"Longto",
35795,
"alv-dur",
"Latn",
}
m["wom"] = {
"Perema",
3913378,
"alv-lek",
"Latn",
}
m["won"] = {
"Wongo",
8032058,
"bnt-bsh",
"Latn",
}
m["woo"] = {
"Manombai",
6751253,
"poz",
"Latn",
}
m["wor"] = {
"Woria",
8034514,
"paa-egb",
"Latn",
}
m["wos"] = {
"Hanga Hundi",
6450232,
"paa-nnd",
"Latn",
}
m["wow"] = {
"Wawonii",
3566780,
"poz-btk",
"Latn",
}
m["woy"] = {
"Weyto",
3915918,
"qfa-unc", -- speculated to have been Agaw
}
m["wpc"] = {
"Wirö",
12953684,
nil,
"Latn",
}
m["wra"] = {
"Warapu",
56739,
"paa-sko",
"Latn",
}
m["wrb"] = {
"Warluwara",
3913761,
"aus-pam",
"Latn",
}
m["wrg"] = {
"Warungu",
7970854,
"aus-pam",
"Latn",
}
m["wrh"] = {
"Wiradjuri",
3913840,
"aus-cww",
"Latn",
}
m["wri"] = {
"Wariyangga",
10719289,
"aus-psw",
"Latn",
}
m["wrk"] = {
"Garawa",
2524022,
"aus-gar",
"Latn",
}
m["wrl"] = {
"Warlmanpa",
3913823,
"aus-pam",
"Latn",
}
m["wrm"] = {
"Warumungu",
1764544,
"aus-pam",
"Latn",
}
m["wrn"] = {
"Warnang",
36971,
"alv-hei",
}
m["wro"] = {
"Worora",
3504106,
"aus-wor",
"Latn",
}
m["wrp"] = {
"Waropen",
7969851,
"poz-hce",
"Latn",
}
m["wrr"] = {
"Wardaman",
3913842,
"aus-yng",
"Latn",
}
m["wrs"] = {
"Waris",
3502610,
"paa-war",
"Latn",
}
m["wru"] = {
"Waru",
3566463,
}
m["wrv"] = {
"Waruna",
7971078,
"ngf-gsu",
"Latn",
}
m["wrw"] = {
"Gugu Warra",
5615286,
}
m["wrx"] = {
"Wae Rana",
7959375,
}
m["wrz"] = {
"Warray",
7969971,
"aus-gun",
"Latn",
}
m["wsa"] = {
"Warembori",
56459,
nil,
"Latn",
}
m["wsi"] = {
"Wusi",
8039349,
"poz-vnn",
"Latn",
}
m["wsk"] = {
"Waskia",
7972683,
"ngf-kow",
"Latn",
}
m["wsr"] = {
"Owenia",
7114727,
"ngf-gau",
"Latn",
}
-- "wss" Wasa is treated as "ak" Akan, see [[WT:LT]]
m["wsu"] = {
"Wasu",
7972892,
}
m["wsv"] = {
"Wotapuri-Katarqalai",
3877569,
"inc-koh",
}
m["wtf"] = {
"Watiwa",
35316,
"ngf-eva",
"Latn",
}
m["wth"] = {
"Wathaurong",
7974656,
"aus-pam",
"Latn",
}
m["wti"] = {
"Berta",
33178,
"qfa-iso", -- may be ssa
"Latn",
}
m["wtk"] = {
"Watakataui",
7972975,
"paa-sep",
"Latn",
}
m["wtm"] = {
"Mewati",
2605943,
"raj",
"Deva",
translit = "hi-translit",
}
m["wtw"] = {
"Wotu",
12473488,
"poz-wot",
"Latn",
}
m["wua"] = {
"Wikngenchera",
10720045,
"aus-pmn",
"Latn",
}
m["wub"] = {
"Wunambal",
3913805,
"aus-wor",
"Latn",
}
m["wud"] = {
"Wudu",
36972,
"alv-gbe",
"Latn",
}
m["wuh"] = {
"Wutunhua",
1012917,
"qfa-mix",
"Latn",
ancestors = "cmn, bo, peh",
}
m["wul"] = {
"Silimo",
11732514,
"ngf-ngn",
"Latn",
}
m["wum"] = {
"Wumbvu",
36891,
"bnt-kel",
"Latn",
}
m["wun"] = {
"Bungu",
4997686,
"bnt-mby",
"Latn",
}
m["wur"] = {
"Wurrugu",
8039305,
"aus-wdj",
"Latn",
}
m["wut"] = {
"Wutung",
56743,
"paa-isk",
"Latn",
}
m["wuu"] = {
"Wu",
34290,
"zhx",
"Hants",
ancestors = "ltc",
generate_forms = "zh-generateforms",
translit = "zh-translit",
sort_key = "Hani-sortkey",
}
m["wuv"] = {
"Wuvulu-Aua",
3062746,
"poz-aay",
"Latn",
}
m["wux"] = {
"Wulna",
13591670,
}
m["wuy"] = {
"Wauyai",
12953295,
"poz-hce",
"Latn",
}
m["wwa"] = {
"Waama",
7958576,
"nic-eov",
"Latn",
}
m["wwo"] = {
"Dorig",
3037047,
"poz-vnn",
"Latn",
}
m["wwr"] = {
"Warrwa",
7970852,
}
m["www"] = {
"Wawa",
36889,
"nic-mmb",
"Latn",
}
m["wxa"] = {
"Waxiang",
2252191,
"zhx",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["wxw"] = {
"Wardandi",
61999705,
}
m["wya"] = {
"Wyandot",
1185119,
"iro-nor",
"Latn",
}
m["wyb"] = {
"Ngiyambaa",
3913825,
"aus-cww",
"Latn",
}
m["wyi"] = {
"Woiwurrung",
8029099,
"aus-pam",
"Latn",
}
m["wym"] = {
"Vilamovian",
56485,
"gmw-hgm",
"Latn",
ancestors = "gmh",
strip_diacritics = {remove_diacritics = c.dotabove},
}
m["wyr"] = {
"Wayoró",
2875044,
"tup",
}
m["wyy"] = {
"Western Fijian",
3062751,
"poz-pcc",
"Latn",
}
return require("Module:languages").finalizeData(m, "language")
cfhpbn3sajoez0tfffvnbp4os4648vf
Module:languages/data/3/s
828
6260
234886
220390
2026-05-22T23:20:41Z
en>Theknightwho
0
234886
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Loaded on demand, as it may not be needed (depending on the data).
local function u(...)
	-- First call only: load the real `char` function and rebind the local `u`
	-- to it, so later calls go straight to the implementation and never
	-- re-enter this wrapper.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["saa"] = {
"Saba",
3914885,
"cdc-est",
"Latn",
}
m["sab"] = {
"Buglere",
3368506,
"cba",
"Latn",
}
m["sac"] = {
"Fox",
12714767,
"alg-sfk",
"Latn",
}
m["sad"] = {
"Sandawe",
34016,
"qfa-iso",
"Latn",
}
m["sae"] = {
"Sabanê",
3460478,
"sai-nmk",
"Latn",
}
m["saf"] = {
"Safaliba",
36432,
"nic-mre",
"Latn",
}
m["sah"] = {
"Yakut",
34299,
"trk-nsb",
"Cyrl",
translit = "sah-translit",
override_translit = true,
}
m["saj"] = {
"Sahu",
7399757,
"paa-sah",
"Latn",
}
m["sak"] = {
"Sake",
36425,
"bnt-kel",
"Latn",
}
m["sam"] = {
"Samaritan Aramaic",
56612,
"sem-arw",
"Samr",
translit = "Samr-translit",
-- Samr strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sao"] = {
"Sause",
4409155,
"qfa-dis", -- isolate per Glottolog, possibly related to Kapauri in a Kapauri-Sause family under Greater Kwerba
"Latn",
}
m["saq"] = {
"Samburu",
56536,
"sdv-lma",
}
m["sar"] = {
"Saraveca",
3450556,
"awd",
"Latn",
}
m["sas"] = {
"Sasak",
1294047,
"poz-bss",
"Latn, Bali, Java",
}
m["sat"] = {
"Santali",
33965,
"mun",
"Olck",
translit = "Olck-translit",
override_translit = true,
}
m["sau"] = {
"Saleman",
7404262,
"poz-cet",
}
m["sav"] = {
"Saafi-Saafi",
36308,
"alv-cng",
"Arab, Latn",
}
m["saw"] = {
"Sawi",
677064,
"ngf-awd",
"Latn",
}
m["sax"] = {
"Sa",
3460352,
"poz-vnn",
"Latn",
}
m["say"] = {
"Saya",
3914431,
"cdc-wst",
"Latn",
}
m["saz"] = {
"Saurashtra",
13292,
"inc-wes",
"Saur, Latn, Taml, Deva",
translit = "saz-translit",
ancestors = "inc-ogu",
}
m["sba"] = {
"Ngambay",
2372207,
"csu-sar",
"Latn",
}
m["sbb"] = {
"Simbo",
3484101,
"poz-ocw",
}
m["sbc"] = {
"Gele'",
3194847,
"poz-aay",
"Latn",
}
m["sbd"] = {
"Southern Samo",
33122730,
"dmn-sam",
"Latn",
}
m["sbe"] = {
"Saliba (New Guinea)",
3469737,
"poz-ocw",
}
m["sbf"] = {
"Shabo",
36342,
"ssa",
"Latn",
}
m["sbg"] = {
"Seget",
7446237,
"paa-wbh",
"Latn",
}
m["sbh"] = {
"Sori-Harengan",
36515,
"poz-aay",
"Latn",
}
m["sbi"] = {
"Seti",
7456682,
"paa-trr",
"Latn",
}
m["sbj"] = {
"Surbakhal",
759995,
}
m["sbk"] = {
"Safwa",
4121160,
"bnt-mby",
"Latn",
}
m["sbl"] = {
"Botolan Sambal",
4095195,
"phi",
"Latn",
}
m["sbm"] = {
"Sagala",
11732610,
"bnt-ruv",
"Latn",
}
m["sbn"] = {
"Sindhi Bhil",
25559289,
"inc-snd",
"Arab, Deva, Sind, Guru",
ancestors = "sd",
}
m["sbo"] = {
"Sabüm",
7396535,
"mkh-asl",
}
m["sbp"] = {
"Sangu (Tanzania)",
7418149,
"bnt-bki",
"Latn",
}
m["sbq"] = {
"Sirva",
7514337,
"ngf-nso",
"Latn",
}
m["sbr"] = {
"Sembakung Murut",
7449148,
"poz-san",
}
m["sbs"] = {
"Subiya",
6442073,
"bnt-bot",
"Latn",
}
m["sbt"] = {
"Kimki",
6410160,
"qfa-dis", -- Papuan; Glottolog and Foley treat as an isolate, Usher puts in South Pauwasi
"Latn",
}
m["sbu"] = {
"Stod Bhoti",
15622700,
"sit-las",
}
m["sbv"] = {
"Sabine",
65455885,
"itc-sbl",
"Latn",
display_text = s["itc-Latn-displaytext"],
strip_diacritics = s["itc-Latn-stripdiacritics"],
sort_key = s["itc-Latn-sortkey"],
}
m["sbw"] = {
"Simba",
36430,
"bnt-tso",
"Latn",
}
m["sbx"] = {
"Seberuang",
12473470,
"poz-mly",
}
m["sby"] = {
"Soli",
7557754,
"bnt-bot",
"Latn",
}
m["sbz"] = {
"Sara Kaba",
25559318,
"csu-kab",
"Latn",
}
m["scb"] = {
"Chut",
2967709,
"mkh-vie",
"Latn",
}
m["sce"] = {
"Dongxiang",
32947,
"xgn-shr",
"Arab, Latn",
}
m["scf"] = {
"San Miguel Creole French",
12953094,
"crp",
"Latn",
ancestors = "gcf",
sort_key = s["roa-oil-sortkey"],
}
m["scg"] = {
"Sanggau",
12473466,
"day",
}
m["sch"] = {
"Sakachep",
37054,
"tbq-kuk",
}
m["sci"] = {
"Sri Lankan Creole Malay",
1089151,
"crp",
"Latn",
ancestors = "ms",
}
m["sck"] = {
"Sadri",
765922,
"inc-bih",
"Deva, Kthi",
translit = {
Deva = "hi-translit",
Kthi = "bho-Kthi-translit",
},
}
m["scl"] = {
"Shina",
1353320,
"inc-shn",
"ur-Arab, Deva",
}
-- Sicilian. Positional fields are listed first and named fields after them,
-- as in the other entries of this module. Lua numbers positional fields
-- independently of any named fields, so "Latn" is still stored at index 4.
m["scn"] = {
	"Sicilian",
	33973,
	"roa-itr",
	"Latn",
	ancestors = "scn-old",
}
m["sco"] = {
"Scots",
14549,
"gmw-ang",
"Latn",
ancestors = "gmw-msc",
}
m["scp"] = {
"Yolmo",
22662107,
"sit-kyk",
"Deva",
}
m["scq"] = {
"Sa'och",
6583617,
"mkh-pea",
}
m["scs"] = {
"North Slavey",
20628,
"den",
"Latn",
}
m["scu"] = {
"Shumcho",
22077739,
"sit-kin",
}
m["scv"] = {
"Sheni",
11015820,
"nic-jer",
"Latn",
ancestors = "zir",
}
m["scw"] = {
"Sha",
3438816,
"cdc-wst",
"Latn",
}
m["scx"] = {
"Sicel",
36667,
"itc",
"Polyt",
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
-- Shetland. Unkeyed values are the positional fields of the record;
-- keyed values are optional settings.
m["scz"] = {
	"Shetland",
	3069598,
	"qfa-mix",
	"Latn",
	ancestors = "nrn, gmw-msc",
	-- Every letter is listed as an uppercase/lowercase pair (so "Ö" is followed
	-- by "ö" and "Ü" by "ü"), then the digits, then the entry `c.punc` from
	-- m_langdata.chars.
	standard_chars = "AaBbCcDdEeFfGgHhIiJjKkLlMmNnOoPpQqRrSsTtUuVvWwXxYyZzØøÖöÜü0123456789" .. c.punc,
}
m["sda"] = {
"Toraja-Sa'dan",
36673,
"poz-ssw",
"Latn",
}
m["sdb"] = {
"Shabak",
3289596,
"ira-zgr",
ancestors = "hac",
}
m["sdc"] = {
"Sassarese",
845441,
"roa-itr",
"Latn",
}
m["sde"] = {
"Surubu",
3913336,
"nic-kau",
"Latn",
}
m["sdf"] = {
"Sarli",
7424256,
"ira-zgr",
ancestors = "hac",
}
m["sdg"] = {
"Savi",
3474654,
"inc-dng",
}
m["sdh"] = {
"Southern Kurdish",
1496597,
"ku",
"ku-Arab",
translit = "sdh-translit",
strip_diacritics = {remove_diacritics = c.kasra .. c.sukun},
}
m["sdj"] = {
"Suundi",
7650407,
"bnt-kng",
"Latn",
}
m["sdk"] = {
"Sos Kundi",
7563811,
"paa-nnd",
"Latn",
}
m["sdl"] = {
"Saudi Arabian Sign Language",
3504160,
"sgn",
}
m["sdm"] = {
"Semandang",
7449012,
"day",
}
m["sdn"] = {
"Gallurese",
612220,
"roa-itr",
"Latn",
ancestors = "co",
}
m["sdo"] = {
"Bukar-Sadung Bidayuh",
2927799,
"day",
"Latn",
}
m["sdp"] = {
"Sherdukpen",
7494785,
"sit-khm",
}
m["sdr"] = {
"Oraon Sadri",
12953860,
"inc-bih",
}
m["sds"] = {
"Tunisian Berber",
5329732,
"ber",
}
m["sdu"] = {
"Sarudu",
7424700,
"poz-cet",
}
m["sdx"] = {
"Sibu Melanau",
18642842,
"poz-bnn",
}
m["sea"] = {
"Semai",
3135426,
"mkh-asl",
"Latn",
}
-- seb is a duplicate code of spp
m["sec"] = {
"Sechelt",
7442898,
"sal",
"Latn",
}
m["sed"] = {
"Sedang",
56448,
"mkh-nbn",
"Latn",
}
m["see"] = {
"Seneca",
1185133,
"iro-nor",
"Latn",
}
m["sef"] = {
"Cebaara",
10975121,
"alv-snr",
"Latn",
}
m["seg"] = {
"Segeju",
17584599,
"bnt-mij",
"Latn",
}
m["seh"] = {
"Sena",
2964008,
"bnt-sna",
"Latn",
}
m["sei"] = {
"Seri",
36583,
"qfa-iso",
"Latn",
}
m["sej"] = {
"Sene",
7450252,
"ngf-ehu",
"Latn",
}
m["sek"] = {
"Sekani",
28562,
"ath-nor",
"Latn",
}
m["sen"] = {
"Nanerige",
36002,
"alv-sma",
}
m["seo"] = {
"Asaba",
7630513,
"qfa-dis", -- Papuan; isolate or unclassified in Glottolog; Sepik language in Foley (2018)
"Latn",
}
m["sep"] = {
"Sicite",
56787,
"alv-sma",
}
m["seq"] = {
"Senara", -- not to be confused with Syenara (shz)
35210,
"alv-snr",
}
m["ser"] = {
"Serrano",
3479942,
"azc-tak",
"Latn",
}
m["ses"] = {
"Koyraboro Senni",
35655,
"son",
"Latn",
}
m["set"] = {
"Sentani",
3441672,
"paa-sen",
"Latn",
}
m["seu"] = {
"Serui-Laut",
7455503,
"poz-hce",
"Latn",
}
m["sev"] = {
"Nyarafolo",
36306,
"alv-snr",
}
m["sew"] = {
"Sewa Bay",
7458126,
"poz-ocw",
}
m["sey"] = {
"Secoya",
3477218,
"sai-tuc",
"Latn",
}
m["sez"] = {
"Senthang Chin",
7451223,
"tbq-kuk",
}
m["sfb"] = {
"French Belgian Sign Language",
3217332,
"sgn",
}
m["sfe"] = {
"Eastern Subanun",
63311321,
"phi",
"Latn",
}
m["sfm"] = {
"Small Flowery Miao",
7542773,
"hmn",
}
m["sfs"] = {
"South African Sign Language",
3322093,
"sgn",
}
m["sfw"] = {
"Sehwi",
36593,
"alv-ctn",
"Latn",
}
m["sga"] = {
"Old Irish",
35308,
"cel-gae",
"Latn, Ogam",
strip_diacritics = {remove_diacritics = c.dotabove .. c.diaer .. "·"},
sort_key = "sga-sortkey",
standard_chars = "AaÁáBbCcDdEeÉéFfGgHhIiÍíLlMmNnOoÓóPpRrSsTtUuÚú0123456789ᚁᚂᚃᚄᚅᚆᚇᚈᚉᚊᚋᚌᚍᚎᚏᚐᚑᚒᚓᚔ" .. c.punc,
}
m["sgb"] = {
"Mag-Anchi Ayta",
4356243,
"phi",
"Latn",
}
m["sgc"] = {
"Kipsigis",
56339,
"sdv-nma",
}
m["sgd"] = {
"Surigaonon",
34140,
"phi",
"Latn",
}
m["sge"] = {
"Segai",
7446180,
}
m["sgg"] = {
"Swiss-German Sign Language",
35150,
"sgn",
}
m["sgh"] = {
"Shughni",
34053,
"ira-shr",
"Latn, Cyrl",
translit = "sgh-translit",
override_translit = true,
}
m["sgi"] = {
"Suga",
36475,
"nic-mmb",
"Latn",
}
m["sgk"] = {
"Sangkong",
2945610,
"tbq-bis",
}
m["sgm"] = {
"Singa",
7522797,
"bnt-lok",
"Latn",
}
m["sgp"] = {
"Singpho",
7524158,
"sit-jnp",
"Latn",
}
m["sgr"] = {
"Sangisari",
3394363,
"ira-kms",
"Arab",
}
m["sgs"] = {
"Samogitian",
213434,
"bat-eas",
"Latn",
wikimedia_codes = "bat-smg",
ancestors = "olt",
display_text = "lt-common",
strip_diacritics = "lt-common",
sort_key = "lt-common",
}
m["sgt"] = {
"Brokpake",
56603,
"sit-tib",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sgu"] = {
"Salas",
7403694,
"poz-cma",
}
m["sgw"] = {
"Sebat Bet Gurage",
2707343,
"sem-eth",
"Ethi",
}
m["sgx"] = {
"Sierra Leone Sign Language",
7511448,
"sgn",
}
m["sgy"] = {
"Sanglechi",
3472220,
"ira-sgi",
}
m["sgz"] = {
"Sursurunga",
36511,
"poz-ocw",
"Latn",
}
m["sha"] = {
"Shall-Zwall",
3915355,
"nic-beo",
}
m["shb"] = {
"Ninam",
3436586,
"sai-ynm",
"Latn",
}
m["shc"] = {
"Sonde",
7560881,
"bnt-pen",
"Latn",
}
m["shd"] = {
"Kundal Shahi",
6444265,
"inc-shn",
"Arab",
}
m["she"] = {
"Sheko",
3183355,
"omv-diz",
}
m["shg"] = {
"Shua",
3501092,
"khi-kal",
"Latn",
}
m["shh"] = {
"Shoshone",
33811,
"azc-num",
"Latn",
}
m["shi"] = {
"Tashelhit",
34152,
"ber",
"Latn, Arab, Tfng, Hebr",
ancestors = "shi-med",
translit = {
Tfng = "Tfng-translit",
},
strip_diacritics = {
Arab = "ar-stripdiacritics",
},
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["shj"] = {
"Shatt",
56344,
"sdv-daj",
}
m["shk"] = {
"Shilluk",
36486,
"sdv-lon",
"Latn",
}
m["shl"] = {
"Shendu",
22074616,
"tbq-kuk",
}
m["shm"] = {
"Shahrudi",
7462280,
"xme-ttc",
"fa-Arab, Latn",
ancestors = "xme-ttc-cen",
}
m["shn"] = {
"Shan",
56482,
"tai-swe",
"Mymr",
translit = "shn-translit",
sort_key = {
from = {"[ၢႃ]", "ဵ", "ႅ", "ႇ", "ႈ", "း", "ႉ", "ႊ"},
to = {"ာ", "ေ", "ႄ", "႒", "႓", "႔", "႕", "႖"}
},
}
m["sho"] = {
"Shanga",
3913931,
"dmn-bbu",
"Latn",
}
m["shp"] = {
"Shipibo-Conibo",
2671988,
"sai-pan",
"Latn",
}
m["shq"] = {
"Sala",
10961665,
"bnt-bot",
"Latn",
}
m["shr"] = {
"Shi",
3481999,
"bnt-shh",
"Latn",
}
m["shs"] = {
"Shuswap",
3482685,
"sal",
"Latn",
}
m["sht"] = {
"Shasta",
56396,
"nai-shs",
"Latn",
}
-- Chadian Arabic. Unkeyed values are the positional fields of the record;
-- keyed values are optional settings.
m["shu"] = {
"Chadian Arabic",
56497,
"sem-arb",
"Arab",
strip_diacritics = {
-- One string built by joining these entries of `c` (m_langdata.chars);
-- their contents are defined in Module:languages/data, not here.
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
-- Parallel lists pairing code point 0x0671 (ARABIC LETTER ALEF WASLA) with
-- 0x0627 (ARABIC LETTER ALEF). `u` is the lazily loaded `char` function from
-- Module:string utilities; presumably it turns a code point into a string.
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["shv"] = {
"Shehri",
33445,
"sem-sar",
"Arab, Latn",
}
m["shw"] = {
"Shwai",
36527,
"alv-hei",
}
m["shx"] = {
"She",
2605689,
"hmn",
}
m["shy"] = {
"Tachawit",
33274,
"ber",
"Tfng, Arab, Latn",
translit = "Tfng-translit",
}
m["shz"] = {
"Syenara", -- not to be confused with Senara (seq)
36316,
"alv-snr",
}
m["sia"] = {
"Akkala Sami",
35241,
"smi",
"Cyrl, Latn",
translit = "sia-translit",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sib"] = {
"Sebop",
7442799,
"poz-swa",
"Latn",
}
m["sid"] = {
"Sidamo",
33786,
"cus-hec",
"Latn, Ethi",
}
m["sie"] = {
"Simaa",
7517329,
"bnt-kav",
"Latn",
}
m["sif"] = {
"Siamou",
36252,
}
m["sig"] = {
"Paasaal",
36426,
"nic-sis",
"Latn",
}
m["sih"] = {
"Sîshëë",
8072753,
"poz-cln",
"Latn",
}
m["sii"] = {
"Shom Peng",
1039346,
"aav",
}
m["sij"] = {
"Numbami",
3346277,
"poz-ocw",
"Latn",
}
m["sik"] = {
"Sikiana",
3443734,
"sai-prk",
"Latn",
}
m["sil"] = {
"Tumulung Sisaala",
25383006,
"nic-sis",
"Latn",
}
m["sim"] = {
"Mende (New Guinea)",
7446815,
"paa-sep",
"Latn",
}
m["sip"] = {
"Sikkimese",
35285,
"sit-tib",
"Tibt",
ancestors = "xct",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["siq"] = {
"Sonia",
7561770,
"ngf-bos",
"Latn",
}
m["sir"] = {
"Siri",
3438729,
"cdc-wst",
"Latn",
}
m["sis"] = {
"Siuslaw",
2315424,
}
m["siu"] = {
"Sinagen",
7521655,
"paa-wap",
"Latn",
}
m["siv"] = {
"Sumariup",
7636966,
"paa-sep",
"Latn",
}
m["siw"] = {
"Siwai",
7532519,
"paa-sbo",
"Latn",
}
m["six"] = {
"Sumau",
7637021,
"ngf-pek",
"Latn",
}
m["siy"] = {
"Sivandi",
13269,
"xme",
"fa-Arab, Latn",
ancestors = "xme-mid",
}
m["siz"] = {
"Siwi",
36814,
"ber",
"Tfng, Arab, Latn",
}
m["sja"] = {
"Epena",
3055682,
"sai-chc",
"Latn",
}
m["sjb"] = {
"Sajau Basap",
4684353,
"poz-bnn",
}
m["sjc"] = {
"Shaojiang Min",
3431451,
"zhx-inm",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["sjd"] = {
"Kildin Sami",
33656,
"smi",
"Cyrl",
translit = "sjd-translit",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sje"] = {
"Pite Sami",
56314,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
sort_key = "sje-sortkey",
}
m["sjg"] = {
"Assangori",
3502255,
"sdv-tmn",
}
m["sjk"] = {
"Kemi Sami",
35871,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sjl"] = {
"Miji",
6845470,
"sit-hrs",
}
m["sjm"] = {
"Mapun",
3287253,
"poz-sbj",
"Latn",
}
m["sjn"] = {
"Sindarin",
56437,
"art",
"Latn, Teng",
type = "appendix-constructed",
}
m["sjo"] = {
"Xibe",
13223,
"tuw-jrc",
"sjo-Mong",
ancestors = "mnc",
}
m["sjp"] = {
"Surjapuri",
7645351,
"inc-krd",
"Deva, as-Beng, Kthi",
}
m["sjr"] = {
"Siar-Lak",
3482907,
"poz-ocw",
}
-- Senhaja de Srair. Unkeyed values are the positional fields of the record.
m["sjs"] = {
	"Senhaja de Srair",
	56744,
	"ber",
	"Latn, Tfng, Arab",
	-- Settings keyed by script code.
	translit = {Tfng = "Tfng-translit"},
	strip_diacritics = {Arab = "ar-stripdiacritics"},
}
m["sjt"] = {
	"Ter Sami",
	36656,
	"smi",
	"Cyrl, Latn",
	translit = "sjt-translit",
	-- The ASCII apostrophe is mapped to U+02C8 (ˈ) in display_text; both
	-- characters are listed for removal in strip_diacritics.
	display_text = {from = {"'"}, to = {"ˈ"}},
	strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sju"] = {
	"Ume Sami",
	56415,
	"smi",
	"Latn",
	-- The ASCII apostrophe is mapped to U+02C8 (ˈ) in display_text; both
	-- characters, plus the macron from the shared chars table, are listed
	-- for removal in strip_diacritics.
	display_text = {from = {"'"}, to = {"ˈ"}},
	strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
	sort_key = "sju-sortkey",
}
m["sjw"] = {
"Shawnee",
2669206,
"alg",
"Latn",
}
-- [ska] Skagit is treated as part of [lut] Lushootseed
m["skb"] = {
"Saek",
36437,
"tai-nor",
"Thai",
sort_key = "Thai-sortkey",
}
m["skc"] = {
"Ma Manda",
6720783,
"ngf-era",
"Latn",
}
m["skd"] = {
"Southern Sierra Miwok",
3492334,
"nai-utn",
"Latn",
}
m["ske"] = {
"Ske",
7534244,
"poz-vnn",
"Latn",
}
m["skf"] = {
"Mekéns",
3304806,
"tup",
"Latn",
}
m["skh"] = {
"Sikule",
3121081,
"poz-nws",
}
m["ski"] = {
"Sika",
33960,
"poz-cet",
"Latn",
}
m["skj"] = { -- compare 'ths'
"Seke",
30226846,
"sit-tam",
}
m["skk"] = {
"Sok",
12953887,
"mkh-ban",
}
m["skm"] = {
"Sakam",
6448517,
"ngf-uru",
"Latn",
}
m["skn"] = {
"Kolibugan Subanon",
18755617,
"phi",
"Latn",
}
m["sko"] = {
"Seko Tengah",
15613270,
"poz",
}
m["skp"] = {
"Sekapan",
7447132,
"poz-bnn",
}
m["skq"] = {
"Sininkere",
3914896,
"dmn-snb",
"Latn",
}
m["skr"] = {
"Saraiki",
33902,
"inc-pan",
"pa-Arab, Mult, Deva",
strip_diacritics = {remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna},
translit = {
["pa-Arab"] = "pa-Arab-translit",
Deva = "hi-translit",
Mult = "Mult-translit",
},
}
m["sks"] = {
"Maia",
12952760,
"ngf-kau",
"Latn",
}
m["skt"] = {
"Sakata",
36691,
"bnt-bnm",
"Latn",
}
m["sku"] = {
"Sakao",
3298421,
"poz-vnn",
"Latn",
}
m["skv"] = {
"Skou",
3915200,
"paa-isk",
"Latn",
}
m["skw"] = {
"Skepi Creole Dutch",
2522153,
"crp",
"Latn",
ancestors = "nl",
}
m["skx"] = {
"Seko Padang",
15613282,
"poz-ssw",
"Latn",
}
m["sky"] = {
"Sikaiana",
7439242,
"poz-pnp",
"Latn",
}
m["skz"] = {
"Sekar",
7447136,
"poz-cet",
}
m["slc"] = {
"Saliba (Colombia)",
3441097,
-- Explicit nil keeps the third positional slot empty so that "Latn" still
-- lands at index 4. Presumably slot 3 is the family code (compare the
-- neighbouring entries) -- confirm against [[Module:languages]].
nil,
"Latn",
}
m["sld"] = {
"Sisaala",
11020264,
"nic-sis",
"Latn",
}
m["sle"] = {
"Sholaga",
7500203,
"dra-kan",
"Knda",
-- Knda translit in [[Module:scripts/data]]
}
m["slf"] = {
"Swiss-Italian Sign Language",
12953479,
"sgn",
}
m["slg"] = {
"Selungai Murut",
7448844,
"poz-san",
}
-- [slh] Southern Puget Sound Salish is treated as part of [lut] Lushootseed
-- "sli" "Silesian German" IS SUBSUMED INTO "gmw-ecg" "East Central German"
m["slj"] = {
"Salumá",
7406296,
"sai-prk",
"Latn",
}
m["sll"] = {
"Salt-Yui",
7405785,
"ngf-sim",
"Latn",
}
m["slm"] = {
"Pangutaran Sama",
3362086,
"poz-sbj",
"Latn",
}
m["sln"] = {
"Salinan",
1568938,
"qfa-iso",
"Latn",
}
m["slp"] = {
"Lamaholot",
6480777,
"poz-cet",
"Latn",
}
m["slr"] = {
"Salar",
33963,
"trk-ogz",
"Arab, Latn",
ancestors = "trk-eog",
}
m["sls"] = {
"Singapore Sign Language",
7512563,
"sgn",
}
m["slt"] = {
"Sila",
7514021,
"tbq-sil",
}
m["slu"] = {
"Selaru",
7447500,
"poz-cet",
"Latn",
}
m["slw"] = {
"Sialum",
7506694,
"ngf-ehu",
"Latn",
}
m["slx"] = {
"Salampasu",
7403607,
"bnt-lun",
"Latn",
}
m["sly"] = {
"Selayar",
7447520,
"poz-ssw",
}
m["slz"] = {
"Ma'ya",
2291492,
"poz-hce",
"Latn",
}
m["sma"] = {
"Southern Sami",
13293,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
sort_key = "sma-sortkey",
}
m["smb"] = {
"Simbari",
7517427,
"ngf-bsi",
"Latn",
}
m["smc"] = {
"Som",
7559081,
"ngf-uru",
"Latn",
}
m["smd"] = {
"Sama",
6407456,
"bnt-kmb",
"Latn",
}
m["smf"] = {
"Auwe",
3502072,
"paa-war",
"Latn",
ancestors = "dnd",
}
m["smg"] = {
"Simbali",
56692,
"paa-bai",
"Latn",
}
m["smh"] = {
"Samei",
7409269,
"tbq-axi",
}
m["smj"] = {
"Lule Sami",
56322,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
sort_key = "smj-sortkey",
}
m["smk"] = {
"Bolinao",
2669235,
"phi",
"Latn, Tglg",
}
m["sml"] = {
"Central Sama",
3470593,
"poz-sbj",
"Latn",
}
m["smm"] = {
"Musasa",
6940122,
"inc-bih",
}
m["smn"] = {
"Inari Sami",
33462,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.dotbelow .. "'ˈ"},
sort_key = "smn-sortkey",
}
m["smp"] = {
"Samaritan Hebrew",
56502,
"sem-can",
"Samr",
translit = "Samr-translit",
-- Samr strip_diacritics, sort_key in [[Module:scripts/data]]
ancestors = "hbo",
}
m["smq"] = {
"Samo",
7409884,
"ngf-est",
"Latn",
}
m["smr"] = {
"Simeulue",
2992833,
"poz-nws",
"Latn",
}
m["sms"] = {
"Skolt Sami",
13271,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.dotbelow .. "'ˈ"},
sort_key = "sms-sortkey",
}
m["smt"] = {
"Simte",
7521268,
"tbq-kuk",
}
m["smu"] = {
"Somray",
6583612,
"mkh-pea",
}
m["smv"] = {
"Samvedi",
6345632,
"inc-sou",
}
m["smw"] = {
"Sumbawa",
3182585,
"poz-bss",
"Latn",
}
m["smx"] = {
"Samba",
11120157,
"bnt-pen",
"Latn",
}
m["smy"] = {
"Semnani",
14531212,
"xme",
"fa-Arab, Latn",
}
m["smz"] = {
"Simeku",
7517534,
"paa-sbo",
"Latn",
}
m["snb"] = {
"Sebuyau",
7442836,
"poz-mly",
"Latn",
}
m["snc"] = {
"Sinaugoro",
4170719,
"poz-ocw",
"Latn",
}
m["sne"] = {
"Bau Bidayuh",
2891938,
"day",
"Latn",
}
m["snf"] = {
"Noon",
36304,
"alv-cng",
"Latn",
}
m["sng"] = {
"Sanga (Congo)",
3438316,
"bnt-lub",
"Latn",
}
m["sni"] = {
"Sensi",
7451029,
"sai-pan",
"Latn",
}
m["snj"] = {
"Riverain Sango",
25559751,
"crp",
"Latn",
ancestors = "ngb",
}
m["snk"] = {
"Soninke",
36660,
"dmn-snb",
"Latn",
}
m["snl"] = {
"Sangil",
3472206,
"phi",
"Latn",
}
m["snm"] = {
"Southern Ma'di",
15637273,
"csu-mma",
}
m["snn"] = {
"Siona",
3485116,
"sai-tuc",
"Latn",
}
-- [sno] Snohomish is treated as part of [lut] Lushootseed
m["snp"] = {
"Siane",
7506812,
"ngf-gor",
"Latn",
}
m["snq"] = {
"Sangu (Gabon)",
36609,
"bnt-sir",
"Latn",
}
m["snr"] = {
"Sihan",
7513400,
"ngf-gum",
"Latn",
}
m["sns"] = {
"Nahavaq",
2160435,
"poz-vnc",
"Latn",
}
m["snu"] = {
"Senggi",
7929052,
"paa-war",
"Latn",
}
m["snv"] = {
"Sa'ban",
3474891,
"poz-swa",
"Latn",
}
m["snw"] = {
"Selee",
36272,
"alv-ntg",
"Latn",
}
m["snx"] = {
"Sam",
7408387,
"ngf-min",
"Latn",
}
m["sny"] = {
"Saniyo-Hiyewe",
7418302,
"paa-sep",
"Latn",
}
m["snz"] = {
"Kou",
7525035, -- also 4803639
"ngf-eva",
"Latn",
}
m["soa"] = {
"Thai Song",
7709159,
"tai-swe",
"Tavt, Thai",
-- Transliteration is currently disabled for this entry (line left commented out).
--translit = "Tavt-translit",
-- Each `from` pattern captures one character from a fixed set followed by one
-- character from a range; the matching `to` string "%2%1" emits the two
-- captures in swapped order. The first pair covers Tai Viet characters, the
-- second Thai characters.
-- NOTE(review): presumably these are applied as gsub pattern/replacement pairs
-- to move a written-first vowel after its consonant for sorting -- confirm
-- against [[Module:languages]].
sort_key = {
from = {"([ꪵꪶꪹꪻꪼ])([ꪀ-ꪯ])", "([เแโใไ])([ก-ฮ])"},
to = {"%2%1", "%2%1"}
},
}
m["sob"] = {
"Sobei",
3121035,
"poz-ocw",
"Latn",
}
m["soc"] = {
"Soko",
7555138,
"bnt-ske",
"Latn",
}
m["sod"] = {
"Songoora",
7561296,
"bnt-lgb",
"Latn",
}
m["soe"] = {
"Songomeno",
5713543,
"bnt-bsh",
"Latn",
}
m["sog"] = {
"Sogdian",
205979,
"ira-sgc",
"Sogd, Mani, Syrc, Sogo",
translit = {
Sogd = "Sogd-translit",
-- Mani translit in [[Module:scripts/data]]
Sogo = "Sogo-translit",
},
}
m["soh"] = {
"Aka (Sudan)",
3450949,
"sdv-eje",
"Latn",
}
m["soi"] = {
"Sonha",
12953890,
"inc-eas",
}
m["sok"] = {
"Sokoro",
3441303,
"cdc-est",
"Latn",
}
m["sol"] = {
"Solos",
3489591,
"poz-ocw",
}
m["soo"] = {
"Nsong",
12953148,
"bnt-bdz",
"Latn",
}
m["sop"] = {
"Songe",
3130911,
"bnt-lbn",
"Latn",
}
m["soq"] = {
"Kanasi",
11732656,
"ngf-dag",
"Latn",
}
m["sor"] = {
"Somrai",
3123566,
"cdc-est",
"Latn",
}
m["sos"] = {
"Seenku",
36274,
"dmn-smg",
}
m["sou"] = {
"Southern Thai",
56508,
"tai-swe",
"Thai",
sort_key = "Thai-sortkey",
}
m["sov"] = {
"Sonsorolese",
13281,
"poz-mic",
"Latn",
}
m["sow"] = {
"Sowanda",
7571845,
"paa-war",
"Latn",
}
m["sox"] = {
"Swo",
36604,
"bnt-mka",
"Latn",
}
m["soy"] = {
"Miyobe",
35913,
"alv-sav",
"Latn",
}
m["soz"] = {
"Temi",
13278,
"bnt-kka",
"Latn",
}
m["spb"] = {
"Sepa (Indonesia)",
18603687,
"poz-cma",
"Latn",
}
m["spc"] = {
"Sapé",
2888158,
-- Explicit nil keeps the third positional slot empty so that "Latn" still
-- lands at index 4. Presumably slot 3 is the family code (compare the
-- neighbouring entries) -- confirm against [[Module:languages]].
nil,
"Latn",
}
m["spd"] = {
"Saep",
7398312,
"ngf-yag",
"Latn",
}
m["spe"] = {
"Sepa (New Guinea)",
7451725,
"poz-ocw",
"Latn",
}
m["spg"] = {
"Sian",
7506806,
"poz-bnn",
}
m["spi"] = {
"Saponi",
3915418,
"paa-rsa",
"Latn",
}
m["spk"] = {
"Sengo",
7450584,
"paa-nnd",
"Latn",
}
m["spl"] = {
"Selepet",
7447917,
"ngf-kab",
"Latn",
}
m["spm"] = {
"Sepen",
4701931,
"paa-rub",
"Latn",
}
m["spn"] = {
"Sanapaná",
3033556,
"sai-mas",
"Latn",
}
m["spo"] = {
"Spokane",
3493704,
"sal",
}
m["spp"] = {
"Supyire",
56284,
"alv-sma",
"Latn",
}
m["spr"] = {
"Saparua",
7420921,
"poz-cma",
"Latn",
}
m["sps"] = {
"Saposa",
3473187,
"poz-ocw",
}
m["spt"] = {
"Spiti Bhoti",
22080879,
"sit-las",
}
m["spu"] = {
"Sapuan",
7421168,
"mkh-ban",
}
m["spv"] = {
"Sambalpuri",
6433240,
"inc-eas",
"Orya",
translit = "or-translit",
ancestors = "or",
}
m["spx"] = {
"South Picene",
36688,
"itc-sbl",
"Ital, Latn",
-- Ital translit in [[Module:scripts/data]]
display_text = {
Latn = s["itc-Latn-displaytext"]
},
strip_diacritics = {
Latn = s["itc-Latn-stripdiacritics"],
},
sort_key = {
Latn = s["itc-Latn-sortkey"],
},
}
m["spy"] = {
"Sabaot",
7395896,
"sdv-kln",
}
m["sqa"] = {
"Shama-Sambuga",
3914392,
"nic-kmk",
"Latn",
}
m["sqh"] = {
"Shau",
3913925,
"nic-jer",
"Latn",
}
m["sqk"] = {
"Albanian Sign Language",
4709168,
"sgn",
}
m["sqm"] = {
"Suma",
11008431,
"gba-wes",
}
m["sqn"] = {
"Susquehannock",
3505736,
"iro-nor",
}
m["sqo"] = {
"Sorkhei",
3491964,
"ira-kms",
}
m["sqq"] = {
"Sou",
16979751,
"mkh-ban",
}
m["sqr"] = {
"Siculo-Arabic",
1069489,
"sem-arb",
"Arab",
}
m["sqs"] = {
"Sri Lankan Sign Language",
3915466,
"sgn",
}
m["sqt"] = {
"Soqotri",
13283,
"sem-sar",
"Arab, Latn",
}
m["squ"] = {
"Squamish",
2484579,
"sal",
"Latn",
}
m["sra"] = {
"Saruga",
7424699,
"ngf-han",
"Latn",
}
m["srb"] = {
"Sora",
13284,
"mun",
"Sora, Latn, Orya",
}
m["sre"] = {
"Sara",
33957,
"day",
}
m["srf"] = {
"Nafi",
6958174,
"poz-ocw",
}
m["srg"] = {
"Sulod",
7636489,
"phi",
}
m["srh"] = {
"Sarikoli",
33873,
"ira-shr",
"Latn, ug-Arab, Cyrl",
}
m["sri"] = {
"Siriano",
3485264,
"sai-tuc",
"Latn",
}
m["srk"] = {
"Serudung Murut",
7455497,
"poz-san",
}
m["srl"] = {
"Isirawa",
4203802,
"paa-gkw",
"Latn",
}
m["srm"] = {
"Saramaccan",
33779,
"crp",
"Latn",
ancestors = "en, pt",
}
m["srn"] = {
"Sranan Tongo",
33989,
"crp",
"Latn",
ancestors = "en",
}
m["srq"] = {
"Sirionó",
3027953,
"tup-gua",
"Latn",
}
m["srr"] = {
"Serer",
36284,
"alv-fwo",
"Latn",
}
m["srs"] = {
"Tsuut'ina",
20825,
"ath-nor",
"Latn",
}
m["srt"] = {
"Sauri",
7427547,
"paa-egb",
"Latn",
}
m["sru"] = {
"Suruí",
7646993,
"tup",
"Latn",
}
m["srv"] = {
"Waray Sorsogon",
18755610,
"phi",
"Latn",
}
m["srw"] = {
"Serua",
14916905,
"poz-cet",
}
m["srx"] = {
"Sirmauri",
7530505,
"him",
}
m["sry"] = {
"Sera",
7452602,
"poz-ocw",
"Latn",
}
m["srz"] = {
"Shahmirzadi",
12953126,
"ira-msh",
"fa-Arab",
}
m["ssb"] = {
"Southern Sama",
3470594,
"poz-sbj",
"Latn",
}
m["ssc"] = {
"Suba-Simbiti",
7630687,
"bnt-lok",
"Latn",
}
m["ssd"] = {
"Siroi",
10771067,
"ngf-rai",
"Latn",
}
m["sse"] = {
"Balangingi",
2880535,
"poz-sbj",
"Latn",
}
m["ssf"] = {
"Thao",
676492,
"map",
"Latn",
}
m["ssg"] = {
"Seimat",
3182581,
"poz-aay",
"Latn",
}
m["ssh"] = {
"Shihhi Arabic",
56571,
"sem-arb",
"Arab",
strip_diacritics = {
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["ssi"] = {
"Sansi",
3309366,
"inc-nwe",
}
m["ssj"] = {
"Sausi",
7427605,
"ngf-eva",
"Latn",
}
m["ssk"] = {
"Sunam",
11002210,
"sit-kin",
}
m["ssl"] = {
"Western Sisaala",
11154776,
"nic-sis",
"Latn",
}
m["ssm"] = {
"Semnam",
7449713,
"mkh-asl",
"Latn",
}
m["sso"] = {
"Sissano",
7530937,
"poz-ocw",
"Latn",
}
m["ssp"] = {
"Spanish Sign Language",
3100814,
"sgn",
}
m["ssq"] = {
"So'a",
7572120,
"poz-cet",
"Latn",
}
m["ssr"] = {
"Swiss-French Sign Language",
12953483,
"sgn",
}
m["sss"] = {
"Sô",
3082037,
"mkh-kat",
}
m["sst"] = {
"Sinasina",
7521813,
"ngf-sim",
"Latn",
}
m["ssu"] = {
"Susuami",
7649752,
"ngf-woj",
"Latn",
}
m["ssv"] = {
"Shark Bay",
7489783,
"poz-vnn",
"Latn",
}
m["ssx"] = {
"Samberigi",
7409020,
"ngf-sak",
"Latn",
}
m["ssy"] = {
"Saho",
36353,
"cus-eas",
"Latn, Ethi, Arab",
}
m["ssz"] = {
"Sengseng",
7450601,
"poz-ocw",
"Latn",
}
m["stb"] = {
"Northern Subanen",
12953892,
"phi",
"Latn",
}
m["std"] = {
"Sentinelese",
568377,
"qfa-unc", -- presumed Ongan
}
m["ste"] = {
"Liana-Seti",
6539924,
"poz-cma",
}
m["stf"] = {
"Seta",
7456326,
"paa-trr",
"Latn",
}
m["stg"] = {
"Trieng",
22694648,
"mkh-ban",
}
m["sth"] = {
"Shelta",
36705,
"qfa-mix",
"Latn",
ancestors = "ga, en",
}
m["sti"] = {
"Bulo Stieng",
15771431,
"mkh-ban",
"Khmr, Latn",
}
m["stj"] = {
"Matya Samo",
10974879,
"dmn-sam",
"Latn",
}
m["stk"] = {
"Arammba",
3502094,
"paa-ton",
"Latn",
}
m["stm"] = {
"Setaman",
7456333,
"ngf-mok",
"Latn",
}
m["stn"] = {
"Owa",
1324132,
"poz-sls",
"Latn",
}
m["sto"] = {
"Stoney",
3033570,
"sio-dkt",
"Latn",
}
m["stp"] = {
"Southeastern Tepehuan",
12953917,
"azc-pim",
"Latn",
}
m["stq"] = {
"Saterland Frisian",
27154,
"gmw-fri",
"Latn",
}
m["str"] = {
"Saanich",
36444,
"sal",
"Latn",
}
m["sts"] = {
"Shumashti",
33777,
"inc-kun",
"Arab",
}
m["stt"] = {
"Budeh Stieng",
12953891,
"mkh-ban",
}
m["stu"] = {
"Samtao",
25559550,
"mkh-pal",
}
m["stv"] = {
"Silt'e",
33880,
"sem-eth",
"Ethi",
}
m["stw"] = {
"Satawalese",
28477,
"poz-mic",
"Latn",
}
m["sty"] = {
"Siberian Tatar",
4418344,
"trk-kno",
"Cyrl",
}
m["sua"] = {
"Sulka",
7636341,
"qfa-iso", -- Papuan; isolate in Glottolog and Palmer (2018)
"Latn",
}
m["sub"] = {
"Suku",
12953160,
"bnt-yak",
"Latn",
}
m["suc"] = {
"Western Subanon",
16113894,
"phi",
"Latn",
}
m["sue"] = {
"Suena",
7634386,
"ngf-nbi",
"Latn",
}
m["sug"] = {
"Suganga",
7634706,
"ngf-msu",
"Latn",
}
m["sui"] = {
"Suki",
2089984,
"ngf-gsu",
"Latn",
}
m["suk"] = {
"Sukuma",
2638144,
"bnt-tkm",
"Latn",
}
m["suo"] = {
"Bouni",
65043887,
"paa-pio",
"Latn",
}
m["suq"] = {
"Suri",
5364172,
"sdv",
}
m["sur"] = {
"Mwaghavul",
3440486,
"cdc-wst",
"Latn",
}
m["sus"] = {
"Susu",
33990,
"dmn-sya",
"Latn",
}
m["sut"] = {
"Subtiaba",
3915405,
"omq",
"Latn",
}
m["suv"] = {
"Puroik",
56408,
"sit-khb",
"Beng, Deva, Latn",
ancestors = "sit-khp-pro",
}
m["suw"] = {
"Sumbwa",
7637055,
"bnt-glb",
"Latn",
}
m["sux"] = {
"Sumerian",
36790,
"qfa-iso",
"Xsux, Latn",
}
m["suy"] = {
"Suyá",
3505859,
"sai-nje",
"Latn",
}
m["suz"] = {
	"Sunwar",
	56549,
	"sit-kiw",
	-- Trailing comma added to match every other entry, so that appending a
	-- field later cannot produce a syntax error.
	"Deva, Sunu",
}
m["sva"] = {
"Svan",
34067,
"ccs",
"Geor, Cyrl",
translit = {
Geor = "sva-translit",
},
override_translit = true,
}
m["svb"] = {
"Ulau-Suain",
7878769,
"poz-ocw",
"Latn",
}
m["svc"] = {
"Vincentian Creole English",
3501785,
"crp",
"Latn",
ancestors = "en",
}
m["sve"] = {
"Serili",
7454834,
"poz-tim",
}
m["svk"] = {
"Slovakian Sign Language",
7541557,
"sgn",
}
m["svm"] = {
"Slavomolisano",
36254,
"zls",
"Latn",
ancestors = "sh",
}
m["svs"] = {
"Savosavo",
3130296,
"qfa-dis", -- Papuan; isolate in Glottolog; in the tentative Central Solomons family by Ross (2005) and Pedrós
-- (2015)
"Latn",
}
m["svx"] = {
"Skalvian",
3486125,
"bat-wes",
"Latn",
}
m["swb"] = {
"Maore Comorian",
34075,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["swf"] = {
"Sere",
7453056,
"nic-ser",
"Latn",
}
m["swg"] = {
"Swabian",
327274,
"gmw-hgm",
"Latn",
ancestors = "gsw",
}
m["swi"] = {
"Sui",
3112388,
"qfa-kms",
"Latn, Shui, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["swj"] = {
"Sira",
36599,
"bnt-sir",
"Latn",
}
m["swl"] = {
"Swedish Sign Language",
36558,
"sgn",
}
m["swm"] = {
"Samosa",
7410037,
"ngf-nwh",
"Latn",
}
m["swn"] = {
"Sokna",
2988323,
"ber",
}
m["swo"] = {
"Shanenawa",
61974839,
"sai-pan",
"Latn",
}
m["swp"] = {
"Suau",
3502368,
"poz-ocw",
}
m["swq"] = {
"Sharwa",
56791,
"cdc-cbm",
"Latn",
}
m["swr"] = {
"Saweru",
3474649,
"paa-ysa",
"Latn",
}
m["sws"] = {
"Seluwasan",
7448845,
"poz-cet",
}
m["swt"] = {
"Sawila",
7428639,
"paa-alp",
"Latn",
}
m["swu"] = {
"Suwawa",
7650588,
"phi",
}
m["sww"] = {
"Sowa",
7571843,
"poz-vnn",
"Latn",
}
m["swx"] = {
"Suruahá",
3114402,
"auf",
}
m["swy"] = {
"Sarua",
56261,
"cdc-est",
"Latn",
}
m["sxb"] = {
"Suba",
33916,
"bnt-lok",
"Latn",
}
m["sxc"] = {
"Sicanian",
36335,
"qfa-unc", -- extinct; lack of data: only names deciphered
"Polyt",
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sxe"] = {
"Sighu",
36431,
"bnt-kel",
"Latn",
}
m["sxg"] = {
"Shixing",
56337,
"sit-nax",
"Latn",
}
m["sxk"] = {
"Southern Kalapuya",
3192122,
"nai-klp",
}
m["sxl"] = {
"Selonian",
36491,
"bat-eas",
"Latn",
}
m["sxm"] = {
"Samre",
6583615,
"mkh-pea",
}
m["sxn"] = {
"Sangir",
25714758,
"phi",
"Latn",
}
m["sxo"] = {
"Sorothaptic",
2762254,
}
m["sxr"] = {
"Saaroa",
716599,
"map",
"Latn",
}
m["sxs"] = {
"Sasaru",
3913384,
"alv-yek",
"Latn",
}
-- "sxu" "Upper Saxon" IS SUBSUMED INTO "gmw-ecg" "East Central German"
m["sxw"] = {
"Saxwe Gbe",
7428892,
"alv-pph",
"Latn",
}
m["sya"] = {
"Siang",
3482903,
}
m["syb"] = {
"Central Subanen",
12953893,
"phi",
"Latn",
}
m["syc"] = {
"Classical Syriac",
33538,
"sem-are",
"Syrc",
strip_diacritics = {remove_diacritics = c.macron .. c.diaer .. c.macronbelow .. u(0x0730) .. "-" .. u(0x0748)},
}
m["syi"] = {
"Seki",
36547,
"bnt-kel",
"Latn",
}
m["syk"] = {
"Sukur",
56292,
"cdc-cbm",
"Latn",
}
m["syl"] = {
"Sylheti",
2044560,
"inc-bas",
"Sylo, Beng",
ancestors = "inc-obn",
translit = "syl-translit",
}
m["sym"] = {
"Maya Samo",
10950421,
"dmn-sam",
"Latn",
}
m["syn"] = {
"Senaya",
33914,
"sem-nna",
}
m["syo"] = {
"Suoy",
7641864,
"mkh-pea",
}
m["sys"] = {
"Sinyar",
56840,
"csu",
"Latn",
}
m["syw"] = {
"Kagate",
12952538,
"sit-kyk",
"Deva",
}
m["syx"] = {
"Osamayi",
7408415,
"bnt-kel",
"Latn",
}
m["syy"] = {
"Al-Sayyid Bedouin Sign Language",
2915457,
"sgn",
}
m["sza"] = {
"Semelai",
3111827,
"mkh-asl",
"Latn",
}
m["szb"] = {
"Ngalum",
11732516,
"ngf-okk",
"Latn",
}
m["szc"] = {
"Semaq Beri",
7449119,
"mkh-asl",
}
m["szd"] = {
"Seru",
7455488,
"poz-bnn",
"Latn",
}
m["sze"] = {
"Seze",
373683,
"omv-mao",
"Latn",
}
m["szg"] = {
"Sengele",
7450555,
"bnt-mon",
"Latn",
}
m["szl"] = {
"Silesian",
30319,
"zlw-lch",
"Latn",
ancestors = "zlw-opl",
}
m["szn"] = {
"Sula",
3503403,
"poz-cma",
"Latn",
}
m["szp"] = {
"Suabo",
7630429,
"ngf-sbh",
"Latn",
}
m["szv"] = {
"Isubu",
35431,
"bnt-saw",
"Latn",
}
m["szw"] = {
"Sawai",
3447258,
"poz-hce",
"Latn",
}
m["szy"] = {
"Sakizaya",
718269,
"map",
"Latn",
}
return require("Module:languages").finalizeData(m, "language")
5q1vkgr7iqfj6q1fxha4dbfhok7eo7v
234887
234886
2026-05-24T09:46:01Z
Lee
19
[[:en:Module:languages/data/3/s]] වෙතින් එක් සංශෝධනයක්
234886
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy wrapper around the `char` function of [[Module:string utilities]].
-- Loaded on demand, as it may not be needed (depending on the data).
-- The first call rebinds the local `u` to the real `char` function and then
-- forwards its arguments to it; every later call through `u` goes straight to
-- that function without passing through this wrapper or `require` again.
-- In this file it is only called with a single numeric argument, e.g.
-- u(0x0671); presumably that is a Unicode code point and the result is the
-- corresponding character -- confirm against [[Module:string utilities]].
local function u(...)
u = require("Module:string utilities").char
return u(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["saa"] = {
"Saba",
3914885,
"cdc-est",
"Latn",
}
m["sab"] = {
"Buglere",
3368506,
"cba",
"Latn",
}
m["sac"] = {
"Fox",
12714767,
"alg-sfk",
"Latn",
}
m["sad"] = {
"Sandawe",
34016,
"qfa-iso",
"Latn",
}
m["sae"] = {
"Sabanê",
3460478,
"sai-nmk",
"Latn",
}
m["saf"] = {
"Safaliba",
36432,
"nic-mre",
"Latn",
}
m["sah"] = {
"Yakut",
34299,
"trk-nsb",
"Cyrl",
translit = "sah-translit",
override_translit = true,
}
m["saj"] = {
"Sahu",
7399757,
"paa-sah",
"Latn",
}
m["sak"] = {
"Sake",
36425,
"bnt-kel",
"Latn",
}
m["sam"] = {
"Samaritan Aramaic",
56612,
"sem-arw",
"Samr",
translit = "Samr-translit",
-- Samr strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sao"] = {
"Sause",
4409155,
"qfa-dis", -- isolate per Glottolog, possibly related to Kapauri in a Kapauri-Sause family under Greater Kwerba
"Latn",
}
m["saq"] = {
"Samburu",
56536,
"sdv-lma",
}
m["sar"] = {
"Saraveca",
3450556,
"awd",
"Latn",
}
m["sas"] = {
"Sasak",
1294047,
"poz-bss",
"Latn, Bali, Java",
}
m["sat"] = {
"Santali",
33965,
"mun",
"Olck",
translit = "Olck-translit",
override_translit = true,
}
m["sau"] = {
"Saleman",
7404262,
"poz-cet",
}
m["sav"] = {
"Saafi-Saafi",
36308,
"alv-cng",
"Arab, Latn",
}
m["saw"] = {
"Sawi",
677064,
"ngf-awd",
"Latn",
}
m["sax"] = {
"Sa",
3460352,
"poz-vnn",
"Latn",
}
m["say"] = {
"Saya",
3914431,
"cdc-wst",
"Latn",
}
m["saz"] = {
"Saurashtra",
13292,
"inc-wes",
"Saur, Latn, Taml, Deva",
translit = "saz-translit",
ancestors = "inc-ogu",
}
m["sba"] = {
"Ngambay",
2372207,
"csu-sar",
"Latn",
}
m["sbb"] = {
"Simbo",
3484101,
"poz-ocw",
}
m["sbc"] = {
"Gele'",
3194847,
"poz-aay",
"Latn",
}
m["sbd"] = {
"Southern Samo",
33122730,
"dmn-sam",
"Latn",
}
m["sbe"] = {
"Saliba (New Guinea)",
3469737,
"poz-ocw",
}
m["sbf"] = {
"Shabo",
36342,
"ssa",
"Latn",
}
m["sbg"] = {
"Seget",
7446237,
"paa-wbh",
"Latn",
}
m["sbh"] = {
"Sori-Harengan",
36515,
"poz-aay",
"Latn",
}
m["sbi"] = {
"Seti",
7456682,
"paa-trr",
"Latn",
}
m["sbj"] = {
"Surbakhal",
759995,
}
m["sbk"] = {
"Safwa",
4121160,
"bnt-mby",
"Latn",
}
m["sbl"] = {
"Botolan Sambal",
4095195,
"phi",
"Latn",
}
m["sbm"] = {
"Sagala",
11732610,
"bnt-ruv",
"Latn",
}
m["sbn"] = {
"Sindhi Bhil",
25559289,
"inc-snd",
"Arab, Deva, Sind, Guru",
ancestors = "sd",
}
m["sbo"] = {
"Sabüm",
7396535,
"mkh-asl",
}
m["sbp"] = {
"Sangu (Tanzania)",
7418149,
"bnt-bki",
"Latn",
}
m["sbq"] = {
"Sirva",
7514337,
"ngf-nso",
"Latn",
}
m["sbr"] = {
"Sembakung Murut",
7449148,
"poz-san",
}
m["sbs"] = {
"Subiya",
6442073,
"bnt-bot",
"Latn",
}
m["sbt"] = {
"Kimki",
6410160,
"qfa-dis", -- Papuan; Glottolog and Foley treat as an isolate, Usher puts in South Pauwasi
"Latn",
}
m["sbu"] = {
"Stod Bhoti",
15622700,
"sit-las",
}
m["sbv"] = {
"Sabine",
65455885,
"itc-sbl",
"Latn",
display_text = s["itc-Latn-displaytext"],
strip_diacritics = s["itc-Latn-stripdiacritics"],
sort_key = s["itc-Latn-sortkey"],
}
m["sbw"] = {
"Simba",
36430,
"bnt-tso",
"Latn",
}
m["sbx"] = {
"Seberuang",
12473470,
"poz-mly",
}
m["sby"] = {
"Soli",
7557754,
"bnt-bot",
"Latn",
}
m["sbz"] = {
"Sara Kaba",
25559318,
"csu-kab",
"Latn",
}
m["scb"] = {
"Chut",
2967709,
"mkh-vie",
"Latn",
}
m["sce"] = {
"Dongxiang",
32947,
"xgn-shr",
"Arab, Latn",
}
m["scf"] = {
"San Miguel Creole French",
12953094,
"crp",
"Latn",
ancestors = "gcf",
sort_key = s["roa-oil-sortkey"],
}
m["scg"] = {
"Sanggau",
12473466,
"day",
}
m["sch"] = {
"Sakachep",
37054,
"tbq-kuk",
}
m["sci"] = {
"Sri Lankan Creole Malay",
1089151,
"crp",
"Latn",
ancestors = "ms",
}
m["sck"] = {
"Sadri",
765922,
"inc-bih",
"Deva, Kthi",
translit = {
Deva = "hi-translit",
Kthi = "bho-Kthi-translit",
},
}
m["scl"] = {
"Shina",
1353320,
"inc-shn",
"ur-Arab, Deva",
}
m["scn"] = {
	"Sicilian",
	33973,
	"roa-itr",
	"Latn",
	-- Named fields come after the positional ones, as in every other entry.
	-- Lua numbers positional items consecutively regardless of interleaved
	-- named keys, so "Latn" was already item 4; this only removes a
	-- misleading layout.
	ancestors = "scn-old",
}
m["sco"] = {
"Scots",
14549,
"gmw-ang",
"Latn",
ancestors = "gmw-msc",
}
m["scp"] = {
"Yolmo",
22662107,
"sit-kyk",
"Deva",
}
m["scq"] = {
"Sa'och",
6583617,
"mkh-pea",
}
m["scs"] = {
"North Slavey",
20628,
"den",
"Latn",
}
m["scu"] = {
"Shumcho",
22077739,
"sit-kin",
}
m["scv"] = {
"Sheni",
11015820,
"nic-jer",
"Latn",
ancestors = "zir",
}
m["scw"] = {
"Sha",
3438816,
"cdc-wst",
"Latn",
}
m["scx"] = {
"Sicel",
36667,
"itc",
"Polyt",
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["scz"] = {
	"Shetland",
	3069598,
	"qfa-mix",
	"Latn",
	ancestors = "nrn, gmw-msc",
	-- A-Z/a-z plus Ø, Ö and Ü in both cases, the digits, and the shared
	-- punctuation set. The list previously read "Öü", which omitted "ö" and
	-- listed "ü" twice.
	standard_chars = "AaBbCcDdEeFfGgHhIiJjKkLlMmNnOoPpQqRrSsTtUuVvWwXxYyZzØøÖöÜü0123456789" .. c.punc,
}
m["sda"] = {
"Toraja-Sa'dan",
36673,
"poz-ssw",
"Latn",
}
m["sdb"] = {
"Shabak",
3289596,
"ira-zgr",
ancestors = "hac",
}
m["sdc"] = {
"Sassarese",
845441,
"roa-itr",
"Latn",
}
m["sde"] = {
"Surubu",
3913336,
"nic-kau",
"Latn",
}
m["sdf"] = {
"Sarli",
7424256,
"ira-zgr",
ancestors = "hac",
}
m["sdg"] = {
"Savi",
3474654,
"inc-dng",
}
m["sdh"] = {
"Southern Kurdish",
1496597,
"ku",
"ku-Arab",
translit = "sdh-translit",
strip_diacritics = {remove_diacritics = c.kasra .. c.sukun},
}
m["sdj"] = {
"Suundi",
7650407,
"bnt-kng",
"Latn",
}
m["sdk"] = {
"Sos Kundi",
7563811,
"paa-nnd",
"Latn",
}
m["sdl"] = {
"Saudi Arabian Sign Language",
3504160,
"sgn",
}
m["sdm"] = {
"Semandang",
7449012,
"day",
}
m["sdn"] = {
"Gallurese",
612220,
"roa-itr",
"Latn",
ancestors = "co",
}
m["sdo"] = {
"Bukar-Sadung Bidayuh",
2927799,
"day",
"Latn",
}
m["sdp"] = {
"Sherdukpen",
7494785,
"sit-khm",
}
m["sdr"] = {
"Oraon Sadri",
12953860,
"inc-bih",
}
m["sds"] = {
"Tunisian Berber",
5329732,
"ber",
}
m["sdu"] = {
"Sarudu",
7424700,
"poz-cet",
}
m["sdx"] = {
"Sibu Melanau",
18642842,
"poz-bnn",
}
m["sea"] = {
"Semai",
3135426,
"mkh-asl",
"Latn",
}
-- seb is a duplicate code of spp
m["sec"] = {
"Sechelt",
7442898,
"sal",
"Latn",
}
m["sed"] = {
"Sedang",
56448,
"mkh-nbn",
"Latn",
}
m["see"] = {
"Seneca",
1185133,
"iro-nor",
"Latn",
}
m["sef"] = {
"Cebaara",
10975121,
"alv-snr",
"Latn",
}
m["seg"] = {
"Segeju",
17584599,
"bnt-mij",
"Latn",
}
m["seh"] = {
"Sena",
2964008,
"bnt-sna",
"Latn",
}
m["sei"] = {
"Seri",
36583,
"qfa-iso",
"Latn",
}
m["sej"] = {
"Sene",
7450252,
"ngf-ehu",
"Latn",
}
m["sek"] = {
"Sekani",
28562,
"ath-nor",
"Latn",
}
m["sen"] = {
"Nanerige",
36002,
"alv-sma",
}
m["seo"] = {
"Asaba",
7630513,
"qfa-dis", -- Papuan; isolate or unclassified in Glottolog; Sepik language in Foley (2018)
"Latn",
}
m["sep"] = {
"Sicite",
56787,
"alv-sma",
}
m["seq"] = {
"Senara", -- not to be confused with Syenara (shz)
35210,
"alv-snr",
}
m["ser"] = {
"Serrano",
3479942,
"azc-tak",
"Latn",
}
m["ses"] = {
"Koyraboro Senni",
35655,
"son",
"Latn",
}
m["set"] = {
"Sentani",
3441672,
"paa-sen",
"Latn",
}
m["seu"] = {
"Serui-Laut",
7455503,
"poz-hce",
"Latn",
}
m["sev"] = {
"Nyarafolo",
36306,
"alv-snr",
}
m["sew"] = {
"Sewa Bay",
7458126,
"poz-ocw",
}
m["sey"] = {
"Secoya",
3477218,
"sai-tuc",
"Latn",
}
m["sez"] = {
"Senthang Chin",
7451223,
"tbq-kuk",
}
m["sfb"] = {
"French Belgian Sign Language",
3217332,
"sgn",
}
m["sfe"] = {
"Eastern Subanun",
63311321,
"phi",
"Latn",
}
m["sfm"] = {
"Small Flowery Miao",
7542773,
"hmn",
}
m["sfs"] = {
"South African Sign Language",
3322093,
"sgn",
}
m["sfw"] = {
"Sehwi",
36593,
"alv-ctn",
"Latn",
}
m["sga"] = {
"Old Irish",
35308,
"cel-gae",
"Latn, Ogam",
strip_diacritics = {remove_diacritics = c.dotabove .. c.diaer .. "·"},
sort_key = "sga-sortkey",
standard_chars = "AaÁáBbCcDdEeÉéFfGgHhIiÍíLlMmNnOoÓóPpRrSsTtUuÚú0123456789ᚁᚂᚃᚄᚅᚆᚇᚈᚉᚊᚋᚌᚍᚎᚏᚐᚑᚒᚓᚔ" .. c.punc,
}
m["sgb"] = {
"Mag-Anchi Ayta",
4356243,
"phi",
"Latn",
}
m["sgc"] = {
"Kipsigis",
56339,
"sdv-nma",
}
m["sgd"] = {
"Surigaonon",
34140,
"phi",
"Latn",
}
m["sge"] = {
"Segai",
7446180,
}
m["sgg"] = {
"Swiss-German Sign Language",
35150,
"sgn",
}
m["sgh"] = {
"Shughni",
34053,
"ira-shr",
"Latn, Cyrl",
translit = "sgh-translit",
override_translit = true,
}
m["sgi"] = {
"Suga",
36475,
"nic-mmb",
"Latn",
}
m["sgk"] = {
"Sangkong",
2945610,
"tbq-bis",
}
m["sgm"] = {
"Singa",
7522797,
"bnt-lok",
"Latn",
}
m["sgp"] = {
"Singpho",
7524158,
"sit-jnp",
"Latn",
}
m["sgr"] = {
"Sangisari",
3394363,
"ira-kms",
"Arab",
}
m["sgs"] = {
"Samogitian",
213434,
"bat-eas",
"Latn",
wikimedia_codes = "bat-smg",
ancestors = "olt",
display_text = "lt-common",
strip_diacritics = "lt-common",
sort_key = "lt-common",
}
m["sgt"] = {
"Brokpake",
56603,
"sit-tib",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sgu"] = {
"Salas",
7403694,
"poz-cma",
}
m["sgw"] = {
"Sebat Bet Gurage",
2707343,
"sem-eth",
"Ethi",
}
m["sgx"] = {
"Sierra Leone Sign Language",
7511448,
"sgn",
}
m["sgy"] = {
"Sanglechi",
3472220,
"ira-sgi",
}
m["sgz"] = {
"Sursurunga",
36511,
"poz-ocw",
"Latn",
}
m["sha"] = {
"Shall-Zwall",
3915355,
"nic-beo",
}
m["shb"] = {
"Ninam",
3436586,
"sai-ynm",
"Latn",
}
m["shc"] = {
"Sonde",
7560881,
"bnt-pen",
"Latn",
}
m["shd"] = {
"Kundal Shahi",
6444265,
"inc-shn",
"Arab",
}
m["she"] = {
"Sheko",
3183355,
"omv-diz",
}
m["shg"] = {
"Shua",
3501092,
"khi-kal",
"Latn",
}
m["shh"] = {
"Shoshone",
33811,
"azc-num",
"Latn",
}
m["shi"] = {
"Tashelhit",
34152,
"ber",
"Latn, Arab, Tfng, Hebr",
ancestors = "shi-med",
translit = {
Tfng = "Tfng-translit",
},
strip_diacritics = {
Arab = "ar-stripdiacritics",
},
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["shj"] = {
"Shatt",
56344,
"sdv-daj",
}
m["shk"] = {
"Shilluk",
36486,
"sdv-lon",
"Latn",
}
m["shl"] = {
"Shendu",
22074616,
"tbq-kuk",
}
m["shm"] = {
"Shahrudi",
7462280,
"xme-ttc",
"fa-Arab, Latn",
ancestors = "xme-ttc-cen",
}
m["shn"] = {
"Shan",
56482,
"tai-swe",
"Mymr",
translit = "shn-translit",
sort_key = {
from = {"[ၢႃ]", "ဵ", "ႅ", "ႇ", "ႈ", "း", "ႉ", "ႊ"},
to = {"ာ", "ေ", "ႄ", "႒", "႓", "႔", "႕", "႖"}
},
}
m["sho"] = {
"Shanga",
3913931,
"dmn-bbu",
"Latn",
}
m["shp"] = {
"Shipibo-Conibo",
2671988,
"sai-pan",
"Latn",
}
m["shq"] = {
"Sala",
10961665,
"bnt-bot",
"Latn",
}
m["shr"] = {
"Shi",
3481999,
"bnt-shh",
"Latn",
}
m["shs"] = {
"Shuswap",
3482685,
"sal",
"Latn",
}
m["sht"] = {
"Shasta",
56396,
"nai-shs",
"Latn",
}
m["shu"] = {
"Chadian Arabic",
56497,
"sem-arb",
"Arab",
strip_diacritics = {
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["shv"] = {
"Shehri",
33445,
"sem-sar",
"Arab, Latn",
}
m["shw"] = {
"Shwai",
36527,
"alv-hei",
}
m["shx"] = {
"She",
2605689,
"hmn",
}
m["shy"] = {
	"Tachawit",
	33274,
	"ber",
	"Tfng, Arab, Latn",
	-- Keyed by script so that the Tifinagh transliteration module is only
	-- selected for Tfng text, in the same way as the "shi" and "sjs" entries.
	-- A plain string here would select it for Arab text as well.
	translit = {
		Tfng = "Tfng-translit",
	},
}
m["shz"] = {
"Syenara", -- not to be confused with Senara (seq)
36316,
"alv-snr",
}
m["sia"] = {
"Akkala Sami",
35241,
"smi",
"Cyrl, Latn",
translit = "sia-translit",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sib"] = {
"Sebop",
7442799,
"poz-swa",
"Latn",
}
m["sid"] = {
"Sidamo",
33786,
"cus-hec",
"Latn, Ethi",
}
m["sie"] = {
"Simaa",
7517329,
"bnt-kav",
"Latn",
}
m["sif"] = {
"Siamou",
36252,
}
m["sig"] = {
"Paasaal",
36426,
"nic-sis",
"Latn",
}
m["sih"] = {
"Sîshëë",
8072753,
"poz-cln",
"Latn",
}
m["sii"] = {
"Shom Peng",
1039346,
"aav",
}
m["sij"] = {
"Numbami",
3346277,
"poz-ocw",
"Latn",
}
m["sik"] = {
"Sikiana",
3443734,
"sai-prk",
"Latn",
}
m["sil"] = {
"Tumulung Sisaala",
25383006,
"nic-sis",
"Latn",
}
m["sim"] = {
"Mende (New Guinea)",
7446815,
"paa-sep",
"Latn",
}
m["sip"] = {
"Sikkimese",
35285,
"sit-tib",
"Tibt",
ancestors = "xct",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["siq"] = {
"Sonia",
7561770,
"ngf-bos",
"Latn",
}
m["sir"] = {
"Siri",
3438729,
"cdc-wst",
"Latn",
}
m["sis"] = {
"Siuslaw",
2315424,
}
m["siu"] = {
"Sinagen",
7521655,
"paa-wap",
"Latn",
}
m["siv"] = {
"Sumariup",
7636966,
"paa-sep",
"Latn",
}
m["siw"] = {
"Siwai",
7532519,
"paa-sbo",
"Latn",
}
m["six"] = {
"Sumau",
7637021,
"ngf-pek",
"Latn",
}
m["siy"] = {
"Sivandi",
13269,
"xme",
"fa-Arab, Latn",
ancestors = "xme-mid",
}
m["siz"] = {
"Siwi",
36814,
"ber",
"Tfng, Arab, Latn",
}
m["sja"] = {
"Epena",
3055682,
"sai-chc",
"Latn",
}
m["sjb"] = {
"Sajau Basap",
4684353,
"poz-bnn",
}
m["sjc"] = {
"Shaojiang Min",
3431451,
"zhx-inm",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["sjd"] = {
"Kildin Sami",
33656,
"smi",
"Cyrl",
translit = "sjd-translit",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sje"] = {
"Pite Sami",
56314,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
sort_key = "sje-sortkey",
}
m["sjg"] = {
"Assangori",
3502255,
"sdv-tmn",
}
m["sjk"] = {
"Kemi Sami",
35871,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sjl"] = {
"Miji",
6845470,
"sit-hrs",
}
m["sjm"] = {
"Mapun",
3287253,
"poz-sbj",
"Latn",
}
m["sjn"] = {
"Sindarin",
56437,
"art",
"Latn, Teng",
type = "appendix-constructed",
}
m["sjo"] = {
"Xibe",
13223,
"tuw-jrc",
"sjo-Mong",
ancestors = "mnc",
}
m["sjp"] = {
"Surjapuri",
7645351,
"inc-krd",
"Deva, as-Beng, Kthi",
}
m["sjr"] = {
"Siar-Lak",
3482907,
"poz-ocw",
}
m["sjs"] = {
	"Senhaja de Srair",
	56744,
	"ber",
	"Latn, Tfng, Arab",
	-- Both settings are keyed by script code: a translit module is listed for
	-- Tfng only, and a diacritic stripper for Arab only.
	translit = {
		Tfng = "Tfng-translit",
	},
	strip_diacritics = {
		Arab = "ar-stripdiacritics",
	},
}
m["sjt"] = {
	"Ter Sami",
	36656,
	"smi",
	"Cyrl, Latn",
	translit = "sjt-translit",
	-- The ASCII apostrophe is mapped to U+02C8 (ˈ) in display_text; both
	-- characters are listed for removal in strip_diacritics.
	display_text = {from = {"'"}, to = {"ˈ"}},
	strip_diacritics = {remove_diacritics = "'ˈ"},
}
m["sju"] = {
	"Ume Sami",
	56415,
	"smi",
	"Latn",
	-- The ASCII apostrophe is mapped to U+02C8 (ˈ) in display_text; both
	-- characters, plus the macron from the shared chars table, are listed
	-- for removal in strip_diacritics.
	display_text = {from = {"'"}, to = {"ˈ"}},
	strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
	sort_key = "sju-sortkey",
}
m["sjw"] = {
"Shawnee",
2669206,
"alg",
"Latn",
}
-- [ska] Skagit is treated as part of [lut] Lushootseed
m["skb"] = {
"Saek",
36437,
"tai-nor",
"Thai",
sort_key = "Thai-sortkey",
}
m["skc"] = {
"Ma Manda",
6720783,
"ngf-era",
"Latn",
}
m["skd"] = {
"Southern Sierra Miwok",
3492334,
"nai-utn",
"Latn",
}
m["ske"] = {
"Ske",
7534244,
"poz-vnn",
"Latn",
}
m["skf"] = {
"Mekéns",
3304806,
"tup",
"Latn",
}
m["skh"] = {
"Sikule",
3121081,
"poz-nws",
}
m["ski"] = {
"Sika",
33960,
"poz-cet",
"Latn",
}
m["skj"] = { -- compare 'ths'
"Seke",
30226846,
"sit-tam",
}
m["skk"] = {
"Sok",
12953887,
"mkh-ban",
}
m["skm"] = {
"Sakam",
6448517,
"ngf-uru",
"Latn",
}
m["skn"] = {
"Kolibugan Subanon",
18755617,
"phi",
"Latn",
}
m["sko"] = {
"Seko Tengah",
15613270,
"poz",
}
m["skp"] = {
"Sekapan",
7447132,
"poz-bnn",
}
m["skq"] = {
"Sininkere",
3914896,
"dmn-snb",
"Latn",
}
m["skr"] = {
"Saraiki",
33902,
"inc-pan",
"pa-Arab, Mult, Deva",
strip_diacritics = {remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna},
translit = {
["pa-Arab"] = "pa-Arab-translit",
Deva = "hi-translit",
Mult = "Mult-translit",
},
}
m["sks"] = {
"Maia",
12952760,
"ngf-kau",
"Latn",
}
m["skt"] = {
"Sakata",
36691,
"bnt-bnm",
"Latn",
}
m["sku"] = {
"Sakao",
3298421,
"poz-vnn",
"Latn",
}
m["skv"] = {
"Skou",
3915200,
"paa-isk",
"Latn",
}
m["skw"] = {
"Skepi Creole Dutch",
2522153,
"crp",
"Latn",
ancestors = "nl",
}
m["skx"] = {
"Seko Padang",
15613282,
"poz-ssw",
"Latn",
}
m["sky"] = {
"Sikaiana",
7439242,
"poz-pnp",
"Latn",
}
m["skz"] = {
"Sekar",
7447136,
"poz-cet",
}
m["slc"] = {
"Saliba (Colombia)",
3441097,
nil,
"Latn",
}
m["sld"] = {
"Sisaala",
11020264,
"nic-sis",
"Latn",
}
m["sle"] = {
"Sholaga",
7500203,
"dra-kan",
"Knda",
-- Knda translit in [[Module:scripts/data]]
}
m["slf"] = {
"Swiss-Italian Sign Language",
12953479,
"sgn",
}
m["slg"] = {
"Selungai Murut",
7448844,
"poz-san",
}
-- [slh] Southern Puget Sound Salish is treated as part of [lut] Lushootseed
-- "sli" "Silesian German" IS SUBSUMED INTO "gmw-ecg" "East Central German"
m["slj"] = {
"Salumá",
7406296,
"sai-prk",
"Latn",
}
m["sll"] = {
"Salt-Yui",
7405785,
"ngf-sim",
"Latn",
}
m["slm"] = {
"Pangutaran Sama",
3362086,
"poz-sbj",
"Latn",
}
m["sln"] = {
"Salinan",
1568938,
"qfa-iso",
"Latn",
}
m["slp"] = {
"Lamaholot",
6480777,
"poz-cet",
"Latn",
}
m["slr"] = {
"Salar",
33963,
"trk-ogz",
"Arab, Latn",
ancestors = "trk-eog",
}
m["sls"] = {
"Singapore Sign Language",
7512563,
"sgn",
}
m["slt"] = {
"Sila",
7514021,
"tbq-sil",
}
m["slu"] = {
"Selaru",
7447500,
"poz-cet",
"Latn",
}
m["slw"] = {
"Sialum",
7506694,
"ngf-ehu",
"Latn",
}
m["slx"] = {
"Salampasu",
7403607,
"bnt-lun",
"Latn",
}
m["sly"] = {
"Selayar",
7447520,
"poz-ssw",
}
m["slz"] = {
"Ma'ya",
2291492,
"poz-hce",
"Latn",
}
m["sma"] = {
"Southern Sami",
13293,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = "'ˈ"},
sort_key = "sma-sortkey",
}
m["smb"] = {
"Simbari",
7517427,
"ngf-bsi",
"Latn",
}
m["smc"] = {
"Som",
7559081,
"ngf-uru",
"Latn",
}
m["smd"] = {
"Sama",
6407456,
"bnt-kmb",
"Latn",
}
m["smf"] = {
"Auwe",
3502072,
"paa-war",
"Latn",
ancestors = "dnd",
}
m["smg"] = {
"Simbali",
56692,
"paa-bai",
"Latn",
}
m["smh"] = {
"Samei",
7409269,
"tbq-axi",
}
m["smj"] = {
"Lule Sami",
56322,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.macron .. "'ˈ"},
sort_key = "smj-sortkey",
}
m["smk"] = {
"Bolinao",
2669235,
"phi",
"Latn, Tglg",
}
m["sml"] = {
"Central Sama",
3470593,
"poz-sbj",
"Latn",
}
m["smm"] = {
"Musasa",
6940122,
"inc-bih",
}
m["smn"] = {
"Inari Sami",
33462,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.dotbelow .. "'ˈ"},
sort_key = "smn-sortkey",
}
m["smp"] = {
"Samaritan Hebrew",
56502,
"sem-can",
"Samr",
translit = "Samr-translit",
-- Samr strip_diacritics, sort_key in [[Module:scripts/data]]
ancestors = "hbo",
}
m["smq"] = {
"Samo",
7409884,
"ngf-est",
"Latn",
}
m["smr"] = {
"Simeulue",
2992833,
"poz-nws",
"Latn",
}
m["sms"] = {
"Skolt Sami",
13271,
"smi",
"Latn",
display_text = {
from = {"'"},
to = {"ˈ"}
},
strip_diacritics = {remove_diacritics = c.dotbelow .. "'ˈ"},
sort_key = "sms-sortkey",
}
m["smt"] = {
"Simte",
7521268,
"tbq-kuk",
}
m["smu"] = {
"Somray",
6583612,
"mkh-pea",
}
m["smv"] = {
"Samvedi",
6345632,
"inc-sou",
}
m["smw"] = {
"Sumbawa",
3182585,
"poz-bss",
"Latn",
}
m["smx"] = {
"Samba",
11120157,
"bnt-pen",
"Latn",
}
m["smy"] = {
"Semnani",
14531212,
"xme",
"fa-Arab, Latn",
}
m["smz"] = {
"Simeku",
7517534,
"paa-sbo",
"Latn",
}
m["snb"] = {
"Sebuyau",
7442836,
"poz-mly",
"Latn",
}
m["snc"] = {
"Sinaugoro",
4170719,
"poz-ocw",
"Latn",
}
m["sne"] = {
"Bau Bidayuh",
2891938,
"day",
"Latn",
}
m["snf"] = {
"Noon",
36304,
"alv-cng",
"Latn",
}
m["sng"] = {
"Sanga (Congo)",
3438316,
"bnt-lub",
"Latn",
}
m["sni"] = {
"Sensi",
7451029,
"sai-pan",
"Latn",
}
m["snj"] = {
"Riverain Sango",
25559751,
"crp",
"Latn",
ancestors = "ngb",
}
m["snk"] = {
"Soninke",
36660,
"dmn-snb",
"Latn",
}
m["snl"] = {
"Sangil",
3472206,
"phi",
"Latn",
}
m["snm"] = {
"Southern Ma'di",
15637273,
"csu-mma",
}
m["snn"] = {
"Siona",
3485116,
"sai-tuc",
"Latn",
}
-- [sno] Snohomish is treated as part of [lut] Lushootseed
m["snp"] = {
"Siane",
7506812,
"ngf-gor",
"Latn",
}
m["snq"] = {
"Sangu (Gabon)",
36609,
"bnt-sir",
"Latn",
}
m["snr"] = {
"Sihan",
7513400,
"ngf-gum",
"Latn",
}
m["sns"] = {
"Nahavaq",
2160435,
"poz-vnc",
"Latn",
}
m["snu"] = {
"Senggi",
7929052,
"paa-war",
"Latn",
}
m["snv"] = {
"Sa'ban",
3474891,
"poz-swa",
"Latn",
}
m["snw"] = {
"Selee",
36272,
"alv-ntg",
"Latn",
}
m["snx"] = {
"Sam",
7408387,
"ngf-min",
"Latn",
}
m["sny"] = {
"Saniyo-Hiyewe",
7418302,
"paa-sep",
"Latn",
}
m["snz"] = {
"Kou",
7525035, -- also 4803639
"ngf-eva",
"Latn",
}
-- Thai Song: listed with the Tavt and Thai script codes.
m["soa"] = {
"Thai Song",
7709159,
"tai-swe",
"Tavt, Thai",
-- Transliteration is currently switched off (the line is kept commented out).
--translit = "Tavt-translit",
-- Sort key: each pattern captures one character from the first bracket set followed by one
-- character from the second (a range), and "%2%1" writes the two captures back in swapped
-- order. The first pattern uses Tai Viet characters, the second Thai ones; presumably this
-- moves a vowel sign written before its consonant to after it for sorting (TODO confirm
-- against the sort-key code that consumes this table).
sort_key = {
from = {"([ꪵꪶꪹꪻꪼ])([ꪀ-ꪯ])", "([เแโใไ])([ก-ฮ])"},
to = {"%2%1", "%2%1"}
},
}
m["sob"] = {
"Sobei",
3121035,
"poz-ocw",
"Latn",
}
m["soc"] = {
"Soko",
7555138,
"bnt-ske",
"Latn",
}
m["sod"] = {
"Songoora",
7561296,
"bnt-lgb",
"Latn",
}
m["soe"] = {
"Songomeno",
5713543,
"bnt-bsh",
"Latn",
}
m["sog"] = {
"Sogdian",
205979,
"ira-sgc",
"Sogd, Mani, Syrc, Sogo",
translit = {
Sogd = "Sogd-translit",
-- Mani translit in [[Module:scripts/data]]
Sogo = "Sogo-translit",
},
}
m["soh"] = {
"Aka (Sudan)",
3450949,
"sdv-eje",
"Latn",
}
m["soi"] = {
"Sonha",
12953890,
"inc-eas",
}
m["sok"] = {
"Sokoro",
3441303,
"cdc-est",
"Latn",
}
m["sol"] = {
"Solos",
3489591,
"poz-ocw",
}
m["soo"] = {
"Nsong",
12953148,
"bnt-bdz",
"Latn",
}
m["sop"] = {
"Songe",
3130911,
"bnt-lbn",
"Latn",
}
m["soq"] = {
"Kanasi",
11732656,
"ngf-dag",
"Latn",
}
m["sor"] = {
"Somrai",
3123566,
"cdc-est",
"Latn",
}
m["sos"] = {
"Seenku",
36274,
"dmn-smg",
}
m["sou"] = {
"Southern Thai",
56508,
"tai-swe",
"Thai",
sort_key = "Thai-sortkey",
}
m["sov"] = {
"Sonsorolese",
13281,
"poz-mic",
"Latn",
}
m["sow"] = {
"Sowanda",
7571845,
"paa-war",
"Latn",
}
m["sox"] = {
"Swo",
36604,
"bnt-mka",
"Latn",
}
m["soy"] = {
"Miyobe",
35913,
"alv-sav",
"Latn",
}
m["soz"] = {
"Temi",
13278,
"bnt-kka",
"Latn",
}
m["spb"] = {
"Sepa (Indonesia)",
18603687,
"poz-cma",
"Latn",
}
m["spc"] = {
"Sapé",
2888158,
nil,
"Latn",
}
m["spd"] = {
"Saep",
7398312,
"ngf-yag",
"Latn",
}
m["spe"] = {
"Sepa (New Guinea)",
7451725,
"poz-ocw",
"Latn",
}
m["spg"] = {
"Sian",
7506806,
"poz-bnn",
}
m["spi"] = {
"Saponi",
3915418,
"paa-rsa",
"Latn",
}
m["spk"] = {
"Sengo",
7450584,
"paa-nnd",
"Latn",
}
m["spl"] = {
"Selepet",
7447917,
"ngf-kab",
"Latn",
}
m["spm"] = {
"Sepen",
4701931,
"paa-rub",
"Latn",
}
m["spn"] = {
"Sanapaná",
3033556,
"sai-mas",
"Latn",
}
m["spo"] = {
"Spokane",
3493704,
"sal",
}
m["spp"] = {
"Supyire",
56284,
"alv-sma",
"Latn",
}
m["spr"] = {
"Saparua",
7420921,
"poz-cma",
"Latn",
}
m["sps"] = {
"Saposa",
3473187,
"poz-ocw",
}
m["spt"] = {
"Spiti Bhoti",
22080879,
"sit-las",
}
m["spu"] = {
"Sapuan",
7421168,
"mkh-ban",
}
m["spv"] = {
"Sambalpuri",
6433240,
"inc-eas",
"Orya",
translit = "or-translit",
ancestors = "or",
}
m["spx"] = {
"South Picene",
36688,
"itc-sbl",
"Ital, Latn",
-- Ital translit in [[Module:scripts/data]]
display_text = {
Latn = s["itc-Latn-displaytext"]
},
strip_diacritics = {
Latn = s["itc-Latn-stripdiacritics"],
},
sort_key = {
Latn = s["itc-Latn-sortkey"],
},
}
m["spy"] = {
"Sabaot",
7395896,
"sdv-kln",
}
m["sqa"] = {
"Shama-Sambuga",
3914392,
"nic-kmk",
"Latn",
}
m["sqh"] = {
"Shau",
3913925,
"nic-jer",
"Latn",
}
m["sqk"] = {
"Albanian Sign Language",
4709168,
"sgn",
}
m["sqm"] = {
"Suma",
11008431,
"gba-wes",
}
m["sqn"] = {
"Susquehannock",
3505736,
"iro-nor",
}
m["sqo"] = {
"Sorkhei",
3491964,
"ira-kms",
}
m["sqq"] = {
"Sou",
16979751,
"mkh-ban",
}
m["sqr"] = {
"Siculo-Arabic",
1069489,
"sem-arb",
"Arab",
}
m["sqs"] = {
"Sri Lankan Sign Language",
3915466,
"sgn",
}
m["sqt"] = {
"Soqotri",
13283,
"sem-sar",
"Arab, Latn",
}
m["squ"] = {
"Squamish",
2484579,
"sal",
"Latn",
}
m["sra"] = {
"Saruga",
7424699,
"ngf-han",
"Latn",
}
m["srb"] = {
"Sora",
13284,
"mun",
"Sora, Latn, Orya",
}
m["sre"] = {
"Sara",
33957,
"day",
}
m["srf"] = {
"Nafi",
6958174,
"poz-ocw",
}
m["srg"] = {
"Sulod",
7636489,
"phi",
}
m["srh"] = {
"Sarikoli",
33873,
"ira-shr",
"Latn, ug-Arab, Cyrl",
}
m["sri"] = {
"Siriano",
3485264,
"sai-tuc",
"Latn",
}
m["srk"] = {
"Serudung Murut",
7455497,
"poz-san",
}
m["srl"] = {
"Isirawa",
4203802,
"paa-gkw",
"Latn",
}
m["srm"] = {
"Saramaccan",
33779,
"crp",
"Latn",
ancestors = "en, pt",
}
m["srn"] = {
"Sranan Tongo",
33989,
"crp",
"Latn",
ancestors = "en",
}
m["srq"] = {
"Sirionó",
3027953,
"tup-gua",
"Latn",
}
m["srr"] = {
"Serer",
36284,
"alv-fwo",
"Latn",
}
m["srs"] = {
"Tsuut'ina",
20825,
"ath-nor",
"Latn",
}
m["srt"] = {
"Sauri",
7427547,
"paa-egb",
"Latn",
}
m["sru"] = {
"Suruí",
7646993,
"tup",
"Latn",
}
m["srv"] = {
"Waray Sorsogon",
18755610,
"phi",
"Latn",
}
m["srw"] = {
"Serua",
14916905,
"poz-cet",
}
m["srx"] = {
"Sirmauri",
7530505,
"him",
}
m["sry"] = {
"Sera",
7452602,
"poz-ocw",
"Latn",
}
m["srz"] = {
"Shahmirzadi",
12953126,
"ira-msh",
"fa-Arab",
}
m["ssb"] = {
"Southern Sama",
3470594,
"poz-sbj",
"Latn",
}
m["ssc"] = {
"Suba-Simbiti",
7630687,
"bnt-lok",
"Latn",
}
m["ssd"] = {
"Siroi",
10771067,
"ngf-rai",
"Latn",
}
m["sse"] = {
"Balangingi",
2880535,
"poz-sbj",
"Latn",
}
m["ssf"] = {
"Thao",
676492,
"map",
"Latn",
}
m["ssg"] = {
"Seimat",
3182581,
"poz-aay",
"Latn",
}
m["ssh"] = {
"Shihhi Arabic",
56571,
"sem-arb",
"Arab",
strip_diacritics = {
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["ssi"] = {
"Sansi",
3309366,
"inc-nwe",
}
m["ssj"] = {
"Sausi",
7427605,
"ngf-eva",
"Latn",
}
m["ssk"] = {
"Sunam",
11002210,
"sit-kin",
}
m["ssl"] = {
"Western Sisaala",
11154776,
"nic-sis",
"Latn",
}
m["ssm"] = {
"Semnam",
7449713,
"mkh-asl",
"Latn",
}
m["sso"] = {
"Sissano",
7530937,
"poz-ocw",
"Latn",
}
m["ssp"] = {
"Spanish Sign Language",
3100814,
"sgn",
}
m["ssq"] = {
"So'a",
7572120,
"poz-cet",
"Latn",
}
m["ssr"] = {
"Swiss-French Sign Language",
12953483,
"sgn",
}
m["sss"] = {
"Sô",
3082037,
"mkh-kat",
}
m["sst"] = {
"Sinasina",
7521813,
"ngf-sim",
"Latn",
}
m["ssu"] = {
"Susuami",
7649752,
"ngf-woj",
"Latn",
}
m["ssv"] = {
"Shark Bay",
7489783,
"poz-vnn",
"Latn",
}
m["ssx"] = {
"Samberigi",
7409020,
"ngf-sak",
"Latn",
}
m["ssy"] = {
"Saho",
36353,
"cus-eas",
"Latn, Ethi, Arab",
}
m["ssz"] = {
"Sengseng",
7450601,
"poz-ocw",
"Latn",
}
m["stb"] = {
"Northern Subanen",
12953892,
"phi",
"Latn",
}
m["std"] = {
"Sentinelese",
568377,
"qfa-unc", -- presumed Ongan
}
m["ste"] = {
"Liana-Seti",
6539924,
"poz-cma",
}
m["stf"] = {
"Seta",
7456326,
"paa-trr",
"Latn",
}
m["stg"] = {
"Trieng",
22694648,
"mkh-ban",
}
m["sth"] = {
"Shelta",
36705,
"qfa-mix",
"Latn",
ancestors = "ga, en",
}
m["sti"] = {
"Bulo Stieng",
15771431,
"mkh-ban",
"Khmr, Latn",
}
m["stj"] = {
"Matya Samo",
10974879,
"dmn-sam",
"Latn",
}
m["stk"] = {
"Arammba",
3502094,
"paa-ton",
"Latn",
}
m["stm"] = {
"Setaman",
7456333,
"ngf-mok",
"Latn",
}
m["stn"] = {
"Owa",
1324132,
"poz-sls",
"Latn",
}
m["sto"] = {
"Stoney",
3033570,
"sio-dkt",
"Latn",
}
m["stp"] = {
"Southeastern Tepehuan",
12953917,
"azc-pim",
"Latn",
}
m["stq"] = {
"Saterland Frisian",
27154,
"gmw-fri",
"Latn",
}
m["str"] = {
"Saanich",
36444,
"sal",
"Latn",
}
m["sts"] = {
"Shumashti",
33777,
"inc-kun",
"Arab",
}
m["stt"] = {
"Budeh Stieng",
12953891,
"mkh-ban",
}
m["stu"] = {
"Samtao",
25559550,
"mkh-pal",
}
m["stv"] = {
"Silt'e",
33880,
"sem-eth",
"Ethi",
}
m["stw"] = {
"Satawalese",
28477,
"poz-mic",
"Latn",
}
m["sty"] = {
"Siberian Tatar",
4418344,
"trk-kno",
"Cyrl",
}
m["sua"] = {
"Sulka",
7636341,
"qfa-iso", -- Papuan; isolate in Glottolog and Palmer (2018)
"Latn",
}
m["sub"] = {
"Suku",
12953160,
"bnt-yak",
"Latn",
}
m["suc"] = {
"Western Subanon",
16113894,
"phi",
"Latn",
}
m["sue"] = {
"Suena",
7634386,
"ngf-nbi",
"Latn",
}
m["sug"] = {
"Suganga",
7634706,
"ngf-msu",
"Latn",
}
m["sui"] = {
"Suki",
2089984,
"ngf-gsu",
"Latn",
}
m["suk"] = {
"Sukuma",
2638144,
"bnt-tkm",
"Latn",
}
m["suo"] = {
"Bouni",
65043887,
"paa-pio",
"Latn",
}
m["suq"] = {
"Suri",
5364172,
"sdv",
}
m["sur"] = {
"Mwaghavul",
3440486,
"cdc-wst",
"Latn",
}
m["sus"] = {
"Susu",
33990,
"dmn-sya",
"Latn",
}
m["sut"] = {
"Subtiaba",
3915405,
"omq",
"Latn",
}
m["suv"] = {
"Puroik",
56408,
"sit-khb",
"Beng, Deva, Latn",
ancestors = "sit-khp-pro",
}
m["suw"] = {
"Sumbwa",
7637055,
"bnt-glb",
"Latn",
}
m["sux"] = {
"Sumerian",
36790,
"qfa-iso",
"Xsux, Latn",
}
m["suy"] = {
"Suyá",
3505859,
"sai-nje",
"Latn",
}
m["suz"] = {
"Sunwar",
56549,
"sit-kiw",
"Deva, Sunu"
}
m["sva"] = {
"Svan",
34067,
"ccs",
"Geor, Cyrl",
translit = {
Geor = "sva-translit",
},
override_translit = true,
}
m["svb"] = {
"Ulau-Suain",
7878769,
"poz-ocw",
"Latn",
}
m["svc"] = {
"Vincentian Creole English",
3501785,
"crp",
"Latn",
ancestors = "en",
}
m["sve"] = {
"Serili",
7454834,
"poz-tim",
}
m["svk"] = {
"Slovakian Sign Language",
7541557,
"sgn",
}
m["svm"] = {
"Slavomolisano",
36254,
"zls",
"Latn",
ancestors = "sh",
}
m["svs"] = {
"Savosavo",
3130296,
"qfa-dis", -- Papuan; isolate in Glottolog; in the tentative Central Solomons family by Ross (2005) and Pedrós
-- (2015)
"Latn",
}
m["svx"] = {
"Skalvian",
3486125,
"bat-wes",
"Latn",
}
m["swb"] = {
"Maore Comorian",
34075,
"bnt-com",
"Latn",
sort_key = "bnt-com-sortkey",
}
m["swf"] = {
"Sere",
7453056,
"nic-ser",
"Latn",
}
m["swg"] = {
"Swabian",
327274,
"gmw-hgm",
"Latn",
ancestors = "gsw",
}
m["swi"] = {
"Sui",
3112388,
"qfa-kms",
"Latn, Shui, Hani",
sort_key = {Hani = "Hani-sortkey"},
}
m["swj"] = {
"Sira",
36599,
"bnt-sir",
"Latn",
}
m["swl"] = {
"Swedish Sign Language",
36558,
"sgn",
}
m["swm"] = {
"Samosa",
7410037,
"ngf-nwh",
"Latn",
}
m["swn"] = {
"Sokna",
2988323,
"ber",
}
m["swo"] = {
"Shanenawa",
61974839,
"sai-pan",
"Latn",
}
m["swp"] = {
"Suau",
3502368,
"poz-ocw",
}
m["swq"] = {
"Sharwa",
56791,
"cdc-cbm",
"Latn",
}
m["swr"] = {
"Saweru",
3474649,
"paa-ysa",
"Latn",
}
m["sws"] = {
"Seluwasan",
7448845,
"poz-cet",
}
m["swt"] = {
"Sawila",
7428639,
"paa-alp",
"Latn",
}
m["swu"] = {
"Suwawa",
7650588,
"phi",
}
m["sww"] = {
"Sowa",
7571843,
"poz-vnn",
"Latn",
}
m["swx"] = {
"Suruahá",
3114402,
"auf",
}
m["swy"] = {
"Sarua",
56261,
"cdc-est",
"Latn",
}
m["sxb"] = {
"Suba",
33916,
"bnt-lok",
"Latn",
}
m["sxc"] = {
"Sicanian",
36335,
"qfa-unc", -- extinct; lack of data: only names deciphered
"Polyt",
-- Polyt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["sxe"] = {
"Sighu",
36431,
"bnt-kel",
"Latn",
}
m["sxg"] = {
"Shixing",
56337,
"sit-nax",
"Latn",
}
m["sxk"] = {
"Southern Kalapuya",
3192122,
"nai-klp",
}
m["sxl"] = {
"Selonian",
36491,
"bat-eas",
"Latn",
}
m["sxm"] = {
"Samre",
6583615,
"mkh-pea",
}
m["sxn"] = {
"Sangir",
25714758,
"phi",
"Latn",
}
m["sxo"] = {
"Sorothaptic",
2762254,
}
m["sxr"] = {
"Saaroa",
716599,
"map",
"Latn",
}
m["sxs"] = {
"Sasaru",
3913384,
"alv-yek",
"Latn",
}
-- "sxu" "Upper Saxon" IS SUBSUMED INTO "gmw-ecg" "East Central German"
m["sxw"] = {
"Saxwe Gbe",
7428892,
"alv-pph",
"Latn",
}
m["sya"] = {
"Siang",
3482903,
}
m["syb"] = {
"Central Subanen",
12953893,
"phi",
"Latn",
}
m["syc"] = {
"Classical Syriac",
33538,
"sem-are",
"Syrc",
strip_diacritics = {remove_diacritics = c.macron .. c.diaer .. c.macronbelow .. u(0x0730) .. "-" .. u(0x0748)},
}
m["syi"] = {
"Seki",
36547,
"bnt-kel",
"Latn",
}
m["syk"] = {
"Sukur",
56292,
"cdc-cbm",
"Latn",
}
m["syl"] = {
"Sylheti",
2044560,
"inc-bas",
"Sylo, Beng",
ancestors = "inc-obn",
translit = "syl-translit",
}
m["sym"] = {
"Maya Samo",
10950421,
"dmn-sam",
"Latn",
}
m["syn"] = {
"Senaya",
33914,
"sem-nna",
}
m["syo"] = {
"Suoy",
7641864,
"mkh-pea",
}
m["sys"] = {
"Sinyar",
56840,
"csu",
"Latn",
}
m["syw"] = {
"Kagate",
12952538,
"sit-kyk",
"Deva",
}
m["syx"] = {
"Osamayi",
7408415,
"bnt-kel",
"Latn",
}
m["syy"] = {
"Al-Sayyid Bedouin Sign Language",
2915457,
"sgn",
}
m["sza"] = {
"Semelai",
3111827,
"mkh-asl",
"Latn",
}
m["szb"] = {
"Ngalum",
11732516,
"ngf-okk",
"Latn",
}
m["szc"] = {
"Semaq Beri",
7449119,
"mkh-asl",
}
m["szd"] = {
"Seru",
7455488,
"poz-bnn",
"Latn",
}
m["sze"] = {
"Seze",
373683,
"omv-mao",
"Latn",
}
m["szg"] = {
"Sengele",
7450555,
"bnt-mon",
"Latn",
}
m["szl"] = {
"Silesian",
30319,
"zlw-lch",
"Latn",
ancestors = "zlw-opl",
}
m["szn"] = {
"Sula",
3503403,
"poz-cma",
"Latn",
}
m["szp"] = {
"Suabo",
7630429,
"ngf-sbh",
"Latn",
}
m["szv"] = {
"Isubu",
35431,
"bnt-saw",
"Latn",
}
m["szw"] = {
"Sawai",
3447258,
"poz-hce",
"Latn",
}
m["szy"] = {
"Sakizaya",
718269,
"map",
"Latn",
}
return require("Module:languages").finalizeData(m, "language")
5q1vkgr7iqfj6q1fxha4dbfhok7eo7v
Module:languages/data/3/l
828
6261
234837
220406
2026-02-11T05:31:54Z
en>Benwing2
0
remove redundant ancestor 'inc-opa' in Lahnda
234837
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy stand-in for the `char` function of [[Module:string utilities]]. The module is only
-- required on the first call, because the data below may never need it.
local function u(...)
	local char = require("Module:string utilities").char
	-- Rebind the local so every later call goes straight to `char` without another require.
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["laa"] = {
"Lapuyan Subanun",
12635302,
"phi",
}
m["lab"] = {
"Linear A",
nil,
"qfa-unc", -- undeciphered
"Lina",
}
m["lac"] = {
"Lacandon",
35766,
"myn",
"Latn",
}
m["lad"] = {
"Ladino",
36196,
"roa-cas",
"Hebr, Latn, Cyrl",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lae"] = {
"Pattani",
7148323,
"sit-whm",
}
m["laf"] = {
"Lafofa",
35711,
"alv",
}
m["lag"] = {
"Langi",
584983,
"bnt-mra",
}
m["lah"] = {
"Lahnda",
1334774,
"inc-pan",
"pa-Arab",
}
m["lai"] = {
"Lambya",
6481626,
"bnt-mby",
"Latn",
}
m["laj"] = {
"Lango (Uganda)",
35670,
"sdv-los",
"Latn",
}
m["lak"] = {
"Laka",
6474529, -- also Q55616620
"csu-sar", -- formerly classified as "alv-mbm"; see [[w:Lau Laka language]]
}
m["lam"] = {
"Lamba",
36098,
"bnt-sbi",
"Latn",
}
m["lan"] = {
"Laru",
3913987,
"nic-knj",
"Latn",
}
m["lap"] = {
"Kabba-Laka",
6474528,
"csu-sar",
"Latn",
}
m["laq"] = {
"Qabiao",
3436700,
"qfa-kra",
}
m["lar"] = {
"Larteh",
35639,
"alv-gng",
"Latn",
}
m["las"] = {
"Gur Lama",
35652,
"nic-gne",
"Latn",
}
m["lau"] = {
"Laba",
12952694,
"paa-lla",
"Latn",
}
m["law"] = {
"Lauje",
6498258,
"poz",
"Latn",
}
m["lax"] = {
"Tiwa",
7810466,
"tbq-bdg",
"Latn, as-Beng",
}
m["lay"] = {
"Lama Bai",
6480756,
"sit-nba",
"Hani, Latn",
sort_key = {Hani = "Hani-sortkey"},
}
m["laz"] = {
"Aribwatsa",
3502104,
"poz-ocw",
"Latn",
}
m["lbb"] = {
"Label",
3214296,
"poz-ocw",
"Latn",
}
m["lbc"] = {
"Lakkia",
3027879,
"qfa-tak",
}
m["lbe"] = {
"Lak",
36206,
"cau-nec",
"Cyrl, Latn, Arab, Geor",
translit = {
Cyrl = "lbe-translit",
-- Geor translit in [[Module:scripts/data]]
},
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
sort_key = "lbe-sortkey",
}
m["lbf"] = {
"Tinani",
784502,
"sit-whm",
}
m["lbg"] = {
"Laopang",
12952711,
"tbq-bis",
}
m["lbi"] = {
"La'bi",
6460637,
"alv-mbm",
}
m["lbj"] = {
"Ladakhi",
35833,
"sit-lab",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lbk"] = {
"Central Bontoc",
63257803,
"phi",
"Latn",
}
m["lbl"] = {
"Libon Bikol",
18664462,
"phi",
"Latn",
}
m["lbm"] = {
"Lodhi",
6666374,
"mun",
}
m["lbn"] = {
"Lamet",
3216723,
"mkh-pal",
"Laoo, Latn",
}
m["lbo"] = {
"Laven",
6298648,
"mkh-ban",
"Latn",
}
m["lbq"] = {
"Wampar",
7966946,
"poz-ocw",
"Latn",
}
m["lbr"] = {
"Northern Lorung",
6668040,
"sit-kie",
"Deva",
}
m["lbs"] = {
"Libyan Sign Language",
11775688,
"sgn",
}
m["lbt"] = {
"Lachi",
6583606,
"qfa-kra",
}
m["lbu"] = {
"Labu",
6467660,
"poz-ocw",
"Latn",
}
m["lbv"] = {
"Lavatbura-Lamusong",
2405981,
"poz-ocw",
"Latn",
}
m["lbw"] = {
"Tolaki",
3033597,
"poz-btk",
"Latn",
}
m["lbx"] = {
"Lawangan",
3120345,
"poz-bre",
"Latn",
}
m["lby"] = {
"Lamu-Lamu",
6482727,
nil,
"Latn",
}
m["lbz"] = {
"Lardil",
3915688,
"aus-tnk",
"Latn",
}
m["lcc"] = {
"Legenyem",
12952713,
"poz-hce",
"Latn",
}
m["lcd"] = {
"Lola",
6668867,
"poz-cet",
"Latn",
}
m["lce"] = {
"Loncong",
3058192,
}
m["lcf"] = {
"Lubu",
3264685,
}
m["lch"] = {
"Luchazi",
3265143,
"bnt-clu",
}
m["lcl"] = {
"Lisela",
6558753,
"poz-cma",
"Latn",
}
m["lcm"] = {
"Tungag",
3542085,
"poz-ocw",
"Latn",
}
m["lcp"] = {
"Western Lawa",
18644465,
"mkh-pal",
"Thai",
sort_key = "Thai-sortkey",
}
m["lcq"] = {
"Luhu",
6699890,
"poz-cma",
"Latn",
}
m["lcs"] = {
"Lisabata-Nuniali",
6558534,
}
m["lda"] = {
"Kla",
63257856,
"dmn-mda",
"Latn",
}
m["ldb"] = {
"Idun",
3914441,
"nic-plc",
"Latn",
}
m["ldd"] = {
"Luri (Nigeria)",
4701277,
"cdc-wst",
}
m["ldg"] = {
"Lenyima",
3914423,
"nic-uce",
"Latn",
}
m["ldh"] = {
"Lamja-Dengsa-Tola",
11001739,
"nic-dak",
}
m["ldj"] = {
"Lemoro",
3912761,
"nic-jer",
}
m["ldk"] = {
"Leelau",
3914465,
"alv-bwj",
}
m["ldl"] = {
"Kaan",
3914501,
"alv-yun",
}
m["ldm"] = {
"Landoma",
35568,
"alv-mel",
}
m["ldn"] = {
"Láadan",
35757,
"art",
"Latn",
type = "appendix-constructed",
}
m["ldo"] = {
"Loo",
3915378,
"alv-bwj",
}
m["ldp"] = {
"Tso",
3913953,
"alv-wjk",
}
m["ldq"] = {
"Lufu",
35796,
"nic-ykb",
"Latn",
}
m["lea"] = {
"Lega-Shabunda",
12952719,
"bnt-lgb",
}
m["leb"] = {
"Lala-Bisa",
6480112,
"bnt-sbi",
}
m["lec"] = {
"Leco",
2625398,
"qfa-iso",
}
m["led"] = {
"Lendu",
523823,
"csu-lnd",
"Latn",
}
m["lee"] = {
"Lyélé",
3089032,
"nic-gnn",
}
m["lef"] = {
"Lelemi",
35585,
"alv-ntg",
}
m["leh"] = {
"Lenje",
6522666,
"bnt-bot",
}
m["lei"] = {
"Lemio",
6521165,
"ngf-rai",
"Latn",
}
m["lej"] = {
"Lengola",
6522474,
"bnt-leb",
}
m["lek"] = {
"Leipon",
3229216,
"poz-aay",
"Latn",
}
m["lel"] = {
"Lele (Congo)",
56733,
"bnt-bsh",
}
m["lem"] = {
"Nomaande",
13479983,
"nic-mbw",
"Latn",
}
m["len"] = {
"Honduran Lenca",
36189,
"nai-len",
"Latn",
}
m["leo"] = {
"Mengisa",
1345684,
"nic-mba",
ancestors = "bag",
}
m["lep"] = {
"Lepcha",
35990,
"sit",
"Lepc",
translit = "lep-translit",
}
m["leq"] = {
"Lembena",
6521067,
"ngf-enc",
"Latn",
}
m["ler"] = {
"Lenkau",
3229472,
"poz-aay",
"Latn",
}
m["les"] = {
"Lese",
11033939,
"csu-mle",
}
m["let"] = {
"Lesing-Gelimi",
12635445,
"poz-ocw",
"Latn",
}
m["leu"] = {
"Kara (New Guinea)",
3192889,
"poz-ocw",
"Latn",
}
m["lev"] = {
"Lamma",
6583582,
"paa-alp",
"Latn",
}
m["lew"] = { -- this code was basically assigned as a catch-all for things that aren't brs, kzf or unz
"Ledo Kaili",
35877,
"poz-kal",
"Latn",
}
m["lex"] = {
"Luang",
6695015,
"poz-tim",
"Latn",
}
m["ley"] = {
"Lemolang",
3033560,
"poz-ssw",
}
m["lez"] = {
"Lezgi",
31746,
"cau-esm",
"Cyrl, Latn, Arab",
translit = "lez-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
}
m["lfa"] = {
"Lefa",
35643,
"bnt-baf",
}
m["lfn"] = {
"Lingua Franca Nova",
146803,
"art",
"Latn, Cyrl",
type = "appendix-constructed",
}
m["lga"] = {
"Lungga",
3267590,
"poz-ocw",
"Latn",
}
m["lgb"] = {
"Laghu",
3216169,
"poz-ocw",
"Latn",
}
m["lgg"] = {
"Lugbara",
3272737,
"csu-mma",
"Latn",
-- Lists c.acute and c.grave under remove_diacritics, plus a `from`/`to` pair of equal-length
-- lists (presumably applied position by position).
-- NOTE(review): "ë" -> "i" and "ö" -> "u" do not map to the bare base letter the way
-- "ä" -> "a" and "ï" -> "i" do; confirm this is intended and not a slip for "e" / "o".
strip_diacritics =
{
remove_diacritics = c.acute .. c.grave,
from = { "ä", "ɛ", "ë", "ï", "ɔ", "ö" },
to = { "a", "e", "i", "i", "o", "u" },
},
}
m["lgh"] = {
"Laghuu",
6472114,
"tbq-muj",
}
m["lgi"] = {
"Lengilu",
6522465,
"poz-swa",
"Latn",
}
m["lgk"] = {
"Neverver",
3241515,
"poz-vnc",
"Latn",
}
m["lgl"] = {
"Wala",
3565284,
"poz-sls",
}
m["lgm"] = {
"Lega-Mwenga",
14916883,
"bnt-lgb",
}
m["lgn"] = {
"Opuuo",
3354339,
"ssa-kom",
}
m["lgq"] = {
"Logba",
35813,
"alv-ntg",
"Latn",
}
m["lgr"] = {
"Lengo",
3229454,
"poz-sls",
"Latn",
}
m["lgs"] = {
"Guinea-Bissau Sign Language",
5616441,
"sgn",
}
m["lgt"] = {
"Pahi",
7124545,
"paa-sep",
"Latn",
}
m["lgu"] = {
"Longgu",
3259105,
"poz-sls",
}
m["lgz"] = {
"Ligenza",
5531038,
"bnt-bun",
}
m["lha"] = {
"Laha (Vietnam)",
3112363,
"qfa-kra",
}
m["lhh"] = {
"Laha (Indonesia)",
6473107,
"poz-cma",
"Latn",
}
m["lhi"] = {
"Lahu Shi",
25559457,
"tbq-lho",
}
m["lhl"] = {
"Lahul Lohar",
12953672,
}
m["lhn"] = {
"Lahanan",
12953660,
"poz-bnn",
"Latn",
}
m["lhp"] = {
"Lhokpu",
3436603,
"sit-dhi",
}
m["lhs"] = {
"Mlahsö",
3393063,
"sem-cna",
"Syrc",
}
m["lht"] = {
"Lo-Toga",
3257566,
"poz-vnn",
"Latn",
}
m["lhu"] = {
"Lahu",
35780,
"tbq-lho",
"Latn",
}
m["lia"] = {
"West-Central Limba",
32867815,
"alv-lim",
}
m["lib"] = {
"Likum",
3240737,
"poz-aay",
"Latn",
}
m["lic"] = {
"Hlai",
934738,
"qfa-lic",
"Latn",
}
m["lid"] = {
"Nyindrou",
3346666,
"poz-aay",
"Latn",
}
m["lie"] = {
"Likila",
11011614,
"bnt-ngn",
}
m["lif"] = {
"Limbu",
56477,
"sit-kir",
"Limb, Latn, Deva",
translit = "lif-translit",
}
m["lig"] = {
"Ligbi",
33594,
"dmn-jje",
}
m["lih"] = {
"Lihir",
6546938,
"poz-ocw",
"Latn",
}
m["lii"] = {
"Lingkhim",
12635536,
}
m["lij"] = {
	"Ligurian",
	36106,
	"roa-git",
	"Latn",
	-- Named fields come after all positional ones, as in every other record. The script code
	-- still lands at index 4 either way; this only keeps the positional run contiguous.
	ancestors = "lij-old",
}
m["lik"] = {
"Lika",
1530394,
"bnt-boa",
}
m["lil"] = {
"Lillooet",
34154,
"sal",
"Latn",
}
m["lio"] = {
"Liki",
4261493,
"poz-ocw",
"Latn",
}
m["lip"] = {
"Sekpele",
36257,
"alv-ntg",
}
m["liq"] = {
"Libido",
35691,
"cus-hec",
}
m["lir"] = {
"Liberian Kreyol",
6541128,
"crp",
"Latn",
ancestors = "en",
}
m["lis"] = {
"Lisu",
56480,
"tbq-lso",
"Lisu, Latn",
override_translit = true,
-- Lisu translit, sort_key in [[Module:scripts/data]]
}
m["liu"] = {
"Logorik",
6667811,
"sdv-daj",
}
m["liv"] = {
"Livonian",
33698,
"urj-fin",
"Latn",
-- Displayed text: the typewriter apostrophe is replaced by the curly one.
display_text = {
from = {"'"},
to = {"’"}
},
-- Both apostrophe forms are listed for removal, and o-with-ogonek-and-macron is mapped to
-- plain o-with-macron.
-- NOTE(review): if the quoted ’ is already U+2019, the extra u(0x2019) is redundant and only
-- forces [[Module:string utilities]] to load; confirm before removing.
strip_diacritics = {
remove_diacritics = "'’" .. u(0x2019),
from = {"Ǭ", "ǭ"},
to = {"Ō", "ō"}
},
-- Sort key: every modified letter becomes its base letter followed by an entry of `p`
-- (m_langdata.puaChars). Letters sharing a base get increasing indices in the order listed,
-- presumably so they sort right after the plain base letter in that order (assumes
-- p[1] < p[2] < ... — TODO confirm in Module:languages/data).
sort_key = {
from = {
"ā", "ä", "ǟ",
"ḑ",
"ē",
"ī",
"ļ",
"ņ",
"ō", "ȯ", "ȱ", "õ", "ȭ", "ö", "ȫ",
"ŗ",
"š",
"ț",
"ū", "ü", "ṻ",
"ȳ",
"ž",
},
to = {
"a" .. p[1], "a" .. p[2], "a" .. p[3],
"d" .. p[1],
"e" .. p[1],
"i" .. p[1],
"l" .. p[1],
"n" .. p[1],
"o" .. p[1], "o" .. p[2], "o" .. p[3], "o" .. p[4], "o" .. p[5], "o" .. p[6], "o" .. p[7],
"r" .. p[1],
"s" .. p[1],
"t" .. p[1],
"u" .. p[1], "u" .. p[2], "u" .. p[3],
"y" .. p[1],
"z" .. p[1],
}
}
}
m["liw"] = {
"Col",
2981948,
}
m["lix"] = {
"Liabuku",
13580912,
}
m["liy"] = {
"Banda-Bambari",
11051591,
"bad-cnt",
"Latn",
}
m["liz"] = {
"Libinza",
4914576,
"bnt-zbi",
}
m["lja"] = {
"Golpa",
50934920,
"aus-yol",
"Latn",
}
m["lje"] = {
"Rampi",
7290041,
"poz",
}
m["lji"] = {
"Laiyolo",
6474218,
"poz-wot",
"Latn",
}
m["ljl"] = {
"Li'o",
2697010,
"poz",
"Latn",
}
m["ljp"] = {
"Lampung Api",
49215,
"poz-lgx",
"Latn",
}
m["ljw"] = {
"Yirandali",
17059380,
}
m["ljx"] = {
"Yuru",
63257867,
}
m["lka"] = {
"Lakalei",
12952700,
"poz-tim",
"Latn",
}
m["lkb"] = {
"Kabras",
63257894,
"bnt-msl",
ancestors = "luy",
}
m["lkc"] = {
"Kucong",
6441572,
"tbq-lho",
}
m["lkd"] = {
"Lakondê",
20527166,
"sai-nmk",
"Latn",
}
m["lke"] = {
"Kenyi",
12952628,
"bnt-nyg",
}
m["lkh"] = {
"Lakha",
56606,
"sit-tib",
}
m["lki"] = {
"Laki",
56483,
"ku",
"fa-Arab",
translit = "lki-translit",
strip_diacritics = {remove_diacritics = c.kasra .. c.sukun},
}
m["lkj"] = {
"Remun",
7312239,
"poz-mly",
"Latn",
}
m["lkl"] = {
"Laeko-Libuat",
3504331,
"paa-trr",
"Latn",
}
m["lkm"] = {
"Kalaamaya",
6349988,
}
m["lkn"] = {
"Lakon",
3216494,
"poz-vnn",
"Latn",
}
m["lko"] = {
"Khayo",
6401095,
"bnt-msl",
}
m["lkr"] = {
"Päri",
36487,
"sdv-lon",
}
m["lks"] = {
"Kisa",
63259208,
"bnt-msl",
ancestors = "luy",
}
m["lkt"] = {
"Lakota",
33537,
"sio-dkt",
"Latn",
}
m["lku"] = {
"Kungkari",
6444526,
}
m["lky"] = {
"Lokoya",
56687,
"sdv-lma",
}
m["lla"] = {
"Lala-Roba",
3914878,
"alv-yun",
}
m["llb"] = {
"Lolo",
11006056,
"bnt-mak",
ancestors = "vmw",
}
m["llc"] = {
"Lele (Guinea)",
6520837,
"dmn-mok",
"Latn",
}
m["lld"] = {
"Ladin",
36202,
"roa-rhe",
"Latn",
}
m["lle"] = {
"Lele (New Guinea)",
3229269,
"poz-aay",
"Latn",
}
m["llf"] = {
"Hermit",
3134240,
"poz-aay",
"Latn",
}
m["llg"] = {
"Lole",
6668883,
"poz-tim",
}
m["llh"] = {
"Lamu",
6482736,
"tbq-lso",
}
m["lli"] = {
"Teke-Laali",
36543,
"bnt-nze",
}
m["llj"] = {
"Ladji-Ladji",
6512694,
"aus-pam",
"Latn",
}
m["llk"] = {
"Lelak",
3229263,
"poz-swa",
"Latn",
}
m["lll"] = {
"Lilau",
6547570,
"paa-mon",
"Latn",
}
m["llm"] = {
"Lasalimu",
6492774,
}
m["lln"] = {
"Lele (Chad)",
1641493,
"cdc-est",
}
-- llo: retired by ISO in 2019 as duplicate of ngt (Kriang); removed from Wiktionary 2026-02-01
m["llp"] = {
"North Efate",
3580152,
"poz-vnc",
"Latn",
}
m["llq"] = {
"Lolak",
12953679,
"phi",
}
m["lls"] = {
"Lithuanian Sign Language",
3915480,
"sgn",
}
m["llu"] = {
"Lau",
3218574,
"poz-sls",
"Latn",
}
m["llx"] = {
"Lauan",
35682,
"poz-pcc",
"Latn",
}
m["lma"] = {
"East Limba",
11034212,
"alv-lim",
}
m["lmb"] = {
"Merei",
12952843,
"poz-vnn",
"Latn",
}
m["lmc"] = {
"Limilngan",
6549414,
nil,
"Latn",
}
m["lmd"] = {
"Lumun",
35777,
"alv-tal",
}
m["lme"] = {
"Pévé",
56249,
"cdc-mas",
"Latn",
}
m["lmf"] = {
"South Lembata",
7567815,
}
m["lmg"] = {
"Lamogai",
278365,
"poz-ocw",
"Latn",
}
m["lmh"] = {
"Lambichhong",
6481472,
"sit-kie",
ancestors = "ybh",
}
m["lmi"] = {
"Lombi",
11259563,
"csu-maa",
}
m["lmj"] = {
"West Lembata",
6864697,
}
m["lmk"] = {
"Lamkang",
12952703,
"tbq-kuk",
}
m["lml"] = {
"Raga",
3063193,
"poz-vnn",
"Latn",
}
m["lmn"] = {
"Lambadi",
33474,
"raj",
"Latn",
}
m["lmo"] = {
	"Lombard",
	33754,
	"roa-git",
	"Latn",
	-- Named fields come after all positional ones, as in every other record. The script code
	-- still lands at index 4 either way; this only keeps the positional run contiguous.
	ancestors = "lmo-old",
}
m["lmp"] = {
"Limbum",
35801,
"nic-nka",
"Latn",
}
m["lmq"] = {
"Lamatuka",
6480982,
}
m["lmr"] = {
"Lamalera",
6480787,
}
m["lmu"] = {
"Lamenu",
740604,
"poz-vnc",
"Latn",
}
m["lmv"] = {
"Lomaiviti",
3130221,
"poz-pcc",
"Latn",
}
m["lmw"] = {
"Lake Miwok",
3216471,
"nai-utn",
"Latn",
}
m["lmx"] = {
"Laimbue",
6473933,
"nic-rnw",
}
m["lmy"] = {
"Laboya",
6481538,
"poz-cet",
"Latn",
sort_key = "lmy-sortkey",
}
-- Lumbee [lmz] is spurious
m["lna"] = {
"Langbashe",
11137550,
"bad",
}
m["lnb"] = {
"Mbalanhu",
12952830,
"bnt-ova",
}
m["lnd"] = {
"Lun Bawang",
13479839,
"poz-swa",
"Latn",
}
m["lnh"] = {
"Lanoh",
6487291,
"mkh-asl",
}
m["lni"] = {
"Daantanai'",
5207384,
"paa-sbo",
"Latn",
}
m["lnj"] = {
"Linngithigh",
3915694,
"aus-pmn",
"Latn",
}
m["lnl"] = {
"South Central Banda",
41354532,
"bad",
}
m["lnm"] = {
"Pondi",
6485678,
"paa-wke",
"Latn",
}
m["lnn"] = {
"Lorediakarkar",
6680287,
"poz-vnn",
"Latn",
}
m["lno"] = {
"Lango (Sudan)",
223306,
"sdv-lma",
}
m["lns"] = {
"Lamnso'",
35788,
"nic-rng",
}
m["lnu"] = {
"Longuda",
35797,
"alv-bam",
"Latn",
}
m["lnw"] = {
"Lanima",
56825017,
"aus-pam",
"Latn",
}
m["loa"] = {
"Loloda",
6669025,
"paa-lla",
"Latn",
}
m["lob"] = {
"Lobi",
35807,
}
m["loc"] = {
"Inonhan",
2400870,
"phi",
"Latn",
}
m["lod"] = {
"Berawan",
4891018,
"poz-swa",
"Latn",
}
m["loe"] = {
"Saluan",
12953867,
"poz",
"Latn",
}
m["lof"] = {
"Logol",
35779,
"alv-hei",
}
m["log"] = {
"Logo",
2613477,
"csu-mma",
}
m["loh"] = {
"Narim",
56353,
"sdv",
}
m["loi"] = {
"Lomakka",
3913961,
"alv-kul",
}
m["loj"] = {
"Lou",
3260104,
"poz-aay",
"Latn",
}
m["lok"] = {
"Loko",
3914912,
"dmn-msw",
"Latn",
}
m["lol"] = {
"Mongo",
112893,
"bnt-mon",
"Latn",
}
m["lom"] = {
"Loma",
35885,
"dmn-msw",
"Latn, Loma"
}
m["lon"] = {
"Malawi Lomwe",
10975286,
"bnt-mak",
"Latn",
}
m["loo"] = {
"Lombo",
11167192,
"bnt-ske",
}
m["lop"] = {
"Lopa",
3914875,
}
m["loq"] = {
"Lobala",
4849710,
"bnt-ngn",
}
m["lor"] = {
"Téén",
36467,
"alv-kul",
}
m["los"] = {
"Loniu",
3259202,
"poz-aay",
"Latn",
}
m["lot"] = {
"Lotuko",
56672,
"sdv-lma",
}
m["lou"] = {
"Louisiana Creole",
1185127,
"crp",
"Latn",
ancestors = "fr",
sort_key = s["roa-oil-sortkey"],
}
m["lov"] = {
"Lopi",
12952740,
"tbq-tal",
}
m["low"] = {
"Tampias Lobu",
12953674,
}
m["lox"] = {
"Loun",
6689636,
"poz-cet",
"Latn",
}
m["loz"] = {
"Lozi",
33628,
"bnt-sts",
"Latn",
}
m["lpa"] = {
"Lelepa",
3229273,
"poz-vnc",
"Latn",
}
m["lpe"] = {
"Lepki",
4259152,
"paa-lmu",
"Latn",
}
m["lpn"] = {
"Long Phuri Naga",
6673049,
"sit-aao",
}
m["lpo"] = {
"Lipo",
56921,
"tbq-llo",
"Plrd",
}
m["lpx"] = {
"Lopit",
56684,
"sdv-lma",
}
m["lra"] = {
"Rara Bakati'",
3419746,
"day",
}
m["lrc"] = {
"Northern Luri",
19933293,
"ira-swi",
"fa-Arab",
ancestors = "pal",
}
m["lre"] = {
"Laurentian",
1790301,
"iro-nor",
"Latn",
}
m["lrg"] = {
"Laragia",
2591193,
}
m["lri"] = {
"Marachi",
6754565,
"bnt-msl",
}
m["lrk"] = {
"Loarki",
6663513,
}
m["lrl"] = {
"Larestani",
33468,
"ira-swi",
"fa-Arab",
}
m["lrm"] = {
"Marama",
6325931,
"bnt-msl",
ancestors = "luy",
}
m["lrn"] = {
"Lorang",
6678781,
}
m["lro"] = {
"Laro",
35687,
"alv-hei",
}
m["lrr"] = {
"Southern Lorung",
12952742,
"sit-kie",
}
m["lrt"] = {
"Larantuka Malay",
6488691,
"poz-mly",
"Latn",
}
m["lrv"] = {
"Larëvat",
3217892,
"poz-vnc",
"Latn",
}
m["lrz"] = {
"Lemerig",
2028448,
"poz-vnn",
"Latn",
}
m["lsa"] = {
"Lasgerdi",
3218296,
"ira-kms",
"Arab",
}
m["lsd"] = {
"Lishana Deni",
3436461,
"sem-nna",
"Hebr",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lse"] = {
"Lusengo",
6683546,
"bnt-zbi",
}
m["lsh"] = {
"Lish",
6558822,
"sit-khc",
}
m["lsi"] = {
"Lashi",
6493203,
"tbq-brm",
"Latn",
}
m["lsl"] = {
"Latvian Sign Language",
6497414,
"sgn",
}
m["lsm"] = {
"Saamia",
3739441,
"bnt-msl",
}
m["lsn"] = {
"Tibetan Sign Language",
15936110,
"sgn",
}
m["lso"] = {
"Laos Sign Language",
6488022,
"sgn",
}
m["lsp"] = {
"Panamanian Sign Language",
7129968,
"sgn",
}
m["lsr"] = {
"Aruop",
3450566,
"paa-pal",
"Latn",
}
m["lss"] = {
"Lasi",
12953669,
"inc-snd",
"Arab",
ancestors = "sd",
}
m["lst"] = {
"Trinidad and Tobago Sign Language",
7842495,
"sgn",
}
m["lsv"] = {
"Sivia Sign Language",
55558911,
"sgn",
}
m["lsy"] = {
"Mauritian Sign Language",
6793754,
"sgn",
}
m["ltc"] = {
"Middle Chinese",
2016252,
"zhx",
"Hant, Phag, Tang",
translit = {Hant = "zh-translit"},
-- Tang translit in [[Module:scripts/data]]; NOTE: Previously not present, presumably an accidental omission.
sort_key = {Hant = "Hani-sortkey"},
}
m["ltg"] = {
"Latgalian",
36212,
"bat-eas",
"Latn",
}
m["lti"] = {
"Leti",
3236912,
"poz-tim",
"Latn",
}
m["ltn"] = {
"Latundê",
63259736,
"sai-nmk",
"Latn",
}
m["lto"] = {
"Olutsotso",
63259915,
"bnt-msl",
ancestors = "luy",
}
m["lts"] = {
"Lutachoni",
63283459,
"bnt-msl",
}
m["ltu"] = {
"Latu",
6497181,
"poz-cma",
}
m["lua"] = {
"Luba-Kasai",
34173,
"bnt-lub",
"Latn",
}
m["luc"] = {
"Aringa",
56556,
"csu-mma",
"Latn",
}
m["lud"] = {
"Ludian",
33918,
"urj-fin",
"Latn",
-- The typewriter apostrophe is replaced by ʹ, both for display and in strip_diacritics.
display_text = {
from = {"'"},
to = {"ʹ"}
},
strip_diacritics = {
from = {"'"},
to = {"ʹ"}
},
-- Sort key: letters are rewritten as a base letter plus an entry of `p`
-- (m_langdata.puaChars). š, z, ž become s + p[1], p[2], p[3] and ü, ä, ö, ʹ become
-- y + p[1]..p[4], which presumably sorts them after s and y in that order (assumes
-- p[1] < p[2] < ... — TODO confirm). č becomes c + p[1].
-- The "2 chars" / "1 char" remarks below presumably refer to the length of each source
-- letter in decomposed form — verify against the sort-key code.
sort_key = {
from = {
"č", "š", "ž", "ü", "ä", "ö", -- 2 chars
"z", "ʹ" -- 1 char
},
to = {
"c" .. p[1], "s" .. p[1], "s" .. p[3], "y" .. p[1], "y" .. p[2], "y" .. p[3],
"s" .. p[2], "y" .. p[4],
}
},
}
m["lue"] = {
"Luvale",
33597,
"bnt-clu",
"Latn",
}
m["luf"] = {
"Laua",
6497673,
"paa-mal",
"Latn",
}
m["luh"] = {
"Leizhou Min",
1988433,
"zhx-nan",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["lui"] = {
"Luiseño",
56236,
"azc-cup",
"Latn",
strip_diacritics = {remove_diacritics = c.acute .. c.circ},
}
m["luj"] = {
"Luna",
11003832,
"bnt-lbn",
}
m["luk"] = {
"Lunanakha",
56446,
"sit-tib",
"Tibt",
ancestors = "dz",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lul"] = {
"Olu'bo",
6589401,
"csu-mma",
}
m["lum"] = {
"Luimbi",
10963134,
"bnt-clu",
}
m["lun"] = {
"Lunda",
33607,
"bnt-lun",
"Latn",
}
m["luo"] = {
"Luo",
5414796,
"sdv-los",
"Latn",
}
m["lup"] = {
"Lumbu",
35793,
"bnt-sir",
}
m["luq"] = {
"Lucumí",
1768321,
"alv-yor",
"Latn",
ancestors = "yo",
sort_key = {
remove_diacritics = c.acute,
},
}
m["lur"] = {
"Laura",
2984540,
}
m["lus"] = {
"Mizo",
36147,
"tbq-kuk",
"Latn",
}
m["lut"] = {
"Lushootseed",
33658,
"sal",
"Latn",
}
m["luu"] = {
"Lumba-Yakkha",
6703050,
"sit-kie",
ancestors = "ybh",
}
m["luv"] = {
"Luwati",
33402,
"inc-snd",
"Khoj",
}
m["luy"] = {
"Luhya",
35893,
"bnt-msl",
"Latn",
}
m["luz"] = {
"Southern Luri",
12952748,
"ira-swi",
"fa-Arab",
ancestors = "pal",
}
m["lva"] = {
"Maku'a",
35790,
"poz-tim",
}
m["lvi"] = {
"Lawi",
6502657,
"mkh-ban",
"Latn",
}
m["lvk"] = {
"Lavukaleve",
770547,
"qfa-dis", -- Papuan; isolate in Glottolog; in the tentative Central Solomons family by Ross (2005) and Pedrós
-- (2015)
"Latn",
}
m["lvl"] = {
"Lwel",
93936908,
"bnt-bdz",
"Latn",
}
m["lvu"] = {
"Levuka",
6535860,
}
m["lwa"] = {
"Lwalu",
6706953,
"bnt-lbn",
}
m["lwe"] = {
"Lewo Eleng",
6537465,
}
m["lwg"] = {
"Wanga",
nil,
"bnt-msl",
ancestors = "luy",
}
m["lwh"] = {
"White Lachi",
8842956,
"qfa-kra",
}
m["lwl"] = {
"Eastern Lawa",
18644464,
"mkh-pal",
"Thai",
sort_key = "Thai-sortkey",
}
m["lwm"] = {
"Laomian",
19597674,
"tbq-bis",
}
m["lwo"] = {
"Luwo",
56362,
"sdv-lon",
"Latn",
}
m["lws"] = {
"Malawian Sign Language",
47522462,
"sgn",
}
m["lwt"] = {
"Lewotobi",
14916885,
}
m["lwu"] = {
"Lawu",
6505073,
"tbq-lwo",
}
m["lww"] = {
"Lewo",
3237321,
"poz-vnc",
"Latn",
}
m["lya"] = {
"Layakha",
56602,
"sit-tib",
"Tibt",
ancestors = "dz",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lyg"] = {
"Lyngngam",
12635902,
"aav-pkl",
}
m["lyn"] = {
"Luyana",
3268098,
}
m["lzh"] = {
"Classical Chinese",
37041,
"zhx",
"Hant",
wikimedia_codes = "zh-classical",
translit = "zh-translit",
sort_key = "Hani-sortkey",
}
m["lzl"] = {
"Litzlitz",
6653424,
"poz-vnc",
"Latn",
}
m["lzn"] = {
"Leinong Naga",
5924455,
"sit-kch",
}
m["lzz"] = {
"Laz",
1160372,
"ccs-zan",
"Geor, Latn",
translit = {Geor = "lzz-translit"},
override_translit = true,
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ},
}
-- Pass the assembled table `m` to finalizeData from [[Module:languages]], tagged as
-- "language" data, and return whatever it produces as this module's value.
local m_languages = require("Module:languages")
return m_languages.finalizeData(m, "language")
6k294u12958415w2stzdehtw2q5svjz
234838
234837
2026-05-24T09:07:24Z
Lee
19
[[:en:Module:languages/data/3/l]] වෙතින් එක් සංශෝධනයක්
234837
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy proxy for the `char` function of [[Module:string utilities]]. The module is only
-- required the first time `u` is called, because the data may never need it. That first
-- call rebinds the local `u` to the real function, so later calls bypass this wrapper.
local function u(...)
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
m["laa"] = {
"Lapuyan Subanun",
12635302,
"phi",
}
m["lab"] = {
"Linear A",
nil,
"qfa-unc", -- undeciphered
"Lina",
}
m["lac"] = {
"Lacandon",
35766,
"myn",
"Latn",
}
m["lad"] = {
"Ladino",
36196,
"roa-cas",
"Hebr, Latn, Cyrl",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lae"] = {
"Pattani",
7148323,
"sit-whm",
}
m["laf"] = {
"Lafofa",
35711,
"alv",
}
m["lag"] = {
"Langi",
584983,
"bnt-mra",
}
m["lah"] = {
"Lahnda",
1334774,
"inc-pan",
"pa-Arab",
}
m["lai"] = {
"Lambya",
6481626,
"bnt-mby",
"Latn",
}
m["laj"] = {
"Lango (Uganda)",
35670,
"sdv-los",
"Latn",
}
m["lak"] = {
"Laka",
6474529, -- also Q55616620
"csu-sar", -- formerly classified as "alv-mbm"; see [[w:Lau Laka language]]
}
m["lam"] = {
"Lamba",
36098,
"bnt-sbi",
"Latn",
}
m["lan"] = {
"Laru",
3913987,
"nic-knj",
"Latn",
}
m["lap"] = {
"Kabba-Laka",
6474528,
"csu-sar",
"Latn",
}
m["laq"] = {
"Qabiao",
3436700,
"qfa-kra",
}
m["lar"] = {
"Larteh",
35639,
"alv-gng",
"Latn",
}
m["las"] = {
"Gur Lama",
35652,
"nic-gne",
"Latn",
}
m["lau"] = {
"Laba",
12952694,
"paa-lla",
"Latn",
}
m["law"] = {
"Lauje",
6498258,
"poz",
"Latn",
}
m["lax"] = {
"Tiwa",
7810466,
"tbq-bdg",
"Latn, as-Beng",
}
m["lay"] = {
"Lama Bai",
6480756,
"sit-nba",
"Hani, Latn",
sort_key = {Hani = "Hani-sortkey"},
}
m["laz"] = {
"Aribwatsa",
3502104,
"poz-ocw",
"Latn",
}
m["lbb"] = {
"Label",
3214296,
"poz-ocw",
"Latn",
}
m["lbc"] = {
"Lakkia",
3027879,
"qfa-tak",
}
m["lbe"] = {
"Lak",
36206,
"cau-nec",
"Cyrl, Latn, Arab, Geor",
translit = {
Cyrl = "lbe-translit",
-- Geor translit in [[Module:scripts/data]]
},
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
sort_key = "lbe-sortkey",
}
m["lbf"] = {
"Tinani",
784502,
"sit-whm",
}
m["lbg"] = {
"Laopang",
12952711,
"tbq-bis",
}
m["lbi"] = {
"La'bi",
6460637,
"alv-mbm",
}
m["lbj"] = {
"Ladakhi",
35833,
"sit-lab",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lbk"] = {
"Central Bontoc",
63257803,
"phi",
"Latn",
}
m["lbl"] = {
"Libon Bikol",
18664462,
"phi",
"Latn",
}
m["lbm"] = {
"Lodhi",
6666374,
"mun",
}
m["lbn"] = {
"Lamet",
3216723,
"mkh-pal",
"Laoo, Latn",
}
m["lbo"] = {
"Laven",
6298648,
"mkh-ban",
"Latn",
}
m["lbq"] = {
"Wampar",
7966946,
"poz-ocw",
"Latn",
}
m["lbr"] = {
"Northern Lorung",
6668040,
"sit-kie",
"Deva",
}
m["lbs"] = {
"Libyan Sign Language",
11775688,
"sgn",
}
m["lbt"] = {
"Lachi",
6583606,
"qfa-kra",
}
m["lbu"] = {
"Labu",
6467660,
"poz-ocw",
"Latn",
}
m["lbv"] = {
"Lavatbura-Lamusong",
2405981,
"poz-ocw",
"Latn",
}
m["lbw"] = {
"Tolaki",
3033597,
"poz-btk",
"Latn",
}
m["lbx"] = {
"Lawangan",
3120345,
"poz-bre",
"Latn",
}
m["lby"] = {
"Lamu-Lamu",
6482727,
nil,
"Latn",
}
m["lbz"] = {
"Lardil",
3915688,
"aus-tnk",
"Latn",
}
m["lcc"] = {
"Legenyem",
12952713,
"poz-hce",
"Latn",
}
m["lcd"] = {
"Lola",
6668867,
"poz-cet",
"Latn",
}
m["lce"] = {
"Loncong",
3058192,
}
m["lcf"] = {
"Lubu",
3264685,
}
m["lch"] = {
"Luchazi",
3265143,
"bnt-clu",
}
m["lcl"] = {
"Lisela",
6558753,
"poz-cma",
"Latn",
}
m["lcm"] = {
"Tungag",
3542085,
"poz-ocw",
"Latn",
}
m["lcp"] = {
"Western Lawa",
18644465,
"mkh-pal",
"Thai",
sort_key = "Thai-sortkey",
}
m["lcq"] = {
"Luhu",
6699890,
"poz-cma",
"Latn",
}
m["lcs"] = {
"Lisabata-Nuniali",
6558534,
}
m["lda"] = {
"Kla",
63257856,
"dmn-mda",
"Latn",
}
m["ldb"] = {
"Idun",
3914441,
"nic-plc",
"Latn",
}
m["ldd"] = {
"Luri (Nigeria)",
4701277,
"cdc-wst",
}
m["ldg"] = {
"Lenyima",
3914423,
"nic-uce",
"Latn",
}
m["ldh"] = {
"Lamja-Dengsa-Tola",
11001739,
"nic-dak",
}
m["ldj"] = {
"Lemoro",
3912761,
"nic-jer",
}
m["ldk"] = {
"Leelau",
3914465,
"alv-bwj",
}
m["ldl"] = {
"Kaan",
3914501,
"alv-yun",
}
m["ldm"] = {
"Landoma",
35568,
"alv-mel",
}
m["ldn"] = {
"Láadan",
35757,
"art",
"Latn",
type = "appendix-constructed",
}
m["ldo"] = {
"Loo",
3915378,
"alv-bwj",
}
m["ldp"] = {
"Tso",
3913953,
"alv-wjk",
}
m["ldq"] = {
"Lufu",
35796,
"nic-ykb",
"Latn",
}
m["lea"] = {
"Lega-Shabunda",
12952719,
"bnt-lgb",
}
m["leb"] = {
"Lala-Bisa",
6480112,
"bnt-sbi",
}
m["lec"] = {
"Leco",
2625398,
"qfa-iso",
}
m["led"] = {
"Lendu",
523823,
"csu-lnd",
"Latn",
}
m["lee"] = {
"Lyélé",
3089032,
"nic-gnn",
}
m["lef"] = {
"Lelemi",
35585,
"alv-ntg",
}
m["leh"] = {
"Lenje",
6522666,
"bnt-bot",
}
m["lei"] = {
"Lemio",
6521165,
"ngf-rai",
"Latn",
}
m["lej"] = {
"Lengola",
6522474,
"bnt-leb",
}
m["lek"] = {
"Leipon",
3229216,
"poz-aay",
"Latn",
}
m["lel"] = {
"Lele (Congo)",
56733,
"bnt-bsh",
}
m["lem"] = {
"Nomaande",
13479983,
"nic-mbw",
"Latn",
}
m["len"] = {
"Honduran Lenca",
36189,
"nai-len",
"Latn",
}
m["leo"] = {
"Mengisa",
1345684,
"nic-mba",
ancestors = "bag",
}
m["lep"] = {
"Lepcha",
35990,
"sit",
"Lepc",
translit = "lep-translit",
}
m["leq"] = {
"Lembena",
6521067,
"ngf-enc",
"Latn",
}
m["ler"] = {
"Lenkau",
3229472,
"poz-aay",
"Latn",
}
m["les"] = {
"Lese",
11033939,
"csu-mle",
}
m["let"] = {
"Lesing-Gelimi",
12635445,
"poz-ocw",
"Latn",
}
m["leu"] = {
"Kara (New Guinea)",
3192889,
"poz-ocw",
"Latn",
}
m["lev"] = {
"Lamma",
6583582,
"paa-alp",
"Latn",
}
m["lew"] = { -- this code was basically assigned as a catch-all for things that aren't brs, kzf or unz
"Ledo Kaili",
35877,
"poz-kal",
"Latn",
}
m["lex"] = {
"Luang",
6695015,
"poz-tim",
"Latn",
}
m["ley"] = {
"Lemolang",
3033560,
"poz-ssw",
}
m["lez"] = {
"Lezgi",
31746,
"cau-esm",
"Cyrl, Latn, Arab",
translit = "lez-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
}
m["lfa"] = {
"Lefa",
35643,
"bnt-baf",
}
m["lfn"] = {
"Lingua Franca Nova",
146803,
"art",
"Latn, Cyrl",
type = "appendix-constructed",
}
m["lga"] = {
"Lungga",
3267590,
"poz-ocw",
"Latn",
}
m["lgb"] = {
"Laghu",
3216169,
"poz-ocw",
"Latn",
}
-- Lugbara (Latin script).
-- strip_diacritics removes the acute and grave marks taken from `c`, and additionally
-- pairs the letters in `from` with the letters at the same position in `to`.
m["lgg"] = {
	"Lugbara",
	3272737,
	"csu-mma",
	"Latn",
	strip_diacritics = {
		remove_diacritics = c.acute .. c.grave,
		-- NOTE(review): "ë" is paired with "i" and "ö" with "u" rather than with their
		-- own base letters; confirm against the Lugbara orthography that this is intended.
		from = { "ä", "ɛ", "ë", "ï", "ɔ", "ö" },
		to = { "a", "e", "i", "i", "o", "u" },
	},
}
m["lgh"] = {
"Laghuu",
6472114,
"tbq-muj",
}
m["lgi"] = {
"Lengilu",
6522465,
"poz-swa",
"Latn",
}
m["lgk"] = {
"Neverver",
3241515,
"poz-vnc",
"Latn",
}
m["lgl"] = {
"Wala",
3565284,
"poz-sls",
}
m["lgm"] = {
"Lega-Mwenga",
14916883,
"bnt-lgb",
}
m["lgn"] = {
"Opuuo",
3354339,
"ssa-kom",
}
m["lgq"] = {
"Logba",
35813,
"alv-ntg",
"Latn",
}
m["lgr"] = {
"Lengo",
3229454,
"poz-sls",
"Latn",
}
m["lgs"] = {
"Guinea-Bissau Sign Language",
5616441,
"sgn",
}
m["lgt"] = {
"Pahi",
7124545,
"paa-sep",
"Latn",
}
m["lgu"] = {
"Longgu",
3259105,
"poz-sls",
}
m["lgz"] = {
"Ligenza",
5531038,
"bnt-bun",
}
m["lha"] = {
"Laha (Vietnam)",
3112363,
"qfa-kra",
}
m["lhh"] = {
"Laha (Indonesia)",
6473107,
"poz-cma",
"Latn",
}
m["lhi"] = {
"Lahu Shi",
25559457,
"tbq-lho",
}
m["lhl"] = {
"Lahul Lohar",
12953672,
}
m["lhn"] = {
"Lahanan",
12953660,
"poz-bnn",
"Latn",
}
m["lhp"] = {
"Lhokpu",
3436603,
"sit-dhi",
}
m["lhs"] = {
"Mlahsö",
3393063,
"sem-cna",
"Syrc",
}
m["lht"] = {
"Lo-Toga",
3257566,
"poz-vnn",
"Latn",
}
m["lhu"] = {
"Lahu",
35780,
"tbq-lho",
"Latn",
}
m["lia"] = {
"West-Central Limba",
32867815,
"alv-lim",
}
m["lib"] = {
"Likum",
3240737,
"poz-aay",
"Latn",
}
m["lic"] = {
"Hlai",
934738,
"qfa-lic",
"Latn",
}
m["lid"] = {
"Nyindrou",
3346666,
"poz-aay",
"Latn",
}
m["lie"] = {
"Likila",
11011614,
"bnt-ngn",
}
m["lif"] = {
"Limbu",
56477,
"sit-kir",
"Limb, Latn, Deva",
translit = "lif-translit",
}
m["lig"] = {
"Ligbi",
33594,
"dmn-jje",
}
m["lih"] = {
"Lihir",
6546938,
"poz-ocw",
"Latn",
}
m["lii"] = {
"Lingkhim",
12635536,
}
-- Ligurian. The four positional fields are kept together ahead of the named field, as in
-- the other entries of this table. Lua numbers positional constructor items independently
-- of any named fields between them, so "Latn" is still stored at index 4.
m["lij"] = {
	"Ligurian",
	36106,
	"roa-git",
	"Latn",
	ancestors = "lij-old",
}
m["lik"] = {
"Lika",
1530394,
"bnt-boa",
}
m["lil"] = {
"Lillooet",
34154,
"sal",
"Latn",
}
m["lio"] = {
"Liki",
4261493,
"poz-ocw",
"Latn",
}
m["lip"] = {
"Sekpele",
36257,
"alv-ntg",
}
m["liq"] = {
"Libido",
35691,
"cus-hec",
}
m["lir"] = {
"Liberian Kreyol",
6541128,
"crp",
"Latn",
ancestors = "en",
}
m["lis"] = {
"Lisu",
56480,
"tbq-lso",
"Lisu, Latn",
override_translit = true,
-- Lisu translit, sort_key in [[Module:scripts/data]]
}
m["liu"] = {
"Logorik",
6667811,
"sdv-daj",
}
-- Livonian (Latin script).
-- display_text pairs the ASCII apostrophe "'" with the typographic "’".
m["liv"] = {
"Livonian",
33698,
"urj-fin",
"Latn",
display_text = {
from = {"'"},
to = {"’"}
},
-- strip_diacritics lists the apostrophes as characters to remove and pairs "Ǭ"/"ǭ" with
-- "Ō"/"ō".
-- NOTE(review): the string literal already appears to end in "’" (U+2019), and u(0x2019)
-- appends U+2019 again. Confirm whether one of the two was meant to be a different
-- apostrophe; if not, the u() call is redundant and forces [[Module:string utilities]]
-- to load.
strip_diacritics = {
remove_diacritics = "'’" .. u(0x2019),
from = {"Ǭ", "ǭ"},
to = {"Ō", "ō"}
},
-- `from` and `to` are parallel lists, laid out one base letter per row: each marked letter
-- is paired with its base letter followed by an entry of `p`, numbered in the order the
-- variants are listed in that row.
sort_key = {
from = {
"ā", "ä", "ǟ",
"ḑ",
"ē",
"ī",
"ļ",
"ņ",
"ō", "ȯ", "ȱ", "õ", "ȭ", "ö", "ȫ",
"ŗ",
"š",
"ț",
"ū", "ü", "ṻ",
"ȳ",
"ž",
},
to = {
"a" .. p[1], "a" .. p[2], "a" .. p[3],
"d" .. p[1],
"e" .. p[1],
"i" .. p[1],
"l" .. p[1],
"n" .. p[1],
"o" .. p[1], "o" .. p[2], "o" .. p[3], "o" .. p[4], "o" .. p[5], "o" .. p[6], "o" .. p[7],
"r" .. p[1],
"s" .. p[1],
"t" .. p[1],
"u" .. p[1], "u" .. p[2], "u" .. p[3],
"y" .. p[1],
"z" .. p[1],
}
}
}
m["liw"] = {
"Col",
2981948,
}
m["lix"] = {
"Liabuku",
13580912,
}
m["liy"] = {
"Banda-Bambari",
11051591,
"bad-cnt",
"Latn",
}
m["liz"] = {
"Libinza",
4914576,
"bnt-zbi",
}
m["lja"] = {
"Golpa",
50934920,
"aus-yol",
"Latn",
}
m["lje"] = {
"Rampi",
7290041,
"poz",
}
m["lji"] = {
"Laiyolo",
6474218,
"poz-wot",
"Latn",
}
m["ljl"] = {
"Li'o",
2697010,
"poz",
"Latn",
}
m["ljp"] = {
"Lampung Api",
49215,
"poz-lgx",
"Latn",
}
m["ljw"] = {
"Yirandali",
17059380,
}
m["ljx"] = {
"Yuru",
63257867,
}
m["lka"] = {
"Lakalei",
12952700,
"poz-tim",
"Latn",
}
m["lkb"] = {
"Kabras",
63257894,
"bnt-msl",
ancestors = "luy",
}
m["lkc"] = {
"Kucong",
6441572,
"tbq-lho",
}
m["lkd"] = {
"Lakondê",
20527166,
"sai-nmk",
"Latn",
}
m["lke"] = {
"Kenyi",
12952628,
"bnt-nyg",
}
m["lkh"] = {
"Lakha",
56606,
"sit-tib",
}
m["lki"] = {
"Laki",
56483,
"ku",
"fa-Arab",
translit = "lki-translit",
strip_diacritics = {remove_diacritics = c.kasra .. c.sukun},
}
m["lkj"] = {
"Remun",
7312239,
"poz-mly",
"Latn",
}
m["lkl"] = {
"Laeko-Libuat",
3504331,
"paa-trr",
"Latn",
}
m["lkm"] = {
"Kalaamaya",
6349988,
}
m["lkn"] = {
"Lakon",
3216494,
"poz-vnn",
"Latn",
}
m["lko"] = {
"Khayo",
6401095,
"bnt-msl",
}
m["lkr"] = {
"Päri",
36487,
"sdv-lon",
}
m["lks"] = {
"Kisa",
63259208,
"bnt-msl",
ancestors = "luy",
}
m["lkt"] = {
"Lakota",
33537,
"sio-dkt",
"Latn",
}
m["lku"] = {
"Kungkari",
6444526,
}
m["lky"] = {
"Lokoya",
56687,
"sdv-lma",
}
m["lla"] = {
"Lala-Roba",
3914878,
"alv-yun",
}
m["llb"] = {
"Lolo",
11006056,
"bnt-mak",
ancestors = "vmw",
}
m["llc"] = {
"Lele (Guinea)",
6520837,
"dmn-mok",
"Latn",
}
m["lld"] = {
"Ladin",
36202,
"roa-rhe",
"Latn",
}
m["lle"] = {
"Lele (New Guinea)",
3229269,
"poz-aay",
"Latn",
}
m["llf"] = {
"Hermit",
3134240,
"poz-aay",
"Latn",
}
m["llg"] = {
"Lole",
6668883,
"poz-tim",
}
m["llh"] = {
"Lamu",
6482736,
"tbq-lso",
}
m["lli"] = {
"Teke-Laali",
36543,
"bnt-nze",
}
m["llj"] = {
"Ladji-Ladji",
6512694,
"aus-pam",
"Latn",
}
m["llk"] = {
"Lelak",
3229263,
"poz-swa",
"Latn",
}
m["lll"] = {
"Lilau",
6547570,
"paa-mon",
"Latn",
}
m["llm"] = {
"Lasalimu",
6492774,
}
m["lln"] = {
"Lele (Chad)",
1641493,
"cdc-est",
}
-- llo: retired by ISO in 2019 as duplicate of ngt (Kriang); removed from Wiktionary 2026-02-01
m["llp"] = {
"North Efate",
3580152,
"poz-vnc",
"Latn",
}
m["llq"] = {
"Lolak",
12953679,
"phi",
}
m["lls"] = {
"Lithuanian Sign Language",
3915480,
"sgn",
}
m["llu"] = {
"Lau",
3218574,
"poz-sls",
"Latn",
}
m["llx"] = {
"Lauan",
35682,
"poz-pcc",
"Latn",
}
m["lma"] = {
"East Limba",
11034212,
"alv-lim",
}
m["lmb"] = {
"Merei",
12952843,
"poz-vnn",
"Latn",
}
m["lmc"] = {
"Limilngan",
6549414,
nil,
"Latn",
}
m["lmd"] = {
"Lumun",
35777,
"alv-tal",
}
m["lme"] = {
"Pévé",
56249,
"cdc-mas",
"Latn",
}
m["lmf"] = {
"South Lembata",
7567815,
}
m["lmg"] = {
"Lamogai",
278365,
"poz-ocw",
"Latn",
}
m["lmh"] = {
"Lambichhong",
6481472,
"sit-kie",
ancestors = "ybh",
}
m["lmi"] = {
"Lombi",
11259563,
"csu-maa",
}
m["lmj"] = {
"West Lembata",
6864697,
}
m["lmk"] = {
"Lamkang",
12952703,
"tbq-kuk",
}
m["lml"] = {
"Raga",
3063193,
"poz-vnn",
"Latn",
}
m["lmn"] = {
"Lambadi",
33474,
"raj",
"Latn",
}
-- Lombard. The four positional fields are kept together ahead of the named field, as in
-- the other entries of this table. Lua numbers positional constructor items independently
-- of any named fields between them, so "Latn" is still stored at index 4.
m["lmo"] = {
	"Lombard",
	33754,
	"roa-git",
	"Latn",
	ancestors = "lmo-old",
}
m["lmp"] = {
"Limbum",
35801,
"nic-nka",
"Latn",
}
m["lmq"] = {
"Lamatuka",
6480982,
}
m["lmr"] = {
"Lamalera",
6480787,
}
m["lmu"] = {
"Lamenu",
740604,
"poz-vnc",
"Latn",
}
m["lmv"] = {
"Lomaiviti",
3130221,
"poz-pcc",
"Latn",
}
m["lmw"] = {
"Lake Miwok",
3216471,
"nai-utn",
"Latn",
}
m["lmx"] = {
"Laimbue",
6473933,
"nic-rnw",
}
m["lmy"] = {
"Laboya",
6481538,
"poz-cet",
"Latn",
sort_key = "lmy-sortkey",
}
-- Lumbee [lmz] is spurious
m["lna"] = {
"Langbashe",
11137550,
"bad",
}
m["lnb"] = {
"Mbalanhu",
12952830,
"bnt-ova",
}
m["lnd"] = {
"Lun Bawang",
13479839,
"poz-swa",
"Latn",
}
m["lnh"] = {
"Lanoh",
6487291,
"mkh-asl",
}
m["lni"] = {
"Daantanai'",
5207384,
"paa-sbo",
"Latn",
}
m["lnj"] = {
"Linngithigh",
3915694,
"aus-pmn",
"Latn",
}
m["lnl"] = {
"South Central Banda",
41354532,
"bad",
}
m["lnm"] = {
"Pondi",
6485678,
"paa-wke",
"Latn",
}
m["lnn"] = {
"Lorediakarkar",
6680287,
"poz-vnn",
"Latn",
}
m["lno"] = {
"Lango (Sudan)",
223306,
"sdv-lma",
}
m["lns"] = {
"Lamnso'",
35788,
"nic-rng",
}
m["lnu"] = {
"Longuda",
35797,
"alv-bam",
"Latn",
}
m["lnw"] = {
"Lanima",
56825017,
"aus-pam",
"Latn",
}
m["loa"] = {
"Loloda",
6669025,
"paa-lla",
"Latn",
}
m["lob"] = {
"Lobi",
35807,
}
m["loc"] = {
"Inonhan",
2400870,
"phi",
"Latn",
}
m["lod"] = {
"Berawan",
4891018,
"poz-swa",
"Latn",
}
m["loe"] = {
"Saluan",
12953867,
"poz",
"Latn",
}
m["lof"] = {
"Logol",
35779,
"alv-hei",
}
m["log"] = {
"Logo",
2613477,
"csu-mma",
}
m["loh"] = {
"Narim",
56353,
"sdv",
}
m["loi"] = {
"Lomakka",
3913961,
"alv-kul",
}
m["loj"] = {
"Lou",
3260104,
"poz-aay",
"Latn",
}
m["lok"] = {
"Loko",
3914912,
"dmn-msw",
"Latn",
}
m["lol"] = {
"Mongo",
112893,
"bnt-mon",
"Latn",
}
-- Loma, written in the Latin and Loma scripts. The last field carries a trailing comma
-- like the other entries; this does not change the resulting table.
m["lom"] = {
	"Loma",
	35885,
	"dmn-msw",
	"Latn, Loma",
}
m["lon"] = {
"Malawi Lomwe",
10975286,
"bnt-mak",
"Latn",
}
m["loo"] = {
"Lombo",
11167192,
"bnt-ske",
}
m["lop"] = {
"Lopa",
3914875,
}
m["loq"] = {
"Lobala",
4849710,
"bnt-ngn",
}
m["lor"] = {
"Téén",
36467,
"alv-kul",
}
m["los"] = {
"Loniu",
3259202,
"poz-aay",
"Latn",
}
m["lot"] = {
"Lotuko",
56672,
"sdv-lma",
}
m["lou"] = {
"Louisiana Creole",
1185127,
"crp",
"Latn",
ancestors = "fr",
sort_key = s["roa-oil-sortkey"],
}
m["lov"] = {
"Lopi",
12952740,
"tbq-tal",
}
m["low"] = {
"Tampias Lobu",
12953674,
}
m["lox"] = {
"Loun",
6689636,
"poz-cet",
"Latn",
}
m["loz"] = {
"Lozi",
33628,
"bnt-sts",
"Latn",
}
m["lpa"] = {
"Lelepa",
3229273,
"poz-vnc",
"Latn",
}
m["lpe"] = {
"Lepki",
4259152,
"paa-lmu",
"Latn",
}
m["lpn"] = {
"Long Phuri Naga",
6673049,
"sit-aao",
}
m["lpo"] = {
"Lipo",
56921,
"tbq-llo",
"Plrd",
}
m["lpx"] = {
"Lopit",
56684,
"sdv-lma",
}
m["lra"] = {
"Rara Bakati'",
3419746,
"day",
}
m["lrc"] = {
"Northern Luri",
19933293,
"ira-swi",
"fa-Arab",
ancestors = "pal",
}
m["lre"] = {
"Laurentian",
1790301,
"iro-nor",
"Latn",
}
m["lrg"] = {
"Laragia",
2591193,
}
m["lri"] = {
"Marachi",
6754565,
"bnt-msl",
}
m["lrk"] = {
"Loarki",
6663513,
}
m["lrl"] = {
"Larestani",
33468,
"ira-swi",
"fa-Arab",
}
m["lrm"] = {
"Marama",
6325931,
"bnt-msl",
ancestors = "luy",
}
m["lrn"] = {
"Lorang",
6678781,
}
m["lro"] = {
"Laro",
35687,
"alv-hei",
}
m["lrr"] = {
"Southern Lorung",
12952742,
"sit-kie",
}
m["lrt"] = {
"Larantuka Malay",
6488691,
"poz-mly",
"Latn",
}
m["lrv"] = {
"Larëvat",
3217892,
"poz-vnc",
"Latn",
}
m["lrz"] = {
"Lemerig",
2028448,
"poz-vnn",
"Latn",
}
m["lsa"] = {
"Lasgerdi",
3218296,
"ira-kms",
"Arab",
}
m["lsd"] = {
"Lishana Deni",
3436461,
"sem-nna",
"Hebr",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lse"] = {
"Lusengo",
6683546,
"bnt-zbi",
}
m["lsh"] = {
"Lish",
6558822,
"sit-khc",
}
m["lsi"] = {
"Lashi",
6493203,
"tbq-brm",
"Latn",
}
m["lsl"] = {
"Latvian Sign Language",
6497414,
"sgn",
}
m["lsm"] = {
"Saamia",
3739441,
"bnt-msl",
}
m["lsn"] = {
"Tibetan Sign Language",
15936110,
"sgn",
}
m["lso"] = {
"Laos Sign Language",
6488022,
"sgn",
}
m["lsp"] = {
"Panamanian Sign Language",
7129968,
"sgn",
}
m["lsr"] = {
"Aruop",
3450566,
"paa-pal",
"Latn",
}
m["lss"] = {
"Lasi",
12953669,
"inc-snd",
"Arab",
ancestors = "sd",
}
m["lst"] = {
"Trinidad and Tobago Sign Language",
7842495,
"sgn",
}
m["lsv"] = {
"Sivia Sign Language",
55558911,
"sgn",
}
m["lsy"] = {
"Mauritian Sign Language",
6793754,
"sgn",
}
m["ltc"] = {
"Middle Chinese",
2016252,
"zhx",
"Hant, Phag, Tang",
translit = {Hant = "zh-translit"},
-- Tang translit in [[Module:scripts/data]]; NOTE: Previously not present, presumably an accidental omission.
sort_key = {Hant = "Hani-sortkey"},
}
m["ltg"] = {
"Latgalian",
36212,
"bat-eas",
"Latn",
}
m["lti"] = {
"Leti",
3236912,
"poz-tim",
"Latn",
}
m["ltn"] = {
"Latundê",
63259736,
"sai-nmk",
"Latn",
}
m["lto"] = {
"Olutsotso",
63259915,
"bnt-msl",
ancestors = "luy",
}
m["lts"] = {
"Lutachoni",
63283459,
"bnt-msl",
}
m["ltu"] = {
"Latu",
6497181,
"poz-cma",
}
m["lua"] = {
"Luba-Kasai",
34173,
"bnt-lub",
"Latn",
}
m["luc"] = {
"Aringa",
56556,
"csu-mma",
"Latn",
}
-- Ludian (Latin script).
-- display_text and strip_diacritics carry the same single substitution: the ASCII apostrophe
-- "'" is paired with "ʹ".
m["lud"] = {
"Ludian",
33918,
"urj-fin",
"Latn",
display_text = {
from = {"'"},
to = {"ʹ"}
},
strip_diacritics = {
from = {"'"},
to = {"ʹ"}
},
-- `from` and `to` are parallel lists: the entry at position i of `from` pairs with the entry
-- at position i of `to` (presumably the consuming module substitutes one for the other; that
-- code is not in this file). Each target is a base letter followed by an entry of `p`,
-- giving these groupings: c < č; s < š < z < ž; y < ü < ä < ö < ʹ.
sort_key = {
from = {
-- NOTE(review): "2 chars" / "1 char" presumably count code points in decomposed form
-- (base letter + combining mark), since "ʹ" is listed as 1 char — confirm.
"č", "š", "ž", "ü", "ä", "ö", -- 2 chars
"z", "ʹ" -- 1 char
},
to = {
"c" .. p[1], "s" .. p[1], "s" .. p[3], "y" .. p[1], "y" .. p[2], "y" .. p[3],
"s" .. p[2], "y" .. p[4],
}
},
}
m["lue"] = {
"Luvale",
33597,
"bnt-clu",
"Latn",
}
m["luf"] = {
"Laua",
6497673,
"paa-mal",
"Latn",
}
m["luh"] = {
"Leizhou Min",
1988433,
"zhx-nan",
"Hants",
generate_forms = "zh-generateforms",
sort_key = "Hani-sortkey",
}
m["lui"] = {
"Luiseño",
56236,
"azc-cup",
"Latn",
strip_diacritics = {remove_diacritics = c.acute .. c.circ},
}
m["luj"] = {
"Luna",
11003832,
"bnt-lbn",
}
m["luk"] = {
"Lunanakha",
56446,
"sit-tib",
"Tibt",
ancestors = "dz",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lul"] = {
"Olu'bo",
6589401,
"csu-mma",
}
m["lum"] = {
"Luimbi",
10963134,
"bnt-clu",
}
m["lun"] = {
"Lunda",
33607,
"bnt-lun",
"Latn",
}
m["luo"] = {
"Luo",
5414796,
"sdv-los",
"Latn",
}
m["lup"] = {
"Lumbu",
35793,
"bnt-sir",
}
-- Lucumí (Latin script), with "yo" recorded as its ancestor. The sort key lists the acute
-- mark from `c` as the diacritic to remove.
m["luq"] = {
	"Lucumí",
	1768321,
	"alv-yor",
	"Latn",
	ancestors = "yo",
	sort_key = {remove_diacritics = c.acute},
}
m["lur"] = {
"Laura",
2984540,
}
m["lus"] = {
"Mizo",
36147,
"tbq-kuk",
"Latn",
}
m["lut"] = {
"Lushootseed",
33658,
"sal",
"Latn",
}
m["luu"] = {
"Lumba-Yakkha",
6703050,
"sit-kie",
ancestors = "ybh",
}
m["luv"] = {
"Luwati",
33402,
"inc-snd",
"Khoj",
}
m["luy"] = {
"Luhya",
35893,
"bnt-msl",
"Latn",
}
m["luz"] = {
"Southern Luri",
12952748,
"ira-swi",
"fa-Arab",
ancestors = "pal",
}
m["lva"] = {
"Maku'a",
35790,
"poz-tim",
}
m["lvi"] = {
"Lawi",
6502657,
"mkh-ban",
"Latn",
}
m["lvk"] = {
"Lavukaleve",
770547,
"qfa-dis", -- Papuan; isolate in Glottolog; in the tentative Central Solomons family by Ross (2005) and Pedrós
-- (2015)
"Latn",
}
m["lvl"] = {
"Lwel",
93936908,
"bnt-bdz",
"Latn",
}
m["lvu"] = {
"Levuka",
6535860,
}
m["lwa"] = {
"Lwalu",
6706953,
"bnt-lbn",
}
m["lwe"] = {
"Lewo Eleng",
6537465,
}
m["lwg"] = {
"Wanga",
nil,
"bnt-msl",
ancestors = "luy",
}
m["lwh"] = {
"White Lachi",
8842956,
"qfa-kra",
}
m["lwl"] = {
"Eastern Lawa",
18644464,
"mkh-pal",
"Thai",
sort_key = "Thai-sortkey",
}
m["lwm"] = {
"Laomian",
19597674,
"tbq-bis",
}
m["lwo"] = {
"Luwo",
56362,
"sdv-lon",
"Latn",
}
m["lws"] = {
"Malawian Sign Language",
47522462,
"sgn",
}
m["lwt"] = {
"Lewotobi",
14916885,
}
m["lwu"] = {
"Lawu",
6505073,
"tbq-lwo",
}
m["lww"] = {
"Lewo",
3237321,
"poz-vnc",
"Latn",
}
m["lya"] = {
"Layakha",
56602,
"sit-tib",
"Tibt",
ancestors = "dz",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["lyg"] = {
"Lyngngam",
12635902,
"aav-pkl",
}
m["lyn"] = {
"Luyana",
3268098,
}
m["lzh"] = {
"Classical Chinese",
37041,
"zhx",
"Hant",
wikimedia_codes = "zh-classical",
translit = "zh-translit",
sort_key = "Hani-sortkey",
}
m["lzl"] = {
"Litzlitz",
6653424,
"poz-vnc",
"Latn",
}
m["lzn"] = {
"Leinong Naga",
5924455,
"sit-kch",
}
m["lzz"] = {
"Laz",
1160372,
"ccs-zan",
"Geor, Latn",
translit = {Geor = "lzz-translit"},
override_translit = true,
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ},
}
-- Pass the assembled table `m` to finalizeData from [[Module:languages]], tagged as
-- "language" data, and return whatever it produces as this module's value.
local m_languages = require("Module:languages")
return m_languages.finalizeData(m, "language")
6k294u12958415w2stzdehtw2q5svjz
Module:languages/data/3/k
828
6262
234820
220408
2026-03-14T20:46:33Z
en>Chuck Entz
0
234820
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy proxy for the `char` function of [[Module:string utilities]]. The module is only
-- required the first time `u` is called, because the data may never need it. That first
-- call rebinds the local `u` to the real function, so later calls bypass this wrapper.
local function u(...)
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
-- Karakalpak, written in Latin, Cyrillic and Perso-Arabic script.
m["kaa"] = {
"Karakalpak",
33541,
"trk-kno",
"Latn, Cyrl, fa-Arab",
dotted_dotless_i = true,
-- Pairs the bracketed set ['’] (it looks like a character-class pattern covering the ASCII
-- and typographic apostrophes) with the modifier letter "ʼ".
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
-- Per-script sort keys. In each sub-table `from` and `to` are parallel lists: the entry at
-- position i of `from` pairs with the entry at position i of `to`.
sort_key = {
Latn = {
-- The i-like letters go through two stages. "í" and "iʼ" are first paired with the bare
-- placeholders p[4] and p[5], and plain "i" with "i" .. p[3]. Further down the list p[4]
-- and p[5] are themselves paired with "i" and "i" .. p[1], and "ı" with "i" .. p[2].
-- The net targets are: í → i, iʼ → i..p[1], ı → i..p[2], i → i..p[3].
-- NOTE(review): this presumably relies on the pairs being applied in list order, so that
-- the plain-"i" rule never sees the "i" of "í"/"iʼ" or the "i" emitted for them — confirm
-- against the module that consumes sort_key.
-- Other groupings visible in `to`: sh, c, ch sort under "z"; x under "h"; q under "k".
from = {
-- Sort the old orthography (using the apostrophe) after the new orthography (using the acute accent).
"í", "iʼ", "i", -- Ensure "i" comes after "í", "iʼ", "ı".
"sh", "ch",
"á", "aʼ", "ǵ", "gʼ", "x", p[4], p[5], "ı", "q", "ń", "nʼ", "ó", "oʼ", "ú", "uʼ", "c"
},
to = {
p[4], p[5], "i" .. p[3],
"z" .. p[1], "z" .. p[3],
"a" .. p[1], "a" .. p[2], "g" .. p[1], "g" .. p[2], "h" .. p[1], "i", "i" .. p[1], "i" .. p[2], "k" .. p[1], "n" .. p[1], "n" .. p[2], "o" .. p[1], "o" .. p[2], "u" .. p[1], "u" .. p[2], "z" .. p[2]
}
},
-- Cyrillic: each extra letter is paired with a base letter followed by an entry of `p`
-- (ү and ў both go under у, as у..p[1] and у..p[2]).
Cyrl = {
from = {"ә", "ғ", "ё", "қ", "ң", "ө", "ү", "ў", "ҳ"},
to = {"а" .. p[1], "г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "у" .. p[1], "у" .. p[2], "х" .. p[1]}
},
},
}
m["kab"] = {
"Kabyle",
35853,
"ber",
"Latn, Arab, Tfng",
}
m["kac"] = {
"Jingpho",
33332,
"sit-jnp",
"Latn, Mymr",
}
m["kad"] = {
"Kadara",
3914011,
"nic-plc",
"Latn",
}
m["kae"] = {
"Ketangalan",
2779411,
"map",
}
m["kaf"] = {
"Katso",
246122,
"tbq-kzh",
}
m["kag"] = {
"Kajaman",
6348863,
"poz",
"Latn",
}
m["kah"] = {
"Fer",
5443742,
"csu-bgr",
"Latn",
}
m["kai"] = {
"Karekare",
3438770,
"cdc-wst",
"Latn",
}
m["kaj"] = {
"Jju",
35401,
"nic-plc",
"Latn",
}
m["kak"] = {
"Kayapa Kallahan",
3192220,
"phi",
"Latn",
}
m["kam"] = {
"Kamba",
2574767,
"bnt-kka",
"Latn",
}
m["kao"] = {
"Kassonke",
36905,
"dmn-wmn",
"Latn",
}
m["kap"] = {
"Bezhta",
33054,
"cau-ets",
"Cyrl",
translit = "cau-nec-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kaq"] = {
"Capanahua",
2937196,
"sai-pan",
"Latn",
}
m["kaw"] = {
"Old Javanese",
49341,
"poz",
"Latn, Java, Kawi",
translit = "jv-translit", --same as jv
}
m["kax"] = {
"Kao",
3192799,
"paa-gto",
"Latn",
}
m["kay"] = {
"Kamayurá",
3192336,
"tup-gua",
"Latn",
}
m["kba"] = {
"Kalarko",
5517764,
"aus-pam",
"Latn",
}
m["kbb"] = {
"Kaxuyana",
12953626,
"sai-prk",
"Latn",
}
m["kbc"] = {
"Kadiwéu",
18168288,
"sai-guc",
"Latn",
}
-- East Circassian, written in Cyrillic, Latin and Arabic script.
m["kbd"] = {
"East Circassian",
33522,
"cau-cir",
"Cyrl, Latn, Arab",
-- Transliteration module name per script; no entry is given for Latn.
translit = {
Cyrl = "cau-cir-translit",
Arab = "ar-translit",
},
override_translit = true,
-- Display and diacritic-stripping settings are taken from the shared table `s`.
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
-- Cyrillic sort key. `from` and `to` are parallel lists with the same row layout: the
-- entry at position i of `from` pairs with the entry at position i of `to`. Each target is
-- the first letter of the sequence followed by an entry of `p`, except "ё" → "е" .. p[1]
-- and "э" → "а" .. p[1].
-- Rows run from the longest sequences to the shortest.
-- NOTE(review): presumably longer sequences must be listed first so they are matched before
-- their shorter prefixes (e.g. "кхъу" before "кхъ" before "къ") — confirm against the
-- module that consumes sort_key.
sort_key = {
Cyrl = {
from = {
"кхъу", "къӏу", -- 4 chars
"гъу", "джу", "дзу", "жъу", "къу", "кхъ", "къӏ", "кӏу", "кӏь", "лъу", "лӏу", "пӏу", "сӏу", "тӏу", "фӏу", "хъу", "цӏу", "чъу", "чӏу", "шъу", "шӏу", "щӏу", -- 3 chars
"гу", "гъ", "гь", "дж", "дз", "ё", "жъ", "жь", "ку", "къ", "кь", "кӏ", "лъ", "ль", "лӏ", "пӏ", "сӏ", "тӏ", "фӏ", "ху", "хъ", "хь", "цу", "цӏ", "чу", "чъ", "чӏ", "шъ", "шӏ", "щӏ", "ӏу", "ӏь", -- 2 chars
"э" -- 1 char
},
to = {
"к" .. p[5], "к" .. p[7],
"г" .. p[3], "д" .. p[2], "д" .. p[4], "ж" .. p[2], "к" .. p[3], "к" .. p[4], "к" .. p[6], "к" .. p[10], "к" .. p[11], "л" .. p[2], "л" .. p[5], "п" .. p[2], "с" .. p[2], "т" .. p[2], "ф" .. p[2], "х" .. p[3], "ц" .. p[3], "ч" .. p[3], "ч" .. p[5], "ш" .. p[2], "ш" .. p[4], "щ" .. p[2],
"г" .. p[1], "г" .. p[2], "г" .. p[4], "д" .. p[1], "д" .. p[3], "е" .. p[1], "ж" .. p[1], "ж" .. p[3], "к" .. p[1], "к" .. p[2], "к" .. p[8], "к" .. p[9], "л" .. p[1], "л" .. p[3], "л" .. p[4], "п" .. p[1], "с" .. p[1], "т" .. p[1], "ф" .. p[1], "х" .. p[1], "х" .. p[2], "х" .. p[4], "ц" .. p[1], "ц" .. p[2], "ч" .. p[1], "ч" .. p[2], "ч" .. p[4], "ш" .. p[1], "ш" .. p[3], "щ" .. p[1], "ӏ" .. p[1], "ӏ" .. p[2],
"а" .. p[1]
}
},
},
}
m["kbe"] = {
"Kanju",
10543322,
"aus-pam",
"Latn",
}
m["kbh"] = {
"Camsá",
2842667,
"qfa-iso",
"Latn",
}
m["kbi"] = {
"Kaptiau",
6367294,
"poz-oce",
"Latn",
}
m["kbj"] = {
"Kari",
6370438,
"bnt-boa",
"Latn",
}
m["kbk"] = {
"Grass Koiari",
12952642,
"ngf-koi",
"Latn",
}
m["kbm"] = {
"Iwal",
3156391,
"poz-ocw",
"Latn",
}
m["kbn"] = {
"Kare (Central Africa)",
35554,
"alv-mbm",
"Latn",
}
m["kbo"] = {
"Keliko",
11275553,
"csu-mma",
}
m["kbp"] = {
"Kabiye",
35475,
"nic-gne",
"Latn",
}
m["kbq"] = {
"Kamano",
11732272,
"ngf-kya",
"Latn",
}
m["kbr"] = {
"Kafa",
35481,
"omv-gon",
"Ethi, Latn",
}
m["kbs"] = {
"Kande",
35556,
"bnt-tso",
"Latn",
}
m["kbt"] = {
"Gabadi",
3291159,
"poz-ocw",
"Latn",
}
m["kbu"] = {
"Kabutra",
10966761,
"raj",
}
m["kbv"] = {
"Kamberataro",
5261289,
"paa-sng",
"Latn",
}
m["kbw"] = {
"Kaiep",
6347632,
"poz-ocw",
"Latn",
}
m["kbx"] = {
"Ap Ma",
56298,
"paa-eke",
"Latn",
}
m["kbz"] = {
"Duhwa",
56295,
"cdc-wst",
"Latn",
}
m["kcb"] = {
"Kawacha",
11732302,
"ngf-woj",
"Latn",
}
m["kcc"] = {
"Lubila",
3914381,
"nic-uce",
"Latn",
}
m["kcd"] = {
"Ngkâlmpw Kanum",
12952566,
"paa-ngk",
"Latn",
}
m["kce"] = {
"Kaivi",
6348685,
"nic-kau",
}
m["kcf"] = {
"Ukaan",
36651,
"nic-bco",
}
m["kcg"] = {
"Tyap",
3912765,
"nic-plc",
"Latn",
}
m["kch"] = {
"Vono",
3913920,
"nic-kau",
}
m["kci"] = {
"Kamantan",
3914019,
"nic-plc",
}
m["kcj"] = {
"Kobiana",
35609,
"alv-nyn",
}
m["kck"] = {
"Kalanga",
33672,
"bnt-sho",
"Latn",
}
m["kcl"] = {
"Kala",
6349982,
"poz-ocw",
"Latn",
}
m["kcm"] = {
"Tar Gula",
277963,
"csu-bba",
}
m["kcn"] = {
"Nubi",
36388,
"crp",
"Latn, Arab",
ancestors = "apd",
strip_diacritics = {remove_diacritics = c.acute},
}
m["kco"] = {
"Kinalakna",
11732320,
"ngf-dal",
"Latn",
}
m["kcp"] = {
"Kanga",
6362384,
"qfa-kad",
"Latn",
}
m["kcq"] = {
"Kamo",
3914879,
"alv-wjk",
}
m["kcr"] = {
"Katla",
35688,
"nic-ktl",
}
m["kcs"] = {
"Koenoem",
3438755,
"cdc-wst",
}
m["kct"] = {
"Kaian",
6347538,
"paa-ott",
"Latn",
}
m["kcu"] = {
"Kikami",
3915212,
"bnt-ruv",
"Latn",
}
m["kcv"] = {
"Kete",
3195598,
"bnt-lub",
}
m["kcw"] = {
"Kabwari",
6344539,
"bnt-glb",
}
m["kcx"] = {
"Kachama-Ganjule",
12634070,
"omv-eom",
}
m["kcy"] = {
"Korandje",
33427,
"son",
}
m["kcz"] = {
"Konongo",
11732345,
"bnt-tkm",
"Latn",
}
m["kda"] = {
"Worimi",
3914062,
"aus-pam",
"Latn",
}
m["kdc"] = {
"Kutu",
6448634,
"bnt-ruv",
}
m["kdd"] = {
"Yankunytjatjara",
34207,
"aus-pam",
"Latn",
}
m["kde"] = {
"Makonde",
35172,
"bnt-rvm",
"Latn",
}
m["kdf"] = {
"Mamusi",
6746036,
"poz-ocw",
"Latn",
}
m["kdg"] = {
"Seba",
7442316,
"bnt-sbi",
"Latn",
}
m["kdh"] = {
"Tem",
36531,
"nic-gne",
"Latn",
}
m["kdi"] = {
"Kumam",
6443410,
"sdv-los",
}
m["kdj"] = {
"Karamojong",
56326,
"sdv-ttu",
"Latn",
}
m["kdk"] = {
"Numèè",
3346774,
"poz-cln",
"Latn",
}
m["kdl"] = {
"Tsikimba",
3914404,
"nic-kam",
}
m["kdm"] = {
"Kagoma",
3914420,
"nic-plc",
}
m["kdn"] = {
"Kunda",
4121130,
"bnt-sna",
"Latn",
}
m["kdp"] = {
"Kaningdon-Nindem",
3914956,
"nic-nin",
}
m["kdq"] = {
"Koch",
56431,
"tbq-bdg",
}
m["kdr"] = {
"Karaim",
33725,
"trk-kcu",
"Cyrl, Latn, Hebr",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kdt"] = {
"Kuy",
56310,
"mkh-kat",
"Thai, Khmr, Laoo",
}
m["kdu"] = {
"Kadaru",
35441,
"nub-hil",
"Latn",
}
m["kdv"] = {
"Kado",
7402721,
"sit-luu",
}
m["kdw"] = {
"Koneraw",
11732341,
"ngf-mom",
"Latn",
}
m["kdx"] = {
"Kam",
36753,
"alv-wjk",
}
m["kdy"] = {
"Keder",
6383641,
"paa-tor",
"Latn",
}
m["kdz"] = {
"Kwaja",
11128866,
"nic-nka",
"Latn",
}
m["kea"] = {
"Kabuverdianu",
35963,
"crp",
"Latn",
ancestors = "pt",
}
m["keb"] = {
"Kélé",
35559,
"bnt-kel",
}
m["kec"] = {
"Keiga",
3409311,
"qfa-kad",
"Latn",
}
m["ked"] = {
"Kerewe",
6393846,
"bnt-haj",
}
m["kee"] = {
"Eastern Keres",
15649021,
"nai-ker",
"Latn",
}
m["kef"] = {
"Kpessi",
35748,
"alv-gbe",
}
m["keg"] = {
"Tese",
16887296,
"sdv",
}
m["keh"] = {
"Keak",
6382110,
"paa-nnd",
"Latn",
}
m["kei"] = {
"Kei",
2410352,
"poz-cet",
"Latn",
}
m["kej"] = {
"Kadar",
6345179,
"dra-mal",
}
m["kek"] = {
"Q'eqchi",
35536,
"myn",
"Latn",
}
m["kel"] = {
"Kela-Yela",
6385426,
"bnt-mon",
"Latn",
}
m["kem"] = {
"Kemak",
35549,
"poz-tim",
"Latn",
}
m["ken"] = {
"Kenyang",
35650,
"nic-mam",
"Latn",
}
m["keo"] = {
"Kakwa",
3033547,
"sdv-bri",
}
m["kep"] = {
"Kaikadi",
6347757,
"dra-tam",
}
m["keq"] = {
"Kamar",
14916877,
"inc-hal",
}
m["ker"] = {
"Kera",
56251,
"cdc-est",
"Latn",
}
m["kes"] = {
"Kugbo",
3813394,
"nic-cde",
"Latn",
}
-- Ket (Cyrillic script).
m["ket"] = {
"Ket",
33485,
"qfa-yke",
"Cyrl",
-- Pairs the bracketed set ['’] (it looks like a character-class pattern covering the ASCII
-- and typographic apostrophes) with the modifier letter "ʼ".
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
-- `from` and `to` are parallel lists: each extra letter is paired with a base Cyrillic
-- letter followed by p[1]. Note that "ә" is paired with "ъ" .. p[1] and the apostrophe
-- letter "ʼ" with "ь" .. p[1].
sort_key = {
from = {"ӷ", "ё", "ӄ", "ӈ", "ө", "ә", "ʼ"},
to = {"г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "ъ" .. p[1], "ь" .. p[1]}
},
}
m["keu"] = {
"Akebu",
35026,
"alv-ktg",
"Latn",
}
m["kev"] = {
"Kanikkaran",
6363201,
"dra-mal",
"Taml, Mlym",
-- Mlym translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["kew"] = {
"Kewa",
12952619,
"ngf-ank",
"Latn",
}
m["kex"] = {
"Kukna",
5031131,
"inc-bhi",
wikipedia_article = "Dhodia–Kukna language",
}
m["key"] = {
"Kupia",
6445354,
"inc-eas",
}
m["kez"] = {
"Kukele",
3915391,
"nic-ucn",
"Latn",
}
m["kfa"] = {
"Kodava",
33531,
"dra-kod",
"Knda, Mlym",
-- Knda translit in [[Module:scripts/data]]
-- Mlym translit in [[Module:scripts/data]]
}
m["kfb"] = {
"Kolami",
33479,
"dra-knk",
"Deva, Telu",
translit = {
Telu = "te-translit",
},
}
m["kfc"] = {
"Konda-Dora",
35679,
"dra-kki",
"Orya, Telu",
translit = {
Orya = "gon-Orya-translit",
Telu = "te-translit",
},
}
m["kfd"] = {
"Korra Koraga",
12952655,
"dra-kor",
"Knda",
-- Knda translit in [[Module:scripts/data]]
}
m["kfe"] = {
"Kota (India)",
33483,
"dra-tkt",
"Taml",
translit = "ta-translit",
}
m["kff"] = {
"Koya",
33471,
"dra-gon",
"Telu, Orya, Deva, Latn",
}
m["kfg"] = {
"Kudiya",
12952667,
"dra-tlk",
}
m["kfh"] = {
"Kurichiya",
12952676,
"dra-mal",
"Mlym",
-- Mlym translit in [[Module:scripts/data]]
}
m["kfi"] = {
"Kannada Kurumba",
56589,
"dra-sdo",
}
m["kfj"] = {
"Kemiehua",
27144776,
"mkh-pal",
}
m["kfk"] = {
"Kinnauri",
2383208,
"sit-kin",
"Takr, Deva, Latn",
}
m["kfl"] = {
"Kung",
6444510,
"nic-rnc",
"Latn",
}
m["kfn"] = {
"Kuk",
6442398,
"nic-rnc",
"Latn",
}
m["kfo"] = {
"Koro (West Africa)",
11160588,
"dmn-mnk",
"Latn, Nkoo",
}
m["kfp"] = {
"Korwa",
6432786,
"mun",
}
m["kfq"] = {
"Korku",
33715,
"mun",
"Deva",
}
-- Kachchi: four scripts listed, with per-script transliteration and one shared diacritic-stripping rule set.
m["kfr"] = {
"Kachchi",
56487,
"inc-snd",
"Gujr, sd-Arab, Sind, Khoj",
-- Transliteration module per script; Khoj is listed as a script above but has no entry here.
translit = {
Gujr = "gu-translit",
Sind = "Sind-translit",
["sd-Arab"] = "sd-Arab-translit",
},
-- Not keyed by script, unlike `translit` above.
strip_diacritics = {
-- Characters to delete: the concatenation of the listed fields of the module-level table `c`.
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
-- Replace the character built by u(0x0671) with the one built by u(0x0627)
-- (presumably code points U+0671 and U+0627 — confirm against the definition of `u`).
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["kfs"] = {
"Bilaspuri",
12953397,
"him",
"Deva, Takr",
translit = "hi-translit",
}
m["kft"] = {
"Kanjari",
12953610,
"inc-pan",
ancestors = "pa",
}
m["kfu"] = {
"Katkari",
6377671,
"inc-sou",
}
m["kfv"] = {
"Kurmukar",
6446193,
"inc-eas",
}
m["kfw"] = {
"Kharam Naga",
12952906,
"tbq-kuk",
}
m["kfx"] = {
"Kullu Pahari",
6443148,
"him",
"Deva",
translit = "hi-translit",
}
m["kfy"] = {
"Kumaoni",
33529,
"inc-pah",
"Deva, Shrd, Takr",
-- Shrd translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["kfz"] = {
"Koromfé",
35701,
"nic-gur",
"Latn",
}
m["kga"] = {
"Koyaga",
11155632,
"dmn-mnk",
}
m["kgb"] = {
"Kawe",
12952750,
"poz-hce",
"Latn",
}
m["kgd"] = {
"Kataang",
12953622,
"mkh",
}
m["kge"] = {
"Komering",
49224,
"poz-lgx",
"Latn, Arab",
}
m["kgf"] = {
"Kube",
11732359,
"ngf-kto",
"Latn",
}
m["kgg"] = {
"Kusunda",
33630,
"qfa-iso", -- central Nepal
"Latn",
}
m["kgi"] = {
"Selangor Sign Language",
33731,
"sgn",
}
m["kgj"] = {
"Gamale Kham",
22236996,
"sit-kha",
"Deva",
}
m["kgk"] = {
"Kaiwá",
3111883,
"gn",
"Latn",
}
m["kgl"] = {
"Kunggari",
10550184,
"aus-pam",
"Latn",
}
m["kgn"] = {
"Karingani",
6371041,
"xme-ttc",
"fa-Arab, Latn",
ancestors = "xme-ttc-nor",
}
m["kgo"] = {
"Krongo",
6438927,
"qfa-kad",
"Latn",
}
m["kgp"] = {
"Kaingang",
2665734,
"sai-sje",
"Latn",
}
m["kgq"] = {
"Kamoro",
6359001,
"ngf-ask",
"Latn",
}
m["kgr"] = {
"Abun",
56657,
"qfa-iso", -- Papuan; isolate in Ethnologue, Glottolog and Palmer (2018); grouped with West Papuan by Ross (2005)
"Latn",
}
m["kgs"] = {
"Kumbainggar",
3915412,
"aus-pam",
"Latn",
}
m["kgt"] = {
"Somyev",
3913354,
"nic-mmb",
"Latn",
}
m["kgu"] = {
"Kobol",
11732325,
"ngf-omo",
"Latn",
}
m["kgv"] = {
"Karas",
6368621,
"qfa-dis", -- Divergent Papuan language; grouped with Mbaham-Iha by Glottolog to form a (mainland) West Bomberai
-- family, but with Mbaham-Iha and Timor-Alor-Pantar by Wikipedia (following Usher and Schapper 2022)
-- into a (Greater) West Bomberai family.
"Latn",
}
m["kgw"] = {
"Karon Dori",
56817,
"paa-may",
"Latn",
}
m["kgx"] = {
"Kamaru",
12953604,
"poz-wot",
"Latn",
}
m["kgy"] = {
"Kyerung",
12952691,
"sit-kyk",
}
m["kha"] = {
"Khasi",
33584,
"aav-pkl",
"Latn, as-Beng",
}
m["khb"] = {
"Lü",
36948,
"tai-swe",
"Talu, Lana",
translit = {Talu = "Talu-translit"},
strip_diacritics = {remove_diacritics = c.ZWNJ},
sort_key = {
Talu = "Talu-sortkey",
Lana = "Lana-sortkey",
},
}
m["khc"] = {
"North Tukang Besi",
18611555,
"poz",
}
m["khd"] = {
"Bädi Kanum",
20888004,
"paa-ngk",
"Latn",
}
m["khe"] = {
"Korowai",
6432598,
"ngf-bda",
"Latn",
}
m["khf"] = {
"Khuen",
27144893,
"mkh",
}
m["khh"] = {
"Kehu",
10994953,
}
m["khj"] = {
"Kuturmi",
3914490,
"nic-plc",
"Latn",
}
m["khl"] = {
"Lusi",
3267788,
"poz-ocw",
"Latn",
}
m["khn"] = {
"Khandeshi",
33726,
"inc-sou",
}
m["kho"] = {
"Khotanese",
6583551,
"xsc-sak",
"Brah, Khar",
-- Brah translit in [[Module:scripts/data]]
}
m["khp"] = {
"Kapauri",
3502575,
"qfa-dis", -- isolate per Glottolog, possibly Greater Kwerba per Wikipedia in Kapauri-Sause family
"Latn",
}
m["khq"] = {
"Koyra Chiini",
33600,
"son",
"Latn, Arab",
}
m["khr"] = {
"Kharia",
3915562,
"mun",
}
m["khs"] = {
"Kasua",
6374863,
"ngf-bos",
"Latn",
}
m["kht"] = {
"Khamti",
3915502,
"tai-swe",
"Mymr",
display_text = s["kht-displaytext"],
strip_diacritics = s["kht-stripdiacritics"],
}
m["khu"] = {
"Nkhumbi",
11019169,
"bnt-swb",
}
m["khv"] = {
"Khvarshi",
56425,
"cau-wts",
"Cyrl",
translit = "khv-translit",
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
-- Khowar: single script ("Arab") with letter normalisation plus removal of vowel marks.
m["khw"] = {
"Khowar",
938216,
"inc-chi",
"Arab",
strip_diacritics = {
-- Pairwise replacements (`from[i]` becomes `to[i]`): "هٔ" and "ۂ" (U+06C2) both become "ہ";
-- hamzatu l-waṣli ("ٱ") becomes a regular alif ("ا").
-- NOTE(review): the replacement target in `to` is "ہ", which is not the same character as "ه" (U+0647);
-- confirm the exact code points intended for the first source string and for the target.
from = {"هٔ", "ۂ", "ٱ"},
to = {"ہ", "ہ", "ا"},
-- Characters to delete: the concatenation of the listed fields of the module-level table `c`.
remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef
},
}
m["khx"] = {
"Kanu",
12952571,
"bnt-lgb",
}
m["khy"] = {
"Ekele",
6385549,
"bnt-ske",
"Latn",
}
m["khz"] = {
"Keapara",
12952603,
"poz-ocw",
"Latn",
}
m["kia"] = {
"Kim",
35685,
"alv-kim",
}
m["kib"] = {
"Koalib",
35859,
"alv-hei",
}
m["kic"] = {
"Kickapoo",
20162127,
"alg-sfk",
"Latn",
}
m["kid"] = {
"Koshin",
35632,
"nic-beb",
"Latn",
}
m["kie"] = {
"Kibet",
56893,
}
m["kif"] = {
"Eastern Parbate Kham",
12953022,
"sit-kha",
"Deva",
}
m["kig"] = {
"Kimaama",
11732321,
"paa-kol",
"Latn",
}
m["kih"] = {
"Kilmeri",
6408020,
"paa-bew",
"Latn",
}
m["kii"] = {
"Kitsai",
56627,
"cdd",
"Latn",
}
m["kij"] = {
"Kilivila",
3196601,
"poz-ocw",
"Latn",
}
m["kil"] = {
"Kariya",
3438708,
"cdc-wst",
}
m["kim"] = {
"Tofa",
36848,
"trk-ssb",
"Cyrl",
}
m["kio"] = {
"Kiowa",
56631,
"nai-kta",
"Latn",
}
m["kip"] = {
"Sheshi Kham",
12952622,
"sit-kha",
"Deva",
}
m["kiq"] = {
"Kosadle",
6432994,
"paa-kko",
"Latn",
}
m["kis"] = {
"Kis",
6416362,
"poz-ocw",
"Latn",
}
m["kit"] = {
"Agob",
3332143,
"paa-pah",
"Latn",
}
m["kiv"] = {
"Kimbu",
10997740,
"bnt-tkm",
}
m["kiw"] = {
"Northeast Kiwai",
11732324,
"paa-kiw",
"Latn",
}
m["kix"] = {
"Khiamniungan Naga",
6401546,
"sit-kch",
"Latn",
}
m["kiy"] = {
"Kirikiri",
6415159,
"paa-wlp",
"Latn",
}
m["kiz"] = {
"Kisi",
3912772,
"bnt-bki",
}
m["kja"] = {
"Mlap",
6885683,
"paa-nim",
"Latn",
}
m["kjb"] = {
"Q'anjob'al",
35551,
"myn",
"Latn",
}
m["kjc"] = {
"Coastal Konjo",
3198689,
"poz",
"Latn",
}
m["kjd"] = {
"Southern Kiwai",
11732322,
"paa-kiw",
"Latn",
}
m["kje"] = {
"Kisar",
3197441,
"poz",
"Latn",
}
m["kjg"] = {
"Khmu",
33335,
"mkh",
"Laoo",
ancestors = "mkh-khm-pro",
sort_key = "Laoo-sortkey",
}
m["kjh"] = {
"Khakas",
33575,
"trk-ssb",
"Cyrl",
translit = "kjh-translit",
override_translit = true,
}
m["kji"] = {
"Zabana",
379130,
"poz-ocw",
"Latn",
}
m["kjj"] = {
"Khinalug",
35278,
"cau-nec",
"Cyrl, Latn",
translit = "kjj-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
}
m["kjk"] = {
"Highland Konjo",
3198688,
"poz",
}
m["kjl"] = {
"Western Parbate Kham",
22237017,
"sit-kha",
"Deva",
}
m["kjm"] = {
"Kháng",
6403501,
"mkh-pal",
}
m["kjn"] = {
"Kunjen",
3200468,
"aus-pmn",
"Latn",
}
m["kjo"] = {
"Harijan Kinnauri",
5657463,
"him",
"Takr, Deva",
}
m["kjp"] = {
"Eastern Pwo",
5330390,
"kar",
"Mymr, Leke, Thai",
translit = "kjp-translit",
override_translit = true,
}
m["kjq"] = {
"Western Keres",
12645568,
"nai-ker",
"Latn",
}
m["kjr"] = {
"Kurudu",
12952678,
"poz-hce",
"Latn",
}
m["kjs"] = {
"East Kewa",
20050949,
"ngf-ank",
"Latn",
}
m["kjt"] = {
"Phrae Pwo",
7187991,
"kar",
"Thai",
}
m["kju"] = {
"Kashaya",
3193689,
"nai-pom",
"Latn",
}
m["kjx"] = {
"Ramopa",
56830,
"paa-nbo",
"Latn",
}
m["kjy"] = {
"Erave",
12952416,
"ngf-ank",
"Latn",
}
m["kjz"] = {
"Bumthangkha",
2786408,
"sit-ebo",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kka"] = {
"Kakanda",
3915342,
"alv-ngb",
}
m["kkb"] = {
"Kwerisa",
56881,
"paa-clp",
"Latn",
}
m["kkc"] = {
"Odoodee",
12952987,
"ngf-est",
"Latn",
}
m["kkd"] = {
"Kinuku",
6414422,
"nic-kau",
}
m["kke"] = {
"Kakabe",
3913966,
"dmn-mok",
"Latn",
}
m["kkf"] = {
"Kalaktang Monpa",
63257089,
"sit-tsk",
"Tibt, Latn, Deva",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kkg"] = {
"Mabaka Valley Kalinga",
18753304,
"phi",
}
m["kkh"] = {
"Khün",
3545044,
"tai-swe",
"Lana, Thai",
sort_key = {
Lana = "Lana-sortkey",
Thai = "Thai-sortkey"
},
}
m["kki"] = {
"Kagulu",
12952537,
"bnt-ruv",
"Latn",
}
m["kkj"] = {
"Kako",
35755,
"bnt-kak",
}
m["kkk"] = {
"Kokota",
3198399,
"poz-ocw",
"Latn",
}
m["kkl"] = {
"Kosarek Yale",
6432995,
"ngf-mek",
"Latn",
}
m["kkm"] = {
"Kiong",
6414512,
"nic-ucr",
"Latn",
}
m["kkn"] = {
"Kon Keu",
6428686,
"mkh-pal",
}
m["kko"] = {
"Karko",
35529,
"nub-hil",
}
m["kkp"] = {
"Koko-Bera",
6426699,
"aus-pmn",
"Latn",
}
m["kkq"] = {
"Kaiku",
6347840,
"bnt-kbi",
"Latn",
}
m["kkr"] = {
"Kir-Balar",
3440527,
"cdc-wst",
"Latn",
}
m["kks"] = {
"Kirfi",
56242,
"cdc-wst",
"Latn",
}
m["kkt"] = {
"Koi",
6426194,
"sit-kiw",
}
m["kku"] = {
"Tumi",
3913934,
"nic-kau",
}
m["kkv"] = {
"Kangean",
2071325,
"poz-msa",
"Latn",
}
m["kkw"] = {
"Teke-Kukuya",
36560,
"bnt-tek",
}
m["kkx"] = {
"Kohin",
6425997,
"poz-brw",
}
m["kky"] = {
"Guugu Yimidhirr",
56543,
"aus-pam",
"Latn",
}
m["kkz"] = {
"Kaska",
20823,
"ath-nor",
"Latn",
}
m["kla"] = {
"Klamath-Modoc",
2669248,
"nai-plp",
"Latn",
}
m["klb"] = {
"Kiliwa",
3182593,
"nai-yuc",
"Latn",
}
m["klc"] = {
"Kolbila",
6427122,
"alv-lek",
}
m["kld"] = {
"Gamilaraay",
3111818,
"aus-cww",
"Latn",
}
m["kle"] = {
"Kulung",
6443304,
"sit-kic",
}
m["klf"] = {
"Kendeje",
56895,
}
m["klg"] = {
"Tagakaulu Kalagan",
18756514,
"phi",
"Latn",
}
m["klh"] = {
"Weliki",
7981017,
"ngf-uru",
"Latn",
}
m["kli"] = {
"Kalumpang",
13561407,
"poz",
}
-- Khalaj: two scripts listed ("fa-Arab, Latn"), with `ancestors` set to "klj-arg".
m["klj"] = {
"Khalaj",
33455,
"trk",
"fa-Arab, Latn",
ancestors = "klj-arg",
-- Not keyed by script. The characters to delete are the concatenation of the listed fields of the
-- module-level table `c`.
strip_diacritics = {
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun,
},
}
m["klk"] = {
"Kono (Nigeria)",
6429589,
"nic-kau",
"Latn",
}
m["kll"] = {
"Kagan Kalagan",
18748913,
"phi",
}
m["klm"] = {
"Kolom",
6844970,
"ngf-rai",
"Latn",
}
m["kln"] = {
"Kalenjin",
637228,
"sdv-nma",
"Latn",
}
m["klo"] = {
"Kapya",
6367410,
"nic-ykb",
}
m["klp"] = {
"Kamasa",
6356107,
"ngf-woj",
"Latn",
}
m["klq"] = {
"Rumu",
7379420,
"paa-tki",
"Latn",
}
m["klr"] = {
"Khaling",
56381,
"sit-kiw",
"Deva",
}
m["kls"] = {
"Kalasha",
33416,
"inc-chi",
"Latn, ks-Arab",
}
m["klt"] = {
"Nukna",
7068874,
"ngf-uru",
"Latn",
}
m["klu"] = {
"Klao",
3914866,
"kro-wkr",
}
m["klv"] = {
"Maskelynes",
3297282,
"poz-vnc",
"Latn",
}
m["klw"] = {
"Lindu",
18390055,
"poz-kal",
"Latn",
}
m["klx"] = {
"Koluwawa",
6427954,
"poz-ocw",
"Latn",
}
m["kly"] = {
"Kalao",
6350643,
"poz-wot",
"Latn",
}
m["klz"] = {
"Kabola",
11732258,
"paa-alp",
"Latn",
}
m["kma"] = {
"Konni",
35680,
"nic-buk",
}
m["kmb"] = {
"Kimbundu",
35891,
"bnt-kmb",
"Latn",
}
m["kmc"] = {
"Southern Kam",
35379,
"qfa-kms",
"Latn",
}
m["kmd"] = {
"Madukayang Kalinga",
18753305,
"phi",
}
m["kme"] = {
"Bakole",
35068,
"bnt-kpw",
"Latn",
}
m["kmf"] = {
"Kare (New Guinea)",
11732286,
"ngf-mab",
"Latn",
}
m["kmg"] = {
"Kâte",
3201059,
"ngf-kma",
"Latn",
}
m["kmh"] = {
"Kalam",
12952550,
"ngf-kak",
"Latn",
}
m["kmi"] = {
"Kami",
3915372,
"alv-ngb",
"Latn",
}
m["kmj"] = {
"Kumarbhag Paharia",
3130374,
"dra-mlo",
"Beng, Deva",
}
m["kmk"] = {
"Limos Kalinga",
18753303,
"phi",
"Latn",
}
m["kml"] = {
"Tanudan Kalinga",
18753307,
"phi",
"Latn",
}
m["kmm"] = {
"Kom (India)",
12952647,
"tbq-kuk",
}
m["kmn"] = {
"Awtuw",
3504217,
"paa-sep",
"Latn",
}
m["kmo"] = {
"Kwoma",
11732376,
"paa-sep",
"Latn",
}
m["kmp"] = {
"Gimme",
11152236,
"alv-dur",
}
m["kmq"] = {
"Kwama",
2591184,
"ssa-kom",
}
-- Northern Kurdish: five scripts listed; transliteration and diacritic stripping are configured per script.
m["kmr"] = {
"Northern Kurdish",
36163,
"ku",
"Latn, Cyrl, Armn, ku-Arab, Yezi",
-- Only Cyrl and ku-Arab are configured here; ku-Arab uses the module named "ckb-translit".
translit = {
Cyrl = "kmr-translit",
-- Armn translit in [[Module:scripts/data]]
["ku-Arab"] = "ckb-translit",
},
-- Only the Latn script has stripping rules in this entry.
strip_diacritics = {
Latn = {
-- Both apostrophe forms (' and ’) are deleted.
remove_diacritics = "'’",
-- Pairwise replacements: r̄ -> rr, R̄ -> Rr, ẍ -> x, Ẍ -> X.
from = {"r̄", "R̄", "ẍ", "Ẍ"},
to = {"rr", "Rr", "x", "X"}
},
},
-- Same string as the family code given in the third positional field ("ku").
wikimedia_codes = "ku",
}
m["kms"] = {
"Kamasau",
6356117,
"paa-mar",
"Latn",
}
m["kmt"] = {
"Kemtuik",
6387179,
"paa-nim",
"Latn",
}
m["kmu"] = {
"Kanite",
12952567,
"ngf-kya",
"Latn",
}
m["kmv"] = {
"Karipúna Creole French",
2523999,
"crp",
"Latn",
ancestors = "fr",
sort_key = s["roa-oil-sortkey"],
}
m["kmw"] = {
"Kumu",
6428450,
"bnt-kbi",
"Latn",
}
m["kmx"] = {
"Waboda",
7958705,
"paa-kiw",
"Latn",
}
m["kmy"] = {
"Koma",
35634,
"alv-dur",
}
m["kmz"] = {
"Khorasani Turkish",
35373,
"trk-ogz",
"Arab",
ancestors = "trk-oat",
}
m["kna"] = {
"Kanakuru",
56811,
"cdc-wst",
"Latn",
}
m["knb"] = {
"Lubuagan Kalinga",
12953602,
"phi",
"Latn",
}
m["knd"] = {
"Konda",
11732340,
"ngf-sbh",
"Latn",
}
-- Kankanaey: Latin script only; all three option tables below are keyed by the script code "Latn".
m["kne"] = {
"Kankanaey",
18753329,
"phi",
"Latn",
-- Characters to delete: the concatenation of c.grave, c.acute, c.circ and c.diaer.
strip_diacritics = {
Latn = {
remove_diacritics = c.grave .. c.acute .. c.circ .. c.diaer,
}
},
-- Sort keys are delegated to the module named "tl-sortkey"
-- (presumably the one used for Tagalog — confirm).
sort_key = {
Latn = "tl-sortkey",
},
-- 19 upper/lower-case letter pairs followed by c.punc; the letters C, F, J, Q, V, X and Z are not included.
standard_chars = {
Latn = "AaBbKkDdEeGgHhIiLlMmNnOoPpRrSsTtUuWwYy" .. c.punc,
},
}
m["knf"] = {
"Mankanya",
35789,
"alv-pap",
"Latn",
}
m["kni"] = {
"Kanufi",
3913297,
"nic-nin",
"Latn",
}
m["knj"] = {
"Akatek",
34923,
"myn",
"Latn",
}
m["knk"] = {
"Kuranko",
3198896,
"dmn-mok",
"Latn",
}
m["knl"] = {
"Keninjal",
6389309,
"poz-mly",
"Latn",
}
m["knm"] = { -- two unrelated lects have this name; this is the Katukinian one
"Kanamari",
3438373,
"sai-ktk",
"Latn",
}
m["kno"] = {
"Kono (Sierra Leone)",
35675,
"dmn-vak",
"Latn",
}
m["knp"] = {
"Kwanja",
35641,
"nic-mmb",
"Latn",
}
m["knq"] = {
"Kintaq",
6414335,
"mkh-asl",
}
m["knr"] = {
"Kaningra",
6363253,
"paa-sep",
"Latn",
}
m["kns"] = {
"Kensiu",
6391529,
"mkh-asl",
}
m["knt"] = {
"Katukina",
3194265,
"sai-pan",
"Latn",
}
m["knu"] = { -- a dialect of 'kpe'
"Kono (Guinea)",
3198703,
"dmn-msw",
"Latn, Kpel",
ancestors = "kpe",
}
m["knv"] = {
"Tabo",
7959888,
"aav",
}
m["knx"] = {
"Kendayan",
6388963,
"poz-mly",
"Latn",
}
m["kny"] = {
"Kanyok",
11110766,
"bnt-lub",
"Latn",
}
m["knz"] = {
"Kalamsé",
3914000,
"nic-gnn",
}
m["koa"] = {
"Konomala",
3198732,
"poz-ocw",
"Latn",
}
m["koc"] = {
"Kpati",
3913279,
"nic-nge",
"Latn",
}
m["kod"] = {
"Kodi",
4577633,
"poz-cet",
"Latn",
}
m["koe"] = {
"Kacipo-Balesi",
5364424,
"sdv",
}
m["kof"] = {
"Kubi",
3438718,
"cdc-wst",
"Latn",
}
m["kog"] = {
"Cogui",
3198286,
"cba",
"Latn",
}
m["koh"] = {
"Koyo",
35649,
"bnt-mbo",
"Latn",
}
m["koi"] = {
"Komi-Permyak",
56318,
"kv",
"Cyrl",
translit = "kv-translit",
strip_diacritics = {remove_diacritics = c.acute},
override_translit = true,
}
m["kok"] = {
"Konkani",
34239,
"inc-sou",
"Deva, Knda, Mlym, fa-Arab, Latn",
translit = {
Deva = "mr-translit",
},
-- Knda translit in [[Module:scripts/data]]
-- Mlym translit in [[Module:scripts/data]]
strip_diacritics = {
-- FIXME: Separate out the scripts
from = {"च़", "ज़", "झ़", "ಚ಼", "ಜ಼", "ಝ಼"},
to = {"च", "ज", "झ", "ಚ", "ಜ", "ಝ"}
} ,
}
m["kol"] = {
"Kol (New Guinea)",
4227542,
}
m["koo"] = {
"Konzo",
2361829,
"bnt-glb",
"Latn",
}
m["kop"] = {
"Waube",
11732373,
"ngf-nur",
"Latn",
}
m["koq"] = {
"Kota (Gabon)",
35607,
"bnt-kel",
"Latn",
}
m["kos"] = {
"Kosraean",
33464,
"poz-mic",
"Latn",
}
m["kot"] = {
"Lagwan",
3502264,
"cdc-cbm",
"Latn",
}
m["kou"] = {
"Koke",
797249,
"alv-bua",
}
m["kov"] = {
"Kudu-Camo",
3915850,
"nic-jer",
}
m["kow"] = {
"Kugama",
3913307,
"alv-mye",
}
m["koy"] = {
"Koyukon",
28304,
"ath-nor",
"Latn",
}
m["koz"] = {
"Korak",
6431365,
"ngf-kow",
"Latn",
}
m["kpa"] = {
"Kutto",
3437656,
"cdc-wst",
}
m["kpb"] = {
"Mullu Kurumba",
19573111,
"dra-mal",
}
m["kpc"] = {
"Curripaco",
2882543,
"awd-nwk",
"Latn",
}
m["kpd"] = {
"Koba",
6424249,
"poz",
}
m["kpe"] = {
"Kpelle",
35673,
"dmn-msw",
"Latn, Kpel",
}
m["kpf"] = {
"Komba",
6428239,
"ngf-kab",
"Latn",
}
m["kpg"] = {
"Kapingamarangi",
35771,
"poz-pnp",
"Latn",
}
m["kph"] = {
"Kplang",
35628,
"alv-gng",
}
m["kpi"] = {
"Kofei",
6425665,
"paa-egb",
"Latn",
}
m["kpj"] = {
"Karajá",
10322066,
"sai-mje",
"Latn",
}
m["kpk"] = {
"Kpan",
3915380,
"nic-jkn",
"Latn",
}
m["kpl"] = {
"Kpala",
11154769,
"nic-nkk",
"Latn",
}
m["kpm"] = {
"Koho",
3511919,
"mkh-ban",
"Latn",
}
m["kpn"] = {
"Kepkiriwát",
3195366,
"tup",
"Latn",
}
m["kpo"] = {
"Ikposo",
35029,
"alv-ktg",
"Latn",
}
m["kpq"] = {
"Korupun-Sela",
6432769,
"ngf-mek",
"Latn",
}
m["kpr"] = {
"Korafe-Yegha",
11732347,
"ngf-gko",
"Latn",
}
m["kps"] = {
"Tehit",
7694851,
"paa-wbh",
"Latn",
}
m["kpt"] = {
"Karata",
56636,
"cau-and",
"Cyrl",
translit = "kpt-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kpu"] = {
"Kafoa",
6346151,
"paa-alp",
"Latn",
}
m["kpv"] = {
"Komi-Zyrian",
34114,
"kv",
"Cyrl",
translit = "kv-translit",
override_translit = true,
wikimedia_codes = "kv",
}
m["kpw"] = {
"Kobon",
11732326,
"ngf-kak",
"Latn",
}
m["kpx"] = {
"Mountain Koiari",
6925030,
"ngf-koi",
"Latn",
}
-- Koryak: Cyrillic only, with apostrophe normalisation, a sort-key table and a transliteration module.
m["kpy"] = {
"Koryak",
36199,
"qfa-ckn",
"Cyrl",
-- Normalise both apostrophe forms matched by the class ['’] to ʼ.
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
-- Parallel lists: each `from` item is rewritten as a plain letter followed by p[1]. The digraphs
-- "вʼ" and "гʼ" are written with ʼ, the same character that strip_diacritics produces above
-- (presumably the sort key is computed from the already-normalised text — TODO confirm).
sort_key = {
from = {"вʼ", "гʼ", "ё", "ӄ", "ӈ"},
to = {"в" .. p[1], "г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1]}
},
translit = "kpy-translit",
}
m["kpz"] = {
"Kupsabiny",
56445,
"sdv-kln",
}
m["kqa"] = {
"Mum",
6935252,
"ngf-nso",
"Latn",
}
m["kqb"] = {
"Kovai",
6434822,
"ngf-ehu",
"Latn",
}
m["kqc"] = {
"Doromu-Koki",
5298175,
"paa-man",
"Latn",
}
m["kqd"] = {
"Koy Sanjaq Surat",
33463,
"sem-nna",
}
m["kqe"] = {
"Kalagan",
18748906,
"phi",
"Latn",
}
m["kqf"] = {
"Kakabai",
6349119,
"poz-ocw",
"Latn",
}
m["kqg"] = {
"Khe",
3914015,
"nic-gur",
}
m["kqh"] = {
"Kisankasa",
6416409,
"sdv",
}
m["kqi"] = {
"Koitabu",
6426363,
"ngf-koi",
"Latn",
}
m["kqj"] = {
"Koromira",
6432520,
"paa-sbo",
"Latn",
}
m["kqk"] = {
"Kotafon Gbe",
12952447,
"alv-pph",
}
m["kql"] = {
"Kyenele",
11732453,
"paa-yua",
"Latn",
}
m["kqm"] = {
"Khisa",
3913955,
"nic-gur",
}
m["kqn"] = {
"Kaonde",
33601,
"bnt-lub",
"Latn",
}
m["kqo"] = {
"Eastern Krahn",
3915374,
"kro-wee",
}
m["kqp"] = {
"Kimré",
3441210,
"cdc-est",
}
m["kqq"] = {
"Krenak",
6436747,
"sai-cer",
}
m["kqr"] = {
"Kimaragang",
3196845,
"poz-san",
"Latn",
}
m["kqs"] = {
"Northern Kissi",
19921576,
"alv-kis",
}
m["kqt"] = {
"Klias River Kadazan",
12953594,
"poz-san",
}
m["kqu"] = {
"Seroa",
33127766,
"khi-tuu",
}
m["kqv"] = {
"Okolod",
7082487,
"poz-san",
}
m["kqw"] = {
"Kandas",
3192590,
"poz-ocw",
"Latn",
}
m["kqx"] = {
"Mser",
3502347,
"cdc-cbm",
}
m["kqy"] = {
"Koorete",
6430753,
"omv-eom",
"Ethi, Latn",
}
m["kqz"] = {
"Korana",
2756709,
"khi-khk",
"Latn",
}
m["kra"] = {
"Kumhali",
13580783,
"inc-bih",
}
m["krb"] = {
"Karkin",
3193345,
"nai-utn",
"Latn",
}
m["krc"] = {
"Karachay-Balkar",
33714,
"trk-kcu",
"Cyrl",
translit = "krc-translit",
sort_key = {
from = {"гъ", "дж", "ё", "къ", "нг"},
to = {"г" .. p[1], "д" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1]}
},
}
m["krd"] = {
"Kairui-Midiki",
12953277,
"poz-tim",
}
m["kre"] = {
"Panará",
3361895,
"sai-cer",
"Latn",
}
m["krf"] = {
"Koro (Vanuatu)",
3198995,
"poz-vnn",
"Latn",
}
m["krh"] = {
"Kurama",
35593,
"nic-kau",
}
m["kri"] = {
"Krio",
35744,
"crp",
"Latn",
ancestors = "en",
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ},
sort_key = {
from = {"ɛ", "gb", "kp", "ɔ"},
to = {"e" .. p[1], "g" .. p[1], "k" .. p[1], "o" .. p[1]}
},
}
m["krj"] = {
"Kinaray-a",
33720,
"phi",
"Latn",
}
m["krk"] = {
"Kerek",
332792,
"qfa-ckn",
"Cyrl",
}
-- Karelian: Latin script with a sort-key substitution table.
m["krl"] = {
"Karelian",
33557,
"urj-fin",
"Latn",
-- `from` and `to` are parallel lists (8 items each). Resulting pairings:
--   č -> c..p[1]
--   š -> s..p[1],  z -> s..p[2],  ž -> s..p[3]
--   ü -> y..p[1],  ä -> y..p[2],  ö -> y..p[3],  ' -> y..p[4]
-- i.e. z and ž are keyed under s, and ä, ö and the apostrophe under y.
-- NOTE(review): the "2 chars" / "1 char" remarks below presumably count code points of the
-- decomposed form of each item — confirm; the grouping puts the longer items first.
sort_key = {
from = {
"č", "š", "ž", "ü", "ä", "ö", -- 2 chars
"z", "'" -- 1 char
},
to = {
"c" .. p[1], "s" .. p[1], "s" .. p[3], "y" .. p[1], "y" .. p[2], "y" .. p[3],
"s" .. p[2], "y" .. p[4],
}
},
}
m["krm"] = {
"Krim",
35713,
"alv",
}
m["krn"] = {
"Sapo",
3915386,
"kro-wee",
}
m["krp"] = {
"Korop",
35626,
"nic-ucr",
"Latn",
}
m["krr"] = {
"Kru'ng",
12953650,
"mkh-ban",
}
m["krs"] = {
"Kresh",
56674,
"csu-bkr",
}
m["kru"] = {
"Kurux",
33492,
"dra-kml",
"Deva, Tols",
translit = {
Deva = "hi-translit",
},
}
m["krv"] = {
"Kavet",
12953649,
"sai-ktk",
"Latn",
}
m["krw"] = {
"Western Krahn",
10975611,
"kro-wee",
}
m["krx"] = {
"Karon",
35704,
"alv-jol",
}
m["kry"] = {
"Kryts",
35861,
"cau-ssm",
"Latn, Cyrl",
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Latn = s["cau-Latn-stripdiacritics"],
Cyrl = s["cau-Cyrl-stripdiacritics"],
},
}
m["krz"] = {
"Sota Kanum",
12952568,
"paa-kan",
"Latn",
}
m["ksa"] = {
"Shuwa-Zamani",
3913929,
"nic-kau",
}
m["ksb"] = {
"Shambala",
3788739,
"bnt-seu",
"Latn",
}
m["ksc"] = {
"Southern Kalinga",
18753301,
"phi",
}
m["ksd"] = {
"Tolai",
35870,
"poz-ocw",
"Latn",
}
m["kse"] = {
"Kuni",
6444619,
"poz-ocw",
"Latn",
}
m["ksf"] = {
"Bafia",
34930,
"bnt-baf",
"Latn",
}
m["ksg"] = {
"Kusaghe",
3200638,
"poz-ocw",
"Latn",
}
m["ksi"] = {
"Krisa",
841704,
"paa-sko",
"Latn",
}
m["ksj"] = {
"Uare",
6450052,
"paa-kwa",
"Latn",
}
m["ksk"] = {
"Kansa",
3192772,
"sio-dhe",
"Latn",
}
m["ksl"] = {
"Kumalu",
17584381,
"poz-ocw",
"Latn",
}
m["ksm"] = {
"Kumba",
3913972,
"alv-mye",
}
m["ksn"] = {
"Kasiguranin",
6374525,
"phi",
}
m["kso"] = {
"Kofa",
56278,
"cdc-cbm",
}
m["ksp"] = {
"Kaba",
3915316,
"csu-sar",
}
m["ksq"] = {
"Kwaami",
3440525,
"cdc-wst",
}
m["ksr"] = {
"Borong",
4946263,
"ngf-kbm",
"Latn",
}
m["kss"] = {
"Southern Kissi",
11028974,
"alv-kis",
}
m["kst"] = {
"Winyé",
3913360,
"nic-gnw",
}
m["ksu"] = {
"Khamyang",
6583541,
"tai-swe",
}
m["ksv"] = {
"Kusu",
6448199,
"bnt-tet",
}
m["ksw"] = {
"S'gaw Karen",
56410,
"kar",
"Mymr",
translit = "ksw-translit",
}
m["ksx"] = {
"Kedang",
6382520,
"poz",
"Latn",
}
m["ksy"] = {
"Kharia Thar",
6400661,
"inc-eas",
}
m["ksz"] = {
"Kodaku",
21179986,
"mun",
}
m["kta"] = {
"Katua",
6378404,
"mkh-ban",
}
m["ktb"] = {
"Kambaata",
35664,
"cus-hec",
"Latn",
}
m["ktc"] = {
"Kholok",
3440464,
"cdc-wst",
}
m["ktd"] = {
"Kokata",
10547021,
"aus-pam",
"Latn",
}
m["ktf"] = {
"Kwami",
12952687,
"bnt-lgb",
}
m["ktg"] = {
"Kalkatungu",
3914057,
"aus-pam",
"Latn",
}
m["kth"] = {
"Karanga",
713643,
}
m["kti"] = {
"North Muyu",
20857698,
"ngf-lok",
"Latn",
}
m["ktj"] = {
"Plapo Krumen",
10975356,
"kro-grb",
}
m["ktk"] = {
"Kaniet",
3399050,
"poz-aay",
"Latn",
}
m["ktl"] = {
"Koroshi",
3775265,
"ira-nwi",
ancestors = "bal",
}
m["ktm"] = {
"Kurti",
3200615,
"poz-aay",
"Latn",
}
m["ktn"] = {
"Karitiâna",
3112184,
"tup",
"Latn",
}
m["kto"] = {
"Kuot",
56537,
}
m["ktp"] = {
"Kaduo",
769809,
"tbq-bka",
}
m["ktq"] = {
"Katabaga",
3193895,
}
m["ktr"] = {
"Kota Marudu Tinagas",
18642280,
}
m["kts"] = {
"South Muyu",
42308820,
"ngf-lok",
"Latn",
}
m["ktt"] = {
"Ketum",
12952616,
"ngf-dum",
"Latn",
}
m["ktu"] = {
"Kituba",
35746,
"crp",
"Latn",
ancestors = "kg",
}
m["ktv"] = {
"Eastern Katu",
22808951,
"mkh-kat",
"Latn",
}
m["ktw"] = {
"Kato",
20831,
"ath-pco",
"Latn",
}
m["ktx"] = {
"Kaxararí",
6380124,
"sai-pan",
"Latn",
}
m["kty"] = {
"Kango",
6362818,
"bnt-bta",
"Latn",
}
m["ktz"] = {
"Juǀ'hoan",
1192295,
"khi-kxa",
"Latn",
}
m["kub"] = {
"Kutep",
35645,
"nic-jkn",
}
m["kuc"] = {
"Kwinsu",
6450460,
"paa-tor",
"Latn",
}
m["kud"] = {
"Auhelawa",
5166,
"poz-ocw",
"Latn",
}
m["kue"] = {
"Kuman",
137525,
"ngf-sim",
"Latn",
}
m["kuf"] = {
"Western Katu",
6378400,
"mkh-kat",
"Laoo, Tale, Latn",
}
m["kug"] = {
"Kupa",
3915336,
"alv-ngb",
}
m["kuh"] = {
"Kushi",
3438747,
"cdc-wst",
}
m["kui"] = {
"Kuikúro",
3915522,
"sai-kui",
"Latn",
}
m["kuj"] = {
"Kuria",
6445968,
"bnt-lok",
"Latn",
}
m["kuk"] = {
"Kepo'",
6393217,
"poz",
}
m["kul"] = {
"Kulere",
3440506,
"cdc-wst",
}
m["kum"] = {
"Kumyk",
36209,
"trk-kcu",
"Cyrl",
translit = "kum-translit",
sort_key = {
from = {"гъ", "гь", "ё", "къ", "нг", "оь", "уь"},
to = {"г" .. p[1], "г" .. p[2], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "у" .. p[1]}
},
}
m["kun"] = {
"Kunama",
36041,
}
m["kuo"] = {
"Kumukio",
11732362,
"ngf-dal",
"Latn",
}
m["kup"] = {
"Kunimaipa",
6444696,
"paa-kun",
"Latn",
}
m["kuq"] = {
"Karipuna",
6371071,
"tup-gua",
"Latn",
}
m["kus"] = {
"Kusaal",
35708,
"nic-dag",
"Latn",
}
m["kut"] = {
"Ktunaxa",
33434,
"qfa-iso",
"Latn",
}
m["kuu"] = {
"Upper Kuskokwim",
28062,
"ath-nor",
"Latn",
}
m["kuv"] = {
"Kur",
12635082,
"poz-cma",
"Latn",
}
m["kuw"] = {
"Kpagua",
11137573,
"bad-cnt",
}
m["kux"] = {
"Kukatja",
10549839,
"aus-pam",
"Latn",
}
m["kuy"] = {
"Kuuku-Ya'u",
10550697,
"aus-pmn",
"Latn",
}
m["kuz"] = {
"Kunza",
2669181,
"qfa-iso",
"Latn",
}
m["kva"] = {
"Bagvalal",
56638,
"cau-and",
"Cyrl",
translit = "cau-nec-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kvb"] = {
"Kubu",
6441341,
"poz-mly",
}
m["kvc"] = {
"Kove",
3199402,
"poz-ocw",
"Latn",
}
m["kvd"] = {
"Kui (Indonesia)",
6442230,
"paa-alp",
"Latn",
}
m["kve"] = {
"Kalabakan",
6350003,
"poz-san",
"Latn",
}
m["kvf"] = {
"Kabalai",
3440427,
"cdc-est",
}
m["kvg"] = {
"Kuni-Boazi",
2907551,
"paa-boa",
"Latn",
}
m["kvh"] = {
"Komodo",
3198565,
"poz-cet",
"Latn",
}
m["kvi"] = {
"Kwang",
3440398,
"cdc-est",
"Latn",
}
m["kvj"] = {
"Psikye",
56304,
"cdc-cbm",
}
m["kvk"] = {
"Korean Sign Language",
3073428,
"sgn-jsl",
}
m["kvl"] = {
"Brek Karen",
12952577,
"kar",
}
m["kvm"] = {
"Kendem",
35751,
"nic-mam",
"Latn",
}
m["kvn"] = {
"Border Kuna",
31777873,
"cba",
}
m["kvo"] = {
"Dobel",
5286559,
"poz",
"Latn",
}
m["kvp"] = {
"Kompane",
18343041,
"poz",
}
m["kvq"] = {
"Geba Karen",
12952581,
"kar",
"Latn, Mymr",
}
m["kvr"] = {
"Kerinci",
3195442,
"poz-mly",
"Latn, Arab", -- Also Incung, which we don't have
}
m["kvt"] = {
"Lahta Karen",
12952582,
"kar",
}
m["kvu"] = {
"Yinbaw Karen",
14426328,
"kar",
}
m["kvv"] = {
"Kola",
6426967,
"poz",
"Latn",
}
m["kvw"] = {
"Wersing",
7983599,
"paa-alp",
"Latn",
}
m["kvx"] = {
"Parkari Koli",
3244176,
"inc-wes",
}
m["kvy"] = {
"Yintale Karen",
14426329,
"kar",
}
m["kvz"] = {
"Tsakwambo",
7849438,
"ngf-kts",
"Latn",
}
m["kwa"] = {
"Dâw",
3042278,
"sai-nad",
"Latn",
}
m["kwb"] = {
"Baa",
34842,
"alv-ada",
}
m["kwc"] = {
"Likwala",
35597,
"bnt-mbo",
}
m["kwd"] = {
"Kwaio",
3200796,
"poz-sls",
"Latn",
}
m["kwe"] = {
"Kwerba",
6450328,
"paa-kwe",
"Latn",
}
m["kwf"] = {
"Kwara'ae",
3200829,
"poz-sls",
"Latn",
}
m["kwg"] = {
"Sara Kaba Deme",
3915384,
"csu-kab",
}
m["kwh"] = {
"Kowiai",
6435028,
"poz",
"Latn",
}
m["kwi"] = {
"Awa-Cuaiquer",
2603103,
"sai-bar",
"Latn",
}
m["kwj"] = {
"Kwanga",
3438383,
"paa-sep",
"Latn",
}
m["kwk"] = {
"Kwak'wala",
2640628,
"wak",
"Latn",
}
m["kwl"] = {
"Kofyar",
3441382,
"cdc-wst",
"Latn",
}
m["kwm"] = {
"Kwambi",
3487165,
"bnt-ova",
}
m["kwn"] = {
"Kwangali",
36334,
"bnt-kav",
"Latn",
}
m["kwo"] = {
"Kwomtari",
3508116,
"paa-kwo",
"Latn",
}
m["kwp"] = {
"Kodia",
3914867,
"kro-ekr",
}
m["kwq"] = {
"Kwak",
11014183,
"nic-nka",
ancestors = "yam",
}
m["kwr"] = {
"Kwer",
12635137,
"ngf-wok",
"Latn",
}
m["kws"] = {
"Kwese",
3200846,
"bnt-pen",
}
m["kwt"] = {
"Kwesten",
6450354,
"paa-tor",
"Latn",
}
m["kwu"] = {
"Kwakum",
35624,
"bnt-kak",
}
m["kwv"] = {
"Sara Kaba Náà",
3915361,
"csu-kab",
"Latn",
}
-- Kwinti. `ancestors` is the only named field in this entry; it is set to "en".
m["kww"] = {
"Kwinti",
721182,
"crp",
"Latn",
ancestors = "en",
}
m["kwx"] = {
"Khirwar",
12976968,
"dra",
}
m["kwz"] = {
"Kwadi",
2364661,
"khi-kkw",
"Latn",
}
m["kxa"] = {
"Kairiru",
3398785,
"poz-ocw",
"Latn",
}
m["kxb"] = {
"Krobu",
35586,
"alv-ptn",
"Latn",
}
m["kxc"] = {
"Konso",
56624,
"cus-eas",
"Ethi, Latn",
}
m["kxd"] = {
"Brunei Malay",
3182878,
"poz-mly",
"Latn, ms-Arab",
}
m["kxe"] = {
"Kakihum",
3914433,
"nic-kam",
ancestors = "tvd",
}
m["kxf"] = {
"Manumanaw Karen",
12952592,
"kar",
"Mymr, Latn",
}
m["kxh"] = {
"Karo",
3447116,
"omv-aro",
}
m["kxi"] = {
"Keningau Murut",
6389308,
"poz-san",
"Latn",
}
m["kxj"] = {
"Kulfa",
713654,
"csu-kab",
}
m["kxk"] = {
"Zayein Karen",
14352960,
"kar",
}
-- Nepali Kurux [kxl] treated as part of Kurux [kru], consistent with ISO merger in 2020
-- Northern Khmer: two scripts listed ("Thai, Khmr"), with `ancestors` set to "xhm".
m["kxm"] = {
"Northern Khmer",
3502234,
"mkh-kmr",
"Thai, Khmr",
ancestors = "xhm",
-- Sort-key rewrite rules (`from` patterns paired with `to` replacements). The table is not keyed by
-- script, and every pattern below contains only Thai characters:
--   1. "[%pๆ]" -> "": delete punctuation (%p) and the character ๆ.
--   2. "[็-๎]" -> "": delete every character in the range ็ to ๎.
--   3. "([เแโใไ])([ก-ฮ])" -> "%2%1": swap one of เ แ โ ใ ไ with the immediately following
--      character in the range ก to ฮ, so that the second character comes first in the key.
-- NOTE(review): multi-byte ranges such as ก-ฮ need a Unicode-aware pattern engine — confirm the consumer uses one.
sort_key = {
from = {"[%pๆ]", "[็-๎]", "([เแโใไ])([ก-ฮ])"},
to = {"", "", "%2%1"}
},
}
m["kxn"] = {
"Kanowit",
6364300,
"poz-bnn",
"Latn",
}
m["kxo"] = {
"Kanoé",
4356223,
"qfa-iso",
"Latn",
}
m["kxp"] = {
"Wadiyara Koli",
12953645,
"inc-wes",
}
m["kxq"] = {
"Smärky Kanum",
12952569,
"paa-kan",
"Latn",
}
m["kxr"] = {
"Manus Koro",
3198994,
"poz-aay",
"Latn",
}
m["kxs"] = {
"Kangjia",
3182570,
"xgn-shr",
"Latn",
}
m["kxt"] = {
"Koiwat",
6426388,
"paa-nnd",
"Latn",
}
m["kxu"] = {
"Kui (India)",
33919,
"dra-kki",
"Orya",
translit = "kxv-translit",
strip_diacritics = {
remove_diacritics = "୕",
from = {"ଆଆ", "ଇଇ", "ଉଉ", "ଏଏ", "ଓଓ", "ିଇ", "ୁଉ", "େଏ", "ୋଓ"},
to = {"ଆ", "ଈ", "ଊ", "ଏ", "ଓ", "ୀ", "ୂ", "େ", "ୋ"},
},
}
m["kxv"] = {
"Kuvi",
3200721,
"dra-kki",
"Orya",
translit = "kxv-translit",
strip_diacritics = {
remove_diacritics = "୕",
from = {"ଆଆ", "ଇଇ", "ଉଉ", "ଏଏ", "ଓଓ", "([କ-ହ])ଆ", "ିଇ", "ୁଉ", "େଏ", "ୋଓ"},
to = {"ଆ", "ଈ", "ଊ", "ଏ", "ଓ", "%1ା", "ୀ", "ୂ", "େ", "ୋ"},
},
}
m["kxw"] = {
"Konai",
11732339,
"ngf-est",
"Latn",
}
m["kxx"] = {
"Likuba",
35646,
"bnt-bmo",
}
m["kxy"] = {
"Kayong",
6380673,
"mkh",
}
m["kxz"] = {
"Kerewo",
6393847,
"paa-kiw",
"Latn",
}
m["kya"] = {
"Kwaya",
6450276,
"bnt-haj",
"Latn",
}
m["kyb"] = {
"Butbut Kalinga",
18753300,
"phi",
"Latn",
}
m["kyc"] = {
"Kyaka",
12952690,
"ngf-enc",
"Latn",
}
m["kyd"] = {
"Karey",
6370196,
"poz",
}
m["kye"] = {
"Krache",
35658,
"alv-gng",
}
m["kyf"] = {
"Kouya",
35595,
"kro-bet",
}
m["kyg"] = {
"Keyagana",
6398208,
"ngf-kya",
"Latn",
}
m["kyh"] = {
"Karok",
1288440,
"qfa-iso", -- or Hokan?
"Latn",
}
m["kyi"] = {
"Kiput",
3038653,
"poz-swa",
"Latn",
}
m["kyj"] = {
"Karao",
3192950,
"phi",
"Latn",
}
m["kyk"] = {
"Kamayo",
3192339,
"phi",
"Latn",
}
m["kyl"] = {
"Kalapuya",
3192120,
"nai-klp",
}
m["kym"] = {
"Kpatili",
3913982,
"znd",
}
m["kyn"] = {
"Karolanos",
6373093,
"phi",
}
m["kyo"] = {
"Kelon",
6386414,
"paa-alp",
"Latn",
}
m["kyp"] = {
"Kang",
25559558,
"tai",
}
m["kyq"] = {
"Kenga",
35707,
"csu-bgr",
}
m["kyr"] = {
"Kuruáya",
3200633,
"tup",
"Latn",
}
m["kys"] = {
"Baram Kayan",
2883794,
"poz",
"Latn",
}
m["kyt"] = {
"Kayagar",
6380394,
"paa-kay",
"Latn",
}
m["kyu"] = {
"Western Kayah",
12952596,
"kar",
"Kali, Mymr, Latn",
translit = {Kali = "Kali-translit"},
}
m["kyv"] = {
"Kayort",
6380675,
"inc-krd",
"Deva",
}
m["kyw"] = {
"Kudmali",
6446173,
"inc-bih",
"Deva, as-Beng, Orya, Chis",
}
m["kyx"] = {
"Rapoisi",
7294279,
"paa-nbo",
"Latn",
}
m["kyy"] = {
"Kambaira",
6356254,
"ngf-kai",
"Latn",
}
m["kyz"] = {
"Kayabí",
6380372,
"tup-gua",
"Latn",
}
m["kza"] = {
"Western Karaboro",
36601,
"alv-krb",
}
m["kzb"] = {
"Kaibobo",
6347565,
"poz-cma",
}
m["kzc"] = {
"Bondoukou Kulango",
11031321,
"alv-kul",
"Latn",
}
m["kzd"] = {
"Kadai",
7679471,
"poz-cma",
"Latn",
}
-- kze (Kosena) was made an etym-only child of auy (Auyana) per [[Wiktionary:Language_treatment_requests#merge_Kosena_[kze]_into_Auyana_[auy]]]
m["kzf"] = {
"Da'a Kaili",
33103997,
"poz-kal",
"Latn",
}
m["kzg"] = {
"Kikai",
3196527,
"jpx-nry",
"Jpan",
translit = s["jpx-translit"],
display_text = s["jpx-displaytext"],
strip_diacritics = s["jpx-stripdiacritics"],
sort_key = s["jpx-sortkey"],
}
m["kzh"] = {
"Dongolawi",
5295991,
"nub",
"Latn",
}
m["kzi"] = {
"Kelabit",
6385445,
"poz-swa",
"Latn",
}
m["kzj"] = {
"Coastal Kadazan",
3307195,
"poz-san",
"Latn",
}
m["kzk"] = {
"Kazukuru",
1089069,
"poz-ocw",
}
m["kzl"] = {
"Kayeli",
4207444,
"poz-cma",
"Latn",
}
m["kzm"] = {
"Kais",
6348319,
"ngf-sbh",
"Latn",
}
m["kzn"] = {
"Kokola",
11128329,
"bnt-mak",
"Latn",
ancestors = "vmw",
}
m["kzo"] = {
"Kaningi",
35683,
"bnt-mbt",
}
m["kzp"] = {
"Kaidipang",
6347611,
"phi",
"Latn",
}
m["kzq"] = {
"Kaike",
10951226,
"sit-tam",
}
m["kzr"] = {
"Karang",
35681,
"alv-mbm",
"Latn",
}
m["kzs"] = {
"Sugut Dusun",
12953510,
"poz-san",
"Latn",
}
m["kzt"] = {
"Tambunan Dusun",
12953514,
"poz-san",
"Latn",
}
m["kzu"] = {
"Kayupulau",
6380723,
"poz-ocw",
}
m["kzv"] = {
"Komyandaret",
6428671,
"ngf-kts",
"Latn",
}
m["kzw"] = { -- contrast xoo, sai-kat, sai-xoc, the last of which the ISO conflated into this code
"Kariri",
12953620,
"sai-mje",
"Latn",
}
m["kzx"] = {
"Kamarian",
6356040,
"poz-cma",
"Latn",
}
m["kzy"] = {
"Kango-Sua",
11008360,
"bnt-kbi",
"Latn",
ancestors = "bip",
}
m["kzz"] = {
"Kalabra",
6350038,
"paa-wbh",
"Latn",
}
-- Pass the completed table `m` to finalizeData from [[Module:languages]], tagged "language",
-- and return whatever it produces as this module's value.
return require("Module:languages").finalizeData(m, "language")
cde9rgm4ot172eeyv0u4lv3su75yy5w
234821
234820
2026-05-24T08:01:32Z
Lee
19
[[:en:Module:languages/data/3/k]] වෙතින් එක් සංශෝධනයක්
234820
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy wrapper: nothing is loaded unless the data actually calls `u`. The first call fetches `char`
-- from [[Module:string utilities]], rebinds `u` to it so later calls go straight to the loaded
-- function, and forwards its arguments.
local function u(...)
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
-- Karakalpak: three scripts listed; sort keys are defined for Latn and Cyrl only (none for fa-Arab).
m["kaa"] = {
"Karakalpak",
33541,
"trk-kno",
"Latn, Cyrl, fa-Arab",
dotted_dotless_i = true,
-- Normalise both apostrophe forms matched by the class ['’] to ʼ.
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
sort_key = {
-- `from` and `to` are parallel lists (21 items each, laid out on matching rows).
-- p[4] and p[5] appear on both sides: "í" and "iʼ" are first turned into p[4] / p[5] and plain "i"
-- into "i" .. p[3]; later in the list p[4] becomes "i" and p[5] becomes "i" .. p[1].
-- Net result, assuming the pairs are applied in list order (TODO confirm):
--   í -> i,  iʼ -> i..p[1],  ı -> i..p[2],  i -> i..p[3]
-- Other pairings of note: sh -> z..p[1], c -> z..p[2], ch -> z..p[3], x -> h..p[1], q -> k..p[1].
Latn = {
from = {
-- Sort the old orthography (using the apostrophe) after the new orthography (using the acute accent).
"í", "iʼ", "i", -- Ensure "i" comes after "í", "iʼ", "ı".
"sh", "ch",
"á", "aʼ", "ǵ", "gʼ", "x", p[4], p[5], "ı", "q", "ń", "nʼ", "ó", "oʼ", "ú", "uʼ", "c"
},
to = {
p[4], p[5], "i" .. p[3],
"z" .. p[1], "z" .. p[3],
"a" .. p[1], "a" .. p[2], "g" .. p[1], "g" .. p[2], "h" .. p[1], "i", "i" .. p[1], "i" .. p[2], "k" .. p[1], "n" .. p[1], "n" .. p[2], "o" .. p[1], "o" .. p[2], "u" .. p[1], "u" .. p[2], "z" .. p[2]
}
},
-- Each listed Cyrillic letter is rewritten as a plain letter plus p[1]; ў is the one exception,
-- using p[2] because ү already maps to у..p[1].
Cyrl = {
from = {"ә", "ғ", "ё", "қ", "ң", "ө", "ү", "ў", "ҳ"},
to = {"а" .. p[1], "г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "у" .. p[1], "у" .. p[2], "х" .. p[1]}
},
},
}
m["kab"] = {
"Kabyle",
35853,
"ber",
"Latn, Arab, Tfng",
}
m["kac"] = {
"Jingpho",
33332,
"sit-jnp",
"Latn, Mymr",
}
m["kad"] = {
"Kadara",
3914011,
"nic-plc",
"Latn",
}
m["kae"] = {
"Ketangalan",
2779411,
"map",
}
m["kaf"] = {
"Katso",
246122,
"tbq-kzh",
}
m["kag"] = {
"Kajaman",
6348863,
"poz",
"Latn",
}
m["kah"] = {
"Fer",
5443742,
"csu-bgr",
"Latn",
}
m["kai"] = {
"Karekare",
3438770,
"cdc-wst",
"Latn",
}
m["kaj"] = {
"Jju",
35401,
"nic-plc",
"Latn",
}
m["kak"] = {
"Kayapa Kallahan",
3192220,
"phi",
"Latn",
}
m["kam"] = {
"Kamba",
2574767,
"bnt-kka",
"Latn",
}
m["kao"] = {
"Kassonke",
36905,
"dmn-wmn",
"Latn",
}
m["kap"] = {
"Bezhta",
33054,
"cau-ets",
"Cyrl",
translit = "cau-nec-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kaq"] = {
"Capanahua",
2937196,
"sai-pan",
"Latn",
}
m["kaw"] = {
"Old Javanese",
49341,
"poz",
"Latn, Java, Kawi",
translit = "jv-translit", --same as jv
}
m["kax"] = {
"Kao",
3192799,
"paa-gto",
"Latn",
}
m["kay"] = {
"Kamayurá",
3192336,
"tup-gua",
"Latn",
}
m["kba"] = {
"Kalarko",
5517764,
"aus-pam",
"Latn",
}
m["kbb"] = {
"Kaxuyana",
12953626,
"sai-prk",
"Latn",
}
m["kbc"] = {
"Kadiwéu",
18168288,
"sai-guc",
"Latn",
}
m["kbd"] = {
"East Circassian",
33522,
"cau-cir",
"Cyrl, Latn, Arab",
translit = {
Cyrl = "cau-cir-translit",
Arab = "ar-translit",
},
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
sort_key = {
Cyrl = {
from = {
"кхъу", "къӏу", -- 4 chars
"гъу", "джу", "дзу", "жъу", "къу", "кхъ", "къӏ", "кӏу", "кӏь", "лъу", "лӏу", "пӏу", "сӏу", "тӏу", "фӏу", "хъу", "цӏу", "чъу", "чӏу", "шъу", "шӏу", "щӏу", -- 3 chars
"гу", "гъ", "гь", "дж", "дз", "ё", "жъ", "жь", "ку", "къ", "кь", "кӏ", "лъ", "ль", "лӏ", "пӏ", "сӏ", "тӏ", "фӏ", "ху", "хъ", "хь", "цу", "цӏ", "чу", "чъ", "чӏ", "шъ", "шӏ", "щӏ", "ӏу", "ӏь", -- 2 chars
"э" -- 1 char
},
to = {
"к" .. p[5], "к" .. p[7],
"г" .. p[3], "д" .. p[2], "д" .. p[4], "ж" .. p[2], "к" .. p[3], "к" .. p[4], "к" .. p[6], "к" .. p[10], "к" .. p[11], "л" .. p[2], "л" .. p[5], "п" .. p[2], "с" .. p[2], "т" .. p[2], "ф" .. p[2], "х" .. p[3], "ц" .. p[3], "ч" .. p[3], "ч" .. p[5], "ш" .. p[2], "ш" .. p[4], "щ" .. p[2],
"г" .. p[1], "г" .. p[2], "г" .. p[4], "д" .. p[1], "д" .. p[3], "е" .. p[1], "ж" .. p[1], "ж" .. p[3], "к" .. p[1], "к" .. p[2], "к" .. p[8], "к" .. p[9], "л" .. p[1], "л" .. p[3], "л" .. p[4], "п" .. p[1], "с" .. p[1], "т" .. p[1], "ф" .. p[1], "х" .. p[1], "х" .. p[2], "х" .. p[4], "ц" .. p[1], "ц" .. p[2], "ч" .. p[1], "ч" .. p[2], "ч" .. p[4], "ш" .. p[1], "ш" .. p[3], "щ" .. p[1], "ӏ" .. p[1], "ӏ" .. p[2],
"а" .. p[1]
}
},
},
}
m["kbe"] = {
"Kanju",
10543322,
"aus-pam",
"Latn",
}
m["kbh"] = {
"Camsá",
2842667,
"qfa-iso",
"Latn",
}
m["kbi"] = {
"Kaptiau",
6367294,
"poz-oce",
"Latn",
}
m["kbj"] = {
"Kari",
6370438,
"bnt-boa",
"Latn",
}
m["kbk"] = {
"Grass Koiari",
12952642,
"ngf-koi",
"Latn",
}
m["kbm"] = {
"Iwal",
3156391,
"poz-ocw",
"Latn",
}
m["kbn"] = {
"Kare (Central Africa)",
35554,
"alv-mbm",
"Latn",
}
m["kbo"] = {
"Keliko",
11275553,
"csu-mma",
}
m["kbp"] = {
"Kabiye",
35475,
"nic-gne",
"Latn",
}
m["kbq"] = {
"Kamano",
11732272,
"ngf-kya",
"Latn",
}
m["kbr"] = {
"Kafa",
35481,
"omv-gon",
"Ethi, Latn",
}
m["kbs"] = {
"Kande",
35556,
"bnt-tso",
"Latn",
}
m["kbt"] = {
"Gabadi",
3291159,
"poz-ocw",
"Latn",
}
m["kbu"] = {
"Kabutra",
10966761,
"raj",
}
m["kbv"] = {
"Kamberataro",
5261289,
"paa-sng",
"Latn",
}
m["kbw"] = {
"Kaiep",
6347632,
"poz-ocw",
"Latn",
}
m["kbx"] = {
"Ap Ma",
56298,
"paa-eke",
"Latn",
}
m["kbz"] = {
"Duhwa",
56295,
"cdc-wst",
"Latn",
}
m["kcb"] = {
"Kawacha",
11732302,
"ngf-woj",
"Latn",
}
m["kcc"] = {
"Lubila",
3914381,
"nic-uce",
"Latn",
}
m["kcd"] = {
"Ngkâlmpw Kanum",
12952566,
"paa-ngk",
"Latn",
}
m["kce"] = {
"Kaivi",
6348685,
"nic-kau",
}
m["kcf"] = {
"Ukaan",
36651,
"nic-bco",
}
m["kcg"] = {
"Tyap",
3912765,
"nic-plc",
"Latn",
}
m["kch"] = {
"Vono",
3913920,
"nic-kau",
}
m["kci"] = {
"Kamantan",
3914019,
"nic-plc",
}
m["kcj"] = {
"Kobiana",
35609,
"alv-nyn",
}
m["kck"] = {
"Kalanga",
33672,
"bnt-sho",
"Latn",
}
m["kcl"] = {
"Kala",
6349982,
"poz-ocw",
"Latn",
}
m["kcm"] = {
"Tar Gula",
277963,
"csu-bba",
}
-- Nubi. Listed under the family code "crp" with an explicitly named ancestor
-- ("apd"), and with two scripts (Latn and Arab).
-- strip_diacritics is not keyed by script here; its single setting names
-- c.acute (an entry of m_langdata.chars) as the character to remove.
-- NOTE(review): presumably the acute accent is dropped when normalising entry
-- names -- confirm against the consumer in [[Module:languages]].
m["kcn"] = {
"Nubi",
36388,
"crp",
"Latn, Arab",
ancestors = "apd",
strip_diacritics = {remove_diacritics = c.acute},
}
m["kco"] = {
"Kinalakna",
11732320,
"ngf-dal",
"Latn",
}
m["kcp"] = {
"Kanga",
6362384,
"qfa-kad",
"Latn",
}
m["kcq"] = {
"Kamo",
3914879,
"alv-wjk",
}
m["kcr"] = {
"Katla",
35688,
"nic-ktl",
}
m["kcs"] = {
"Koenoem",
3438755,
"cdc-wst",
}
m["kct"] = {
"Kaian",
6347538,
"paa-ott",
"Latn",
}
m["kcu"] = {
"Kikami",
3915212,
"bnt-ruv",
"Latn",
}
m["kcv"] = {
"Kete",
3195598,
"bnt-lub",
}
m["kcw"] = {
"Kabwari",
6344539,
"bnt-glb",
}
m["kcx"] = {
"Kachama-Ganjule",
12634070,
"omv-eom",
}
m["kcy"] = {
"Korandje",
33427,
"son",
}
m["kcz"] = {
"Konongo",
11732345,
"bnt-tkm",
"Latn",
}
m["kda"] = {
"Worimi",
3914062,
"aus-pam",
"Latn",
}
m["kdc"] = {
"Kutu",
6448634,
"bnt-ruv",
}
m["kdd"] = {
"Yankunytjatjara",
34207,
"aus-pam",
"Latn",
}
m["kde"] = {
"Makonde",
35172,
"bnt-rvm",
"Latn",
}
m["kdf"] = {
"Mamusi",
6746036,
"poz-ocw",
"Latn",
}
m["kdg"] = {
"Seba",
7442316,
"bnt-sbi",
"Latn",
}
m["kdh"] = {
"Tem",
36531,
"nic-gne",
"Latn",
}
m["kdi"] = {
"Kumam",
6443410,
"sdv-los",
}
m["kdj"] = {
"Karamojong",
56326,
"sdv-ttu",
"Latn",
}
m["kdk"] = {
"Numèè",
3346774,
"poz-cln",
"Latn",
}
m["kdl"] = {
"Tsikimba",
3914404,
"nic-kam",
}
m["kdm"] = {
"Kagoma",
3914420,
"nic-plc",
}
m["kdn"] = {
"Kunda",
4121130,
"bnt-sna",
"Latn",
}
m["kdp"] = {
"Kaningdon-Nindem",
3914956,
"nic-nin",
}
m["kdq"] = {
"Koch",
56431,
"tbq-bdg",
}
m["kdr"] = {
"Karaim",
33725,
"trk-kcu",
"Cyrl, Latn, Hebr",
-- Hebr display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kdt"] = {
"Kuy",
56310,
"mkh-kat",
"Thai, Khmr, Laoo",
}
m["kdu"] = {
"Kadaru",
35441,
"nub-hil",
"Latn",
}
m["kdv"] = {
"Kado",
7402721,
"sit-luu",
}
m["kdw"] = {
"Koneraw",
11732341,
"ngf-mom",
"Latn",
}
m["kdx"] = {
"Kam",
36753,
"alv-wjk",
}
m["kdy"] = {
"Keder",
6383641,
"paa-tor",
"Latn",
}
m["kdz"] = {
"Kwaja",
11128866,
"nic-nka",
"Latn",
}
m["kea"] = {
"Kabuverdianu",
35963,
"crp",
"Latn",
ancestors = "pt",
}
m["keb"] = {
"Kélé",
35559,
"bnt-kel",
}
m["kec"] = {
"Keiga",
3409311,
"qfa-kad",
"Latn",
}
m["ked"] = {
"Kerewe",
6393846,
"bnt-haj",
}
m["kee"] = {
"Eastern Keres",
15649021,
"nai-ker",
"Latn",
}
m["kef"] = {
"Kpessi",
35748,
"alv-gbe",
}
m["keg"] = {
"Tese",
16887296,
"sdv",
}
m["keh"] = {
"Keak",
6382110,
"paa-nnd",
"Latn",
}
m["kei"] = {
"Kei",
2410352,
"poz-cet",
"Latn",
}
m["kej"] = {
"Kadar",
6345179,
"dra-mal",
}
m["kek"] = {
"Q'eqchi",
35536,
"myn",
"Latn",
}
m["kel"] = {
"Kela-Yela",
6385426,
"bnt-mon",
"Latn",
}
m["kem"] = {
"Kemak",
35549,
"poz-tim",
"Latn",
}
m["ken"] = {
"Kenyang",
35650,
"nic-mam",
"Latn",
}
m["keo"] = {
"Kakwa",
3033547,
"sdv-bri",
}
m["kep"] = {
"Kaikadi",
6347757,
"dra-tam",
}
m["keq"] = {
"Kamar",
14916877,
"inc-hal",
}
m["ker"] = {
"Kera",
56251,
"cdc-est",
"Latn",
}
m["kes"] = {
"Kugbo",
3813394,
"nic-cde",
"Latn",
}
m["ket"] = {
"Ket",
33485,
"qfa-yke",
"Cyrl",
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
sort_key = {
from = {"ӷ", "ё", "ӄ", "ӈ", "ө", "ә", "ʼ"},
to = {"г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "ъ" .. p[1], "ь" .. p[1]}
},
}
m["keu"] = {
"Akebu",
35026,
"alv-ktg",
"Latn",
}
m["kev"] = {
"Kanikkaran",
6363201,
"dra-mal",
"Taml, Mlym",
-- Mlym translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["kew"] = {
"Kewa",
12952619,
"ngf-ank",
"Latn",
}
m["kex"] = {
"Kukna",
5031131,
"inc-bhi",
wikipedia_article = "Dhodia–Kukna language",
}
m["key"] = {
"Kupia",
6445354,
"inc-eas",
}
m["kez"] = {
"Kukele",
3915391,
"nic-ucn",
"Latn",
}
m["kfa"] = {
"Kodava",
33531,
"dra-kod",
"Knda, Mlym",
-- Knda translit in [[Module:scripts/data]]
-- Mlym translit in [[Module:scripts/data]]
}
m["kfb"] = {
"Kolami",
33479,
"dra-knk",
"Deva, Telu",
translit = {
Telu = "te-translit",
},
}
m["kfc"] = {
"Konda-Dora",
35679,
"dra-kki",
"Orya, Telu",
translit = {
Orya = "gon-Orya-translit",
Telu = "te-translit",
},
}
m["kfd"] = {
"Korra Koraga",
12952655,
"dra-kor",
"Knda",
-- Knda translit in [[Module:scripts/data]]
}
m["kfe"] = {
"Kota (India)",
33483,
"dra-tkt",
"Taml",
translit = "ta-translit",
}
m["kff"] = {
"Koya",
33471,
"dra-gon",
"Telu, Orya, Deva, Latn",
}
m["kfg"] = {
"Kudiya",
12952667,
"dra-tlk",
}
m["kfh"] = {
"Kurichiya",
12952676,
"dra-mal",
"Mlym",
-- Mlym translit in [[Module:scripts/data]]
}
m["kfi"] = {
"Kannada Kurumba",
56589,
"dra-sdo",
}
m["kfj"] = {
"Kemiehua",
27144776,
"mkh-pal",
}
m["kfk"] = {
"Kinnauri",
2383208,
"sit-kin",
"Takr, Deva, Latn",
}
m["kfl"] = {
"Kung",
6444510,
"nic-rnc",
"Latn",
}
m["kfn"] = {
"Kuk",
6442398,
"nic-rnc",
"Latn",
}
m["kfo"] = {
"Koro (West Africa)",
11160588,
"dmn-mnk",
"Latn, Nkoo",
}
m["kfp"] = {
"Korwa",
6432786,
"mun",
}
m["kfq"] = {
"Korku",
33715,
"mun",
"Deva",
}
-- Kachchi. Four scripts are listed (Gujr, sd-Arab, Sind, Khoj); a
-- transliteration module is named for three of them, and none for Khoj.
m["kfr"] = {
"Kachchi",
56487,
"inc-snd",
"Gujr, sd-Arab, Sind, Khoj",
translit = {
Gujr = "gu-translit",
Sind = "Sind-translit",
-- Bracketed key because "sd-Arab" contains a hyphen and is not a valid Lua identifier.
["sd-Arab"] = "sd-Arab-translit",
},
strip_diacritics = {
-- One string built by concatenating entries of `c` (m_langdata.chars).
-- NOTE(review): judging by the names these are the Arabic kashida and vowel/
-- gemination marks; the actual characters are defined outside this file.
remove_diacritics = c.kashida .. c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.superalef,
-- Parallel lists: the value built from code point 0x0671 (ARABIC LETTER ALEF
-- WASLA) is paired with the one built from 0x0627 (ARABIC LETTER ALEF).
-- `u` is the on-demand loader declared near the top of this file, so these
-- two calls make it require [[Module:string utilities]] while this table is
-- being constructed.
from = {u(0x0671)},
to = {u(0x0627)}
},
}
m["kfs"] = {
"Bilaspuri",
12953397,
"him",
"Deva, Takr",
translit = "hi-translit",
}
m["kft"] = {
"Kanjari",
12953610,
"inc-pan",
ancestors = "pa",
}
m["kfu"] = {
"Katkari",
6377671,
"inc-sou",
}
m["kfv"] = {
"Kurmukar",
6446193,
"inc-eas",
}
m["kfw"] = {
"Kharam Naga",
12952906,
"tbq-kuk",
}
m["kfx"] = {
"Kullu Pahari",
6443148,
"him",
"Deva",
translit = "hi-translit",
}
m["kfy"] = {
"Kumaoni",
33529,
"inc-pah",
"Deva, Shrd, Takr",
-- Shrd translit in [[Module:scripts/data]] (NOTE: not present before, presumably an accidental omission)
}
m["kfz"] = {
"Koromfé",
35701,
"nic-gur",
"Latn",
}
m["kga"] = {
"Koyaga",
11155632,
"dmn-mnk",
}
m["kgb"] = {
"Kawe",
12952750,
"poz-hce",
"Latn",
}
m["kgd"] = {
"Kataang",
12953622,
"mkh",
}
m["kge"] = {
"Komering",
49224,
"poz-lgx",
"Latn, Arab",
}
m["kgf"] = {
"Kube",
11732359,
"ngf-kto",
"Latn",
}
m["kgg"] = {
"Kusunda",
33630,
"qfa-iso", -- central Nepal
"Latn",
}
m["kgi"] = {
"Selangor Sign Language",
33731,
"sgn",
}
m["kgj"] = {
"Gamale Kham",
22236996,
"sit-kha",
"Deva",
}
m["kgk"] = {
"Kaiwá",
3111883,
"gn",
"Latn",
}
m["kgl"] = {
"Kunggari",
10550184,
"aus-pam",
"Latn",
}
m["kgn"] = {
"Karingani",
6371041,
"xme-ttc",
"fa-Arab, Latn",
ancestors = "xme-ttc-nor",
}
m["kgo"] = {
"Krongo",
6438927,
"qfa-kad",
"Latn",
}
m["kgp"] = {
"Kaingang",
2665734,
"sai-sje",
"Latn",
}
m["kgq"] = {
"Kamoro",
6359001,
"ngf-ask",
"Latn",
}
m["kgr"] = {
"Abun",
56657,
"qfa-iso", -- Papuan; isolate in Ethnologue, Glottolog and Palmer (2018); grouped with West Papuan by Ross (2005)
"Latn",
}
m["kgs"] = {
"Kumbainggar",
3915412,
"aus-pam",
"Latn",
}
m["kgt"] = {
"Somyev",
3913354,
"nic-mmb",
"Latn",
}
m["kgu"] = {
"Kobol",
11732325,
"ngf-omo",
"Latn",
}
m["kgv"] = {
"Karas",
6368621,
"qfa-dis", -- Divergent Papuan language; grouped with Mbaham-Iha by Glottolog to form a (mainland) West Bomberai
-- family, but with Mbaham-Iha and Timor-Alor-Pantar by Wikipedia (following Usher and Schapper 2022)
-- into a (Greater) West Bomberai family.
"Latn",
}
m["kgw"] = {
"Karon Dori",
56817,
"paa-may",
"Latn",
}
m["kgx"] = {
"Kamaru",
12953604,
"poz-wot",
"Latn",
}
m["kgy"] = {
"Kyerung",
12952691,
"sit-kyk",
}
m["kha"] = {
"Khasi",
33584,
"aav-pkl",
"Latn, as-Beng",
}
m["khb"] = {
"Lü",
36948,
"tai-swe",
"Talu, Lana",
translit = {Talu = "Talu-translit"},
strip_diacritics = {remove_diacritics = c.ZWNJ},
sort_key = {
Talu = "Talu-sortkey",
Lana = "Lana-sortkey",
},
}
m["khc"] = {
"North Tukang Besi",
18611555,
"poz",
}
m["khd"] = {
"Bädi Kanum",
20888004,
"paa-ngk",
"Latn",
}
m["khe"] = {
"Korowai",
6432598,
"ngf-bda",
"Latn",
}
m["khf"] = {
"Khuen",
27144893,
"mkh",
}
m["khh"] = {
"Kehu",
10994953,
}
m["khj"] = {
"Kuturmi",
3914490,
"nic-plc",
"Latn",
}
m["khl"] = {
"Lusi",
3267788,
"poz-ocw",
"Latn",
}
m["khn"] = {
"Khandeshi",
33726,
"inc-sou",
}
m["kho"] = {
"Khotanese",
6583551,
"xsc-sak",
"Brah, Khar",
-- Brah translit in [[Module:scripts/data]]
}
m["khp"] = {
"Kapauri",
3502575,
"qfa-dis", -- isolate per Glottolog, possibly Greater Kwerba per Wikipedia in Kapauri-Sause family
"Latn",
}
m["khq"] = {
"Koyra Chiini",
33600,
"son",
"Latn, Arab",
}
m["khr"] = {
"Kharia",
3915562,
"mun",
}
m["khs"] = {
"Kasua",
6374863,
"ngf-bos",
"Latn",
}
m["kht"] = {
"Khamti",
3915502,
"tai-swe",
"Mymr",
display_text = s["kht-displaytext"],
strip_diacritics = s["kht-stripdiacritics"],
}
m["khu"] = {
"Nkhumbi",
11019169,
"bnt-swb",
}
m["khv"] = {
"Khvarshi",
56425,
"cau-wts",
"Cyrl",
translit = "khv-translit",
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["khw"] = {
"Khowar",
938216,
"inc-chi",
"Arab",
strip_diacritics = {
-- character "ۂ" code U+06C2 to "ه" and "هٔ" (U+0647 + U+0654) to "ه"; hamzatu l-waṣli to a regular alif
from = {"هٔ", "ۂ", "ٱ"},
to = {"ہ", "ہ", "ا"},
remove_diacritics = c.fathatan .. c.dammatan .. c.kasratan .. c.fatha .. c.damma .. c.kasra .. c.shadda .. c.sukun .. c.nunghunna .. c.superalef
},
}
m["khx"] = {
"Kanu",
12952571,
"bnt-lgb",
}
m["khy"] = {
"Ekele",
6385549,
"bnt-ske",
"Latn",
}
m["khz"] = {
"Keapara",
12952603,
"poz-ocw",
"Latn",
}
m["kia"] = {
"Kim",
35685,
"alv-kim",
}
m["kib"] = {
"Koalib",
35859,
"alv-hei",
}
m["kic"] = {
"Kickapoo",
20162127,
"alg-sfk",
"Latn",
}
m["kid"] = {
"Koshin",
35632,
"nic-beb",
"Latn",
}
m["kie"] = {
"Kibet",
56893,
}
m["kif"] = {
"Eastern Parbate Kham",
12953022,
"sit-kha",
"Deva",
}
m["kig"] = {
"Kimaama",
11732321,
"paa-kol",
"Latn",
}
m["kih"] = {
"Kilmeri",
6408020,
"paa-bew",
"Latn",
}
m["kii"] = {
"Kitsai",
56627,
"cdd",
"Latn",
}
m["kij"] = {
"Kilivila",
3196601,
"poz-ocw",
"Latn",
}
m["kil"] = {
"Kariya",
3438708,
"cdc-wst",
}
m["kim"] = {
"Tofa",
36848,
"trk-ssb",
"Cyrl",
}
m["kio"] = {
"Kiowa",
56631,
"nai-kta",
"Latn",
}
m["kip"] = {
"Sheshi Kham",
12952622,
"sit-kha",
"Deva",
}
m["kiq"] = {
"Kosadle",
6432994,
"paa-kko",
"Latn",
}
m["kis"] = {
"Kis",
6416362,
"poz-ocw",
"Latn",
}
m["kit"] = {
"Agob",
3332143,
"paa-pah",
"Latn",
}
m["kiv"] = {
"Kimbu",
10997740,
"bnt-tkm",
}
m["kiw"] = {
"Northeast Kiwai",
11732324,
"paa-kiw",
"Latn",
}
m["kix"] = {
"Khiamniungan Naga",
6401546,
"sit-kch",
"Latn",
}
m["kiy"] = {
"Kirikiri",
6415159,
"paa-wlp",
"Latn",
}
m["kiz"] = {
"Kisi",
3912772,
"bnt-bki",
}
m["kja"] = {
"Mlap",
6885683,
"paa-nim",
"Latn",
}
m["kjb"] = {
"Q'anjob'al",
35551,
"myn",
"Latn",
}
m["kjc"] = {
"Coastal Konjo",
3198689,
"poz",
"Latn",
}
m["kjd"] = {
"Southern Kiwai",
11732322,
"paa-kiw",
"Latn",
}
m["kje"] = {
"Kisar",
3197441,
"poz",
"Latn",
}
m["kjg"] = {
"Khmu",
33335,
"mkh",
"Laoo",
ancestors = "mkh-khm-pro",
sort_key = "Laoo-sortkey",
}
m["kjh"] = {
"Khakas",
33575,
"trk-ssb",
"Cyrl",
translit = "kjh-translit",
override_translit = true,
}
m["kji"] = {
"Zabana",
379130,
"poz-ocw",
"Latn",
}
m["kjj"] = {
"Khinalug",
35278,
"cau-nec",
"Cyrl, Latn",
translit = "kjj-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Cyrl = s["cau-Cyrl-stripdiacritics"],
Latn = s["cau-Latn-stripdiacritics"],
},
}
m["kjk"] = {
"Highland Konjo",
3198688,
"poz",
}
m["kjl"] = {
"Western Parbate Kham",
22237017,
"sit-kha",
"Deva",
}
m["kjm"] = {
"Kháng",
6403501,
"mkh-pal",
}
m["kjn"] = {
"Kunjen",
3200468,
"aus-pmn",
"Latn",
}
m["kjo"] = {
"Harijan Kinnauri",
5657463,
"him",
"Takr, Deva",
}
m["kjp"] = {
"Eastern Pwo",
5330390,
"kar",
"Mymr, Leke, Thai",
translit = "kjp-translit",
override_translit = true,
}
m["kjq"] = {
"Western Keres",
12645568,
"nai-ker",
"Latn",
}
m["kjr"] = {
"Kurudu",
12952678,
"poz-hce",
"Latn",
}
m["kjs"] = {
"East Kewa",
20050949,
"ngf-ank",
"Latn",
}
m["kjt"] = {
"Phrae Pwo",
7187991,
"kar",
"Thai",
}
m["kju"] = {
"Kashaya",
3193689,
"nai-pom",
"Latn",
}
m["kjx"] = {
"Ramopa",
56830,
"paa-nbo",
"Latn",
}
m["kjy"] = {
"Erave",
12952416,
"ngf-ank",
"Latn",
}
m["kjz"] = {
"Bumthangkha",
2786408,
"sit-ebo",
"Tibt",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kka"] = {
"Kakanda",
3915342,
"alv-ngb",
}
m["kkb"] = {
"Kwerisa",
56881,
"paa-clp",
"Latn",
}
m["kkc"] = {
"Odoodee",
12952987,
"ngf-est",
"Latn",
}
m["kkd"] = {
"Kinuku",
6414422,
"nic-kau",
}
m["kke"] = {
"Kakabe",
3913966,
"dmn-mok",
"Latn",
}
m["kkf"] = {
"Kalaktang Monpa",
63257089,
"sit-tsk",
"Tibt, Latn, Deva",
override_translit = true,
-- Tibt translit, display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["kkg"] = {
"Mabaka Valley Kalinga",
18753304,
"phi",
}
m["kkh"] = {
"Khün",
3545044,
"tai-swe",
"Lana, Thai",
sort_key = {
Lana = "Lana-sortkey",
Thai = "Thai-sortkey"
},
}
m["kki"] = {
"Kagulu",
12952537,
"bnt-ruv",
"Latn",
}
m["kkj"] = {
"Kako",
35755,
"bnt-kak",
}
m["kkk"] = {
"Kokota",
3198399,
"poz-ocw",
"Latn",
}
m["kkl"] = {
"Kosarek Yale",
6432995,
"ngf-mek",
"Latn",
}
m["kkm"] = {
"Kiong",
6414512,
"nic-ucr",
"Latn",
}
m["kkn"] = {
"Kon Keu",
6428686,
"mkh-pal",
}
m["kko"] = {
"Karko",
35529,
"nub-hil",
}
m["kkp"] = {
"Koko-Bera",
6426699,
"aus-pmn",
"Latn",
}
m["kkq"] = {
"Kaiku",
6347840,
"bnt-kbi",
"Latn",
}
m["kkr"] = {
"Kir-Balar",
3440527,
"cdc-wst",
"Latn",
}
m["kks"] = {
"Kirfi",
56242,
"cdc-wst",
"Latn",
}
m["kkt"] = {
"Koi",
6426194,
"sit-kiw",
}
m["kku"] = {
"Tumi",
3913934,
"nic-kau",
}
m["kkv"] = {
"Kangean",
2071325,
"poz-msa",
"Latn",
}
m["kkw"] = {
"Teke-Kukuya",
36560,
"bnt-tek",
}
m["kkx"] = {
"Kohin",
6425997,
"poz-brw",
}
m["kky"] = {
"Guugu Yimidhirr",
56543,
"aus-pam",
"Latn",
}
m["kkz"] = {
"Kaska",
20823,
"ath-nor",
"Latn",
}
m["kla"] = {
"Klamath-Modoc",
2669248,
"nai-plp",
"Latn",
}
m["klb"] = {
"Kiliwa",
3182593,
"nai-yuc",
"Latn",
}
m["klc"] = {
"Kolbila",
6427122,
"alv-lek",
}
m["kld"] = {
"Gamilaraay",
3111818,
"aus-cww",
"Latn",
}
m["kle"] = {
"Kulung",
6443304,
"sit-kic",
}
m["klf"] = {
"Kendeje",
56895,
}
m["klg"] = {
"Tagakaulu Kalagan",
18756514,
"phi",
"Latn",
}
m["klh"] = {
"Weliki",
7981017,
"ngf-uru",
"Latn",
}
m["kli"] = {
"Kalumpang",
13561407,
"poz",
}
-- Khalaj: family "trk", scripts fa-Arab and Latn, explicit ancestor "klj-arg".
-- The characters to strip are a single string concatenated from entries of
-- `c` (m_langdata.chars), in the order listed.
m["klj"] = {
	"Khalaj",
	33455,
	"trk",
	"fa-Arab, Latn",
	ancestors = "klj-arg",
	strip_diacritics = {
		remove_diacritics = c.kashida
			.. c.fathatan .. c.dammatan .. c.kasratan
			.. c.fatha .. c.damma .. c.kasra
			.. c.shadda .. c.sukun,
	},
}
m["klk"] = {
"Kono (Nigeria)",
6429589,
"nic-kau",
"Latn",
}
m["kll"] = {
"Kagan Kalagan",
18748913,
"phi",
}
m["klm"] = {
"Kolom",
6844970,
"ngf-rai",
"Latn",
}
m["kln"] = {
"Kalenjin",
637228,
"sdv-nma",
"Latn",
}
m["klo"] = {
"Kapya",
6367410,
"nic-ykb",
}
m["klp"] = {
"Kamasa",
6356107,
"ngf-woj",
"Latn",
}
m["klq"] = {
"Rumu",
7379420,
"paa-tki",
"Latn",
}
m["klr"] = {
"Khaling",
56381,
"sit-kiw",
"Deva",
}
m["kls"] = {
"Kalasha",
33416,
"inc-chi",
"Latn, ks-Arab",
}
m["klt"] = {
"Nukna",
7068874,
"ngf-uru",
"Latn",
}
m["klu"] = {
"Klao",
3914866,
"kro-wkr",
}
m["klv"] = {
"Maskelynes",
3297282,
"poz-vnc",
"Latn",
}
m["klw"] = {
"Lindu",
18390055,
"poz-kal",
"Latn",
}
m["klx"] = {
"Koluwawa",
6427954,
"poz-ocw",
"Latn",
}
m["kly"] = {
"Kalao",
6350643,
"poz-wot",
"Latn",
}
m["klz"] = {
"Kabola",
11732258,
"paa-alp",
"Latn",
}
m["kma"] = {
"Konni",
35680,
"nic-buk",
}
m["kmb"] = {
"Kimbundu",
35891,
"bnt-kmb",
"Latn",
}
m["kmc"] = {
"Southern Kam",
35379,
"qfa-kms",
"Latn",
}
m["kmd"] = {
"Madukayang Kalinga",
18753305,
"phi",
}
m["kme"] = {
"Bakole",
35068,
"bnt-kpw",
"Latn",
}
m["kmf"] = {
"Kare (New Guinea)",
11732286,
"ngf-mab",
"Latn",
}
m["kmg"] = {
"Kâte",
3201059,
"ngf-kma",
"Latn",
}
m["kmh"] = {
"Kalam",
12952550,
"ngf-kak",
"Latn",
}
m["kmi"] = {
"Kami",
3915372,
"alv-ngb",
"Latn",
}
m["kmj"] = {
"Kumarbhag Paharia",
3130374,
"dra-mlo",
"Beng, Deva",
}
m["kmk"] = {
"Limos Kalinga",
18753303,
"phi",
"Latn",
}
m["kml"] = {
"Tanudan Kalinga",
18753307,
"phi",
"Latn",
}
m["kmm"] = {
"Kom (India)",
12952647,
"tbq-kuk",
}
m["kmn"] = {
"Awtuw",
3504217,
"paa-sep",
"Latn",
}
m["kmo"] = {
"Kwoma",
11732376,
"paa-sep",
"Latn",
}
m["kmp"] = {
"Gimme",
11152236,
"alv-dur",
}
m["kmq"] = {
"Kwama",
2591184,
"ssa-kom",
}
m["kmr"] = {
"Northern Kurdish",
36163,
"ku",
"Latn, Cyrl, Armn, ku-Arab, Yezi",
translit = {
Cyrl = "kmr-translit",
-- Armn translit in [[Module:scripts/data]]
["ku-Arab"] = "ckb-translit",
},
strip_diacritics = {
Latn = {
remove_diacritics = "'’",
from = {"r̄", "R̄", "ẍ", "Ẍ"},
to = {"rr", "Rr", "x", "X"}
},
},
wikimedia_codes = "ku",
}
m["kms"] = {
"Kamasau",
6356117,
"paa-mar",
"Latn",
}
m["kmt"] = {
"Kemtuik",
6387179,
"paa-nim",
"Latn",
}
m["kmu"] = {
"Kanite",
12952567,
"ngf-kya",
"Latn",
}
m["kmv"] = {
"Karipúna Creole French",
2523999,
"crp",
"Latn",
ancestors = "fr",
sort_key = s["roa-oil-sortkey"],
}
m["kmw"] = {
"Kumu",
6428450,
"bnt-kbi",
"Latn",
}
m["kmx"] = {
"Waboda",
7958705,
"paa-kiw",
"Latn",
}
m["kmy"] = {
"Koma",
35634,
"alv-dur",
}
m["kmz"] = {
"Khorasani Turkish",
35373,
"trk-ogz",
"Arab",
ancestors = "trk-oat",
}
m["kna"] = {
"Kanakuru",
56811,
"cdc-wst",
"Latn",
}
m["knb"] = {
"Lubuagan Kalinga",
12953602,
"phi",
"Latn",
}
m["knd"] = {
"Konda",
11732340,
"ngf-sbh",
"Latn",
}
-- Kankanaey. Only the Latn script is listed, and every setting below is keyed
-- by that script code.
m["kne"] = {
"Kankanaey",
18753329,
"phi",
"Latn",
strip_diacritics = {
Latn = {
-- Concatenation of four entries of `c` (m_langdata.chars): grave, acute,
-- circ and diaer.
remove_diacritics = c.grave .. c.acute .. c.circ .. c.diaer,
}
},
sort_key = {
-- A name rather than an inline from/to table.
-- NOTE(review): presumably the sort-key module shared with "tl" -- confirm.
Latn = "tl-sortkey",
},
standard_chars = {
-- Upper/lower-case pairs for the letters A B K D E G H I L M N O P R S T U W Y,
-- followed by c.punc.
Latn = "AaBbKkDdEeGgHhIiLlMmNnOoPpRrSsTtUuWwYy" .. c.punc,
},
}
m["knf"] = {
"Mankanya",
35789,
"alv-pap",
"Latn",
}
m["kni"] = {
"Kanufi",
3913297,
"nic-nin",
"Latn",
}
m["knj"] = {
"Akatek",
34923,
"myn",
"Latn",
}
m["knk"] = {
"Kuranko",
3198896,
"dmn-mok",
"Latn",
}
m["knl"] = {
"Keninjal",
6389309,
"poz-mly",
"Latn",
}
m["knm"] = { -- two unrelated lects have this name; this is the Katukinian one
"Kanamari",
3438373,
"sai-ktk",
"Latn",
}
m["kno"] = {
"Kono (Sierra Leone)",
35675,
"dmn-vak",
"Latn",
}
m["knp"] = {
"Kwanja",
35641,
"nic-mmb",
"Latn",
}
m["knq"] = {
"Kintaq",
6414335,
"mkh-asl",
}
m["knr"] = {
"Kaningra",
6363253,
"paa-sep",
"Latn",
}
m["kns"] = {
"Kensiu",
6391529,
"mkh-asl",
}
m["knt"] = {
"Katukina",
3194265,
"sai-pan",
"Latn",
}
m["knu"] = { -- a dialect of 'kpe'
"Kono (Guinea)",
3198703,
"dmn-msw",
"Latn, Kpel",
ancestors = "kpe",
}
m["knv"] = {
"Tabo",
7959888,
"aav",
}
m["knx"] = {
"Kendayan",
6388963,
"poz-mly",
"Latn",
}
m["kny"] = {
"Kanyok",
11110766,
"bnt-lub",
"Latn",
}
m["knz"] = {
"Kalamsé",
3914000,
"nic-gnn",
}
m["koa"] = {
"Konomala",
3198732,
"poz-ocw",
"Latn",
}
m["koc"] = {
"Kpati",
3913279,
"nic-nge",
"Latn",
}
m["kod"] = {
"Kodi",
4577633,
"poz-cet",
"Latn",
}
m["koe"] = {
"Kacipo-Balesi",
5364424,
"sdv",
}
m["kof"] = {
"Kubi",
3438718,
"cdc-wst",
"Latn",
}
m["kog"] = {
"Cogui",
3198286,
"cba",
"Latn",
}
m["koh"] = {
"Koyo",
35649,
"bnt-mbo",
"Latn",
}
-- Komi-Permyak. The family field is "kv" and the transliteration module name
-- carries the same "kv" prefix rather than this record's own code.
m["koi"] = {
"Komi-Permyak",
56318,
"kv",
"Cyrl",
translit = "kv-translit",
-- Names c.acute (an entry of m_langdata.chars) as the character to remove.
strip_diacritics = {remove_diacritics = c.acute},
-- NOTE(review): the effect of this flag is defined by the consumer in
-- [[Module:languages]]; presumably it forces the automatic transliteration to
-- take precedence over a manually supplied one -- confirm.
override_translit = true,
}
m["kok"] = {
"Konkani",
34239,
"inc-sou",
"Deva, Knda, Mlym, fa-Arab, Latn",
translit = {
Deva = "mr-translit",
},
-- Knda translit in [[Module:scripts/data]]
-- Mlym translit in [[Module:scripts/data]]
strip_diacritics = {
-- FIXME: Separate out the scripts
from = {"च़", "ज़", "झ़", "ಚ಼", "ಜ಼", "ಝ಼"},
to = {"च", "ज", "झ", "ಚ", "ಜ", "ಝ"}
} ,
}
m["kol"] = {
"Kol (New Guinea)",
4227542,
}
m["koo"] = {
"Konzo",
2361829,
"bnt-glb",
"Latn",
}
m["kop"] = {
"Waube",
11732373,
"ngf-nur",
"Latn",
}
m["koq"] = {
"Kota (Gabon)",
35607,
"bnt-kel",
"Latn",
}
m["kos"] = {
"Kosraean",
33464,
"poz-mic",
"Latn",
}
m["kot"] = {
"Lagwan",
3502264,
"cdc-cbm",
"Latn",
}
m["kou"] = {
"Koke",
797249,
"alv-bua",
}
m["kov"] = {
"Kudu-Camo",
3915850,
"nic-jer",
}
m["kow"] = {
"Kugama",
3913307,
"alv-mye",
}
m["koy"] = {
"Koyukon",
28304,
"ath-nor",
"Latn",
}
m["koz"] = {
"Korak",
6431365,
"ngf-kow",
"Latn",
}
m["kpa"] = {
"Kutto",
3437656,
"cdc-wst",
}
m["kpb"] = {
"Mullu Kurumba",
19573111,
"dra-mal",
}
m["kpc"] = {
"Curripaco",
2882543,
"awd-nwk",
"Latn",
}
m["kpd"] = {
"Koba",
6424249,
"poz",
}
m["kpe"] = {
"Kpelle",
35673,
"dmn-msw",
"Latn, Kpel",
}
m["kpf"] = {
"Komba",
6428239,
"ngf-kab",
"Latn",
}
m["kpg"] = {
"Kapingamarangi",
35771,
"poz-pnp",
"Latn",
}
m["kph"] = {
"Kplang",
35628,
"alv-gng",
}
m["kpi"] = {
"Kofei",
6425665,
"paa-egb",
"Latn",
}
m["kpj"] = {
"Karajá",
10322066,
"sai-mje",
"Latn",
}
m["kpk"] = {
"Kpan",
3915380,
"nic-jkn",
"Latn",
}
m["kpl"] = {
"Kpala",
11154769,
"nic-nkk",
"Latn",
}
m["kpm"] = {
"Koho",
3511919,
"mkh-ban",
"Latn",
}
m["kpn"] = {
"Kepkiriwát",
3195366,
"tup",
"Latn",
}
m["kpo"] = {
"Ikposo",
35029,
"alv-ktg",
"Latn",
}
m["kpq"] = {
"Korupun-Sela",
6432769,
"ngf-mek",
"Latn",
}
m["kpr"] = {
"Korafe-Yegha",
11732347,
"ngf-gko",
"Latn",
}
m["kps"] = {
"Tehit",
7694851,
"paa-wbh",
"Latn",
}
m["kpt"] = {
"Karata",
56636,
"cau-and",
"Cyrl",
translit = "kpt-translit",
override_translit = true,
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kpu"] = {
"Kafoa",
6346151,
"paa-alp",
"Latn",
}
m["kpv"] = {
"Komi-Zyrian",
34114,
"kv",
"Cyrl",
translit = "kv-translit",
override_translit = true,
wikimedia_codes = "kv",
}
m["kpw"] = {
"Kobon",
11732326,
"ngf-kak",
"Latn",
}
m["kpx"] = {
"Mountain Koiari",
6925030,
"ngf-koi",
"Latn",
}
m["kpy"] = {
"Koryak",
36199,
"qfa-ckn",
"Cyrl",
strip_diacritics = {
from = {"['’]"},
to = {"ʼ"}
},
sort_key = {
from = {"вʼ", "гʼ", "ё", "ӄ", "ӈ"},
to = {"в" .. p[1], "г" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1]}
},
translit = "kpy-translit",
}
m["kpz"] = {
"Kupsabiny",
56445,
"sdv-kln",
}
m["kqa"] = {
"Mum",
6935252,
"ngf-nso",
"Latn",
}
m["kqb"] = {
"Kovai",
6434822,
"ngf-ehu",
"Latn",
}
m["kqc"] = {
"Doromu-Koki",
5298175,
"paa-man",
"Latn",
}
m["kqd"] = {
"Koy Sanjaq Surat",
33463,
"sem-nna",
}
m["kqe"] = {
"Kalagan",
18748906,
"phi",
"Latn",
}
m["kqf"] = {
"Kakabai",
6349119,
"poz-ocw",
"Latn",
}
m["kqg"] = {
"Khe",
3914015,
"nic-gur",
}
m["kqh"] = {
"Kisankasa",
6416409,
"sdv",
}
m["kqi"] = {
"Koitabu",
6426363,
"ngf-koi",
"Latn",
}
m["kqj"] = {
"Koromira",
6432520,
"paa-sbo",
"Latn",
}
m["kqk"] = {
"Kotafon Gbe",
12952447,
"alv-pph",
}
m["kql"] = {
"Kyenele",
11732453,
"paa-yua",
"Latn",
}
m["kqm"] = {
"Khisa",
3913955,
"nic-gur",
}
m["kqn"] = {
"Kaonde",
33601,
"bnt-lub",
"Latn",
}
m["kqo"] = {
"Eastern Krahn",
3915374,
"kro-wee",
}
m["kqp"] = {
"Kimré",
3441210,
"cdc-est",
}
m["kqq"] = {
"Krenak",
6436747,
"sai-cer",
}
m["kqr"] = {
"Kimaragang",
3196845,
"poz-san",
"Latn",
}
m["kqs"] = {
"Northern Kissi",
19921576,
"alv-kis",
}
m["kqt"] = {
"Klias River Kadazan",
12953594,
"poz-san",
}
m["kqu"] = {
"Seroa",
33127766,
"khi-tuu",
}
m["kqv"] = {
"Okolod",
7082487,
"poz-san",
}
m["kqw"] = {
"Kandas",
3192590,
"poz-ocw",
"Latn",
}
m["kqx"] = {
"Mser",
3502347,
"cdc-cbm",
}
m["kqy"] = {
"Koorete",
6430753,
"omv-eom",
"Ethi, Latn",
}
m["kqz"] = {
"Korana",
2756709,
"khi-khk",
"Latn",
}
m["kra"] = {
"Kumhali",
13580783,
"inc-bih",
}
m["krb"] = {
"Karkin",
3193345,
"nai-utn",
"Latn",
}
m["krc"] = {
"Karachay-Balkar",
33714,
"trk-kcu",
"Cyrl",
translit = "krc-translit",
sort_key = {
from = {"гъ", "дж", "ё", "къ", "нг"},
to = {"г" .. p[1], "д" .. p[1], "е" .. p[1], "к" .. p[1], "н" .. p[1]}
},
}
m["krd"] = {
"Kairui-Midiki",
12953277,
"poz-tim",
}
m["kre"] = {
"Panará",
3361895,
"sai-cer",
"Latn",
}
m["krf"] = {
"Koro (Vanuatu)",
3198995,
"poz-vnn",
"Latn",
}
m["krh"] = {
"Kurama",
35593,
"nic-kau",
}
-- Krio. Listed under the family code "crp" with an explicitly named ancestor
-- ("en").
m["kri"] = {
"Krio",
35744,
"crp",
"Latn",
ancestors = "en",
-- Concatenation of three entries of `c` (m_langdata.chars): grave, acute, circ.
strip_diacritics = {remove_diacritics = c.grave .. c.acute .. c.circ},
sort_key = {
-- Parallel lists, paired by position: each `from` item maps to a base letter
-- followed by p[1] (the first entry of m_langdata.puaChars).
-- NOTE(review): presumably this sorts each item immediately after its base
-- letter and treats the digraphs "gb" and "kp" as single letters -- confirm
-- against the sort-key handling in [[Module:languages]].
from = {"ɛ", "gb", "kp", "ɔ"},
to = {"e" .. p[1], "g" .. p[1], "k" .. p[1], "o" .. p[1]}
},
}
m["krj"] = {
"Kinaray-a",
33720,
"phi",
"Latn",
}
m["krk"] = {
"Kerek",
332792,
"qfa-ckn",
"Cyrl",
}
m["krl"] = {
"Karelian",
33557,
"urj-fin",
"Latn",
sort_key = {
from = {
"č", "š", "ž", "ü", "ä", "ö", -- 2 chars
"z", "'" -- 1 char
},
to = {
"c" .. p[1], "s" .. p[1], "s" .. p[3], "y" .. p[1], "y" .. p[2], "y" .. p[3],
"s" .. p[2], "y" .. p[4],
}
},
}
m["krm"] = {
"Krim",
35713,
"alv",
}
m["krn"] = {
"Sapo",
3915386,
"kro-wee",
}
m["krp"] = {
"Korop",
35626,
"nic-ucr",
"Latn",
}
m["krr"] = {
"Kru'ng",
12953650,
"mkh-ban",
}
m["krs"] = {
"Kresh",
56674,
"csu-bkr",
}
m["kru"] = {
"Kurux",
33492,
"dra-kml",
"Deva, Tols",
translit = {
Deva = "hi-translit",
},
}
m["krv"] = {
"Kavet",
12953649,
"sai-ktk",
"Latn",
}
m["krw"] = {
"Western Krahn",
10975611,
"kro-wee",
}
m["krx"] = {
"Karon",
35704,
"alv-jol",
}
m["kry"] = {
"Kryts",
35861,
"cau-ssm",
"Latn, Cyrl",
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {
Latn = s["cau-Latn-stripdiacritics"],
Cyrl = s["cau-Cyrl-stripdiacritics"],
},
}
m["krz"] = {
"Sota Kanum",
12952568,
"paa-kan",
"Latn",
}
m["ksa"] = {
"Shuwa-Zamani",
3913929,
"nic-kau",
}
m["ksb"] = {
"Shambala",
3788739,
"bnt-seu",
"Latn",
}
m["ksc"] = {
"Southern Kalinga",
18753301,
"phi",
}
m["ksd"] = {
"Tolai",
35870,
"poz-ocw",
"Latn",
}
m["kse"] = {
"Kuni",
6444619,
"poz-ocw",
"Latn",
}
m["ksf"] = {
"Bafia",
34930,
"bnt-baf",
"Latn",
}
m["ksg"] = {
"Kusaghe",
3200638,
"poz-ocw",
"Latn",
}
m["ksi"] = {
"Krisa",
841704,
"paa-sko",
"Latn",
}
m["ksj"] = {
"Uare",
6450052,
"paa-kwa",
"Latn",
}
m["ksk"] = {
"Kansa",
3192772,
"sio-dhe",
"Latn",
}
m["ksl"] = {
"Kumalu",
17584381,
"poz-ocw",
"Latn",
}
m["ksm"] = {
"Kumba",
3913972,
"alv-mye",
}
m["ksn"] = {
"Kasiguranin",
6374525,
"phi",
}
m["kso"] = {
"Kofa",
56278,
"cdc-cbm",
}
m["ksp"] = {
"Kaba",
3915316,
"csu-sar",
}
m["ksq"] = {
"Kwaami",
3440525,
"cdc-wst",
}
m["ksr"] = {
"Borong",
4946263,
"ngf-kbm",
"Latn",
}
m["kss"] = {
"Southern Kissi",
11028974,
"alv-kis",
}
m["kst"] = {
"Winyé",
3913360,
"nic-gnw",
}
m["ksu"] = {
"Khamyang",
6583541,
"tai-swe",
}
m["ksv"] = {
"Kusu",
6448199,
"bnt-tet",
}
m["ksw"] = {
"S'gaw Karen",
56410,
"kar",
"Mymr",
translit = "ksw-translit",
}
m["ksx"] = {
"Kedang",
6382520,
"poz",
"Latn",
}
m["ksy"] = {
"Kharia Thar",
6400661,
"inc-eas",
}
m["ksz"] = {
"Kodaku",
21179986,
"mun",
}
m["kta"] = {
"Katua",
6378404,
"mkh-ban",
}
m["ktb"] = {
"Kambaata",
35664,
"cus-hec",
"Latn",
}
m["ktc"] = {
"Kholok",
3440464,
"cdc-wst",
}
m["ktd"] = {
"Kokata",
10547021,
"aus-pam",
"Latn",
}
m["ktf"] = {
"Kwami",
12952687,
"bnt-lgb",
}
m["ktg"] = {
"Kalkatungu",
3914057,
"aus-pam",
"Latn",
}
m["kth"] = {
"Karanga",
713643,
}
m["kti"] = {
"North Muyu",
20857698,
"ngf-lok",
"Latn",
}
m["ktj"] = {
"Plapo Krumen",
10975356,
"kro-grb",
}
m["ktk"] = {
"Kaniet",
3399050,
"poz-aay",
"Latn",
}
m["ktl"] = {
"Koroshi",
3775265,
"ira-nwi",
ancestors = "bal",
}
m["ktm"] = {
"Kurti",
3200615,
"poz-aay",
"Latn",
}
m["ktn"] = {
"Karitiâna",
3112184,
"tup",
"Latn",
}
m["kto"] = {
"Kuot",
56537,
}
m["ktp"] = {
"Kaduo",
769809,
"tbq-bka",
}
m["ktq"] = {
"Katabaga",
3193895,
}
m["ktr"] = {
"Kota Marudu Tinagas",
18642280,
}
m["kts"] = {
"South Muyu",
42308820,
"ngf-lok",
"Latn",
}
m["ktt"] = {
"Ketum",
12952616,
"ngf-dum",
"Latn",
}
m["ktu"] = {
"Kituba",
35746,
"crp",
"Latn",
ancestors = "kg",
}
m["ktv"] = {
"Eastern Katu",
22808951,
"mkh-kat",
"Latn",
}
m["ktw"] = {
"Kato",
20831,
"ath-pco",
"Latn",
}
m["ktx"] = {
"Kaxararí",
6380124,
"sai-pan",
"Latn",
}
m["kty"] = {
"Kango",
6362818,
"bnt-bta",
"Latn",
}
m["ktz"] = {
"Juǀ'hoan",
1192295,
"khi-kxa",
"Latn",
}
m["kub"] = {
"Kutep",
35645,
"nic-jkn",
}
m["kuc"] = {
"Kwinsu",
6450460,
"paa-tor",
"Latn",
}
m["kud"] = {
"Auhelawa",
5166,
"poz-ocw",
"Latn",
}
m["kue"] = {
"Kuman",
137525,
"ngf-sim",
"Latn",
}
m["kuf"] = {
"Western Katu",
6378400,
"mkh-kat",
"Laoo, Tale, Latn",
}
m["kug"] = {
"Kupa",
3915336,
"alv-ngb",
}
m["kuh"] = {
"Kushi",
3438747,
"cdc-wst",
}
m["kui"] = {
"Kuikúro",
3915522,
"sai-kui",
"Latn",
}
m["kuj"] = {
"Kuria",
6445968,
"bnt-lok",
"Latn",
}
m["kuk"] = {
"Kepo'",
6393217,
"poz",
}
m["kul"] = {
"Kulere",
3440506,
"cdc-wst",
}
-- Kumyk: Cyrillic-script entry; transliteration is delegated to "kum-translit".
m["kum"] = {
"Kumyk",
36209,
"trk-kcu",
"Cyrl",
translit = "kum-translit",
-- Sort-key rewrite rules; `from` and `to` are parallel lists (rule i maps
-- from[i] to to[i]). Each digraph (and ё) becomes its base letter followed by
-- an entry of `p`. "гь" uses p[2] rather than p[1] so that it stays distinct
-- from "гъ", which shares the base letter "г".
-- NOTE(review): `p` is presumably m_langdata.puaChars (private-use
-- placeholders), which would make each sequence collate right after its base
-- letter — confirm against this module's header and the sort-key consumer.
sort_key = {
from = {"гъ", "гь", "ё", "къ", "нг", "оь", "уь"},
to = {"г" .. p[1], "г" .. p[2], "е" .. p[1], "к" .. p[1], "н" .. p[1], "о" .. p[1], "у" .. p[1]}
},
}
m["kun"] = {
"Kunama",
36041,
}
m["kuo"] = {
"Kumukio",
11732362,
"ngf-dal",
"Latn",
}
m["kup"] = {
"Kunimaipa",
6444696,
"paa-kun",
"Latn",
}
m["kuq"] = {
"Karipuna",
6371071,
"tup-gua",
"Latn",
}
m["kus"] = {
"Kusaal",
35708,
"nic-dag",
"Latn",
}
m["kut"] = {
"Ktunaxa",
33434,
"qfa-iso",
"Latn",
}
m["kuu"] = {
"Upper Kuskokwim",
28062,
"ath-nor",
"Latn",
}
m["kuv"] = {
"Kur",
12635082,
"poz-cma",
"Latn",
}
m["kuw"] = {
"Kpagua",
11137573,
"bad-cnt",
}
m["kux"] = {
"Kukatja",
10549839,
"aus-pam",
"Latn",
}
m["kuy"] = {
"Kuuku-Ya'u",
10550697,
"aus-pmn",
"Latn",
}
m["kuz"] = {
"Kunza",
2669181,
"qfa-iso",
"Latn",
}
-- Bagvalal: Cyrillic-script entry that reuses shared settings instead of
-- defining its own rules.
m["kva"] = {
"Bagvalal",
56638,
"cau-and",
"Cyrl",
translit = "cau-nec-translit",
-- NOTE(review): presumably tells the consumer to prefer the automatic
-- transliteration over a manually supplied one — confirm in Module:languages.
override_translit = true,
-- Both settings are keyed by script code (only Cyrl here) and looked up in
-- the table `s` under the "cau-Cyrl-..." keys.
-- NOTE(review): `s` is presumably m_langdata.shared — confirm in this
-- module's header.
display_text = {Cyrl = s["cau-Cyrl-displaytext"]},
strip_diacritics = {Cyrl = s["cau-Cyrl-stripdiacritics"]},
}
m["kvb"] = {
"Kubu",
6441341,
"poz-mly",
}
m["kvc"] = {
"Kove",
3199402,
"poz-ocw",
"Latn",
}
m["kvd"] = {
"Kui (Indonesia)",
6442230,
"paa-alp",
"Latn",
}
m["kve"] = {
"Kalabakan",
6350003,
"poz-san",
"Latn",
}
m["kvf"] = {
"Kabalai",
3440427,
"cdc-est",
}
m["kvg"] = {
"Kuni-Boazi",
2907551,
"paa-boa",
"Latn",
}
m["kvh"] = {
"Komodo",
3198565,
"poz-cet",
"Latn",
}
m["kvi"] = {
"Kwang",
3440398,
"cdc-est",
"Latn",
}
m["kvj"] = {
"Psikye",
56304,
"cdc-cbm",
}
m["kvk"] = {
"Korean Sign Language",
3073428,
"sgn-jsl",
}
m["kvl"] = {
"Brek Karen",
12952577,
"kar",
}
m["kvm"] = {
"Kendem",
35751,
"nic-mam",
"Latn",
}
m["kvn"] = {
"Border Kuna",
31777873,
"cba",
}
m["kvo"] = {
"Dobel",
5286559,
"poz",
"Latn",
}
m["kvp"] = {
"Kompane",
18343041,
"poz",
}
m["kvq"] = {
"Geba Karen",
12952581,
"kar",
"Latn, Mymr",
}
m["kvr"] = {
"Kerinci",
3195442,
"poz-mly",
"Latn, Arab", -- Also Incung, which we don't have
}
m["kvt"] = {
"Lahta Karen",
12952582,
"kar",
}
m["kvu"] = {
"Yinbaw Karen",
14426328,
"kar",
}
m["kvv"] = {
"Kola",
6426967,
"poz",
"Latn",
}
m["kvw"] = {
"Wersing",
7983599,
"paa-alp",
"Latn",
}
m["kvx"] = {
"Parkari Koli",
3244176,
"inc-wes",
}
m["kvy"] = {
"Yintale Karen",
14426329,
"kar",
}
m["kvz"] = {
"Tsakwambo",
7849438,
"ngf-kts",
"Latn",
}
m["kwa"] = {
"Dâw",
3042278,
"sai-nad",
"Latn",
}
m["kwb"] = {
"Baa",
34842,
"alv-ada",
}
m["kwc"] = {
"Likwala",
35597,
"bnt-mbo",
}
m["kwd"] = {
"Kwaio",
3200796,
"poz-sls",
"Latn",
}
m["kwe"] = {
"Kwerba",
6450328,
"paa-kwe",
"Latn",
}
m["kwf"] = {
"Kwara'ae",
3200829,
"poz-sls",
"Latn",
}
m["kwg"] = {
"Sara Kaba Deme",
3915384,
"csu-kab",
}
m["kwh"] = {
"Kowiai",
6435028,
"poz",
"Latn",
}
m["kwi"] = {
"Awa-Cuaiquer",
2603103,
"sai-bar",
"Latn",
}
m["kwj"] = {
"Kwanga",
3438383,
"paa-sep",
"Latn",
}
m["kwk"] = {
"Kwak'wala",
2640628,
"wak",
"Latn",
}
m["kwl"] = {
"Kofyar",
3441382,
"cdc-wst",
"Latn",
}
m["kwm"] = {
"Kwambi",
3487165,
"bnt-ova",
}
m["kwn"] = {
"Kwangali",
36334,
"bnt-kav",
"Latn",
}
m["kwo"] = {
"Kwomtari",
3508116,
"paa-kwo",
"Latn",
}
m["kwp"] = {
"Kodia",
3914867,
"kro-ekr",
}
m["kwq"] = {
"Kwak",
11014183,
"nic-nka",
ancestors = "yam",
}
m["kwr"] = {
"Kwer",
12635137,
"ngf-wok",
"Latn",
}
m["kws"] = {
"Kwese",
3200846,
"bnt-pen",
}
m["kwt"] = {
"Kwesten",
6450354,
"paa-tor",
"Latn",
}
m["kwu"] = {
"Kwakum",
35624,
"bnt-kak",
}
m["kwv"] = {
"Sara Kaba Náà",
3915361,
"csu-kab",
"Latn",
}
-- Kwinti: Latin-script entry in family "crp" with "en" recorded as its
-- ancestor. The last field carries a trailing comma like every other
-- multi-line record here, so appending a field later cannot cause a syntax
-- error from a missing separator.
m["kww"] = {
"Kwinti",
721182,
"crp",
"Latn",
ancestors = "en",
}
m["kwx"] = {
"Khirwar",
12976968,
"dra",
}
m["kwz"] = {
"Kwadi",
2364661,
"khi-kkw",
"Latn",
}
m["kxa"] = {
"Kairiru",
3398785,
"poz-ocw",
"Latn",
}
m["kxb"] = {
"Krobu",
35586,
"alv-ptn",
"Latn",
}
m["kxc"] = {
"Konso",
56624,
"cus-eas",
"Ethi, Latn",
}
m["kxd"] = {
"Brunei Malay",
3182878,
"poz-mly",
"Latn, ms-Arab",
}
m["kxe"] = {
"Kakihum",
3914433,
"nic-kam",
ancestors = "tvd",
}
m["kxf"] = {
"Manumanaw Karen",
12952592,
"kar",
"Mymr, Latn",
}
m["kxh"] = {
"Karo",
3447116,
"omv-aro",
}
m["kxi"] = {
"Keningau Murut",
6389308,
"poz-san",
"Latn",
}
m["kxj"] = {
"Kulfa",
713654,
"csu-kab",
}
m["kxk"] = {
"Zayein Karen",
14352960,
"kar",
}
-- Nepali Kurux [kxl] treated as part of Kurux [kru], consistent with ISO merger in 2020
-- Northern Khmer: lists two scripts ("Thai, Khmr") and has "xhm" as ancestor.
m["kxm"] = {
"Northern Khmer",
3502234,
"mkh-kmr",
"Thai, Khmr",
ancestors = "xhm",
-- Sort-key rewrite rules; `from` and `to` are parallel lists (rule i maps
-- from[i] to to[i]):
--   1. "[%pๆ]" -> ""  : drop punctuation (%p) and the character ๆ.
--   2. "[็-๎]" -> ""  : drop every character in the range ็ .. ๎.
--   3. "([เแโใไ])([ก-ฮ])" -> "%2%1" : swap one of the vowels เ แ โ ใ ไ with
--      the following character from the range ก .. ฮ.
-- NOTE(review): the rules are not keyed by script, so presumably they also
-- run on Khmr text, where only the punctuation part of rule 1 could match —
-- confirm against the sort-key consumer.
sort_key = {
from = {"[%pๆ]", "[็-๎]", "([เแโใไ])([ก-ฮ])"},
to = {"", "", "%2%1"}
},
}
m["kxn"] = {
"Kanowit",
6364300,
"poz-bnn",
"Latn",
}
m["kxo"] = {
"Kanoé",
4356223,
"qfa-iso",
"Latn",
}
m["kxp"] = {
"Wadiyara Koli",
12953645,
"inc-wes",
}
m["kxq"] = {
"Smärky Kanum",
12952569,
"paa-kan",
"Latn",
}
m["kxr"] = {
"Manus Koro",
3198994,
"poz-aay",
"Latn",
}
m["kxs"] = {
"Kangjia",
3182570,
"xgn-shr",
"Latn",
}
m["kxt"] = {
"Koiwat",
6426388,
"paa-nnd",
"Latn",
}
-- Kui (India): Orya-script entry.
m["kxu"] = {
"Kui (India)",
33919,
"dra-kki",
"Orya",
-- NOTE(review): this is the transliteration module named after Kuvi (kxv),
-- not kxu. It looks deliberate, since both entries use Orya with nearly
-- identical rules — confirm.
translit = "kxv-translit",
-- Diacritic stripping: "୕" is removed outright, then the parallel
-- `from`/`to` lists (rule i maps from[i] to to[i]) collapse a doubled
-- independent vowel, or a vowel sign followed by the matching independent
-- vowel, into a single letter or sign.
-- Unlike the kxv entry, there is no rule for a consonant followed by ଆ.
strip_diacritics = {
remove_diacritics = "୕",
from = {"ଆଆ", "ଇଇ", "ଉଉ", "ଏଏ", "ଓଓ", "ିଇ", "ୁଉ", "େଏ", "ୋଓ"},
to = {"ଆ", "ଈ", "ଊ", "ଏ", "ଓ", "ୀ", "ୂ", "େ", "ୋ"},
},
}
-- Kuvi: Orya-script entry; transliteration is delegated to "kxv-translit".
m["kxv"] = {
"Kuvi",
3200721,
"dra-kki",
"Orya",
translit = "kxv-translit",
-- Diacritic stripping: "୕" is removed outright, then the parallel
-- `from`/`to` lists (rule i maps from[i] to to[i]) collapse a doubled
-- independent vowel, or a vowel sign followed by the matching independent
-- vowel, into a single letter or sign.
-- Rule 6 is the one addition over the kxu entry: a character in the range
-- କ .. ହ followed by the independent vowel ଆ is rewritten as that character
-- (capture %1) followed by the vowel sign ା.
strip_diacritics = {
remove_diacritics = "୕",
from = {"ଆଆ", "ଇଇ", "ଉଉ", "ଏଏ", "ଓଓ", "([କ-ହ])ଆ", "ିଇ", "ୁଉ", "େଏ", "ୋଓ"},
to = {"ଆ", "ଈ", "ଊ", "ଏ", "ଓ", "%1ା", "ୀ", "ୂ", "େ", "ୋ"},
},
}
m["kxw"] = {
"Konai",
11732339,
"ngf-est",
"Latn",
}
m["kxx"] = {
"Likuba",
35646,
"bnt-bmo",
}
m["kxy"] = {
"Kayong",
6380673,
"mkh",
}
m["kxz"] = {
"Kerewo",
6393847,
"paa-kiw",
"Latn",
}
m["kya"] = {
"Kwaya",
6450276,
"bnt-haj",
"Latn",
}
m["kyb"] = {
"Butbut Kalinga",
18753300,
"phi",
"Latn",
}
m["kyc"] = {
"Kyaka",
12952690,
"ngf-enc",
"Latn",
}
m["kyd"] = {
"Karey",
6370196,
"poz",
}
m["kye"] = {
"Krache",
35658,
"alv-gng",
}
m["kyf"] = {
"Kouya",
35595,
"kro-bet",
}
m["kyg"] = {
"Keyagana",
6398208,
"ngf-kya",
"Latn",
}
m["kyh"] = {
"Karok",
1288440,
"qfa-iso", -- or Hokan?
"Latn",
}
m["kyi"] = {
"Kiput",
3038653,
"poz-swa",
"Latn",
}
m["kyj"] = {
"Karao",
3192950,
"phi",
"Latn",
}
m["kyk"] = {
"Kamayo",
3192339,
"phi",
"Latn",
}
m["kyl"] = {
"Kalapuya",
3192120,
"nai-klp",
}
m["kym"] = {
"Kpatili",
3913982,
"znd",
}
m["kyn"] = {
"Karolanos",
6373093,
"phi",
}
m["kyo"] = {
"Kelon",
6386414,
"paa-alp",
"Latn",
}
m["kyp"] = {
"Kang",
25559558,
"tai",
}
m["kyq"] = {
"Kenga",
35707,
"csu-bgr",
}
m["kyr"] = {
"Kuruáya",
3200633,
"tup",
"Latn",
}
m["kys"] = {
"Baram Kayan",
2883794,
"poz",
"Latn",
}
m["kyt"] = {
"Kayagar",
6380394,
"paa-kay",
"Latn",
}
-- Western Kayah: lists three scripts ("Kali, Mymr, Latn").
m["kyu"] = {
"Western Kayah",
12952596,
"kar",
"Kali, Mymr, Latn",
-- Transliteration is keyed by script code: only Kali is given a module
-- ("Kali-translit"); no entry is defined here for Mymr or Latn.
translit = {Kali = "Kali-translit"},
}
m["kyv"] = {
"Kayort",
6380675,
"inc-krd",
"Deva",
}
m["kyw"] = {
"Kudmali",
6446173,
"inc-bih",
"Deva, as-Beng, Orya, Chis",
}
m["kyx"] = {
"Rapoisi",
7294279,
"paa-nbo",
"Latn",
}
m["kyy"] = {
"Kambaira",
6356254,
"ngf-kai",
"Latn",
}
m["kyz"] = {
"Kayabí",
6380372,
"tup-gua",
"Latn",
}
m["kza"] = {
"Western Karaboro",
36601,
"alv-krb",
}
m["kzb"] = {
"Kaibobo",
6347565,
"poz-cma",
}
m["kzc"] = {
"Bondoukou Kulango",
11031321,
"alv-kul",
"Latn",
}
m["kzd"] = {
"Kadai",
7679471,
"poz-cma",
"Latn",
}
--kze (Kosena) made an etym-only child of auy (Auyana) per [[Wiktionary:Language_treatment_requests#merge_Kosena_[kze]_into_Auyana_[auy]]]
m["kzf"] = {
"Da'a Kaili",
33103997,
"poz-kal",
"Latn",
}
-- Kikai: Jpan-script entry in family "jpx-nry". It defines no rules of its
-- own; all four text-processing settings below come from the "jpx-..."
-- entries of the table `s`.
-- NOTE(review): `s` is presumably m_langdata.shared — confirm in this
-- module's header.
m["kzg"] = {
"Kikai",
3196527,
"jpx-nry",
"Jpan",
translit = s["jpx-translit"],
display_text = s["jpx-displaytext"],
strip_diacritics = s["jpx-stripdiacritics"],
sort_key = s["jpx-sortkey"],
}
m["kzh"] = {
"Dongolawi",
5295991,
"nub",
"Latn",
}
m["kzi"] = {
"Kelabit",
6385445,
"poz-swa",
"Latn",
}
m["kzj"] = {
"Coastal Kadazan",
3307195,
"poz-san",
"Latn",
}
m["kzk"] = {
"Kazukuru",
1089069,
"poz-ocw",
}
m["kzl"] = {
"Kayeli",
4207444,
"poz-cma",
"Latn",
}
m["kzm"] = {
"Kais",
6348319,
"ngf-sbh",
"Latn",
}
m["kzn"] = {
"Kokola",
11128329,
"bnt-mak",
"Latn",
ancestors = "vmw",
}
m["kzo"] = {
"Kaningi",
35683,
"bnt-mbt",
}
m["kzp"] = {
"Kaidipang",
6347611,
"phi",
"Latn",
}
m["kzq"] = {
"Kaike",
10951226,
"sit-tam",
}
m["kzr"] = {
"Karang",
35681,
"alv-mbm",
"Latn",
}
m["kzs"] = {
"Sugut Dusun",
12953510,
"poz-san",
"Latn",
}
m["kzt"] = {
"Tambunan Dusun",
12953514,
"poz-san",
"Latn",
}
m["kzu"] = {
"Kayupulau",
6380723,
"poz-ocw",
}
m["kzv"] = {
"Komyandaret",
6428671,
"ngf-kts",
"Latn",
}
m["kzw"] = { -- contrast xoo, sai-kat, sai-xoc, the last of which the ISO conflated into this code
"Kariri",
12953620,
"sai-mje",
"Latn",
}
m["kzx"] = {
"Kamarian",
6356040,
"poz-cma",
"Latn",
}
m["kzy"] = {
"Kango-Sua",
11008360,
"bnt-kbi",
"Latn",
ancestors = "bip",
}
m["kzz"] = {
"Kalabra",
6350038,
"paa-wbh",
"Latn",
}
return require("Module:languages").finalizeData(m, "language")
cde9rgm4ot172eeyv0u4lv3su75yy5w
ප්රවර්ගය:යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත
14
115376
234769
191650
2026-05-24T02:19:34Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:යෙදුම්, Macedonian පරිවර්තන සහිත]] සිට [[ප්රවර්ගය:යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
171852
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Terms with Macedonian translations]]
7n7u4sphx54qa370jd689xmz2zu2w7s
ප්රවර්ගය:German Low German
14
117307
234822
179700
2026-05-24T08:04:46Z
Lee
19
Lee විසින් [[ප්රවර්ගය:German Low German භාෂාව]] සිට [[ප්රවර්ගය:German Low German]] වෙත පිටුව ගෙන යන ලදී
179700
wikitext
text/x-wiki
{{auto cat|Germany|setsister=Low Saxon}}
[[en:Category:German Low German language]]
qmcsu2ytj2cmqywx6pd740804cv2p4x
234827
234822
2026-05-24T08:08:33Z
Lee
19
234827
wikitext
text/x-wiki
{{auto cat|lect=1}}
[[en:Category:German Low German language]]
1o224sqhswipna7kzbf2hlskp4n2vu9
Module:etymology languages/canonical names
828
137335
234831
228621
2026-05-17T18:28:59Z
en>Theknightwho
0
[[MediaWiki:UpdateLanguageNameAndCode.js|updated]]
234831
Scribunto
text/plain
return {
["ALUPEC Kabuverdianu"] = "kea-alu",
["Abhiri"] = "pra-abh",
["Abron"] = "abr",
["Abuzeydabadi"] = "xme-abz",
["Abyanehi"] = "xme-aby",
["Acadian French"] = "fr-aca",
["Achaemenid Elamite"] = "elx-ach",
["Achterhoeks"] = "act",
["Adamawa Fulfulde"] = "fub",
["Addu Dhivehi"] = "dv-add",
["Aeolic Greek"] = "grc-aeo",
["Afghan Uzbek"] = "uz-afg",
["African Romance"] = "la-afr",
["Afridi"] = "ps-afr",
["Akhmimic Coptic"] = "cop-akh",
["Akuapem Twi"] = "tw-aku",
["Aleppine North Levantine Arabic"] = "apc-ale",
["Alsatian Alemannic German"] = "gsw-FR-als",
["Amdo Tibetan"] = "adx",
["American English"] = "en-US",
["Amorehi"] = "xme-amo",
["Ampezan Ladin"] = "lld-amp",
["Amrum North Frisian"] = "frr-amr",
["Anaraki"] = "xme-ana",
["Anatri Chuvash"] = "cv-ana",
["Anbarani"] = "tly-anb",
["Angkorian Old Khmer"] = "okz-ang",
["Anglian Old English"] = "ang-ang",
["Anglo-Norman"] = "xno",
["Anxi Hokkien"] = "nan-anx",
["Aquitanian"] = "xaq",
["Aranese"] = "oc-ara",
["Arbëresh Albanian"] = "aae",
["Arcadian Greek"] = "grc-arc",
["Arcadocypriot Greek"] = "grc-arp",
["Ardestani"] = "xme-ard",
["Ardhamagadhi Prakrit"] = "pra-ard",
["Arghu"] = "klj-arg",
["Armeno-Kipchak"] = "qwm-arm",
["Arvanitika Albanian"] = "aat",
["Asalemi"] = "tly-asa",
["Asante Twi"] = "tw-asa",
["Ashtiani"] = "atn",
["Attic Greek"] = "grc-att",
["Australian Aboriginal English"] = "en-aae",
["Australian English"] = "en-AU",
["Austrian German"] = "de-AT",
["Auvergnat"] = "oc-auv",
["Avahattha"] = "inc-aav",
["Avanti"] = "pra-ava",
["Ayutthaya Old Thai"] = "th-ayu",
["Azerbaijani Talysh"] = "tly-aze",
["Badiot Ladin"] = "lld-bad",
["Badrudi"] = "xme-bdr",
["Bagirmi Fulfulde"] = "fui",
["Bahliki"] = "pra-bah",
["Bajui"] = "sgh-baj",
["Baltic German"] = "de-bal",
["Bandari"] = "bsg-ban",
["Bangash"] = "ps-bng",
["Bannu"] = "ps-ban",
["Barlavento Kabuverdianu"] = "kea-bar",
["Barpetia Kamrupi Assamese"] = "as-bkm",
["Bartangi"] = "sgh-bar",
["Bartangi-Oroshori"] = "sgh-bro",
["Beijing Mandarin"] = "cmn-bei",
["Beijingic Mandarin"] = "cmn-bec",
["Belgian Dutch"] = "nl-BE",
["Besemah"] = "pse-bsm",
["Betawi Kota"] = "bew-kot",
["Bhaca"] = "xh-bha",
["Biblical Aramaic"] = "arc-bib",
["Biblical Hebrew"] = "hbo",
["Bidhandi"] = "xme-bid",
["Bijagani"] = "xme-bij",
["Boa Vista Kabuverdianu"] = "kea-bvi",
["Boeotian Greek"] = "grc-boi",
["Bohairic Coptic"] = "cop-boh",
["Bolivian Spanish"] = "es-BO",
["Bombay Hindi"] = "hi-mum",
["Borana"] = "gax",
["Borgu Fulfulde"] = "fue",
["Borujerdi"] = "xme-bor",
["Brahmanic Sanskrit"] = "sa-bra",
["Brava Kabuverdianu"] = "kea-bra",
["Brazilian Portuguese"] = "pt-BR",
["British English"] = "en-GB",
["Buddhist Hybrid Sanskrit"] = "sa-bhs",
["Burenjani"] = "fay-bur",
["Bushehri"] = "fay-bsh",
["Byzantine Greek"] = "gkm",
["Cadorino Ladin"] = "lld-cad",
["Cajun French"] = "frc",
["California English"] = "en-US-CA",
["Camorta"] = "ncb-cam",
["Campidanese"] = "sc-sro",
["Canadian English"] = "en-CA",
["Canadian French"] = "fr-CA",
["Canadian Ukrainian"] = "uk-CA",
["Candali"] = "pra-can",
["Capenate"] = "xfa-cap",
["Central Ghilzay"] = "ps-cgi",
["Central Korean"] = "ko-cen",
["Central Plains Mandarin"] = "cmn-cep",
["Central Talysh"] = "tly-cen",
["Central Tati"] = "xme-ttc-cen",
["Central-Eastern Niger Fulfulde"] = "fuq",
["Chakavian Serbo-Croatian"] = "ckm",
["Chakhar Mongolian"] = "mn-cha",
["Chali Tati"] = "tks-cal",
["Changtai Hokkien"] = "nan-cha",
["Chilean Spanish"] = "es-CL",
["Chimehi"] = "xme-cim",
["Christian Palestinian Aramaic"] = "arc-cpa",
["Chungcheong Korean"] = "ko-chu",
["Ci"] = "lzh-cii",
["Cisalpine Gaulish"] = "xcg",
["Classical Azerbaijani"] = "az-cls",
["Classical Cantonese"] = "lzh-yue",
["Classical Japanese"] = "ja-cla",
["Classical Latin"] = "la-cla",
["Classical Malay"] = "ms-cla",
["Classical Mandarin"] = "lzh-cmn",
["Classical Persian"] = "fa-cls",
["Classical Sanskrit"] = "cls",
["Classical Tagalog"] = "tl-cls",
["Classical Taishanese"] = "lzh-tai",
["Classical Taiwanese Mandarin"] = "lzh-cmn-TW",
["Colombian Spanish"] = "es-CO",
["Common Bantu"] = "bnt-cmn",
["Contemporary Latin"] = "la-con",
["Coptic Dialect G"] = "cop-ggg",
["Coptic Dialect J"] = "cop-jjj",
["Coptic Dialect K"] = "cop-kkk",
["Coptic Dialect P"] = "cop-ppp",
["Cretan Ancient Greek"] = "grc-kre",
["Cretan Greek"] = "el-crt",
["Cuban Spanish"] = "es-CU",
["Cuman"] = "qwm-cum",
["Cypriot Ancient Greek"] = "grc-cyp",
["Cypriot Greek"] = "el-cyp",
["Cypriot Turkish"] = "tr-CY",
["Dabu Hakka"] = "hak-dab",
["Daksinatya"] = "pra-dak",
["Damascene North Levantine Arabic"] = "apc-dam",
["Danesfani"] = "tks-dan",
["Danube Bulgar"] = "xbo-dan",
["Danzhou Chinese"] = "zhx-dan",
["Dari"] = "prs",
["Dashtaki"] = "fay-dsh",
["Davani"] = "fay-dav",
["Delijani"] = "xme-del",
["Dhakaiya Vaṅga Bengali"] = "bn-dvn",
["Digor Ossetian"] = "os-dig",
["Dnieper Baltic"] = "bat-dni",
["Dobrujan Tatar"] = "crh-dbj",
["Doric Greek"] = "grc-dor",
["Dramili"] = "pra-dra",
["Drents"] = "drt",
["Dutch Low Saxon"] = "nds-nl",
["Early Brythonic"] = "bry-ear",
["Early Mandarin"] = "cmn-ear",
["Early Medieval Latin"] = "la-eme",
["Early Middle Chinese"] = "ltc-ear",
["Early Middle Japanese"] = "ja-mid-ear",
["Early Middle Korean"] = "okm-ear",
["Early Middle Mongol"] = "xng-ear",
["Early Middle Persian"] = "pal-ear",
["Early Modern Czech"] = "cs-ear",
["Early Modern English"] = "en-ear",
["Early Modern Hakka"] = "hak-eam",
["Early Modern Japanese"] = "ja-ear",
["Early Modern Spanish"] = "es-ear",
["Early New High German"] = "de-ear",
["Early New Persian"] = "fa-ear",
["Early Old Chinese"] = "och-ear",
["Early Old Ossetic"] = "oos-ear",
["Early Old Persian"] = "peo-ear",
["Early Scots"] = "enm-esc",
["Early Sogdian"] = "sog-ear",
["East Frisian Low German"] = "frs",
["East Midland Middle English"] = "enm-emi",
["Eastern Armenian"] = "hye",
["Eastern Balochi"] = "bgp",
["Eastern Mansi"] = "mns-eas",
["Eastern Old Japanese"] = "ojp-eas",
["Eastern Tati"] = "xme-ttc-eas",
["Ebrahimabadi"] = "tks-ebr",
["Ecclesiastical Latin"] = "la-ecc",
["Elean Greek"] = "grc-ela",
["Emamzada Esmaili"] = "fay-eze",
["Epic Greek"] = "grc-epi",
["Epic Sanskrit"] = "sa-epi",
["Esfarvarini"] = "tks-esf",
["European Portuguese"] = "pt-PT",
["Fante Akan"] = "fat",
["Farizandi"] = "xme-far",
["Fascian Ladin"] = "lld-fas",
["Fayyumic Coptic"] = "cop-fay",
["Fodom Ladin"] = "lld-fod",
["Fogo Kabuverdianu"] = "kea-fog",
["Fornes Ladin"] = "lld-for",
["Frankish"] = "frk",
["Fumani"] = "tly-fum",
["Fuyu Kyrgyz"] = "kjh-fyu",
["Föhr North Frisian"] = "frr-foh",
["Föhr-Amrum North Frisian"] = "frr-fam",
["Gangwon Korean"] = "ko-gan",
["Gascon"] = "oc-gas",
["Gavkoshaki"] = "fay-gav",
["Gazi"] = "gzi",
["Geordie"] = "en-geo",
["German Low German"] = "nds-de",
["Ghat"] = "thv-ght",
["Gheg Albanian"] = "aln",
["Gherdëina Ladin"] = "lld-ghe",
["Goesharde North Frisian"] = "frr-goe",
["Golyad"] = "bat-gol",
["Goral"] = "pl-gor",
["Greater Polish"] = "pl-gre",
["Greenlandic Norse"] = "non-grn",
["Gronings"] = "gos",
["Guangzhou Cantonese"] = "yue-gua",
["Guanzhong Mandarin"] = "cmn-gua",
["Guernsey Norman"] = "nrf-grn",
["Guilin Mandarin"] = "cmn-gui",
["Gurjara Apabhramsa"] = "inc-agu",
["Gyeonggi Korean"] = "ko-gyg",
["Gyeongsang Korean"] = "ko-gys",
["Hailu Hakka"] = "hak-hai",
["Halligen North Frisian"] = "frr-hal",
["Hamadani"] = "xme-ham",
["Hamgyong Korean"] = "ko-ham",
["Hangzhounese"] = "wuu-han",
["Hanjani"] = "xme-han",
["Hanyu Pinyin"] = "cmn-pinyin",
["Harar Oromo"] = "hae",
["Hatran Aramaic"] = "arc-hat",
["Havigannada"] = "kn-hav",
["Hazaragi"] = "haz",
["Heligoland North Frisian"] = "frr-hel",
["Helu Prakrit"] = "pra-hel",
["Hengyang Xiang"] = "hsn-hya",
["Hengzhou Xiang"] = "hsn-hzh",
["Hermopolitan Coptic"] = "cop-her",
["High Alemannic German"] = "gsw-hig",
["Highest Alemannic German"] = "gsw-hst",
["Hokkaido Ainu"] = "ain-hok",
["Hong Kong Cantonese"] = "yue-HK",
["Hong Kong English"] = "en-HK",
["Hong Kong Hakka"] = "hak-HK",
["Hormozi"] = "bsg-hor",
["Houlu Min"] = "nan-hou",
["Hui'an Hokkien"] = "nan-hui",
["Huiyang Hakka"] = "hak-hui",
["Huvadhu Dhivehi"] = "dv-huv",
["Hwanghae Korean"] = "ko-hwa",
["Imperial Aramaic"] = "arc-imp",
["Indian English"] = "en-IN",
["Insular North Frisian"] = "frr-ins",
["Insular Scots"] = "sco-ins",
["Ionic Greek"] = "grc-ion",
["Iranian Persian"] = "fa-ira",
["Irish English"] = "en-IE",
["Iron Ossetian"] = "os-iro",
["Isfahani"] = "xme-isf",
["Israeli Hebrew"] = "he-IL",
["Jadrani"] = "ps-jad",
["Jeolla Korean"] = "ko-jeo",
["Jersey Norman"] = "nrf-jer",
["Jewish Babylonian Aramaic"] = "tmr",
["Jewish Literary Aramaic"] = "arc-jla",
["Jewish Palestinian Aramaic"] = "jpa",
["Jianghuai Mandarin"] = "cmn-jhu",
["Jinjiang Hokkien"] = "nan-jin",
["Jirofti"] = "rdb-jir",
["Jowshaqani"] = "xme-jow",
["Judeo-Arabic"] = "jrb",
["Kafroni"] = "xme-kaf",
["Kahaki"] = "xme-kah",
["Kahnuji"] = "rdb-kah",
["Kajkavian Serbo-Croatian"] = "kjv",
["Kakari"] = "ps-kak",
["Kaliarda"] = "el-kal",
["Kamviri"] = "xvi",
["Kandahari"] = "ps-kan",
["Kaniguram"] = "oru-kan",
["Karganrudi"] = "tly-kar",
["Karrharde North Frisian"] = "frr-kar",
["Kashani"] = "xme-kas",
["Kasmiri Apabhramsa"] = "inc-aka",
["Katchal"] = "ncb-kat",
["Katharevousa"] = "el-kth",
["Kathiyawadi"] = "gu-kat",
["Kativiri"] = "bsh-kat",
["Kentish Middle English"] = "enm-ken",
["Kentish Old English"] = "ang-ken",
["Kermani"] = "xme-krm",
["Kesehi"] = "xme-kes",
["Khalkha Mongolian"] = "mn-kha",
["Khamba"] = "kbg",
["Khams Tibetan"] = "khg",
["Khargi"] = "fay-kar",
["Khasa Prakrit"] = "pra-kha",
["Khatak"] = "ps-xat",
["Khiaraji"] = "tks-xia",
["Khollari"] = "fay-kho",
["Khorchin Mongolian"] = "mn-khr",
["Khoznini"] = "tks-xoz",
["Khufi"] = "sgh-xuf",
["Khughni"] = "sgh-xug",
["Khughni-Bajui"] = "sgh-xgb",
["Khunsari"] = "kfm",
["Khuri"] = "xme-xur",
["Khuzestani Arabic"] = "acm-khu",
["Kinmenese Hokkien"] = "nan-kin",
["Kinyarwanda"] = "rw-kin",
["Kirundi"] = "rw-run",
["Koine Greek"] = "grc-koi",
["Komjani"] = "xme-kom",
["Kondazi"] = "fay-kon",
["Korean Classical Chinese"] = "lzh-KO",
["Kosena"] = "kze",
["Kromanti"] = "alv-kro",
["Kundagannada"] = "kn-kun",
["Kuril Ainu"] = "ain-kur",
["Kölsch"] = "ksh",
["Languedocien"] = "oc-lan",
["Lanuvian"] = "itc-lan",
["Lanyin Mandarin"] = "cmn-lan",
["Late Babylonian"] = "akk-lbb",
["Late Brythonic"] = "bry-lat",
["Late Egyptian"] = "egy-lat",
["Late Khotanese"] = "kho-lat",
["Late Latin"] = "la-lat",
["Late Middle Chinese"] = "ltc-lat",
["Late Middle Japanese"] = "ja-mid-lat",
["Late Middle Mongol"] = "xng-lat",
["Late Middle Persian"] = "pal-lat",
["Late Old Chinese"] = "och-lat",
["Late Old Korean"] = "oko-lat",
["Late Old Ossetic"] = "oos-lat",
["Late Old Persian"] = "peo-lat",
["Late Old Swedish"] = "gmq-osw-lat",
["Late Sogdian"] = "sog-lat",
["Law French"] = "xno-law",
["Lebanese North Levantine Arabic"] = "apc-leb",
["Lesser Polish"] = "pl-les",
["Limousin"] = "oc-lim",
["Lisan ud-Dawat Gujarati"] = "gu-lda",
["Literary Cantonese"] = "yue-lit",
["Literary Chinese"] = "lzh-lit",
["Logar"] = "oru-log",
["Logudorese"] = "sc-src",
["Lombardic"] = "lng",
["Loudi Xiang"] = "hsn-lou",
["Louisiana French"] = "fr-lou",
["Low Alemannic German"] = "gsw-low",
["Low Prussian"] = "nds-lpr",
["Lucanian"] = "osc-luc",
["Lunfardo"] = "es-lun",
["Lycopolitan Coptic"] = "cop-lyc",
["Língua Geral Amazônica"] = "tpw-lga",
["Língua Geral Paulista"] = "tpw-lgp",
["Maasina Fulfulde"] = "ffm",
["Magadhi Prakrit"] = "pra-mag",
["Mahallati"] = "xme-mah",
["Maharastri Apabhramsa"] = "inc-ama",
["Maharastri Prakrit"] = "pra-mah",
["Mahsudi"] = "ps-mah",
["Mainland North Frisian"] = "frr-mai",
["Maio Kabuverdianu"] = "kea-mai",
["Malaysian Huiyang Hakka"] = "hak-hui-MY",
["Malaysian Mandarin"] = "cmn-MY",
["Mamluk-Kipchak"] = "qwm-mam",
["Manichaean Middle Persian"] = "xmn",
["Manx English"] = "en-IM",
["Masali"] = "tly-msa",
["Masarami"] = "fay-mas",
["Masovian Polish"] = "pl-mas",
["Masulei"] = "tly-msu",
["Medan Hokkien"] = "nan-med",
["Medieval Hebrew"] = "he-med",
["Medieval Latin"] = "la-med",
["Medieval Sinhalese"] = "si-med",
["Medieval Tashelhit"] = "shi-med",
["Meixian Hakka"] = "hak-mei",
["Mercian Old English"] = "ang-mer",
["Mexican Spanish"] = "es-MX",
["Meymehi"] = "xme-mey",
["Middle Assyrian"] = "akk-mas",
["Middle Babylonian"] = "akk-mbb",
["Middle Belarusian"] = "zle-mbe",
["Middle Bulgarian"] = "cu-bgm",
["Middle Chuvash"] = "cv-mid",
["Middle Egyptian"] = "egy-mid",
["Middle Elamite"] = "elx-mid",
["Middle Georgian"] = "ka-mid",
["Middle Hindi"] = "hi-mid",
["Middle Japanese"] = "ja-mid",
["Middle Konkani"] = "kok-mid",
["Middle Polish"] = "zlw-mpl",
["Middle Russian"] = "zle-mru",
["Middle Tamil"] = "ta-mid",
["Middle Ukrainian"] = "zle-muk",
["Minabi"] = "bsg-min",
["Mishnaic Hebrew"] = "he-mis",
["Missouri French"] = "fr-mis",
["Mitanni"] = "inc-mit",
["Moldovan"] = "ro-MD",
["Mooring North Frisian"] = "frr-moo",
["Mulaku Dhivehi"] = "dv-mul",
["Mumviri"] = "bsh-mum",
["Nabataean Aramaic"] = "arc-nab",
["Nalbaria Kamrupi Assamese"] = "as-nkm",
["Nancowry"] = "ncb-nan",
["Nanjing Mandarin"] = "cmn-nan",
["Naraqi"] = "xme-nar",
["Nashalji"] = "xme-nas",
["Natanzi"] = "ntz",
["Nayini"] = "nyq",
["Neo-Assyrian"] = "akk-nas",
["Neo-Babylonian"] = "akk-nbb",
["Neo-Elamite"] = "elx-neo",
["Neo-Middle Egyptian"] = "egy-nmi",
["New Latin"] = "la-new",
["New Sanskrit"] = "sa-neo",
["New Xiang"] = "hsn-new",
["New Zealand English"] = "en-NZ",
["Nigerian Fulfulde"] = "fuv",
["Ningbonese"] = "wuu-nin",
["Noakhailla Vaṅga Bengali"] = "bn-nvn",
["Nones Ladin"] = "lld-non",
["North Alaskan Inupiatun"] = "esi",
["North American English"] = "en-NNN",
["North Karelian"] = "krl-nor",
["North Lebanese North Levantine Arabic"] = "apc-nle",
["North Wales Welsh"] = "cy-nor",
["Northeastern Mandarin"] = "cmn-noe",
["Northeastern Pashto"] = "ps-nea",
["Northern Irish English"] = "en-GB-NIR",
["Northern Kankanaey"] = "xnn",
["Northern Lushootseed"] = "lut-nor",
["Northern Middle English"] = "enm-nor",
["Northern Scots"] = "sco-nor",
["Northern Talysh"] = "tly-nor",
["Northern Tati"] = "xme-ttc-nor",
["Northern Wu"] = "wuu-nor",
["Northumbrian Old English"] = "ang-nor",
["Northwest Alaskan Inupiatun"] = "esk",
["Northwestern Pashto"] = "ps-nwe",
["Nuorese"] = "sc-nuo",
["Nushabadi"] = "xme-nus",
["Odri"] = "pra-odr",
["Old Akkadian"] = "akk-old",
["Old Aramaic"] = "arc-old",
["Old Assyrian"] = "akk-oas",
["Old Avestan"] = "ae-old",
["Old Azari"] = "xme-azr",
["Old Babylonian"] = "akk-obb",
["Old Braj"] = "bra-old",
["Old Chuvash"] = "cv-old",
["Old Coptic"] = "cop-old",
["Old Dhivehi"] = "dv-old",
["Old East Norse"] = "non-oen",
["Old Egyptian"] = "egy-old",
["Old Elamite"] = "elx-old",
["Old Emilian"] = "egl-old",
["Old Franco-Provençal"] = "frp-old",
["Old Friulian"] = "fur-old",
["Old Italian"] = "roa-oit",
["Old Kazeruni"] = "fay-kzo",
["Old Khotanese"] = "kho-old",
["Old Kirghiz"] = "otk-kir",
["Old Konkani"] = "kok-old",
["Old Latin"] = "itc-ola",
["Old Ligurian"] = "lij-old",
["Old Lombard"] = "lmo-old",
["Old Malay"] = "ms-old",
["Old Mohawk"] = "iro-omo",
["Old Neapolitan"] = "nap-old",
["Old Northern French"] = "fro-nor",
["Old Onondaga"] = "iro-oon",
["Old Ossetic"] = "oos",
["Old Piedmontese"] = "pms-old",
["Old Provençal"] = "oc-pro-old",
["Old Pskovian"] = "zle-ops",
["Old Romagnol"] = "rgn-old",
["Old Romansh"] = "rm-old",
["Old Sardinian"] = "sc-old",
["Old Shirazi"] = "fay-sho",
["Old Sicilian"] = "scn-old",
["Old Tagalog"] = "tl-old",
["Old Thai"] = "th-old",
["Old Venetan"] = "vec-old",
["Old Wendat"] = "iro-ohu",
["Old West Norse"] = "non-own",
["Old Xiang"] = "hsn-old",
["Ontenu"] = "ont",
["Opuntian Locrian"] = "grc-opl",
["Ordos Mongolian"] = "mn-ord",
["Orkhon Turkic"] = "otk-ork",
["Orma"] = "orc",
["Oroshori"] = "sgh-oro",
["Oxyrhynchite Coptic"] = "cop-oxy",
["Ozolian Locrian"] = "grc-ozl",
["Paisaci Prakrit"] = "pra-pai",
["Palasbaria Kamrupi Assamese"] = "as-pkm",
["Palatine German"] = "pfl",
["Paleo-Balkan"] = "qsb-bal",
["Paleo-Hispanic"] = "qsb-ibe",
["Palladius"] = "cmn-palladius",
["Palmyrene Aramaic"] = "arc-pal",
["Pamphylian Greek"] = "grc-pam",
["Paphian Greek"] = "el-pap",
["Papuni"] = "fay-pap",
["Penang Hokkien"] = "nan-pen",
["Peruvian Spanish"] = "es-PE",
["Peshawari"] = "ps-pes",
["Philippine Hokkien"] = "nan-hbl-PH",
["Philippine Mandarin"] = "cmn-PH",
["Philippine Spanish"] = "es-PH",
["Picard Old French"] = "fro-pic",
["Polari"] = "pld",
["Postal Romanization"] = "zh-postal",
["Pracya"] = "pra-pra",
["Praenestine"] = "itc-pra",
["Pre-Angkorian Old Khmer"] = "okz-pre",
["Pre-Classical Chinese"] = "lzh-pre",
["Pre-Greek"] = "qsb-grc",
["Proto-Anglo-Frisian"] = "gmw-afr-pro",
["Proto-Arinic"] = "qfa-yrn-pro",
["Proto-Baltic"] = "bat-pro",
["Proto-Bulgar"] = "trk-bul-pro",
["Proto-Common Turkic"] = "trk-cmn-pro",
["Proto-Finno-Permic"] = "urj-fpr-pro",
["Proto-Finno-Ugric"] = "fiu-pro",
["Proto-Ketic"] = "qfa-yke-pro",
["Proto-Kottic"] = "qfa-yko-pro",
["Proto-Lycopolitan Coptic"] = "cop-ply",
["Proto-Middle Indo-Aryan"] = "inc-ash-pro",
["Proto-New Indo-Aryan"] = "pra-pro",
["Proto-North Sea Germanic"] = "gmw-nsg-pro",
["Proto-Oghur"] = "trk-ogr-pro",
["Proto-Oghuz"] = "trk-ogz-pro",
["Proto-Pumpokolic"] = "qfa-ypm-pro",
["Proto-Romance"] = "roa-pro",
["Proto-Tibeto-Burman"] = "tbq-pro",
["Provençal"] = "oc-pro",
["Puerto Rican Spanish"] = "es-PR",
["Pulaar"] = "fuc",
["Pular"] = "fuf",
["Puter Romansh"] = "rm-put",
["Pyongan Korean"] = "ko-pyo",
["Qalhari"] = "xme-qal",
["Qashqai"] = "qxq",
["Qianlu Min"] = "nan-qia",
["Qohrudi"] = "xme-qoh",
["Quanzhou Hokkien"] = "nan-qua",
["Renaissance Latin"] = "la-ren",
["Rigvedic Sanskrit"] = "sa-rig",
["Rioplatense Spanish"] = "es-AR",
["Roshani"] = "sgh-ros",
["Roshani-Khufi"] = "sgh-rsx",
["Rumantsch Grischun"] = "rm-gri",
["Russian Church Slavonic"] = "zls-chs-ru",
["Sabari"] = "pra-sab",
["Sagzabadi"] = "tks-sag",
["Sahidic Coptic"] = "cop-sah",
["Saint Dominican Creole French"] = "ht-sdm",
["Sakari"] = "pra-sak",
["Sakhalin Ainu"] = "ain-sak",
["Sal Kabuverdianu"] = "kea-sal",
["Sallands"] = "sdz",
["Samghani"] = "fay-sam",
["Samnite"] = "osc-sam",
["Santiago Kabuverdianu"] = "kea-san",
["Santo Antão Kabuverdianu"] = "kea-saa",
["Sauraseni Apabhramsa"] = "inc-asa",
["Sauraseni Prakrit"] = "pra-sau",
["Scottish English"] = "en-GB-SCT",
["Sedehi"] = "xme-sed",
["Shadi Wu"] = "wuu-chm",
["Shandarmani"] = "tly-san",
["Shanghainese"] = "wuu-sha",
["Shangsi Zhuang"] = "tai-shz",
["Sher"] = "ps-ser",
["Shirazi"] = "fay-shr",
["Shuadit"] = "oc-jud",
["Silesian East Central German"] = "sli",
["Singapore Hokkien"] = "nan-hbl-SG",
["Singapore Mandarin"] = "cmn-SG",
["Sixian Hakka"] = "hak-six",
["Skagit"] = "ska",
["Snohomish"] = "sno",
["Soi"] = "soj",
["Sorkhi"] = "fay-sor",
["Sotavento Kabuverdianu"] = "kea-sot",
["South African English"] = "en-ZA",
["South Karelian"] = "krl-sou",
["South Lebanese North Levantine Arabic"] = "apc-sle",
["South Wales Welsh"] = "cy-sou",
["Southeastern Pashto"] = "ps-sea",
["Southern Balochi"] = "bcc",
["Southern Lushootseed"] = "slh",
["Southern Malaysian Hokkien"] = "nan-spm",
["Southern Middle English"] = "enm-sou",
["Southern Scots"] = "sco-sou",
["Southern Talysh"] = "tly-sou",
["Southern Tati"] = "xme-ttc-sou",
["Southwestern Mandarin"] = "cmn-sow",
["Southwestern Pashto"] = "ps-swe",
["Standard Babylonian"] = "akk-stb",
["Stellingwerfs"] = "stl",
["Suevic"] = "gem-sue",
["Sukhothai Old Thai"] = "th-suk",
["Surmiran Romansh"] = "rm-srm",
["Sursilvan Romansh"] = "rm-srs",
["Sutsilvan Romansh"] = "rm-sut",
["Suzhounese"] = "wuu-suz",
["Swiss French"] = "fr-CH",
["Switzerland German"] = "de-CH",
["Switzerland Italian"] = "it-CH",
["Sylt North Frisian"] = "frr-syl",
["Syrian North Levantine Arabic"] = "apc-syr",
["São Nicolau Kabuverdianu"] = "kea-sni",
["São Vicente Kabuverdianu"] = "kea-svi",
["Taiwanese Hakka"] = "hak-TW",
["Taiwanese Hokkien"] = "nan-hbl-TW",
["Taiwanese Mandarin"] = "cmn-TW",
["Takestani"] = "tks-tak",
["Takka Apabhramsa"] = "inc-ata",
["Taleshdulabi"] = "tly-tal",
["Tamahaq"] = "thv",
["Tamasheq"] = "taq",
["Tarehi"] = "xme-trh",
["Tari"] = "xme-tar",
["Tawellemmet"] = "ttq",
["Tayert"] = "thz",
["Thessalian Greek"] = "grc-ths",
["Tianjin Mandarin"] = "cmn-tia",
["Tong'an Hokkien"] = "nan-ton",
["Tongyong Pinyin"] = "cmn-tongyong",
["Torlakian Serbo-Croatian"] = "sh-tor",
["Tosk Albanian"] = "als",
["Traditional Chinese poetry"] = "lzh-shi",
["Transalpine Gaulish"] = "xtg",
["Tseku"] = "tsk",
["Tularudi"] = "tly-tul",
["Twents"] = "twd",
["Twi Akan"] = "tw",
["Ukrainian Church Slavonic"] = "zls-chs-uk",
["Ulster English"] = "en-uls",
["Ulster Scots"] = "sco-uls",
["United States Spanish"] = "es-US",
["Upper Saxon German"] = "sxu",
["Vafsi"] = "vaf",
["Valencian"] = "ca-val",
["Vallader Romansh"] = "rm-val",
["Valujerdi"] = "xme-val",
["Varani"] = "xme-var",
["Varzenehi"] = "xme-vrz",
["Vedic Sanskrit"] = "vsn",
["Veluws"] = "vel",
["Venezuelan Spanish"] = "es-VE",
["Viennese German"] = "de-AT-vie",
["Vietnamese Classical Chinese"] = "lzh-VI",
["Viryal Chuvash"] = "cv-vir",
["Vivaro-Alpine"] = "oc-viv",
["Volga Bulgar"] = "xbo-vol",
["Vonishuni"] = "xme-von",
["Vracada Apabhramsa"] = "inc-avr",
["Vulgar Latin"] = "la-vul",
["Waata"] = "ssn",
["Wade–Giles"] = "cmn-wadegiles",
["Walser German"] = "wae",
["Wasa"] = "wss",
["Waziri"] = "ps-waz",
["Welsh English"] = "en-GB-WLS",
["Wenzhounese"] = "wuu-wen",
["West Midland Middle English"] = "enm-wmi",
["West Saxon Old English"] = "ang-wsx",
["Western Armenian"] = "hyw",
["Western Balochi"] = "bgn",
["Western Mansi"] = "mns-wes",
["Western Niger Fulfulde"] = "fuh",
["Western Punjabi"] = "pnb",
["Western Tati"] = "xme-ttc-wes",
["Westphalian"] = "wep",
["Wiedingharde North Frisian"] = "frr-wie",
["Written vernacular Cantonese"] = "yue-wvc",
["Written vernacular Mandarin"] = "cmn-wvc",
["Written vernacular Taishanese"] = "zhx-tai-wvc",
["Wuhan Mandarin"] = "cmn-wuh",
["Xiamen Hokkien"] = "nan-xia",
["Xining Mandarin"] = "cmn-xin",
["Yangzhou Mandarin"] = "cmn-yan",
["Yarandi"] = "xme-yar",
["Yazdi"] = "xme-yaz",
["Yongchun Hokkien"] = "nan-yon",
["Younger Avestan"] = "ae-yng",
["Yukjin Korean"] = "ko-yuk",
["Zarphatic"] = "zrp",
["Zefrehi"] = "xme-zef",
["Zhangping Hokkien"] = "nan-zhp",
["Zhangzhou Hokkien"] = "nan-zha",
["Zhao'an Hakka"] = "hak-zha",
["Zhao'an Hokkien"] = "nan-zho",
["Zhongshan Min"] = "zhx-zho",
["Zori"] = "xme-zor",
["Zoroastrian Dari"] = "gbz",
["taxonomic name"] = "mul-tax",
["the BMAC substrate"] = "qsb-bma",
}
71heeauo13igwnyrck6m9g0rwh3rjai
234832
234831
2026-05-24T08:15:55Z
Lee
19
[[:en:Module:etymology_languages/canonical_names]] වෙතින් එක් සංශෝධනයක්
234831
Scribunto
text/plain
-- Lookup table returned as this module's value: each key is a canonical
-- (human-readable) name and each value is the code string assigned to it,
-- e.g. ["American English"] = "en-US".
--
-- NOTE(review): per the import edit summary this revision was copied from
-- en.wiktionary's Module:etymology_languages/canonical_names, so it is
-- presumably generated/mirrored data -- confirm before editing by hand.
--
-- Entries appear to be kept in raw byte order of the key: ASCII uppercase
-- sorts before lowercase (hence "taxonomic name" and "the BMAC substrate"
-- at the very end) and non-ASCII letters sort after ASCII ones (e.g.
-- "Föhr ..." follows "Fuyu ..."). Keep that order when adding entries.
return {
["ALUPEC Kabuverdianu"] = "kea-alu",
["Abhiri"] = "pra-abh",
["Abron"] = "abr",
["Abuzeydabadi"] = "xme-abz",
["Abyanehi"] = "xme-aby",
["Acadian French"] = "fr-aca",
["Achaemenid Elamite"] = "elx-ach",
["Achterhoeks"] = "act",
["Adamawa Fulfulde"] = "fub",
["Addu Dhivehi"] = "dv-add",
["Aeolic Greek"] = "grc-aeo",
["Afghan Uzbek"] = "uz-afg",
["African Romance"] = "la-afr",
["Afridi"] = "ps-afr",
["Akhmimic Coptic"] = "cop-akh",
["Akuapem Twi"] = "tw-aku",
["Aleppine North Levantine Arabic"] = "apc-ale",
["Alsatian Alemannic German"] = "gsw-FR-als",
["Amdo Tibetan"] = "adx",
["American English"] = "en-US",
["Amorehi"] = "xme-amo",
["Ampezan Ladin"] = "lld-amp",
["Amrum North Frisian"] = "frr-amr",
["Anaraki"] = "xme-ana",
["Anatri Chuvash"] = "cv-ana",
["Anbarani"] = "tly-anb",
["Angkorian Old Khmer"] = "okz-ang",
["Anglian Old English"] = "ang-ang",
["Anglo-Norman"] = "xno",
["Anxi Hokkien"] = "nan-anx",
["Aquitanian"] = "xaq",
["Aranese"] = "oc-ara",
["Arbëresh Albanian"] = "aae",
["Arcadian Greek"] = "grc-arc",
["Arcadocypriot Greek"] = "grc-arp",
["Ardestani"] = "xme-ard",
["Ardhamagadhi Prakrit"] = "pra-ard",
["Arghu"] = "klj-arg",
["Armeno-Kipchak"] = "qwm-arm",
["Arvanitika Albanian"] = "aat",
["Asalemi"] = "tly-asa",
["Asante Twi"] = "tw-asa",
["Ashtiani"] = "atn",
["Attic Greek"] = "grc-att",
["Australian Aboriginal English"] = "en-aae",
["Australian English"] = "en-AU",
["Austrian German"] = "de-AT",
["Auvergnat"] = "oc-auv",
["Avahattha"] = "inc-aav",
["Avanti"] = "pra-ava",
["Ayutthaya Old Thai"] = "th-ayu",
["Azerbaijani Talysh"] = "tly-aze",
["Badiot Ladin"] = "lld-bad",
["Badrudi"] = "xme-bdr",
["Bagirmi Fulfulde"] = "fui",
["Bahliki"] = "pra-bah",
["Bajui"] = "sgh-baj",
["Baltic German"] = "de-bal",
["Bandari"] = "bsg-ban",
["Bangash"] = "ps-bng",
["Bannu"] = "ps-ban",
["Barlavento Kabuverdianu"] = "kea-bar",
["Barpetia Kamrupi Assamese"] = "as-bkm",
["Bartangi"] = "sgh-bar",
["Bartangi-Oroshori"] = "sgh-bro",
["Beijing Mandarin"] = "cmn-bei",
["Beijingic Mandarin"] = "cmn-bec",
["Belgian Dutch"] = "nl-BE",
["Besemah"] = "pse-bsm",
["Betawi Kota"] = "bew-kot",
["Bhaca"] = "xh-bha",
["Biblical Aramaic"] = "arc-bib",
["Biblical Hebrew"] = "hbo",
["Bidhandi"] = "xme-bid",
["Bijagani"] = "xme-bij",
["Boa Vista Kabuverdianu"] = "kea-bvi",
["Boeotian Greek"] = "grc-boi",
["Bohairic Coptic"] = "cop-boh",
["Bolivian Spanish"] = "es-BO",
["Bombay Hindi"] = "hi-mum",
["Borana"] = "gax",
["Borgu Fulfulde"] = "fue",
["Borujerdi"] = "xme-bor",
["Brahmanic Sanskrit"] = "sa-bra",
["Brava Kabuverdianu"] = "kea-bra",
["Brazilian Portuguese"] = "pt-BR",
["British English"] = "en-GB",
["Buddhist Hybrid Sanskrit"] = "sa-bhs",
["Burenjani"] = "fay-bur",
["Bushehri"] = "fay-bsh",
["Byzantine Greek"] = "gkm",
["Cadorino Ladin"] = "lld-cad",
["Cajun French"] = "frc",
["California English"] = "en-US-CA",
["Camorta"] = "ncb-cam",
["Campidanese"] = "sc-sro",
["Canadian English"] = "en-CA",
["Canadian French"] = "fr-CA",
["Canadian Ukrainian"] = "uk-CA",
["Candali"] = "pra-can",
["Capenate"] = "xfa-cap",
["Central Ghilzay"] = "ps-cgi",
["Central Korean"] = "ko-cen",
["Central Plains Mandarin"] = "cmn-cep",
["Central Talysh"] = "tly-cen",
["Central Tati"] = "xme-ttc-cen",
["Central-Eastern Niger Fulfulde"] = "fuq",
["Chakavian Serbo-Croatian"] = "ckm",
["Chakhar Mongolian"] = "mn-cha",
["Chali Tati"] = "tks-cal",
["Changtai Hokkien"] = "nan-cha",
["Chilean Spanish"] = "es-CL",
["Chimehi"] = "xme-cim",
["Christian Palestinian Aramaic"] = "arc-cpa",
["Chungcheong Korean"] = "ko-chu",
["Ci"] = "lzh-cii",
["Cisalpine Gaulish"] = "xcg",
["Classical Azerbaijani"] = "az-cls",
["Classical Cantonese"] = "lzh-yue",
["Classical Japanese"] = "ja-cla",
["Classical Latin"] = "la-cla",
["Classical Malay"] = "ms-cla",
["Classical Mandarin"] = "lzh-cmn",
["Classical Persian"] = "fa-cls",
["Classical Sanskrit"] = "cls",
["Classical Tagalog"] = "tl-cls",
["Classical Taishanese"] = "lzh-tai",
["Classical Taiwanese Mandarin"] = "lzh-cmn-TW",
["Colombian Spanish"] = "es-CO",
["Common Bantu"] = "bnt-cmn",
["Contemporary Latin"] = "la-con",
["Coptic Dialect G"] = "cop-ggg",
["Coptic Dialect J"] = "cop-jjj",
["Coptic Dialect K"] = "cop-kkk",
["Coptic Dialect P"] = "cop-ppp",
["Cretan Ancient Greek"] = "grc-kre",
["Cretan Greek"] = "el-crt",
["Cuban Spanish"] = "es-CU",
["Cuman"] = "qwm-cum",
["Cypriot Ancient Greek"] = "grc-cyp",
["Cypriot Greek"] = "el-cyp",
["Cypriot Turkish"] = "tr-CY",
["Dabu Hakka"] = "hak-dab",
["Daksinatya"] = "pra-dak",
["Damascene North Levantine Arabic"] = "apc-dam",
["Danesfani"] = "tks-dan",
["Danube Bulgar"] = "xbo-dan",
["Danzhou Chinese"] = "zhx-dan",
["Dari"] = "prs",
["Dashtaki"] = "fay-dsh",
["Davani"] = "fay-dav",
["Delijani"] = "xme-del",
["Dhakaiya Vaṅga Bengali"] = "bn-dvn",
["Digor Ossetian"] = "os-dig",
["Dnieper Baltic"] = "bat-dni",
["Dobrujan Tatar"] = "crh-dbj",
["Doric Greek"] = "grc-dor",
["Dramili"] = "pra-dra",
["Drents"] = "drt",
["Dutch Low Saxon"] = "nds-nl",
["Early Brythonic"] = "bry-ear",
["Early Mandarin"] = "cmn-ear",
["Early Medieval Latin"] = "la-eme",
["Early Middle Chinese"] = "ltc-ear",
["Early Middle Japanese"] = "ja-mid-ear",
["Early Middle Korean"] = "okm-ear",
["Early Middle Mongol"] = "xng-ear",
["Early Middle Persian"] = "pal-ear",
["Early Modern Czech"] = "cs-ear",
["Early Modern English"] = "en-ear",
["Early Modern Hakka"] = "hak-eam",
["Early Modern Japanese"] = "ja-ear",
["Early Modern Spanish"] = "es-ear",
["Early New High German"] = "de-ear",
["Early New Persian"] = "fa-ear",
["Early Old Chinese"] = "och-ear",
["Early Old Ossetic"] = "oos-ear",
["Early Old Persian"] = "peo-ear",
["Early Scots"] = "enm-esc",
["Early Sogdian"] = "sog-ear",
["East Frisian Low German"] = "frs",
["East Midland Middle English"] = "enm-emi",
["Eastern Armenian"] = "hye",
["Eastern Balochi"] = "bgp",
["Eastern Mansi"] = "mns-eas",
["Eastern Old Japanese"] = "ojp-eas",
["Eastern Tati"] = "xme-ttc-eas",
["Ebrahimabadi"] = "tks-ebr",
["Ecclesiastical Latin"] = "la-ecc",
["Elean Greek"] = "grc-ela",
["Emamzada Esmaili"] = "fay-eze",
["Epic Greek"] = "grc-epi",
["Epic Sanskrit"] = "sa-epi",
["Esfarvarini"] = "tks-esf",
["European Portuguese"] = "pt-PT",
["Fante Akan"] = "fat",
["Farizandi"] = "xme-far",
["Fascian Ladin"] = "lld-fas",
["Fayyumic Coptic"] = "cop-fay",
["Fodom Ladin"] = "lld-fod",
["Fogo Kabuverdianu"] = "kea-fog",
["Fornes Ladin"] = "lld-for",
["Frankish"] = "frk",
["Fumani"] = "tly-fum",
["Fuyu Kyrgyz"] = "kjh-fyu",
["Föhr North Frisian"] = "frr-foh",
["Föhr-Amrum North Frisian"] = "frr-fam",
["Gangwon Korean"] = "ko-gan",
["Gascon"] = "oc-gas",
["Gavkoshaki"] = "fay-gav",
["Gazi"] = "gzi",
["Geordie"] = "en-geo",
["German Low German"] = "nds-de",
["Ghat"] = "thv-ght",
["Gheg Albanian"] = "aln",
["Gherdëina Ladin"] = "lld-ghe",
["Goesharde North Frisian"] = "frr-goe",
["Golyad"] = "bat-gol",
["Goral"] = "pl-gor",
["Greater Polish"] = "pl-gre",
["Greenlandic Norse"] = "non-grn",
["Gronings"] = "gos",
["Guangzhou Cantonese"] = "yue-gua",
["Guanzhong Mandarin"] = "cmn-gua",
["Guernsey Norman"] = "nrf-grn",
["Guilin Mandarin"] = "cmn-gui",
["Gurjara Apabhramsa"] = "inc-agu",
["Gyeonggi Korean"] = "ko-gyg",
["Gyeongsang Korean"] = "ko-gys",
["Hailu Hakka"] = "hak-hai",
["Halligen North Frisian"] = "frr-hal",
["Hamadani"] = "xme-ham",
["Hamgyong Korean"] = "ko-ham",
["Hangzhounese"] = "wuu-han",
["Hanjani"] = "xme-han",
["Hanyu Pinyin"] = "cmn-pinyin",
["Harar Oromo"] = "hae",
["Hatran Aramaic"] = "arc-hat",
["Havigannada"] = "kn-hav",
["Hazaragi"] = "haz",
["Heligoland North Frisian"] = "frr-hel",
["Helu Prakrit"] = "pra-hel",
["Hengyang Xiang"] = "hsn-hya",
["Hengzhou Xiang"] = "hsn-hzh",
["Hermopolitan Coptic"] = "cop-her",
["High Alemannic German"] = "gsw-hig",
["Highest Alemannic German"] = "gsw-hst",
["Hokkaido Ainu"] = "ain-hok",
["Hong Kong Cantonese"] = "yue-HK",
["Hong Kong English"] = "en-HK",
["Hong Kong Hakka"] = "hak-HK",
["Hormozi"] = "bsg-hor",
["Houlu Min"] = "nan-hou",
["Hui'an Hokkien"] = "nan-hui",
["Huiyang Hakka"] = "hak-hui",
["Huvadhu Dhivehi"] = "dv-huv",
["Hwanghae Korean"] = "ko-hwa",
["Imperial Aramaic"] = "arc-imp",
["Indian English"] = "en-IN",
["Insular North Frisian"] = "frr-ins",
["Insular Scots"] = "sco-ins",
["Ionic Greek"] = "grc-ion",
["Iranian Persian"] = "fa-ira",
["Irish English"] = "en-IE",
["Iron Ossetian"] = "os-iro",
["Isfahani"] = "xme-isf",
["Israeli Hebrew"] = "he-IL",
["Jadrani"] = "ps-jad",
["Jeolla Korean"] = "ko-jeo",
["Jersey Norman"] = "nrf-jer",
["Jewish Babylonian Aramaic"] = "tmr",
["Jewish Literary Aramaic"] = "arc-jla",
["Jewish Palestinian Aramaic"] = "jpa",
["Jianghuai Mandarin"] = "cmn-jhu",
["Jinjiang Hokkien"] = "nan-jin",
["Jirofti"] = "rdb-jir",
["Jowshaqani"] = "xme-jow",
["Judeo-Arabic"] = "jrb",
["Kafroni"] = "xme-kaf",
["Kahaki"] = "xme-kah",
["Kahnuji"] = "rdb-kah",
["Kajkavian Serbo-Croatian"] = "kjv",
["Kakari"] = "ps-kak",
["Kaliarda"] = "el-kal",
["Kamviri"] = "xvi",
["Kandahari"] = "ps-kan",
["Kaniguram"] = "oru-kan",
["Karganrudi"] = "tly-kar",
["Karrharde North Frisian"] = "frr-kar",
["Kashani"] = "xme-kas",
["Kasmiri Apabhramsa"] = "inc-aka",
["Katchal"] = "ncb-kat",
["Katharevousa"] = "el-kth",
["Kathiyawadi"] = "gu-kat",
["Kativiri"] = "bsh-kat",
["Kentish Middle English"] = "enm-ken",
["Kentish Old English"] = "ang-ken",
["Kermani"] = "xme-krm",
["Kesehi"] = "xme-kes",
["Khalkha Mongolian"] = "mn-kha",
["Khamba"] = "kbg",
["Khams Tibetan"] = "khg",
["Khargi"] = "fay-kar",
["Khasa Prakrit"] = "pra-kha",
["Khatak"] = "ps-xat",
["Khiaraji"] = "tks-xia",
["Khollari"] = "fay-kho",
["Khorchin Mongolian"] = "mn-khr",
["Khoznini"] = "tks-xoz",
["Khufi"] = "sgh-xuf",
["Khughni"] = "sgh-xug",
["Khughni-Bajui"] = "sgh-xgb",
["Khunsari"] = "kfm",
["Khuri"] = "xme-xur",
["Khuzestani Arabic"] = "acm-khu",
["Kinmenese Hokkien"] = "nan-kin",
["Kinyarwanda"] = "rw-kin",
["Kirundi"] = "rw-run",
["Koine Greek"] = "grc-koi",
["Komjani"] = "xme-kom",
["Kondazi"] = "fay-kon",
["Korean Classical Chinese"] = "lzh-KO",
["Kosena"] = "kze",
["Kromanti"] = "alv-kro",
["Kundagannada"] = "kn-kun",
["Kuril Ainu"] = "ain-kur",
["Kölsch"] = "ksh",
["Languedocien"] = "oc-lan",
["Lanuvian"] = "itc-lan",
["Lanyin Mandarin"] = "cmn-lan",
["Late Babylonian"] = "akk-lbb",
["Late Brythonic"] = "bry-lat",
["Late Egyptian"] = "egy-lat",
["Late Khotanese"] = "kho-lat",
["Late Latin"] = "la-lat",
["Late Middle Chinese"] = "ltc-lat",
["Late Middle Japanese"] = "ja-mid-lat",
["Late Middle Mongol"] = "xng-lat",
["Late Middle Persian"] = "pal-lat",
["Late Old Chinese"] = "och-lat",
["Late Old Korean"] = "oko-lat",
["Late Old Ossetic"] = "oos-lat",
["Late Old Persian"] = "peo-lat",
["Late Old Swedish"] = "gmq-osw-lat",
["Late Sogdian"] = "sog-lat",
["Law French"] = "xno-law",
["Lebanese North Levantine Arabic"] = "apc-leb",
["Lesser Polish"] = "pl-les",
["Limousin"] = "oc-lim",
["Lisan ud-Dawat Gujarati"] = "gu-lda",
["Literary Cantonese"] = "yue-lit",
["Literary Chinese"] = "lzh-lit",
["Logar"] = "oru-log",
["Logudorese"] = "sc-src",
["Lombardic"] = "lng",
["Loudi Xiang"] = "hsn-lou",
["Louisiana French"] = "fr-lou",
["Low Alemannic German"] = "gsw-low",
["Low Prussian"] = "nds-lpr",
["Lucanian"] = "osc-luc",
["Lunfardo"] = "es-lun",
["Lycopolitan Coptic"] = "cop-lyc",
["Língua Geral Amazônica"] = "tpw-lga",
["Língua Geral Paulista"] = "tpw-lgp",
["Maasina Fulfulde"] = "ffm",
["Magadhi Prakrit"] = "pra-mag",
["Mahallati"] = "xme-mah",
["Maharastri Apabhramsa"] = "inc-ama",
["Maharastri Prakrit"] = "pra-mah",
["Mahsudi"] = "ps-mah",
["Mainland North Frisian"] = "frr-mai",
["Maio Kabuverdianu"] = "kea-mai",
["Malaysian Huiyang Hakka"] = "hak-hui-MY",
["Malaysian Mandarin"] = "cmn-MY",
["Mamluk-Kipchak"] = "qwm-mam",
["Manichaean Middle Persian"] = "xmn",
["Manx English"] = "en-IM",
["Masali"] = "tly-msa",
["Masarami"] = "fay-mas",
["Masovian Polish"] = "pl-mas",
["Masulei"] = "tly-msu",
["Medan Hokkien"] = "nan-med",
["Medieval Hebrew"] = "he-med",
["Medieval Latin"] = "la-med",
["Medieval Sinhalese"] = "si-med",
["Medieval Tashelhit"] = "shi-med",
["Meixian Hakka"] = "hak-mei",
["Mercian Old English"] = "ang-mer",
["Mexican Spanish"] = "es-MX",
["Meymehi"] = "xme-mey",
["Middle Assyrian"] = "akk-mas",
["Middle Babylonian"] = "akk-mbb",
["Middle Belarusian"] = "zle-mbe",
["Middle Bulgarian"] = "cu-bgm",
["Middle Chuvash"] = "cv-mid",
["Middle Egyptian"] = "egy-mid",
["Middle Elamite"] = "elx-mid",
["Middle Georgian"] = "ka-mid",
["Middle Hindi"] = "hi-mid",
["Middle Japanese"] = "ja-mid",
["Middle Konkani"] = "kok-mid",
["Middle Polish"] = "zlw-mpl",
["Middle Russian"] = "zle-mru",
["Middle Tamil"] = "ta-mid",
["Middle Ukrainian"] = "zle-muk",
["Minabi"] = "bsg-min",
["Mishnaic Hebrew"] = "he-mis",
["Missouri French"] = "fr-mis",
["Mitanni"] = "inc-mit",
["Moldovan"] = "ro-MD",
["Mooring North Frisian"] = "frr-moo",
["Mulaku Dhivehi"] = "dv-mul",
["Mumviri"] = "bsh-mum",
["Nabataean Aramaic"] = "arc-nab",
["Nalbaria Kamrupi Assamese"] = "as-nkm",
["Nancowry"] = "ncb-nan",
["Nanjing Mandarin"] = "cmn-nan",
["Naraqi"] = "xme-nar",
["Nashalji"] = "xme-nas",
["Natanzi"] = "ntz",
["Nayini"] = "nyq",
["Neo-Assyrian"] = "akk-nas",
["Neo-Babylonian"] = "akk-nbb",
["Neo-Elamite"] = "elx-neo",
["Neo-Middle Egyptian"] = "egy-nmi",
["New Latin"] = "la-new",
["New Sanskrit"] = "sa-neo",
["New Xiang"] = "hsn-new",
["New Zealand English"] = "en-NZ",
["Nigerian Fulfulde"] = "fuv",
["Ningbonese"] = "wuu-nin",
["Noakhailla Vaṅga Bengali"] = "bn-nvn",
["Nones Ladin"] = "lld-non",
["North Alaskan Inupiatun"] = "esi",
["North American English"] = "en-NNN",
["North Karelian"] = "krl-nor",
["North Lebanese North Levantine Arabic"] = "apc-nle",
["North Wales Welsh"] = "cy-nor",
["Northeastern Mandarin"] = "cmn-noe",
["Northeastern Pashto"] = "ps-nea",
["Northern Irish English"] = "en-GB-NIR",
["Northern Kankanaey"] = "xnn",
["Northern Lushootseed"] = "lut-nor",
["Northern Middle English"] = "enm-nor",
["Northern Scots"] = "sco-nor",
["Northern Talysh"] = "tly-nor",
["Northern Tati"] = "xme-ttc-nor",
["Northern Wu"] = "wuu-nor",
["Northumbrian Old English"] = "ang-nor",
["Northwest Alaskan Inupiatun"] = "esk",
["Northwestern Pashto"] = "ps-nwe",
["Nuorese"] = "sc-nuo",
["Nushabadi"] = "xme-nus",
["Odri"] = "pra-odr",
["Old Akkadian"] = "akk-old",
["Old Aramaic"] = "arc-old",
["Old Assyrian"] = "akk-oas",
["Old Avestan"] = "ae-old",
["Old Azari"] = "xme-azr",
["Old Babylonian"] = "akk-obb",
["Old Braj"] = "bra-old",
["Old Chuvash"] = "cv-old",
["Old Coptic"] = "cop-old",
["Old Dhivehi"] = "dv-old",
["Old East Norse"] = "non-oen",
["Old Egyptian"] = "egy-old",
["Old Elamite"] = "elx-old",
["Old Emilian"] = "egl-old",
["Old Franco-Provençal"] = "frp-old",
["Old Friulian"] = "fur-old",
["Old Italian"] = "roa-oit",
["Old Kazeruni"] = "fay-kzo",
["Old Khotanese"] = "kho-old",
["Old Kirghiz"] = "otk-kir",
["Old Konkani"] = "kok-old",
["Old Latin"] = "itc-ola",
["Old Ligurian"] = "lij-old",
["Old Lombard"] = "lmo-old",
["Old Malay"] = "ms-old",
["Old Mohawk"] = "iro-omo",
["Old Neapolitan"] = "nap-old",
["Old Northern French"] = "fro-nor",
["Old Onondaga"] = "iro-oon",
["Old Ossetic"] = "oos",
["Old Piedmontese"] = "pms-old",
["Old Provençal"] = "oc-pro-old",
["Old Pskovian"] = "zle-ops",
["Old Romagnol"] = "rgn-old",
["Old Romansh"] = "rm-old",
["Old Sardinian"] = "sc-old",
["Old Shirazi"] = "fay-sho",
["Old Sicilian"] = "scn-old",
["Old Tagalog"] = "tl-old",
["Old Thai"] = "th-old",
["Old Venetan"] = "vec-old",
["Old Wendat"] = "iro-ohu",
["Old West Norse"] = "non-own",
["Old Xiang"] = "hsn-old",
["Ontenu"] = "ont",
["Opuntian Locrian"] = "grc-opl",
["Ordos Mongolian"] = "mn-ord",
["Orkhon Turkic"] = "otk-ork",
["Orma"] = "orc",
["Oroshori"] = "sgh-oro",
["Oxyrhynchite Coptic"] = "cop-oxy",
["Ozolian Locrian"] = "grc-ozl",
["Paisaci Prakrit"] = "pra-pai",
["Palasbaria Kamrupi Assamese"] = "as-pkm",
["Palatine German"] = "pfl",
["Paleo-Balkan"] = "qsb-bal",
["Paleo-Hispanic"] = "qsb-ibe",
["Palladius"] = "cmn-palladius",
["Palmyrene Aramaic"] = "arc-pal",
["Pamphylian Greek"] = "grc-pam",
["Paphian Greek"] = "el-pap",
["Papuni"] = "fay-pap",
["Penang Hokkien"] = "nan-pen",
["Peruvian Spanish"] = "es-PE",
["Peshawari"] = "ps-pes",
["Philippine Hokkien"] = "nan-hbl-PH",
["Philippine Mandarin"] = "cmn-PH",
["Philippine Spanish"] = "es-PH",
["Picard Old French"] = "fro-pic",
["Polari"] = "pld",
["Postal Romanization"] = "zh-postal",
["Pracya"] = "pra-pra",
["Praenestine"] = "itc-pra",
["Pre-Angkorian Old Khmer"] = "okz-pre",
["Pre-Classical Chinese"] = "lzh-pre",
["Pre-Greek"] = "qsb-grc",
["Proto-Anglo-Frisian"] = "gmw-afr-pro",
["Proto-Arinic"] = "qfa-yrn-pro",
["Proto-Baltic"] = "bat-pro",
["Proto-Bulgar"] = "trk-bul-pro",
["Proto-Common Turkic"] = "trk-cmn-pro",
["Proto-Finno-Permic"] = "urj-fpr-pro",
["Proto-Finno-Ugric"] = "fiu-pro",
["Proto-Ketic"] = "qfa-yke-pro",
["Proto-Kottic"] = "qfa-yko-pro",
["Proto-Lycopolitan Coptic"] = "cop-ply",
["Proto-Middle Indo-Aryan"] = "inc-ash-pro",
["Proto-New Indo-Aryan"] = "pra-pro",
["Proto-North Sea Germanic"] = "gmw-nsg-pro",
["Proto-Oghur"] = "trk-ogr-pro",
["Proto-Oghuz"] = "trk-ogz-pro",
["Proto-Pumpokolic"] = "qfa-ypm-pro",
["Proto-Romance"] = "roa-pro",
["Proto-Tibeto-Burman"] = "tbq-pro",
["Provençal"] = "oc-pro",
["Puerto Rican Spanish"] = "es-PR",
["Pulaar"] = "fuc",
["Pular"] = "fuf",
["Puter Romansh"] = "rm-put",
["Pyongan Korean"] = "ko-pyo",
["Qalhari"] = "xme-qal",
["Qashqai"] = "qxq",
["Qianlu Min"] = "nan-qia",
["Qohrudi"] = "xme-qoh",
["Quanzhou Hokkien"] = "nan-qua",
["Renaissance Latin"] = "la-ren",
["Rigvedic Sanskrit"] = "sa-rig",
["Rioplatense Spanish"] = "es-AR",
["Roshani"] = "sgh-ros",
["Roshani-Khufi"] = "sgh-rsx",
["Rumantsch Grischun"] = "rm-gri",
["Russian Church Slavonic"] = "zls-chs-ru",
["Sabari"] = "pra-sab",
["Sagzabadi"] = "tks-sag",
["Sahidic Coptic"] = "cop-sah",
["Saint Dominican Creole French"] = "ht-sdm",
["Sakari"] = "pra-sak",
["Sakhalin Ainu"] = "ain-sak",
["Sal Kabuverdianu"] = "kea-sal",
["Sallands"] = "sdz",
["Samghani"] = "fay-sam",
["Samnite"] = "osc-sam",
["Santiago Kabuverdianu"] = "kea-san",
["Santo Antão Kabuverdianu"] = "kea-saa",
["Sauraseni Apabhramsa"] = "inc-asa",
["Sauraseni Prakrit"] = "pra-sau",
["Scottish English"] = "en-GB-SCT",
["Sedehi"] = "xme-sed",
["Shadi Wu"] = "wuu-chm",
["Shandarmani"] = "tly-san",
["Shanghainese"] = "wuu-sha",
["Shangsi Zhuang"] = "tai-shz",
["Sher"] = "ps-ser",
["Shirazi"] = "fay-shr",
["Shuadit"] = "oc-jud",
["Silesian East Central German"] = "sli",
["Singapore Hokkien"] = "nan-hbl-SG",
["Singapore Mandarin"] = "cmn-SG",
["Sixian Hakka"] = "hak-six",
["Skagit"] = "ska",
["Snohomish"] = "sno",
["Soi"] = "soj",
["Sorkhi"] = "fay-sor",
["Sotavento Kabuverdianu"] = "kea-sot",
["South African English"] = "en-ZA",
["South Karelian"] = "krl-sou",
["South Lebanese North Levantine Arabic"] = "apc-sle",
["South Wales Welsh"] = "cy-sou",
["Southeastern Pashto"] = "ps-sea",
["Southern Balochi"] = "bcc",
["Southern Lushootseed"] = "slh",
["Southern Malaysian Hokkien"] = "nan-spm",
["Southern Middle English"] = "enm-sou",
["Southern Scots"] = "sco-sou",
["Southern Talysh"] = "tly-sou",
["Southern Tati"] = "xme-ttc-sou",
["Southwestern Mandarin"] = "cmn-sow",
["Southwestern Pashto"] = "ps-swe",
["Standard Babylonian"] = "akk-stb",
["Stellingwerfs"] = "stl",
["Suevic"] = "gem-sue",
["Sukhothai Old Thai"] = "th-suk",
["Surmiran Romansh"] = "rm-srm",
["Sursilvan Romansh"] = "rm-srs",
["Sutsilvan Romansh"] = "rm-sut",
["Suzhounese"] = "wuu-suz",
["Swiss French"] = "fr-CH",
["Switzerland German"] = "de-CH",
["Switzerland Italian"] = "it-CH",
["Sylt North Frisian"] = "frr-syl",
["Syrian North Levantine Arabic"] = "apc-syr",
["São Nicolau Kabuverdianu"] = "kea-sni",
["São Vicente Kabuverdianu"] = "kea-svi",
["Taiwanese Hakka"] = "hak-TW",
["Taiwanese Hokkien"] = "nan-hbl-TW",
["Taiwanese Mandarin"] = "cmn-TW",
["Takestani"] = "tks-tak",
["Takka Apabhramsa"] = "inc-ata",
["Taleshdulabi"] = "tly-tal",
["Tamahaq"] = "thv",
["Tamasheq"] = "taq",
["Tarehi"] = "xme-trh",
["Tari"] = "xme-tar",
["Tawellemmet"] = "ttq",
["Tayert"] = "thz",
["Thessalian Greek"] = "grc-ths",
["Tianjin Mandarin"] = "cmn-tia",
["Tong'an Hokkien"] = "nan-ton",
["Tongyong Pinyin"] = "cmn-tongyong",
["Torlakian Serbo-Croatian"] = "sh-tor",
["Tosk Albanian"] = "als",
["Traditional Chinese poetry"] = "lzh-shi",
["Transalpine Gaulish"] = "xtg",
["Tseku"] = "tsk",
["Tularudi"] = "tly-tul",
["Twents"] = "twd",
["Twi Akan"] = "tw",
["Ukrainian Church Slavonic"] = "zls-chs-uk",
["Ulster English"] = "en-uls",
["Ulster Scots"] = "sco-uls",
["United States Spanish"] = "es-US",
["Upper Saxon German"] = "sxu",
["Vafsi"] = "vaf",
["Valencian"] = "ca-val",
["Vallader Romansh"] = "rm-val",
["Valujerdi"] = "xme-val",
["Varani"] = "xme-var",
["Varzenehi"] = "xme-vrz",
["Vedic Sanskrit"] = "vsn",
["Veluws"] = "vel",
["Venezuelan Spanish"] = "es-VE",
["Viennese German"] = "de-AT-vie",
["Vietnamese Classical Chinese"] = "lzh-VI",
["Viryal Chuvash"] = "cv-vir",
["Vivaro-Alpine"] = "oc-viv",
["Volga Bulgar"] = "xbo-vol",
["Vonishuni"] = "xme-von",
["Vracada Apabhramsa"] = "inc-avr",
["Vulgar Latin"] = "la-vul",
["Waata"] = "ssn",
["Wade–Giles"] = "cmn-wadegiles",
["Walser German"] = "wae",
["Wasa"] = "wss",
["Waziri"] = "ps-waz",
["Welsh English"] = "en-GB-WLS",
["Wenzhounese"] = "wuu-wen",
["West Midland Middle English"] = "enm-wmi",
["West Saxon Old English"] = "ang-wsx",
["Western Armenian"] = "hyw",
["Western Balochi"] = "bgn",
["Western Mansi"] = "mns-wes",
["Western Niger Fulfulde"] = "fuh",
["Western Punjabi"] = "pnb",
["Western Tati"] = "xme-ttc-wes",
["Westphalian"] = "wep",
["Wiedingharde North Frisian"] = "frr-wie",
["Written vernacular Cantonese"] = "yue-wvc",
["Written vernacular Mandarin"] = "cmn-wvc",
["Written vernacular Taishanese"] = "zhx-tai-wvc",
["Wuhan Mandarin"] = "cmn-wuh",
["Xiamen Hokkien"] = "nan-xia",
["Xining Mandarin"] = "cmn-xin",
["Yangzhou Mandarin"] = "cmn-yan",
["Yarandi"] = "xme-yar",
["Yazdi"] = "xme-yaz",
["Yongchun Hokkien"] = "nan-yon",
["Younger Avestan"] = "ae-yng",
["Yukjin Korean"] = "ko-yuk",
["Zarphatic"] = "zrp",
["Zefrehi"] = "xme-zef",
["Zhangping Hokkien"] = "nan-zhp",
["Zhangzhou Hokkien"] = "nan-zha",
["Zhao'an Hakka"] = "hak-zha",
["Zhao'an Hokkien"] = "nan-zho",
["Zhongshan Min"] = "zhx-zho",
["Zori"] = "xme-zor",
["Zoroastrian Dari"] = "gbz",
["taxonomic name"] = "mul-tax",
["the BMAC substrate"] = "qsb-bma",
}
71heeauo13igwnyrck6m9g0rwh3rjai
234833
234832
2026-05-24T08:16:48Z
Lee
19
පැරණි සංස්කරණයකින් ගත් කොටස්...
234833
Scribunto
text/plain
return {
["ALUPEC Kabuverdianu"] = "kea-alu",
["Abhiri"] = "pra-abh",
["Abron"] = "abr",
["Abuzeydabadi"] = "xme-abz",
["Abyanehi"] = "xme-aby",
["Acadian French"] = "fr-aca",
["Achaemenid Elamite"] = "elx-ach",
["Achterhoeks"] = "act",
["Adamawa Fulfulde"] = "fub",
["Addu Dhivehi"] = "dv-add",
["Aeolic Greek"] = "grc-aeo",
["Afghan Uzbek"] = "uz-afg",
["African Romance"] = "la-afr",
["Afridi"] = "ps-afr",
["Akhmimic Coptic"] = "cop-akh",
["Akuapem Twi"] = "tw-aku",
["Aleppine North Levantine Arabic"] = "apc-ale",
["Alsatian Alemannic German"] = "gsw-FR-als",
["Amdo Tibetan"] = "adx",
["American English"] = "en-US",
["Amorehi"] = "xme-amo",
["Ampezan Ladin"] = "lld-amp",
["Amrum North Frisian"] = "frr-amr",
["Anaraki"] = "xme-ana",
["Anatri Chuvash"] = "cv-ana",
["Anbarani"] = "tly-anb",
["Angkorian Old Khmer"] = "okz-ang",
["Anglian Old English"] = "ang-ang",
["ඇන්ග්ලෝ-නෝමන්"] = "xno",
["Anxi Hokkien"] = "nan-anx",
["Aquitanian"] = "xaq",
["Aranese"] = "oc-ara",
["Arbëresh Albanian"] = "aae",
["Arcadian Greek"] = "grc-arc",
["Arcadocypriot Greek"] = "grc-arp",
["Ardestani"] = "xme-ard",
["Ardhamagadhi Prakrit"] = "pra-ard",
["Arghu"] = "klj-arg",
["Armeno-Kipchak"] = "qwm-arm",
["Arvanitika Albanian"] = "aat",
["Asalemi"] = "tly-asa",
["Asante Twi"] = "tw-asa",
["Ashtiani"] = "atn",
["Attic Greek"] = "grc-att",
["Australian Aboriginal English"] = "en-aae",
["Australian English"] = "en-AU",
["Austrian German"] = "de-AT",
["Auvergnat"] = "oc-auv",
["Avahattha"] = "inc-aav",
["Avanti"] = "pra-ava",
["Ayutthaya Old Thai"] = "th-ayu",
["Azerbaijani Talysh"] = "tly-aze",
["Badiot Ladin"] = "lld-bad",
["Badrudi"] = "xme-bdr",
["Bagirmi Fulfulde"] = "fui",
["Bahliki"] = "pra-bah",
["Bajui"] = "sgh-baj",
["Baltic German"] = "de-bal",
["Bandari"] = "bsg-ban",
["Bangash"] = "ps-bng",
["Bannu"] = "ps-ban",
["Barlavento Kabuverdianu"] = "kea-bar",
["Barpetia Kamrupi Assamese"] = "as-bkm",
["Bartangi"] = "sgh-bar",
["Bartangi-Oroshori"] = "sgh-bro",
["Beijing Mandarin"] = "cmn-bei",
["Beijingic Mandarin"] = "cmn-bec",
["Belgian Dutch"] = "nl-BE",
["Besemah"] = "pse-bsm",
["Betawi Kota"] = "bew-kot",
["Bhaca"] = "xh-bha",
["Biblical Aramaic"] = "arc-bib",
["Biblical Hebrew"] = "hbo",
["Bidhandi"] = "xme-bid",
["Bijagani"] = "xme-bij",
["Boa Vista Kabuverdianu"] = "kea-bvi",
["Boeotian Greek"] = "grc-boi",
["Bohairic Coptic"] = "cop-boh",
["Bolivian Spanish"] = "es-BO",
["Bombay Hindi"] = "hi-mum",
["Borana"] = "gax",
["Borgu Fulfulde"] = "fue",
["Borujerdi"] = "xme-bor",
["Brahmanic Sanskrit"] = "sa-bra",
["Brava Kabuverdianu"] = "kea-bra",
["Brazilian Portuguese"] = "pt-BR",
["British English"] = "en-GB",
["Buddhist Hybrid Sanskrit"] = "sa-bhs",
["Burenjani"] = "fay-bur",
["Bushehri"] = "fay-bsh",
["Byzantine Greek"] = "gkm",
["Cadorino Ladin"] = "lld-cad",
["Cajun French"] = "frc",
["California English"] = "en-US-CA",
["Camorta"] = "ncb-cam",
["Campidanese"] = "sc-sro",
["Canadian English"] = "en-CA",
["Canadian French"] = "fr-CA",
["Canadian Ukrainian"] = "uk-CA",
["Candali"] = "pra-can",
["Capenate"] = "xfa-cap",
["Central Ghilzay"] = "ps-cgi",
["Central Korean"] = "ko-cen",
["Central Plains Mandarin"] = "cmn-cep",
["Central Talysh"] = "tly-cen",
["Central Tati"] = "xme-ttc-cen",
["Central-Eastern Niger Fulfulde"] = "fuq",
["Chakavian Serbo-Croatian"] = "ckm",
["Chakhar Mongolian"] = "mn-cha",
["Chali Tati"] = "tks-cal",
["Changtai Hokkien"] = "nan-cha",
["Chilean Spanish"] = "es-CL",
["Chimehi"] = "xme-cim",
["Christian Palestinian Aramaic"] = "arc-cpa",
["Chungcheong Korean"] = "ko-chu",
["Ci"] = "lzh-cii",
["Cisalpine Gaulish"] = "xcg",
["Classical Azerbaijani"] = "az-cls",
["Classical Cantonese"] = "lzh-yue",
["Classical Japanese"] = "ja-cla",
["Classical Latin"] = "la-cla",
["Classical Malay"] = "ms-cla",
["Classical Mandarin"] = "lzh-cmn",
["Classical Persian"] = "fa-cls",
["Classical Sanskrit"] = "cls",
["Classical Tagalog"] = "tl-cls",
["Classical Taishanese"] = "lzh-tai",
["Classical Taiwanese Mandarin"] = "lzh-cmn-TW",
["Colombian Spanish"] = "es-CO",
["Common Bantu"] = "bnt-cmn",
["Contemporary Latin"] = "la-con",
["Coptic Dialect G"] = "cop-ggg",
["Coptic Dialect J"] = "cop-jjj",
["Coptic Dialect K"] = "cop-kkk",
["Coptic Dialect P"] = "cop-ppp",
["Cretan Ancient Greek"] = "grc-kre",
["Cretan Greek"] = "el-crt",
["Cuban Spanish"] = "es-CU",
["Cuman"] = "qwm-cum",
["Cypriot Ancient Greek"] = "grc-cyp",
["Cypriot Greek"] = "el-cyp",
["Cypriot Turkish"] = "tr-CY",
["Dabu Hakka"] = "hak-dab",
["Daksinatya"] = "pra-dak",
["Damascene North Levantine Arabic"] = "apc-dam",
["Danesfani"] = "tks-dan",
["Danube Bulgar"] = "xbo-dan",
["Danzhou Chinese"] = "zhx-dan",
["Dari"] = "prs",
["Dashtaki"] = "fay-dsh",
["Davani"] = "fay-dav",
["Delijani"] = "xme-del",
["Dhakaiya Vaṅga Bengali"] = "bn-dvn",
["Digor Ossetian"] = "os-dig",
["Dnieper Baltic"] = "bat-dni",
["Dobrujan Tatar"] = "crh-dbj",
["Doric Greek"] = "grc-dor",
["Dramili"] = "pra-dra",
["Drents"] = "drt",
["Dutch Low Saxon"] = "nds-nl",
["Early Brythonic"] = "bry-ear",
["Early Mandarin"] = "cmn-ear",
["Early Medieval Latin"] = "la-eme",
["Early Middle Chinese"] = "ltc-ear",
["Early Middle Japanese"] = "ja-mid-ear",
["Early Middle Korean"] = "okm-ear",
["Early Middle Mongol"] = "xng-ear",
["Early Middle Persian"] = "pal-ear",
["Early Modern Czech"] = "cs-ear",
["Early Modern English"] = "en-ear",
["Early Modern Hakka"] = "hak-eam",
["Early Modern Japanese"] = "ja-ear",
["Early Modern Spanish"] = "es-ear",
["Early New High German"] = "de-ear",
["Early New Persian"] = "fa-ear",
["Early Old Chinese"] = "och-ear",
["Early Old Ossetic"] = "oos-ear",
["Early Old Persian"] = "peo-ear",
["Early Scots"] = "enm-esc",
["Early Sogdian"] = "sog-ear",
["East Frisian Low German"] = "frs",
["East Midland Middle English"] = "enm-emi",
["Eastern Armenian"] = "hye",
["Eastern Balochi"] = "bgp",
["Eastern Mansi"] = "mns-eas",
["Eastern Old Japanese"] = "ojp-eas",
["Eastern Tati"] = "xme-ttc-eas",
["Ebrahimabadi"] = "tks-ebr",
["Ecclesiastical Latin"] = "la-ecc",
["Elean Greek"] = "grc-ela",
["Emamzada Esmaili"] = "fay-eze",
["Epic Greek"] = "grc-epi",
["Epic Sanskrit"] = "sa-epi",
["Esfarvarini"] = "tks-esf",
["European Portuguese"] = "pt-PT",
["Fante Akan"] = "fat",
["Farizandi"] = "xme-far",
["Fascian Ladin"] = "lld-fas",
["Fayyumic Coptic"] = "cop-fay",
["Fodom Ladin"] = "lld-fod",
["Fogo Kabuverdianu"] = "kea-fog",
["Fornes Ladin"] = "lld-for",
["Frankish"] = "frk",
["Fumani"] = "tly-fum",
["Fuyu Kyrgyz"] = "kjh-fyu",
["Föhr North Frisian"] = "frr-foh",
["Föhr-Amrum North Frisian"] = "frr-fam",
["Gangwon Korean"] = "ko-gan",
["Gascon"] = "oc-gas",
["Gavkoshaki"] = "fay-gav",
["Gazi"] = "gzi",
["Geordie"] = "en-geo",
["German Low German"] = "nds-de",
["Ghat"] = "thv-ght",
["Gheg Albanian"] = "aln",
["Gherdëina Ladin"] = "lld-ghe",
["Goesharde North Frisian"] = "frr-goe",
["Golyad"] = "bat-gol",
["Goral"] = "pl-gor",
["Greater Polish"] = "pl-gre",
["Greenlandic Norse"] = "non-grn",
["Gronings"] = "gos",
["Guangzhou Cantonese"] = "yue-gua",
["Guanzhong Mandarin"] = "cmn-gua",
["Guernsey Norman"] = "nrf-grn",
["Guilin Mandarin"] = "cmn-gui",
["Gurjara Apabhramsa"] = "inc-agu",
["Gyeonggi Korean"] = "ko-gyg",
["Gyeongsang Korean"] = "ko-gys",
["Hailu Hakka"] = "hak-hai",
["Halligen North Frisian"] = "frr-hal",
["Hamadani"] = "xme-ham",
["Hamgyong Korean"] = "ko-ham",
["Hangzhounese"] = "wuu-han",
["Hanjani"] = "xme-han",
["Hanyu Pinyin"] = "cmn-pinyin",
["Harar Oromo"] = "hae",
["Hatran Aramaic"] = "arc-hat",
["Havigannada"] = "kn-hav",
["Hazaragi"] = "haz",
["Heligoland North Frisian"] = "frr-hel",
["එළු ප්රාකෘත"] = "pra-hel",
["Hengyang Xiang"] = "hsn-hya",
["Hengzhou Xiang"] = "hsn-hzh",
["Hermopolitan Coptic"] = "cop-her",
["High Alemannic German"] = "gsw-hig",
["Highest Alemannic German"] = "gsw-hst",
["Hokkaido Ainu"] = "ain-hok",
["Hong Kong Cantonese"] = "yue-HK",
["Hong Kong English"] = "en-HK",
["Hong Kong Hakka"] = "hak-HK",
["Hormozi"] = "bsg-hor",
["Houlu Min"] = "nan-hou",
["Hui'an Hokkien"] = "nan-hui",
["Huiyang Hakka"] = "hak-hui",
["Huvadhu Dhivehi"] = "dv-huv",
["Hwanghae Korean"] = "ko-hwa",
["Imperial Aramaic"] = "arc-imp",
["Indian English"] = "en-IN",
["Insular North Frisian"] = "frr-ins",
["Insular Scots"] = "sco-ins",
["Ionic Greek"] = "grc-ion",
["Iranian Persian"] = "fa-ira",
["Irish English"] = "en-IE",
["Iron Ossetian"] = "os-iro",
["Isfahani"] = "xme-isf",
["Israeli Hebrew"] = "he-IL",
["Jadrani"] = "ps-jad",
["Jeolla Korean"] = "ko-jeo",
["Jersey Norman"] = "nrf-jer",
["Jewish Babylonian Aramaic"] = "tmr",
["Jewish Literary Aramaic"] = "arc-jla",
["Jewish Palestinian Aramaic"] = "jpa",
["Jianghuai Mandarin"] = "cmn-jhu",
["Jinjiang Hokkien"] = "nan-jin",
["Jirofti"] = "rdb-jir",
["Jowshaqani"] = "xme-jow",
["Judeo-Arabic"] = "jrb",
["Kafroni"] = "xme-kaf",
["Kahaki"] = "xme-kah",
["Kahnuji"] = "rdb-kah",
["Kajkavian Serbo-Croatian"] = "kjv",
["Kakari"] = "ps-kak",
["Kaliarda"] = "el-kal",
["Kamviri"] = "xvi",
["Kandahari"] = "ps-kan",
["Kaniguram"] = "oru-kan",
["Karganrudi"] = "tly-kar",
["Karrharde North Frisian"] = "frr-kar",
["Kashani"] = "xme-kas",
["Kasmiri Apabhramsa"] = "inc-aka",
["Katchal"] = "ncb-kat",
["Katharevousa"] = "el-kth",
["Kathiyawadi"] = "gu-kat",
["Kativiri"] = "bsh-kat",
["Kentish Middle English"] = "enm-ken",
["Kentish Old English"] = "ang-ken",
["Kermani"] = "xme-krm",
["Kesehi"] = "xme-kes",
["Khalkha Mongolian"] = "mn-kha",
["Khamba"] = "kbg",
["Khams Tibetan"] = "khg",
["Khargi"] = "fay-kar",
["Khasa Prakrit"] = "pra-kha",
["Khatak"] = "ps-xat",
["Khiaraji"] = "tks-xia",
["Khollari"] = "fay-kho",
["Khorchin Mongolian"] = "mn-khr",
["Khoznini"] = "tks-xoz",
["Khufi"] = "sgh-xuf",
["Khughni"] = "sgh-xug",
["Khughni-Bajui"] = "sgh-xgb",
["Khunsari"] = "kfm",
["Khuri"] = "xme-xur",
["Khuzestani Arabic"] = "acm-khu",
["Kinmenese Hokkien"] = "nan-kin",
["Kinyarwanda"] = "rw-kin",
["Kirundi"] = "rw-run",
["Koine Greek"] = "grc-koi",
["Komjani"] = "xme-kom",
["Kondazi"] = "fay-kon",
["Korean Classical Chinese"] = "lzh-KO",
["Kosena"] = "kze",
["Kromanti"] = "alv-kro",
["Kundagannada"] = "kn-kun",
["Kuril Ainu"] = "ain-kur",
["Kölsch"] = "ksh",
["Languedocien"] = "oc-lan",
["Lanuvian"] = "itc-lan",
["Lanyin Mandarin"] = "cmn-lan",
["Late Babylonian"] = "akk-lbb",
["Late Brythonic"] = "bry-lat",
["Late Egyptian"] = "egy-lat",
["Late Khotanese"] = "kho-lat",
["Late Latin"] = "la-lat",
["Late Middle Chinese"] = "ltc-lat",
["Late Middle Japanese"] = "ja-mid-lat",
["Late Middle Mongol"] = "xng-lat",
["Late Middle Persian"] = "pal-lat",
["Late Old Chinese"] = "och-lat",
["Late Old Korean"] = "oko-lat",
["Late Old Ossetic"] = "oos-lat",
["Late Old Persian"] = "peo-lat",
["Late Old Swedish"] = "gmq-osw-lat",
["Late Sogdian"] = "sog-lat",
["Law French"] = "xno-law",
["Lebanese North Levantine Arabic"] = "apc-leb",
["Lesser Polish"] = "pl-les",
["Limousin"] = "oc-lim",
["Lisan ud-Dawat Gujarati"] = "gu-lda",
["Literary Cantonese"] = "yue-lit",
["Literary Chinese"] = "lzh-lit",
["Logar"] = "oru-log",
["Logudorese"] = "sc-src",
["Lombardic"] = "lng",
["Loudi Xiang"] = "hsn-lou",
["Louisiana French"] = "fr-lou",
["Low Alemannic German"] = "gsw-low",
["Low Prussian"] = "nds-lpr",
["Lucanian"] = "osc-luc",
["Lunfardo"] = "es-lun",
["Lycopolitan Coptic"] = "cop-lyc",
["Língua Geral Amazônica"] = "tpw-lga",
["Língua Geral Paulista"] = "tpw-lgp",
["Maasina Fulfulde"] = "ffm",
["Magadhi Prakrit"] = "pra-mag",
["Mahallati"] = "xme-mah",
["Maharastri Apabhramsa"] = "inc-ama",
["Maharastri Prakrit"] = "pra-mah",
["Mahsudi"] = "ps-mah",
["Mainland North Frisian"] = "frr-mai",
["Maio Kabuverdianu"] = "kea-mai",
["Malaysian Huiyang Hakka"] = "hak-hui-MY",
["Malaysian Mandarin"] = "cmn-MY",
["Mamluk-Kipchak"] = "qwm-mam",
["Manichaean Middle Persian"] = "xmn",
["Manx English"] = "en-IM",
["Masali"] = "tly-msa",
["Masarami"] = "fay-mas",
["Masovian Polish"] = "pl-mas",
["Masulei"] = "tly-msu",
["Medan Hokkien"] = "nan-med",
["Medieval Hebrew"] = "he-med",
["Medieval Latin"] = "la-med",
["Medieval Sinhalese"] = "si-med",
["Medieval Tashelhit"] = "shi-med",
["Meixian Hakka"] = "hak-mei",
["Mercian Old English"] = "ang-mer",
["Mexican Spanish"] = "es-MX",
["Meymehi"] = "xme-mey",
["Middle Assyrian"] = "akk-mas",
["Middle Babylonian"] = "akk-mbb",
["Middle Belarusian"] = "zle-mbe",
["Middle Bulgarian"] = "cu-bgm",
["Middle Chuvash"] = "cv-mid",
["Middle Egyptian"] = "egy-mid",
["Middle Elamite"] = "elx-mid",
["Middle Georgian"] = "ka-mid",
["Middle Hindi"] = "hi-mid",
["Middle Japanese"] = "ja-mid",
["Middle Konkani"] = "kok-mid",
["Middle Polish"] = "zlw-mpl",
["Middle Russian"] = "zle-mru",
["Middle Tamil"] = "ta-mid",
["Middle Ukrainian"] = "zle-muk",
["Minabi"] = "bsg-min",
["Mishnaic Hebrew"] = "he-mis",
["Missouri French"] = "fr-mis",
["Mitanni"] = "inc-mit",
["Moldovan"] = "ro-MD",
["Mooring North Frisian"] = "frr-moo",
["Mulaku Dhivehi"] = "dv-mul",
["Mumviri"] = "bsh-mum",
["Nabataean Aramaic"] = "arc-nab",
["Nalbaria Kamrupi Assamese"] = "as-nkm",
["Nancowry"] = "ncb-nan",
["Nanjing Mandarin"] = "cmn-nan",
["Naraqi"] = "xme-nar",
["Nashalji"] = "xme-nas",
["Natanzi"] = "ntz",
["Nayini"] = "nyq",
["Neo-Assyrian"] = "akk-nas",
["Neo-Babylonian"] = "akk-nbb",
["Neo-Elamite"] = "elx-neo",
["Neo-Middle Egyptian"] = "egy-nmi",
["New Latin"] = "la-new",
["New Sanskrit"] = "sa-neo",
["New Xiang"] = "hsn-new",
["New Zealand English"] = "en-NZ",
["Nigerian Fulfulde"] = "fuv",
["Ningbonese"] = "wuu-nin",
["Noakhailla Vaṅga Bengali"] = "bn-nvn",
["Nones Ladin"] = "lld-non",
["North Alaskan Inupiatun"] = "esi",
["North American ඉංග්රීසි"] = "en-NNN",
["North Karelian"] = "krl-nor",
["North Lebanese North Levantine Arabic"] = "apc-nle",
["North Wales Welsh"] = "cy-nor",
["Northeastern Mandarin"] = "cmn-noe",
["Northeastern Pashto"] = "ps-nea",
["Northern Irish English"] = "en-GB-NIR",
["Northern Kankanaey"] = "xnn",
["Northern Lushootseed"] = "lut-nor",
["Northern Middle English"] = "enm-nor",
["Northern Scots"] = "sco-nor",
["Northern Talysh"] = "tly-nor",
["Northern Tati"] = "xme-ttc-nor",
["Northern Wu"] = "wuu-nor",
["Northumbrian Old English"] = "ang-nor",
["Northwest Alaskan Inupiatun"] = "esk",
["Northwestern Pashto"] = "ps-nwe",
["Nuorese"] = "sc-nuo",
["Nushabadi"] = "xme-nus",
["Odri"] = "pra-odr",
["Old Akkadian"] = "akk-old",
["Old Aramaic"] = "arc-old",
["Old Assyrian"] = "akk-oas",
["Old Avestan"] = "ae-old",
["Old Azari"] = "xme-azr",
["Old Babylonian"] = "akk-obb",
["Old Braj"] = "bra-old",
["Old Chuvash"] = "cv-old",
["Old Coptic"] = "cop-old",
["Old Dhivehi"] = "dv-old",
["Old East Norse"] = "non-oen",
["Old Egyptian"] = "egy-old",
["Old Elamite"] = "elx-old",
["Old Emilian"] = "egl-old",
["Old Franco-Provençal"] = "frp-old",
["Old Friulian"] = "fur-old",
["Old Italian"] = "roa-oit",
["Old Kazeruni"] = "fay-kzo",
["Old Khotanese"] = "kho-old",
["Old Kirghiz"] = "otk-kir",
["Old Konkani"] = "kok-old",
["Old Latin"] = "itc-ola",
["Old Ligurian"] = "lij-old",
["Old Lombard"] = "lmo-old",
["Old Malay"] = "ms-old",
["Old Mohawk"] = "iro-omo",
["Old Neapolitan"] = "nap-old",
["Old Northern French"] = "fro-nor",
["Old Onondaga"] = "iro-oon",
["Old Ossetic"] = "oos",
["Old Piedmontese"] = "pms-old",
["Old Provençal"] = "oc-pro-old",
["Old Pskovian"] = "zle-ops",
["Old Romagnol"] = "rgn-old",
["Old Romansh"] = "rm-old",
["Old Sardinian"] = "sc-old",
["Old Shirazi"] = "fay-sho",
["Old Sicilian"] = "scn-old",
["Old Tagalog"] = "tl-old",
["Old Thai"] = "th-old",
["Old Venetan"] = "vec-old",
["Old Wendat"] = "iro-ohu",
["Old West Norse"] = "non-own",
["Old Xiang"] = "hsn-old",
["Ontenu"] = "ont",
["Opuntian Locrian"] = "grc-opl",
["Ordos Mongolian"] = "mn-ord",
["Orkhon Turkic"] = "otk-ork",
["Orma"] = "orc",
["Oroshori"] = "sgh-oro",
["Oxyrhynchite Coptic"] = "cop-oxy",
["Ozolian Locrian"] = "grc-ozl",
["Paisaci Prakrit"] = "pra-pai",
["Palasbaria Kamrupi Assamese"] = "as-pkm",
["Palatine German"] = "pfl",
["Paleo-Balkan"] = "qsb-bal",
["Paleo-Hispanic"] = "qsb-ibe",
["Palladius"] = "cmn-palladius",
["Palmyrene Aramaic"] = "arc-pal",
["Pamphylian Greek"] = "grc-pam",
["Paphian Greek"] = "el-pap",
["Papuni"] = "fay-pap",
["Penang Hokkien"] = "nan-pen",
["Peruvian Spanish"] = "es-PE",
["Peshawari"] = "ps-pes",
["Philippine Hokkien"] = "nan-hbl-PH",
["Philippine Mandarin"] = "cmn-PH",
["Philippine Spanish"] = "es-PH",
["Picard Old French"] = "fro-pic",
["Polari"] = "pld",
["Postal Romanization"] = "zh-postal",
["Pracya"] = "pra-pra",
["Praenestine"] = "itc-pra",
["Pre-Angkorian Old Khmer"] = "okz-pre",
["Pre-Classical Chinese"] = "lzh-pre",
["Pre-Greek"] = "qsb-grc",
["Proto-Anglo-Frisian"] = "gmw-afr-pro",
["Proto-Arinic"] = "qfa-yrn-pro",
["Proto-Baltic"] = "bat-pro",
["Proto-Bulgar"] = "trk-bul-pro",
["Proto-Common Turkic"] = "trk-cmn-pro",
["Proto-Finno-Permic"] = "urj-fpr-pro",
["Proto-Finno-Ugric"] = "fiu-pro",
["Proto-Ketic"] = "qfa-yke-pro",
["Proto-Kottic"] = "qfa-yko-pro",
["Proto-Lycopolitan Coptic"] = "cop-ply",
["Proto-Middle Indo-Aryan"] = "inc-ash-pro",
["Proto-New Indo-Aryan"] = "pra-pro",
["Proto-North Sea Germanic"] = "gmw-nsg-pro",
["Proto-Oghur"] = "trk-ogr-pro",
["Proto-Oghuz"] = "trk-ogz-pro",
["Proto-Pumpokolic"] = "qfa-ypm-pro",
["Proto-Romance"] = "roa-pro",
["Proto-Tibeto-Burman"] = "tbq-pro",
["Provençal"] = "oc-pro",
["Puerto Rican Spanish"] = "es-PR",
["Pulaar"] = "fuc",
["Pular"] = "fuf",
["Puter Romansh"] = "rm-put",
["Pyongan Korean"] = "ko-pyo",
["Qalhari"] = "xme-qal",
["Qashqai"] = "qxq",
["Qianlu Min"] = "nan-qia",
["Qohrudi"] = "xme-qoh",
["Quanzhou Hokkien"] = "nan-qua",
["Renaissance Latin"] = "la-ren",
["Rigvedic Sanskrit"] = "sa-rig",
["Rioplatense Spanish"] = "es-AR",
["Roshani"] = "sgh-ros",
["Roshani-Khufi"] = "sgh-rsx",
["Rumantsch Grischun"] = "rm-gri",
["Russian Church Slavonic"] = "zls-chs-ru",
["Sabari"] = "pra-sab",
["Sagzabadi"] = "tks-sag",
["Sahidic Coptic"] = "cop-sah",
["Saint Dominican Creole French"] = "ht-sdm",
["Sakari"] = "pra-sak",
["Sakhalin Ainu"] = "ain-sak",
["Sal Kabuverdianu"] = "kea-sal",
["Sallands"] = "sdz",
["Samghani"] = "fay-sam",
["Samnite"] = "osc-sam",
["Santiago Kabuverdianu"] = "kea-san",
["Santo Antão Kabuverdianu"] = "kea-saa",
["Sauraseni Apabhramsa"] = "inc-asa",
["Sauraseni Prakrit"] = "pra-sau",
["Scottish English"] = "en-GB-SCT",
["Sedehi"] = "xme-sed",
["Shadi Wu"] = "wuu-chm",
["Shandarmani"] = "tly-san",
["Shanghainese"] = "wuu-sha",
["Shangsi Zhuang"] = "tai-shz",
["Sher"] = "ps-ser",
["Shirazi"] = "fay-shr",
["Shuadit"] = "oc-jud",
["Silesian East Central German"] = "sli",
["Singapore Hokkien"] = "nan-hbl-SG",
["Singapore Mandarin"] = "cmn-SG",
["Sixian Hakka"] = "hak-six",
["Skagit"] = "ska",
["Snohomish"] = "sno",
["Soi"] = "soj",
["Sorkhi"] = "fay-sor",
["Sotavento Kabuverdianu"] = "kea-sot",
["South African English"] = "en-ZA",
["South Karelian"] = "krl-sou",
["South Lebanese North Levantine Arabic"] = "apc-sle",
["South Wales Welsh"] = "cy-sou",
["Southeastern Pashto"] = "ps-sea",
["Southern Balochi"] = "bcc",
["Southern Lushootseed"] = "slh",
["Southern Malaysian Hokkien"] = "nan-spm",
["Southern Middle English"] = "enm-sou",
["Southern Scots"] = "sco-sou",
["Southern Talysh"] = "tly-sou",
["Southern Tati"] = "xme-ttc-sou",
["Southwestern Mandarin"] = "cmn-sow",
["Southwestern Pashto"] = "ps-swe",
["Standard Babylonian"] = "akk-stb",
["Stellingwerfs"] = "stl",
["Suevic"] = "gem-sue",
["Sukhothai Old Thai"] = "th-suk",
["Surmiran Romansh"] = "rm-srm",
["Sursilvan Romansh"] = "rm-srs",
["Sutsilvan Romansh"] = "rm-sut",
["Suzhounese"] = "wuu-suz",
["Swiss French"] = "fr-CH",
["Switzerland German"] = "de-CH",
["Switzerland Italian"] = "it-CH",
["Sylt North Frisian"] = "frr-syl",
["Syrian North Levantine Arabic"] = "apc-syr",
["São Nicolau Kabuverdianu"] = "kea-sni",
["São Vicente Kabuverdianu"] = "kea-svi",
["Taiwanese Hakka"] = "hak-TW",
["Taiwanese Hokkien"] = "nan-hbl-TW",
["Taiwanese Mandarin"] = "cmn-TW",
["Takestani"] = "tks-tak",
["Takka Apabhramsa"] = "inc-ata",
["Taleshdulabi"] = "tly-tal",
["Tamahaq"] = "thv",
["Tamasheq"] = "taq",
["Tarehi"] = "xme-trh",
["Tari"] = "xme-tar",
["Tawellemmet"] = "ttq",
["Tayert"] = "thz",
["Thessalian Greek"] = "grc-ths",
["Tianjin Mandarin"] = "cmn-tia",
["Tong'an Hokkien"] = "nan-ton",
["Tongyong Pinyin"] = "cmn-tongyong",
["Torlakian Serbo-Croatian"] = "sh-tor",
["Tosk Albanian"] = "als",
["Traditional Chinese poetry"] = "lzh-shi",
["Transalpine Gaulish"] = "xtg",
["Tseku"] = "tsk",
["Tularudi"] = "tly-tul",
["Twents"] = "twd",
["Twi Akan"] = "tw",
["Ukrainian Church Slavonic"] = "zls-chs-uk",
["Ulster English"] = "en-uls",
["Ulster Scots"] = "sco-uls",
["United States Spanish"] = "es-US",
["Upper Saxon German"] = "sxu",
["Vafsi"] = "vaf",
["Valencian"] = "ca-val",
["Vallader Romansh"] = "rm-val",
["Valujerdi"] = "xme-val",
["Varani"] = "xme-var",
["Varzenehi"] = "xme-vrz",
["Vedic Sanskrit"] = "vsn",
["Veluws"] = "vel",
["Venezuelan Spanish"] = "es-VE",
["Viennese German"] = "de-AT-vie",
["Vietnamese Classical Chinese"] = "lzh-VI",
["Viryal Chuvash"] = "cv-vir",
["Vivaro-Alpine"] = "oc-viv",
["Volga Bulgar"] = "xbo-vol",
["Vonishuni"] = "xme-von",
["Vracada Apabhramsa"] = "inc-avr",
["Vulgar Latin"] = "la-vul",
["Waata"] = "ssn",
["Wade–Giles"] = "cmn-wadegiles",
["Walser German"] = "wae",
["Wasa"] = "wss",
["Waziri"] = "ps-waz",
["Welsh English"] = "en-GB-WLS",
["Wenzhounese"] = "wuu-wen",
["West Midland Middle English"] = "enm-wmi",
["West Saxon Old English"] = "ang-wsx",
["Western Armenian"] = "hyw",
["Western Balochi"] = "bgn",
["Western Mansi"] = "mns-wes",
["Western Niger Fulfulde"] = "fuh",
["Western Punjabi"] = "pnb",
["Western Tati"] = "xme-ttc-wes",
["Westphalian"] = "wep",
["Wiedingharde North Frisian"] = "frr-wie",
["Written vernacular Cantonese"] = "yue-wvc",
["Written vernacular Mandarin"] = "cmn-wvc",
["Written vernacular Taishanese"] = "zhx-tai-wvc",
["Wuhan Mandarin"] = "cmn-wuh",
["Xiamen Hokkien"] = "nan-xia",
["Xining Mandarin"] = "cmn-xin",
["Yangzhou Mandarin"] = "cmn-yan",
["Yarandi"] = "xme-yar",
["Yazdi"] = "xme-yaz",
["Yongchun Hokkien"] = "nan-yon",
["Younger Avestan"] = "ae-yng",
["Yukjin Korean"] = "ko-yuk",
["Zarphatic"] = "zrp",
["Zefrehi"] = "xme-zef",
["Zhangping Hokkien"] = "nan-zhp",
["Zhangzhou Hokkien"] = "nan-zha",
["Zhao'an Hakka"] = "hak-zha",
["Zhao'an Hokkien"] = "nan-zho",
["Zhongshan Min"] = "zhx-zho",
["Zori"] = "xme-zor",
["Zoroastrian Dari"] = "gbz",
["taxonomic name"] = "mul-tax",
["the BMAC substrate"] = "qsb-bma",
}
gum81phh0bmnxrgk59szz3bplgfgaom
Module:etymology languages/code to canonical name
828
137337
234834
228625
2026-05-17T18:28:58Z
en>Theknightwho
0
[[MediaWiki:UpdateLanguageNameAndCode.js|updated]]
234834
Scribunto
text/plain
return {
["aae"] = "Arbëresh Albanian",
["aat"] = "Arvanitika Albanian",
["abr"] = "Abron",
["acm-khu"] = "Khuzestani Arabic",
["act"] = "Achterhoeks",
["adx"] = "Amdo Tibetan",
["ae-old"] = "Old Avestan",
["ae-yng"] = "Younger Avestan",
["ain-hok"] = "Hokkaido Ainu",
["ain-kur"] = "Kuril Ainu",
["ain-sak"] = "Sakhalin Ainu",
["akk-lbb"] = "Late Babylonian",
["akk-mas"] = "Middle Assyrian",
["akk-mbb"] = "Middle Babylonian",
["akk-nas"] = "Neo-Assyrian",
["akk-nbb"] = "Neo-Babylonian",
["akk-oas"] = "Old Assyrian",
["akk-obb"] = "Old Babylonian",
["akk-old"] = "Old Akkadian",
["akk-stb"] = "Standard Babylonian",
["aln"] = "Gheg Albanian",
["als"] = "Tosk Albanian",
["alv-kro"] = "Kromanti",
["ang-ang"] = "Anglian Old English",
["ang-ken"] = "Kentish Old English",
["ang-mer"] = "Mercian Old English",
["ang-nor"] = "Northumbrian Old English",
["ang-wsx"] = "West Saxon Old English",
["apc-ale"] = "Aleppine North Levantine Arabic",
["apc-dam"] = "Damascene North Levantine Arabic",
["apc-leb"] = "Lebanese North Levantine Arabic",
["apc-nle"] = "North Lebanese North Levantine Arabic",
["apc-sle"] = "South Lebanese North Levantine Arabic",
["apc-syr"] = "Syrian North Levantine Arabic",
["arc-bib"] = "Biblical Aramaic",
["arc-cpa"] = "Christian Palestinian Aramaic",
["arc-hat"] = "Hatran Aramaic",
["arc-imp"] = "Imperial Aramaic",
["arc-jla"] = "Jewish Literary Aramaic",
["arc-nab"] = "Nabataean Aramaic",
["arc-old"] = "Old Aramaic",
["arc-pal"] = "Palmyrene Aramaic",
["as-bkm"] = "Barpetia Kamrupi Assamese",
["as-nkm"] = "Nalbaria Kamrupi Assamese",
["as-pkm"] = "Palasbaria Kamrupi Assamese",
["atn"] = "Ashtiani",
["az-cls"] = "Classical Azerbaijani",
["bat-dni"] = "Dnieper Baltic",
["bat-gol"] = "Golyad",
["bat-pro"] = "Proto-Baltic",
["bcc"] = "Southern Balochi",
["bew-kot"] = "Betawi Kota",
["bgn"] = "Western Balochi",
["bgp"] = "Eastern Balochi",
["bn-dvn"] = "Dhakaiya Vaṅga Bengali",
["bn-nvn"] = "Noakhailla Vaṅga Bengali",
["bnt-cmn"] = "Common Bantu",
["bra-old"] = "Old Braj",
["bry-ear"] = "Early Brythonic",
["bry-lat"] = "Late Brythonic",
["bsg-ban"] = "Bandari",
["bsg-hor"] = "Hormozi",
["bsg-min"] = "Minabi",
["bsh-kat"] = "Kativiri",
["bsh-mum"] = "Mumviri",
["ca-val"] = "Valencian",
["ckm"] = "Chakavian Serbo-Croatian",
["cls"] = "Classical Sanskrit",
["cmn-MY"] = "Malaysian Mandarin",
["cmn-PH"] = "Philippine Mandarin",
["cmn-SG"] = "Singapore Mandarin",
["cmn-TW"] = "Taiwanese Mandarin",
["cmn-bec"] = "Beijingic Mandarin",
["cmn-bei"] = "Beijing Mandarin",
["cmn-cep"] = "Central Plains Mandarin",
["cmn-ear"] = "Early Mandarin",
["cmn-gua"] = "Guanzhong Mandarin",
["cmn-gui"] = "Guilin Mandarin",
["cmn-jhu"] = "Jianghuai Mandarin",
["cmn-lan"] = "Lanyin Mandarin",
["cmn-nan"] = "Nanjing Mandarin",
["cmn-noe"] = "Northeastern Mandarin",
["cmn-palladius"] = "Palladius",
["cmn-pinyin"] = "Hanyu Pinyin",
["cmn-sow"] = "Southwestern Mandarin",
["cmn-tia"] = "Tianjin Mandarin",
["cmn-tongyong"] = "Tongyong Pinyin",
["cmn-wadegiles"] = "Wade–Giles",
["cmn-wuh"] = "Wuhan Mandarin",
["cmn-wvc"] = "Written vernacular Mandarin",
["cmn-xin"] = "Xining Mandarin",
["cmn-yan"] = "Yangzhou Mandarin",
["cop-akh"] = "Akhmimic Coptic",
["cop-boh"] = "Bohairic Coptic",
["cop-fay"] = "Fayyumic Coptic",
["cop-ggg"] = "Coptic Dialect G",
["cop-her"] = "Hermopolitan Coptic",
["cop-jjj"] = "Coptic Dialect J",
["cop-kkk"] = "Coptic Dialect K",
["cop-lyc"] = "Lycopolitan Coptic",
["cop-old"] = "Old Coptic",
["cop-oxy"] = "Oxyrhynchite Coptic",
["cop-ply"] = "Proto-Lycopolitan Coptic",
["cop-ppp"] = "Coptic Dialect P",
["cop-sah"] = "Sahidic Coptic",
["crh-dbj"] = "Dobrujan Tatar",
["cs-ear"] = "Early Modern Czech",
["cu-bgm"] = "Middle Bulgarian",
["cv-ana"] = "Anatri Chuvash",
["cv-mid"] = "Middle Chuvash",
["cv-old"] = "Old Chuvash",
["cv-vir"] = "Viryal Chuvash",
["cy-nor"] = "North Wales Welsh",
["cy-sou"] = "South Wales Welsh",
["de-AT"] = "Austrian German",
["de-AT-vie"] = "Viennese German",
["de-CH"] = "Switzerland German",
["de-bal"] = "Baltic German",
["de-ear"] = "Early New High German",
["drt"] = "Drents",
["dv-add"] = "Addu Dhivehi",
["dv-huv"] = "Huvadhu Dhivehi",
["dv-mul"] = "Mulaku Dhivehi",
["dv-old"] = "Old Dhivehi",
["egl-old"] = "Old Emilian",
["egy-lat"] = "Late Egyptian",
["egy-mid"] = "Middle Egyptian",
["egy-nmi"] = "Neo-Middle Egyptian",
["egy-old"] = "Old Egyptian",
["el-crt"] = "Cretan Greek",
["el-cyp"] = "Cypriot Greek",
["el-kal"] = "Kaliarda",
["el-kth"] = "Katharevousa",
["el-pap"] = "Paphian Greek",
["elx-ach"] = "Achaemenid Elamite",
["elx-mid"] = "Middle Elamite",
["elx-neo"] = "Neo-Elamite",
["elx-old"] = "Old Elamite",
["en-AU"] = "Australian English",
["en-CA"] = "Canadian English",
["en-GB"] = "British English",
["en-GB-NIR"] = "Northern Irish English",
["en-GB-SCT"] = "Scottish English",
["en-GB-WLS"] = "Welsh English",
["en-HK"] = "Hong Kong English",
["en-IE"] = "Irish English",
["en-IM"] = "Manx English",
["en-IN"] = "Indian English",
["en-NNN"] = "North American English",
["en-NZ"] = "New Zealand English",
["en-US"] = "American English",
["en-US-CA"] = "California English",
["en-ZA"] = "South African English",
["en-aae"] = "Australian Aboriginal English",
["en-ear"] = "Early Modern English",
["en-geo"] = "Geordie",
["en-uls"] = "Ulster English",
["enm-emi"] = "East Midland Middle English",
["enm-esc"] = "Early Scots",
["enm-ken"] = "Kentish Middle English",
["enm-nor"] = "Northern Middle English",
["enm-sou"] = "Southern Middle English",
["enm-wmi"] = "West Midland Middle English",
["es-AR"] = "Rioplatense Spanish",
["es-BO"] = "Bolivian Spanish",
["es-CL"] = "Chilean Spanish",
["es-CO"] = "Colombian Spanish",
["es-CU"] = "Cuban Spanish",
["es-MX"] = "Mexican Spanish",
["es-PE"] = "Peruvian Spanish",
["es-PH"] = "Philippine Spanish",
["es-PR"] = "Puerto Rican Spanish",
["es-US"] = "United States Spanish",
["es-VE"] = "Venezuelan Spanish",
["es-ear"] = "Early Modern Spanish",
["es-lun"] = "Lunfardo",
["esi"] = "North Alaskan Inupiatun",
["esk"] = "Northwest Alaskan Inupiatun",
["fa-cls"] = "Classical Persian",
["fa-ear"] = "Early New Persian",
["fa-ira"] = "Iranian Persian",
["fat"] = "Fante Akan",
["fay-bsh"] = "Bushehri",
["fay-bur"] = "Burenjani",
["fay-dav"] = "Davani",
["fay-dsh"] = "Dashtaki",
["fay-eze"] = "Emamzada Esmaili",
["fay-gav"] = "Gavkoshaki",
["fay-kar"] = "Khargi",
["fay-kho"] = "Khollari",
["fay-kon"] = "Kondazi",
["fay-kzo"] = "Old Kazeruni",
["fay-mas"] = "Masarami",
["fay-pap"] = "Papuni",
["fay-sam"] = "Samghani",
["fay-sho"] = "Old Shirazi",
["fay-shr"] = "Shirazi",
["fay-sor"] = "Sorkhi",
["ffm"] = "Maasina Fulfulde",
["fiu-pro"] = "Proto-Finno-Ugric",
["fr-CA"] = "Canadian French",
["fr-CH"] = "Swiss French",
["fr-aca"] = "Acadian French",
["fr-lou"] = "Louisiana French",
["fr-mis"] = "Missouri French",
["frc"] = "Cajun French",
["frk"] = "Frankish",
["fro-nor"] = "Old Northern French",
["fro-pic"] = "Picard Old French",
["frp-old"] = "Old Franco-Provençal",
["frr-amr"] = "Amrum North Frisian",
["frr-fam"] = "Föhr-Amrum North Frisian",
["frr-foh"] = "Föhr North Frisian",
["frr-goe"] = "Goesharde North Frisian",
["frr-hal"] = "Halligen North Frisian",
["frr-hel"] = "Heligoland North Frisian",
["frr-ins"] = "Insular North Frisian",
["frr-kar"] = "Karrharde North Frisian",
["frr-mai"] = "Mainland North Frisian",
["frr-moo"] = "Mooring North Frisian",
["frr-syl"] = "Sylt North Frisian",
["frr-wie"] = "Wiedingharde North Frisian",
["frs"] = "East Frisian Low German",
["fub"] = "Adamawa Fulfulde",
["fuc"] = "Pulaar",
["fue"] = "Borgu Fulfulde",
["fuf"] = "Pular",
["fuh"] = "Western Niger Fulfulde",
["fui"] = "Bagirmi Fulfulde",
["fuq"] = "Central-Eastern Niger Fulfulde",
["fur-old"] = "Old Friulian",
["fuv"] = "Nigerian Fulfulde",
["gax"] = "Borana",
["gbz"] = "Zoroastrian Dari",
["gem-sue"] = "Suevic",
["gkm"] = "Byzantine Greek",
["gmq-osw-lat"] = "Late Old Swedish",
["gmw-afr-pro"] = "Proto-Anglo-Frisian",
["gmw-nsg-pro"] = "Proto-North Sea Germanic",
["gos"] = "Gronings",
["grc-aeo"] = "Aeolic Greek",
["grc-arc"] = "Arcadian Greek",
["grc-arp"] = "Arcadocypriot Greek",
["grc-att"] = "Attic Greek",
["grc-boi"] = "Boeotian Greek",
["grc-cyp"] = "Cypriot Ancient Greek",
["grc-dor"] = "Doric Greek",
["grc-ela"] = "Elean Greek",
["grc-epi"] = "Epic Greek",
["grc-ion"] = "Ionic Greek",
["grc-koi"] = "Koine Greek",
["grc-kre"] = "Cretan Ancient Greek",
["grc-opl"] = "Opuntian Locrian",
["grc-ozl"] = "Ozolian Locrian",
["grc-pam"] = "Pamphylian Greek",
["grc-ths"] = "Thessalian Greek",
["gsw-FR-als"] = "Alsatian Alemannic German",
["gsw-hig"] = "High Alemannic German",
["gsw-hst"] = "Highest Alemannic German",
["gsw-low"] = "Low Alemannic German",
["gu-kat"] = "Kathiyawadi",
["gu-lda"] = "Lisan ud-Dawat Gujarati",
["gzi"] = "Gazi",
["hae"] = "Harar Oromo",
["hak-HK"] = "Hong Kong Hakka",
["hak-TW"] = "Taiwanese Hakka",
["hak-dab"] = "Dabu Hakka",
["hak-eam"] = "Early Modern Hakka",
["hak-hai"] = "Hailu Hakka",
["hak-hui"] = "Huiyang Hakka",
["hak-hui-MY"] = "Malaysian Huiyang Hakka",
["hak-mei"] = "Meixian Hakka",
["hak-six"] = "Sixian Hakka",
["hak-zha"] = "Zhao'an Hakka",
["haz"] = "Hazaragi",
["hbo"] = "Biblical Hebrew",
["he-IL"] = "Israeli Hebrew",
["he-med"] = "Medieval Hebrew",
["he-mis"] = "Mishnaic Hebrew",
["hi-mid"] = "Middle Hindi",
["hi-mum"] = "Bombay Hindi",
["hsn-hya"] = "Hengyang Xiang",
["hsn-hzh"] = "Hengzhou Xiang",
["hsn-lou"] = "Loudi Xiang",
["hsn-new"] = "New Xiang",
["hsn-old"] = "Old Xiang",
["ht-sdm"] = "Saint Dominican Creole French",
["hye"] = "Eastern Armenian",
["hyw"] = "Western Armenian",
["inc-aav"] = "Avahattha",
["inc-agu"] = "Gurjara Apabhramsa",
["inc-aka"] = "Kasmiri Apabhramsa",
["inc-ama"] = "Maharastri Apabhramsa",
["inc-asa"] = "Sauraseni Apabhramsa",
["inc-ash-pro"] = "Proto-Middle Indo-Aryan",
["inc-ata"] = "Takka Apabhramsa",
["inc-avr"] = "Vracada Apabhramsa",
["inc-mit"] = "Mitanni",
["iro-ohu"] = "Old Wendat",
["iro-omo"] = "Old Mohawk",
["iro-oon"] = "Old Onondaga",
["it-CH"] = "Switzerland Italian",
["itc-lan"] = "Lanuvian",
["itc-ola"] = "Old Latin",
["itc-pra"] = "Praenestine",
["ja-cla"] = "Classical Japanese",
["ja-ear"] = "Early Modern Japanese",
["ja-mid"] = "Middle Japanese",
["ja-mid-ear"] = "Early Middle Japanese",
["ja-mid-lat"] = "Late Middle Japanese",
["jpa"] = "Jewish Palestinian Aramaic",
["jrb"] = "Judeo-Arabic",
["ka-mid"] = "Middle Georgian",
["kbg"] = "Khamba",
["kea-alu"] = "ALUPEC Kabuverdianu",
["kea-bar"] = "Barlavento Kabuverdianu",
["kea-bra"] = "Brava Kabuverdianu",
["kea-bvi"] = "Boa Vista Kabuverdianu",
["kea-fog"] = "Fogo Kabuverdianu",
["kea-mai"] = "Maio Kabuverdianu",
["kea-saa"] = "Santo Antão Kabuverdianu",
["kea-sal"] = "Sal Kabuverdianu",
["kea-san"] = "Santiago Kabuverdianu",
["kea-sni"] = "São Nicolau Kabuverdianu",
["kea-sot"] = "Sotavento Kabuverdianu",
["kea-svi"] = "São Vicente Kabuverdianu",
["kfm"] = "Khunsari",
["khg"] = "Khams Tibetan",
["kho-lat"] = "Late Khotanese",
["kho-old"] = "Old Khotanese",
["kjh-fyu"] = "Fuyu Kyrgyz",
["kjv"] = "Kajkavian Serbo-Croatian",
["klj-arg"] = "Arghu",
["kn-hav"] = "Havigannada",
["kn-kun"] = "Kundagannada",
["ko-cen"] = "Central Korean",
["ko-chu"] = "Chungcheong Korean",
["ko-gan"] = "Gangwon Korean",
["ko-gyg"] = "Gyeonggi Korean",
["ko-gys"] = "Gyeongsang Korean",
["ko-ham"] = "Hamgyong Korean",
["ko-hwa"] = "Hwanghae Korean",
["ko-jeo"] = "Jeolla Korean",
["ko-pyo"] = "Pyongan Korean",
["ko-yuk"] = "Yukjin Korean",
["kok-mid"] = "Middle Konkani",
["kok-old"] = "Old Konkani",
["krl-nor"] = "North Karelian",
["krl-sou"] = "South Karelian",
["ksh"] = "Kölsch",
["kze"] = "Kosena",
["la-afr"] = "African Romance",
["la-cla"] = "Classical Latin",
["la-con"] = "Contemporary Latin",
["la-ecc"] = "Ecclesiastical Latin",
["la-eme"] = "Early Medieval Latin",
["la-lat"] = "Late Latin",
["la-med"] = "Medieval Latin",
["la-new"] = "New Latin",
["la-ren"] = "Renaissance Latin",
["la-vul"] = "Vulgar Latin",
["lij-old"] = "Old Ligurian",
["lld-amp"] = "Ampezan Ladin",
["lld-bad"] = "Badiot Ladin",
["lld-cad"] = "Cadorino Ladin",
["lld-fas"] = "Fascian Ladin",
["lld-fod"] = "Fodom Ladin",
["lld-for"] = "Fornes Ladin",
["lld-ghe"] = "Gherdëina Ladin",
["lld-non"] = "Nones Ladin",
["lmo-old"] = "Old Lombard",
["lng"] = "Lombardic",
["ltc-ear"] = "Early Middle Chinese",
["ltc-lat"] = "Late Middle Chinese",
["lut-nor"] = "Northern Lushootseed",
["lzh-KO"] = "Korean Classical Chinese",
["lzh-VI"] = "Vietnamese Classical Chinese",
["lzh-cii"] = "Ci",
["lzh-cmn"] = "Classical Mandarin",
["lzh-cmn-TW"] = "Classical Taiwanese Mandarin",
["lzh-lit"] = "Literary Chinese",
["lzh-pre"] = "Pre-Classical Chinese",
["lzh-shi"] = "Traditional Chinese poetry",
["lzh-tai"] = "Classical Taishanese",
["lzh-yue"] = "Classical Cantonese",
["mn-cha"] = "Chakhar Mongolian",
["mn-kha"] = "Khalkha Mongolian",
["mn-khr"] = "Khorchin Mongolian",
["mn-ord"] = "Ordos Mongolian",
["mns-eas"] = "Eastern Mansi",
["mns-wes"] = "Western Mansi",
["ms-cla"] = "Classical Malay",
["ms-old"] = "Old Malay",
["mul-tax"] = "taxonomic name",
["nan-anx"] = "Anxi Hokkien",
["nan-cha"] = "Changtai Hokkien",
["nan-hbl-PH"] = "Philippine Hokkien",
["nan-hbl-SG"] = "Singapore Hokkien",
["nan-hbl-TW"] = "Taiwanese Hokkien",
["nan-hou"] = "Houlu Min",
["nan-hui"] = "Hui'an Hokkien",
["nan-jin"] = "Jinjiang Hokkien",
["nan-kin"] = "Kinmenese Hokkien",
["nan-med"] = "Medan Hokkien",
["nan-pen"] = "Penang Hokkien",
["nan-qia"] = "Qianlu Min",
["nan-qua"] = "Quanzhou Hokkien",
["nan-spm"] = "Southern Malaysian Hokkien",
["nan-ton"] = "Tong'an Hokkien",
["nan-xia"] = "Xiamen Hokkien",
["nan-yon"] = "Yongchun Hokkien",
["nan-zha"] = "Zhangzhou Hokkien",
["nan-zho"] = "Zhao'an Hokkien",
["nan-zhp"] = "Zhangping Hokkien",
["nap-old"] = "Old Neapolitan",
["ncb-cam"] = "Camorta",
["ncb-kat"] = "Katchal",
["ncb-nan"] = "Nancowry",
["nds-de"] = "German Low German",
["nds-lpr"] = "Low Prussian",
["nds-nl"] = "Dutch Low Saxon",
["nl-BE"] = "Belgian Dutch",
["non-grn"] = "Greenlandic Norse",
["non-oen"] = "Old East Norse",
["non-own"] = "Old West Norse",
["nrf-grn"] = "Guernsey Norman",
["nrf-jer"] = "Jersey Norman",
["ntz"] = "Natanzi",
["nyq"] = "Nayini",
["oc-ara"] = "Aranese",
["oc-auv"] = "Auvergnat",
["oc-gas"] = "Gascon",
["oc-jud"] = "Shuadit",
["oc-lan"] = "Languedocien",
["oc-lim"] = "Limousin",
["oc-pro"] = "Provençal",
["oc-pro-old"] = "Old Provençal",
["oc-viv"] = "Vivaro-Alpine",
["och-ear"] = "Early Old Chinese",
["och-lat"] = "Late Old Chinese",
["ojp-eas"] = "Eastern Old Japanese",
["okm-ear"] = "Early Middle Korean",
["oko-lat"] = "Late Old Korean",
["okz-ang"] = "Angkorian Old Khmer",
["okz-pre"] = "Pre-Angkorian Old Khmer",
["ont"] = "Ontenu",
["oos"] = "Old Ossetic",
["oos-ear"] = "Early Old Ossetic",
["oos-lat"] = "Late Old Ossetic",
["orc"] = "Orma",
["oru-kan"] = "Kaniguram",
["oru-log"] = "Logar",
["os-dig"] = "Digor Ossetian",
["os-iro"] = "Iron Ossetian",
["osc-luc"] = "Lucanian",
["osc-sam"] = "Samnite",
["otk-kir"] = "Old Kirghiz",
["otk-ork"] = "Orkhon Turkic",
["pal-ear"] = "Early Middle Persian",
["pal-lat"] = "Late Middle Persian",
["peo-ear"] = "Early Old Persian",
["peo-lat"] = "Late Old Persian",
["pfl"] = "Palatine German",
["pl-gor"] = "Goral",
["pl-gre"] = "Greater Polish",
["pl-les"] = "Lesser Polish",
["pl-mas"] = "Masovian Polish",
["pld"] = "Polari",
["pms-old"] = "Old Piedmontese",
["pnb"] = "Western Punjabi",
["pra-abh"] = "Abhiri",
["pra-ard"] = "Ardhamagadhi Prakrit",
["pra-ava"] = "Avanti",
["pra-bah"] = "Bahliki",
["pra-can"] = "Candali",
["pra-dak"] = "Daksinatya",
["pra-dra"] = "Dramili",
["pra-hel"] = "Helu Prakrit",
["pra-kha"] = "Khasa Prakrit",
["pra-mag"] = "Magadhi Prakrit",
["pra-mah"] = "Maharastri Prakrit",
["pra-odr"] = "Odri",
["pra-pai"] = "Paisaci Prakrit",
["pra-pra"] = "Pracya",
["pra-pro"] = "Proto-New Indo-Aryan",
["pra-sab"] = "Sabari",
["pra-sak"] = "Sakari",
["pra-sau"] = "Sauraseni Prakrit",
["prs"] = "Dari",
["ps-afr"] = "Afridi",
["ps-ban"] = "Bannu",
["ps-bng"] = "Bangash",
["ps-cgi"] = "Central Ghilzay",
["ps-jad"] = "Jadrani",
["ps-kak"] = "Kakari",
["ps-kan"] = "Kandahari",
["ps-mah"] = "Mahsudi",
["ps-nea"] = "Northeastern Pashto",
["ps-nwe"] = "Northwestern Pashto",
["ps-pes"] = "Peshawari",
["ps-sea"] = "Southeastern Pashto",
["ps-ser"] = "Sher",
["ps-swe"] = "Southwestern Pashto",
["ps-waz"] = "Waziri",
["ps-xat"] = "Khatak",
["pse-bsm"] = "Besemah",
["pt-BR"] = "Brazilian Portuguese",
["pt-PT"] = "European Portuguese",
["qfa-yke-pro"] = "Proto-Ketic",
["qfa-yko-pro"] = "Proto-Kottic",
["qfa-ypm-pro"] = "Proto-Pumpokolic",
["qfa-yrn-pro"] = "Proto-Arinic",
["qsb-bal"] = "Paleo-Balkan",
["qsb-bma"] = "the BMAC substrate",
["qsb-grc"] = "Pre-Greek",
["qsb-ibe"] = "Paleo-Hispanic",
["qwm-arm"] = "Armeno-Kipchak",
["qwm-cum"] = "Cuman",
["qwm-mam"] = "Mamluk-Kipchak",
["qxq"] = "Qashqai",
["rdb-jir"] = "Jirofti",
["rdb-kah"] = "Kahnuji",
["rgn-old"] = "Old Romagnol",
["rm-gri"] = "Rumantsch Grischun",
["rm-old"] = "Old Romansh",
["rm-put"] = "Puter Romansh",
["rm-srm"] = "Surmiran Romansh",
["rm-srs"] = "Sursilvan Romansh",
["rm-sut"] = "Sutsilvan Romansh",
["rm-val"] = "Vallader Romansh",
["ro-MD"] = "Moldovan",
["roa-oit"] = "Old Italian",
["roa-pro"] = "Proto-Romance",
["rw-kin"] = "Kinyarwanda",
["rw-run"] = "Kirundi",
["sa-bhs"] = "Buddhist Hybrid Sanskrit",
["sa-bra"] = "Brahmanic Sanskrit",
["sa-epi"] = "Epic Sanskrit",
["sa-neo"] = "New Sanskrit",
["sa-rig"] = "Rigvedic Sanskrit",
["sc-nuo"] = "Nuorese",
["sc-old"] = "Old Sardinian",
["sc-src"] = "Logudorese",
["sc-sro"] = "Campidanese",
["scn-old"] = "Old Sicilian",
["sco-ins"] = "Insular Scots",
["sco-nor"] = "Northern Scots",
["sco-sou"] = "Southern Scots",
["sco-uls"] = "Ulster Scots",
["sdz"] = "Sallands",
["sgh-baj"] = "Bajui",
["sgh-bar"] = "Bartangi",
["sgh-bro"] = "Bartangi-Oroshori",
["sgh-oro"] = "Oroshori",
["sgh-ros"] = "Roshani",
["sgh-rsx"] = "Roshani-Khufi",
["sgh-xgb"] = "Khughni-Bajui",
["sgh-xuf"] = "Khufi",
["sgh-xug"] = "Khughni",
["sh-tor"] = "Torlakian Serbo-Croatian",
["shi-med"] = "Medieval Tashelhit",
["si-med"] = "Medieval Sinhalese",
["ska"] = "Skagit",
["slh"] = "Southern Lushootseed",
["sli"] = "Silesian East Central German",
["sno"] = "Snohomish",
["sog-ear"] = "Early Sogdian",
["sog-lat"] = "Late Sogdian",
["soj"] = "Soi",
["ssn"] = "Waata",
["stl"] = "Stellingwerfs",
["sxu"] = "Upper Saxon German",
["ta-mid"] = "Middle Tamil",
["tai-shz"] = "Shangsi Zhuang",
["taq"] = "Tamasheq",
["tbq-pro"] = "Proto-Tibeto-Burman",
["th-ayu"] = "Ayutthaya Old Thai",
["th-old"] = "Old Thai",
["th-suk"] = "Sukhothai Old Thai",
["thv"] = "Tamahaq",
["thv-ght"] = "Ghat",
["thz"] = "Tayert",
["tks-cal"] = "Chali Tati",
["tks-dan"] = "Danesfani",
["tks-ebr"] = "Ebrahimabadi",
["tks-esf"] = "Esfarvarini",
["tks-sag"] = "Sagzabadi",
["tks-tak"] = "Takestani",
["tks-xia"] = "Khiaraji",
["tks-xoz"] = "Khoznini",
["tl-cls"] = "Classical Tagalog",
["tl-old"] = "Old Tagalog",
["tly-anb"] = "Anbarani",
["tly-asa"] = "Asalemi",
["tly-aze"] = "Azerbaijani Talysh",
["tly-cen"] = "Central Talysh",
["tly-fum"] = "Fumani",
["tly-kar"] = "Karganrudi",
["tly-msa"] = "Masali",
["tly-msu"] = "Masulei",
["tly-nor"] = "Northern Talysh",
["tly-san"] = "Shandarmani",
["tly-sou"] = "Southern Talysh",
["tly-tal"] = "Taleshdulabi",
["tly-tul"] = "Tularudi",
["tmr"] = "Jewish Babylonian Aramaic",
["tpw-lga"] = "Língua Geral Amazônica",
["tpw-lgp"] = "Língua Geral Paulista",
["tr-CY"] = "Cypriot Turkish",
["trk-bul-pro"] = "Proto-Bulgar",
["trk-cmn-pro"] = "Proto-Common Turkic",
["trk-ogr-pro"] = "Proto-Oghur",
["trk-ogz-pro"] = "Proto-Oghuz",
["tsk"] = "Tseku",
["ttq"] = "Tawellemmet",
["tw"] = "Twi Akan",
["tw-aku"] = "Akuapem Twi",
["tw-asa"] = "Asante Twi",
["twd"] = "Twents",
["uk-CA"] = "Canadian Ukrainian",
["urj-fpr-pro"] = "Proto-Finno-Permic",
["uz-afg"] = "Afghan Uzbek",
["vaf"] = "Vafsi",
["vec-old"] = "Old Venetan",
["vel"] = "Veluws",
["vsn"] = "Vedic Sanskrit",
["wae"] = "Walser German",
["wep"] = "Westphalian",
["wss"] = "Wasa",
["wuu-chm"] = "Shadi Wu",
["wuu-han"] = "Hangzhounese",
["wuu-nin"] = "Ningbonese",
["wuu-nor"] = "Northern Wu",
["wuu-sha"] = "Shanghainese",
["wuu-suz"] = "Suzhounese",
["wuu-wen"] = "Wenzhounese",
["xaq"] = "Aquitanian",
["xbo-dan"] = "Danube Bulgar",
["xbo-vol"] = "Volga Bulgar",
["xcg"] = "Cisalpine Gaulish",
["xfa-cap"] = "Capenate",
["xh-bha"] = "Bhaca",
["xme-aby"] = "Abyanehi",
["xme-abz"] = "Abuzeydabadi",
["xme-amo"] = "Amorehi",
["xme-ana"] = "Anaraki",
["xme-ard"] = "Ardestani",
["xme-azr"] = "Old Azari",
["xme-bdr"] = "Badrudi",
["xme-bid"] = "Bidhandi",
["xme-bij"] = "Bijagani",
["xme-bor"] = "Borujerdi",
["xme-cim"] = "Chimehi",
["xme-del"] = "Delijani",
["xme-far"] = "Farizandi",
["xme-ham"] = "Hamadani",
["xme-han"] = "Hanjani",
["xme-isf"] = "Isfahani",
["xme-jow"] = "Jowshaqani",
["xme-kaf"] = "Kafroni",
["xme-kah"] = "Kahaki",
["xme-kas"] = "Kashani",
["xme-kes"] = "Kesehi",
["xme-kom"] = "Komjani",
["xme-krm"] = "Kermani",
["xme-mah"] = "Mahallati",
["xme-mey"] = "Meymehi",
["xme-nar"] = "Naraqi",
["xme-nas"] = "Nashalji",
["xme-nus"] = "Nushabadi",
["xme-qal"] = "Qalhari",
["xme-qoh"] = "Qohrudi",
["xme-sed"] = "Sedehi",
["xme-tar"] = "Tari",
["xme-trh"] = "Tarehi",
["xme-ttc-cen"] = "Central Tati",
["xme-ttc-eas"] = "Eastern Tati",
["xme-ttc-nor"] = "Northern Tati",
["xme-ttc-sou"] = "Southern Tati",
["xme-ttc-wes"] = "Western Tati",
["xme-val"] = "Valujerdi",
["xme-var"] = "Varani",
["xme-von"] = "Vonishuni",
["xme-vrz"] = "Varzenehi",
["xme-xur"] = "Khuri",
["xme-yar"] = "Yarandi",
["xme-yaz"] = "Yazdi",
["xme-zef"] = "Zefrehi",
["xme-zor"] = "Zori",
["xmn"] = "Manichaean Middle Persian",
["xng-ear"] = "Early Middle Mongol",
["xng-lat"] = "Late Middle Mongol",
["xnn"] = "Northern Kankanaey",
["xno"] = "Anglo-Norman",
["xno-law"] = "Law French",
["xtg"] = "Transalpine Gaulish",
["xvi"] = "Kamviri",
["yue-HK"] = "Hong Kong Cantonese",
["yue-gua"] = "Guangzhou Cantonese",
["yue-lit"] = "Literary Cantonese",
["yue-wvc"] = "Written vernacular Cantonese",
["zh-postal"] = "Postal Romanization",
["zhx-dan"] = "Danzhou Chinese",
["zhx-tai-wvc"] = "Written vernacular Taishanese",
["zhx-zho"] = "Zhongshan Min",
["zle-mbe"] = "Middle Belarusian",
["zle-mru"] = "Middle Russian",
["zle-muk"] = "Middle Ukrainian",
["zle-ops"] = "Old Pskovian",
["zls-chs-ru"] = "Russian Church Slavonic",
["zls-chs-uk"] = "Ukrainian Church Slavonic",
["zlw-mpl"] = "Middle Polish",
["zrp"] = "Zarphatic",
}
53ni4cd6865w3lj7xl9r67m9zabkxy1
234835
234834
2026-05-24T08:17:44Z
Lee
19
[[:en:Module:etymology_languages/code_to_canonical_name]] වෙතින් එක් සංශෝධනයක්
234834
Scribunto
text/plain
return {
["aae"] = "Arbëresh Albanian",
["aat"] = "Arvanitika Albanian",
["abr"] = "Abron",
["acm-khu"] = "Khuzestani Arabic",
["act"] = "Achterhoeks",
["adx"] = "Amdo Tibetan",
["ae-old"] = "Old Avestan",
["ae-yng"] = "Younger Avestan",
["ain-hok"] = "Hokkaido Ainu",
["ain-kur"] = "Kuril Ainu",
["ain-sak"] = "Sakhalin Ainu",
["akk-lbb"] = "Late Babylonian",
["akk-mas"] = "Middle Assyrian",
["akk-mbb"] = "Middle Babylonian",
["akk-nas"] = "Neo-Assyrian",
["akk-nbb"] = "Neo-Babylonian",
["akk-oas"] = "Old Assyrian",
["akk-obb"] = "Old Babylonian",
["akk-old"] = "Old Akkadian",
["akk-stb"] = "Standard Babylonian",
["aln"] = "Gheg Albanian",
["als"] = "Tosk Albanian",
["alv-kro"] = "Kromanti",
["ang-ang"] = "Anglian Old English",
["ang-ken"] = "Kentish Old English",
["ang-mer"] = "Mercian Old English",
["ang-nor"] = "Northumbrian Old English",
["ang-wsx"] = "West Saxon Old English",
["apc-ale"] = "Aleppine North Levantine Arabic",
["apc-dam"] = "Damascene North Levantine Arabic",
["apc-leb"] = "Lebanese North Levantine Arabic",
["apc-nle"] = "North Lebanese North Levantine Arabic",
["apc-sle"] = "South Lebanese North Levantine Arabic",
["apc-syr"] = "Syrian North Levantine Arabic",
["arc-bib"] = "Biblical Aramaic",
["arc-cpa"] = "Christian Palestinian Aramaic",
["arc-hat"] = "Hatran Aramaic",
["arc-imp"] = "Imperial Aramaic",
["arc-jla"] = "Jewish Literary Aramaic",
["arc-nab"] = "Nabataean Aramaic",
["arc-old"] = "Old Aramaic",
["arc-pal"] = "Palmyrene Aramaic",
["as-bkm"] = "Barpetia Kamrupi Assamese",
["as-nkm"] = "Nalbaria Kamrupi Assamese",
["as-pkm"] = "Palasbaria Kamrupi Assamese",
["atn"] = "Ashtiani",
["az-cls"] = "Classical Azerbaijani",
["bat-dni"] = "Dnieper Baltic",
["bat-gol"] = "Golyad",
["bat-pro"] = "Proto-Baltic",
["bcc"] = "Southern Balochi",
["bew-kot"] = "Betawi Kota",
["bgn"] = "Western Balochi",
["bgp"] = "Eastern Balochi",
["bn-dvn"] = "Dhakaiya Vaṅga Bengali",
["bn-nvn"] = "Noakhailla Vaṅga Bengali",
["bnt-cmn"] = "Common Bantu",
["bra-old"] = "Old Braj",
["bry-ear"] = "Early Brythonic",
["bry-lat"] = "Late Brythonic",
["bsg-ban"] = "Bandari",
["bsg-hor"] = "Hormozi",
["bsg-min"] = "Minabi",
["bsh-kat"] = "Kativiri",
["bsh-mum"] = "Mumviri",
["ca-val"] = "Valencian",
["ckm"] = "Chakavian Serbo-Croatian",
["cls"] = "Classical Sanskrit",
["cmn-MY"] = "Malaysian Mandarin",
["cmn-PH"] = "Philippine Mandarin",
["cmn-SG"] = "Singapore Mandarin",
["cmn-TW"] = "Taiwanese Mandarin",
["cmn-bec"] = "Beijingic Mandarin",
["cmn-bei"] = "Beijing Mandarin",
["cmn-cep"] = "Central Plains Mandarin",
["cmn-ear"] = "Early Mandarin",
["cmn-gua"] = "Guanzhong Mandarin",
["cmn-gui"] = "Guilin Mandarin",
["cmn-jhu"] = "Jianghuai Mandarin",
["cmn-lan"] = "Lanyin Mandarin",
["cmn-nan"] = "Nanjing Mandarin",
["cmn-noe"] = "Northeastern Mandarin",
["cmn-palladius"] = "Palladius",
["cmn-pinyin"] = "Hanyu Pinyin",
["cmn-sow"] = "Southwestern Mandarin",
["cmn-tia"] = "Tianjin Mandarin",
["cmn-tongyong"] = "Tongyong Pinyin",
["cmn-wadegiles"] = "Wade–Giles",
["cmn-wuh"] = "Wuhan Mandarin",
["cmn-wvc"] = "Written vernacular Mandarin",
["cmn-xin"] = "Xining Mandarin",
["cmn-yan"] = "Yangzhou Mandarin",
["cop-akh"] = "Akhmimic Coptic",
["cop-boh"] = "Bohairic Coptic",
["cop-fay"] = "Fayyumic Coptic",
["cop-ggg"] = "Coptic Dialect G",
["cop-her"] = "Hermopolitan Coptic",
["cop-jjj"] = "Coptic Dialect J",
["cop-kkk"] = "Coptic Dialect K",
["cop-lyc"] = "Lycopolitan Coptic",
["cop-old"] = "Old Coptic",
["cop-oxy"] = "Oxyrhynchite Coptic",
["cop-ply"] = "Proto-Lycopolitan Coptic",
["cop-ppp"] = "Coptic Dialect P",
["cop-sah"] = "Sahidic Coptic",
["crh-dbj"] = "Dobrujan Tatar",
["cs-ear"] = "Early Modern Czech",
["cu-bgm"] = "Middle Bulgarian",
["cv-ana"] = "Anatri Chuvash",
["cv-mid"] = "Middle Chuvash",
["cv-old"] = "Old Chuvash",
["cv-vir"] = "Viryal Chuvash",
["cy-nor"] = "North Wales Welsh",
["cy-sou"] = "South Wales Welsh",
["de-AT"] = "Austrian German",
["de-AT-vie"] = "Viennese German",
["de-CH"] = "Switzerland German",
["de-bal"] = "Baltic German",
["de-ear"] = "Early New High German",
["drt"] = "Drents",
["dv-add"] = "Addu Dhivehi",
["dv-huv"] = "Huvadhu Dhivehi",
["dv-mul"] = "Mulaku Dhivehi",
["dv-old"] = "Old Dhivehi",
["egl-old"] = "Old Emilian",
["egy-lat"] = "Late Egyptian",
["egy-mid"] = "Middle Egyptian",
["egy-nmi"] = "Neo-Middle Egyptian",
["egy-old"] = "Old Egyptian",
["el-crt"] = "Cretan Greek",
["el-cyp"] = "Cypriot Greek",
["el-kal"] = "Kaliarda",
["el-kth"] = "Katharevousa",
["el-pap"] = "Paphian Greek",
["elx-ach"] = "Achaemenid Elamite",
["elx-mid"] = "Middle Elamite",
["elx-neo"] = "Neo-Elamite",
["elx-old"] = "Old Elamite",
["en-AU"] = "Australian English",
["en-CA"] = "Canadian English",
["en-GB"] = "British English",
["en-GB-NIR"] = "Northern Irish English",
["en-GB-SCT"] = "Scottish English",
["en-GB-WLS"] = "Welsh English",
["en-HK"] = "Hong Kong English",
["en-IE"] = "Irish English",
["en-IM"] = "Manx English",
["en-IN"] = "Indian English",
["en-NNN"] = "North American English",
["en-NZ"] = "New Zealand English",
["en-US"] = "American English",
["en-US-CA"] = "California English",
["en-ZA"] = "South African English",
["en-aae"] = "Australian Aboriginal English",
["en-ear"] = "Early Modern English",
["en-geo"] = "Geordie",
["en-uls"] = "Ulster English",
["enm-emi"] = "East Midland Middle English",
["enm-esc"] = "Early Scots",
["enm-ken"] = "Kentish Middle English",
["enm-nor"] = "Northern Middle English",
["enm-sou"] = "Southern Middle English",
["enm-wmi"] = "West Midland Middle English",
["es-AR"] = "Rioplatense Spanish",
["es-BO"] = "Bolivian Spanish",
["es-CL"] = "Chilean Spanish",
["es-CO"] = "Colombian Spanish",
["es-CU"] = "Cuban Spanish",
["es-MX"] = "Mexican Spanish",
["es-PE"] = "Peruvian Spanish",
["es-PH"] = "Philippine Spanish",
["es-PR"] = "Puerto Rican Spanish",
["es-US"] = "United States Spanish",
["es-VE"] = "Venezuelan Spanish",
["es-ear"] = "Early Modern Spanish",
["es-lun"] = "Lunfardo",
["esi"] = "North Alaskan Inupiatun",
["esk"] = "Northwest Alaskan Inupiatun",
["fa-cls"] = "Classical Persian",
["fa-ear"] = "Early New Persian",
["fa-ira"] = "Iranian Persian",
["fat"] = "Fante Akan",
["fay-bsh"] = "Bushehri",
["fay-bur"] = "Burenjani",
["fay-dav"] = "Davani",
["fay-dsh"] = "Dashtaki",
["fay-eze"] = "Emamzada Esmaili",
["fay-gav"] = "Gavkoshaki",
["fay-kar"] = "Khargi",
["fay-kho"] = "Khollari",
["fay-kon"] = "Kondazi",
["fay-kzo"] = "Old Kazeruni",
["fay-mas"] = "Masarami",
["fay-pap"] = "Papuni",
["fay-sam"] = "Samghani",
["fay-sho"] = "Old Shirazi",
["fay-shr"] = "Shirazi",
["fay-sor"] = "Sorkhi",
["ffm"] = "Maasina Fulfulde",
["fiu-pro"] = "Proto-Finno-Ugric",
["fr-CA"] = "Canadian French",
["fr-CH"] = "Swiss French",
["fr-aca"] = "Acadian French",
["fr-lou"] = "Louisiana French",
["fr-mis"] = "Missouri French",
["frc"] = "Cajun French",
["frk"] = "Frankish",
["fro-nor"] = "Old Northern French",
["fro-pic"] = "Picard Old French",
["frp-old"] = "Old Franco-Provençal",
["frr-amr"] = "Amrum North Frisian",
["frr-fam"] = "Föhr-Amrum North Frisian",
["frr-foh"] = "Föhr North Frisian",
["frr-goe"] = "Goesharde North Frisian",
["frr-hal"] = "Halligen North Frisian",
["frr-hel"] = "Heligoland North Frisian",
["frr-ins"] = "Insular North Frisian",
["frr-kar"] = "Karrharde North Frisian",
["frr-mai"] = "Mainland North Frisian",
["frr-moo"] = "Mooring North Frisian",
["frr-syl"] = "Sylt North Frisian",
["frr-wie"] = "Wiedingharde North Frisian",
["frs"] = "East Frisian Low German",
["fub"] = "Adamawa Fulfulde",
["fuc"] = "Pulaar",
["fue"] = "Borgu Fulfulde",
["fuf"] = "Pular",
["fuh"] = "Western Niger Fulfulde",
["fui"] = "Bagirmi Fulfulde",
["fuq"] = "Central-Eastern Niger Fulfulde",
["fur-old"] = "Old Friulian",
["fuv"] = "Nigerian Fulfulde",
["gax"] = "Borana",
["gbz"] = "Zoroastrian Dari",
["gem-sue"] = "Suevic",
["gkm"] = "Byzantine Greek",
["gmq-osw-lat"] = "Late Old Swedish",
["gmw-afr-pro"] = "Proto-Anglo-Frisian",
["gmw-nsg-pro"] = "Proto-North Sea Germanic",
["gos"] = "Gronings",
["grc-aeo"] = "Aeolic Greek",
["grc-arc"] = "Arcadian Greek",
["grc-arp"] = "Arcadocypriot Greek",
["grc-att"] = "Attic Greek",
["grc-boi"] = "Boeotian Greek",
["grc-cyp"] = "Cypriot Ancient Greek",
["grc-dor"] = "Doric Greek",
["grc-ela"] = "Elean Greek",
["grc-epi"] = "Epic Greek",
["grc-ion"] = "Ionic Greek",
["grc-koi"] = "Koine Greek",
["grc-kre"] = "Cretan Ancient Greek",
["grc-opl"] = "Opuntian Locrian",
["grc-ozl"] = "Ozolian Locrian",
["grc-pam"] = "Pamphylian Greek",
["grc-ths"] = "Thessalian Greek",
["gsw-FR-als"] = "Alsatian Alemannic German",
["gsw-hig"] = "High Alemannic German",
["gsw-hst"] = "Highest Alemannic German",
["gsw-low"] = "Low Alemannic German",
["gu-kat"] = "Kathiyawadi",
["gu-lda"] = "Lisan ud-Dawat Gujarati",
["gzi"] = "Gazi",
["hae"] = "Harar Oromo",
["hak-HK"] = "Hong Kong Hakka",
["hak-TW"] = "Taiwanese Hakka",
["hak-dab"] = "Dabu Hakka",
["hak-eam"] = "Early Modern Hakka",
["hak-hai"] = "Hailu Hakka",
["hak-hui"] = "Huiyang Hakka",
["hak-hui-MY"] = "Malaysian Huiyang Hakka",
["hak-mei"] = "Meixian Hakka",
["hak-six"] = "Sixian Hakka",
["hak-zha"] = "Zhao'an Hakka",
["haz"] = "Hazaragi",
["hbo"] = "Biblical Hebrew",
["he-IL"] = "Israeli Hebrew",
["he-med"] = "Medieval Hebrew",
["he-mis"] = "Mishnaic Hebrew",
["hi-mid"] = "Middle Hindi",
["hi-mum"] = "Bombay Hindi",
["hsn-hya"] = "Hengyang Xiang",
["hsn-hzh"] = "Hengzhou Xiang",
["hsn-lou"] = "Loudi Xiang",
["hsn-new"] = "New Xiang",
["hsn-old"] = "Old Xiang",
["ht-sdm"] = "Saint Dominican Creole French",
["hye"] = "Eastern Armenian",
["hyw"] = "Western Armenian",
["inc-aav"] = "Avahattha",
["inc-agu"] = "Gurjara Apabhramsa",
["inc-aka"] = "Kasmiri Apabhramsa",
["inc-ama"] = "Maharastri Apabhramsa",
["inc-asa"] = "Sauraseni Apabhramsa",
["inc-ash-pro"] = "Proto-Middle Indo-Aryan",
["inc-ata"] = "Takka Apabhramsa",
["inc-avr"] = "Vracada Apabhramsa",
["inc-mit"] = "Mitanni",
["iro-ohu"] = "Old Wendat",
["iro-omo"] = "Old Mohawk",
["iro-oon"] = "Old Onondaga",
["it-CH"] = "Switzerland Italian",
["itc-lan"] = "Lanuvian",
["itc-ola"] = "Old Latin",
["itc-pra"] = "Praenestine",
["ja-cla"] = "Classical Japanese",
["ja-ear"] = "Early Modern Japanese",
["ja-mid"] = "Middle Japanese",
["ja-mid-ear"] = "Early Middle Japanese",
["ja-mid-lat"] = "Late Middle Japanese",
["jpa"] = "Jewish Palestinian Aramaic",
["jrb"] = "Judeo-Arabic",
["ka-mid"] = "Middle Georgian",
["kbg"] = "Khamba",
["kea-alu"] = "ALUPEC Kabuverdianu",
["kea-bar"] = "Barlavento Kabuverdianu",
["kea-bra"] = "Brava Kabuverdianu",
["kea-bvi"] = "Boa Vista Kabuverdianu",
["kea-fog"] = "Fogo Kabuverdianu",
["kea-mai"] = "Maio Kabuverdianu",
["kea-saa"] = "Santo Antão Kabuverdianu",
["kea-sal"] = "Sal Kabuverdianu",
["kea-san"] = "Santiago Kabuverdianu",
["kea-sni"] = "São Nicolau Kabuverdianu",
["kea-sot"] = "Sotavento Kabuverdianu",
["kea-svi"] = "São Vicente Kabuverdianu",
["kfm"] = "Khunsari",
["khg"] = "Khams Tibetan",
["kho-lat"] = "Late Khotanese",
["kho-old"] = "Old Khotanese",
["kjh-fyu"] = "Fuyu Kyrgyz",
["kjv"] = "Kajkavian Serbo-Croatian",
["klj-arg"] = "Arghu",
["kn-hav"] = "Havigannada",
["kn-kun"] = "Kundagannada",
["ko-cen"] = "Central Korean",
["ko-chu"] = "Chungcheong Korean",
["ko-gan"] = "Gangwon Korean",
["ko-gyg"] = "Gyeonggi Korean",
["ko-gys"] = "Gyeongsang Korean",
["ko-ham"] = "Hamgyong Korean",
["ko-hwa"] = "Hwanghae Korean",
["ko-jeo"] = "Jeolla Korean",
["ko-pyo"] = "Pyongan Korean",
["ko-yuk"] = "Yukjin Korean",
["kok-mid"] = "Middle Konkani",
["kok-old"] = "Old Konkani",
["krl-nor"] = "North Karelian",
["krl-sou"] = "South Karelian",
["ksh"] = "Kölsch",
["kze"] = "Kosena",
["la-afr"] = "African Romance",
["la-cla"] = "Classical Latin",
["la-con"] = "Contemporary Latin",
["la-ecc"] = "Ecclesiastical Latin",
["la-eme"] = "Early Medieval Latin",
["la-lat"] = "Late Latin",
["la-med"] = "Medieval Latin",
["la-new"] = "New Latin",
["la-ren"] = "Renaissance Latin",
["la-vul"] = "Vulgar Latin",
["lij-old"] = "Old Ligurian",
["lld-amp"] = "Ampezan Ladin",
["lld-bad"] = "Badiot Ladin",
["lld-cad"] = "Cadorino Ladin",
["lld-fas"] = "Fascian Ladin",
["lld-fod"] = "Fodom Ladin",
["lld-for"] = "Fornes Ladin",
["lld-ghe"] = "Gherdëina Ladin",
["lld-non"] = "Nones Ladin",
["lmo-old"] = "Old Lombard",
["lng"] = "Lombardic",
["ltc-ear"] = "Early Middle Chinese",
["ltc-lat"] = "Late Middle Chinese",
["lut-nor"] = "Northern Lushootseed",
["lzh-KO"] = "Korean Classical Chinese",
["lzh-VI"] = "Vietnamese Classical Chinese",
["lzh-cii"] = "Ci",
["lzh-cmn"] = "Classical Mandarin",
["lzh-cmn-TW"] = "Classical Taiwanese Mandarin",
["lzh-lit"] = "Literary Chinese",
["lzh-pre"] = "Pre-Classical Chinese",
["lzh-shi"] = "Traditional Chinese poetry",
["lzh-tai"] = "Classical Taishanese",
["lzh-yue"] = "Classical Cantonese",
["mn-cha"] = "Chakhar Mongolian",
["mn-kha"] = "Khalkha Mongolian",
["mn-khr"] = "Khorchin Mongolian",
["mn-ord"] = "Ordos Mongolian",
["mns-eas"] = "Eastern Mansi",
["mns-wes"] = "Western Mansi",
["ms-cla"] = "Classical Malay",
["ms-old"] = "Old Malay",
["mul-tax"] = "taxonomic name",
["nan-anx"] = "Anxi Hokkien",
["nan-cha"] = "Changtai Hokkien",
["nan-hbl-PH"] = "Philippine Hokkien",
["nan-hbl-SG"] = "Singapore Hokkien",
["nan-hbl-TW"] = "Taiwanese Hokkien",
["nan-hou"] = "Houlu Min",
["nan-hui"] = "Hui'an Hokkien",
["nan-jin"] = "Jinjiang Hokkien",
["nan-kin"] = "Kinmenese Hokkien",
["nan-med"] = "Medan Hokkien",
["nan-pen"] = "Penang Hokkien",
["nan-qia"] = "Qianlu Min",
["nan-qua"] = "Quanzhou Hokkien",
["nan-spm"] = "Southern Malaysian Hokkien",
["nan-ton"] = "Tong'an Hokkien",
["nan-xia"] = "Xiamen Hokkien",
["nan-yon"] = "Yongchun Hokkien",
["nan-zha"] = "Zhangzhou Hokkien",
["nan-zho"] = "Zhao'an Hokkien",
["nan-zhp"] = "Zhangping Hokkien",
["nap-old"] = "Old Neapolitan",
["ncb-cam"] = "Camorta",
["ncb-kat"] = "Katchal",
["ncb-nan"] = "Nancowry",
["nds-de"] = "German Low German",
["nds-lpr"] = "Low Prussian",
["nds-nl"] = "Dutch Low Saxon",
["nl-BE"] = "Belgian Dutch",
["non-grn"] = "Greenlandic Norse",
["non-oen"] = "Old East Norse",
["non-own"] = "Old West Norse",
["nrf-grn"] = "Guernsey Norman",
["nrf-jer"] = "Jersey Norman",
["ntz"] = "Natanzi",
["nyq"] = "Nayini",
["oc-ara"] = "Aranese",
["oc-auv"] = "Auvergnat",
["oc-gas"] = "Gascon",
["oc-jud"] = "Shuadit",
["oc-lan"] = "Languedocien",
["oc-lim"] = "Limousin",
["oc-pro"] = "Provençal",
["oc-pro-old"] = "Old Provençal",
["oc-viv"] = "Vivaro-Alpine",
["och-ear"] = "Early Old Chinese",
["och-lat"] = "Late Old Chinese",
["ojp-eas"] = "Eastern Old Japanese",
["okm-ear"] = "Early Middle Korean",
["oko-lat"] = "Late Old Korean",
["okz-ang"] = "Angkorian Old Khmer",
["okz-pre"] = "Pre-Angkorian Old Khmer",
["ont"] = "Ontenu",
["oos"] = "Old Ossetic",
["oos-ear"] = "Early Old Ossetic",
["oos-lat"] = "Late Old Ossetic",
["orc"] = "Orma",
["oru-kan"] = "Kaniguram",
["oru-log"] = "Logar",
["os-dig"] = "Digor Ossetian",
["os-iro"] = "Iron Ossetian",
["osc-luc"] = "Lucanian",
["osc-sam"] = "Samnite",
["otk-kir"] = "Old Kirghiz",
["otk-ork"] = "Orkhon Turkic",
["pal-ear"] = "Early Middle Persian",
["pal-lat"] = "Late Middle Persian",
["peo-ear"] = "Early Old Persian",
["peo-lat"] = "Late Old Persian",
["pfl"] = "Palatine German",
["pl-gor"] = "Goral",
["pl-gre"] = "Greater Polish",
["pl-les"] = "Lesser Polish",
["pl-mas"] = "Masovian Polish",
["pld"] = "Polari",
["pms-old"] = "Old Piedmontese",
["pnb"] = "Western Punjabi",
["pra-abh"] = "Abhiri",
["pra-ard"] = "Ardhamagadhi Prakrit",
["pra-ava"] = "Avanti",
["pra-bah"] = "Bahliki",
["pra-can"] = "Candali",
["pra-dak"] = "Daksinatya",
["pra-dra"] = "Dramili",
["pra-hel"] = "Helu Prakrit",
["pra-kha"] = "Khasa Prakrit",
["pra-mag"] = "Magadhi Prakrit",
["pra-mah"] = "Maharastri Prakrit",
["pra-odr"] = "Odri",
["pra-pai"] = "Paisaci Prakrit",
["pra-pra"] = "Pracya",
["pra-pro"] = "Proto-New Indo-Aryan",
["pra-sab"] = "Sabari",
["pra-sak"] = "Sakari",
["pra-sau"] = "Sauraseni Prakrit",
["prs"] = "Dari",
["ps-afr"] = "Afridi",
["ps-ban"] = "Bannu",
["ps-bng"] = "Bangash",
["ps-cgi"] = "Central Ghilzay",
["ps-jad"] = "Jadrani",
["ps-kak"] = "Kakari",
["ps-kan"] = "Kandahari",
["ps-mah"] = "Mahsudi",
["ps-nea"] = "Northeastern Pashto",
["ps-nwe"] = "Northwestern Pashto",
["ps-pes"] = "Peshawari",
["ps-sea"] = "Southeastern Pashto",
["ps-ser"] = "Sher",
["ps-swe"] = "Southwestern Pashto",
["ps-waz"] = "Waziri",
["ps-xat"] = "Khatak",
["pse-bsm"] = "Besemah",
["pt-BR"] = "Brazilian Portuguese",
["pt-PT"] = "European Portuguese",
["qfa-yke-pro"] = "Proto-Ketic",
["qfa-yko-pro"] = "Proto-Kottic",
["qfa-ypm-pro"] = "Proto-Pumpokolic",
["qfa-yrn-pro"] = "Proto-Arinic",
["qsb-bal"] = "Paleo-Balkan",
["qsb-bma"] = "the BMAC substrate",
["qsb-grc"] = "Pre-Greek",
["qsb-ibe"] = "Paleo-Hispanic",
["qwm-arm"] = "Armeno-Kipchak",
["qwm-cum"] = "Cuman",
["qwm-mam"] = "Mamluk-Kipchak",
["qxq"] = "Qashqai",
["rdb-jir"] = "Jirofti",
["rdb-kah"] = "Kahnuji",
["rgn-old"] = "Old Romagnol",
["rm-gri"] = "Rumantsch Grischun",
["rm-old"] = "Old Romansh",
["rm-put"] = "Puter Romansh",
["rm-srm"] = "Surmiran Romansh",
["rm-srs"] = "Sursilvan Romansh",
["rm-sut"] = "Sutsilvan Romansh",
["rm-val"] = "Vallader Romansh",
["ro-MD"] = "Moldovan",
["roa-oit"] = "Old Italian",
["roa-pro"] = "Proto-Romance",
["rw-kin"] = "Kinyarwanda",
["rw-run"] = "Kirundi",
["sa-bhs"] = "Buddhist Hybrid Sanskrit",
["sa-bra"] = "Brahmanic Sanskrit",
["sa-epi"] = "Epic Sanskrit",
["sa-neo"] = "New Sanskrit",
["sa-rig"] = "Rigvedic Sanskrit",
["sc-nuo"] = "Nuorese",
["sc-old"] = "Old Sardinian",
["sc-src"] = "Logudorese",
["sc-sro"] = "Campidanese",
["scn-old"] = "Old Sicilian",
["sco-ins"] = "Insular Scots",
["sco-nor"] = "Northern Scots",
["sco-sou"] = "Southern Scots",
["sco-uls"] = "Ulster Scots",
["sdz"] = "Sallands",
["sgh-baj"] = "Bajui",
["sgh-bar"] = "Bartangi",
["sgh-bro"] = "Bartangi-Oroshori",
["sgh-oro"] = "Oroshori",
["sgh-ros"] = "Roshani",
["sgh-rsx"] = "Roshani-Khufi",
["sgh-xgb"] = "Khughni-Bajui",
["sgh-xuf"] = "Khufi",
["sgh-xug"] = "Khughni",
["sh-tor"] = "Torlakian Serbo-Croatian",
["shi-med"] = "Medieval Tashelhit",
["si-med"] = "Medieval Sinhalese",
["ska"] = "Skagit",
["slh"] = "Southern Lushootseed",
["sli"] = "Silesian East Central German",
["sno"] = "Snohomish",
["sog-ear"] = "Early Sogdian",
["sog-lat"] = "Late Sogdian",
["soj"] = "Soi",
["ssn"] = "Waata",
["stl"] = "Stellingwerfs",
["sxu"] = "Upper Saxon German",
["ta-mid"] = "Middle Tamil",
["tai-shz"] = "Shangsi Zhuang",
["taq"] = "Tamasheq",
["tbq-pro"] = "Proto-Tibeto-Burman",
["th-ayu"] = "Ayutthaya Old Thai",
["th-old"] = "Old Thai",
["th-suk"] = "Sukhothai Old Thai",
["thv"] = "Tamahaq",
["thv-ght"] = "Ghat",
["thz"] = "Tayert",
["tks-cal"] = "Chali Tati",
["tks-dan"] = "Danesfani",
["tks-ebr"] = "Ebrahimabadi",
["tks-esf"] = "Esfarvarini",
["tks-sag"] = "Sagzabadi",
["tks-tak"] = "Takestani",
["tks-xia"] = "Khiaraji",
["tks-xoz"] = "Khoznini",
["tl-cls"] = "Classical Tagalog",
["tl-old"] = "Old Tagalog",
["tly-anb"] = "Anbarani",
["tly-asa"] = "Asalemi",
["tly-aze"] = "Azerbaijani Talysh",
["tly-cen"] = "Central Talysh",
["tly-fum"] = "Fumani",
["tly-kar"] = "Karganrudi",
["tly-msa"] = "Masali",
["tly-msu"] = "Masulei",
["tly-nor"] = "Northern Talysh",
["tly-san"] = "Shandarmani",
["tly-sou"] = "Southern Talysh",
["tly-tal"] = "Taleshdulabi",
["tly-tul"] = "Tularudi",
["tmr"] = "Jewish Babylonian Aramaic",
["tpw-lga"] = "Língua Geral Amazônica",
["tpw-lgp"] = "Língua Geral Paulista",
["tr-CY"] = "Cypriot Turkish",
["trk-bul-pro"] = "Proto-Bulgar",
["trk-cmn-pro"] = "Proto-Common Turkic",
["trk-ogr-pro"] = "Proto-Oghur",
["trk-ogz-pro"] = "Proto-Oghuz",
["tsk"] = "Tseku",
["ttq"] = "Tawellemmet",
["tw"] = "Twi Akan",
["tw-aku"] = "Akuapem Twi",
["tw-asa"] = "Asante Twi",
["twd"] = "Twents",
["uk-CA"] = "Canadian Ukrainian",
["urj-fpr-pro"] = "Proto-Finno-Permic",
["uz-afg"] = "Afghan Uzbek",
["vaf"] = "Vafsi",
["vec-old"] = "Old Venetan",
["vel"] = "Veluws",
["vsn"] = "Vedic Sanskrit",
["wae"] = "Walser German",
["wep"] = "Westphalian",
["wss"] = "Wasa",
["wuu-chm"] = "Shadi Wu",
["wuu-han"] = "Hangzhounese",
["wuu-nin"] = "Ningbonese",
["wuu-nor"] = "Northern Wu",
["wuu-sha"] = "Shanghainese",
["wuu-suz"] = "Suzhounese",
["wuu-wen"] = "Wenzhounese",
["xaq"] = "Aquitanian",
["xbo-dan"] = "Danube Bulgar",
["xbo-vol"] = "Volga Bulgar",
["xcg"] = "Cisalpine Gaulish",
["xfa-cap"] = "Capenate",
["xh-bha"] = "Bhaca",
["xme-aby"] = "Abyanehi",
["xme-abz"] = "Abuzeydabadi",
["xme-amo"] = "Amorehi",
["xme-ana"] = "Anaraki",
["xme-ard"] = "Ardestani",
["xme-azr"] = "Old Azari",
["xme-bdr"] = "Badrudi",
["xme-bid"] = "Bidhandi",
["xme-bij"] = "Bijagani",
["xme-bor"] = "Borujerdi",
["xme-cim"] = "Chimehi",
["xme-del"] = "Delijani",
["xme-far"] = "Farizandi",
["xme-ham"] = "Hamadani",
["xme-han"] = "Hanjani",
["xme-isf"] = "Isfahani",
["xme-jow"] = "Jowshaqani",
["xme-kaf"] = "Kafroni",
["xme-kah"] = "Kahaki",
["xme-kas"] = "Kashani",
["xme-kes"] = "Kesehi",
["xme-kom"] = "Komjani",
["xme-krm"] = "Kermani",
["xme-mah"] = "Mahallati",
["xme-mey"] = "Meymehi",
["xme-nar"] = "Naraqi",
["xme-nas"] = "Nashalji",
["xme-nus"] = "Nushabadi",
["xme-qal"] = "Qalhari",
["xme-qoh"] = "Qohrudi",
["xme-sed"] = "Sedehi",
["xme-tar"] = "Tari",
["xme-trh"] = "Tarehi",
["xme-ttc-cen"] = "Central Tati",
["xme-ttc-eas"] = "Eastern Tati",
["xme-ttc-nor"] = "Northern Tati",
["xme-ttc-sou"] = "Southern Tati",
["xme-ttc-wes"] = "Western Tati",
["xme-val"] = "Valujerdi",
["xme-var"] = "Varani",
["xme-von"] = "Vonishuni",
["xme-vrz"] = "Varzenehi",
["xme-xur"] = "Khuri",
["xme-yar"] = "Yarandi",
["xme-yaz"] = "Yazdi",
["xme-zef"] = "Zefrehi",
["xme-zor"] = "Zori",
["xmn"] = "Manichaean Middle Persian",
["xng-ear"] = "Early Middle Mongol",
["xng-lat"] = "Late Middle Mongol",
["xnn"] = "Northern Kankanaey",
["xno"] = "Anglo-Norman",
["xno-law"] = "Law French",
["xtg"] = "Transalpine Gaulish",
["xvi"] = "Kamviri",
["yue-HK"] = "Hong Kong Cantonese",
["yue-gua"] = "Guangzhou Cantonese",
["yue-lit"] = "Literary Cantonese",
["yue-wvc"] = "Written vernacular Cantonese",
["zh-postal"] = "Postal Romanization",
["zhx-dan"] = "Danzhou Chinese",
["zhx-tai-wvc"] = "Written vernacular Taishanese",
["zhx-zho"] = "Zhongshan Min",
["zle-mbe"] = "Middle Belarusian",
["zle-mru"] = "Middle Russian",
["zle-muk"] = "Middle Ukrainian",
["zle-ops"] = "Old Pskovian",
["zls-chs-ru"] = "Russian Church Slavonic",
["zls-chs-uk"] = "Ukrainian Church Slavonic",
["zlw-mpl"] = "Middle Polish",
["zrp"] = "Zarphatic",
}
53ni4cd6865w3lj7xl9r67m9zabkxy1
234836
234835
2026-05-24T08:18:47Z
Lee
19
පැරණි සංස්කරණයකින් ගත් කොටස්...
234836
Scribunto
text/plain
return {
["aae"] = "Arbëresh Albanian",
["aat"] = "Arvanitika Albanian",
["abr"] = "Abron",
["acm-khu"] = "Khuzestani Arabic",
["act"] = "Achterhoeks",
["adx"] = "Amdo Tibetan",
["ae-old"] = "Old Avestan",
["ae-yng"] = "Younger Avestan",
["ain-hok"] = "Hokkaido Ainu",
["ain-kur"] = "Kuril Ainu",
["ain-sak"] = "Sakhalin Ainu",
["akk-lbb"] = "Late Babylonian",
["akk-mas"] = "Middle Assyrian",
["akk-mbb"] = "Middle Babylonian",
["akk-nas"] = "Neo-Assyrian",
["akk-nbb"] = "Neo-Babylonian",
["akk-oas"] = "Old Assyrian",
["akk-obb"] = "Old Babylonian",
["akk-old"] = "Old Akkadian",
["akk-stb"] = "Standard Babylonian",
["aln"] = "Gheg Albanian",
["als"] = "Tosk Albanian",
["alv-kro"] = "Kromanti",
["ang-ang"] = "Anglian Old English",
["ang-ken"] = "Kentish Old English",
["ang-mer"] = "Mercian Old English",
["ang-nor"] = "Northumbrian Old English",
["ang-wsx"] = "West Saxon Old English",
["apc-ale"] = "Aleppine North Levantine Arabic",
["apc-dam"] = "Damascene North Levantine Arabic",
["apc-leb"] = "Lebanese North Levantine Arabic",
["apc-nle"] = "North Lebanese North Levantine Arabic",
["apc-sle"] = "South Lebanese North Levantine Arabic",
["apc-syr"] = "Syrian North Levantine Arabic",
["arc-bib"] = "Biblical Aramaic",
["arc-cpa"] = "Christian Palestinian Aramaic",
["arc-hat"] = "Hatran Aramaic",
["arc-imp"] = "Imperial Aramaic",
["arc-jla"] = "Jewish Literary Aramaic",
["arc-nab"] = "Nabataean Aramaic",
["arc-old"] = "Old Aramaic",
["arc-pal"] = "Palmyrene Aramaic",
["as-bkm"] = "Barpetia Kamrupi Assamese",
["as-nkm"] = "Nalbaria Kamrupi Assamese",
["as-pkm"] = "Palasbaria Kamrupi Assamese",
["atn"] = "Ashtiani",
["az-cls"] = "Classical Azerbaijani",
["bat-dni"] = "Dnieper Baltic",
["bat-gol"] = "Golyad",
["bat-pro"] = "Proto-Baltic",
["bcc"] = "Southern Balochi",
["bew-kot"] = "Betawi Kota",
["bgn"] = "Western Balochi",
["bgp"] = "Eastern Balochi",
["bn-dvn"] = "Dhakaiya Vaṅga Bengali",
["bn-nvn"] = "Noakhailla Vaṅga Bengali",
["bnt-cmn"] = "Common Bantu",
["bra-old"] = "Old Braj",
["bry-ear"] = "Early Brythonic",
["bry-lat"] = "Late Brythonic",
["bsg-ban"] = "Bandari",
["bsg-hor"] = "Hormozi",
["bsg-min"] = "Minabi",
["bsh-kat"] = "Kativiri",
["bsh-mum"] = "Mumviri",
["ca-val"] = "Valencian",
["ckm"] = "Chakavian Serbo-Croatian",
["cls"] = "Classical Sanskrit",
["cmn-MY"] = "Malaysian Mandarin",
["cmn-PH"] = "Philippine Mandarin",
["cmn-SG"] = "Singapore Mandarin",
["cmn-TW"] = "Taiwanese Mandarin",
["cmn-bec"] = "Beijingic Mandarin",
["cmn-bei"] = "Beijing Mandarin",
["cmn-cep"] = "Central Plains Mandarin",
["cmn-ear"] = "Early Mandarin",
["cmn-gua"] = "Guanzhong Mandarin",
["cmn-gui"] = "Guilin Mandarin",
["cmn-jhu"] = "Jianghuai Mandarin",
["cmn-lan"] = "Lanyin Mandarin",
["cmn-nan"] = "Nanjing Mandarin",
["cmn-noe"] = "Northeastern Mandarin",
["cmn-palladius"] = "Palladius",
["cmn-pinyin"] = "Hanyu Pinyin",
["cmn-sow"] = "Southwestern Mandarin",
["cmn-tia"] = "Tianjin Mandarin",
["cmn-tongyong"] = "Tongyong Pinyin",
["cmn-wadegiles"] = "Wade–Giles",
["cmn-wuh"] = "Wuhan Mandarin",
["cmn-wvc"] = "Written vernacular Mandarin",
["cmn-xin"] = "Xining Mandarin",
["cmn-yan"] = "Yangzhou Mandarin",
["cop-akh"] = "Akhmimic Coptic",
["cop-boh"] = "Bohairic Coptic",
["cop-fay"] = "Fayyumic Coptic",
["cop-ggg"] = "Coptic Dialect G",
["cop-her"] = "Hermopolitan Coptic",
["cop-jjj"] = "Coptic Dialect J",
["cop-kkk"] = "Coptic Dialect K",
["cop-lyc"] = "Lycopolitan Coptic",
["cop-old"] = "Old Coptic",
["cop-oxy"] = "Oxyrhynchite Coptic",
["cop-ply"] = "Proto-Lycopolitan Coptic",
["cop-ppp"] = "Coptic Dialect P",
["cop-sah"] = "Sahidic Coptic",
["crh-dbj"] = "Dobrujan Tatar",
["cs-ear"] = "Early Modern Czech",
["cu-bgm"] = "Middle Bulgarian",
["cv-ana"] = "Anatri Chuvash",
["cv-mid"] = "Middle Chuvash",
["cv-old"] = "Old Chuvash",
["cv-vir"] = "Viryal Chuvash",
["cy-nor"] = "North Wales Welsh",
["cy-sou"] = "South Wales Welsh",
["de-AT"] = "Austrian German",
["de-AT-vie"] = "Viennese German",
["de-CH"] = "Switzerland German",
["de-bal"] = "Baltic German",
["de-ear"] = "Early New High German",
["drt"] = "Drents",
["dv-add"] = "Addu Dhivehi",
["dv-huv"] = "Huvadhu Dhivehi",
["dv-mul"] = "Mulaku Dhivehi",
["dv-old"] = "Old Dhivehi",
["egl-old"] = "Old Emilian",
["egy-lat"] = "Late Egyptian",
["egy-mid"] = "Middle Egyptian",
["egy-nmi"] = "Neo-Middle Egyptian",
["egy-old"] = "Old Egyptian",
["el-crt"] = "Cretan Greek",
["el-cyp"] = "Cypriot Greek",
["el-kal"] = "Kaliarda",
["el-kth"] = "Katharevousa",
["el-pap"] = "Paphian Greek",
["elx-ach"] = "Achaemenid Elamite",
["elx-mid"] = "Middle Elamite",
["elx-neo"] = "Neo-Elamite",
["elx-old"] = "Old Elamite",
["en-AU"] = "Australian English",
["en-CA"] = "Canadian English",
["en-GB"] = "British English",
["en-GB-NIR"] = "Northern Irish English",
["en-GB-SCT"] = "Scottish English",
["en-GB-WLS"] = "Welsh English",
["en-HK"] = "Hong Kong English",
["en-IE"] = "Irish English",
["en-IM"] = "Manx English",
["en-IN"] = "Indian English",
["en-NNN"] = "North American ඉංග්රීසි",
["en-NZ"] = "New Zealand English",
["en-US"] = "American English",
["en-US-CA"] = "California English",
["en-ZA"] = "South African English",
["en-aae"] = "Australian Aboriginal English",
["en-ear"] = "Early Modern English",
["en-geo"] = "Geordie",
["en-uls"] = "Ulster English",
["enm-emi"] = "East Midland Middle English",
["enm-esc"] = "Early Scots",
["enm-ken"] = "Kentish Middle English",
["enm-nor"] = "Northern Middle English",
["enm-sou"] = "Southern Middle English",
["enm-wmi"] = "West Midland Middle English",
["es-AR"] = "Rioplatense Spanish",
["es-BO"] = "Bolivian Spanish",
["es-CL"] = "Chilean Spanish",
["es-CO"] = "Colombian Spanish",
["es-CU"] = "Cuban Spanish",
["es-MX"] = "Mexican Spanish",
["es-PE"] = "Peruvian Spanish",
["es-PH"] = "Philippine Spanish",
["es-PR"] = "Puerto Rican Spanish",
["es-US"] = "United States Spanish",
["es-VE"] = "Venezuelan Spanish",
["es-ear"] = "Early Modern Spanish",
["es-lun"] = "Lunfardo",
["esi"] = "North Alaskan Inupiatun",
["esk"] = "Northwest Alaskan Inupiatun",
["fa-cls"] = "Classical Persian",
["fa-ear"] = "Early New Persian",
["fa-ira"] = "Iranian Persian",
["fat"] = "Fante Akan",
["fay-bsh"] = "Bushehri",
["fay-bur"] = "Burenjani",
["fay-dav"] = "Davani",
["fay-dsh"] = "Dashtaki",
["fay-eze"] = "Emamzada Esmaili",
["fay-gav"] = "Gavkoshaki",
["fay-kar"] = "Khargi",
["fay-kho"] = "Khollari",
["fay-kon"] = "Kondazi",
["fay-kzo"] = "Old Kazeruni",
["fay-mas"] = "Masarami",
["fay-pap"] = "Papuni",
["fay-sam"] = "Samghani",
["fay-sho"] = "Old Shirazi",
["fay-shr"] = "Shirazi",
["fay-sor"] = "Sorkhi",
["ffm"] = "Maasina Fulfulde",
["fiu-pro"] = "Proto-Finno-Ugric",
["fr-CA"] = "Canadian French",
["fr-CH"] = "Swiss French",
["fr-aca"] = "Acadian French",
["fr-lou"] = "Louisiana French",
["fr-mis"] = "Missouri French",
["frc"] = "Cajun French",
["frk"] = "Frankish",
["fro-nor"] = "Old Northern French",
["fro-pic"] = "Picard Old French",
["frp-old"] = "Old Franco-Provençal",
["frr-amr"] = "Amrum North Frisian",
["frr-fam"] = "Föhr-Amrum North Frisian",
["frr-foh"] = "Föhr North Frisian",
["frr-goe"] = "Goesharde North Frisian",
["frr-hal"] = "Halligen North Frisian",
["frr-hel"] = "Heligoland North Frisian",
["frr-ins"] = "Insular North Frisian",
["frr-kar"] = "Karrharde North Frisian",
["frr-mai"] = "Mainland North Frisian",
["frr-moo"] = "Mooring North Frisian",
["frr-syl"] = "Sylt North Frisian",
["frr-wie"] = "Wiedingharde North Frisian",
["frs"] = "East Frisian Low German",
["fub"] = "Adamawa Fulfulde",
["fuc"] = "Pulaar",
["fue"] = "Borgu Fulfulde",
["fuf"] = "Pular",
["fuh"] = "Western Niger Fulfulde",
["fui"] = "Bagirmi Fulfulde",
["fuq"] = "Central-Eastern Niger Fulfulde",
["fur-old"] = "Old Friulian",
["fuv"] = "Nigerian Fulfulde",
["gax"] = "Borana",
["gbz"] = "Zoroastrian Dari",
["gem-sue"] = "Suevic",
["gkm"] = "Byzantine Greek",
["gmq-osw-lat"] = "Late Old Swedish",
["gmw-afr-pro"] = "Proto-Anglo-Frisian",
["gmw-nsg-pro"] = "Proto-North Sea Germanic",
["gos"] = "Gronings",
["grc-aeo"] = "Aeolic Greek",
["grc-arc"] = "Arcadian Greek",
["grc-arp"] = "Arcadocypriot Greek",
["grc-att"] = "Attic Greek",
["grc-boi"] = "Boeotian Greek",
["grc-cyp"] = "Cypriot Ancient Greek",
["grc-dor"] = "Doric Greek",
["grc-ela"] = "Elean Greek",
["grc-epi"] = "Epic Greek",
["grc-ion"] = "Ionic Greek",
["grc-koi"] = "Koine Greek",
["grc-kre"] = "Cretan Ancient Greek",
["grc-opl"] = "Opuntian Locrian",
["grc-ozl"] = "Ozolian Locrian",
["grc-pam"] = "Pamphylian Greek",
["grc-ths"] = "Thessalian Greek",
["gsw-FR-als"] = "Alsatian Alemannic German",
["gsw-hig"] = "High Alemannic German",
["gsw-hst"] = "Highest Alemannic German",
["gsw-low"] = "Low Alemannic German",
["gu-kat"] = "Kathiyawadi",
["gu-lda"] = "Lisan ud-Dawat Gujarati",
["gzi"] = "Gazi",
["hae"] = "Harar Oromo",
["hak-HK"] = "Hong Kong Hakka",
["hak-TW"] = "Taiwanese Hakka",
["hak-dab"] = "Dabu Hakka",
["hak-eam"] = "Early Modern Hakka",
["hak-hai"] = "Hailu Hakka",
["hak-hui"] = "Huiyang Hakka",
["hak-hui-MY"] = "Malaysian Huiyang Hakka",
["hak-mei"] = "Meixian Hakka",
["hak-six"] = "Sixian Hakka",
["hak-zha"] = "Zhao'an Hakka",
["haz"] = "Hazaragi",
["hbo"] = "Biblical Hebrew",
["he-IL"] = "Israeli Hebrew",
["he-med"] = "Medieval Hebrew",
["he-mis"] = "Mishnaic Hebrew",
["hi-mid"] = "Middle Hindi",
["hi-mum"] = "Bombay Hindi",
["hsn-hya"] = "Hengyang Xiang",
["hsn-hzh"] = "Hengzhou Xiang",
["hsn-lou"] = "Loudi Xiang",
["hsn-new"] = "New Xiang",
["hsn-old"] = "Old Xiang",
["ht-sdm"] = "Saint Dominican Creole French",
["hye"] = "Eastern Armenian",
["hyw"] = "Western Armenian",
["inc-aav"] = "Avahattha",
["inc-agu"] = "Gurjara Apabhramsa",
["inc-aka"] = "Kasmiri Apabhramsa",
["inc-ama"] = "Maharastri Apabhramsa",
["inc-asa"] = "Sauraseni Apabhramsa",
["inc-ash-pro"] = "Proto-Middle Indo-Aryan",
["inc-ata"] = "Takka Apabhramsa",
["inc-avr"] = "Vracada Apabhramsa",
["inc-mit"] = "Mitanni",
["iro-ohu"] = "Old Wendat",
["iro-omo"] = "Old Mohawk",
["iro-oon"] = "Old Onondaga",
["it-CH"] = "Switzerland Italian",
["itc-lan"] = "Lanuvian",
["itc-ola"] = "Old Latin",
["itc-pra"] = "Praenestine",
["ja-cla"] = "Classical Japanese",
["ja-ear"] = "Early Modern Japanese",
["ja-mid"] = "Middle Japanese",
["ja-mid-ear"] = "Early Middle Japanese",
["ja-mid-lat"] = "Late Middle Japanese",
["jpa"] = "Jewish Palestinian Aramaic",
["jrb"] = "Judeo-Arabic",
["ka-mid"] = "Middle Georgian",
["kbg"] = "Khamba",
["kea-alu"] = "ALUPEC Kabuverdianu",
["kea-bar"] = "Barlavento Kabuverdianu",
["kea-bra"] = "Brava Kabuverdianu",
["kea-bvi"] = "Boa Vista Kabuverdianu",
["kea-fog"] = "Fogo Kabuverdianu",
["kea-mai"] = "Maio Kabuverdianu",
["kea-saa"] = "Santo Antão Kabuverdianu",
["kea-sal"] = "Sal Kabuverdianu",
["kea-san"] = "Santiago Kabuverdianu",
["kea-sni"] = "São Nicolau Kabuverdianu",
["kea-sot"] = "Sotavento Kabuverdianu",
["kea-svi"] = "São Vicente Kabuverdianu",
["kfm"] = "Khunsari",
["khg"] = "Khams Tibetan",
["kho-lat"] = "Late Khotanese",
["kho-old"] = "Old Khotanese",
["kjh-fyu"] = "Fuyu Kyrgyz",
["kjv"] = "Kajkavian Serbo-Croatian",
["klj-arg"] = "Arghu",
["kn-hav"] = "Havigannada",
["kn-kun"] = "Kundagannada",
["ko-cen"] = "Central Korean",
["ko-chu"] = "Chungcheong Korean",
["ko-gan"] = "Gangwon Korean",
["ko-gyg"] = "Gyeonggi Korean",
["ko-gys"] = "Gyeongsang Korean",
["ko-ham"] = "Hamgyong Korean",
["ko-hwa"] = "Hwanghae Korean",
["ko-jeo"] = "Jeolla Korean",
["ko-pyo"] = "Pyongan Korean",
["ko-yuk"] = "Yukjin Korean",
["kok-mid"] = "Middle Konkani",
["kok-old"] = "Old Konkani",
["krl-nor"] = "North Karelian",
["krl-sou"] = "South Karelian",
["ksh"] = "Kölsch",
["kze"] = "Kosena",
["la-afr"] = "African Romance",
["la-cla"] = "Classical Latin",
["la-con"] = "Contemporary Latin",
["la-ecc"] = "Ecclesiastical Latin",
["la-eme"] = "Early Medieval Latin",
["la-lat"] = "Late Latin",
["la-med"] = "Medieval Latin",
["la-new"] = "New Latin",
["la-ren"] = "Renaissance Latin",
["la-vul"] = "Vulgar Latin",
["lij-old"] = "Old Ligurian",
["lld-amp"] = "Ampezan Ladin",
["lld-bad"] = "Badiot Ladin",
["lld-cad"] = "Cadorino Ladin",
["lld-fas"] = "Fascian Ladin",
["lld-fod"] = "Fodom Ladin",
["lld-for"] = "Fornes Ladin",
["lld-ghe"] = "Gherdëina Ladin",
["lld-non"] = "Nones Ladin",
["lmo-old"] = "Old Lombard",
["lng"] = "Lombardic",
["ltc-ear"] = "Early Middle Chinese",
["ltc-lat"] = "Late Middle Chinese",
["lut-nor"] = "Northern Lushootseed",
["lzh-KO"] = "Korean Classical Chinese",
["lzh-VI"] = "Vietnamese Classical Chinese",
["lzh-cii"] = "Ci",
["lzh-cmn"] = "Classical Mandarin",
["lzh-cmn-TW"] = "Classical Taiwanese Mandarin",
["lzh-lit"] = "Literary Chinese",
["lzh-pre"] = "Pre-Classical Chinese",
["lzh-shi"] = "Traditional Chinese poetry",
["lzh-tai"] = "Classical Taishanese",
["lzh-yue"] = "Classical Cantonese",
["mn-cha"] = "Chakhar Mongolian",
["mn-kha"] = "Khalkha Mongolian",
["mn-khr"] = "Khorchin Mongolian",
["mn-ord"] = "Ordos Mongolian",
["mns-eas"] = "Eastern Mansi",
["mns-wes"] = "Western Mansi",
["ms-cla"] = "Classical Malay",
["ms-old"] = "Old Malay",
["mul-tax"] = "taxonomic name",
["nan-anx"] = "Anxi Hokkien",
["nan-cha"] = "Changtai Hokkien",
["nan-hbl-PH"] = "Philippine Hokkien",
["nan-hbl-SG"] = "Singapore Hokkien",
["nan-hbl-TW"] = "Taiwanese Hokkien",
["nan-hou"] = "Houlu Min",
["nan-hui"] = "Hui'an Hokkien",
["nan-jin"] = "Jinjiang Hokkien",
["nan-kin"] = "Kinmenese Hokkien",
["nan-med"] = "Medan Hokkien",
["nan-pen"] = "Penang Hokkien",
["nan-qia"] = "Qianlu Min",
["nan-qua"] = "Quanzhou Hokkien",
["nan-spm"] = "Southern Malaysian Hokkien",
["nan-ton"] = "Tong'an Hokkien",
["nan-xia"] = "Xiamen Hokkien",
["nan-yon"] = "Yongchun Hokkien",
["nan-zha"] = "Zhangzhou Hokkien",
["nan-zho"] = "Zhao'an Hokkien",
["nan-zhp"] = "Zhangping Hokkien",
["nap-old"] = "Old Neapolitan",
["ncb-cam"] = "Camorta",
["ncb-kat"] = "Katchal",
["ncb-nan"] = "Nancowry",
["nds-de"] = "German Low German",
["nds-lpr"] = "Low Prussian",
["nds-nl"] = "Dutch Low Saxon",
["nl-BE"] = "Belgian Dutch",
["non-grn"] = "Greenlandic Norse",
["non-oen"] = "Old East Norse",
["non-own"] = "Old West Norse",
["nrf-grn"] = "Guernsey Norman",
["nrf-jer"] = "Jersey Norman",
["ntz"] = "Natanzi",
["nyq"] = "Nayini",
["oc-ara"] = "Aranese",
["oc-auv"] = "Auvergnat",
["oc-gas"] = "Gascon",
["oc-jud"] = "Shuadit",
["oc-lan"] = "Languedocien",
["oc-lim"] = "Limousin",
["oc-pro"] = "Provençal",
["oc-pro-old"] = "Old Provençal",
["oc-viv"] = "Vivaro-Alpine",
["och-ear"] = "Early Old Chinese",
["och-lat"] = "Late Old Chinese",
["ojp-eas"] = "Eastern Old Japanese",
["okm-ear"] = "Early Middle Korean",
["oko-lat"] = "Late Old Korean",
["okz-ang"] = "Angkorian Old Khmer",
["okz-pre"] = "Pre-Angkorian Old Khmer",
["ont"] = "Ontenu",
["oos"] = "Old Ossetic",
["oos-ear"] = "Early Old Ossetic",
["oos-lat"] = "Late Old Ossetic",
["orc"] = "Orma",
["oru-kan"] = "Kaniguram",
["oru-log"] = "Logar",
["os-dig"] = "Digor Ossetian",
["os-iro"] = "Iron Ossetian",
["osc-luc"] = "Lucanian",
["osc-sam"] = "Samnite",
["otk-kir"] = "Old Kirghiz",
["otk-ork"] = "Orkhon Turkic",
["pal-ear"] = "Early Middle Persian",
["pal-lat"] = "Late Middle Persian",
["peo-ear"] = "Early Old Persian",
["peo-lat"] = "Late Old Persian",
["pfl"] = "Palatine German",
["pl-gor"] = "Goral",
["pl-gre"] = "Greater Polish",
["pl-les"] = "Lesser Polish",
["pl-mas"] = "Masovian Polish",
["pld"] = "Polari",
["pms-old"] = "Old Piedmontese",
["pnb"] = "Western Punjabi",
["pra-abh"] = "Abhiri",
["pra-ard"] = "Ardhamagadhi Prakrit",
["pra-ava"] = "Avanti",
["pra-bah"] = "Bahliki",
["pra-can"] = "Candali",
["pra-dak"] = "Daksinatya",
["pra-dra"] = "Dramili",
["pra-hel"] = "එළු ප්රාකෘත",
["pra-kha"] = "Khasa Prakrit",
["pra-mag"] = "Magadhi Prakrit",
["pra-mah"] = "Maharastri Prakrit",
["pra-odr"] = "Odri",
["pra-pai"] = "Paisaci Prakrit",
["pra-pra"] = "Pracya",
["pra-pro"] = "Proto-New Indo-Aryan",
["pra-sab"] = "Sabari",
["pra-sak"] = "Sakari",
["pra-sau"] = "Sauraseni Prakrit",
["prs"] = "Dari",
["ps-afr"] = "Afridi",
["ps-ban"] = "Bannu",
["ps-bng"] = "Bangash",
["ps-cgi"] = "Central Ghilzay",
["ps-jad"] = "Jadrani",
["ps-kak"] = "Kakari",
["ps-kan"] = "Kandahari",
["ps-mah"] = "Mahsudi",
["ps-nea"] = "Northeastern Pashto",
["ps-nwe"] = "Northwestern Pashto",
["ps-pes"] = "Peshawari",
["ps-sea"] = "Southeastern Pashto",
["ps-ser"] = "Sher",
["ps-swe"] = "Southwestern Pashto",
["ps-waz"] = "Waziri",
["ps-xat"] = "Khatak",
["pse-bsm"] = "Besemah",
["pt-BR"] = "Brazilian Portuguese",
["pt-PT"] = "European Portuguese",
["qfa-yke-pro"] = "Proto-Ketic",
["qfa-yko-pro"] = "Proto-Kottic",
["qfa-ypm-pro"] = "Proto-Pumpokolic",
["qfa-yrn-pro"] = "Proto-Arinic",
["qsb-bal"] = "Paleo-Balkan",
["qsb-bma"] = "the BMAC substrate",
["qsb-grc"] = "Pre-Greek",
["qsb-ibe"] = "Paleo-Hispanic",
["qwm-arm"] = "Armeno-Kipchak",
["qwm-cum"] = "Cuman",
["qwm-mam"] = "Mamluk-Kipchak",
["qxq"] = "Qashqai",
["rdb-jir"] = "Jirofti",
["rdb-kah"] = "Kahnuji",
["rgn-old"] = "Old Romagnol",
["rm-gri"] = "Rumantsch Grischun",
["rm-old"] = "Old Romansh",
["rm-put"] = "Puter Romansh",
["rm-srm"] = "Surmiran Romansh",
["rm-srs"] = "Sursilvan Romansh",
["rm-sut"] = "Sutsilvan Romansh",
["rm-val"] = "Vallader Romansh",
["ro-MD"] = "Moldovan",
["roa-oit"] = "Old Italian",
["roa-pro"] = "Proto-Romance",
["rw-kin"] = "Kinyarwanda",
["rw-run"] = "Kirundi",
["sa-bhs"] = "Buddhist Hybrid Sanskrit",
["sa-bra"] = "Brahmanic Sanskrit",
["sa-epi"] = "Epic Sanskrit",
["sa-neo"] = "New Sanskrit",
["sa-rig"] = "Rigvedic Sanskrit",
["sc-nuo"] = "Nuorese",
["sc-old"] = "Old Sardinian",
["sc-src"] = "Logudorese",
["sc-sro"] = "Campidanese",
["scn-old"] = "Old Sicilian",
["sco-ins"] = "Insular Scots",
["sco-nor"] = "Northern Scots",
["sco-sou"] = "Southern Scots",
["sco-uls"] = "Ulster Scots",
["sdz"] = "Sallands",
["sgh-baj"] = "Bajui",
["sgh-bar"] = "Bartangi",
["sgh-bro"] = "Bartangi-Oroshori",
["sgh-oro"] = "Oroshori",
["sgh-ros"] = "Roshani",
["sgh-rsx"] = "Roshani-Khufi",
["sgh-xgb"] = "Khughni-Bajui",
["sgh-xuf"] = "Khufi",
["sgh-xug"] = "Khughni",
["sh-tor"] = "Torlakian Serbo-Croatian",
["shi-med"] = "Medieval Tashelhit",
["si-med"] = "Medieval Sinhalese",
["ska"] = "Skagit",
["slh"] = "Southern Lushootseed",
["sli"] = "Silesian East Central German",
["sno"] = "Snohomish",
["sog-ear"] = "Early Sogdian",
["sog-lat"] = "Late Sogdian",
["soj"] = "Soi",
["ssn"] = "Waata",
["stl"] = "Stellingwerfs",
["sxu"] = "Upper Saxon German",
["ta-mid"] = "Middle Tamil",
["tai-shz"] = "Shangsi Zhuang",
["taq"] = "Tamasheq",
["tbq-pro"] = "Proto-Tibeto-Burman",
["th-ayu"] = "Ayutthaya Old Thai",
["th-old"] = "Old Thai",
["th-suk"] = "Sukhothai Old Thai",
["thv"] = "Tamahaq",
["thv-ght"] = "Ghat",
["thz"] = "Tayert",
["tks-cal"] = "Chali Tati",
["tks-dan"] = "Danesfani",
["tks-ebr"] = "Ebrahimabadi",
["tks-esf"] = "Esfarvarini",
["tks-sag"] = "Sagzabadi",
["tks-tak"] = "Takestani",
["tks-xia"] = "Khiaraji",
["tks-xoz"] = "Khoznini",
["tl-cls"] = "Classical Tagalog",
["tl-old"] = "Old Tagalog",
["tly-anb"] = "Anbarani",
["tly-asa"] = "Asalemi",
["tly-aze"] = "Azerbaijani Talysh",
["tly-cen"] = "Central Talysh",
["tly-fum"] = "Fumani",
["tly-kar"] = "Karganrudi",
["tly-msa"] = "Masali",
["tly-msu"] = "Masulei",
["tly-nor"] = "Northern Talysh",
["tly-san"] = "Shandarmani",
["tly-sou"] = "Southern Talysh",
["tly-tal"] = "Taleshdulabi",
["tly-tul"] = "Tularudi",
["tmr"] = "Jewish Babylonian Aramaic",
["tpw-lga"] = "Língua Geral Amazônica",
["tpw-lgp"] = "Língua Geral Paulista",
["tr-CY"] = "Cypriot Turkish",
["trk-bul-pro"] = "Proto-Bulgar",
["trk-cmn-pro"] = "Proto-Common Turkic",
["trk-ogr-pro"] = "Proto-Oghur",
["trk-ogz-pro"] = "Proto-Oghuz",
["tsk"] = "Tseku",
["ttq"] = "Tawellemmet",
["tw"] = "Twi Akan",
["tw-aku"] = "Akuapem Twi",
["tw-asa"] = "Asante Twi",
["twd"] = "Twents",
["uk-CA"] = "Canadian Ukrainian",
["urj-fpr-pro"] = "Proto-Finno-Permic",
["uz-afg"] = "Afghan Uzbek",
["vaf"] = "Vafsi",
["vec-old"] = "Old Venetan",
["vel"] = "Veluws",
["vsn"] = "Vedic Sanskrit",
["wae"] = "Walser German",
["wep"] = "Westphalian",
["wss"] = "Wasa",
["wuu-chm"] = "Shadi Wu",
["wuu-han"] = "Hangzhounese",
["wuu-nin"] = "Ningbonese",
["wuu-nor"] = "Northern Wu",
["wuu-sha"] = "Shanghainese",
["wuu-suz"] = "Suzhounese",
["wuu-wen"] = "Wenzhounese",
["xaq"] = "Aquitanian",
["xbo-dan"] = "Danube Bulgar",
["xbo-vol"] = "Volga Bulgar",
["xcg"] = "Cisalpine Gaulish",
["xfa-cap"] = "Capenate",
["xh-bha"] = "Bhaca",
["xme-aby"] = "Abyanehi",
["xme-abz"] = "Abuzeydabadi",
["xme-amo"] = "Amorehi",
["xme-ana"] = "Anaraki",
["xme-ard"] = "Ardestani",
["xme-azr"] = "Old Azari",
["xme-bdr"] = "Badrudi",
["xme-bid"] = "Bidhandi",
["xme-bij"] = "Bijagani",
["xme-bor"] = "Borujerdi",
["xme-cim"] = "Chimehi",
["xme-del"] = "Delijani",
["xme-far"] = "Farizandi",
["xme-ham"] = "Hamadani",
["xme-han"] = "Hanjani",
["xme-isf"] = "Isfahani",
["xme-jow"] = "Jowshaqani",
["xme-kaf"] = "Kafroni",
["xme-kah"] = "Kahaki",
["xme-kas"] = "Kashani",
["xme-kes"] = "Kesehi",
["xme-kom"] = "Komjani",
["xme-krm"] = "Kermani",
["xme-mah"] = "Mahallati",
["xme-mey"] = "Meymehi",
["xme-nar"] = "Naraqi",
["xme-nas"] = "Nashalji",
["xme-nus"] = "Nushabadi",
["xme-qal"] = "Qalhari",
["xme-qoh"] = "Qohrudi",
["xme-sed"] = "Sedehi",
["xme-tar"] = "Tari",
["xme-trh"] = "Tarehi",
["xme-ttc-cen"] = "Central Tati",
["xme-ttc-eas"] = "Eastern Tati",
["xme-ttc-nor"] = "Northern Tati",
["xme-ttc-sou"] = "Southern Tati",
["xme-ttc-wes"] = "Western Tati",
["xme-val"] = "Valujerdi",
["xme-var"] = "Varani",
["xme-von"] = "Vonishuni",
["xme-vrz"] = "Varzenehi",
["xme-xur"] = "Khuri",
["xme-yar"] = "Yarandi",
["xme-yaz"] = "Yazdi",
["xme-zef"] = "Zefrehi",
["xme-zor"] = "Zori",
["xmn"] = "Manichaean Middle Persian",
["xng-ear"] = "Early Middle Mongol",
["xng-lat"] = "Late Middle Mongol",
["xnn"] = "Northern Kankanaey",
["xno"] = "ඇන්ග්ලෝ-නෝමන්",
["xno-law"] = "Law French",
["xtg"] = "Transalpine Gaulish",
["xvi"] = "Kamviri",
["yue-HK"] = "Hong Kong Cantonese",
["yue-gua"] = "Guangzhou Cantonese",
["yue-lit"] = "Literary Cantonese",
["yue-wvc"] = "Written vernacular Cantonese",
["zh-postal"] = "Postal Romanization",
["zhx-dan"] = "Danzhou Chinese",
["zhx-tai-wvc"] = "Written vernacular Taishanese",
["zhx-zho"] = "Zhongshan Min",
["zle-mbe"] = "Middle Belarusian",
["zle-mru"] = "Middle Russian",
["zle-muk"] = "Middle Ukrainian",
["zle-ops"] = "Old Pskovian",
["zls-chs-ru"] = "Russian Church Slavonic",
["zls-chs-uk"] = "Ukrainian Church Slavonic",
["zlw-mpl"] = "Middle Polish",
["zrp"] = "Zarphatic",
}
n676v26guahb36k7sgs08mxpdbxrl72
Module:etymology languages/data
828
137340
234828
230526
2026-05-17T18:28:36Z
en>Theknightwho
0
Ancient Greek and Sanskrit varieties.
234828
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy loader. "Module:string utilities" is only required if `u` is actually
-- called, since the data may never need it. The first call fetches that
-- module's `char` function, rebinds `u` to it so later calls bypass this
-- wrapper, and forwards the original arguments.
local function u(...)
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
----------------------------------------------------------------------------------------------------------------------
-- Afroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Berber varieties --
--------------------------------------------------------------------------------------
m["shi-med"] = {
"Medieval Tashelhit",
34152,
"shi",
}
-- Tuareg lects
m["thv"] = {
"Tamahaq",
56703,
"tmh",
}
m["ttq"] = {
"Tawellemmet",
56390,
"tmh",
}
m["taq"] = {
"Tamasheq",
4670066,
"tmh",
}
m["thz"] = {
"Tayert",
56388,
"tmh",
}
m["thv-ght"] = {
"Ghat",
47012900,
"thv",
}
--------------------------------------------------------------------------------------
-- Cushitic varieties --
--------------------------------------------------------------------------------------
-- Oromo varieties
m["hae"] = {
"Harar Oromo",
5330355,
"om",
aliases = {"Eastern Oromo"},
}
m["gax"] = {
"Borana",
2910610,
"om",
aliases = {"Southern Oromo"},
}
m["orc"] = {
"Orma",
2919128,
"om",
}
m["ssn"] = {
"Waata",
3501553,
"om",
}
--------------------------------------------------------------------------------------
-- Egyptian varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Ancient Egyptian varieties --
-----------------------------------------------------
m["egy-old"] = {
"Old Egyptian",
447117,
"egy",
}
m["egy-mid"] = {
"Middle Egyptian",
657330,
"egy",
aliases = {"Classical Egyptian"},
}
m["egy-nmi"] = {
"Neo-Middle Egyptian",
123735278,
"egy",
aliases = {"Égyptien de tradition", "Traditional Egyptian"},
}
m["egy-lat"] = {
"Late Egyptian",
1852329,
"egy",
}
-----------------------------------------------------
-- Coptic varieties --
-----------------------------------------------------
m["cop-akh"] = {
"Akhmimic Coptic",
125176464,
"cop",
aliases = {"Akhmimic"},
}
m["cop-boh"] = {
"Bohairic Coptic",
890733,
"cop",
aliases = {"Bohairic", "Memphitic Coptic", "Memphitic"},
}
m["cop-ggg"] = {
"Coptic Dialect G",
nil,
"cop",
aliases = {"Dialect G", "Mansuric Coptic", "Mansuric"},
}
m["cop-jjj"] = {
"Coptic Dialect J",
nil,
"cop",
}
m["cop-kkk"] = {
"Coptic Dialect K",
nil,
"cop",
}
m["cop-ppp"] = {
"Coptic Dialect P",
nil,
"cop",
aliases = {"Proto-Theban Coptic", "Palaeo-Theban Coptic"},
}
-- Fayyumic Coptic. The aliases cover the alternative spellings of the name
-- plus "Bashmuric", each with and without the "Coptic" suffix.
m["cop-fay"] = {
	"Fayyumic Coptic",
	1399115,
	"cop",
	aliases = {
		"Fayyumic",
		"Faiyumic Coptic", "Faiyumic",
		"Fayumic Coptic", "Fayumic",
		"Bashmuric Coptic", "Bashmuric",
	},
}
m["cop-her"] = {
"Hermopolitan Coptic",
nil,
"cop",
aliases = {"Hermopolitan", "Coptic Dialect H", "Ashmuninic", "Ashmuninic Coptic"},
}
m["cop-lyc"] = {
"Lycopolitan Coptic",
nil,
"cop",
aliases = {
"Lycopolitan",
"Assiutic Coptic", "Asyutic Coptic", "Assiutic", "Asyutic",
"Lyco-Diospolitan Coptic", "Lyco-Diospolitan",
"Subakhmimic Coptic", "Subakhmimic"
},
}
m["cop-old"] = {
"Old Coptic",
115518040,
"cop",
}
m["cop-oxy"] = {
"Oxyrhynchite Coptic",
nil,
"cop",
aliases = {"Oxyrhynchite", "Mesokemic Coptic", "Mesokemic", "Middle Egyptian Coptic"},
}
m["cop-ply"] = {
"Proto-Lycopolitan Coptic",
nil,
"cop",
aliases = {"Coptic Dialect i", "Proto-Lyco-Diospolitan Coptic"},
}
m["cop-sah"] = {
"Sahidic Coptic",
2645851,
"cop",
aliases = {"Sahidic", "Saidic Coptic", "Saidic", "Thebaic Coptic", "Thebaic"},
}
--------------------------------------------------------------------------------------
-- Semitic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akkadian varieties --
-----------------------------------------------------
m["akk-old"] = {
"Old Akkadian",
nil,
"akk",
}
m["akk-obb"] = {
"Old Babylonian",
nil,
"akk",
}
m["akk-oas"] = {
"Old Assyrian",
nil,
"akk",
}
m["akk-mbb"] = {
"Middle Babylonian",
nil,
"akk",
}
m["akk-mas"] = {
"Middle Assyrian",
nil,
"akk",
}
m["akk-nbb"] = {
"Neo-Babylonian",
nil,
"akk",
}
m["akk-nas"] = {
"Neo-Assyrian",
nil,
"akk",
}
m["akk-lbb"] = {
"Late Babylonian",
nil,
"akk",
}
m["akk-stb"] = {
"Standard Babylonian",
nil,
"akk",
}
-----------------------------------------------------
-- Arabic varieties --
-----------------------------------------------------
m["jrb"] = {
"Judeo-Arabic",
37733,
"ar",
pseudo_families = "qfa-jew",
}
m["apc-leb"] = {
"Lebanese North Levantine Arabic",
1516642,
"apc",
aliases = {"Lebanese Arabic"},
}
m["apc-sle"] = {
"South Lebanese North Levantine Arabic",
14206590,
"apc",
aliases = {"South Lebanese Arabic"},
}
m["apc-nle"] = {
"North Lebanese North Levantine Arabic",
nil,
"apc",
aliases = {"North Lebanese Arabic"},
}
m["apc-syr"] = {
"Syrian North Levantine Arabic",
2143071,
"apc",
aliases = {"Syrian Arabic"},
}
m["apc-ale"] = {
"Aleppine North Levantine Arabic",
7056921,
"apc-syr",
aliases = {"Aleppo Arabic", "Aleppine Arabic"},
}
m["apc-dam"] = {
"Damascene North Levantine Arabic",
12237466,
"apc-syr",
aliases = {"Damascus Arabic", "Damascene Arabic"},
}
m["acm-khu"] = {
"Khuzestani Arabic",
1040944,
"acm",
}
-----------------------------------------------------
-- Aramaic varieties --
-----------------------------------------------------
m["arc-bib"] = {
"Biblical Aramaic",
843235,
"arc",
family = "sem-are",
}
m["arc-cpa"] = {
"Christian Palestinian Aramaic",
60790119,
"arc",
family = "sem-arw",
aliases = {"Melkite Aramaic", "Palestinian Syriac", "Syropalestinian Aramaic"},
}
m["arc-imp"] = {
"Imperial Aramaic",
7079491,
"arc",
aliases = {"Official Aramaic"},
}
m["arc-hat"] = {
"Hatran Aramaic",
3832926,
"arc",
family = "sem-are",
}
m["arc-jla"] = {
"Jewish Literary Aramaic",
105952842,
"arc",
pseudo_families = "qfa-jew",
}
m["arc-nab"] = {
"Nabataean Aramaic",
36178,
"arc",
}
m["arc-old"] = {
"Old Aramaic",
3398392,
"arc",
}
m["arc-pal"] = {
"Palmyrene Aramaic",
1510113,
"arc",
family = "sem-arw",
}
m["tmr"] = {
"Jewish Babylonian Aramaic",
33407,
"arc",
family = "sem-ase",
pseudo_families = "qfa-jew",
}
m["jpa"] = {
"Jewish Palestinian Aramaic",
948909,
"arc",
family = "sem-arw",
aliases = {"Galilean Aramaic"},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Hebrew varieties --
-----------------------------------------------------
m["hbo"] = {
"Biblical Hebrew",
1982248,
"he",
aliases = {"Classical Hebrew"},
}
-- Mishnaic Hebrew; its ancestor is "hbo" (Biblical Hebrew).
m["he-mis"] = {
	"Mishnaic Hebrew",
	1649362,
	"he",
	ancestors = "hbo",
}
-- Medieval Hebrew; its ancestor is "he-mis" (Mishnaic Hebrew).
m["he-med"] = {
	"Medieval Hebrew",
	2712572,
	"he",
	ancestors = "he-mis",
}
m["he-IL"] = {
"Israeli Hebrew",
8141,
"he",
}
----------------------------------------------------------------------------------------------------------------------
-- Ainu varieties --
----------------------------------------------------------------------------------------------------------------------
m["ain-hok"] = {
"Hokkaido Ainu",
20968488,
"ain",
aliases = {"Hokkaidō Ainu"},
}
m["ain-kur"] = {
"Kuril Ainu",
20967012,
"ain",
}
m["ain-sak"] = {
"Sakhalin Ainu",
20747371,
"ain",
}
----------------------------------------------------------------------------------------------------------------------
-- American indigenous varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Inuit varieties --
-----------------------------------------------------
-- North Alaskan Inupiatun. The second positional slot is deliberately nil
-- (no numeric ID is recorded for this entry).
m["esi"] = {
	"North Alaskan Inupiatun",
	nil,
	"ik",
}
-- Northwest Alaskan Inupiatun, filed under "ik" like "esi".
m["esk"] = {
	"Northwest Alaskan Inupiatun",
	25559714,
	"ik",
}
-----------------------------------------------------
-- Iroquoian varieties --
-----------------------------------------------------
m["iro-ohu"] = {
"Old Wendat",
nil,
"wdt",
}
m["iro-omo"] = {
"Old Mohawk",
nil,
"moh",
}
m["iro-oon"] = {
"Old Onondaga",
nil,
"ono",
}
-----------------------------------------------------
-- Tupi-Guarani varieties --
-----------------------------------------------------
-- Old Tupi varieties
m["tpw-lga"] = {
"Língua Geral Amazônica",
18275323,
"tpw",
aliases = {"Língua Geral"},
}
m["tpw-lgp"] = {
"Língua Geral Paulista",
2669239,
"tpw",
}
----------------------------------------------------------------------------------------------------------------------
-- Austroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Khmer varieties
m["okz-ang"] = {
"Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
m["okz-pre"] = {
"Pre-Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
-- Central Nicobarese varieties
m["ncb-cam"] = {
"Camorta",
5026908,
"ncb",
aliases = {"Kamorta"},
}
m["ncb-kat"] = {
"Katchal",
17064263,
"ncb",
aliases = {"Tehnu"},
}
m["ncb-nan"] = {
"Nancowry",
6962504,
"ncb",
aliases = {"Nankwari"},
}
----------------------------------------------------------------------------------------------------------------------
-- Austronesian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Malay and related varieties
-- Old Malay. It has the ISO code 'omy', but is keyed here as "ms-old".
m["ms-old"] = {
	"Old Malay",
	nil,
	"ms",
}
-- Classical Malay; its ancestor is "ms-old" (Old Malay).
m["ms-cla"] = {
	"Classical Malay",
	nil,
	"ms",
	ancestors = "ms-old",
}
m["pse-bsm"] = {
"Besemah",
nil,
"pse",
}
m["bew-kot"] = {
"Betawi Kota",
nil,
"bew",
aliases = {"Urban Betawi"}, -- in Jakarta
}
-- Philippine varieties
m["xnn"] = {
"Northern Kankanaey",
12953609,
"kne",
aliases = {"Northern Kankanay", "Northern Kankana-ey"},
}
m["tl-old"] = {
"Old Tagalog",
12967437,
"tl",
}
m["tl-cls"] = {
"Classical Tagalog",
nil,
"tl",
}
----------------------------------------------------------------------------------------------------------------------
-- Caucasian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Kartvelian varieties
m["ka-mid"] = {
"Middle Georgian",
nil,
"ka",
ancestors = "oge",
}
----------------------------------------------------------------------------------------------------------------------
-- Dravidian varieties --
----------------------------------------------------------------------------------------------------------------------
m["ta-mid"] = {
"Middle Tamil",
20987434,
"ta",
}
m["kn-hav"] = {
"Havigannada",
24276369,
"kn",
}
m["kn-kun"] = {
"Kundagannada",
6444255,
"kn",
}
----------------------------------------------------------------------------------------------------------------------
-- Indo-European varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Albanian varieties --
--------------------------------------------------------------------------------------
m["aln"] = {
"Gheg Albanian",
181037,
"sq",
aliases = {"Gheg"},
}
m["aae"] = {
"Arbëresh Albanian",
1075302,
"als",
aliases = {"Arbëreshë", "Arbëresh"},
}
m["aat"] = {
"Arvanitika Albanian",
29347,
"als",
aliases = {"Arvanitika"},
}
m["als"] = {
"Tosk Albanian",
180937,
"sq",
aliases = {"Tosk"},
}
--------------------------------------------------------------------------------------
-- Armenian varieties --
--------------------------------------------------------------------------------------
m["hyw"] = {
"Western Armenian",
180945,
"hy",
}
m["hye"] = {
"Eastern Armenian",
181059,
"hy",
}
--------------------------------------------------------------------------------------
-- Balto-Slavic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Baltic varieties --
-------------------------------------------------------------------------
m["bat-pro"] = {
"Proto-Baltic",
1703347,
"ine-bsl-pro",
}
m["bat-dni"] = {
"Dnieper Baltic",
4163178,
"bat-pro",
family = "bat",
aliases = {"Dniepr Baltic", "Dnieper-Oka Baltic", "Dniepr-Oka Baltic"},
}
m["bat-gol"] = {
"Golyad",
4142855,
"bat-dni",
aliases = {"Eastern Galindian", "East Galindian"},
}
-------------------------------------------------------------------------
-- Slavic varieties --
-------------------------------------------------------------------------
-----------------------------------------------------
-- Bulgarian varieties --
-----------------------------------------------------
-- Middle Bulgarian. "cu" is given both as the third positional field and as
-- the explicit `ancestors` value.
m["cu-bgm"] = {
	"Middle Bulgarian",
	12294897,
	"cu",
	ancestors = "cu",
}
-----------------------------------------------------
-- Church Slavonic varieties --
-----------------------------------------------------
-- Old Moscow Church Slavonic deleted as it seems not distinct enough from Russian (Synodal) Church Slavonic.
m["zls-chs-ru"] = {
"Russian Church Slavonic",
21662400,
"zls-chs",
aliases = {"Synodal Church Slavonic", "New Moscow Church Slavonic", "Novomoskovsk Church Slavonic"},
}
m["zls-chs-uk"] = {
"Ukrainian Church Slavonic",
12153548,
"zls-chs",
aliases = {"Rusyn Church Slavonic", "Belarusian Church Slavonic"},
}
--[=[
-- Tentative entries: kept disabled until it is decided whether to include them.
m["zls-chs-bg"] = {
"Bulgarian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-cs"] = {
"Czech Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-hr"] = {
"Croatian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-mk"] = {
"Macedonian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-ro"] = {
"Romanian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-sr"] = {
"Serbian Church Slavonic",
nil,
"zls-chs",
}
]=]
-----------------------------------------------------
-- Czech varieties --
-----------------------------------------------------
-- Early Modern Czech; no numeric ID recorded, ancestor given as "zlw-ocs".
m["cs-ear"] = {
	"Early Modern Czech",
	nil,
	"cs",
	ancestors = "zlw-ocs",
}
-----------------------------------------------------
-- East Slavic varieties --
-----------------------------------------------------
m["zle-ops"] = {
"Old Pskovian",
4167885,
"zle-ono",
}
-- Middle Russian. Unlike the neighbouring East Slavic entries it carries a
-- fourth positional field ("Cyrs" — presumably a script code; confirm against
-- the code that consumes this table) plus its own `translit` and
-- `strip_diacritics` settings.
m["zle-mru"] = {
	"Middle Russian",
	35228,
	"ru",
	"Cyrs",
	ancestors = "orv",
	translit = "ru-translit",
	strip_diacritics = {
		-- Settings keyed by the same "Cyrs" code given positionally above.
		Cyrs = {
			-- Concatenation of three values taken from the shared `c` table.
			remove_diacritics = c.grave .. c.acute .. c.diaer,
		},
	},
}
-- Middle Belarusian, filed under "zle-ort".
-- NOTE(review): the numeric ID 13211 is also used by "zle-muk" (Middle
-- Ukrainian); confirm that sharing one value is intended.
m["zle-mbe"] = {
	"Middle Belarusian",
	13211,
	"zle-ort",
}
-- Middle Ukrainian, filed under "zle-ort".
-- NOTE(review): the numeric ID 13211 is also used by "zle-mbe" (Middle
-- Belarusian); confirm that sharing one value is intended.
m["zle-muk"] = {
	"Middle Ukrainian",
	13211,
	"zle-ort",
}
m["uk-CA"] = {
"Canadian Ukrainian",
4161010,
"uk",
}
-----------------------------------------------------
-- Polish varieties --
-----------------------------------------------------
-- Middle Polish; ancestor given as "zlw-opl". `strip_diacritics` names
-- `c.acute` as the mark to remove and lists the acute-accented letters
-- (upper/lower pairs) that are given as exceptions.
m["zlw-mpl"] = {
	"Middle Polish",
	402878,
	"pl",
	ancestors = "zlw-opl",
	strip_diacritics = {
		remove_diacritics = c.acute,
		remove_exceptions = {
			"Ć", "ć",
			"Ń", "ń",
			"Ó", "ó",
			"Ś", "ś",
			"Ź", "ź",
		},
	},
}
m["pl-gre"] = {
"Greater Polish",
4106789,
"pl",
}
m["pl-les"] = {
"Lesser Polish",
361709,
"pl",
}
m["pl-mas"] = {
"Masovian Polish",
4274559,
"pl",
}
m["pl-gor"] = {
"Goral",
452889,
"pl",
}
-----------------------------------------------------
-- Serbo-Croatian varieties --
-----------------------------------------------------
m["ckm"] = {
"Chakavian Serbo-Croatian",
337565,
"sh",
aliases = {"Čakavian"},
}
m["kjv"] = {
"Kajkavian Serbo-Croatian",
838165,
"sh",
}
m["sh-tor"] = { -- Linguist code srp-tor
"Torlakian Serbo-Croatian",
1078803,
"sh",
aliases = {"Torlak"},
}
--------------------------------------------------------------------------------------
-- Celtic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Brythonic varieties --
-----------------------------------------------------
m["bry-ear"] = {
"Early Brythonic",
nil,
"cel-bry-pro",
}
m["bry-lat"] = {
"Late Brythonic",
nil,
"cel-bry-pro",
}
-----------------------------------------------------
-- Gaulish varieties --
-----------------------------------------------------
m["xcg"] = {
"Cisalpine Gaulish",
3832927,
"cel-gau",
}
m["xtg"] = {
"Transalpine Gaulish",
29977,
"cel-gau",
}
-----------------------------------------------------
-- Welsh varieties --
-----------------------------------------------------
m["cy-nor"] = {
"North Wales Welsh",
13127692,
"cy",
aliases = {"North Walian Welsh", "Northern Welsh"},
}
m["cy-sou"] = {
"South Wales Welsh",
13127689,
"cy",
aliases = {"South Walian Welsh", "Southern Welsh"},
}
--------------------------------------------------------------------------------------
-- Germanic varieties --
--------------------------------------------------------------------------------------
-- Proto-West Germanic varieties
m["frk"] = {
"Frankish",
10860505,
"gmw-pro",
family = "gmw-frk",
aliases = {"Old Frankish"},
}
m["gem-sue"] = {
"Suevic",
134600275,
"gmw-pro",
aliases = {"Suebian"},
}
m["gmw-afr-pro"] = {
"Proto-Anglo-Frisian",
134603379,
"gmw-nsg-pro",
family = "gmw-afr",
}
m["gmw-nsg-pro"] = {
"Proto-North Sea Germanic",
134603374,
"gmw-pro",
family = "gmw-nsg",
aliases = {"Proto-Ingvaeonic"},
}
-----------------------------------------------------
-- Dutch varieties --
-----------------------------------------------------
m["nl-BE"] = {
"Belgian Dutch",
34147,
"nl",
aliases = {"Flemish", "Flemish Dutch", "Southern Dutch"},
}
-----------------------------------------------------
-- English and Scots varieties --
-----------------------------------------------------
-- English varieties
m["en-AU"] = {
"Australian English",
44679,
"en",
}
m["en-GB"] = {
"British English",
7979,
"en",
}
m["en-GB-SCT"] = {
"Scottish English",
-- NOTE(review): 44676 is also the ID given for en-GB-WLS and en-CA in this file. One Wikidata item cannot
-- describe all three lects, so this looks like a copy-paste placeholder -- confirm the correct item.
44676,
"en-GB",
}
m["en-GB-WLS"] = {
"Welsh English",
-- NOTE(review): 44676 is also the ID given for en-GB-SCT and en-CA in this file. One Wikidata item cannot
-- describe all three lects, so this looks like a copy-paste placeholder -- confirm the correct item.
44676,
"en-GB",
}
m["en-IM"] = {
"Manx English",
6753295,
"en-GB",
}
m["en-aae"] = {
"Australian Aboriginal English",
783347,
"en-AU",
}
m["en-ear"] = {
"Early Modern English",
1472196,
"en",
ancestors = "enm",
aliases = {"Early New English"},
}
m["en-geo"] = {
"Geordie",
653421,
"en",
ancestors = "enm-nor",
}
m["en-IE"] = { -- FIXME: "IE" doesn't cover Northern Ireland
"Irish English",
665624,
"en",
}
m["en-uls"] = {
"Ulster English",
6840826,
"en-IE",
}
m["en-GB-NIR"] = {
"Northern Irish English",
6840826, -- actually the code for Ulster English
"en-uls",
}
m["en-NNN"] = { -- NA = Namibia; NNN is NATO 3-letter code for North America
"North American English",
7053766,
"en",
ietf_subtag = "en-021" -- 021 = UN M49 code for "Northern America" (i.e. North America without Central America or the Caribbean)
}
m["en-US"] = {
"American English",
7976,
"en-NNN",
}
m["en-NZ"] = {
	"New Zealand English",
	44661,
	"en",
}
m["en-ZA"] = {
	"South African English",
	1156228,
	"en",
}
m["en-US-CA"] = {
"California English",
1026812,
"en-US",
}
-- Canadian English hangs directly off North American English (en-NNN), as a
-- sibling of American English (en-US); it is not a sub-variety of en-US.
m["en-CA"] = {
	"Canadian English",
	44676,
	"en-NNN",
}
m["en-HK"] = {
"Hong Kong English",
1068863,
"en",
}
m["en-IN"] = {
"Indian English",
1348800,
"en",
}
m["pld"] = {
"Polari",
1359130,
"en",
}
-- Scots varieties
m["sco-ins"] = {
"Insular Scots",
16919205,
"sco",
}
m["sco-uls"] = {
"Ulster Scots",
201966,
"sco",
}
m["sco-nor"] = {
"Northern Scots",
16928150,
"sco",
}
m["sco-sou"] = {
"Southern Scots",
7570457,
"sco",
aliases = {"South Scots", "Borders Scots"},
}
-- Middle English varieties
m["enm-esc"] = { -- Part of Middle English until it developed into Middle Scots.
"Early Scots",
5326738,
"enm",
ancestors = "enm-nor",
aliases = {"Old Scots", "Scottish Middle English"},
}
m["enm-emi"] = {
"East Midland Middle English",
134238810,
"enm",
ancestors = "ang-ang", -- Technically ang-mer, but attested Mercian is mostly WM IIRC
}
m["enm-ken"] = {
"Kentish Middle English",
134238532,
"enm",
ancestors = "ang-ken",
}
m["enm-nor"] = {
"Northern Middle English",
134238541,
"enm",
ancestors = "ang-nor",
}
m["enm-sou"] = {
"Southern Middle English",
134238528,
"enm",
ancestors = "ang-wsx",
}
m["enm-wmi"] = {
"West Midland Middle English",
134238824,
"enm",
ancestors = "ang-mer",
}
-- Old English varieties
-- Includes both Mercian and Northumbrian.
m["ang-ang"] = {
"Anglian Old English",
121142917,
"ang",
}
m["ang-ken"] = {
"Kentish Old English",
11687485,
"ang",
}
m["ang-mer"] = {
"Mercian Old English",
602072,
"ang-ang",
}
m["ang-nor"] = {
"Northumbrian Old English",
1798915,
"ang-ang",
}
m["ang-wsx"] = {
"West Saxon Old English",
2658603,
"ang",
}
-----------------------------------------------------
-- High German varieties --
-----------------------------------------------------
-- (modern) German varieties
m["de-AT"] = {
"Austrian German",
306626,
"de",
}
m["de-AT-vie"] = {
"Viennese German",
56474,
"de-AT",
}
m["de-CH"] = {
"Switzerland German",
1366643,
"de",
aliases = {"Schweizer Hochdeutsch", "Swiss Standard German", "Swiss High German"},
}
m["de-bal"] = {
"Baltic German",
15785413,
"de",
}
m["de-ear"] = {
"Early New High German",
1472199,
"de",
ancestors = "gmh",
aliases = {"Early Modern High German"},
}
m["ksh"] = {
"Kölsch",
4624,
"gmw-cfr",
}
m["pfl"] = {
"Palatine German",
23014,
"gmw-rfr",
aliases = {"Pfälzisch", "Pälzisch", "Palatinate German"},
}
m["sli"] = {
"Silesian East Central German",
152965,
"gmw-ecg",
aliases = {"Silesian"},
}
m["sxu"] = {
"Upper Saxon German",
699284,
"gmw-ecg",
}
-- Old High German varieties
m["lng"] = {
"Lombardic",
35972,
"goh",
}
-- Alemannic German varieties
m["gsw-low"] = {
"Low Alemannic German",
503724,
"gsw",
}
m["gsw-FR-als"] = {
"Alsatian Alemannic German",
8786,
"gsw-low",
}
m["gsw-hig"] = {
"High Alemannic German",
503728,
"gsw",
}
m["gsw-hst"] = {
"Highest Alemannic German",
687538,
"gsw",
}
m["wae"] = {
"Walser German",
680517,
"gsw-hst",
}
-----------------------------------------------------
-- Low German varieties --
-----------------------------------------------------
m["nds-de"] = {
"German Low German",
25433,
"nds",
ietf_subtag = "nds-DE", -- should we make this the actual code?
wikimedia_codes = "nds",
}
m["nds-nl"] = {
"Dutch Low Saxon",
516137,
"nds",
ietf_subtag = "nds-NL", -- should we make this the actual code?
wikimedia_codes = "nds-nl",
}
m["act"] = {
"Achterhoeks",
153627,
"nds-nl",
aliases = {"Achterhoek", "Achterhooks"},
}
m["drt"] = {
"Drents",
2736709,
"nds-nl",
aliases = {"Drèents", "Dreins", "Dreints", "Drints"},
}
m["frs"] = {
"East Frisian Low German",
149208,
"nds-de",
aliases = {"East Frisian", "East Frisian Low Saxon"},
}
m["gos"] = {
"Gronings",
508854,
"nds-nl",
aliases = {"Grunnegs", "Grönnegs"},
}
m["nds-lpr"] = {
"Low Prussian",
33982,
"nds-de",
}
m["sdz"] = {
"Sallands",
3436668,
"nds-nl",
aliases = {"Sallaans", "Sallaands"},
}
m["stl"] = {
"Stellingwerfs",
506010,
"nds-nl",
aliases = {"Stellingwarfs"},
}
m["twd"] = {
"Twents",
497363,
"nds-nl",
aliases = {"Tweants"},
}
m["vel"] = {
"Veluws",
2484810,
"nds-nl",
}
m["wep"] = {
"Westphalian",
505655,
"nds-de",
aliases = {"Westfalish", "Westphalien"},
}
-----------------------------------------------------
-- North Frisian varieties --
-----------------------------------------------------
m["frr-ins"] = {
"Insular North Frisian",
110629610,
"frr",
}
m["frr-fam"] = {
"Föhr-Amrum North Frisian",
110629601,
"frr-ins",
}
m["frr-foh"] = {
"Föhr North Frisian",
28185,
"frr-fam",
aliases = {"Föhr Frisian", "Fering",
"Ferring", -- Glottolog
},
varieties = {"Aasdring", "Weesdring"},
}
m["frr-amr"] = {
"Amrum North Frisian",
28192,
"frr-fam",
aliases = {"Amrum Frisian", "Amrum", "Öömrang"},
}
m["frr-hel"] = {
"Heligoland North Frisian",
28086,
"frr-ins",
aliases = {"Heligoland Frisian", "Halunder", "Heligolandic Frisian", "Heligolandic North Frisian",
"Helgoland Frisian", "Helgoland North Frisian", "Helgoland"},
}
m["frr-syl"] = {
"Sylt North Frisian",
28181,
"frr-ins",
aliases = {"Sylt Frisian", "Söl'ring",
"Sölreng", -- Glottolog
},
}
m["frr-mai"] = {
"Mainland North Frisian",
110629626,
"frr",
}
m["frr-hal"] = {
"Halligen North Frisian",
28177,
"frr-mai",
aliases = {"Halligen Frisian", "Halifreesk", "Hallingen Frisian", "Hallingen North Frisian",
"Hallingen", -- Glottolog
},
}
m["frr-moo"] = {
	"Mooring North Frisian",
	28187,
	"frr-mai",
	aliases = {
		"Bökingharde North Frisian",
		"Bökingharde Frisian",
		"Böökinghiirder frasch",
		"Mooring",
		"Moring",
	},
	-- Each variety is listed as a group of names (presumably canonical name
	-- first, then its alternative -- confirm against the varieties handler).
	varieties = {
		{"East Mooring", "Ostermooring"},
		{"West Mooring", "Westermooring"},
	},
}
m["frr-kar"] = {
	"Karrharde North Frisian",
	28191,
	"frr-mai",
	aliases = {"Karrharde Frisian", "Karrharder"},
}
-- "Goesharde" strictly covers three neighbouring dialects: Northern, Central and Southern. The Southern one died
-- out in 1980-1981, which is why Glottolog uses the name "Norder-Mittelgoesharde" for the two that remain.
m["frr-goe"] = {
	"Goesharde North Frisian",
	28183,
	"frr-mai",
	aliases = {
		"Norder-Mittelgoesharde North Frisian",
		"Norder-Mittelgoesharde Frisian",
		"Norder-Mittelgoesharde",
		"Goesharde Frisian",
		"Goesharde",
		"Gooshiirder",
	},
}
m["frr-wie"] = {
	"Wiedingharde North Frisian",
	28171,
	"frr-mai",
	aliases = {
		"Wiedingharde Frisian",
		"Wiedingharde",
		"Wiringhiirder freesk",
	},
}
-----------------------------------------------------
-- Old Norse varieties --
-----------------------------------------------------
m["non-grn"] = {
"Greenlandic Norse",
855236,
"non-own",
}
m["non-oen"] = {
"Old East Norse",
10498031,
"non",
ancestors = "non",
}
m["non-own"] = {
"Old West Norse",
2377483,
"non",
ancestors = "non",
}
-----------------------------------------------------
-- Old Swedish varieties --
-----------------------------------------------------
m["gmq-osw-lat"] = {
"Late Old Swedish",
10723594,
"gmq-osw",
ancestors = "gmq-osw",
}
--------------------------------------------------------------------------------------
-- Greek varieties --
--------------------------------------------------------------------------------------
m["qsb-grc"] = {
"Pre-Greek",
965052,
"und",
family = "qfa-sub",
}
m["grc-aeo"] = {
"Aeolic Greek",
406373,
"grc",
aliases = {"Lesbic Greek", "Lesbian Greek", "Aeolian Greek"},
}
m["grc-arc"] = {
"Arcadian Greek",
nil,
"grc-arp",
}
m["grc-arp"] = {
"Arcadocypriot Greek",
499602,
"grc",
}
m["grc-att"] = {
"Attic Greek",
506588,
"grc",
}
m["grc-boi"] = {
"Boeotian Greek",
406373,
"grc-aeo",
}
m["grc-cyp"] = {
"Cypriot Ancient Greek", -- to distinguish from Cypriot Greek below
nil,
"grc-arp",
}
m["grc-dor"] = {
"Doric Greek",
285494,
"grc",
}
m["grc-ela"] = {
"Elean Greek",
nil,
"grc",
}
m["grc-epi"] = {
"Epic Greek",
990062,
"grc",
aliases = {"Homeric Greek"},
}
m["grc-ion"] = {
"Ionic Greek",
504165,
"grc",
}
m["grc-koi"] = {
"Koine Greek",
107358,
"grc",
ancestors = "grc-att",
aliases = {"Hellenistic Greek"},
}
m["grc-kre"] = {
"Cretan Ancient Greek", -- to distinguish from Cretan Greek below
nil,
"grc-dor",
}
m["grc-opl"] = {
"Opuntian Locrian",
nil,
"grc",
}
m["grc-ozl"] = {
"Ozolian Locrian",
nil,
"grc",
}
m["grc-pam"] = {
"Pamphylian Greek",
2271793,
"grc",
}
m["grc-ths"] = {
"Thessalian Greek",
406373,
"grc-aeo",
}
m["gkm"] = {
"Byzantine Greek",
36387,
"grc",
ancestors = "grc-koi",
aliases = {"Medieval Greek"},
}
m["el-cyp"] = {
"Cypriot Greek",
245899,
"el",
aliases = {"Cypriotic Greek"},
}
m["el-pap"] = {
"Paphian Greek",
nil,
"el",
}
m["el-crt"] = {
"Cretan Greek",
588306,
"el",
}
m["el-kth"] = {
"Katharevousa",
35961,
"el",
"Polyt",
ancestors = "gkm",
aliases = {"Katharevousa Greek"},
-- Polyt display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["el-kal"] = {
"Kaliarda",
12878658,
"el",
}
--------------------------------------------------------------------------------------
-- Indo-Iranian varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Indo-Aryan varieties --
-------------------------------------------------------------------------
-- reconstructed intermediate stages
m["pra-pro"] = {
"Proto-New Indo-Aryan",
nil,
"pra",
}
m["inc-ash-pro"] = {
"Proto-Middle Indo-Aryan",
nil,
"inc-ash",
}
m["inc-mit"] = {
"Mitanni",
1986700,
"inc-pro",
}
m["bra-old"] = {
"Old Braj",
nil,
"bra",
}
-- Apabhramsas
m["inc-aav"] = {
"Avahattha",
nil,
"inc-apa",
aliases = {"Abahattha"},
}
m["inc-asa"] = {
"Sauraseni Apabhramsa",
nil,
"inc-apa",
}
m["inc-agu"] = {
"Gurjara Apabhramsa",
nil,
"inc-apa",
}
m["inc-aka"] = {
"Kasmiri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ama"] = {
"Maharastri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ata"] = {
"Takka Apabhramsa",
nil,
"inc-apa",
}
m["inc-avr"] = {
"Vracada Apabhramsa",
nil,
"inc-apa",
}
-- Assamese varieties
m["as-bkm"] = {
"Barpetia Kamrupi Assamese",
30642960,
"as",
}
m["as-nkm"] = {
"Nalbaria Kamrupi Assamese",
85787678,
"as",
}
m["as-pkm"] = {
"Palasbaria Kamrupi Assamese",
nil,
"as",
}
-- Bengali varieties
m["bn-dvn"] = {
"Dhakaiya Vaṅga Bengali",
48726851,
"bn", -- Eastern Bengali variety
}
m["bn-nvn"] = {
"Noakhailla Vaṅga Bengali",
107548681,
"bn", -- Eastern Bengali variety
}
-- Dhivehi varieties
m["dv-old"] = {
"Old Dhivehi",
117790875,
"dv",
}
m["dv-mul"] = {
"Mulaku Dhivehi",
nil,
"dv",
aliases = {"Mulaku Divehi", "Mulaku Bas"},
}
m["dv-huv"] = {
"Huvadhu Dhivehi",
nil,
"dv",
aliases = {"Huvadhu Divehi", "Huvadhu Bas"},
}
m["dv-add"] = {
"Addu Dhivehi",
nil,
"dv",
aliases = {"Addu Divehi", "Addu Bas"},
}
-- Gujarati varieties
m["gu-kat"] = {
"Kathiyawadi",
nil,
"gu",
aliases = {"Kathiyawadi Gujarati", "Kathiawadi"},
}
m["gu-lda"] = {
"Lisan ud-Dawat Gujarati",
nil,
"gu",
aliases = {"Lisan ud-Dawat", "LDA"},
}
-- Hindi varieties
m["hi-mum"] = {
"Bombay Hindi",
3543151,
"hi",
aliases = {"Mumbai Hindi", "Bambaiyya Hindi"},
}
m["hi-mid"] = {
"Middle Hindi",
nil,
"inc-ohi",
ancestors = "inc-ohi",
}
-- Konkani varieties
m["kok-mid"] = {
"Middle Konkani",
nil,
"kok",
aliases = {"Medieval Konkani"},
}
m["kok-old"] = {
"Old Konkani",
nil,
"kok",
aliases = {"Early Konkani"},
}
-- Prakrits
m["pra-ard"] = {
"Ardhamagadhi Prakrit",
35217,
"pra",
aliases = {"Ardhamagadhi"},
}
m["pra-hel"] = {
"Helu Prakrit",
15080869,
"pra",
aliases = {"Elu", "Elu Prakrit", "Helu"},
}
m["pra-kha"] = {
"Khasa Prakrit",
nil,
"pra",
aliases = {"Khasa"},
}
m["pra-mag"] = {
"Magadhi Prakrit", -- Not to be confused with Magahi (mag)
2652214,
"pra",
aliases = {"Magadhi"},
}
m["pra-mah"] = {
"Maharastri Prakrit",
2586773,
"pra",
aliases = {"Maharashtri Prakrit", "Maharastri", "Maharashtri"},
}
m["pra-pai"] = {
	"Paisaci Prakrit",
	2995607,
	"pra-sau",
	-- `ancestors` repeats the positional "pra-sau" above.
	ancestors = "pra-sau",
	aliases = {"Paisaci", "Paisachi"},
}
m["pra-sau"] = {
"Sauraseni Prakrit",
2452885,
"pra",
aliases = {"Sauraseni", "Shauraseni"},
}
m["pra-ava"] = {
"Avanti",
nil,
"pra",
aliases = {"Avanti Prakrit"},
}
m["pra-pra"] = {
"Pracya",
nil,
"pra",
aliases = {"Pracya Prakrit"},
}
m["pra-bah"] = {
"Bahliki",
nil,
"pra",
aliases = {"Bahliki Prakrit"},
}
m["pra-dak"] = {
"Daksinatya",
nil,
"pra",
aliases = {"Daksinatya Prakrit"},
}
m["pra-sak"] = {
"Sakari",
nil,
"pra",
aliases = {"Sakari Prakrit"},
}
m["pra-can"] = {
"Candali",
nil,
"pra",
aliases = {"Candali Prakrit"},
}
m["pra-sab"] = {
"Sabari",
nil,
"pra",
aliases = {"Sabari Prakrit"},
}
m["pra-abh"] = {
"Abhiri",
nil,
"pra",
aliases = {"Abhiri Prakrit"},
}
m["pra-dra"] = {
"Dramili",
nil,
"pra",
aliases = {"Dramili Prakrit"},
}
m["pra-odr"] = {
"Odri",
nil,
"pra",
aliases = {"Odri Prakrit"},
}
-- Punjabi varieties
m["pnb"] = {
"Western Punjabi",
58635,
"pa",
"pa-Arab",
}
-- Sanskrit varieties
m["vsn"] = {
"Vedic Sanskrit",
36858,
"sa",
}
m["cls"] = {
"Classical Sanskrit",
9333703,
"sa",
}
m["sa-bhs"] = {
"Buddhist Hybrid Sanskrit",
248758,
"sa",
}
m["sa-bra"] = {
"Brahmanic Sanskrit",
139822891,
"vsn",
}
m["sa-epi"] = {
"Epic Sanskrit",
56702805,
"cls",
}
m["sa-neo"] = {
"New Sanskrit",
nil,
"sa",
}
m["sa-rig"] = {
"Rigvedic Sanskrit",
139822680,
"vsn",
}
-- Sinhalese varieties
m["si-med"] = {
"Medieval Sinhalese",
nil,
"si",
aliases = {"Medieval Sinhala"},
}
-------------------------------------------------------------------------
-- Iranian varieties --
-------------------------------------------------------------------------
m["qsb-bma"] = {
"the BMAC substrate",
133187435,
"und",
family = "qfa-sub",
aliases = {"the Bactria-Margiana substrate", "the Bactria-Margiana Archaeological Complex substrate"},
}
-- Historical and current Iranian dialects
m["ae-old"] = {
"Old Avestan",
29572,
"ae",
aliases = {"Gathic Avestan"},
}
m["ae-yng"] = {
"Younger Avestan",
29572,
"ae-old",
aliases = {"Young Avestan"},
}
m["bcc"] = {
"Southern Balochi",
33049,
"bal",
aliases = {"Southern Baluchi"},
}
m["bgp"] = {
"Eastern Balochi",
33049,
"bal",
aliases = {"Eastern Baluchi"},
}
m["bgn"] = {
"Western Balochi",
33049,
"bal",
aliases = {"Western Baluchi"},
}
m["bsg-ban"] = {
"Bandari",
nil,
"bsg",
}
m["bsg-hor"] = {
"Hormozi",
nil,
"bsg",
}
m["bsg-min"] = {
"Minabi",
nil,
"bsg",
}
m["kho-old"] = {
"Old Khotanese",
nil,
"kho",
}
m["kho-lat"] = {
"Late Khotanese",
nil,
"kho-old",
}
m["peo-ear"] = {
"Early Old Persian",
nil,
"peo",
}
m["peo-lat"] = {
"Late Old Persian",
nil,
"peo",
}
m["pal-ear"] = {
"Early Middle Persian",
nil,
"pal",
}
m["pal-lat"] = {
"Late Middle Persian",
nil,
"pal",
ancestors = "pal-ear",
}
m["ps-nwe"] = {
"Northwestern Pashto",
nil,
"ps",
}
m["ps-cgi"] = {
"Central Ghilzay",
nil,
"ps-nwe",
}
m["ps-mah"] = {
"Mahsudi",
nil,
"ps-nwe",
}
m["ps-nea"] = {
"Northeastern Pashto",
nil,
"ps",
}
m["ps-afr"] = {
"Afridi",
nil,
"ps-nea",
}
m["ps-bng"] = {
"Bangash",
nil,
"ps-nea",
}
m["ps-xat"] = {
"Khatak",
nil,
"ps-nea",
}
m["ps-pes"] = {
"Peshawari",
nil,
"ps-nea",
}
m["ps-sea"] = {
"Southeastern Pashto",
nil,
"ps",
}
m["ps-ban"] = {
"Bannu",
nil,
"ps-sea",
}
m["ps-kak"] = {
"Kakari",
nil,
"ps-sea",
}
m["ps-ser"] = {
"Sher",
nil,
"ps-sea",
}
m["ps-waz"] = {
"Waziri",
12274473,
"ps-sea",
}
m["ps-swe"] = {
"Southwestern Pashto",
nil,
"ps",
}
m["ps-kan"] = {
"Kandahari",
nil,
"ps-swe",
}
m["ps-jad"] = {
	"Jadrani",
	nil, -- no Wikidata item recorded
	"ps",
	ancestors = "ira-pat-pro",
}
m["xme-azr"] = {
"Old Azari",
nil,
"xme-ott",
aliases = {"Old Azeri", "Azari", "Azeri", "Āḏarī", "Adari", "Adhari"},
}
m["xme-ttc-cen"] = {
"Central Tati",
nil,
"xme-ott",
}
m["xme-ttc-eas"] = {
"Eastern Tati",
nil,
"xme-ott",
}
m["xme-ttc-nor"] = {
"Northern Tati",
nil,
"xme-ott",
}
m["xme-ttc-sou"] = {
"Southern Tati",
nil,
"xme-ott",
}
m["xme-ttc-wes"] = {
"Western Tati",
nil,
"xme-ott",
}
m["xmn"] = {
"Manichaean Middle Persian",
nil,
"pal-lat",
}
m["fa-ear"] = {
"Early New Persian",
127413796,
"fa",
ancestors = "pal-lat",
translit = "fa-cls-translit",
}
m["fa-cls"] = {
"Classical Persian",
9168,
"fa",
ancestors = "fa-ear",
translit = "fa-cls-translit",
}
m["fa-ira"] = {
"Iranian Persian",
3513637,
"fa",
aliases = {"Modern Persian", "Western Persian"},
translit = "fa-ira-translit",
}
m["prs"] = {
"Dari",
178440,
"fa",
aliases = {"Dari Persian", "Central Persian", "Eastern Persian", "Afghan Persian"},
translit = "fa-cls-translit",
}
m["haz"] = {
"Hazaragi",
33398,
"prs",
translit = "fa-cls-translit",
}
m["os-dig"] = {
"Digor Ossetian",
3027861,
"os",
aliases = {"Digoron", "Digor"},
}
m["os-iro"] = {
"Iron Ossetian",
nil,
"os",
aliases = {"Iron"},
}
m["sog-ear"] = {
"Early Sogdian",
nil,
"sog",
}
m["sog-lat"] = {
"Late Sogdian",
nil,
"sog-ear",
}
-- NOTE(review): this entry hangs off "ro" yet sits among the Iranian dialect entries (between sog-lat and oru-kan).
-- It looks misplaced and presumably belongs with the Romance varieties -- confirm before moving.
m["ro-MD"] = {
"Moldovan",
36392,
"ro",
aliases = {"Moldavian"},
}
m["oru-kan"] = {
"Kaniguram",
6363164,
"oru",
}
m["oru-log"] = {
"Logar",
nil,
"oru",
}
m["oos"] = {
"Old Ossetic",
65455882,
"xln",
}
m["oos-ear"] = {
"Early Old Ossetic",
nil,
"oos",
}
m["oos-lat"] = {
"Late Old Ossetic",
nil,
"oos",
}
m["rdb-jir"] = {
"Jirofti",
nil,
"rdb",
}
m["rdb-kah"] = {
"Kahnuji",
nil,
"rdb",
}
-- Southwestern Fars lects
m["fay-bur"] = {
"Burenjani",
nil,
"fay",
}
m["fay-bsh"] = {
"Bushehri",
nil,
"fay",
}
m["fay-dsh"] = {
"Dashtaki",
nil,
"fay",
}
m["fay-dav"] = {
"Davani",
5228140,
"fay",
}
m["fay-eze"] = {
"Emamzada Esmaili",
nil,
"fay",
}
m["fay-gav"] = {
"Gavkoshaki",
nil,
"fay",
}
m["fay-kho"] = {
"Khollari",
nil,
"fay",
}
m["fay-kon"] = {
"Kondazi",
nil,
"fay",
}
m["fay-kzo"] = {
"Old Kazeruni",
nil,
"fay",
}
m["fay-mas"] = {
"Masarami",
nil,
"fay",
}
m["fay-pap"] = {
"Papuni",
nil,
"fay",
}
m["fay-sam"] = {
"Samghani",
nil,
"fay",
}
m["fay-shr"] = {
"Shirazi",
nil,
"fay",
}
m["fay-sho"] = {
"Old Shirazi",
nil,
"fay",
}
m["fay-kar"] = {
"Khargi",
nil,
"fay",
}
m["fay-sor"] = {
"Sorkhi",
nil,
"fay",
}
-- Talysh lects
m["tly-cen"] = {
"Central Talysh",
nil,
"tly",
}
m["tly-asa"] = {
"Asalemi",
nil,
"tly-cen",
}
m["tly-kar"] = {
"Karganrudi",
nil,
"tly-cen",
}
m["tly-tul"] = {
"Tularudi",
nil,
"tly-cen",
}
m["tly-tal"] = {
"Taleshdulabi",
nil,
"tly-cen",
}
m["tly-nor"] = {
"Northern Talysh",
nil,
"tly",
}
m["tly-aze"] = {
"Azerbaijani Talysh",
nil,
"tly-nor",
}
m["tly-anb"] = {
"Anbarani",
nil,
"tly-nor",
}
m["tly-sou"] = {
"Southern Talysh",
nil,
"tly",
}
m["tly-fum"] = {
"Fumani",
nil,
"tly-sou",
}
m["tly-msu"] = {
"Masulei",
nil,
"tly-sou",
}
m["tly-msa"] = {
"Masali",
nil,
"tly-sou",
}
m["tly-san"] = {
"Shandarmani",
nil,
"tly-sou",
}
-- Tafreshi lects
m["xme-amo"] = {
"Amorehi",
nil,
"xme-taf",
}
m["atn"] = {
"Ashtiani",
3436590,
"xme-taf",
}
m["xme-bor"] = {
"Borujerdi",
nil,
"xme-taf",
}
m["xme-ham"] = {
"Hamadani",
6302426,
"xme-taf",
}
m["xme-kah"] = {
"Kahaki",
nil,
"xme-taf",
}
m["vaf"] = {
"Vafsi",
32611,
"xme-taf",
}
-- Kermanic lects
m["kfm"] = {
"Khunsari",
6403030,
"xme-ker",
}
m["xme-mah"] = {
"Mahallati",
nil,
"xme-ker",
}
m["xme-von"] = {
"Vonishuni",
nil,
"xme-ker",
}
m["xme-bdr"] = {
"Badrudi",
nil,
"xme-ker",
}
m["xme-del"] = {
"Delijani",
nil,
"xme-ker",
}
m["xme-kas"] = {
"Kashani",
nil,
"xme-ker",
}
m["xme-kes"] = {
"Kesehi",
nil,
"xme-ker",
}
m["xme-mey"] = {
"Meymehi",
nil,
"xme-ker",
}
m["ntz"] = {
"Natanzi",
6968399,
"xme-ker",
}
m["xme-abz"] = {
"Abuzeydabadi",
nil,
"xme-ker",
}
m["xme-aby"] = {
"Abyanehi",
nil,
"xme-ker",
}
m["xme-far"] = {
"Farizandi",
nil,
"xme-ker",
}
m["xme-jow"] = {
"Jowshaqani",
nil,
"xme-ker",
}
m["xme-nas"] = {
"Nashalji",
nil,
"xme-ker",
}
m["xme-qoh"] = {
"Qohrudi",
nil,
"xme-ker",
}
m["xme-yar"] = {
"Yarandi",
nil,
"xme-ker",
}
m["soj"] = {
"Soi",
7930463,
"xme-ker",
aliases = {"Sohi"},
}
m["xme-tar"] = {
"Tari",
nil,
"xme-ker",
}
m["gzi"] = {
"Gazi",
5529130,
"xme-ker",
}
m["xme-sed"] = {
"Sedehi",
nil,
"xme-ker",
}
m["xme-ard"] = {
"Ardestani",
nil,
"xme-ker",
}
m["xme-zef"] = {
"Zefrehi",
nil,
"xme-ker",
}
m["xme-isf"] = {
"Isfahani",
nil,
"xme-ker",
}
m["xme-kaf"] = {
"Kafroni",
nil,
"xme-ker",
}
m["xme-vrz"] = {
"Varzenehi",
nil,
"xme-ker",
}
m["xme-xur"] = {
"Khuri",
nil,
"xme-ker",
}
m["nyq"] = {
"Nayini",
6983146,
"xme-ker",
}
m["xme-ana"] = {
"Anaraki",
nil,
"xme-ker",
}
m["gbz"] = {
"Zoroastrian Dari",
32389,
"xme-ker",
aliases = {"Behdināni", "Gabri", "Gavrŭni", "Gabrōni"},
}
m["xme-krm"] = {
"Kermani",
nil,
"xme-ker",
}
m["xme-yaz"] = {
"Yazdi",
nil,
"xme-ker",
}
m["xme-bid"] = {
"Bidhandi",
nil,
"xme-ker",
}
m["xme-bij"] = {
"Bijagani",
nil,
"xme-ker",
}
m["xme-cim"] = {
"Chimehi",
nil,
"xme-ker",
}
m["xme-han"] = {
"Hanjani",
nil,
"xme-ker",
}
m["xme-kom"] = {
"Komjani",
nil,
"xme-ker",
}
m["xme-nar"] = {
"Naraqi",
nil,
"xme-ker",
}
m["xme-nus"] = {
"Nushabadi",
nil,
"xme-ker",
}
m["xme-qal"] = {
"Qalhari",
nil,
"xme-ker",
}
m["xme-trh"] = {
"Tarehi",
nil,
"xme-ker",
}
m["xme-val"] = {
"Valujerdi",
nil,
"xme-ker",
}
m["xme-var"] = {
"Varani",
nil,
"xme-ker",
}
m["xme-zor"] = {
"Zori",
nil,
"xme-ker",
}
-- Ramandi lects
m["tks-ebr"] = {
"Ebrahimabadi",
nil,
"tks",
}
m["tks-sag"] = {
"Sagzabadi",
nil,
"tks",
}
m["tks-esf"] = {
"Esfarvarini",
nil,
"tks",
}
m["tks-tak"] = {
"Takestani",
nil,
"tks",
}
m["tks-cal"] = {
"Chali Tati",
nil,
"tks",
aliases = {"Chāli"},
}
m["tks-dan"] = {
"Danesfani",
nil,
"tks",
}
m["tks-xia"] = {
"Khiaraji",
nil,
"tks",
}
m["tks-xoz"] = {
"Khoznini",
nil,
"tks",
}
-- Shughni dialects
m["sgh-bro"] = {
"Bartangi-Oroshori",
nil,
"sgh",
}
m["sgh-bar"] = {
"Bartangi",
nil,
"sgh-bro",
}
m["sgh-oro"] = {
"Oroshori",
nil,
"sgh-bro",
aliases = {"Roshorvi"},
}
m["sgh-rsx"] = {
"Roshani-Khufi",
nil,
"sgh",
}
m["sgh-xuf"] = {
"Khufi",
2562249,
"sgh-rsx",
aliases = {"Xufi", "Xūfī"},
}
m["sgh-ros"] = {
"Roshani",
2597566,
"sgh-rsx",
aliases = {"Rushani", "Rōšāni"},
}
m["sgh-xgb"] = {
"Khughni-Bajui",
nil,
"sgh",
}
m["sgh-xug"] = {
"Khughni",
nil,
"sgh-xgb",
}
m["sgh-baj"] = {
"Bajui",
nil,
"sgh-xgb",
}
-------------------------------------------------------------------------
-- Nuristani varieties --
-------------------------------------------------------------------------
m["bsh-kat"] = {
"Kativiri",
2605045,
"bsh",
aliases = {"Katə́viri"},
}
m["xvi"] = {
"Kamviri",
1193495,
"bsh",
aliases = {"Kamvíri"},
}
m["bsh-mum"] = {
"Mumviri",
nil,
"bsh",
aliases = {"Mumvíri"},
}
--------------------------------------------------------------------------------------
-- Italic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Latin varieties --
-------------------------------------------------------------------------
-- Latin varieties by period
m["itc-ola"] = {
	"Old Latin",
	12289,
	"la",
	"Latn, Ital",
	-- Transliteration is configured for the Ital script only.
	translit = {Ital = "Ital-translit"},
}
m["itc-lan"] = {
"Lanuvian",
16890829,
"itc-ola",
aliases = {"Lanuvine"},
}
m["itc-pra"] = {
"Praenestine",
16889772,
"itc-ola",
aliases = {"Praenestinian"},
}
m["la-cla"] = {
"Classical Latin",
253854,
"la",
}
m["la-vul"] = {
"Vulgar Latin",
37560,
"la-cla",
}
m["la-afr"] = {
"African Romance",
162064,
"roa-pro",
}
m["la-lat"] = {
"Late Latin",
1503113,
"la",
ancestors = "la-cla",
}
m["la-med"] = {
"Medieval Latin",
1163234,
"la",
ancestors = "la-lat",
}
m["la-eme"] = {
"Early Medieval Latin",
nil,
"la-med",
}
m["la-ecc"] = {
	"Ecclesiastical Latin",
	1247932,
	"la",
	ancestors = "la-lat",
	aliases = {
		"Church Latin",
		"Liturgical Latin",
	},
}
m["la-ren"] = {
"Renaissance Latin",
499083,
"la",
ancestors = "la-med",
}
m["la-new"] = {
	"New Latin",
	1248221,
	"la",
	ancestors = "la-ren",
	aliases = {"Modern Latin"},
}
m["la-con"] = {
"Contemporary Latin",
1246397,
"la-new",
}
-------------------------------------------------------------------------
-- Miscellaneous Italic varieties --
-------------------------------------------------------------------------
m["xfa-cap"] = {
"Capenate",
133182969,
"xfa",
}
m["osc-luc"] = {
"Lucanian",
3265025,
"osc",
}
m["osc-sam"] = {
"Samnite",
133184287,
"osc",
}
-------------------------------------------------------------------------
-- Romance varieties --
-------------------------------------------------------------------------
m["roa-pro"] = {
"Proto-Romance",
3408029,
"la-lat",
ancestors = "la-vul",
}
-----------------------------------------------------
-- Catalan varieties --
-----------------------------------------------------
m["ca-val"] = {
"Valencian",
32641,
"ca",
}
-----------------------------------------------------
-- Franco-Provençal varieties --
-----------------------------------------------------
m["frp-old"] = {
"Old Franco-Provençal",
nil,
"frp",
}
-----------------------------------------------------
-- French and derived creole varieties --
-----------------------------------------------------
m["fro-nor"] = {
"Old Northern French",
2044917,
"fro",
aliases = {"Old Norman", "Old Norman French"},
}
m["fro-pic"] = {
"Picard Old French",
nil,
"fro",
}
m["xno"] = {
"Anglo-Norman",
35214,
"fro-nor",
}
m["xno-law"] = {
"Law French",
2044323,
"xno",
}
m["zrp"] = {
"Zarphatic",
36994,
"fro",
aliases = {"Judeo-French"},
pseudo_families = "qfa-jew",
}
m["fr-CA"] = {
"Canadian French",
1450506,
"fr",
}
m["fr-CH"] = {
"Swiss French",
1480152,
"fr",
}
m["fr-aca"] = {
"Acadian French",
415109,
"fr",
}
m["fr-lou"] = {
"Louisiana French",
3083213,
"fr",
}
m["fr-mis"] = {
"Missouri French",
3083210,
"fr",
}
m["frc"] = {
"Cajun French",
880301,
"fr-lou",
}
m["ht-sdm"] = {
"Saint Dominican Creole French",
nil,
"ht",
ancestors = "fr",
}
-- Norman varieties
m["nrf-grn"] = {
"Guernsey Norman",
56428,
"nrf",
aliases = {"Guernsey"},
}
m["nrf-jer"] = {
"Jersey Norman",
56430,
"nrf",
aliases = {"Jersey"},
}
-----------------------------------------------------
-- Gallo-Italic varieties --
-----------------------------------------------------
m["egl-old"] = {
"Old Emilian",
nil,
"egl",
}
m["lij-old"] = {
"Old Ligurian",
nil,
"lij",
aliases = {"Old Genoese"},
}
m["lmo-old"] = {
"Old Lombard",
97165320,
"lmo",
}
m["pms-old"] = {
"Old Piedmontese",
nil,
"pms",
aliases = {"Old Piemontese"},
}
m["vec-old"] = {
"Old Venetan",
nil,
"vec",
aliases = {"Old Venetian"},
}
m["rgn-old"] = {
"Old Romagnol",
nil,
"rgn",
}
-----------------------------------------------------
-- Italo-Romance varieties --
-----------------------------------------------------
-- Italian varieties
m["roa-oit"] = {
"Old Italian",
nil,
"it",
}
m["it-CH"] = {
"Switzerland Italian",
672147,
"it",
}
-- Other Italo-Romance varieties
m["nap-old"] = {
"Old Neapolitan",
nil,
"nap",
}
m["scn-old"] = {
"Old Sicilian",
nil,
"scn",
}
-----------------------------------------------------
-- Occitan varieties --
-----------------------------------------------------
m["oc-auv"] = {
"Auvergnat",
35359,
"oc",
aliases = {"Auvernhat", "Auvergnese"},
}
m["oc-gas"] = {
"Gascon",
35735,
"oc",
}
-- standardized dialect of Gascon
m["oc-ara"] = {
"Aranese",
10196,
"oc-gas",
}
m["oc-lan"] = {
"Languedocien",
942602,
"oc",
aliases = {"Lengadocian"},
}
m["oc-lim"] = {
"Limousin",
427614,
"oc",
}
m["oc-pro"] = {
"Provençal",
241243,
"oc",
aliases = {"Provencal"},
}
m["oc-pro-old"] = {
"Old Provençal",
2779185,
"pro",
}
m["oc-viv"] = {
"Vivaro-Alpine",
1649613,
"oc",
}
m["oc-jud"] = {
"Shuadit",
56472,
"oc",
aliases = {
"Chouhadite", "Chouhadit", "Chouadite", "Chouadit", "Shuhadit",
"Judeo-Occitan", "Judæo-Occitan", "Judaeo-Occitan",
"Judeo-Provençal", "Judæo-Provençal", "Judaeo-Provençal",
"Judeo-Provencal", "Judaeo-Provencal",
"Judeo-Comtadin", "Judæo-Comtadin", "Judaeo-Comtadin",
},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Portuguese and derived creole varieties --
-----------------------------------------------------
-- Portuguese
m["pt-BR"] = {
"Brazilian Portuguese",
750553,
"pt",
}
m["pt-PT"] = {
"European Portuguese",
922399,
"pt",
}
-- Kabuverdianu (Cape Verde Creole, Cape Verdean Creole)
m["kea-bar"] = {
"Barlavento Kabuverdianu",
2217638,
"kea",
aliases = {"Barlavento", "Barlavento Creole", "Sampadjudu"},
}
m["kea-bvi"] = {
"Boa Vista Kabuverdianu",
16501837,
"kea-bar",
aliases = {"Boa Vista Creole"},
}
m["kea-sal"] = {
"Sal Kabuverdianu",
18707467,
"kea-bar",
aliases = {"Sal Creole"},
}
m["kea-saa"] = {
"Santo Antão Kabuverdianu",
18707472,
"kea-bar",
aliases = {"Santo Antão Creole"},
}
m["kea-sni"] = {
"São Nicolau Kabuverdianu",
18707549,
"kea-bar",
aliases = {"São Nicolau Creole"},
}
m["kea-svi"] = {
"São Vicente Kabuverdianu",
18707550,
"kea-bar",
aliases = {"São Vicente Creole"},
}
m["kea-sot"] = {
"Sotavento Kabuverdianu",
10261559,
"kea",
aliases = {"Sotavento", "Sotavento Creole", "Badiu"},
}
m["kea-bra"] = {
"Brava Kabuverdianu",
18670181,
"kea-sot",
aliases = {"Brava Creole"},
}
m["kea-fog"] = {
"Fogo Kabuverdianu",
18706861,
"kea-sot",
aliases = {"Fogo Creole"},
}
m["kea-mai"] = {
"Maio Kabuverdianu",
18707286,
"kea-sot",
aliases = {"Maio Creole"},
}
m["kea-san"] = {
"Santiago Kabuverdianu",
35117,
"kea-sot",
aliases = {"Santiago Creole"},
}
m["kea-alu"] = {
"ALUPEC Kabuverdianu",
375704,
"kea",
aliases = {"ALUPEC", "Alfabeto Unificado para a Escrita do Cabo-Verdiano"},
}
-----------------------------------------------------
-- Rhaeto-Romance varieties --
-----------------------------------------------------
-- Friulian varieties
m["fur-old"] = {
"Old Friulian",
nil,
"fur",
}
-- Ladin varieties
m["lld-amp"] = {
"Ampezan Ladin",
25617466,
"lld",
aliases = {"Anpezan", "Ampezan", "Ampezzan", "Ampezzano"},
}
m["lld-bad"] = {
"Badiot Ladin",
3706562,
"lld",
aliases = {"Badiot", "Badioto", "Badiotto"},
}
m["lld-cad"] = {
"Cadorino Ladin",
3706570,
"lld",
aliases = {"Cadorino"},
}
m["lld-fas"] = {
"Fascian Ladin",
742627,
"lld",
aliases = {"Fascian", "Fassano"},
}
m["lld-fod"] = {
"Fodom Ladin",
3706605,
"lld",
aliases = {"Fodom", "Livinallese"},
}
m["lld-for"] = {
"Fornes Ladin",
5470374,
"lld",
aliases = {"Fornes"},
}
m["lld-ghe"] = {
"Gherdëina Ladin",
3706597,
"lld",
aliases = {"Gherdëina", "Gardenese", "Val Gardena"},
}
m["lld-non"] = {
"Nones Ladin",
1055027,
"lld",
aliases = {"Nones", "Noneso"},
}
-- Romansh varieties
m["rm-old"] = {
"Old Romansh",
nil,
"rm",
}
m["rm-put"] = {
"Puter Romansh",
688309,
"rm",
aliases = {"Puter", "Putèr", "Upper Engadine", "rm-puter"},
}
m["rm-srm"] = {
"Surmiran Romansh",
690216,
"rm",
aliases = {"Surmiran", "rm-surmiran",
"Surmiran-Albula", -- Glottolog
},
}
m["rm-srs"] = {
"Sursilvan Romansh",
688348,
"rm",
aliases = {"Sursilvan", "rm-sursilv"},
}
m["rm-sut"] = {
"Sutsilvan Romansh",
688272,
"rm",
aliases = {"Sutsilvan", "rm-sutsilv"},
varieties = {"Scharans Sutsilvan"}, -- per Glottolog
}
-- Vallader is the Lower Engadine variety of Romansh.
-- "Putèr" is intentionally NOT listed as an alias here: it is the native name of Puter (Upper Engadine) and is
-- already an alias of rm-put, so repeating it on this entry made the alias ambiguous.
m["rm-val"] = {
"Vallader Romansh",
690226,
"rm",
aliases = {"Vallader", "Lower Engadine", "rm-vallader"},
}
m["rm-gri"] = {
"Rumantsch Grischun",
688873,
"rm",
aliases = {"rm-rumgr"},
}
-----------------------------------------------------
-- Sardinian varieties --
-----------------------------------------------------
m["sc-old"] = {
"Old Sardinian",
nil,
"sc",
}
m["sc-src"] = {
"Logudorese",
777974,
"sc",
aliases = {"Logudorese Sardinian"},
}
m["sc-nuo"] = {
"Nuorese",
nil,
"sc-src",
aliases = {"Nuorese Sardinian"},
}
m["sc-sro"] = {
"Campidanese",
35348,
"sc",
aliases = {"Campidanese Sardinian"},
}
-----------------------------------------------------
-- Spanish varieties --
-----------------------------------------------------
m["es-ear"] = {
"Early Modern Spanish",
5364419,
"es",
}
m["es-AR"] = {
"Rioplatense Spanish",
509780,
"es",
}
m["es-BO"] = {
"Bolivian Spanish",
510730,
"es",
}
m["es-CL"] = {
"Chilean Spanish",
857295,
"es",
}
m["es-CO"] = {
"Colombian Spanish",
1115875,
"es",
}
m["es-CU"] = {
"Cuban Spanish",
824909,
"es",
}
m["es-MX"] = {
"Mexican Spanish",
616620,
"es",
}
m["es-PE"] = {
"Peruvian Spanish",
736236,
"es",
}
m["es-PH"] = {
"Philippine Spanish",
22091406,
"es",
}
m["es-US"] = {
"United States Spanish",
2301077,
"es",
aliases = {"US Spanish"},
}
-- Use the label "US Spanish" to put Spanish terms in the "United States Spanish" (es-US) category.
m["es-PR"] = {
"Puerto Rican Spanish",
7258609,
"es",
}
m["es-VE"] = {
"Venezuelan Spanish",
840017,
"es",
}
m["es-lun"] = {
"Lunfardo",
1401612,
"es",
}
----------------------------------------------------------------------------------------------------------------------
-- Japonic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Japanese varieties
m["ja-mid"] = {
"Middle Japanese",
6841474,
"ojp",
ancestors = "ojp",
}
m["ja-mid-ear"] = {
"Early Middle Japanese",
182695,
"ja-mid",
}
m["ja-mid-lat"] = {
"Late Middle Japanese",
1816184,
"ja-mid",
ancestors = "ja-mid-ear",
}
m["ja-ear"] = {
"Early Modern Japanese",
5326692,
"ja",
ancestors = "ja-mid-lat",
}
m["ojp-eas"] = {
"Eastern Old Japanese",
65247957,
"ojp",
}
m["ja-cla"] = {
"Classical Japanese",
1332057,
"ja",
-- FIXME: This is redundant because Classical Japanese is considered a child of (Modern) Japanese, which has ja-mid-ear
-- (as well as ja-mid-lat) as ancestors. However, the intent here is that the *direct* ancestor of ja-cla is ja-mid-ear
-- and ja-mid-lat is not an ancestor. Need to rethink ancestor handling.
-- ancestors = "ja-mid-ear",
}
----------------------------------------------------------------------------------------------------------------------
-- Koreanic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Korean varieties
m["oko-lat"] = {
"Late Old Korean",
nil,
"oko",
}
m["okm-ear"] = {
"Early Middle Korean",
nil,
"okm",
}
m["ko-cen"] = {
"Central Korean",
nil,
"ko",
}
m["ko-gyg"] = {
"Gyeonggi Korean",
485492,
"ko-cen",
aliases = {"Seoul Korean"},
}
m["ko-chu"] = {
"Chungcheong Korean",
625800,
"ko-cen",
aliases = {"Hoseo Korean"},
}
m["ko-hwa"] = {
"Hwanghae Korean",
16183706,
"ko-cen",
}
m["ko-gan"] = {
"Gangwon Korean",
11260444,
"ko-cen",
aliases = {"Yeongdong Korean"},
}
m["ko-gys"] = {
"Gyeongsang Korean",
488002,
"ko",
aliases = {"Southeastern Korean"},
}
m["ko-jeo"] = {
"Jeolla Korean",
11250166,
"ko",
aliases = {"Southwestern Korean"},
}
m["ko-pyo"] = {
"Pyongan Korean",
7263142,
"ko",
aliases = {"Northwestern Korean"},
}
m["ko-ham"] = {
"Hamgyong Korean",
860702,
"ko",
aliases = {"Northeastern Korean"},
}
m["ko-yuk"] = {
"Yukjin Korean",
16171275,
"ko",
aliases = {"Yukchin Korean", "Ryukjin Korean", "Ryukchin Korean"},
}
----------------------------------------------------------------------------------------------------------------------
-- Mongolic varieties --
----------------------------------------------------------------------------------------------------------------------
m["xng-ear"] = {
"Early Middle Mongol",
nil,
"xng",
}
m["xng-lat"] = {
"Late Middle Mongol",
nil,
"xng",
ancestors = "xng-ear",
}
m["mn-kha"] = {
"Khalkha Mongolian",
6399808,
"mn",
aliases = {"Khalkha"},
}
m["mn-ord"] = {
"Ordos Mongolian",
716904,
"mn",
aliases = {"Ordos"},
}
m["mn-cha"] = {
"Chakhar Mongolian",
907425,
"mn",
aliases = {"Chakhar"},
}
m["mn-khr"] = {
"Khorchin Mongolian",
3196210,
"mn",
aliases = {"Khorchin"},
}
----------------------------------------------------------------------------------------------------------------------
-- Niger-Congo varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akan varieties --
-----------------------------------------------------
m["tw"] = {
"Twi Akan",
36850,
"ak",
aliases = {"Twi"},
}
m["abr"] = {
"Abron",
34831,
"tw",
aliases = {"Brong", "Bono", "Bono Twi"},
}
m["tw-asa"] = {
"Asante Twi",
19261685,
"tw",
aliases = {"Asante", "Ashanti", "Ashante"},
}
m["tw-aku"] = {
"Akuapem Twi",
31150449,
"tw",
aliases = {"Akuapem", "Akuapim", "Akwapem Twi", "Akwapi"},
}
m["fat"] = {
"Fante Akan",
35570,
"ak",
aliases = {"Fante", "Fanti", "Fantse", "Mfantse"},
}
m["wss"] = {
"Wasa",
36914,
"ak",
}
-- creole
m["alv-kro"] = {
"Kromanti",
1093206,
"crp-mar",
}
-----------------------------------------------------
-- Bantu varieties --
-----------------------------------------------------
m["bnt-cmn"] = {
"Common Bantu",
nil,
"bnt-pro",
}
m["xh-bha"] = {
"Bhaca",
4900493,
"xh",
aliases = {"isiBhaca", "IsiBhaca"},
}
-- Rwanda-Rundi varieties
m["rw-kin"] = {
"Kinyarwanda",
33573,
"rw",
aliases = {"Rwanda"},
}
m["rw-run"] = {
"Kirundi",
33583,
"rw",
aliases = {"Rundi"},
}
-----------------------------------------------------
-- Fula varieties --
-----------------------------------------------------
m["fuc"] = {
"Pulaar",
1420205,
"ff",
}
m["fuf"] = {
"Pular",
3915357,
"ff",
}
m["ffm"] = {
"Maasina Fulfulde",
3915322,
"ff",
}
m["fue"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Borgu Fulfulde",
12952426,
"ff",
}
m["fuh"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Western Niger Fulfulde",
12952430,
"ff",
}
m["fuq"] = {
-- no enwiki entry as of yet but frwiki, hrwiki and pmswiki have one
"Central-Eastern Niger Fulfulde",
12628799,
"ff",
}
m["fuv"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki and swwiki have one
"Nigerian Fulfulde",
36129,
"ff",
}
m["fub"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki, ptwiki, swwiki and yowiki have one
"Adamawa Fulfulde",
34776,
"ff",
}
m["fui"] = {
-- no enwiki entry as of yet but pmswiki and swwiki have one
"Bagirmi Fulfulde",
11003859,
"ff",
}
----------------------------------------------------------------------------------------------------------------------
-- Papuan varieties --
----------------------------------------------------------------------------------------------------------------------
m["kze"] = {
"Kosena",
12952663,
"auy",
}
m["ont"] = {
"Ontenu",
3352827,
"gaj",
aliases = {"Ontena"},
}
----------------------------------------------------------------------------------------------------------------------
-- Salishan varieties --
----------------------------------------------------------------------------------------------------------------------
m["lut-nor"] = {
"Northern Lushootseed",
nil,
"lut",
aliases = {"Northern Puget Sound Salish"},
}
m["slh"] = {
"Southern Lushootseed",
7997684,
"lut",
aliases = {"Southern Puget Sound Salish", "Twulshootseed", "Whulshootseed"},
}
m["ska"] = {
"Skagit",
12642471,
"lut-nor",
}
m["sno"] = {
"Snohomish",
25559662,
"lut-nor",
}
----------------------------------------------------------------------------------------------------------------------
-- Sino-Tibetan varieties --
----------------------------------------------------------------------------------------------------------------------
m["tbq-pro"] = {
"Proto-Tibeto-Burman",
7251864,
"sit-pro",
}
-----------------------------------------------------
-- Chinese varieties --
-----------------------------------------------------
------------- Old Chinese, Middle Chinese -------------
m["och-ear"] = {
"Early Old Chinese",
nil,
"och",
}
m["och-lat"] = {
"Late Old Chinese",
nil,
"och",
}
m["ltc-ear"] = {
"Early Middle Chinese",
nil,
"ltc",
}
m["ltc-lat"] = {
"Late Middle Chinese",
nil,
"ltc",
}
------------- Classical/Literary varieties -------------
-- FIXME: Temporary.
m["lzh-shi"] = {
"Traditional Chinese poetry",
1759242,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cii"] = {
"Ci",
1091366,
"lzh",
}
-- FIXME: Temporary.
m["lzh-yue"] = {
"Classical Cantonese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn"] = {
"Classical Mandarin",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-tai"] = {
"Classical Taishanese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn-TW"] = {
"Classical Taiwanese Mandarin",
nil,
"lzh-cmn",
}
-- FIXME: Temporary.
m["lzh-VI"] = {
"Vietnamese Classical Chinese",
17034227,
"lzh",
}
-- FIXME: Temporary.
m["lzh-KO"] = {
"Korean Classical Chinese",
10496257,
"lzh",
ietf_subtag = "lzh-KR" -- KR = South Korea, as there is no code for Korea as a whole
}
-- FIXME: Temporary.
m["lzh-lit"] = {
"Literary Chinese",
nil,
"lzh",
}
-- FIXME: Temporary. FIXME: Do we need this? How does it differ from Old Chinese?
m["lzh-pre"] = {
"Pre-Classical Chinese",
nil,
"lzh",
}
------------- Written Vernacular varieties -------------
-- FIXME: Temporary.
m["cmn-wvc"] = {
"Written vernacular Mandarin",
783605,
"cmn",
}
-- FIXME: Temporary. FIXME: How does this differ from "Literary Cantonese"?
m["yue-wvc"] = {
"Written vernacular Cantonese",
nil,
"yue",
}
-- FIXME: Temporary.
m["zhx-tai-wvc"] = {
"Written vernacular Taishanese",
nil,
"zhx-tai",
}
------------- Mandarin varieties -------------
-- FIXME: Temporary. NOTE: The Linguist List assigns the "w:Beijing dialect" (Wikidata 1147606) the code "cmn-bej" and
-- the larger "w:Beijing Mandarin (division of Mandarin)" dialect group (Wikidata 2169652; what we call "Beijingic
-- Mandarin", after Glottolog) the code "cmn-bei".
m["cmn-bei"] = {
"Beijing Mandarin",
1147606,
"cmn-bec",
}
-- FIXME: Temporary.
m["cmn-bec"] = {
"Beijingic Mandarin",
2169652,
"cmn",
}
-- FIXME: Temporary. NOTE: The Linguist List uses the code cmn-zho.
m["cmn-cep"] = {
"Central Plains Mandarin",
3048775,
"cmn",
aliases = {"Zhongyuan Mandarin"},
}
m["cmn-ear"] = {
"Early Mandarin",
837169,
"cmn",
ancestors = "ltc",
}
-- FIXME: Temporary.
m["cmn-gua"] = {
"Guanzhong Mandarin",
3431648,
"cmn-cep",
}
-- FIXME: Temporary. Appears to be a subdialect of Guiliu Mandarin, which in turn is a subdialect of Southwestern Mandarin.
m["cmn-gui"] = {
"Guilin Mandarin",
11111636,
"cmn-sow",
}
m["cmn-jhu"] = {
"Jianghuai Mandarin",
2128953,
"cmn",
aliases = {"Lower Yangtze Mandarin"},
}
-- FIXME: Temporary.
m["cmn-lan"] = {
"Lanyin Mandarin",
662754,
"cmn",
}
-- FIXME: Temporary.
m["cmn-MY"] = {
"Malaysian Mandarin",
13646143,
"cmn",
}
-- FIXME: Temporary.
m["cmn-nan"] = {
"Nanjing Mandarin",
2681098,
"cmn-jhu",
}
-- FIXME: Temporary.
m["cmn-noe"] = {
"Northeastern Mandarin",
1064504,
"cmn",
}
-- FIXME: Temporary.
m["cmn-PH"] = {
"Philippine Mandarin",
7185155,
"cmn",
}
-- FIXME: Temporary.
m["cmn-SG"] = {
"Singapore Mandarin",
1048980,
"cmn",
}
-- FIXME: Temporary.
m["cmn-sow"] = {
"Southwestern Mandarin",
2609239,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Jilu Mandarin.
m["cmn-tia"] = {
"Tianjin Mandarin",
7800220,
"cmn",
}
-- FIXME: Temporary. NOTE: Wikidata also has Q4380827 "Taiwanese Mandarin", defined as "rare dialect of Standard Chinese
-- (Mandarin) used in Taiwan, which is strongly influenced by Taiwanese Hokkien; mostly used by elderlies" and having no
-- English Wikipedia article (but see w:zh:臺灣國語).
m["cmn-TW"] = {
"Taiwanese Mandarin",
262828,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Wu-Tian Mandarin, in turn a subdialect of Southwestern Mandarin.
-- Given the code cmn-xwu in the Linguist List.
m["cmn-wuh"] = {
"Wuhan Mandarin",
11124731,
"cmn-sow",
aliases = {"Wuhanese"},
}
-- FIXME: Temporary. Appears to be a subdialect of Lanyin Mandarin.
m["cmn-xin"] = {
"Xining Mandarin",
nil,
"cmn-lan",
}
-- FIXME: Temporary.
m["cmn-yan"] = {
"Yangzhou Mandarin",
nil,
"cmn-jhu",
}
------------- Cantonese varieties -------------
-- FIXME: Temporary.
m["yue-gua"] = {
"Guangzhou Cantonese",
nil,
"yue",
}
-- FIXME: Temporary. Given the codes yue-yue or yue-can in the Linguist List.
m["yue-HK"] = {
"Hong Kong Cantonese",
5894342,
"yue",
}
-- FIXME: Temporary. FIXME: How does this differ from "Written vernacular Cantonese"?
m["yue-lit"] = {
"Literary Cantonese",
2472605,
"yue",
}
------------- Wu varieties -------------
m["wuu-han"] = {
"Hangzhounese",
5648144,
"wuu",
}
m["wuu-nin"] = {
"Ningbonese",
3972199,
"wuu",
}
-- FIXME: Temporary.
m["wuu-nor"] = {
"Northern Wu",
7675988,
"wuu",
aliases = {"Taihu Wu"},
}
-- FIXME: Temporary? Subvariety of Taihu Wu. NOTE: "chm" stands for Chongming, the main dialect, to avoid a conflict
-- with Shanghainese.
m["wuu-chm"] = {
"Shadi Wu",
6112340,
"wuu-nor",
}
m["wuu-sha"] = {
"Shanghainese",
36718,
"wuu-nor",
}
m["wuu-suz"] = {
"Suzhounese",
831744,
"wuu-nor",
}
-- FIXME: Temporary. May be converted into a full language and/or split.
m["wuu-wen"] = {
"Wenzhounese",
710218,
"wuu",
}
------------- Xiang varieties -------------
m["hsn-lou"] = {
"Loudi Xiang",
10943823,
"hsn-old",
}
m["hsn-hya"] = {
"Hengyang Xiang",
20689035,
"hsn-hzh",
}
m["hsn-hzh"] = {
"Hengzhou Xiang",
nil,
"hsn",
}
m["hsn-new"] = {
"New Xiang",
7012696,
"hsn",
aliases = {"Chang-Yi"},
}
m["hsn-old"] = {
"Old Xiang",
7085453,
"hsn",
aliases = {"Lou-Shao"},
}
------------- Hakka varieties -------------
-- FIXME: Temporary.
m["hak-dab"] = {
"Dabu Hakka",
19855566,
"hak", -- formerly hak-TW but seems to be spoken primarily in Dabu County in Guangdong
}
-- FIXME: Temporary.
m["hak-eam"] = {
"Early Modern Hakka",
nil,
"hak",
}
-- FIXME: Temporary.
m["hak-hai"] = {
"Hailu Hakka",
17038519,
"hak", -- often considered a Taiwanese lect but also spoken in [[Shanwei]], [[Guangdong]]
}
-- FIXME: Temporary.
m["hak-HK"] = {
"Hong Kong Hakka",
2675834,
"hak",
}
-- FIXME: Temporary.
m["hak-hui"] = {
"Huiyang Hakka",
16873881,
"hak",
}
-- FIXME: Temporary.
m["hak-hui-MY"] = {
"Malaysian Huiyang Hakka",
nil,
"hak-hui",
}
-- FIXME: Temporary. Similar to and possibly the parent of Sixian Hakka in Taiwan.
m["hak-mei"] = {
"Meixian Hakka",
839295,
"hak",
aliases = {"Moiyan Hakka", "Meizhou Hakka"},
}
-- FIXME: Temporary.
m["hak-six"] = {
"Sixian Hakka",
9668261,
"hak-TW",
}
-- FIXME: Temporary.
m["hak-TW"] = {
"Taiwanese Hakka",
2391532,
"hak",
}
-- FIXME: Temporary.
m["hak-zha"] = {
"Zhao'an Hakka",
6703311,
"hak",
aliases = {"Zhangzhou Hakka"},
}
------------- Southern Min varieties -------------
m["nan-anx"] = {
"Anxi Hokkien",
97064149,
"nan-qua",
}
m["nan-cha"] = {
"Changtai Hokkien",
nil,
"nan-zha",
}
m["nan-hou"] = {
"Houlu Min",
19855492,
"nan-dat",
}
m["nan-hui"] = {
"Hui'an Hokkien",
16241797,
"nan-qua",
}
m["nan-jin"] = {
"Jinjiang Hokkien",
11089375,
"nan-qua",
}
m["nan-kin"] = {
"Kinmenese Hokkien",
56278342,
"nan-xia",
aliases = {"Kinmen Hokkien"},
}
m["nan-med"] = {
"Medan Hokkien",
6805114,
"nan-zha",
}
m["nan-pen"] = {
"Penang Hokkien",
11120689,
"nan-zha",
}
m["nan-hbl-PH"] = {
"Philippine Hokkien",
3236692,
"nan-qua",
}
m["nan-qia"] = {
"Qianlu Min",
19842517,
"nan-dat",
}
m["nan-qua"] = {
"Quanzhou Hokkien",
2251677,
"nan-hbl",
aliases = {"Chinchew", "Choanchew"},
}
-- FIXME: Temporary? Derived from both Quanzhou and Zhangzhou Hokkien.
m["nan-hbl-SG"] = {
"Singapore Hokkien",
3846528,
"nan-hbl",
}
m["nan-spm"] = {
"Southern Malaysian Hokkien",
7570322,
"nan-qua",
aliases = {"Southern Malaysia Hokkien", "Southern Peninsular Malaysian Hokkien", "Southern Peninsular Malaysia Hokkien"}
}
m["nan-hbl-TW"] = {
"Taiwanese Hokkien",
36778,
"nan-hbl",
}
m["nan-ton"] = {
"Tong'an Hokkien",
nil,
"nan-xia",
}
m["nan-xia"] = {
"Xiamen Hokkien",
68744,
"nan-hbl",
aliases = {"Amoy", "Amoyese", "Amoynese", "Xiamenese"},
}
m["nan-yon"] = {
"Yongchun Hokkien",
65118728,
"nan-qua",
}
m["nan-zha"] = {
"Zhangzhou Hokkien",
8070492,
"nan-hbl",
aliases = {"Changchew", "Chiangchew", "Changchow"},
}
-- NOTE(review): the Wikidata ID below (65118728) is identical to the one on nan-yon (Yongchun Hokkien); one of the
-- two entries presumably carries the wrong ID -- verify against Wikidata before relying on it.
m["nan-zho"] = {
"Zhao'an Hokkien",
65118728,
"nan-zha",
aliases = {"Zhao'an", "Chawan", "Chawan Hokkien"},
}
m["nan-zhp"] = {
"Zhangping Hokkien",
15937822,
"nan-zha",
}
------------- Other Min varieties -------------
-- FIXME: Temporary. Affiliation within Min uncertain; some combination of Eastern and Southern.
m["zhx-zho"] = {
"Zhongshan Min",
8070958,
"zh",
}
------------- Other Chinese varieties -------------
-- FIXME: Temporary. Affiliation within Chinese uncertain; possibly Yue.
m["zhx-dan"] = {
"Danzhou Chinese",
2578935,
"zh",
}
------------- Chinese romanization varieties -------------
-- [[Wiktionary:Information desk/2022/June#Etymology Coding Issue]]
-- [[Wiktionary:Grease pit/2022/June#Transliteration Systems in Etymologies 2]]
m["cmn-pinyin"] = {
"Hanyu Pinyin",
42222,
"cmn",
aliases = {"Pinyin"},
}
m["cmn-tongyong"] = {
"Tongyong Pinyin",
700739,
"cmn",
}
m["cmn-wadegiles"] = {
"Wade–Giles",
208442,
"cmn",
aliases = {"Wade-Giles", "Wade Giles"},
}
m["zh-postal"] = {
"Postal Romanization",
151868,
"zh",
}
-- Chinese cyrillization
m["cmn-palladius"] = {
"Palladius",
1234239,
"cmn",
aliases = {"Palladius system"},
}
-----------------------------------------------------
-- Tibetic varieties --
-----------------------------------------------------
m["adx"] = {
"Amdo Tibetan",
56509,
"bo",
}
m["kbg"] = {
"Khamba",
12952626,
"bo",
}
m["khg"] = {
"Khams Tibetan",
56601,
"bo",
}
m["tsk"] = {
"Tseku",
11159532,
"bo",
}
----------------------------------------------------------------------------------------------------------------------
-- Tai-Kadai varieties --
----------------------------------------------------------------------------------------------------------------------
m["th-old"] = {
"Old Thai",
nil,
"tai-swe-pro",
wikipedia_article = "Thai language#Old Thai",
}
m["th-suk"] = {
"Sukhothai Old Thai", -- 1238-1438. Cannot use "Sukhothai Thai" as Sukhothai is the current city and "Sukhothai Thai" is a lect.
nil,
"th-old",
aliases = {"Sukhothai Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
m["th-ayu"] = {
"Ayutthaya Old Thai", -- 1351-1767. Cannot use "Ayutthaya Thai" as Ayutthaya is the current city.
nil,
"th-old",
aliases = {"Ayutthaya Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
--[[
m["th-new"] = {
"Hacked Thai", -- temporary for testing new translit/display methods
nil,
"th",
translit = "User:Benwing2/th-scraping-translit",
display_text = "User:Benwing2/th-scraping-translit",
strip_diacritics = "User:Benwing2/th-scraping-translit",
preprocess_links = "User:Benwing2/th-scraping-translit",
}
]]
m["tai-shz"] = {
"Shangsi Zhuang",
13216,
"za",
}
----------------------------------------------------------------------------------------------------------------------
-- Turkic varieties --
----------------------------------------------------------------------------------------------------------------------
m["trk-cmn-pro"] = {
"Proto-Common Turkic",
1126028,
"trk-pro",
}
m["trk-ogr-pro"] = {
"Proto-Oghur",
1422731,
"trk-pro",
family = "trk-ogr",
}
m["trk-bul-pro"] = {
"Proto-Bulgar",
nil,
"trk-ogr-pro",
}
m["trk-ogz-pro"] = {
"Proto-Oghuz",
494600,
"trk-pro",
family = "trk-ogz",
aliases = {"Southwestern Common Turkic"},
}
m["crh-dbj"] = {
"Dobrujan Tatar",
12811566,
"crh",
aliases = {"Romanian Tatar"},
}
m["cv-ana"] = {
"Anatri Chuvash",
nil,
"cv",
aliases = {"Anatri", "Lower Chuvash"},
}
m["cv-mid"] = {
"Middle Chuvash",
nil,
"cv",
ancestors = "cv-old",
}
m["cv-old"] = {
"Old Chuvash",
nil,
"cv",
ancestors = "xbo-vol",
}
m["cv-vir"] = {
"Viryal Chuvash",
4278332,
"cv",
aliases = {"Viryal", "Upper Chuvash"},
}
m["kjh-fyu"] = {
"Fuyu Kyrgyz",
2598963,
"kjh",
aliases = {"Fuyu Kirgiz", "Fuyu Kirghiz", "Manchurian Kyrgyz", "Manchurian Kirgiz", "Manchurian Kirghiz"},
}
m["klj-arg"] = {
"Arghu",
33455,
"klj",
ancestors = "trk-cmn-pro",
}
m["otk-kir"] = {
"Old Kirghiz",
83142,
"otk",
aliases = {"Yenisei Turkic", "Yenisei Kyrgyz"},
}
m["otk-ork"] = {
"Orkhon Turkic",
31295480,
"otk",
}
m["qwm-cum"] = {
"Cuman",
1075050,
"qwm",
aliases = {"Kuman", "Polovtsian", "Polovcian"},
}
m["qwm-arm"] = {
"Armeno-Kipchak",
2027503,
"qwm",
ancestors = "qwm-cum",
aliases = {"Xıpçaχ tili", "Tatarça"},
}
m["qwm-mam"] = {
"Mamluk-Kipchak",
4279942,
"qwm",
aliases = {"Mameluk-Kipchak"},
}
m["az-cls"] = {
"Classical Azerbaijani",
nil,
"az",
aliases = {"Classical Azeri"},
}
m["qxq"] = {
"Qashqai",
13192,
"az",
aliases = {"Qaşqay", "Qashqayi", "Kashkai", "Kashkay"},
}
m["tr-CY"] = {
"Cypriot Turkish",
7917392,
"tr",
}
m["uz-afg"] = {
-- NOTE: has ISO 639-3 code uzs assigned to it.
"Afghan Uzbek",
1066787,
"uz",
aliases = {"Southern Uzbek"},
translit = "uz-afg-translit",
}
m["xbo-dan"] = {
"Danube Bulgar",
nil,
"xbo",
}
m["xbo-vol"] = {
"Volga Bulgar",
nil,
"xbo",
}
----------------------------------------------------------------------------------------------------------------------
-- Uralic varieties --
----------------------------------------------------------------------------------------------------------------------
m["fiu-pro"] = {
"Proto-Finno-Ugric",
79890,
"urj-pro",
}
m["urj-fpr-pro"] = {
"Proto-Finno-Permic",
nil,
"urj-pro",
}
m["krl-nor"] = {
"North Karelian",
125501196,
"krl",
}
m["krl-sou"] = {
"South Karelian",
129812730,
"krl",
}
m["mns-eas"] = {
"Eastern Mansi",
30311755,
"mns-cen",
}
m["mns-wes"] = {
"Western Mansi",
30311756,
"mns-cen",
}
----------------------------------------------------------------------------------------------------------------------
-- Yeniseian varieties --
----------------------------------------------------------------------------------------------------------------------
m["qfa-yke-pro"] = {
"Proto-Ketic",
nil,
"qfa-yen-pro",
family = "qfa-yke",
}
m["qfa-yko-pro"] = {
"Proto-Kottic",
nil,
"qfa-yen-pro",
family = "qfa-yko",
}
m["qfa-yrn-pro"] = {
"Proto-Arinic",
nil,
"qfa-yen-pro",
family = "qfa-yrn",
}
m["qfa-ypm-pro"] = {
"Proto-Pumpokolic",
nil,
"qfa-yen-pro",
family = "qfa-ypm",
}
----------------------------------------------------------------------------------------------------------------------
-- Miscellaneous varieties --
----------------------------------------------------------------------------------------------------------------------
m["mul-tax"] = {
"taxonomic name",
522190,
"mul",
}
-----------------------------------------------------
-- Elamite varieties --
-----------------------------------------------------
m["elx-old"] = {
"Old Elamite",
nil,
"elx",
}
m["elx-mid"] = {
"Middle Elamite",
nil,
"elx",
}
m["elx-neo"] = {
"Neo-Elamite",
nil,
"elx",
}
m["elx-ach"] = {
"Achaemenid Elamite",
nil,
"elx",
}
-----------------------------------------------------
-- Substrates --
-----------------------------------------------------
-- Pre-Roman substrates
m["qsb-ibe"] = {
"Paleo-Hispanic",
246801,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Hispanic", "Paleohispanic", "Palaeohispanic", "Paleo-Iberian", "Palaeo-Iberian"},
}
m["qsb-bal"] = {
"Paleo-Balkan",
1815070,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Balkan", "Paleobalkan", "Palaeobalkan"},
}
m["xaq"] = {
"Aquitanian",
500522,
"euq-pro",
family = "euq",
}
-- Hand the completed table `m` to finalizeData from Module:languages and return its result as this module's value.
-- NOTE(review): the meaning of the "language" and `true` arguments is defined in Module:languages, not here -- confirm
-- there before changing them.
return require("Module:languages").finalizeData(m, "language", true)
m0kf8si8j2kroiptllxmke9gy47tv4l
234829
234828
2026-05-24T08:11:04Z
Lee
19
[[:en:Module:etymology_languages/data]] වෙතින් එක් සංශෝධනයක්
234828
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy wrapper around the `char` function of Module:string utilities. The module is only required on the first call,
-- since the data may never need it; at that point the local `u` is rebound to the real function, so later calls go
-- straight to it without passing through this wrapper again.
local function u(...)
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
----------------------------------------------------------------------------------------------------------------------
-- Afroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Berber varieties --
--------------------------------------------------------------------------------------
m["shi-med"] = {
"Medieval Tashelhit",
34152,
"shi",
}
-- Tuareg lects
m["thv"] = {
"Tamahaq",
56703,
"tmh",
}
m["ttq"] = {
"Tawellemmet",
56390,
"tmh",
}
m["taq"] = {
"Tamasheq",
4670066,
"tmh",
}
m["thz"] = {
"Tayert",
56388,
"tmh",
}
m["thv-ght"] = {
"Ghat",
47012900,
"thv",
}
--------------------------------------------------------------------------------------
-- Cushitic varieties --
--------------------------------------------------------------------------------------
-- Oromo varieties
m["hae"] = {
"Harar Oromo",
5330355,
"om",
aliases = {"Eastern Oromo"},
}
m["gax"] = {
"Borana",
2910610,
"om",
aliases = {"Southern Oromo"},
}
m["orc"] = {
"Orma",
2919128,
"om",
}
m["ssn"] = {
"Waata",
3501553,
"om",
}
--------------------------------------------------------------------------------------
-- Egyptian varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Ancient Egyptian varieties --
-----------------------------------------------------
m["egy-old"] = {
"Old Egyptian",
447117,
"egy",
}
m["egy-mid"] = {
"Middle Egyptian",
657330,
"egy",
aliases = {"Classical Egyptian"},
}
m["egy-nmi"] = {
"Neo-Middle Egyptian",
123735278,
"egy",
aliases = {"Égyptien de tradition", "Traditional Egyptian"},
}
m["egy-lat"] = {
"Late Egyptian",
1852329,
"egy",
}
-----------------------------------------------------
-- Coptic varieties --
-----------------------------------------------------
m["cop-akh"] = {
"Akhmimic Coptic",
125176464,
"cop",
aliases = {"Akhmimic"},
}
m["cop-boh"] = {
"Bohairic Coptic",
890733,
"cop",
aliases = {"Bohairic", "Memphitic Coptic", "Memphitic"},
}
m["cop-ggg"] = {
"Coptic Dialect G",
nil,
"cop",
aliases = {"Dialect G", "Mansuric Coptic", "Mansuric"},
}
m["cop-jjj"] = {
"Coptic Dialect J",
nil,
"cop",
}
m["cop-kkk"] = {
"Coptic Dialect K",
nil,
"cop",
}
m["cop-ppp"] = {
"Coptic Dialect P",
nil,
"cop",
aliases = {"Proto-Theban Coptic", "Palaeo-Theban Coptic"},
}
m["cop-fay"] = {
"Fayyumic Coptic",
1399115,
"cop",
aliases = {"Fayyumic", "Faiyumic Coptic", "Faiyumic", "Fayumic Coptic", "Fayumic",
"Bashmuric Coptic", "Bashmuric"},
}
m["cop-her"] = {
"Hermopolitan Coptic",
nil,
"cop",
aliases = {"Hermopolitan", "Coptic Dialect H", "Ashmuninic", "Ashmuninic Coptic"},
}
m["cop-lyc"] = {
"Lycopolitan Coptic",
nil,
"cop",
aliases = {
"Lycopolitan",
"Assiutic Coptic", "Asyutic Coptic", "Assiutic", "Asyutic",
"Lyco-Diospolitan Coptic", "Lyco-Diospolitan",
"Subakhmimic Coptic", "Subakhmimic"
},
}
m["cop-old"] = {
"Old Coptic",
115518040,
"cop",
}
m["cop-oxy"] = {
"Oxyrhynchite Coptic",
nil,
"cop",
aliases = {"Oxyrhynchite", "Mesokemic Coptic", "Mesokemic", "Middle Egyptian Coptic"},
}
m["cop-ply"] = {
"Proto-Lycopolitan Coptic",
nil,
"cop",
aliases = {"Coptic Dialect i", "Proto-Lyco-Diospolitan Coptic"},
}
m["cop-sah"] = {
"Sahidic Coptic",
2645851,
"cop",
aliases = {"Sahidic", "Saidic Coptic", "Saidic", "Thebaic Coptic", "Thebaic"},
}
--------------------------------------------------------------------------------------
-- Semitic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akkadian varieties --
-----------------------------------------------------
m["akk-old"] = {
"Old Akkadian",
nil,
"akk",
}
m["akk-obb"] = {
"Old Babylonian",
nil,
"akk",
}
m["akk-oas"] = {
"Old Assyrian",
nil,
"akk",
}
m["akk-mbb"] = {
"Middle Babylonian",
nil,
"akk",
}
m["akk-mas"] = {
"Middle Assyrian",
nil,
"akk",
}
m["akk-nbb"] = {
"Neo-Babylonian",
nil,
"akk",
}
m["akk-nas"] = {
"Neo-Assyrian",
nil,
"akk",
}
m["akk-lbb"] = {
"Late Babylonian",
nil,
"akk",
}
m["akk-stb"] = {
"Standard Babylonian",
nil,
"akk",
}
-----------------------------------------------------
-- Arabic varieties --
-----------------------------------------------------
m["jrb"] = {
"Judeo-Arabic",
37733,
"ar",
pseudo_families = "qfa-jew",
}
m["apc-leb"] = {
"Lebanese North Levantine Arabic",
1516642,
"apc",
aliases = {"Lebanese Arabic"},
}
m["apc-sle"] = {
"South Lebanese North Levantine Arabic",
14206590,
"apc",
aliases = {"South Lebanese Arabic"},
}
m["apc-nle"] = {
"North Lebanese North Levantine Arabic",
nil,
"apc",
aliases = {"North Lebanese Arabic"},
}
m["apc-syr"] = {
"Syrian North Levantine Arabic",
2143071,
"apc",
aliases = {"Syrian Arabic"},
}
m["apc-ale"] = {
"Aleppine North Levantine Arabic",
7056921,
"apc-syr",
aliases = {"Aleppo Arabic", "Aleppine Arabic"},
}
m["apc-dam"] = {
"Damascene North Levantine Arabic",
12237466,
"apc-syr",
aliases = {"Damascus Arabic", "Damascene Arabic"},
}
m["acm-khu"] = {
"Khuzestani Arabic",
1040944,
"acm",
}
-----------------------------------------------------
-- Aramaic varieties --
-----------------------------------------------------
m["arc-bib"] = {
"Biblical Aramaic",
843235,
"arc",
family = "sem-are",
}
m["arc-cpa"] = {
"Christian Palestinian Aramaic",
60790119,
"arc",
family = "sem-arw",
aliases = {"Melkite Aramaic", "Palestinian Syriac", "Syropalestinian Aramaic"},
}
m["arc-imp"] = {
"Imperial Aramaic",
7079491,
"arc",
aliases = {"Official Aramaic"},
}
m["arc-hat"] = {
"Hatran Aramaic",
3832926,
"arc",
family = "sem-are",
}
m["arc-jla"] = {
"Jewish Literary Aramaic",
105952842,
"arc",
pseudo_families = "qfa-jew",
}
m["arc-nab"] = {
"Nabataean Aramaic",
36178,
"arc",
}
m["arc-old"] = {
"Old Aramaic",
3398392,
"arc",
}
m["arc-pal"] = {
"Palmyrene Aramaic",
1510113,
"arc",
family = "sem-arw",
}
m["tmr"] = {
"Jewish Babylonian Aramaic",
33407,
"arc",
family = "sem-ase",
pseudo_families = "qfa-jew",
}
m["jpa"] = {
"Jewish Palestinian Aramaic",
948909,
"arc",
family = "sem-arw",
aliases = {"Galilean Aramaic"},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Hebrew varieties --
-----------------------------------------------------
m["hbo"] = {
"Biblical Hebrew",
1982248,
"he",
aliases = {"Classical Hebrew"},
}
m["he-mis"] = {
"Mishnaic Hebrew",
1649362,
"he",
ancestors = "hbo",
}
m["he-med"] = {
"Medieval Hebrew",
2712572,
"he",
ancestors = "he-mis",
}
m["he-IL"] = {
"Israeli Hebrew",
8141,
"he",
}
----------------------------------------------------------------------------------------------------------------------
-- Ainu varieties --
----------------------------------------------------------------------------------------------------------------------
m["ain-hok"] = {
"Hokkaido Ainu",
20968488,
"ain",
aliases = {"Hokkaidō Ainu"},
}
m["ain-kur"] = {
"Kuril Ainu",
20967012,
"ain",
}
m["ain-sak"] = {
"Sakhalin Ainu",
20747371,
"ain",
}
----------------------------------------------------------------------------------------------------------------------
-- American indigenous varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Inuit varieties --
-----------------------------------------------------
-- The two Alaskan Inupiatun records; both use "ik" as their third positional field.
-- Trailing commas added after the last field to match the other records in this file.
m["esi"] = {
"North Alaskan Inupiatun",
nil,
"ik",
}
m["esk"] = {
"Northwest Alaskan Inupiatun",
25559714,
"ik",
}
-----------------------------------------------------
-- Iroquoian varieties --
-----------------------------------------------------
m["iro-ohu"] = {
"Old Wendat",
nil,
"wdt",
}
m["iro-omo"] = {
"Old Mohawk",
nil,
"moh",
}
m["iro-oon"] = {
"Old Onondaga",
nil,
"ono",
}
-----------------------------------------------------
-- Tupi-Guarani varieties --
-----------------------------------------------------
-- Old Tupi varieties
m["tpw-lga"] = {
"Língua Geral Amazônica",
18275323,
"tpw",
aliases = {"Língua Geral"},
}
m["tpw-lgp"] = {
"Língua Geral Paulista",
2669239,
"tpw",
}
----------------------------------------------------------------------------------------------------------------------
-- Austroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Khmer varieties
m["okz-ang"] = {
"Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
m["okz-pre"] = {
"Pre-Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
-- Central Nicobarese varieties
m["ncb-cam"] = {
"Camorta",
5026908,
"ncb",
aliases = {"Kamorta"},
}
m["ncb-kat"] = {
"Katchal",
17064263,
"ncb",
aliases = {"Tehnu"},
}
m["ncb-nan"] = {
"Nancowry",
6962504,
"ncb",
aliases = {"Nankwari"},
}
----------------------------------------------------------------------------------------------------------------------
-- Austronesian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Malay and related varieties
m["ms-old"] = { -- this has the ISO code 'omy'
"Old Malay",
nil,
"ms",
}
m["ms-cla"] = {
"Classical Malay",
nil,
"ms",
ancestors = "ms-old",
}
m["pse-bsm"] = {
"Besemah",
nil,
"pse",
}
m["bew-kot"] = {
"Betawi Kota",
nil,
"bew",
aliases = {"Urban Betawi"}, -- in Jakarta
}
-- Philippine varieties
m["xnn"] = {
"Northern Kankanaey",
12953609,
"kne",
aliases = {"Northern Kankanay", "Northern Kankana-ey"},
}
m["tl-old"] = {
"Old Tagalog",
12967437,
"tl",
}
m["tl-cls"] = {
"Classical Tagalog",
nil,
"tl",
}
----------------------------------------------------------------------------------------------------------------------
-- Caucasian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Kartvelian varieties
m["ka-mid"] = {
"Middle Georgian",
nil,
"ka",
ancestors = "oge",
}
----------------------------------------------------------------------------------------------------------------------
-- Dravidian varieties --
----------------------------------------------------------------------------------------------------------------------
m["ta-mid"] = {
"Middle Tamil",
20987434,
"ta",
}
m["kn-hav"] = {
"Havigannada",
24276369,
"kn",
}
m["kn-kun"] = {
"Kundagannada",
6444255,
"kn",
}
----------------------------------------------------------------------------------------------------------------------
-- Indo-European varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Albanian varieties --
--------------------------------------------------------------------------------------
m["aln"] = {
"Gheg Albanian",
181037,
"sq",
aliases = {"Gheg"},
}
m["aae"] = {
"Arbëresh Albanian",
1075302,
"als",
aliases = {"Arbëreshë", "Arbëresh"},
}
m["aat"] = {
"Arvanitika Albanian",
29347,
"als",
aliases = {"Arvanitika"},
}
m["als"] = {
"Tosk Albanian",
180937,
"sq",
aliases = {"Tosk"},
}
--------------------------------------------------------------------------------------
-- Armenian varieties --
--------------------------------------------------------------------------------------
m["hyw"] = {
"Western Armenian",
180945,
"hy",
}
m["hye"] = {
"Eastern Armenian",
181059,
"hy",
}
--------------------------------------------------------------------------------------
-- Balto-Slavic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Baltic varieties --
-------------------------------------------------------------------------
m["bat-pro"] = {
"Proto-Baltic",
1703347,
"ine-bsl-pro",
}
m["bat-dni"] = {
"Dnieper Baltic",
4163178,
"bat-pro",
family = "bat",
aliases = {"Dniepr Baltic", "Dnieper-Oka Baltic", "Dniepr-Oka Baltic"},
}
m["bat-gol"] = {
"Golyad",
4142855,
"bat-dni",
aliases = {"Eastern Galindian", "East Galindian"},
}
-------------------------------------------------------------------------
-- Slavic varieties --
-------------------------------------------------------------------------
-----------------------------------------------------
-- Bulgarian varieties --
-----------------------------------------------------
-- Middle Bulgarian: "cu" appears both as the third positional field and as
-- `ancestors`. Trailing comma added after the last field for consistency with
-- the other records in this file.
m["cu-bgm"] = {
"Middle Bulgarian",
12294897,
"cu",
ancestors = "cu",
}
-----------------------------------------------------
-- Church Slavonic varieties --
-----------------------------------------------------
-- Old Moscow Church Slavonic deleted as it seems not distinct enough from Russian (Synodal) Church Slavonic.
m["zls-chs-ru"] = {
"Russian Church Slavonic",
21662400,
"zls-chs",
aliases = {"Synodal Church Slavonic", "New Moscow Church Slavonic", "Novomoskovsk Church Slavonic"},
}
m["zls-chs-uk"] = {
"Ukrainian Church Slavonic",
12153548,
"zls-chs",
aliases = {"Rusyn Church Slavonic", "Belarusian Church Slavonic"},
}
--[=[
-- Not sure about these yet.
m["zls-chs-bg"] = {
"Bulgarian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-cs"] = {
"Czech Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-hr"] = {
"Croatian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-mk"] = {
"Macedonian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-ro"] = {
"Romanian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-sr"] = {
"Serbian Church Slavonic",
nil,
"zls-chs",
}
]=]
-----------------------------------------------------
-- Czech varieties --
-----------------------------------------------------
-- Early Modern Czech: no number recorded (second field is nil); `ancestors`
-- points at "zlw-ocs". Trailing comma added after the last field for
-- consistency with the other records in this file.
m["cs-ear"] = {
"Early Modern Czech",
nil,
"cs",
ancestors = "zlw-ocs",
}
-----------------------------------------------------
-- East Slavic varieties --
-----------------------------------------------------
m["zle-ops"] = {
"Old Pskovian",
4167885,
"zle-ono",
}
-- Middle Russian. One of the few records here with a fourth positional field
-- ("Cyrs") plus its own transliteration and diacritic-stripping settings.
m["zle-mru"] = {
"Middle Russian",
35228,
"ru",
"Cyrs",
ancestors = "orv",
translit = "ru-translit",
-- Keyed by the same "Cyrs" value given as the fourth positional field above.
strip_diacritics = {
Cyrs = {
-- Concatenation of c.grave, c.acute and c.diaer. `c` is defined outside this
-- chunk; presumably it holds combining-character strings -- TODO confirm.
remove_diacritics = c.grave .. c.acute .. c.diaer,
},
},
}
m["zle-mbe"] = {
"Middle Belarusian",
13211,
"zle-ort",
}
m["zle-muk"] = {
"Middle Ukrainian",
13211,
"zle-ort",
}
m["uk-CA"] = {
"Canadian Ukrainian",
4161010,
"uk",
}
-----------------------------------------------------
-- Polish varieties --
-----------------------------------------------------
-- Middle Polish, with `ancestors` set to "zlw-opl" and its own
-- diacritic-stripping rule.
m["zlw-mpl"] = {
"Middle Polish",
402878,
"pl",
ancestors = "zlw-opl",
-- Unlike the zle-mru record, this rule table is not nested under a script key.
strip_diacritics = {
remove_diacritics = c.acute,
-- Lists the acute-accented letters C, N, O, S, Z in both cases; presumably
-- these are left intact while other acutes are removed -- confirm against the
-- code that consumes strip_diacritics.
remove_exceptions = {"Ć", "ć", "Ń", "ń", "Ó", "ó", "Ś", "ś", "Ź", "ź"},
},
}
m["pl-gre"] = {
"Greater Polish",
4106789,
"pl",
}
m["pl-les"] = {
"Lesser Polish",
361709,
"pl",
}
m["pl-mas"] = {
"Masovian Polish",
4274559,
"pl",
}
m["pl-gor"] = {
"Goral",
452889,
"pl",
}
-----------------------------------------------------
-- Serbo-Croatian varieties --
-----------------------------------------------------
m["ckm"] = {
"Chakavian Serbo-Croatian",
337565,
"sh",
aliases = {"Čakavian"},
}
m["kjv"] = {
"Kajkavian Serbo-Croatian",
838165,
"sh",
}
m["sh-tor"] = { -- Linguist code srp-tor
"Torlakian Serbo-Croatian",
1078803,
"sh",
aliases = {"Torlak"},
}
--------------------------------------------------------------------------------------
-- Celtic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Brythonic varieties --
-----------------------------------------------------
m["bry-ear"] = {
"Early Brythonic",
nil,
"cel-bry-pro",
}
m["bry-lat"] = {
"Late Brythonic",
nil,
"cel-bry-pro",
}
-----------------------------------------------------
-- Gaulish varieties --
-----------------------------------------------------
m["xcg"] = {
"Cisalpine Gaulish",
3832927,
"cel-gau",
}
m["xtg"] = {
"Transalpine Gaulish",
29977,
"cel-gau",
}
-----------------------------------------------------
-- Welsh varieties --
-----------------------------------------------------
m["cy-nor"] = {
"North Wales Welsh",
13127692,
"cy",
aliases = {"North Walian Welsh", "Northern Welsh"},
}
m["cy-sou"] = {
"South Wales Welsh",
13127689,
"cy",
aliases = {"South Walian Welsh", "Southern Welsh"},
}
--------------------------------------------------------------------------------------
-- Germanic varieties --
--------------------------------------------------------------------------------------
-- Proto-West Germanic varieties
m["frk"] = {
"Frankish",
10860505,
"gmw-pro",
family = "gmw-frk",
aliases = {"Old Frankish"},
}
m["gem-sue"] = {
"Suevic",
134600275,
"gmw-pro",
aliases = {"Suebian"},
}
m["gmw-afr-pro"] = {
"Proto-Anglo-Frisian",
134603379,
"gmw-nsg-pro",
family = "gmw-afr",
}
m["gmw-nsg-pro"] = {
"Proto-North Sea Germanic",
134603374,
"gmw-pro",
family = "gmw-nsg",
aliases = {"Proto-Ingvaeonic"},
}
-----------------------------------------------------
-- Dutch varieties --
-----------------------------------------------------
m["nl-BE"] = {
"Belgian Dutch",
34147,
"nl",
aliases = {"Flemish", "Flemish Dutch", "Southern Dutch"},
}
-----------------------------------------------------
-- English and Scots varieties --
-----------------------------------------------------
-- English varieties
m["en-AU"] = {
"Australian English",
44679,
"en",
}
m["en-GB"] = {
"British English",
7979,
"en",
}
-- Scottish and Welsh English, both listed under "en-GB".
m["en-GB-SCT"] = {
"Scottish English",
44676, -- NOTE(review): same number as en-GB-WLS and en-CA; confirm which entry it really belongs to
"en-GB",
}
m["en-GB-WLS"] = {
"Welsh English",
44676, -- NOTE(review): same number as en-GB-SCT and en-CA; confirm which entry it really belongs to
"en-GB",
}
m["en-IM"] = {
"Manx English",
6753295,
"en-GB",
}
m["en-aae"] = {
"Australian Aboriginal English",
783347,
"en-AU",
}
m["en-ear"] = {
"Early Modern English",
1472196,
"en",
ancestors = "enm",
aliases = {"Early New English"},
}
m["en-geo"] = {
"Geordie",
653421,
"en",
ancestors = "enm-nor",
}
m["en-IE"] = { -- FIXME: "IE" doesn't cover Northern Ireland
"Irish English",
665624,
"en",
}
m["en-uls"] = {
"Ulster English",
6840826,
"en-IE",
}
m["en-GB-NIR"] = {
"Northern Irish English",
6840826, -- actually the code for Ulster English
"en-uls",
}
m["en-NNN"] = { -- NA = Namibia; NNN is NATO 3-letter code for North America
"North American English",
7053766,
"en",
ietf_subtag = "en-021" -- 021 = UN M49 code for "Northern America" (i.e. North America without Central America or the Caribbean)
}
m["en-US"] = {
"American English",
7976,
"en-NNN",
}
-- New Zealand and South African English, both listed directly under "en".
-- Trailing commas added after the last field to match the other records in this file.
m["en-NZ"] = {
"New Zealand English",
44661,
"en",
}
m["en-ZA"] = {
"South African English",
1156228,
"en",
}
m["en-US-CA"] = {
"California English",
1026812,
"en-US",
}
m["en-CA"] = {
"Canadian English",
44676,
-- Listed under North American English (en-NNN), the same node en-US is listed
-- under, instead of being treated as a sub-variety of American English.
"en-NNN",
}
m["en-HK"] = {
"Hong Kong English",
1068863,
"en",
}
m["en-IN"] = {
"Indian English",
1348800,
"en",
}
m["pld"] = {
"Polari",
1359130,
"en",
}
-- Scots varieties
m["sco-ins"] = {
"Insular Scots",
16919205,
"sco",
}
m["sco-uls"] = {
"Ulster Scots",
201966,
"sco",
}
m["sco-nor"] = {
"Northern Scots",
16928150,
"sco",
}
m["sco-sou"] = {
"Southern Scots",
7570457,
"sco",
aliases = {"South Scots", "Borders Scots"},
}
-- Middle English varieties
m["enm-esc"] = { -- Part of Middle English until it developed into Middle Scots.
"Early Scots",
5326738,
"enm",
ancestors = "enm-nor",
aliases = {"Old Scots", "Scottish Middle English"},
}
m["enm-emi"] = {
"East Midland Middle English",
134238810,
"enm",
ancestors = "ang-ang", -- Technically ang-mer, but attested Mercian is mostly WM IIRC
}
m["enm-ken"] = {
"Kentish Middle English",
134238532,
"enm",
ancestors = "ang-ken",
}
m["enm-nor"] = {
"Northern Middle English",
134238541,
"enm",
ancestors = "ang-nor",
}
m["enm-sou"] = {
"Southern Middle English",
134238528,
"enm",
ancestors = "ang-wsx",
}
m["enm-wmi"] = {
"West Midland Middle English",
134238824,
"enm",
ancestors = "ang-mer",
}
-- Old English varieties
-- Anglian Old English includes both Mercian and Northumbrian.
m["ang-ang"] = {
"Anglian Old English",
121142917,
"ang",
}
m["ang-ken"] = {
"Kentish Old English",
11687485,
"ang",
}
m["ang-mer"] = {
"Mercian Old English",
602072,
"ang-ang",
}
m["ang-nor"] = {
"Northumbrian Old English",
1798915,
"ang-ang",
}
m["ang-wsx"] = {
"West Saxon Old English",
2658603,
"ang",
}
-----------------------------------------------------
-- High German varieties --
-----------------------------------------------------
-- (modern) German varieties
m["de-AT"] = {
"Austrian German",
306626,
"de",
}
m["de-AT-vie"] = {
"Viennese German",
56474,
"de-AT",
}
m["de-CH"] = {
"Switzerland German",
1366643,
"de",
aliases = {"Schweizer Hochdeutsch", "Swiss Standard German", "Swiss High German"},
}
m["de-bal"] = {
"Baltic German",
15785413,
"de",
}
m["de-ear"] = {
"Early New High German",
1472199,
"de",
ancestors = "gmh",
aliases = {"Early Modern High German"},
}
m["ksh"] = {
"Kölsch",
4624,
"gmw-cfr",
}
m["pfl"] = {
"Palatine German",
23014,
"gmw-rfr",
aliases = {"Pfälzisch", "Pälzisch", "Palatinate German"},
}
m["sli"] = {
"Silesian East Central German",
152965,
"gmw-ecg",
aliases = {"Silesian"},
}
m["sxu"] = {
"Upper Saxon German",
699284,
"gmw-ecg",
}
-- Old High German varieties
m["lng"] = {
"Lombardic",
35972,
"goh",
}
-- Alemannic German varieties
m["gsw-low"] = {
"Low Alemannic German",
503724,
"gsw",
}
m["gsw-FR-als"] = {
"Alsatian Alemannic German",
8786,
"gsw-low",
}
m["gsw-hig"] = {
"High Alemannic German",
503728,
"gsw",
}
m["gsw-hst"] = {
"Highest Alemannic German",
687538,
"gsw",
}
m["wae"] = {
"Walser German",
680517,
"gsw-hst",
}
-----------------------------------------------------
-- Low German varieties --
-----------------------------------------------------
m["nds-de"] = {
"German Low German",
25433,
"nds",
ietf_subtag = "nds-DE", -- should we make this the actual code?
wikimedia_codes = "nds",
}
m["nds-nl"] = {
"Dutch Low Saxon",
516137,
"nds",
ietf_subtag = "nds-NL", -- should we make this the actual code?
wikimedia_codes = "nds-nl",
}
m["act"] = {
"Achterhoeks",
153627,
"nds-nl",
aliases = {"Achterhoek", "Achterhooks"},
}
m["drt"] = {
"Drents",
2736709,
"nds-nl",
aliases = {"Drèents", "Dreins", "Dreints", "Drints"},
}
m["frs"] = {
"East Frisian Low German",
149208,
"nds-de",
aliases = {"East Frisian", "East Frisian Low Saxon"},
}
m["gos"] = {
"Gronings",
508854,
"nds-nl",
aliases = {"Grunnegs", "Grönnegs"},
}
m["nds-lpr"] = {
"Low Prussian",
33982,
"nds-de",
}
m["sdz"] = {
"Sallands",
3436668,
"nds-nl",
aliases = {"Sallaans", "Sallaands"},
}
m["stl"] = {
"Stellingwerfs",
506010,
"nds-nl",
aliases = {"Stellingwarfs"},
}
m["twd"] = {
"Twents",
497363,
"nds-nl",
aliases = {"Tweants"},
}
m["vel"] = {
"Veluws",
2484810,
"nds-nl",
}
m["wep"] = {
"Westphalian",
505655,
"nds-de",
aliases = {"Westfalish", "Westphalien"},
}
-----------------------------------------------------
-- North Frisian varieties --
-----------------------------------------------------
m["frr-ins"] = {
"Insular North Frisian",
110629610,
"frr",
}
m["frr-fam"] = {
"Föhr-Amrum North Frisian",
110629601,
"frr-ins",
}
m["frr-foh"] = {
"Föhr North Frisian",
28185,
"frr-fam",
aliases = {"Föhr Frisian", "Fering",
"Ferring", -- Glottolog
},
varieties = {"Aasdring", "Weesdring"},
}
m["frr-amr"] = {
"Amrum North Frisian",
28192,
"frr-fam",
aliases = {"Amrum Frisian", "Amrum", "Öömrang"},
}
m["frr-hel"] = {
"Heligoland North Frisian",
28086,
"frr-ins",
aliases = {"Heligoland Frisian", "Halunder", "Heligolandic Frisian", "Heligolandic North Frisian",
"Helgoland Frisian", "Helgoland North Frisian", "Helgoland"},
}
m["frr-syl"] = {
"Sylt North Frisian",
28181,
"frr-ins",
aliases = {"Sylt Frisian", "Söl'ring",
"Sölreng", -- Glottolog
},
}
m["frr-mai"] = {
"Mainland North Frisian",
110629626,
"frr",
}
m["frr-hal"] = {
"Halligen North Frisian",
28177,
"frr-mai",
aliases = {"Halligen Frisian", "Halifreesk", "Hallingen Frisian", "Hallingen North Frisian",
"Hallingen", -- Glottolog
},
}
m["frr-moo"] = {
"Mooring North Frisian",
28187,
"frr-mai",
aliases = {"Bökingharde North Frisian", "Bökingharde Frisian", "Böökinghiirder frasch",
"Mooring", "Moring",
},
varieties = {{"East Mooring", "Ostermooring"}, {"West Mooring", "Westermooring"}},
}
m["frr-kar"] = {
"Karrharde North Frisian",
28191,
"frr-mai",
aliases = {"Karrharde Frisian", "Karrharder",
},
}
m["frr-goe"] = {
-- Technically this refers to three adjacent dialects (Northern, Central and Southern), the latter of which went
-- extinct in 1980-1981. As a result, Glottolog speaks of "Norder-Mittelgoesharde", referring to the remaining two.
"Goesharde North Frisian",
28183,
"frr-mai",
aliases = {"Norder-Mittelgoesharde North Frisian", "Norder-Mittelgoesharde Frisian", "Norder-Mittelgoesharde",
"Goesharde Frisian", "Goesharde", "Gooshiirder",
},
}
m["frr-wie"] = {
"Wiedingharde North Frisian",
28171,
"frr-mai",
aliases = {"Wiedingharde Frisian", "Wiedingharde", "Wiringhiirder freesk",
},
}
-----------------------------------------------------
-- Old Norse varieties --
-----------------------------------------------------
m["non-grn"] = {
"Greenlandic Norse",
855236,
"non-own",
}
m["non-oen"] = {
"Old East Norse",
10498031,
"non",
ancestors = "non",
}
m["non-own"] = {
"Old West Norse",
2377483,
"non",
ancestors = "non",
}
-----------------------------------------------------
-- Old Swedish varieties --
-----------------------------------------------------
m["gmq-osw-lat"] = {
"Late Old Swedish",
10723594,
"gmq-osw",
ancestors = "gmq-osw",
}
--------------------------------------------------------------------------------------
-- Greek varieties --
--------------------------------------------------------------------------------------
m["qsb-grc"] = {
"Pre-Greek",
965052,
"und",
family = "qfa-sub",
}
m["grc-aeo"] = {
"Aeolic Greek",
406373,
"grc",
aliases = {"Lesbic Greek", "Lesbian Greek", "Aeolian Greek"},
}
m["grc-arc"] = {
"Arcadian Greek",
nil,
"grc-arp",
}
m["grc-arp"] = {
"Arcadocypriot Greek",
499602,
"grc",
}
m["grc-att"] = {
"Attic Greek",
506588,
"grc",
}
m["grc-boi"] = {
"Boeotian Greek",
406373,
"grc-aeo",
}
m["grc-cyp"] = {
"Cypriot Ancient Greek", -- to distinguish from Cypriot Greek below
nil,
"grc-arp",
}
m["grc-dor"] = {
"Doric Greek",
285494,
"grc",
}
m["grc-ela"] = {
"Elean Greek",
nil,
"grc",
}
m["grc-epi"] = {
"Epic Greek",
990062,
"grc",
aliases = {"Homeric Greek"},
}
m["grc-ion"] = {
"Ionic Greek",
504165,
"grc",
}
m["grc-koi"] = {
"Koine Greek",
107358,
"grc",
ancestors = "grc-att",
aliases = {"Hellenistic Greek"},
}
m["grc-kre"] = {
"Cretan Ancient Greek", -- to distinguish from Cretan Greek below
nil,
"grc-dor",
}
m["grc-opl"] = {
"Opuntian Locrian",
nil,
"grc",
}
m["grc-ozl"] = {
"Ozolian Locrian",
nil,
"grc",
}
m["grc-pam"] = {
"Pamphylian Greek",
2271793,
"grc",
}
m["grc-ths"] = {
"Thessalian Greek",
406373,
"grc-aeo",
}
m["gkm"] = {
"Byzantine Greek",
36387,
"grc",
ancestors = "grc-koi",
aliases = {"Medieval Greek"},
}
m["el-cyp"] = {
"Cypriot Greek",
245899,
"el",
aliases = {"Cypriotic Greek"},
}
m["el-pap"] = {
"Paphian Greek",
nil,
"el",
}
m["el-crt"] = {
"Cretan Greek",
588306,
"el",
}
m["el-kth"] = {
"Katharevousa",
35961,
"el",
"Polyt",
ancestors = "gkm",
aliases = {"Katharevousa Greek"},
-- Polyt display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["el-kal"] = {
"Kaliarda",
12878658,
"el",
}
--------------------------------------------------------------------------------------
-- Indo-Iranian varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Indo-Aryan varieties --
-------------------------------------------------------------------------
-- reconstructed intermediate stages
m["pra-pro"] = {
"Proto-New Indo-Aryan",
nil,
"pra",
}
m["inc-ash-pro"] = {
"Proto-Middle Indo-Aryan",
nil,
"inc-ash",
}
m["inc-mit"] = {
"Mitanni",
1986700,
"inc-pro",
}
m["bra-old"] = {
"Old Braj",
nil,
"bra",
}
-- Apabhramsas
m["inc-aav"] = {
"Avahattha",
nil,
"inc-apa",
aliases = {"Abahattha"},
}
m["inc-asa"] = {
"Sauraseni Apabhramsa",
nil,
"inc-apa",
}
m["inc-agu"] = {
"Gurjara Apabhramsa",
nil,
"inc-apa",
}
m["inc-aka"] = {
"Kasmiri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ama"] = {
"Maharastri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ata"] = {
"Takka Apabhramsa",
nil,
"inc-apa",
}
m["inc-avr"] = {
"Vracada Apabhramsa",
nil,
"inc-apa",
}
-- Assamese varieties
m["as-bkm"] = {
"Barpetia Kamrupi Assamese",
30642960,
"as",
}
m["as-nkm"] = {
"Nalbaria Kamrupi Assamese",
85787678,
"as",
}
m["as-pkm"] = {
"Palasbaria Kamrupi Assamese",
nil,
"as",
}
-- Bengali varieties
m["bn-dvn"] = {
"Dhakaiya Vaṅga Bengali",
48726851,
"bn", -- Eastern Bengali variety
}
m["bn-nvn"] = {
"Noakhailla Vaṅga Bengali",
107548681,
"bn", -- Eastern Bengali variety
}
-- Dhivehi varieties
m["dv-old"] = {
"Old Dhivehi",
117790875,
"dv",
}
m["dv-mul"] = {
"Mulaku Dhivehi",
nil,
"dv",
aliases = {"Mulaku Divehi", "Mulaku Bas"},
}
m["dv-huv"] = {
"Huvadhu Dhivehi",
nil,
"dv",
aliases = {"Huvadhu Divehi", "Huvadhu Bas"},
}
m["dv-add"] = {
"Addu Dhivehi",
nil,
"dv",
aliases = {"Addu Divehi", "Addu Bas"},
}
-- Gujarati varieties
m["gu-kat"] = {
"Kathiyawadi",
nil,
"gu",
aliases = {"Kathiyawadi Gujarati", "Kathiawadi"},
}
m["gu-lda"] = {
"Lisan ud-Dawat Gujarati",
nil,
"gu",
aliases = {"Lisan ud-Dawat", "LDA"},
}
-- Hindi varieties
m["hi-mum"] = {
"Bombay Hindi",
3543151,
"hi",
aliases = {"Mumbai Hindi", "Bambaiyya Hindi"},
}
m["hi-mid"] = {
"Middle Hindi",
nil,
"inc-ohi",
ancestors = "inc-ohi",
}
-- Konkani varieties
m["kok-mid"] = {
"Middle Konkani",
nil,
"kok",
aliases = {"Medieval Konkani"},
}
m["kok-old"] = {
"Old Konkani",
nil,
"kok",
aliases = {"Early Konkani"},
}
-- Prakrits
m["pra-ard"] = {
"Ardhamagadhi Prakrit",
35217,
"pra",
aliases = {"Ardhamagadhi"},
}
m["pra-hel"] = {
"Helu Prakrit",
15080869,
"pra",
aliases = {"Elu", "Elu Prakrit", "Helu"},
}
m["pra-kha"] = {
"Khasa Prakrit",
nil,
"pra",
aliases = {"Khasa"},
}
m["pra-mag"] = {
"Magadhi Prakrit", -- Not to be confused with Magahi (mag)
2652214,
"pra",
aliases = {"Magadhi"},
}
m["pra-mah"] = {
"Maharastri Prakrit",
2586773,
"pra",
aliases = {"Maharashtri Prakrit", "Maharastri", "Maharashtri"},
}
-- Paisaci Prakrit: "pra-sau" appears both as the third positional field and as
-- `ancestors`. Trailing comma added after the last field for consistency with
-- the other records in this file.
m["pra-pai"] = {
"Paisaci Prakrit",
2995607,
"pra-sau",
aliases = {"Paisaci", "Paisachi"},
ancestors = "pra-sau",
}
m["pra-sau"] = {
"Sauraseni Prakrit",
2452885,
"pra",
aliases = {"Sauraseni", "Shauraseni"},
}
m["pra-ava"] = {
"Avanti",
nil,
"pra",
aliases = {"Avanti Prakrit"},
}
m["pra-pra"] = {
"Pracya",
nil,
"pra",
aliases = {"Pracya Prakrit"},
}
m["pra-bah"] = {
"Bahliki",
nil,
"pra",
aliases = {"Bahliki Prakrit"},
}
m["pra-dak"] = {
"Daksinatya",
nil,
"pra",
aliases = {"Daksinatya Prakrit"},
}
m["pra-sak"] = {
"Sakari",
nil,
"pra",
aliases = {"Sakari Prakrit"},
}
m["pra-can"] = {
"Candali",
nil,
"pra",
aliases = {"Candali Prakrit"},
}
m["pra-sab"] = {
"Sabari",
nil,
"pra",
aliases = {"Sabari Prakrit"},
}
m["pra-abh"] = {
"Abhiri",
nil,
"pra",
aliases = {"Abhiri Prakrit"},
}
m["pra-dra"] = {
"Dramili",
nil,
"pra",
aliases = {"Dramili Prakrit"},
}
m["pra-odr"] = {
"Odri",
nil,
"pra",
aliases = {"Odri Prakrit"},
}
-- Punjabi varieties
m["pnb"] = {
"Western Punjabi",
58635,
"pa",
"pa-Arab",
}
-- Sanskrit varieties
m["vsn"] = {
"Vedic Sanskrit",
36858,
"sa",
}
m["cls"] = {
"Classical Sanskrit",
9333703,
"sa",
}
m["sa-bhs"] = {
"Buddhist Hybrid Sanskrit",
248758,
"sa",
}
m["sa-bra"] = {
"Brahmanic Sanskrit",
139822891,
"vsn",
}
m["sa-epi"] = {
"Epic Sanskrit",
56702805,
"cls",
}
m["sa-neo"] = {
"New Sanskrit",
nil,
"sa",
}
m["sa-rig"] = {
"Rigvedic Sanskrit",
139822680,
"vsn",
}
-- Sinhalese varieties
m["si-med"] = {
"Medieval Sinhalese",
nil,
"si",
aliases = {"Medieval Sinhala"},
}
-------------------------------------------------------------------------
-- Iranian varieties --
-------------------------------------------------------------------------
m["qsb-bma"] = {
"the BMAC substrate",
133187435,
"und",
family = "qfa-sub",
aliases = {"the Bactria-Margiana substrate", "the Bactria-Margiana Archaeological Complex substrate"},
}
-- Historical and current Iranian dialects
m["ae-old"] = {
"Old Avestan",
29572,
"ae",
aliases = {"Gathic Avestan"},
}
m["ae-yng"] = {
"Younger Avestan",
29572,
"ae-old",
aliases = {"Young Avestan"},
}
m["bcc"] = {
"Southern Balochi",
33049,
"bal",
aliases = {"Southern Baluchi"},
}
m["bgp"] = {
"Eastern Balochi",
33049,
"bal",
aliases = {"Eastern Baluchi"},
}
m["bgn"] = {
"Western Balochi",
33049,
"bal",
aliases = {"Western Baluchi"},
}
m["bsg-ban"] = {
"Bandari",
nil,
"bsg",
}
m["bsg-hor"] = {
"Hormozi",
nil,
"bsg",
}
m["bsg-min"] = {
"Minabi",
nil,
"bsg",
}
m["kho-old"] = {
"Old Khotanese",
nil,
"kho",
}
m["kho-lat"] = {
"Late Khotanese",
nil,
"kho-old",
}
m["peo-ear"] = {
"Early Old Persian",
nil,
"peo",
}
m["peo-lat"] = {
"Late Old Persian",
nil,
"peo",
}
m["pal-ear"] = {
"Early Middle Persian",
nil,
"pal",
}
m["pal-lat"] = {
"Late Middle Persian",
nil,
"pal",
ancestors = "pal-ear",
}
m["ps-nwe"] = {
"Northwestern Pashto",
nil,
"ps",
}
m["ps-cgi"] = {
"Central Ghilzay",
nil,
"ps-nwe",
}
m["ps-mah"] = {
"Mahsudi",
nil,
"ps-nwe",
}
m["ps-nea"] = {
"Northeastern Pashto",
nil,
"ps",
}
m["ps-afr"] = {
"Afridi",
nil,
"ps-nea",
}
m["ps-bng"] = {
"Bangash",
nil,
"ps-nea",
}
m["ps-xat"] = {
"Khatak",
nil,
"ps-nea",
}
m["ps-pes"] = {
"Peshawari",
nil,
"ps-nea",
}
m["ps-sea"] = {
"Southeastern Pashto",
nil,
"ps",
}
m["ps-ban"] = {
"Bannu",
nil,
"ps-sea",
}
m["ps-kak"] = {
"Kakari",
nil,
"ps-sea",
}
m["ps-ser"] = {
"Sher",
nil,
"ps-sea",
}
m["ps-waz"] = {
"Waziri",
12274473,
"ps-sea",
}
m["ps-swe"] = {
"Southwestern Pashto",
nil,
"ps",
}
m["ps-kan"] = {
"Kandahari",
nil,
"ps-swe",
}
-- Jadrani: listed directly under "ps" but with an explicit `ancestors` value
-- ("ira-pat-pro"), unlike the neighbouring Pashto records. Trailing comma added
-- after the last field for consistency with the other records in this file.
m["ps-jad"] = {
"Jadrani",
nil,
"ps",
ancestors = "ira-pat-pro",
}
m["xme-azr"] = {
"Old Azari",
nil,
"xme-ott",
aliases = {"Old Azeri", "Azari", "Azeri", "Āḏarī", "Adari", "Adhari"},
}
m["xme-ttc-cen"] = {
"Central Tati",
nil,
"xme-ott",
}
m["xme-ttc-eas"] = {
"Eastern Tati",
nil,
"xme-ott",
}
m["xme-ttc-nor"] = {
"Northern Tati",
nil,
"xme-ott",
}
m["xme-ttc-sou"] = {
"Southern Tati",
nil,
"xme-ott",
}
m["xme-ttc-wes"] = {
"Western Tati",
nil,
"xme-ott",
}
m["xmn"] = {
"Manichaean Middle Persian",
nil,
"pal-lat",
}
m["fa-ear"] = {
"Early New Persian",
127413796,
"fa",
ancestors = "pal-lat",
translit = "fa-cls-translit",
}
m["fa-cls"] = {
"Classical Persian",
9168,
"fa",
ancestors = "fa-ear",
translit = "fa-cls-translit",
}
m["fa-ira"] = {
"Iranian Persian",
3513637,
"fa",
aliases = {"Modern Persian", "Western Persian"},
translit = "fa-ira-translit",
}
m["prs"] = {
"Dari",
178440,
"fa",
aliases = {"Dari Persian", "Central Persian", "Eastern Persian", "Afghan Persian"},
translit = "fa-cls-translit",
}
m["haz"] = {
"Hazaragi",
33398,
"prs",
translit = "fa-cls-translit",
}
m["os-dig"] = {
"Digor Ossetian",
3027861,
"os",
aliases = {"Digoron", "Digor"},
}
m["os-iro"] = {
"Iron Ossetian",
nil,
"os",
aliases = {"Iron"},
}
m["sog-ear"] = {
"Early Sogdian",
nil,
"sog",
}
m["sog-lat"] = {
"Late Sogdian",
nil,
"sog-ear",
}
-- NOTE(review): the third field is "ro", so this record does not look like an
-- Iranian lect even though it sits among the Iranian records; confirm whether it
-- should be moved to a more fitting section.
m["ro-MD"] = {
"Moldovan",
36392,
"ro",
aliases = {"Moldavian"},
}
m["oru-kan"] = {
"Kaniguram",
6363164,
"oru",
}
m["oru-log"] = {
"Logar",
nil,
"oru",
}
m["oos"] = {
"Old Ossetic",
65455882,
"xln",
}
m["oos-ear"] = {
"Early Old Ossetic",
nil,
"oos",
}
m["oos-lat"] = {
"Late Old Ossetic",
nil,
"oos",
}
m["rdb-jir"] = {
"Jirofti",
nil,
"rdb",
}
m["rdb-kah"] = {
"Kahnuji",
nil,
"rdb",
}
-- Southwestern Fars lects
m["fay-bur"] = {
"Burenjani",
nil,
"fay",
}
m["fay-bsh"] = {
"Bushehri",
nil,
"fay",
}
m["fay-dsh"] = {
"Dashtaki",
nil,
"fay",
}
m["fay-dav"] = {
"Davani",
5228140,
"fay",
}
m["fay-eze"] = {
"Emamzada Esmaili",
nil,
"fay",
}
m["fay-gav"] = {
"Gavkoshaki",
nil,
"fay",
}
m["fay-kho"] = {
"Khollari",
nil,
"fay",
}
m["fay-kon"] = {
"Kondazi",
nil,
"fay",
}
m["fay-kzo"] = {
"Old Kazeruni",
nil,
"fay",
}
m["fay-mas"] = {
"Masarami",
nil,
"fay",
}
m["fay-pap"] = {
"Papuni",
nil,
"fay",
}
m["fay-sam"] = {
"Samghani",
nil,
"fay",
}
m["fay-shr"] = {
"Shirazi",
nil,
"fay",
}
m["fay-sho"] = {
"Old Shirazi",
nil,
"fay",
}
m["fay-kar"] = {
"Khargi",
nil,
"fay",
}
m["fay-sor"] = {
"Sorkhi",
nil,
"fay",
}
-- Talysh lects
m["tly-cen"] = {
"Central Talysh",
nil,
"tly",
}
m["tly-asa"] = {
"Asalemi",
nil,
"tly-cen",
}
m["tly-kar"] = {
"Karganrudi",
nil,
"tly-cen",
}
m["tly-tul"] = {
"Tularudi",
nil,
"tly-cen",
}
m["tly-tal"] = {
"Taleshdulabi",
nil,
"tly-cen",
}
m["tly-nor"] = {
"Northern Talysh",
nil,
"tly",
}
m["tly-aze"] = {
"Azerbaijani Talysh",
nil,
"tly-nor",
}
m["tly-anb"] = {
"Anbarani",
nil,
"tly-nor",
}
m["tly-sou"] = {
"Southern Talysh",
nil,
"tly",
}
m["tly-fum"] = {
"Fumani",
nil,
"tly-sou",
}
m["tly-msu"] = {
"Masulei",
nil,
"tly-sou",
}
m["tly-msa"] = {
"Masali",
nil,
"tly-sou",
}
m["tly-san"] = {
"Shandarmani",
nil,
"tly-sou",
}
-- Tafreshi lects
m["xme-amo"] = {
"Amorehi",
nil,
"xme-taf",
}
m["atn"] = {
"Ashtiani",
3436590,
"xme-taf",
}
m["xme-bor"] = {
"Borujerdi",
nil,
"xme-taf",
}
m["xme-ham"] = {
"Hamadani",
6302426,
"xme-taf",
}
m["xme-kah"] = {
"Kahaki",
nil,
"xme-taf",
}
m["vaf"] = {
"Vafsi",
32611,
"xme-taf",
}
-- Kermanic lects
m["kfm"] = {
"Khunsari",
6403030,
"xme-ker",
}
m["xme-mah"] = {
"Mahallati",
nil,
"xme-ker",
}
m["xme-von"] = {
"Vonishuni",
nil,
"xme-ker",
}
m["xme-bdr"] = {
"Badrudi",
nil,
"xme-ker",
}
m["xme-del"] = {
"Delijani",
nil,
"xme-ker",
}
m["xme-kas"] = {
"Kashani",
nil,
"xme-ker",
}
m["xme-kes"] = {
"Kesehi",
nil,
"xme-ker",
}
m["xme-mey"] = {
"Meymehi",
nil,
"xme-ker",
}
m["ntz"] = {
"Natanzi",
6968399,
"xme-ker",
}
m["xme-abz"] = {
"Abuzeydabadi",
nil,
"xme-ker",
}
m["xme-aby"] = {
"Abyanehi",
nil,
"xme-ker",
}
m["xme-far"] = {
"Farizandi",
nil,
"xme-ker",
}
m["xme-jow"] = {
"Jowshaqani",
nil,
"xme-ker",
}
m["xme-nas"] = {
"Nashalji",
nil,
"xme-ker",
}
m["xme-qoh"] = {
"Qohrudi",
nil,
"xme-ker",
}
m["xme-yar"] = {
"Yarandi",
nil,
"xme-ker",
}
m["soj"] = {
"Soi",
7930463,
"xme-ker",
aliases = {"Sohi"},
}
m["xme-tar"] = {
"Tari",
nil,
"xme-ker",
}
m["gzi"] = {
"Gazi",
5529130,
"xme-ker",
}
m["xme-sed"] = {
"Sedehi",
nil,
"xme-ker",
}
m["xme-ard"] = {
"Ardestani",
nil,
"xme-ker",
}
m["xme-zef"] = {
"Zefrehi",
nil,
"xme-ker",
}
m["xme-isf"] = {
"Isfahani",
nil,
"xme-ker",
}
m["xme-kaf"] = {
"Kafroni",
nil,
"xme-ker",
}
m["xme-vrz"] = {
"Varzenehi",
nil,
"xme-ker",
}
m["xme-xur"] = {
"Khuri",
nil,
"xme-ker",
}
m["nyq"] = {
"Nayini",
6983146,
"xme-ker",
}
m["xme-ana"] = {
"Anaraki",
nil,
"xme-ker",
}
m["gbz"] = {
"Zoroastrian Dari",
32389,
"xme-ker",
aliases = {"Behdināni", "Gabri", "Gavrŭni", "Gabrōni"},
}
m["xme-krm"] = {
"Kermani",
nil,
"xme-ker",
}
m["xme-yaz"] = {
"Yazdi",
nil,
"xme-ker",
}
m["xme-bid"] = {
"Bidhandi",
nil,
"xme-ker",
}
m["xme-bij"] = {
"Bijagani",
nil,
"xme-ker",
}
m["xme-cim"] = {
"Chimehi",
nil,
"xme-ker",
}
m["xme-han"] = {
"Hanjani",
nil,
"xme-ker",
}
m["xme-kom"] = {
"Komjani",
nil,
"xme-ker",
}
m["xme-nar"] = {
"Naraqi",
nil,
"xme-ker",
}
m["xme-nus"] = {
"Nushabadi",
nil,
"xme-ker",
}
m["xme-qal"] = {
"Qalhari",
nil,
"xme-ker",
}
m["xme-trh"] = {
"Tarehi",
nil,
"xme-ker",
}
m["xme-val"] = {
"Valujerdi",
nil,
"xme-ker",
}
m["xme-var"] = {
"Varani",
nil,
"xme-ker",
}
m["xme-zor"] = {
"Zori",
nil,
"xme-ker",
}
-- Ramandi lects
m["tks-ebr"] = {
"Ebrahimabadi",
nil,
"tks",
}
m["tks-sag"] = {
"Sagzabadi",
nil,
"tks",
}
m["tks-esf"] = {
"Esfarvarini",
nil,
"tks",
}
m["tks-tak"] = {
"Takestani",
nil,
"tks",
}
m["tks-cal"] = {
"Chali Tati",
nil,
"tks",
aliases = {"Chāli"},
}
m["tks-dan"] = {
"Danesfani",
nil,
"tks",
}
m["tks-xia"] = {
"Khiaraji",
nil,
"tks",
}
m["tks-xoz"] = {
"Khoznini",
nil,
"tks",
}
-- Shughni dialects
m["sgh-bro"] = {
"Bartangi-Oroshori",
nil,
"sgh",
}
m["sgh-bar"] = {
"Bartangi",
nil,
"sgh-bro",
}
m["sgh-oro"] = {
"Oroshori",
nil,
"sgh-bro",
aliases = {"Roshorvi"},
}
m["sgh-rsx"] = {
"Roshani-Khufi",
nil,
"sgh",
}
m["sgh-xuf"] = {
"Khufi",
2562249,
"sgh-rsx",
aliases = {"Xufi", "Xūfī"},
}
m["sgh-ros"] = {
"Roshani",
2597566,
"sgh-rsx",
aliases = {"Rushani", "Rōšāni"},
}
m["sgh-xgb"] = {
"Khughni-Bajui",
nil,
"sgh",
}
m["sgh-xug"] = {
"Khughni",
nil,
"sgh-xgb",
}
m["sgh-baj"] = {
"Bajui",
nil,
"sgh-xgb",
}
-------------------------------------------------------------------------
-- Nuristani varieties --
-------------------------------------------------------------------------
m["bsh-kat"] = {
"Kativiri",
2605045,
"bsh",
aliases = {"Katə́viri"},
}
m["xvi"] = {
"Kamviri",
1193495,
"bsh",
aliases = {"Kamvíri"},
}
m["bsh-mum"] = {
"Mumviri",
nil,
"bsh",
aliases = {"Mumvíri"},
}
--------------------------------------------------------------------------------------
-- Italic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Latin varieties --
-------------------------------------------------------------------------
-- Latin varieties by period
m["itc-ola"] = {
"Old Latin",
12289,
"la",
"Latn, Ital",
translit = {
Ital = "Ital-translit"
},
}
m["itc-lan"] = {
"Lanuvian",
16890829,
"itc-ola",
aliases = {"Lanuvine"},
}
m["itc-pra"] = {
"Praenestine",
16889772,
"itc-ola",
aliases = {"Praenestinian"},
}
m["la-cla"] = {
"Classical Latin",
253854,
"la",
}
m["la-vul"] = {
"Vulgar Latin",
37560,
"la-cla",
}
m["la-afr"] = {
"African Romance",
162064,
"roa-pro",
}
m["la-lat"] = {
"Late Latin",
1503113,
"la",
ancestors = "la-cla",
}
m["la-med"] = {
"Medieval Latin",
1163234,
"la",
ancestors = "la-lat",
}
m["la-eme"] = {
"Early Medieval Latin",
nil,
"la-med",
}
m["la-ecc"] = {
"Ecclesiastical Latin",
1247932,
"la",
aliases = {"Church Latin", "Liturgical Latin"},
ancestors = "la-lat",
}
m["la-ren"] = {
"Renaissance Latin",
499083,
"la",
ancestors = "la-med",
}
m["la-new"] = {
"New Latin",
1248221,
"la",
aliases = {"Modern Latin"},
ancestors = "la-ren",
}
m["la-con"] = {
"Contemporary Latin",
1246397,
"la-new",
}
-------------------------------------------------------------------------
-- Miscellaneous Italic varieties --
-------------------------------------------------------------------------
m["xfa-cap"] = {
"Capenate",
133182969,
"xfa",
}
m["osc-luc"] = {
"Lucanian",
3265025,
"osc",
}
m["osc-sam"] = {
"Samnite",
133184287,
"osc",
}
-------------------------------------------------------------------------
-- Romance varieties --
-------------------------------------------------------------------------
m["roa-pro"] = {
"Proto-Romance",
3408029,
"la-lat",
ancestors = "la-vul",
}
-----------------------------------------------------
-- Catalan varieties --
-----------------------------------------------------
m["ca-val"] = {
"Valencian",
32641,
"ca",
}
-----------------------------------------------------
-- Franco-Provençal varieties --
-----------------------------------------------------
m["frp-old"] = {
"Old Franco-Provençal",
nil,
"frp",
}
-----------------------------------------------------
-- French and derived creole varieties --
-----------------------------------------------------
m["fro-nor"] = {
"Old Northern French",
2044917,
"fro",
aliases = {"Old Norman", "Old Norman French"},
}
m["fro-pic"] = {
"Picard Old French",
nil,
"fro",
}
m["xno"] = {
"Anglo-Norman",
35214,
"fro-nor",
}
m["xno-law"] = {
"Law French",
2044323,
"xno",
}
m["zrp"] = {
"Zarphatic",
36994,
"fro",
aliases = {"Judeo-French"},
pseudo_families = "qfa-jew",
}
m["fr-CA"] = {
"Canadian French",
1450506,
"fr",
}
m["fr-CH"] = {
"Swiss French",
1480152,
"fr",
}
m["fr-aca"] = {
"Acadian French",
415109,
"fr",
}
m["fr-lou"] = {
"Louisiana French",
3083213,
"fr",
}
m["fr-mis"] = {
"Missouri French",
3083210,
"fr",
}
m["frc"] = {
"Cajun French",
880301,
"fr-lou",
}
m["ht-sdm"] = {
"Saint Dominican Creole French",
nil,
"ht",
ancestors = "fr",
}
-- Norman varieties
m["nrf-grn"] = {
"Guernsey Norman",
56428,
"nrf",
aliases = {"Guernsey"},
}
m["nrf-jer"] = {
"Jersey Norman",
56430,
"nrf",
aliases = {"Jersey"},
}
-----------------------------------------------------
-- Gallo-Italic varieties --
-----------------------------------------------------
m["egl-old"] = {
"Old Emilian",
nil,
"egl",
}
m["lij-old"] = {
"Old Ligurian",
nil,
"lij",
aliases = {"Old Genoese"},
}
m["lmo-old"] = {
"Old Lombard",
97165320,
"lmo",
}
m["pms-old"] = {
"Old Piedmontese",
nil,
"pms",
aliases = {"Old Piemontese"},
}
m["vec-old"] = {
"Old Venetan",
nil,
"vec",
aliases = {"Old Venetian"},
}
m["rgn-old"] = {
"Old Romagnol",
nil,
"rgn",
}
-----------------------------------------------------
-- Italo-Romance varieties --
-----------------------------------------------------
-- Italian varieties
m["roa-oit"] = {
"Old Italian",
nil,
"it",
}
m["it-CH"] = {
"Switzerland Italian",
672147,
"it",
}
-- Other Italo-Romance varieties
m["nap-old"] = {
"Old Neapolitan",
nil,
"nap",
}
m["scn-old"] = {
"Old Sicilian",
nil,
"scn",
}
-----------------------------------------------------
-- Occitan varieties --
-----------------------------------------------------
m["oc-auv"] = {
"Auvergnat",
35359,
"oc",
aliases = {"Auvernhat", "Auvergnese"},
}
m["oc-gas"] = {
"Gascon",
35735,
"oc",
}
-- standardized dialect of Gascon
m["oc-ara"] = {
"Aranese",
10196,
"oc-gas",
}
m["oc-lan"] = {
"Languedocien",
942602,
"oc",
aliases = {"Lengadocian"},
}
m["oc-lim"] = {
"Limousin",
427614,
"oc",
}
m["oc-pro"] = {
"Provençal",
241243,
"oc",
aliases = {"Provencal"},
}
m["oc-pro-old"] = {
"Old Provençal",
2779185,
"pro",
}
m["oc-viv"] = {
"Vivaro-Alpine",
1649613,
"oc",
}
m["oc-jud"] = {
"Shuadit",
56472,
"oc",
aliases = {
"Chouhadite", "Chouhadit", "Chouadite", "Chouadit", "Shuhadit",
"Judeo-Occitan", "Judæo-Occitan", "Judaeo-Occitan",
"Judeo-Provençal", "Judæo-Provençal", "Judaeo-Provençal",
"Judeo-Provencal", "Judaeo-Provencal",
"Judeo-Comtadin", "Judæo-Comtadin", "Judaeo-Comtadin",
},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Portuguese and derived creole varieties --
-----------------------------------------------------
-- Portuguese
m["pt-BR"] = {
"Brazilian Portuguese",
750553,
"pt",
}
m["pt-PT"] = {
"European Portuguese",
922399,
"pt",
}
-- Kabuverdianu (Cape Verde Creole, Cape Verdean Creole)
m["kea-bar"] = {
"Barlavento Kabuverdianu",
2217638,
"kea",
aliases = {"Barlavento", "Barlavento Creole", "Sampadjudu"},
}
m["kea-bvi"] = {
"Boa Vista Kabuverdianu",
16501837,
"kea-bar",
aliases = {"Boa Vista Creole"},
}
m["kea-sal"] = {
"Sal Kabuverdianu",
18707467,
"kea-bar",
aliases = {"Sal Creole"},
}
m["kea-saa"] = {
"Santo Antão Kabuverdianu",
18707472,
"kea-bar",
aliases = {"Santo Antão Creole"},
}
m["kea-sni"] = {
"São Nicolau Kabuverdianu",
18707549,
"kea-bar",
aliases = {"São Nicolau Creole"},
}
m["kea-svi"] = {
"São Vicente Kabuverdianu",
18707550,
"kea-bar",
aliases = {"São Vicente Creole"},
}
m["kea-sot"] = {
"Sotavento Kabuverdianu",
10261559,
"kea",
aliases = {"Sotavento", "Sotavento Creole", "Badiu"},
}
m["kea-bra"] = {
"Brava Kabuverdianu",
18670181,
"kea-sot",
aliases = {"Brava Creole"},
}
m["kea-fog"] = {
"Fogo Kabuverdianu",
18706861,
"kea-sot",
aliases = {"Fogo Creole"},
}
m["kea-mai"] = {
"Maio Kabuverdianu",
18707286,
"kea-sot",
aliases = {"Maio Creole"},
}
m["kea-san"] = {
"Santiago Kabuverdianu",
35117,
"kea-sot",
aliases = {"Santiago Creole"},
}
m["kea-alu"] = {
"ALUPEC Kabuverdianu",
375704,
"kea",
aliases = {"ALUPEC", "Alfabeto Unificado para a Escrita do Cabo-Verdiano"},
}
-----------------------------------------------------
-- Rhaeto-Romance varieties --
-----------------------------------------------------
-- Friulian varieties
m["fur-old"] = {
"Old Friulian",
nil,
"fur",
}
-- Ladin varieties
m["lld-amp"] = {
"Ampezan Ladin",
25617466,
"lld",
aliases = {"Anpezan", "Ampezan", "Ampezzan", "Ampezzano"},
}
m["lld-bad"] = {
"Badiot Ladin",
3706562,
"lld",
aliases = {"Badiot", "Badioto", "Badiotto"},
}
m["lld-cad"] = {
"Cadorino Ladin",
3706570,
"lld",
aliases = {"Cadorino"},
}
m["lld-fas"] = {
"Fascian Ladin",
742627,
"lld",
aliases = {"Fascian", "Fassano"},
}
m["lld-fod"] = {
"Fodom Ladin",
3706605,
"lld",
aliases = {"Fodom", "Livinallese"},
}
m["lld-for"] = {
"Fornes Ladin",
5470374,
"lld",
aliases = {"Fornes"},
}
m["lld-ghe"] = {
"Gherdëina Ladin",
3706597,
"lld",
aliases = {"Gherdëina", "Gardenese", "Val Gardena"},
}
m["lld-non"] = {
"Nones Ladin",
1055027,
"lld",
aliases = {"Nones", "Noneso"},
}
-- Romansh varieties
m["rm-old"] = {
"Old Romansh",
nil,
"rm",
}
m["rm-put"] = {
"Puter Romansh",
688309,
"rm",
aliases = {"Puter", "Putèr", "Upper Engadine", "rm-puter"},
}
m["rm-srm"] = {
"Surmiran Romansh",
690216,
"rm",
aliases = {"Surmiran", "rm-surmiran",
"Surmiran-Albula", -- Glottolog
},
}
m["rm-srs"] = {
"Sursilvan Romansh",
688348,
"rm",
aliases = {"Sursilvan", "rm-sursilv"},
}
m["rm-sut"] = {
"Sutsilvan Romansh",
688272,
"rm",
aliases = {"Sutsilvan", "rm-sutsilv"},
varieties = {"Scharans Sutsilvan"}, -- per Glottolog
}
-- Vallader (Lower Engadine) variety of Romansh.
m["rm-val"] = {
"Vallader Romansh",
690226,
"rm",
-- "Putèr" is intentionally not listed here: it is an alias of Puter Romansh ("rm-put", Upper Engadine),
-- and repeating it for Vallader would make the alias ambiguous between the two lects.
aliases = {"Vallader", "Lower Engadine", "rm-vallader"},
}
m["rm-gri"] = {
"Rumantsch Grischun",
688873,
"rm",
aliases = {"rm-rumgr"},
}
-----------------------------------------------------
-- Sardinian varieties --
-----------------------------------------------------
m["sc-old"] = {
"Old Sardinian",
nil,
"sc",
}
m["sc-src"] = {
"Logudorese",
777974,
"sc",
aliases = {"Logudorese Sardinian"},
}
m["sc-nuo"] = {
"Nuorese",
nil,
"sc-src",
aliases = {"Nuorese Sardinian"},
}
m["sc-sro"] = {
"Campidanese",
35348,
"sc",
aliases = {"Campidanese Sardinian"},
}
-----------------------------------------------------
-- Spanish varieties --
-----------------------------------------------------
m["es-ear"] = {
"Early Modern Spanish",
5364419,
"es",
}
m["es-AR"] = {
"Rioplatense Spanish",
509780,
"es",
}
m["es-BO"] = {
"Bolivian Spanish",
510730,
"es",
}
m["es-CL"] = {
"Chilean Spanish",
857295,
"es",
}
m["es-CO"] = {
"Colombian Spanish",
1115875,
"es",
}
m["es-CU"] = {
"Cuban Spanish",
824909,
"es",
}
m["es-MX"] = {
"Mexican Spanish",
616620,
"es",
}
m["es-PE"] = {
"Peruvian Spanish",
736236,
"es",
}
m["es-PH"] = {
"Philippine Spanish",
22091406,
"es",
}
m["es-US"] = {
"United States Spanish",
2301077,
"es",
aliases = {"US Spanish"},
}
-- NOTE: Presumably refers to "es-US" above: use the label "US Spanish" to put Spanish terms in this category.
m["es-PR"] = {
"Puerto Rican Spanish",
7258609,
"es",
}
m["es-VE"] = {
"Venezuelan Spanish",
840017,
"es",
}
m["es-lun"] = {
"Lunfardo",
1401612,
"es",
}
----------------------------------------------------------------------------------------------------------------------
-- Japonic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Japanese varieties
-- Middle Japanese: umbrella entry for the Early ("ja-mid-ear") and Late ("ja-mid-lat") Middle Japanese stages.
m["ja-mid"] = {
"Middle Japanese",
6841474,
-- Filed under Japanese, like the other historical stages "ja-ear" and "ja-cla". Using "ojp" as the parent
-- while also naming "ojp" as the ancestor would make Old Japanese both the containing language and the
-- ancestor of this entry.
"ja",
ancestors = "ojp",
}
m["ja-mid-ear"] = {
"Early Middle Japanese",
182695,
"ja-mid",
}
m["ja-mid-lat"] = {
"Late Middle Japanese",
1816184,
"ja-mid",
ancestors = "ja-mid-ear",
}
m["ja-ear"] = {
"Early Modern Japanese",
5326692,
"ja",
ancestors = "ja-mid-lat",
}
m["ojp-eas"] = {
"Eastern Old Japanese",
65247957,
"ojp",
}
m["ja-cla"] = {
"Classical Japanese",
1332057,
"ja",
-- FIXME: This is redundant because Classical Japanese is considered a child of (Modern) Japanese, which has ja-mid-ear
-- (as well as ja-mid-lat) as ancestors. However, the intent here is that the *direct* ancestor of ja-cla is ja-mid-ear
-- and ja-mid-lat is not an ancestor. Need to rethink ancestor handling.
-- ancestors = "ja-mid-ear",
}
----------------------------------------------------------------------------------------------------------------------
-- Koreanic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Korean varieties
m["oko-lat"] = {
"Late Old Korean",
nil,
"oko",
}
m["okm-ear"] = {
"Early Middle Korean",
nil,
"okm",
}
m["ko-cen"] = {
"Central Korean",
nil,
"ko",
}
m["ko-gyg"] = {
"Gyeonggi Korean",
485492,
"ko-cen",
aliases = {"Seoul Korean"},
}
m["ko-chu"] = {
"Chungcheong Korean",
625800,
"ko-cen",
aliases = {"Hoseo Korean"},
}
m["ko-hwa"] = {
"Hwanghae Korean",
16183706,
"ko-cen",
}
m["ko-gan"] = {
"Gangwon Korean",
11260444,
"ko-cen",
aliases = {"Yeongdong Korean"},
}
m["ko-gys"] = {
"Gyeongsang Korean",
488002,
"ko",
aliases = {"Southeastern Korean"},
}
m["ko-jeo"] = {
"Jeolla Korean",
11250166,
"ko",
aliases = {"Southwestern Korean"},
}
m["ko-pyo"] = {
"Pyongan Korean",
7263142,
"ko",
aliases = {"Northwestern Korean"},
}
m["ko-ham"] = {
"Hamgyong Korean",
860702,
"ko",
aliases = {"Northeastern Korean"},
}
m["ko-yuk"] = {
"Yukjin Korean",
16171275,
"ko",
aliases = {"Yukchin Korean", "Ryukjin Korean", "Ryukchin Korean"},
}
----------------------------------------------------------------------------------------------------------------------
-- Mongolic varieties --
----------------------------------------------------------------------------------------------------------------------
m["xng-ear"] = {
"Early Middle Mongol",
nil,
"xng",
}
m["xng-lat"] = {
"Late Middle Mongol",
nil,
"xng",
ancestors = "xng-ear",
}
m["mn-kha"] = {
"Khalkha Mongolian",
6399808,
"mn",
aliases = {"Khalkha"},
}
m["mn-ord"] = {
"Ordos Mongolian",
716904,
"mn",
aliases = {"Ordos"},
}
m["mn-cha"] = {
"Chakhar Mongolian",
907425,
"mn",
aliases = {"Chakhar"},
}
m["mn-khr"] = {
"Khorchin Mongolian",
3196210,
"mn",
aliases = {"Khorchin"},
}
----------------------------------------------------------------------------------------------------------------------
-- Niger-Congo varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akan varieties --
-----------------------------------------------------
m["tw"] = {
"Twi Akan",
36850,
"ak",
aliases = {"Twi"},
}
m["abr"] = {
"Abron",
34831,
"tw",
aliases = {"Brong", "Bono", "Bono Twi"},
}
m["tw-asa"] = {
"Asante Twi",
19261685,
"tw",
aliases = {"Asante", "Ashanti", "Ashante"},
}
m["tw-aku"] = {
"Akuapem Twi",
31150449,
"tw",
aliases = {"Akuapem", "Akuapim", "Akwapem Twi", "Akwapi"},
}
m["fat"] = {
"Fante Akan",
35570,
"ak",
aliases = {"Fante", "Fanti", "Fantse", "Mfantse"},
}
m["wss"] = {
"Wasa",
36914,
"ak",
}
-- creole
m["alv-kro"] = {
"Kromanti",
1093206,
"crp-mar",
}
-----------------------------------------------------
-- Bantu varieties --
-----------------------------------------------------
m["bnt-cmn"] = {
"Common Bantu",
nil,
"bnt-pro",
}
m["xh-bha"] = {
"Bhaca",
4900493,
"xh",
aliases = {"isiBhaca", "IsiBhaca"},
}
-- Rwanda-Rundi varieties
m["rw-kin"] = {
"Kinyarwanda",
33573,
"rw",
aliases = {"Rwanda"},
}
m["rw-run"] = {
"Kirundi",
33583,
"rw",
aliases = {"Rundi"},
}
-----------------------------------------------------
-- Fula varieties --
-----------------------------------------------------
m["fuc"] = {
"Pulaar",
1420205,
"ff",
}
m["fuf"] = {
"Pular",
3915357,
"ff",
}
m["ffm"] = {
"Maasina Fulfulde",
3915322,
"ff",
}
m["fue"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Borgu Fulfulde",
12952426,
"ff",
}
m["fuh"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Western Niger Fulfulde",
12952430,
"ff",
}
m["fuq"] = {
-- no enwiki entry as of yet but frwiki, hrwiki and pmswiki have one
"Central-Eastern Niger Fulfulde",
12628799,
"ff",
}
m["fuv"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki and swwiki have one
"Nigerian Fulfulde",
36129,
"ff",
}
m["fub"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki, ptwiki, swwiki and yowiki have one
"Adamawa Fulfulde",
34776,
"ff",
}
m["fui"] = {
-- no enwiki entry as of yet but pmswiki and swwiki have one
"Bagirmi Fulfulde",
11003859,
"ff",
}
----------------------------------------------------------------------------------------------------------------------
-- Papuan varieties --
----------------------------------------------------------------------------------------------------------------------
m["kze"] = {
"Kosena",
12952663,
"auy",
}
m["ont"] = {
"Ontenu",
3352827,
"gaj",
aliases = {"Ontena"},
}
----------------------------------------------------------------------------------------------------------------------
-- Salishan varieties --
----------------------------------------------------------------------------------------------------------------------
m["lut-nor"] = {
"Northern Lushootseed",
nil,
"lut",
aliases = {"Northern Puget Sound Salish"},
}
m["slh"] = {
"Southern Lushootseed",
7997684,
"lut",
aliases = {"Southern Puget Sound Salish", "Twulshootseed", "Whulshootseed"},
}
m["ska"] = {
"Skagit",
12642471,
"lut-nor",
}
m["sno"] = {
"Snohomish",
25559662,
"lut-nor",
}
----------------------------------------------------------------------------------------------------------------------
-- Sino-Tibetan varieties --
----------------------------------------------------------------------------------------------------------------------
m["tbq-pro"] = {
"Proto-Tibeto-Burman",
7251864,
"sit-pro",
}
-----------------------------------------------------
-- Chinese varieties --
-----------------------------------------------------
------------- Old Chinese, Middle Chinese -------------
m["och-ear"] = {
"Early Old Chinese",
nil,
"och",
}
m["och-lat"] = {
"Late Old Chinese",
nil,
"och",
}
m["ltc-ear"] = {
"Early Middle Chinese",
nil,
"ltc",
}
m["ltc-lat"] = {
"Late Middle Chinese",
nil,
"ltc",
}
------------- Classical/Literary varieties -------------
-- FIXME: Temporary.
m["lzh-shi"] = {
"Traditional Chinese poetry",
1759242,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cii"] = {
"Ci",
1091366,
"lzh",
}
-- FIXME: Temporary.
m["lzh-yue"] = {
"Classical Cantonese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn"] = {
"Classical Mandarin",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-tai"] = {
"Classical Taishanese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn-TW"] = {
"Classical Taiwanese Mandarin",
nil,
"lzh-cmn",
}
-- FIXME: Temporary.
m["lzh-VI"] = {
"Vietnamese Classical Chinese",
17034227,
"lzh",
}
-- FIXME: Temporary.
m["lzh-KO"] = {
"Korean Classical Chinese",
10496257,
"lzh",
ietf_subtag = "lzh-KR" -- KR = South Korea, as there is no code for Korea as a whole
}
-- FIXME: Temporary.
m["lzh-lit"] = {
"Literary Chinese",
nil,
"lzh",
}
-- FIXME: Temporary. FIXME: Do we need this? How does it differ from Old Chinese?
m["lzh-pre"] = {
"Pre-Classical Chinese",
nil,
"lzh",
}
------------- Written Vernacular varieties -------------
-- FIXME: Temporary.
m["cmn-wvc"] = {
"Written vernacular Mandarin",
783605,
"cmn",
}
-- FIXME: Temporary. FIXME: How does this differ from "Literary Cantonese"?
m["yue-wvc"] = {
"Written vernacular Cantonese",
nil,
"yue",
}
-- FIXME: Temporary.
m["zhx-tai-wvc"] = {
"Written vernacular Taishanese",
nil,
"zhx-tai",
}
------------- Mandarin varieties -------------
-- FIXME: Temporary. NOTE: The Linguist List assigns the "w:Beijing dialect" (Wikidata 1147606) the code "cmn-bej" and
-- the larger "w:Beijing Mandarin (division of Mandarin)" dialect group (Wikidata 2169652; what we call "Beijingic
-- Mandarin", after Glottolog) the code "cmn-bei".
m["cmn-bei"] = {
"Beijing Mandarin",
1147606,
"cmn-bec",
}
-- FIXME: Temporary.
m["cmn-bec"] = {
"Beijingic Mandarin",
2169652,
"cmn",
}
-- FIXME: Temporary. NOTE: The Linguist List uses the code cmn-zho.
m["cmn-cep"] = {
"Central Plains Mandarin",
3048775,
"cmn",
aliases = {"Zhongyuan Mandarin"},
}
m["cmn-ear"] = {
"Early Mandarin",
837169,
"cmn",
ancestors = "ltc",
}
-- FIXME: Temporary.
m["cmn-gua"] = {
"Guanzhong Mandarin",
3431648,
"cmn-cep",
}
-- FIXME: Temporary. Appears to be a subdialect of Guiliu Mandarin, which in turn is a subdialect of Southwestern Mandarin.
m["cmn-gui"] = {
"Guilin Mandarin",
11111636,
"cmn-sow",
}
m["cmn-jhu"] = {
"Jianghuai Mandarin",
2128953,
"cmn",
aliases = {"Lower Yangtze Mandarin"},
}
-- FIXME: Temporary.
m["cmn-lan"] = {
"Lanyin Mandarin",
662754,
"cmn",
}
-- FIXME: Temporary.
m["cmn-MY"] = {
"Malaysian Mandarin",
13646143,
"cmn",
}
-- FIXME: Temporary.
m["cmn-nan"] = {
"Nanjing Mandarin",
2681098,
"cmn-jhu",
}
-- FIXME: Temporary.
m["cmn-noe"] = {
"Northeastern Mandarin",
1064504,
"cmn",
}
-- FIXME: Temporary.
m["cmn-PH"] = {
"Philippine Mandarin",
7185155,
"cmn",
}
-- FIXME: Temporary.
m["cmn-SG"] = {
"Singapore Mandarin",
1048980,
"cmn",
}
-- FIXME: Temporary.
m["cmn-sow"] = {
"Southwestern Mandarin",
2609239,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Jilu Mandarin.
m["cmn-tia"] = {
"Tianjin Mandarin",
7800220,
"cmn",
}
-- FIXME: Temporary. NOTE: Wikidata also has Q4380827 "Taiwanese Mandarin", defined as "rare dialect of Standard Chinese
-- (Mandarin) used in Taiwan, which is strongly influenced by Taiwanese Hokkien; mostly used by elderlies" and having no
-- English Wikipedia article (but see w:zh:臺灣國語).
m["cmn-TW"] = {
"Taiwanese Mandarin",
262828,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Wu-Tian Mandarin, in turn a subdialect of Southwestern Mandarin.
-- Given the code cmn-xwu in the Linguist List.
m["cmn-wuh"] = {
"Wuhan Mandarin",
11124731,
"cmn-sow",
aliases = {"Wuhanese"},
}
-- FIXME: Temporary. Appears to be a subdialect of Lanyin Mandarin.
m["cmn-xin"] = {
"Xining Mandarin",
nil,
"cmn-lan",
}
-- FIXME: Temporary.
m["cmn-yan"] = {
"Yangzhou Mandarin",
nil,
"cmn-jhu",
}
------------- Cantonese varieties -------------
-- FIXME: Temporary.
m["yue-gua"] = {
"Guangzhou Cantonese",
nil,
"yue",
}
-- FIXME: Temporary. Given the codes yue-yue or yue-can in the Linguist List.
m["yue-HK"] = {
"Hong Kong Cantonese",
5894342,
"yue",
}
-- FIXME: Temporary. FIXME: How does this differ from "Written vernacular Cantonese"?
m["yue-lit"] = {
"Literary Cantonese",
2472605,
"yue",
}
------------- Wu varieties -------------
m["wuu-han"] = {
"Hangzhounese",
5648144,
"wuu",
}
m["wuu-nin"] = {
"Ningbonese",
3972199,
"wuu",
}
-- FIXME: Temporary.
m["wuu-nor"] = {
"Northern Wu",
7675988,
"wuu",
aliases = {"Taihu Wu"},
}
-- FIXME: Temporary? Subvariety of Taihu Wu. NOTE: "chm" stands for Chongming, the main dialect, to avoid a conflict
-- with Shanghainese.
m["wuu-chm"] = {
"Shadi Wu",
6112340,
"wuu-nor",
}
m["wuu-sha"] = {
"Shanghainese",
36718,
"wuu-nor",
}
m["wuu-suz"] = {
"Suzhounese",
831744,
"wuu-nor",
}
-- FIXME: Temporary. May be converted into a full language and/or split.
m["wuu-wen"] = {
"Wenzhounese",
710218,
"wuu",
}
------------- Xiang varieties -------------
m["hsn-lou"] = {
"Loudi Xiang",
10943823,
"hsn-old",
}
m["hsn-hya"] = {
"Hengyang Xiang",
20689035,
"hsn-hzh",
}
m["hsn-hzh"] = {
"Hengzhou Xiang",
nil,
"hsn",
}
m["hsn-new"] = {
"New Xiang",
7012696,
"hsn",
aliases = {"Chang-Yi"},
}
m["hsn-old"] = {
"Old Xiang",
7085453,
"hsn",
aliases = {"Lou-Shao"},
}
------------- Hakka varieties -------------
-- FIXME: Temporary.
m["hak-dab"] = {
"Dabu Hakka",
19855566,
"hak", -- formerly hak-TW but seems to be spoken primarily in Dabu County in Guangdong
}
-- FIXME: Temporary.
m["hak-eam"] = {
"Early Modern Hakka",
nil,
"hak",
}
-- FIXME: Temporary.
m["hak-hai"] = {
"Hailu Hakka",
17038519,
"hak", -- often considered a Taiwanese lect but also spoken in [[Shanwei]], [[Guangdong]]
}
-- FIXME: Temporary.
m["hak-HK"] = {
"Hong Kong Hakka",
2675834,
"hak",
}
-- FIXME: Temporary.
m["hak-hui"] = {
"Huiyang Hakka",
16873881,
"hak",
}
-- FIXME: Temporary.
m["hak-hui-MY"] = {
"Malaysian Huiyang Hakka",
nil,
"hak-hui",
}
-- FIXME: Temporary. Similar to and possibly the parent of Sixian Hakka in Taiwan.
m["hak-mei"] = {
"Meixian Hakka",
839295,
"hak",
aliases = {"Moiyan Hakka", "Meizhou Hakka"},
}
-- FIXME: Temporary.
m["hak-six"] = {
"Sixian Hakka",
9668261,
"hak-TW",
}
-- FIXME: Temporary.
m["hak-TW"] = {
"Taiwanese Hakka",
2391532,
"hak",
}
-- FIXME: Temporary.
m["hak-zha"] = {
"Zhao'an Hakka",
6703311,
"hak",
aliases = {"Zhangzhou Hakka"},
}
------------- Southern Min varieties -------------
m["nan-anx"] = {
"Anxi Hokkien",
97064149,
"nan-qua",
}
m["nan-cha"] = {
"Changtai Hokkien",
nil,
"nan-zha",
}
m["nan-hou"] = {
"Houlu Min",
19855492,
"nan-dat",
}
m["nan-hui"] = {
"Hui'an Hokkien",
16241797,
"nan-qua",
}
m["nan-jin"] = {
"Jinjiang Hokkien",
11089375,
"nan-qua",
}
m["nan-kin"] = {
"Kinmenese Hokkien",
56278342,
"nan-xia",
aliases = {"Kinmen Hokkien"},
}
m["nan-med"] = {
"Medan Hokkien",
6805114,
"nan-zha",
}
m["nan-pen"] = {
"Penang Hokkien",
11120689,
"nan-zha",
}
m["nan-hbl-PH"] = {
"Philippine Hokkien",
3236692,
"nan-qua",
}
m["nan-qia"] = {
"Qianlu Min",
19842517,
"nan-dat",
}
m["nan-qua"] = {
"Quanzhou Hokkien",
2251677,
"nan-hbl",
aliases = {"Chinchew", "Choanchew"},
}
-- FIXME: Temporary? Derived from both Quanzhou and Zhangzhou Hokkien.
m["nan-hbl-SG"] = {
"Singapore Hokkien",
3846528,
"nan-hbl",
}
m["nan-spm"] = {
"Southern Malaysian Hokkien",
7570322,
"nan-qua",
aliases = {"Southern Malaysia Hokkien", "Southern Peninsular Malaysian Hokkien", "Southern Peninsular Malaysia Hokkien"}
}
m["nan-hbl-TW"] = {
"Taiwanese Hokkien",
36778,
"nan-hbl",
}
m["nan-ton"] = {
"Tong'an Hokkien",
nil,
"nan-xia",
}
m["nan-xia"] = {
"Xiamen Hokkien",
68744,
"nan-hbl",
aliases = {"Amoy", "Amoyese", "Amoynese", "Xiamenese"},
}
m["nan-yon"] = {
"Yongchun Hokkien",
65118728,
"nan-qua",
}
m["nan-zha"] = {
"Zhangzhou Hokkien",
8070492,
"nan-hbl",
aliases = {"Changchew", "Chiangchew", "Changchow"},
}
m["nan-zho"] = {
"Zhao'an Hokkien",
-- NOTE(review): this Wikidata ID is identical to the one given for "nan-yon" (Yongchun Hokkien).
-- Two distinct lects should not share an item, so one of the two entries presumably carries the
-- wrong ID -- TODO confirm against Wikidata and correct whichever is mistaken.
65118728,
"nan-zha",
aliases = {"Zhao'an", "Chawan", "Chawan Hokkien"},
}
m["nan-zhp"] = {
"Zhangping Hokkien",
15937822,
"nan-zha",
}
------------- Other Min varieties -------------
-- FIXME: Temporary. Affiliation within Min uncertain; some combination of Eastern and Southern.
m["zhx-zho"] = {
"Zhongshan Min",
8070958,
"zh",
}
------------- Other Chinese varieties -------------
-- FIXME: Temporary. Affiliation within Chinese uncertain; possibly Yue.
m["zhx-dan"] = {
"Danzhou Chinese",
2578935,
"zh",
}
------------- Chinese romanization varieties -------------
-- [[Wiktionary:Information desk/2022/June#Etymology Coding Issue]]
-- [[Wiktionary:Grease pit/2022/June#Transliteration Systems in Etymologies 2]]
m["cmn-pinyin"] = {
"Hanyu Pinyin",
42222,
"cmn",
aliases = {"Pinyin"},
}
m["cmn-tongyong"] = {
"Tongyong Pinyin",
700739,
"cmn",
}
m["cmn-wadegiles"] = {
"Wade–Giles",
208442,
"cmn",
aliases = {"Wade-Giles", "Wade Giles"},
}
m["zh-postal"] = {
"Postal Romanization",
151868,
"zh",
}
-- Chinese cyrillization
m["cmn-palladius"] = {
"Palladius",
1234239,
"cmn",
aliases = {"Palladius system"},
}
-----------------------------------------------------
-- Tibetic varieties --
-----------------------------------------------------
m["adx"] = {
"Amdo Tibetan",
56509,
"bo",
}
m["kbg"] = {
"Khamba",
12952626,
"bo",
}
m["khg"] = {
"Khams Tibetan",
56601,
"bo",
}
m["tsk"] = {
"Tseku",
11159532,
"bo",
}
----------------------------------------------------------------------------------------------------------------------
-- Tai-Kadai varieties --
----------------------------------------------------------------------------------------------------------------------
m["th-old"] = {
"Old Thai",
nil,
"tai-swe-pro",
wikipedia_article = "Thai language#Old Thai",
}
m["th-suk"] = {
"Sukhothai Old Thai", -- 1238-1438. Cannot use "Sukhothai Thai" as Sukhothai is the current city and "Sukhothai Thai" is a lect.
nil,
"th-old",
aliases = {"Sukhothai Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
m["th-ayu"] = {
"Ayutthaya Old Thai", -- 1351-1767. Cannot use "Ayutthaya Thai" as Ayutthaya is the current city.
nil,
"th-old",
aliases = {"Ayutthaya Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
--[[
m["th-new"] = {
"Hacked Thai", -- temporary for testing new translit/display methods
nil,
"th",
translit = "User:Benwing2/th-scraping-translit",
display_text = "User:Benwing2/th-scraping-translit",
strip_diacritics = "User:Benwing2/th-scraping-translit",
preprocess_links = "User:Benwing2/th-scraping-translit",
}
]]
m["tai-shz"] = {
"Shangsi Zhuang",
-- NOTE(review): confirm that this Wikidata ID is specific to Shangsi Zhuang and is not the item for
-- Zhuang (the parent "za") as a whole; if no dedicated item exists, nil is used elsewhere in this file.
13216,
"za",
}
----------------------------------------------------------------------------------------------------------------------
-- Turkic varieties --
----------------------------------------------------------------------------------------------------------------------
m["trk-cmn-pro"] = {
"Proto-Common Turkic",
1126028,
"trk-pro",
}
m["trk-ogr-pro"] = {
"Proto-Oghur",
1422731,
"trk-pro",
family = "trk-ogr",
}
m["trk-bul-pro"] = {
"Proto-Bulgar",
nil,
"trk-ogr-pro",
}
m["trk-ogz-pro"] = {
"Proto-Oghuz",
494600,
"trk-pro",
family = "trk-ogz",
aliases = {"Southwestern Common Turkic"},
}
m["crh-dbj"] = {
"Dobrujan Tatar",
12811566,
"crh",
aliases = {"Romanian Tatar"},
}
m["cv-ana"] = {
"Anatri Chuvash",
nil,
"cv",
aliases = {"Anatri", "Lower Chuvash"},
}
m["cv-mid"] = {
"Middle Chuvash",
nil,
"cv",
ancestors = "cv-old",
}
m["cv-old"] = {
"Old Chuvash",
nil,
"cv",
ancestors = "xbo-vol",
}
m["cv-vir"] = {
"Viryal Chuvash",
4278332,
"cv",
aliases = {"Viryal", "Upper Chuvash"},
}
m["kjh-fyu"] = {
"Fuyu Kyrgyz",
2598963,
"kjh",
aliases = {"Fuyu Kirgiz", "Fuyu Kirghiz", "Manchurian Kyrgyz", "Manchurian Kirgiz", "Manchurian Kirghiz"},
}
m["klj-arg"] = {
"Arghu",
33455,
"klj",
ancestors = "trk-cmn-pro",
}
m["otk-kir"] = {
"Old Kirghiz",
83142,
"otk",
aliases = {"Yenisei Turkic", "Yenisei Kyrgyz"},
}
m["otk-ork"] = {
"Orkhon Turkic",
31295480,
"otk",
}
m["qwm-cum"] = {
"Cuman",
1075050,
"qwm",
aliases = {"Kuman", "Polovtsian", "Polovcian"},
}
m["qwm-arm"] = {
"Armeno-Kipchak",
2027503,
"qwm",
ancestors = "qwm-cum",
aliases = {"Xıpçaχ tili", "Tatarça"},
}
m["qwm-mam"] = {
"Mamluk-Kipchak",
4279942,
"qwm",
aliases = {"Mameluk-Kipchak"},
}
m["az-cls"] = {
"Classical Azerbaijani",
nil,
"az",
aliases = {"Classical Azeri"},
}
m["qxq"] = {
"Qashqai",
13192,
"az",
aliases = {"Qaşqay", "Qashqayi", "Kashkai", "Kashkay"},
}
m["tr-CY"] = {
"Cypriot Turkish",
7917392,
"tr",
}
m["uz-afg"] = {
-- NOTE: has ISO 639-3 code uzs assigned to it.
"Afghan Uzbek",
1066787,
"uz",
aliases = {"Southern Uzbek"},
translit = "uz-afg-translit",
}
m["xbo-dan"] = {
"Danube Bulgar",
nil,
"xbo",
}
m["xbo-vol"] = {
"Volga Bulgar",
nil,
"xbo",
}
----------------------------------------------------------------------------------------------------------------------
-- Uralic varieties --
----------------------------------------------------------------------------------------------------------------------
m["fiu-pro"] = {
"Proto-Finno-Ugric",
79890,
"urj-pro",
}
m["urj-fpr-pro"] = {
"Proto-Finno-Permic",
nil,
"urj-pro",
}
m["krl-nor"] = {
"North Karelian",
125501196,
"krl",
}
m["krl-sou"] = {
"South Karelian",
129812730,
"krl",
}
m["mns-eas"] = {
"Eastern Mansi",
30311755,
"mns-cen",
}
m["mns-wes"] = {
"Western Mansi",
30311756,
"mns-cen",
}
----------------------------------------------------------------------------------------------------------------------
-- Yeniseian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Four reconstructed branch-level proto-lects. Each one lists "qfa-yen-pro"
-- in its third slot and names its own branch in `family`.
m["qfa-yke-pro"] = {
	"Proto-Ketic",
	nil,
	"qfa-yen-pro",
	family = "qfa-yke",
}

m["qfa-yko-pro"] = {
	"Proto-Kottic",
	nil,
	"qfa-yen-pro",
	family = "qfa-yko",
}

m["qfa-yrn-pro"] = {
	"Proto-Arinic",
	nil,
	"qfa-yen-pro",
	family = "qfa-yrn",
}

m["qfa-ypm-pro"] = {
	"Proto-Pumpokolic",
	nil,
	"qfa-yen-pro",
	family = "qfa-ypm",
}
----------------------------------------------------------------------------------------------------------------------
-- Miscellaneous varieties --
----------------------------------------------------------------------------------------------------------------------
m["mul-tax"] = {
"taxonomic name",
522190,
"mul",
}
-----------------------------------------------------
-- Elamite varieties --
-----------------------------------------------------
m["elx-old"] = {
"Old Elamite",
nil,
"elx",
}
m["elx-mid"] = {
"Middle Elamite",
nil,
"elx",
}
m["elx-neo"] = {
"Neo-Elamite",
nil,
"elx",
}
m["elx-ach"] = {
"Achaemenid Elamite",
nil,
"elx",
}
-----------------------------------------------------
-- Substrates --
-----------------------------------------------------
-- Pre-Roman substrates
m["qsb-ibe"] = {
"Paleo-Hispanic",
246801,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Hispanic", "Paleohispanic", "Palaeohispanic", "Paleo-Iberian", "Palaeo-Iberian"},
}
m["qsb-bal"] = {
"Paleo-Balkan",
1815070,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Balkan", "Paleobalkan", "Palaeobalkan"},
}
m["xaq"] = {
"Aquitanian",
500522,
"euq-pro",
family = "euq",
}
return require("Module:languages").finalizeData(m, "language", true)
m0kf8si8j2kroiptllxmke9gy47tv4l
234830
234829
2026-05-24T08:12:37Z
Lee
19
පැරණි සංස්කරණයකින් ගත් කොටස්...
234830
Scribunto
text/plain
local m_langdata = require("Module:languages/data")
-- Lazy wrapper: the string-utilities module is only required the first time
-- `u` is actually called, because the data in this module may never need it.
local function u(...)
	-- Rebind the local `u` to the real `char` function so that every later
	-- call goes straight to it and skips this wrapper.
	local char = require("Module:string utilities").char
	u = char
	return char(...)
end
local c = m_langdata.chars
local p = m_langdata.puaChars
local s = m_langdata.shared
local m = {}
----------------------------------------------------------------------------------------------------------------------
-- Afroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Berber varieties --
--------------------------------------------------------------------------------------
m["shi-med"] = {
"Medieval Tashelhit",
34152,
"shi",
}
-- Tuareg lects
m["thv"] = {
"Tamahaq",
56703,
"tmh",
}
m["ttq"] = {
"Tawellemmet",
56390,
"tmh",
}
m["taq"] = {
"Tamasheq",
4670066,
"tmh",
}
m["thz"] = {
"Tayert",
56388,
"tmh",
}
m["thv-ght"] = {
"Ghat",
47012900,
"thv",
}
--------------------------------------------------------------------------------------
-- Cushitic varieties --
--------------------------------------------------------------------------------------
-- Oromo varieties
m["hae"] = {
"Harar Oromo",
5330355,
"om",
aliases = {"Eastern Oromo"},
}
m["gax"] = {
"Borana",
2910610,
"om",
aliases = {"Southern Oromo"},
}
m["orc"] = {
"Orma",
2919128,
"om",
}
m["ssn"] = {
"Waata",
3501553,
"om",
}
--------------------------------------------------------------------------------------
-- Egyptian varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Ancient Egyptian varieties --
-----------------------------------------------------
m["egy-old"] = {
"Old Egyptian",
447117,
"egy",
}
m["egy-mid"] = {
"Middle Egyptian",
657330,
"egy",
aliases = {"Classical Egyptian"},
}
m["egy-nmi"] = {
"Neo-Middle Egyptian",
123735278,
"egy",
aliases = {"Égyptien de tradition", "Traditional Egyptian"},
}
m["egy-lat"] = {
"Late Egyptian",
1852329,
"egy",
}
-----------------------------------------------------
-- Coptic varieties --
-----------------------------------------------------
m["cop-akh"] = {
"Akhmimic Coptic",
125176464,
"cop",
aliases = {"Akhmimic"},
}
m["cop-boh"] = {
"Bohairic Coptic",
890733,
"cop",
aliases = {"Bohairic", "Memphitic Coptic", "Memphitic"},
}
m["cop-ggg"] = {
"Coptic Dialect G",
nil,
"cop",
aliases = {"Dialect G", "Mansuric Coptic", "Mansuric"},
}
m["cop-jjj"] = {
"Coptic Dialect J",
nil,
"cop",
}
m["cop-kkk"] = {
"Coptic Dialect K",
nil,
"cop",
}
m["cop-ppp"] = {
"Coptic Dialect P",
nil,
"cop",
aliases = {"Proto-Theban Coptic", "Palaeo-Theban Coptic"},
}
m["cop-fay"] = {
"Fayyumic Coptic",
1399115,
"cop",
aliases = {"Fayyumic", "Faiyumic Coptic", "Faiyumic", "Fayumic Coptic", "Fayumic",
"Bashmuric Coptic", "Bashmuric"},
}
m["cop-her"] = {
"Hermopolitan Coptic",
nil,
"cop",
aliases = {"Hermopolitan", "Coptic Dialect H", "Ashmuninic", "Ashmuninic Coptic"},
}
m["cop-lyc"] = {
"Lycopolitan Coptic",
nil,
"cop",
aliases = {
"Lycopolitan",
"Assiutic Coptic", "Asyutic Coptic", "Assiutic", "Asyutic",
"Lyco-Diospolitan Coptic", "Lyco-Diospolitan",
"Subakhmimic Coptic", "Subakhmimic"
},
}
m["cop-old"] = {
"Old Coptic",
115518040,
"cop",
}
m["cop-oxy"] = {
"Oxyrhynchite Coptic",
nil,
"cop",
aliases = {"Oxyrhynchite", "Mesokemic Coptic", "Mesokemic", "Middle Egyptian Coptic"},
}
m["cop-ply"] = {
"Proto-Lycopolitan Coptic",
nil,
"cop",
aliases = {"Coptic Dialect i", "Proto-Lyco-Diospolitan Coptic"},
}
m["cop-sah"] = {
"Sahidic Coptic",
2645851,
"cop",
aliases = {"Sahidic", "Saidic Coptic", "Saidic", "Thebaic Coptic", "Thebaic"},
}
--------------------------------------------------------------------------------------
-- Semitic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akkadian varieties --
-----------------------------------------------------
m["akk-old"] = {
"Old Akkadian",
nil,
"akk",
}
m["akk-obb"] = {
"Old Babylonian",
nil,
"akk",
}
m["akk-oas"] = {
"Old Assyrian",
nil,
"akk",
}
m["akk-mbb"] = {
"Middle Babylonian",
nil,
"akk",
}
m["akk-mas"] = {
"Middle Assyrian",
nil,
"akk",
}
m["akk-nbb"] = {
"Neo-Babylonian",
nil,
"akk",
}
m["akk-nas"] = {
"Neo-Assyrian",
nil,
"akk",
}
m["akk-lbb"] = {
"Late Babylonian",
nil,
"akk",
}
m["akk-stb"] = {
"Standard Babylonian",
nil,
"akk",
}
-----------------------------------------------------
-- Arabic varieties --
-----------------------------------------------------
m["jrb"] = {
"Judeo-Arabic",
37733,
"ar",
pseudo_families = "qfa-jew",
}
m["apc-leb"] = {
"Lebanese North Levantine Arabic",
1516642,
"apc",
aliases = {"Lebanese Arabic"},
}
m["apc-sle"] = {
"South Lebanese North Levantine Arabic",
14206590,
"apc",
aliases = {"South Lebanese Arabic"},
}
m["apc-nle"] = {
"North Lebanese North Levantine Arabic",
nil,
"apc",
aliases = {"North Lebanese Arabic"},
}
m["apc-syr"] = {
"Syrian North Levantine Arabic",
2143071,
"apc",
aliases = {"Syrian Arabic"},
}
m["apc-ale"] = {
"Aleppine North Levantine Arabic",
7056921,
"apc-syr",
aliases = {"Aleppo Arabic", "Aleppine Arabic"},
}
m["apc-dam"] = {
"Damascene North Levantine Arabic",
12237466,
"apc-syr",
aliases = {"Damascus Arabic", "Damascene Arabic"},
}
m["acm-khu"] = {
"Khuzestani Arabic",
1040944,
"acm",
}
-----------------------------------------------------
-- Aramaic varieties --
-----------------------------------------------------
m["arc-bib"] = {
"Biblical Aramaic",
843235,
"arc",
family = "sem-are",
}
m["arc-cpa"] = {
"Christian Palestinian Aramaic",
60790119,
"arc",
family = "sem-arw",
aliases = {"Melkite Aramaic", "Palestinian Syriac", "Syropalestinian Aramaic"},
}
m["arc-imp"] = {
"Imperial Aramaic",
7079491,
"arc",
aliases = {"Official Aramaic"},
}
m["arc-hat"] = {
"Hatran Aramaic",
3832926,
"arc",
family = "sem-are",
}
m["arc-jla"] = {
"Jewish Literary Aramaic",
105952842,
"arc",
pseudo_families = "qfa-jew",
}
m["arc-nab"] = {
"Nabataean Aramaic",
36178,
"arc",
}
m["arc-old"] = {
"Old Aramaic",
3398392,
"arc",
}
m["arc-pal"] = {
"Palmyrene Aramaic",
1510113,
"arc",
family = "sem-arw",
}
m["tmr"] = {
"Jewish Babylonian Aramaic",
33407,
"arc",
family = "sem-ase",
pseudo_families = "qfa-jew",
}
m["jpa"] = {
"Jewish Palestinian Aramaic",
948909,
"arc",
family = "sem-arw",
aliases = {"Galilean Aramaic"},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Hebrew varieties --
-----------------------------------------------------
m["hbo"] = {
"Biblical Hebrew",
1982248,
"he",
aliases = {"Classical Hebrew"},
}
m["he-mis"] = {
"Mishnaic Hebrew",
1649362,
"he",
ancestors = "hbo",
}
m["he-med"] = {
"Medieval Hebrew",
2712572,
"he",
ancestors = "he-mis",
}
m["he-IL"] = {
"Israeli Hebrew",
8141,
"he",
}
----------------------------------------------------------------------------------------------------------------------
-- Ainu varieties --
----------------------------------------------------------------------------------------------------------------------
m["ain-hok"] = {
"Hokkaido Ainu",
20968488,
"ain",
aliases = {"Hokkaidō Ainu"},
}
m["ain-kur"] = {
"Kuril Ainu",
20967012,
"ain",
}
m["ain-sak"] = {
"Sakhalin Ainu",
20747371,
"ain",
}
----------------------------------------------------------------------------------------------------------------------
-- American indigenous varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Inuit varieties --
-----------------------------------------------------
-- Trailing commas added after the last element so these two entries are
-- punctuated like the other entries in this module.
m["esi"] = {
	"North Alaskan Inupiatun",
	nil,
	"ik",
}

m["esk"] = {
	"Northwest Alaskan Inupiatun",
	25559714,
	"ik",
}
-----------------------------------------------------
-- Iroquoian varieties --
-----------------------------------------------------
m["iro-ohu"] = {
"Old Wendat",
nil,
"wdt",
}
m["iro-omo"] = {
"Old Mohawk",
nil,
"moh",
}
m["iro-oon"] = {
"Old Onondaga",
nil,
"ono",
}
-----------------------------------------------------
-- Tupi-Guarani varieties --
-----------------------------------------------------
-- Old Tupi varieties
m["tpw-lga"] = {
"Língua Geral Amazônica",
18275323,
"tpw",
aliases = {"Língua Geral"},
}
m["tpw-lgp"] = {
"Língua Geral Paulista",
2669239,
"tpw",
}
----------------------------------------------------------------------------------------------------------------------
-- Austroasiatic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Khmer varieties
m["okz-ang"] = {
"Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
m["okz-pre"] = {
"Pre-Angkorian Old Khmer",
nil,
"okz",
wikipedia_article = "Khmer language#Historical periods",
}
-- Central Nicobarese varieties
m["ncb-cam"] = {
"Camorta",
5026908,
"ncb",
aliases = {"Kamorta"},
}
m["ncb-kat"] = {
"Katchal",
17064263,
"ncb",
aliases = {"Tehnu"},
}
m["ncb-nan"] = {
"Nancowry",
6962504,
"ncb",
aliases = {"Nankwari"},
}
----------------------------------------------------------------------------------------------------------------------
-- Austronesian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Malay and related varieties
m["ms-old"] = { -- this has the ISO code 'omy'
"Old Malay",
nil,
"ms",
}
m["ms-cla"] = {
"Classical Malay",
nil,
"ms",
ancestors = "ms-old",
}
m["pse-bsm"] = {
"Besemah",
nil,
"pse",
}
m["bew-kot"] = {
"Betawi Kota",
nil,
"bew",
aliases = {"Urban Betawi"}, -- in Jakarta
}
-- Philippine varieties
m["xnn"] = {
"Northern Kankanaey",
12953609,
"kne",
aliases = {"Northern Kankanay", "Northern Kankana-ey"},
}
m["tl-old"] = {
"Old Tagalog",
12967437,
"tl",
}
m["tl-cls"] = {
"Classical Tagalog",
nil,
"tl",
}
----------------------------------------------------------------------------------------------------------------------
-- Caucasian varieties --
----------------------------------------------------------------------------------------------------------------------
-- Kartvelian varieties
m["ka-mid"] = {
"Middle Georgian",
nil,
"ka",
ancestors = "oge",
}
----------------------------------------------------------------------------------------------------------------------
-- Dravidian varieties --
----------------------------------------------------------------------------------------------------------------------
m["ta-mid"] = {
"Middle Tamil",
20987434,
"ta",
}
m["kn-hav"] = {
"Havigannada",
24276369,
"kn",
}
m["kn-kun"] = {
"Kundagannada",
6444255,
"kn",
}
----------------------------------------------------------------------------------------------------------------------
-- Indo-European varieties --
----------------------------------------------------------------------------------------------------------------------
--------------------------------------------------------------------------------------
-- Albanian varieties --
--------------------------------------------------------------------------------------
m["aln"] = {
"Gheg Albanian",
181037,
"sq",
aliases = {"Gheg"},
}
m["aae"] = {
"Arbëresh Albanian",
1075302,
"als",
aliases = {"Arbëreshë", "Arbëresh"},
}
m["aat"] = {
"Arvanitika Albanian",
29347,
"als",
aliases = {"Arvanitika"},
}
m["als"] = {
"Tosk Albanian",
180937,
"sq",
aliases = {"Tosk"},
}
--------------------------------------------------------------------------------------
-- Armenian varieties --
--------------------------------------------------------------------------------------
m["hyw"] = {
"Western Armenian",
180945,
"hy",
}
m["hye"] = {
"Eastern Armenian",
181059,
"hy",
}
--------------------------------------------------------------------------------------
-- Balto-Slavic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Baltic varieties --
-------------------------------------------------------------------------
m["bat-pro"] = {
"Proto-Baltic",
1703347,
"ine-bsl-pro",
}
m["bat-dni"] = {
"Dnieper Baltic",
4163178,
"bat-pro",
family = "bat",
aliases = {"Dniepr Baltic", "Dnieper-Oka Baltic", "Dniepr-Oka Baltic"},
}
m["bat-gol"] = {
"Golyad",
4142855,
"bat-dni",
aliases = {"Eastern Galindian", "East Galindian"},
}
-------------------------------------------------------------------------
-- Slavic varieties --
-------------------------------------------------------------------------
-----------------------------------------------------
-- Bulgarian varieties --
-----------------------------------------------------
m["cu-bgm"] = {
	"Middle Bulgarian",
	12294897,
	"cu",
	-- The `ancestors` value repeats the code given in the third slot.
	ancestors = "cu",
}
-----------------------------------------------------
-- Church Slavonic varieties --
-----------------------------------------------------
-- Old Moscow Church Slavonic deleted as it seems not distinct enough from Russian (Synodal) Church Slavonic.
m["zls-chs-ru"] = {
"Russian Church Slavonic",
21662400,
"zls-chs",
aliases = {"Synodal Church Slavonic", "New Moscow Church Slavonic", "Novomoskovsk Church Slavonic"},
}
m["zls-chs-uk"] = {
"Ukrainian Church Slavonic",
12153548,
"zls-chs",
aliases = {"Rusyn Church Slavonic", "Belarusian Church Slavonic"},
}
--[=[
-- Not sure about these yet.
m["zls-chs-bg"] = {
"Bulgarian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-cs"] = {
"Czech Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-hr"] = {
"Croatian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-mk"] = {
"Macedonian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-ro"] = {
"Romanian Church Slavonic",
nil,
"zls-chs",
}
m["zls-chs-sr"] = {
"Serbian Church Slavonic",
nil,
"zls-chs",
}
]=]
-----------------------------------------------------
-- Czech varieties --
-----------------------------------------------------
m["cs-ear"] = {
	"Early Modern Czech",
	nil,
	"cs",
	ancestors = "zlw-ocs",
}
-----------------------------------------------------
-- East Slavic varieties --
-----------------------------------------------------
m["zle-ops"] = {
"Old Pskovian",
4167885,
"zle-ono",
}
m["zle-mru"] = {
	"Middle Russian",
	35228,
	"ru",
	"Cyrs",
	translit = "ru-translit",
	ancestors = "orv",
	strip_diacritics = {
		-- Keyed by script code; the value is the concatenation of the
		-- `grave`, `acute` and `diaer` entries of the shared `chars` table.
		Cyrs = {remove_diacritics = c.grave .. c.acute .. c.diaer},
	},
}
m["zle-mbe"] = {
"Middle Belarusian",
13211, -- NOTE(review): same number as "zle-muk" below; confirm the two are meant to share it
"zle-ort",
}
m["zle-muk"] = {
"Middle Ukrainian",
13211, -- NOTE(review): same number as "zle-mbe" above; confirm the two are meant to share it
"zle-ort",
}
m["uk-CA"] = {
"Canadian Ukrainian",
4161010,
"uk",
}
-----------------------------------------------------
-- Polish varieties --
-----------------------------------------------------
m["zlw-mpl"] = {
	"Middle Polish",
	402878,
	"pl",
	ancestors = "zlw-opl",
	strip_diacritics = {
		remove_diacritics = c.acute,
		-- Upper/lower-case pairs, one pair per line.
		-- Presumably these letters keep their acute despite the rule above; TODO confirm.
		remove_exceptions = {
			"Ć", "ć",
			"Ń", "ń",
			"Ó", "ó",
			"Ś", "ś",
			"Ź", "ź",
		},
	},
}
m["pl-gre"] = {
"Greater Polish",
4106789,
"pl",
}
m["pl-les"] = {
"Lesser Polish",
361709,
"pl",
}
m["pl-mas"] = {
"Masovian Polish",
4274559,
"pl",
}
m["pl-gor"] = {
"Goral",
452889,
"pl",
}
-----------------------------------------------------
-- Serbo-Croatian varieties --
-----------------------------------------------------
m["ckm"] = {
"Chakavian Serbo-Croatian",
337565,
"sh",
aliases = {"Čakavian"},
}
m["kjv"] = {
"Kajkavian Serbo-Croatian",
838165,
"sh",
}
m["sh-tor"] = { -- Linguist code srp-tor
"Torlakian Serbo-Croatian",
1078803,
"sh",
aliases = {"Torlak"},
}
--------------------------------------------------------------------------------------
-- Celtic varieties --
--------------------------------------------------------------------------------------
-----------------------------------------------------
-- Brythonic varieties --
-----------------------------------------------------
m["bry-ear"] = {
"Early Brythonic",
nil,
"cel-bry-pro",
}
m["bry-lat"] = {
"Late Brythonic",
nil,
"cel-bry-pro",
}
-----------------------------------------------------
-- Gaulish varieties --
-----------------------------------------------------
m["xcg"] = {
"Cisalpine Gaulish",
3832927,
"cel-gau",
}
m["xtg"] = {
"Transalpine Gaulish",
29977,
"cel-gau",
}
-----------------------------------------------------
-- Welsh varieties --
-----------------------------------------------------
m["cy-nor"] = {
"North Wales Welsh",
13127692,
"cy",
aliases = {"North Walian Welsh", "Northern Welsh"},
}
m["cy-sou"] = {
"South Wales Welsh",
13127689,
"cy",
aliases = {"South Walian Welsh", "Southern Welsh"},
}
--------------------------------------------------------------------------------------
-- Germanic varieties --
--------------------------------------------------------------------------------------
-- Proto-West Germanic varieties
m["frk"] = {
"Frankish",
10860505,
"gmw-pro",
family = "gmw-frk",
aliases = {"Old Frankish"},
}
m["gem-sue"] = {
"Suevic",
134600275,
"gmw-pro",
aliases = {"Suebian"},
}
m["gmw-afr-pro"] = {
"Proto-Anglo-Frisian",
134603379,
"gmw-nsg-pro",
family = "gmw-afr",
}
m["gmw-nsg-pro"] = {
"Proto-North Sea Germanic",
134603374,
"gmw-pro",
family = "gmw-nsg",
aliases = {"Proto-Ingvaeonic"},
}
-----------------------------------------------------
-- Dutch varieties --
-----------------------------------------------------
m["nl-BE"] = {
"Belgian Dutch",
34147,
"nl",
aliases = {"Flemish", "Flemish Dutch", "Southern Dutch"},
}
-----------------------------------------------------
-- English and Scots varieties --
-----------------------------------------------------
-- English varieties
m["en-AU"] = {
"Australian English",
44679,
"en",
}
m["en-GB"] = {
"British English",
7979,
"en",
}
m["en-GB-SCT"] = {
"Scottish English",
44676, -- NOTE(review): same number as "en-GB-WLS" and "en-CA"; presumably an identifier that should differ per variety — verify
"en-GB",
}
m["en-GB-WLS"] = {
"Welsh English",
44676, -- NOTE(review): same number as "en-GB-SCT" and "en-CA"; looks copy-pasted — verify
"en-GB",
}
m["en-IM"] = {
"Manx English",
6753295,
"en-GB",
}
m["en-aae"] = {
"Australian Aboriginal English",
783347,
"en-AU",
}
m["en-ear"] = {
"Early Modern English",
1472196,
"en",
ancestors = "enm",
aliases = {"Early New English"},
}
m["en-geo"] = {
"Geordie",
653421,
"en",
ancestors = "enm-nor",
}
m["en-IE"] = { -- FIXME: "IE" doesn't cover Northern Ireland
"Irish English",
665624,
"en",
}
m["en-uls"] = {
"Ulster English",
6840826,
"en-IE",
}
m["en-GB-NIR"] = {
"Northern Irish English",
6840826, -- actually the code for Ulster English
"en-uls",
}
m["en-NNN"] = { -- not "NA", which is Namibia; NNN is the NATO 3-letter code for North America
-- NOTE(review): the name below is partly in Sinhala, unlike the neighbouring "... English" entries; confirm this is intended.
"North American ඉංග්රීසි",
7053766,
"en",
ietf_subtag = "en-021" -- 021 = UN M49 code for "Northern America" (i.e. North America without Central America or the Caribbean)
}
m["en-US"] = {
"American English",
7976,
"en-NNN",
}
-- Trailing commas added after the last element so these two entries are
-- punctuated like the other English varieties in this module.
m["en-NZ"] = {
	"New Zealand English",
	44661,
	"en",
}

m["en-ZA"] = {
	"South African English",
	1156228,
	"en",
}
m["en-US-CA"] = {
"California English",
1026812,
"en-US",
}
m["en-CA"] = {
	"Canadian English",
	44676,
	-- Grouped under North American English ("en-NNN") alongside "en-US".
	-- The previous value "en-US" made Canadian English a sub-variety of
	-- American English.
	"en-NNN",
}
m["en-HK"] = {
"Hong Kong English",
1068863,
"en",
}
m["en-IN"] = {
"Indian English",
1348800,
"en",
}
m["pld"] = {
"Polari",
1359130,
"en",
}
-- Scots varieties
m["sco-ins"] = {
"Insular Scots",
16919205,
"sco",
}
m["sco-uls"] = {
"Ulster Scots",
201966,
"sco",
}
m["sco-nor"] = {
"Northern Scots",
16928150,
"sco",
}
m["sco-sou"] = {
"Southern Scots",
7570457,
"sco",
aliases = {"South Scots", "Borders Scots"},
}
-- Middle English varieties
m["enm-esc"] = { -- Part of Middle English until it developed into Middle Scots.
"Early Scots",
5326738,
"enm",
ancestors = "enm-nor",
aliases = {"Old Scots", "Scottish Middle English"},
}
m["enm-emi"] = {
"East Midland Middle English",
134238810,
"enm",
ancestors = "ang-ang", -- Technically ang-mer, but attested Mercian is mostly WM IIRC
}
m["enm-ken"] = {
"Kentish Middle English",
134238532,
"enm",
ancestors = "ang-ken",
}
m["enm-nor"] = {
"Northern Middle English",
134238541,
"enm",
ancestors = "ang-nor",
}
m["enm-sou"] = {
"Southern Middle English",
134238528,
"enm",
ancestors = "ang-wsx",
}
m["enm-wmi"] = {
"West Midland Middle English",
134238824,
"enm",
ancestors = "ang-mer",
}
-- Old English varieties
-- Includes both Mercian and Northumbrian.
m["ang-ang"] = {
"Anglian Old English",
121142917,
"ang",
}
m["ang-ken"] = {
"Kentish Old English",
11687485,
"ang",
}
m["ang-mer"] = {
"Mercian Old English",
602072,
"ang-ang",
}
m["ang-nor"] = {
"Northumbrian Old English",
1798915,
"ang-ang",
}
m["ang-wsx"] = {
"West Saxon Old English",
2658603,
"ang",
}
-----------------------------------------------------
-- High German varieties --
-----------------------------------------------------
-- (modern) German varieties
m["de-AT"] = {
"Austrian German",
306626,
"de",
}
m["de-AT-vie"] = {
"Viennese German",
56474,
"de-AT",
}
m["de-CH"] = {
"Switzerland German",
1366643,
"de",
aliases = {"Schweizer Hochdeutsch", "Swiss Standard German", "Swiss High German"},
}
m["de-bal"] = {
"Baltic German",
15785413,
"de",
}
m["de-ear"] = {
"Early New High German",
1472199,
"de",
ancestors = "gmh",
aliases = {"Early Modern High German"},
}
m["ksh"] = {
"Kölsch",
4624,
"gmw-cfr",
}
m["pfl"] = {
"Palatine German",
23014,
"gmw-rfr",
aliases = {"Pfälzisch", "Pälzisch", "Palatinate German"},
}
m["sli"] = {
"Silesian East Central German",
152965,
"gmw-ecg",
aliases = {"Silesian"},
}
m["sxu"] = {
"Upper Saxon German",
699284,
"gmw-ecg",
}
-- Old High German varieties
m["lng"] = {
"Lombardic",
35972,
"goh",
}
-- Alemannic German varieties
m["gsw-low"] = {
"Low Alemannic German",
503724,
"gsw",
}
m["gsw-FR-als"] = {
"Alsatian Alemannic German",
8786,
"gsw-low",
}
m["gsw-hig"] = {
"High Alemannic German",
503728,
"gsw",
}
m["gsw-hst"] = {
"Highest Alemannic German",
687538,
"gsw",
}
m["wae"] = {
"Walser German",
680517,
"gsw-hst",
}
-----------------------------------------------------
-- Low German varieties --
-----------------------------------------------------
-- The two national groupings of Low German. Each carries an explicit IETF
-- subtag that differs from its table key only in letter case.
m["nds-de"] = {
	"German Low German",
	25433,
	"nds",
	wikimedia_codes = "nds",
	ietf_subtag = "nds-DE", -- should we make this the actual code?
}

m["nds-nl"] = {
	"Dutch Low Saxon",
	516137,
	"nds",
	wikimedia_codes = "nds-nl",
	ietf_subtag = "nds-NL", -- should we make this the actual code?
}
m["act"] = {
"Achterhoeks",
153627,
"nds-nl",
aliases = {"Achterhoek", "Achterhooks"},
}
m["drt"] = {
"Drents",
2736709,
"nds-nl",
aliases = {"Drèents", "Dreins", "Dreints", "Drints"},
}
m["frs"] = {
"East Frisian Low German",
149208,
"nds-de",
aliases = {"East Frisian", "East Frisian Low Saxon"},
}
m["gos"] = {
"Gronings",
508854,
"nds-nl",
aliases = {"Grunnegs", "Grönnegs"},
}
m["nds-lpr"] = {
"Low Prussian",
33982,
"nds-de",
}
m["sdz"] = {
"Sallands",
3436668,
"nds-nl",
aliases = {"Sallaans", "Sallaands"},
}
m["stl"] = {
"Stellingwerfs",
506010,
"nds-nl",
aliases = {"Stellingwarfs"},
}
m["twd"] = {
"Twents",
497363,
"nds-nl",
aliases = {"Tweants"},
}
m["vel"] = {
"Veluws",
2484810,
"nds-nl",
}
m["wep"] = {
"Westphalian",
505655,
"nds-de",
aliases = {"Westfalish", "Westphalien"},
}
-----------------------------------------------------
-- North Frisian varieties --
-----------------------------------------------------
m["frr-ins"] = {
"Insular North Frisian",
110629610,
"frr",
}
m["frr-fam"] = {
"Föhr-Amrum North Frisian",
110629601,
"frr-ins",
}
m["frr-foh"] = {
"Föhr North Frisian",
28185,
"frr-fam",
aliases = {"Föhr Frisian", "Fering",
"Ferring", -- Glottolog
},
varieties = {"Aasdring", "Weesdring"},
}
m["frr-amr"] = {
"Amrum North Frisian",
28192,
"frr-fam",
aliases = {"Amrum Frisian", "Amrum", "Öömrang"},
}
m["frr-hel"] = {
"Heligoland North Frisian",
28086,
"frr-ins",
aliases = {"Heligoland Frisian", "Halunder", "Heligolandic Frisian", "Heligolandic North Frisian",
"Helgoland Frisian", "Helgoland North Frisian", "Helgoland"},
}
m["frr-syl"] = {
"Sylt North Frisian",
28181,
"frr-ins",
aliases = {"Sylt Frisian", "Söl'ring",
"Sölreng", -- Glottolog
},
}
m["frr-mai"] = {
"Mainland North Frisian",
110629626,
"frr",
}
m["frr-hal"] = {
"Halligen North Frisian",
28177,
"frr-mai",
aliases = {"Halligen Frisian", "Halifreesk", "Hallingen Frisian", "Hallingen North Frisian",
"Hallingen", -- Glottolog
},
}
m["frr-moo"] = {
"Mooring North Frisian",
28187,
"frr-mai",
aliases = {"Bökingharde North Frisian", "Bökingharde Frisian", "Böökinghiirder frasch",
"Mooring", "Moring",
},
varieties = {{"East Mooring", "Ostermooring"}, {"West Mooring", "Westermooring"}},
}
m["frr-kar"] = {
"Karrharde North Frisian",
28191,
"frr-mai",
aliases = {"Karrharde Frisian", "Karrharder",
},
}
m["frr-goe"] = {
-- Technically this refers to three adjacent dialects (Northern, Central and Southern), the latter of which went
-- extinct in 1980-1981. As a result, Glottolog speaks of "Norder-Mittelgoesharde", referring to the remaining two.
"Goesharde North Frisian",
28183,
"frr-mai",
aliases = {"Norder-Mittelgoesharde North Frisian", "Norder-Mittelgoesharde Frisian", "Norder-Mittelgoesharde",
"Goesharde Frisian", "Goesharde", "Gooshiirder",
},
}
m["frr-wie"] = {
"Wiedingharde North Frisian",
28171,
"frr-mai",
aliases = {"Wiedingharde Frisian", "Wiedingharde", "Wiringhiirder freesk",
},
}
-----------------------------------------------------
-- Old Norse varieties --
-----------------------------------------------------
-- Greenlandic Norse hangs off Old West Norse ("non-own"), which is defined
-- further down in this same group.
m["non-grn"] = {
	"Greenlandic Norse",
	855236,
	"non-own",
}

-- The East and West entries each give "non" both in the third slot and as
-- their `ancestors` value.
m["non-oen"] = {
	"Old East Norse",
	10498031,
	"non",
	ancestors = "non",
}

m["non-own"] = {
	"Old West Norse",
	2377483,
	"non",
	ancestors = "non",
}
-----------------------------------------------------
-- Old Swedish varieties --
-----------------------------------------------------
m["gmq-osw-lat"] = {
"Late Old Swedish",
10723594,
"gmq-osw",
ancestors = "gmq-osw",
}
--------------------------------------------------------------------------------------
-- Greek varieties --
--------------------------------------------------------------------------------------
m["qsb-grc"] = {
"Pre-Greek",
965052,
"und",
family = "qfa-sub",
}
m["grc-aeo"] = {
"Aeolic Greek",
406373,
"grc",
aliases = {"Lesbic Greek", "Lesbian Greek", "Aeolian Greek"},
}
m["grc-arc"] = {
"Arcadian Greek",
nil,
"grc-arp",
}
m["grc-arp"] = {
"Arcadocypriot Greek",
499602,
"grc",
}
m["grc-att"] = {
"Attic Greek",
506588,
"grc",
}
m["grc-boi"] = {
"Boeotian Greek",
406373, -- NOTE(review): same number as "grc-aeo" (Aeolic Greek) and "grc-ths"; confirm this reuse is deliberate
"grc-aeo",
}
m["grc-cyp"] = {
"Cypriot Ancient Greek", -- to distinguish from Cypriot Greek below
nil,
"grc-arp",
}
m["grc-dor"] = {
"Doric Greek",
285494,
"grc",
}
m["grc-ela"] = {
"Elean Greek",
nil,
"grc",
}
m["grc-epi"] = {
"Epic Greek",
990062,
"grc",
aliases = {"Homeric Greek"},
}
m["grc-ion"] = {
"Ionic Greek",
504165,
"grc",
}
m["grc-koi"] = {
"Koine Greek",
107358,
"grc",
ancestors = "grc-att",
aliases = {"Hellenistic Greek"},
}
m["grc-kre"] = {
"Cretan Ancient Greek", -- to distinguish from Cretan Greek below
nil,
"grc-dor",
}
m["grc-opl"] = {
"Opuntian Locrian",
nil,
"grc",
}
m["grc-ozl"] = {
"Ozolian Locrian",
nil,
"grc",
}
m["grc-pam"] = {
"Pamphylian Greek",
2271793,
"grc",
}
m["grc-ths"] = {
"Thessalian Greek",
406373, -- NOTE(review): same number as "grc-aeo" (Aeolic Greek) and "grc-boi"; confirm this reuse is deliberate
"grc-aeo",
}
m["gkm"] = {
"Byzantine Greek",
36387,
"grc",
ancestors = "grc-koi",
aliases = {"Medieval Greek"},
}
m["el-cyp"] = {
"Cypriot Greek",
245899,
"el",
aliases = {"Cypriotic Greek"},
}
m["el-pap"] = {
"Paphian Greek",
nil,
"el",
}
m["el-crt"] = {
"Cretan Greek",
588306,
"el",
}
m["el-kth"] = {
"Katharevousa",
35961,
"el",
"Polyt",
ancestors = "gkm",
aliases = {"Katharevousa Greek"},
-- Polyt display_text, strip_diacritics, sort_key in [[Module:scripts/data]]
}
m["el-kal"] = {
"Kaliarda",
12878658,
"el",
}
--------------------------------------------------------------------------------------
-- Indo-Iranian varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Indo-Aryan varieties --
-------------------------------------------------------------------------
-- reconstructed intermediate stages
m["pra-pro"] = {
"Proto-New Indo-Aryan",
nil,
"pra",
}
m["inc-ash-pro"] = {
"Proto-Middle Indo-Aryan",
nil,
"inc-ash",
}
m["inc-mit"] = {
"Mitanni",
1986700,
"inc-pro",
}
m["bra-old"] = {
"Old Braj",
nil,
"bra",
}
-- Apabhramsas
m["inc-aav"] = {
"Avahattha",
nil,
"inc-apa",
aliases = {"Abahattha"},
}
m["inc-asa"] = {
"Sauraseni Apabhramsa",
nil,
"inc-apa",
}
m["inc-agu"] = {
"Gurjara Apabhramsa",
nil,
"inc-apa",
}
m["inc-aka"] = {
"Kasmiri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ama"] = {
"Maharastri Apabhramsa",
nil,
"inc-apa",
}
m["inc-ata"] = {
"Takka Apabhramsa",
nil,
"inc-apa",
}
m["inc-avr"] = {
"Vracada Apabhramsa",
nil,
"inc-apa",
}
-- Assamese varieties
m["as-bkm"] = {
"Barpetia Kamrupi Assamese",
30642960,
"as",
}
m["as-nkm"] = {
"Nalbaria Kamrupi Assamese",
85787678,
"as",
}
m["as-pkm"] = {
"Palasbaria Kamrupi Assamese",
nil,
"as",
}
-- Bengali varieties
m["bn-dvn"] = {
"Dhakaiya Vaṅga Bengali",
48726851,
"bn", -- Eastern Bengali variety
}
m["bn-nvn"] = {
"Noakhailla Vaṅga Bengali",
107548681,
"bn", -- Eastern Bengali variety
}
-- Dhivehi varieties
m["dv-old"] = {
"Old Dhivehi",
117790875,
"dv",
}
m["dv-mul"] = {
"Mulaku Dhivehi",
nil,
"dv",
aliases = {"Mulaku Divehi", "Mulaku Bas"},
}
m["dv-huv"] = {
"Huvadhu Dhivehi",
nil,
"dv",
aliases = {"Huvadhu Divehi", "Huvadhu Bas"},
}
m["dv-add"] = {
"Addu Dhivehi",
nil,
"dv",
aliases = {"Addu Divehi", "Addu Bas"},
}
-- Gujarati varieties
m["gu-kat"] = {
"Kathiyawadi",
nil,
"gu",
aliases = {"Kathiyawadi Gujarati", "Kathiawadi"},
}
m["gu-lda"] = {
"Lisan ud-Dawat Gujarati",
nil,
"gu",
aliases = {"Lisan ud-Dawat", "LDA"},
}
-- Hindi varieties
m["hi-mum"] = {
"Bombay Hindi",
3543151,
"hi",
aliases = {"Mumbai Hindi", "Bambaiyya Hindi"},
}
m["hi-mid"] = {
	"Middle Hindi",
	nil,
	"inc-ohi",
	-- The `ancestors` value repeats the code given in the third slot.
	ancestors = "inc-ohi",
}
-- Konkani varieties
m["kok-mid"] = {
"Middle Konkani",
nil,
"kok",
aliases = {"Medieval Konkani"},
}
m["kok-old"] = {
"Old Konkani",
nil,
"kok",
aliases = {"Early Konkani"},
}
-- Prakrits
m["pra-ard"] = {
"Ardhamagadhi Prakrit",
35217,
"pra",
aliases = {"Ardhamagadhi"},
}
m["pra-hel"] = {
"එළු ප්රාකෘත",
15080869,
"pra",
aliases = {"Elu", "Elu Prakrit", "Helu", "Helu Prakrit"},
}
m["pra-kha"] = {
"Khasa Prakrit",
nil,
"pra",
aliases = {"Khasa"},
}
m["pra-mag"] = {
"Magadhi Prakrit", -- Not to be confused with Magahi (mag)
2652214,
"pra",
aliases = {"Magadhi"},
}
m["pra-mah"] = {
"Maharastri Prakrit",
2586773,
"pra",
aliases = {"Maharashtri Prakrit", "Maharastri", "Maharashtri"},
}
-- Paisaci is filed under Sauraseni Prakrit (pra-sau, the entry that follows) and
-- additionally names pra-sau explicitly in its ancestors field.
m["pra-pai"] = {
"Paisaci Prakrit",
2995607,
"pra-sau",
aliases = {"Paisaci", "Paisachi"},
ancestors = "pra-sau",
}
m["pra-sau"] = {
"Sauraseni Prakrit",
2452885,
"pra",
aliases = {"Sauraseni", "Shauraseni"},
}
m["pra-ava"] = {
"Avanti",
nil,
"pra",
aliases = {"Avanti Prakrit"},
}
m["pra-pra"] = {
"Pracya",
nil,
"pra",
aliases = {"Pracya Prakrit"},
}
m["pra-bah"] = {
"Bahliki",
nil,
"pra",
aliases = {"Bahliki Prakrit"},
}
m["pra-dak"] = {
"Daksinatya",
nil,
"pra",
aliases = {"Daksinatya Prakrit"},
}
m["pra-sak"] = {
"Sakari",
nil,
"pra",
aliases = {"Sakari Prakrit"},
}
m["pra-can"] = {
"Candali",
nil,
"pra",
aliases = {"Candali Prakrit"},
}
m["pra-sab"] = {
"Sabari",
nil,
"pra",
aliases = {"Sabari Prakrit"},
}
m["pra-abh"] = {
"Abhiri",
nil,
"pra",
aliases = {"Abhiri Prakrit"},
}
m["pra-dra"] = {
"Dramili",
nil,
"pra",
aliases = {"Dramili Prakrit"},
}
m["pra-odr"] = {
"Odri",
nil,
"pra",
aliases = {"Odri Prakrit"},
}
-- Punjabi varieties
m["pnb"] = {
"Western Punjabi",
58635,
"pa",
"pa-Arab",
}
-- Sanskrit varieties
m["vsn"] = {
"Vedic Sanskrit",
36858,
"sa",
}
m["cls"] = {
"Classical Sanskrit",
9333703,
"sa",
}
m["sa-bhs"] = {
"Buddhist Hybrid Sanskrit",
248758,
"sa",
}
m["sa-bra"] = {
"Brahmanic Sanskrit",
139822891,
"vsn",
}
m["sa-epi"] = {
"Epic Sanskrit",
56702805,
"cls",
}
m["sa-neo"] = {
"New Sanskrit",
nil,
"sa",
}
m["sa-rig"] = {
"Rigvedic Sanskrit",
139822680,
"vsn",
}
-- Sinhalese varieties
m["si-med"] = {
"Medieval Sinhalese",
nil,
"si",
aliases = {"Medieval Sinhala"},
}
-------------------------------------------------------------------------
-- Iranian varieties --
-------------------------------------------------------------------------
m["qsb-bma"] = {
"the BMAC substrate",
133187435,
"und",
family = "qfa-sub",
aliases = {"the Bactria-Margiana substrate", "the Bactria-Margiana Archaeological Complex substrate"},
}
-- Historical and current Iranian dialects
m["ae-old"] = {
"Old Avestan",
29572,
"ae",
aliases = {"Gathic Avestan"},
}
m["ae-yng"] = {
"Younger Avestan",
29572, -- NOTE(review): identical to the Wikidata ID on ae-old; presumably the item for Avestan as a whole -- confirm
"ae-old",
aliases = {"Young Avestan"},
}
-- NOTE(review): bcc, bgp and bgn all carry the same Wikidata ID (33049);
-- presumably this is the item for Balochi as a whole rather than a
-- per-variety item -- confirm and replace with specific IDs if they exist.
m["bcc"] = {
"Southern Balochi",
33049,
"bal",
aliases = {"Southern Baluchi"},
}
m["bgp"] = {
"Eastern Balochi",
33049,
"bal",
aliases = {"Eastern Baluchi"},
}
m["bgn"] = {
"Western Balochi",
33049,
"bal",
aliases = {"Western Baluchi"},
}
m["bsg-ban"] = {
"Bandari",
nil,
"bsg",
}
m["bsg-hor"] = {
"Hormozi",
nil,
"bsg",
}
m["bsg-min"] = {
"Minabi",
nil,
"bsg",
}
m["kho-old"] = {
"Old Khotanese",
nil,
"kho",
}
m["kho-lat"] = {
"Late Khotanese",
nil,
"kho-old",
}
m["peo-ear"] = {
"Early Old Persian",
nil,
"peo",
}
m["peo-lat"] = {
"Late Old Persian",
nil,
"peo",
}
m["pal-ear"] = {
"Early Middle Persian",
nil,
"pal",
}
m["pal-lat"] = {
"Late Middle Persian",
nil,
"pal",
ancestors = "pal-ear",
}
m["ps-nwe"] = {
"Northwestern Pashto",
nil,
"ps",
}
m["ps-cgi"] = {
"Central Ghilzay",
nil,
"ps-nwe",
}
m["ps-mah"] = {
"Mahsudi",
nil,
"ps-nwe",
}
m["ps-nea"] = {
"Northeastern Pashto",
nil,
"ps",
}
m["ps-afr"] = {
"Afridi",
nil,
"ps-nea",
}
m["ps-bng"] = {
"Bangash",
nil,
"ps-nea",
}
m["ps-xat"] = {
"Khatak",
nil,
"ps-nea",
}
m["ps-pes"] = {
"Peshawari",
nil,
"ps-nea",
}
m["ps-sea"] = {
"Southeastern Pashto",
nil,
"ps",
}
m["ps-ban"] = {
"Bannu",
nil,
"ps-sea",
}
m["ps-kak"] = {
"Kakari",
nil,
"ps-sea",
}
m["ps-ser"] = {
"Sher",
nil,
"ps-sea",
}
m["ps-waz"] = {
"Waziri",
12274473,
"ps-sea",
}
m["ps-swe"] = {
"Southwestern Pashto",
nil,
"ps",
}
m["ps-kan"] = {
"Kandahari",
nil,
"ps-swe",
}
-- Unlike the other ps-* entries in this section, Jadrani sets an explicit
-- ancestors field (ira-pat-pro) in addition to its parent code.
m["ps-jad"] = {
"Jadrani",
nil,
"ps",
ancestors = "ira-pat-pro",
}
m["xme-azr"] = {
"Old Azari",
nil,
"xme-ott",
aliases = {"Old Azeri", "Azari", "Azeri", "Āḏarī", "Adari", "Adhari"},
}
m["xme-ttc-cen"] = {
"Central Tati",
nil,
"xme-ott",
}
m["xme-ttc-eas"] = {
"Eastern Tati",
nil,
"xme-ott",
}
m["xme-ttc-nor"] = {
"Northern Tati",
nil,
"xme-ott",
}
m["xme-ttc-sou"] = {
"Southern Tati",
nil,
"xme-ott",
}
m["xme-ttc-wes"] = {
"Western Tati",
nil,
"xme-ott",
}
m["xmn"] = {
"Manichaean Middle Persian",
nil,
"pal-lat",
}
m["fa-ear"] = {
"Early New Persian",
127413796,
"fa",
ancestors = "pal-lat",
translit = "fa-cls-translit",
}
m["fa-cls"] = {
"Classical Persian",
9168,
"fa",
ancestors = "fa-ear",
translit = "fa-cls-translit",
}
m["fa-ira"] = {
"Iranian Persian",
3513637,
"fa",
aliases = {"Modern Persian", "Western Persian"},
translit = "fa-ira-translit",
}
m["prs"] = {
"Dari",
178440,
"fa",
aliases = {"Dari Persian", "Central Persian", "Eastern Persian", "Afghan Persian"},
translit = "fa-cls-translit",
}
m["haz"] = {
"Hazaragi",
33398,
"prs",
translit = "fa-cls-translit",
}
m["os-dig"] = {
"Digor Ossetian",
3027861,
"os",
aliases = {"Digoron", "Digor"},
}
m["os-iro"] = {
"Iron Ossetian",
nil,
"os",
aliases = {"Iron"},
}
m["sog-ear"] = {
"Early Sogdian",
nil,
"sog",
}
m["sog-lat"] = {
"Late Sogdian",
nil,
"sog-ear",
}
-- NOTE(review): this entry's parent is "ro", yet it sits under the
-- "Iranian varieties" banner between the Sogdian and Ormuri entries;
-- presumably misplaced -- consider moving it to the Romance varieties section.
m["ro-MD"] = {
"Moldovan",
36392,
"ro",
aliases = {"Moldavian"},
}
m["oru-kan"] = {
"Kaniguram",
6363164,
"oru",
}
m["oru-log"] = {
"Logar",
nil,
"oru",
}
m["oos"] = {
"Old Ossetic",
65455882,
"xln",
}
m["oos-ear"] = {
"Early Old Ossetic",
nil,
"oos",
}
m["oos-lat"] = {
"Late Old Ossetic",
nil,
"oos",
}
m["rdb-jir"] = {
"Jirofti",
nil,
"rdb",
}
m["rdb-kah"] = {
"Kahnuji",
nil,
"rdb",
}
-- Southwestern Fars lects
m["fay-bur"] = {
"Burenjani",
nil,
"fay",
}
m["fay-bsh"] = {
"Bushehri",
nil,
"fay",
}
m["fay-dsh"] = {
"Dashtaki",
nil,
"fay",
}
m["fay-dav"] = {
"Davani",
5228140,
"fay",
}
m["fay-eze"] = {
"Emamzada Esmaili",
nil,
"fay",
}
m["fay-gav"] = {
"Gavkoshaki",
nil,
"fay",
}
m["fay-kho"] = {
"Khollari",
nil,
"fay",
}
m["fay-kon"] = {
"Kondazi",
nil,
"fay",
}
m["fay-kzo"] = {
"Old Kazeruni",
nil,
"fay",
}
m["fay-mas"] = {
"Masarami",
nil,
"fay",
}
m["fay-pap"] = {
"Papuni",
nil,
"fay",
}
m["fay-sam"] = {
"Samghani",
nil,
"fay",
}
m["fay-shr"] = {
"Shirazi",
nil,
"fay",
}
m["fay-sho"] = {
"Old Shirazi",
nil,
"fay",
}
m["fay-kar"] = {
"Khargi",
nil,
"fay",
}
m["fay-sor"] = {
"Sorkhi",
nil,
"fay",
}
-- Talysh lects
m["tly-cen"] = {
"Central Talysh",
nil,
"tly",
}
m["tly-asa"] = {
"Asalemi",
nil,
"tly-cen",
}
m["tly-kar"] = {
"Karganrudi",
nil,
"tly-cen",
}
m["tly-tul"] = {
"Tularudi",
nil,
"tly-cen",
}
m["tly-tal"] = {
"Taleshdulabi",
nil,
"tly-cen",
}
m["tly-nor"] = {
"Northern Talysh",
nil,
"tly",
}
m["tly-aze"] = {
"Azerbaijani Talysh",
nil,
"tly-nor",
}
m["tly-anb"] = {
"Anbarani",
nil,
"tly-nor",
}
m["tly-sou"] = {
"Southern Talysh",
nil,
"tly",
}
m["tly-fum"] = {
"Fumani",
nil,
"tly-sou",
}
m["tly-msu"] = {
"Masulei",
nil,
"tly-sou",
}
m["tly-msa"] = {
"Masali",
nil,
"tly-sou",
}
m["tly-san"] = {
"Shandarmani",
nil,
"tly-sou",
}
-- Tafreshi lects
m["xme-amo"] = {
"Amorehi",
nil,
"xme-taf",
}
m["atn"] = {
"Ashtiani",
3436590,
"xme-taf",
}
m["xme-bor"] = {
"Borujerdi",
nil,
"xme-taf",
}
m["xme-ham"] = {
"Hamadani",
6302426,
"xme-taf",
}
m["xme-kah"] = {
"Kahaki",
nil,
"xme-taf",
}
m["vaf"] = {
"Vafsi",
32611,
"xme-taf",
}
-- Kermanic lects
m["kfm"] = {
"Khunsari",
6403030,
"xme-ker",
}
m["xme-mah"] = {
"Mahallati",
nil,
"xme-ker",
}
m["xme-von"] = {
"Vonishuni",
nil,
"xme-ker",
}
m["xme-bdr"] = {
"Badrudi",
nil,
"xme-ker",
}
m["xme-del"] = {
"Delijani",
nil,
"xme-ker",
}
m["xme-kas"] = {
"Kashani",
nil,
"xme-ker",
}
m["xme-kes"] = {
"Kesehi",
nil,
"xme-ker",
}
m["xme-mey"] = {
"Meymehi",
nil,
"xme-ker",
}
m["ntz"] = {
"Natanzi",
6968399,
"xme-ker",
}
m["xme-abz"] = {
"Abuzeydabadi",
nil,
"xme-ker",
}
m["xme-aby"] = {
"Abyanehi",
nil,
"xme-ker",
}
m["xme-far"] = {
"Farizandi",
nil,
"xme-ker",
}
m["xme-jow"] = {
"Jowshaqani",
nil,
"xme-ker",
}
m["xme-nas"] = {
"Nashalji",
nil,
"xme-ker",
}
m["xme-qoh"] = {
"Qohrudi",
nil,
"xme-ker",
}
m["xme-yar"] = {
"Yarandi",
nil,
"xme-ker",
}
m["soj"] = {
"Soi",
7930463,
"xme-ker",
aliases = {"Sohi"},
}
m["xme-tar"] = {
"Tari",
nil,
"xme-ker",
}
m["gzi"] = {
"Gazi",
5529130,
"xme-ker",
}
m["xme-sed"] = {
"Sedehi",
nil,
"xme-ker",
}
m["xme-ard"] = {
"Ardestani",
nil,
"xme-ker",
}
m["xme-zef"] = {
"Zefrehi",
nil,
"xme-ker",
}
m["xme-isf"] = {
"Isfahani",
nil,
"xme-ker",
}
m["xme-kaf"] = {
"Kafroni",
nil,
"xme-ker",
}
m["xme-vrz"] = {
"Varzenehi",
nil,
"xme-ker",
}
m["xme-xur"] = {
"Khuri",
nil,
"xme-ker",
}
m["nyq"] = {
"Nayini",
6983146,
"xme-ker",
}
m["xme-ana"] = {
"Anaraki",
nil,
"xme-ker",
}
m["gbz"] = {
"Zoroastrian Dari",
32389,
"xme-ker",
aliases = {"Behdināni", "Gabri", "Gavrŭni", "Gabrōni"},
}
m["xme-krm"] = {
"Kermani",
nil,
"xme-ker",
}
m["xme-yaz"] = {
"Yazdi",
nil,
"xme-ker",
}
m["xme-bid"] = {
"Bidhandi",
nil,
"xme-ker",
}
m["xme-bij"] = {
"Bijagani",
nil,
"xme-ker",
}
m["xme-cim"] = {
"Chimehi",
nil,
"xme-ker",
}
m["xme-han"] = {
"Hanjani",
nil,
"xme-ker",
}
m["xme-kom"] = {
"Komjani",
nil,
"xme-ker",
}
m["xme-nar"] = {
"Naraqi",
nil,
"xme-ker",
}
m["xme-nus"] = {
"Nushabadi",
nil,
"xme-ker",
}
m["xme-qal"] = {
"Qalhari",
nil,
"xme-ker",
}
m["xme-trh"] = {
"Tarehi",
nil,
"xme-ker",
}
m["xme-val"] = {
"Valujerdi",
nil,
"xme-ker",
}
m["xme-var"] = {
"Varani",
nil,
"xme-ker",
}
m["xme-zor"] = {
"Zori",
nil,
"xme-ker",
}
-- Ramandi lects
m["tks-ebr"] = {
"Ebrahimabadi",
nil,
"tks",
}
m["tks-sag"] = {
"Sagzabadi",
nil,
"tks",
}
m["tks-esf"] = {
"Esfarvarini",
nil,
"tks",
}
m["tks-tak"] = {
"Takestani",
nil,
"tks",
}
m["tks-cal"] = {
"Chali Tati",
nil,
"tks",
aliases = {"Chāli"},
}
m["tks-dan"] = {
"Danesfani",
nil,
"tks",
}
m["tks-xia"] = {
"Khiaraji",
nil,
"tks",
}
m["tks-xoz"] = {
"Khoznini",
nil,
"tks",
}
-- Shughni dialects
m["sgh-bro"] = {
"Bartangi-Oroshori",
nil,
"sgh",
}
m["sgh-bar"] = {
"Bartangi",
nil,
"sgh-bro",
}
m["sgh-oro"] = {
"Oroshori",
nil,
"sgh-bro",
aliases = {"Roshorvi"},
}
m["sgh-rsx"] = {
"Roshani-Khufi",
nil,
"sgh",
}
m["sgh-xuf"] = {
"Khufi",
2562249,
"sgh-rsx",
aliases = {"Xufi", "Xūfī"},
}
m["sgh-ros"] = {
"Roshani",
2597566,
"sgh-rsx",
aliases = {"Rushani", "Rōšāni"},
}
m["sgh-xgb"] = {
"Khughni-Bajui",
nil,
"sgh",
}
m["sgh-xug"] = {
"Khughni",
nil,
"sgh-xgb",
}
m["sgh-baj"] = {
"Bajui",
nil,
"sgh-xgb",
}
-------------------------------------------------------------------------
-- Nuristani varieties --
-------------------------------------------------------------------------
m["bsh-kat"] = {
"Kativiri",
2605045,
"bsh",
aliases = {"Katə́viri"},
}
m["xvi"] = {
"Kamviri",
1193495,
"bsh",
aliases = {"Kamvíri"},
}
m["bsh-mum"] = {
"Mumviri",
nil,
"bsh",
aliases = {"Mumvíri"},
}
--------------------------------------------------------------------------------------
-- Italic varieties --
--------------------------------------------------------------------------------------
-------------------------------------------------------------------------
-- Latin varieties --
-------------------------------------------------------------------------
-- Latin varieties by period
m["itc-ola"] = {
"පුරාතන ලතින්",
12289,
"la",
"Latn, Ital",
translit = {
Ital = "Ital-translit"
},
}
m["itc-lan"] = {
"Lanuvian",
16890829,
"itc-ola",
aliases = {"Lanuvine"},
}
m["itc-pra"] = {
"Praenestine",
16889772,
"itc-ola",
aliases = {"Praenestinian"},
}
m["la-cla"] = {
"Classical Latin",
253854,
"la",
}
m["la-vul"] = {
"Vulgar Latin",
37560,
"la-cla",
}
m["la-afr"] = {
"African Romance",
162064,
"roa-pro",
}
m["la-lat"] = {
"Late Latin",
1503113,
"la",
ancestors = "la-cla",
}
m["la-med"] = {
"Medieval Latin",
1163234,
"la",
ancestors = "la-lat",
}
m["la-eme"] = {
"Early Medieval Latin",
nil,
"la-med",
}
m["la-ecc"] = {
"Ecclesiastical Latin",
1247932,
"la",
aliases = {"Church Latin", "Liturgical Latin"},
ancestors = "la-lat",
}
m["la-ren"] = {
"Renaissance Latin",
499083,
"la",
ancestors = "la-med",
}
m["la-new"] = {
"New Latin",
1248221,
"la",
aliases = {"Modern Latin"},
ancestors = "la-ren",
}
m["la-con"] = {
"Contemporary Latin",
1246397,
"la-new",
}
-------------------------------------------------------------------------
-- Miscellaneous Italic varieties --
-------------------------------------------------------------------------
m["xfa-cap"] = {
"Capenate",
133182969,
"xfa",
}
m["osc-luc"] = {
"Lucanian",
3265025,
"osc",
}
m["osc-sam"] = {
"Samnite",
133184287,
"osc",
}
-------------------------------------------------------------------------
-- Romance varieties --
-------------------------------------------------------------------------
m["roa-pro"] = {
"Proto-Romance",
3408029,
"la-lat",
ancestors = "la-vul",
}
-----------------------------------------------------
-- Catalan varieties --
-----------------------------------------------------
m["ca-val"] = {
"Valencian",
32641,
"ca",
}
-----------------------------------------------------
-- Franco-Provençal varieties --
-----------------------------------------------------
m["frp-old"] = {
"Old Franco-Provençal",
nil,
"frp",
}
-----------------------------------------------------
-- French and derived creole varieties --
-----------------------------------------------------
m["fro-nor"] = {
"Old Northern French",
2044917,
"fro",
aliases = {"Old Norman", "Old Norman French"},
}
m["fro-pic"] = {
"Picard Old French",
nil,
"fro",
}
m["xno"] = {
"ඇන්ග්ලෝ-නෝමන්",
35214,
"fro-nor",
}
m["xno-law"] = {
"Law French",
2044323,
"xno",
}
m["zrp"] = {
"Zarphatic",
36994,
"fro",
aliases = {"Judeo-French"},
pseudo_families = "qfa-jew",
}
m["fr-CA"] = {
"Canadian French",
1450506,
"fr",
}
m["fr-CH"] = {
"Swiss French",
1480152,
"fr",
}
m["fr-aca"] = {
"Acadian French",
415109,
"fr",
}
m["fr-lou"] = {
"Louisiana French",
3083213,
"fr",
}
m["fr-mis"] = {
"Missouri French",
3083210,
"fr",
}
m["frc"] = {
"Cajun French",
880301,
"fr-lou",
}
m["ht-sdm"] = {
"Saint Dominican Creole French",
nil,
"ht",
ancestors = "fr",
}
-- Norman varieties
m["nrf-grn"] = {
"Guernsey Norman",
56428,
"nrf",
aliases = {"Guernsey"},
}
m["nrf-jer"] = {
"Jersey Norman",
56430,
"nrf",
aliases = {"Jersey"},
}
-----------------------------------------------------
-- Gallo-Italic varieties --
-----------------------------------------------------
m["egl-old"] = {
"Old Emilian",
nil,
"egl",
}
m["lij-old"] = {
"Old Ligurian",
nil,
"lij",
aliases = {"Old Genoese"},
}
m["lmo-old"] = {
"Old Lombard",
97165320,
"lmo",
}
m["pms-old"] = {
"Old Piedmontese",
nil,
"pms",
aliases = {"Old Piemontese"},
}
m["vec-old"] = {
"Old Venetan",
nil,
"vec",
aliases = {"Old Venetian"},
}
m["rgn-old"] = {
"Old Romagnol",
nil,
"rgn",
}
-----------------------------------------------------
-- Italo-Romance varieties --
-----------------------------------------------------
-- Italian varieties
m["roa-oit"] = {
"Old Italian",
nil,
"it",
}
m["it-CH"] = {
"Switzerland Italian",
672147,
"it",
}
-- Other Italo-Romance varieties
m["nap-old"] = {
"Old Neapolitan",
nil,
"nap",
}
m["scn-old"] = {
"Old Sicilian",
nil,
"scn",
}
-----------------------------------------------------
-- Occitan varieties --
-----------------------------------------------------
m["oc-auv"] = {
"Auvergnat",
35359,
"oc",
aliases = {"Auvernhat", "Auvergnese"},
}
m["oc-gas"] = {
"Gascon",
35735,
"oc",
}
-- standardized dialect of Gascon
m["oc-ara"] = {
"Aranese",
10196,
"oc-gas",
}
m["oc-lan"] = {
"Languedocien",
942602,
"oc",
aliases = {"Lengadocian"},
}
m["oc-lim"] = {
"Limousin",
427614,
"oc",
}
m["oc-pro"] = {
"Provençal",
241243,
"oc",
aliases = {"Provencal"},
}
m["oc-pro-old"] = {
"Old Provençal",
2779185,
"pro",
}
m["oc-viv"] = {
"Vivaro-Alpine",
1649613,
"oc",
}
m["oc-jud"] = {
"Shuadit",
56472,
"oc",
aliases = {
"Chouhadite", "Chouhadit", "Chouadite", "Chouadit", "Shuhadit",
"Judeo-Occitan", "Judæo-Occitan", "Judaeo-Occitan",
"Judeo-Provençal", "Judæo-Provençal", "Judaeo-Provençal",
"Judeo-Provencal", "Judaeo-Provencal",
"Judeo-Comtadin", "Judæo-Comtadin", "Judaeo-Comtadin",
},
pseudo_families = "qfa-jew",
}
-----------------------------------------------------
-- Portuguese and derived creole varieties --
-----------------------------------------------------
-- Portuguese
m["pt-BR"] = {
"බ්රසීල පෘතුගීසි",
750553,
"pt",
}
m["pt-PT"] = {
"European Portuguese",
922399,
"pt",
}
-- Kabuverdianu (Cape Verde Creole, Cape Verdean Creole)
m["kea-bar"] = {
"Barlavento Kabuverdianu",
2217638,
"kea",
aliases = {"Barlavento", "Barlavento Creole", "Sampadjudu"},
}
m["kea-bvi"] = {
"Boa Vista Kabuverdianu",
16501837,
"kea-bar",
aliases = {"Boa Vista Creole"},
}
m["kea-sal"] = {
"Sal Kabuverdianu",
18707467,
"kea-bar",
aliases = {"Sal Creole"},
}
m["kea-saa"] = {
"Santo Antão Kabuverdianu",
18707472,
"kea-bar",
aliases = {"Santo Antão Creole"},
}
m["kea-sni"] = {
"São Nicolau Kabuverdianu",
18707549,
"kea-bar",
aliases = {"São Nicolau Creole"},
}
m["kea-svi"] = {
"São Vicente Kabuverdianu",
18707550,
"kea-bar",
aliases = {"São Vicente Creole"},
}
m["kea-sot"] = {
"Sotavento Kabuverdianu",
10261559,
"kea",
aliases = {"Sotavento", "Sotavento Creole", "Badiu"},
}
m["kea-bra"] = {
"Brava Kabuverdianu",
18670181,
"kea-sot",
aliases = {"Brava Creole"},
}
m["kea-fog"] = {
"Fogo Kabuverdianu",
18706861,
"kea-sot",
aliases = {"Fogo Creole"},
}
m["kea-mai"] = {
"Maio Kabuverdianu",
18707286,
"kea-sot",
aliases = {"Maio Creole"},
}
m["kea-san"] = {
"Santiago Kabuverdianu",
35117,
"kea-sot",
aliases = {"Santiago Creole"},
}
m["kea-alu"] = {
"ALUPEC Kabuverdianu",
375704,
"kea",
aliases = {"ALUPEC", "Alfabeto Unificado para a Escrita do Cabo-Verdiano"},
}
-----------------------------------------------------
-- Rhaeto-Romance varieties --
-----------------------------------------------------
-- Friulian varieties
m["fur-old"] = {
"Old Friulian",
nil,
"fur",
}
-- Ladin varieties
m["lld-amp"] = {
"Ampezan Ladin",
25617466,
"lld",
aliases = {"Anpezan", "Ampezan", "Ampezzan", "Ampezzano"},
}
m["lld-bad"] = {
"Badiot Ladin",
3706562,
"lld",
aliases = {"Badiot", "Badioto", "Badiotto"},
}
m["lld-cad"] = {
"Cadorino Ladin",
3706570,
"lld",
aliases = {"Cadorino"},
}
m["lld-fas"] = {
"Fascian Ladin",
742627,
"lld",
aliases = {"Fascian", "Fassano"},
}
m["lld-fod"] = {
"Fodom Ladin",
3706605,
"lld",
aliases = {"Fodom", "Livinallese"},
}
m["lld-for"] = {
"Fornes Ladin",
5470374,
"lld",
aliases = {"Fornes"},
}
m["lld-ghe"] = {
"Gherdëina Ladin",
3706597,
"lld",
aliases = {"Gherdëina", "Gardenese", "Val Gardena"},
}
m["lld-non"] = {
"Nones Ladin",
1055027,
"lld",
aliases = {"Nones", "Noneso"},
}
-- Romansh varieties
m["rm-old"] = {
"Old Romansh",
nil,
"rm",
}
m["rm-put"] = {
"Puter Romansh",
688309,
"rm",
aliases = {"Puter", "Putèr", "Upper Engadine", "rm-puter"},
}
m["rm-srm"] = {
"Surmiran Romansh",
690216,
"rm",
aliases = {"Surmiran", "rm-surmiran",
"Surmiran-Albula", -- Glottolog
},
}
m["rm-srs"] = {
"Sursilvan Romansh",
688348,
"rm",
aliases = {"Sursilvan", "rm-sursilv"},
}
m["rm-sut"] = {
"Sutsilvan Romansh",
688272,
"rm",
aliases = {"Sutsilvan", "rm-sutsilv"},
varieties = {"Scharans Sutsilvan"}, -- per Glottolog
}
-- Vallader is the "Lower Engadine" variety. "Putèr" is intentionally NOT listed
-- as an alias here: it already belongs to rm-put (the "Upper Engadine" variety),
-- and repeating it on this entry made the alias ambiguous between two lects.
m["rm-val"] = {
"Vallader Romansh",
690226,
"rm",
aliases = {"Vallader", "Lower Engadine", "rm-vallader"},
}
m["rm-gri"] = {
"Rumantsch Grischun",
688873,
"rm",
aliases = {"rm-rumgr"},
}
-----------------------------------------------------
-- Sardinian varieties --
-----------------------------------------------------
m["sc-old"] = {
"Old Sardinian",
nil,
"sc",
}
m["sc-src"] = {
"Logudorese",
777974,
"sc",
aliases = {"Logudorese Sardinian"},
}
m["sc-nuo"] = {
"Nuorese",
nil,
"sc-src",
aliases = {"Nuorese Sardinian"},
}
m["sc-sro"] = {
"Campidanese",
35348,
"sc",
aliases = {"Campidanese Sardinian"},
}
-----------------------------------------------------
-- Spanish varieties --
-----------------------------------------------------
m["es-ear"] = {
"Early Modern Spanish",
5364419,
"es",
}
m["es-AR"] = {
"Rioplatense Spanish",
509780,
"es",
}
m["es-BO"] = {
"Bolivian Spanish",
510730,
"es",
}
m["es-CL"] = {
"Chilean Spanish",
857295,
"es",
}
m["es-CO"] = {
"Colombian Spanish",
1115875,
"es",
}
m["es-CU"] = {
"Cuban Spanish",
824909,
"es",
}
m["es-MX"] = {
"Mexican Spanish",
616620,
"es",
}
m["es-PE"] = {
"Peruvian Spanish",
736236,
"es",
}
m["es-PH"] = {
"Philippine Spanish",
22091406,
"es",
}
m["es-US"] = {
"United States Spanish",
2301077,
"es",
aliases = {"US Spanish"},
}
-- NOTE (applies to es-US above): use the label "US Spanish" to put Spanish terms in that category.
m["es-PR"] = {
"Puerto Rican Spanish",
7258609,
"es",
}
m["es-VE"] = {
"Venezuelan Spanish",
840017,
"es",
}
m["es-lun"] = {
"Lunfardo",
1401612,
"es",
}
----------------------------------------------------------------------------------------------------------------------
-- Japonic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Japanese varieties
m["ja-mid"] = {
"Middle Japanese",
6841474,
"ojp",
ancestors = "ojp",
}
m["ja-mid-ear"] = {
"Early Middle Japanese",
182695,
"ja-mid",
}
m["ja-mid-lat"] = {
"Late Middle Japanese",
1816184,
"ja-mid",
ancestors = "ja-mid-ear",
}
m["ja-ear"] = {
"Early Modern Japanese",
5326692,
"ja",
ancestors = "ja-mid-lat",
}
m["ojp-eas"] = {
"Eastern Old Japanese",
65247957,
"ojp",
}
m["ja-cla"] = {
"Classical Japanese",
1332057,
"ja",
-- FIXME: This is redundant because Classical Japanese is considered a child of (Modern) Japanese, which has ja-mid-ear
-- (as well as ja-mid-lat) as ancestors. However, the intent here is that the *direct* ancestor of ja-cla is ja-mid-ear
-- and ja-mid-lat is not an ancestor. Need to rethink ancestor handling.
-- ancestors = "ja-mid-ear",
}
----------------------------------------------------------------------------------------------------------------------
-- Koreanic varieties --
----------------------------------------------------------------------------------------------------------------------
-- Korean varieties
m["oko-lat"] = {
"Late Old Korean",
nil,
"oko",
}
m["okm-ear"] = {
"Early Middle Korean",
nil,
"okm",
}
m["ko-cen"] = {
"Central Korean",
nil,
"ko",
}
m["ko-gyg"] = {
"Gyeonggi Korean",
485492,
"ko-cen",
aliases = {"Seoul Korean"},
}
m["ko-chu"] = {
"Chungcheong Korean",
625800,
"ko-cen",
aliases = {"Hoseo Korean"},
}
m["ko-hwa"] = {
"Hwanghae Korean",
16183706,
"ko-cen",
}
m["ko-gan"] = {
"Gangwon Korean",
11260444,
"ko-cen",
aliases = {"Yeongdong Korean"},
}
m["ko-gys"] = {
"Gyeongsang Korean",
488002,
"ko",
aliases = {"Southeastern Korean"},
}
m["ko-jeo"] = {
"Jeolla Korean",
11250166,
"ko",
aliases = {"Southwestern Korean"},
}
m["ko-pyo"] = {
"Pyongan Korean",
7263142,
"ko",
aliases = {"Northwestern Korean"},
}
m["ko-ham"] = {
"Hamgyong Korean",
860702,
"ko",
aliases = {"Northeastern Korean"},
}
m["ko-yuk"] = {
"Yukjin Korean",
16171275,
"ko",
aliases = {"Yukchin Korean", "Ryukjin Korean", "Ryukchin Korean"},
}
----------------------------------------------------------------------------------------------------------------------
-- Mongolic varieties --
----------------------------------------------------------------------------------------------------------------------
m["xng-ear"] = {
"Early Middle Mongol",
nil,
"xng",
}
m["xng-lat"] = {
"Late Middle Mongol",
nil,
"xng",
ancestors = "xng-ear",
}
m["mn-kha"] = {
"Khalkha Mongolian",
6399808,
"mn",
aliases = {"Khalkha"},
}
m["mn-ord"] = {
"Ordos Mongolian",
716904,
"mn",
aliases = {"Ordos"},
}
m["mn-cha"] = {
"Chakhar Mongolian",
907425,
"mn",
aliases = {"Chakhar"},
}
m["mn-khr"] = {
"Khorchin Mongolian",
3196210,
"mn",
aliases = {"Khorchin"},
}
----------------------------------------------------------------------------------------------------------------------
-- Niger-Congo varieties --
----------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------
-- Akan varieties --
-----------------------------------------------------
m["tw"] = {
"Twi Akan",
36850,
"ak",
aliases = {"Twi"},
}
m["abr"] = {
"Abron",
34831,
"tw",
aliases = {"Brong", "Bono", "Bono Twi"},
}
m["tw-asa"] = {
"Asante Twi",
19261685,
"tw",
aliases = {"Asante", "Ashanti", "Ashante"},
}
m["tw-aku"] = {
"Akuapem Twi",
31150449,
"tw",
aliases = {"Akuapem", "Akuapim", "Akwapem Twi", "Akwapi"},
}
m["fat"] = {
"Fante Akan",
35570,
"ak",
aliases = {"Fante", "Fanti", "Fantse", "Mfantse"},
}
m["wss"] = {
"Wasa",
36914,
"ak",
}
-- creole
m["alv-kro"] = {
"Kromanti",
1093206,
"crp-mar",
}
-----------------------------------------------------
-- Bantu varieties --
-----------------------------------------------------
m["bnt-cmn"] = {
"Common Bantu",
nil,
"bnt-pro",
}
m["xh-bha"] = {
"Bhaca",
4900493,
"xh",
aliases = {"isiBhaca", "IsiBhaca"},
}
-- Rwanda-Rundi varieties
m["rw-kin"] = {
"Kinyarwanda",
33573,
"rw",
aliases = {"Rwanda"},
}
m["rw-run"] = {
"Kirundi",
33583,
"rw",
aliases = {"Rundi"},
}
-----------------------------------------------------
-- Fula varieties --
-----------------------------------------------------
m["fuc"] = {
"Pulaar",
1420205,
"ff",
}
m["fuf"] = {
"Pular",
3915357,
"ff",
}
m["ffm"] = {
"Maasina Fulfulde",
3915322,
"ff",
}
m["fue"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Borgu Fulfulde",
12952426,
"ff",
}
m["fuh"] = {
-- no enwiki entry as of yet but frwiki and pmswiki have one
"Western Niger Fulfulde",
12952430,
"ff",
}
m["fuq"] = {
-- no enwiki entry as of yet but frwiki, hrwiki and pmswiki have one
"Central-Eastern Niger Fulfulde",
12628799,
"ff",
}
m["fuv"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki and swwiki have one
"Nigerian Fulfulde",
36129,
"ff",
}
m["fub"] = {
-- no enwiki entry as of yet but dewiki, frwiki, hrwiki, pmswiki, ptwiki, swwiki and yowiki have one
"Adamawa Fulfulde",
34776,
"ff",
}
m["fui"] = {
-- no enwiki entry as of yet but pmswiki and swwiki have one
"Bagirmi Fulfulde",
11003859,
"ff",
}
----------------------------------------------------------------------------------------------------------------------
-- Papuan varieties --
----------------------------------------------------------------------------------------------------------------------
m["kze"] = {
"Kosena",
12952663,
"auy",
}
m["ont"] = {
"Ontenu",
3352827,
"gaj",
aliases = {"Ontena"},
}
----------------------------------------------------------------------------------------------------------------------
-- Salishan varieties --
----------------------------------------------------------------------------------------------------------------------
m["lut-nor"] = {
"Northern Lushootseed",
nil,
"lut",
aliases = {"Northern Puget Sound Salish"},
}
m["slh"] = {
"Southern Lushootseed",
7997684,
"lut",
aliases = {"Southern Puget Sound Salish", "Twulshootseed", "Whulshootseed"},
}
m["ska"] = {
"Skagit",
12642471,
"lut-nor",
}
m["sno"] = {
"Snohomish",
25559662,
"lut-nor",
}
----------------------------------------------------------------------------------------------------------------------
-- Sino-Tibetan varieties --
----------------------------------------------------------------------------------------------------------------------
m["tbq-pro"] = {
"Proto-Tibeto-Burman",
7251864,
"sit-pro",
}
-----------------------------------------------------
-- Chinese varieties --
-----------------------------------------------------
------------- Old Chinese, Middle Chinese -------------
m["och-ear"] = {
"Early Old Chinese",
nil,
"och",
}
m["och-lat"] = {
"Late Old Chinese",
nil,
"och",
}
m["ltc-ear"] = {
"Early Middle Chinese",
nil,
"ltc",
}
m["ltc-lat"] = {
"Late Middle Chinese",
nil,
"ltc",
}
------------- Classical/Literary varieties -------------
-- FIXME: Temporary.
m["lzh-shi"] = {
"Traditional Chinese poetry",
1759242,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cii"] = {
"Ci",
1091366,
"lzh",
}
-- FIXME: Temporary.
m["lzh-yue"] = {
"Classical Cantonese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn"] = {
"Classical Mandarin",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-tai"] = {
"Classical Taishanese",
nil,
"lzh",
}
-- FIXME: Temporary.
m["lzh-cmn-TW"] = {
"Classical Taiwanese Mandarin",
nil,
"lzh-cmn",
}
-- FIXME: Temporary.
m["lzh-VI"] = {
"Vietnamese Classical Chinese",
17034227,
"lzh",
}
-- FIXME: Temporary.
-- The only lzh-* entry in this section that sets ietf_subtag: the entry code
-- uses "KO" while the subtag uses the country code "KR".
m["lzh-KO"] = {
"Korean Classical Chinese",
10496257,
"lzh",
ietf_subtag = "lzh-KR", -- KR = South Korea, as there is no code for Korea as a whole
}
-- FIXME: Temporary.
m["lzh-lit"] = {
"Literary Chinese",
nil,
"lzh",
}
-- FIXME: Temporary. FIXME: Do we need this? How does it differ from Old Chinese?
m["lzh-pre"] = {
"Pre-Classical Chinese",
nil,
"lzh",
}
------------- Written Vernacular varieties -------------
-- FIXME: Temporary.
m["cmn-wvc"] = {
"Written vernacular Mandarin",
783605,
"cmn",
}
-- FIXME: Temporary. FIXME: How does this differ from "Literary Cantonese"?
m["yue-wvc"] = {
"Written vernacular Cantonese",
nil,
"yue",
}
-- FIXME: Temporary.
m["zhx-tai-wvc"] = {
"Written vernacular Taishanese",
nil,
"zhx-tai",
}
------------- Mandarin varieties -------------
-- FIXME: Temporary. NOTE: The Linguist List assigns the "w:Beijing dialect" (Wikidata 1147606) the code "cmn-bej" and
-- the larger "w:Beijing Mandarin (division of Mandarin)" dialect group (Wikidata 2169652; what we call "Beijingic
-- Mandarin", after Glottolog) the code "cmn-bei".
m["cmn-bei"] = {
"Beijing Mandarin",
1147606,
"cmn-bec",
}
-- FIXME: Temporary.
m["cmn-bec"] = {
"Beijingic Mandarin",
2169652,
"cmn",
}
-- FIXME: Temporary. NOTE: The Linguist List uses the code cmn-zho.
m["cmn-cep"] = {
"Central Plains Mandarin",
3048775,
"cmn",
aliases = {"Zhongyuan Mandarin"},
}
m["cmn-ear"] = {
"Early Mandarin",
837169,
"cmn",
ancestors = "ltc",
}
-- FIXME: Temporary.
m["cmn-gua"] = {
"Guanzhong Mandarin",
3431648,
"cmn-cep",
}
-- FIXME: Temporary. Appears to be a subdialect of Guiliu Mandarin, which in turn is a subdialect of Southwestern Mandarin.
m["cmn-gui"] = {
"Guilin Mandarin",
11111636,
"cmn-sow",
}
m["cmn-jhu"] = {
"Jianghuai Mandarin",
2128953,
"cmn",
aliases = {"Lower Yangtze Mandarin"},
}
-- FIXME: Temporary.
m["cmn-lan"] = {
"Lanyin Mandarin",
662754,
"cmn",
}
-- FIXME: Temporary.
m["cmn-MY"] = {
"Malaysian Mandarin",
13646143,
"cmn",
}
-- FIXME: Temporary.
m["cmn-nan"] = {
"Nanjing Mandarin",
2681098,
"cmn-jhu",
}
-- FIXME: Temporary.
m["cmn-noe"] = {
"Northeastern Mandarin",
1064504,
"cmn",
}
-- FIXME: Temporary.
m["cmn-PH"] = {
"Philippine Mandarin",
7185155,
"cmn",
}
-- FIXME: Temporary.
m["cmn-SG"] = {
"Singapore Mandarin",
1048980,
"cmn",
}
-- FIXME: Temporary.
m["cmn-sow"] = {
"Southwestern Mandarin",
2609239,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Jilu Mandarin.
m["cmn-tia"] = {
"Tianjin Mandarin",
7800220,
"cmn",
}
-- FIXME: Temporary. NOTE: Wikidata also has Q4380827 "Taiwanese Mandarin", defined as "rare dialect of Standard Chinese
-- (Mandarin) used in Taiwan, which is strongly influenced by Taiwanese Hokkien; mostly used by elderlies" and having no
-- English Wikipedia article (but see w:zh:臺灣國語).
m["cmn-TW"] = {
"Taiwanese Mandarin",
262828,
"cmn",
}
-- FIXME: Temporary. Appears to be a subdialect of Wu-Tian Mandarin, in turn a subdialect of Southwestern Mandarin.
-- Given the code cmn-xwu in the Linguist List.
m["cmn-wuh"] = {
"Wuhan Mandarin",
11124731,
"cmn-sow",
aliases = {"Wuhanese"},
}
-- FIXME: Temporary. Appears to be a subdialect of Lanyin Mandarin.
m["cmn-xin"] = {
"Xining Mandarin",
nil,
"cmn-lan",
}
-- FIXME: Temporary.
m["cmn-yan"] = {
"Yangzhou Mandarin",
nil,
"cmn-jhu",
}
------------- Cantonese varieties -------------
-- FIXME: Temporary.
m["yue-gua"] = {
"Guangzhou Cantonese",
nil,
"yue",
}
-- FIXME: Temporary. Given the codes yue-yue or yue-can in the Linguist List.
m["yue-HK"] = {
"Hong Kong Cantonese",
5894342,
"yue",
}
-- FIXME: Temporary. FIXME: How does this differ from "Written vernacular Cantonese"?
m["yue-lit"] = {
"Literary Cantonese",
2472605,
"yue",
}
------------- Wu varieties -------------
m["wuu-han"] = {
"Hangzhounese",
5648144,
"wuu",
}
m["wuu-nin"] = {
"Ningbonese",
3972199,
"wuu",
}
-- FIXME: Temporary.
m["wuu-nor"] = {
"Northern Wu",
7675988,
"wuu",
aliases = {"Taihu Wu"},
}
-- FIXME: Temporary? Subvariety of Taihu Wu. NOTE: "chm" stands for Chongming, the main dialect, to avoid a conflict
-- with Shanghainese.
m["wuu-chm"] = {
"Shadi Wu",
6112340,
"wuu-nor",
}
m["wuu-sha"] = {
"Shanghainese",
36718,
"wuu-nor",
}
m["wuu-suz"] = {
"Suzhounese",
831744,
"wuu-nor",
}
-- FIXME: Temporary. May be converted into a full language and/or split.
m["wuu-wen"] = {
"Wenzhounese",
710218,
"wuu",
}
------------- Xiang varieties -------------
m["hsn-lou"] = {
"Loudi Xiang",
10943823,
"hsn-old",
}
m["hsn-hya"] = {
"Hengyang Xiang",
20689035,
"hsn-hzh",
}
m["hsn-hzh"] = {
"Hengzhou Xiang",
nil,
"hsn",
}
m["hsn-new"] = {
"New Xiang",
7012696,
"hsn",
aliases = {"Chang-Yi"},
}
m["hsn-old"] = {
"Old Xiang",
7085453,
"hsn",
aliases = {"Lou-Shao"},
}
------------- Hakka varieties -------------
-- FIXME: Temporary.
m["hak-dab"] = {
"Dabu Hakka",
19855566,
"hak", -- formerly hak-TW but seems to be spoken primarily in Dabu County in Guangdong
}
-- FIXME: Temporary.
m["hak-eam"] = {
"Early Modern Hakka",
nil,
"hak",
}
-- FIXME: Temporary.
m["hak-hai"] = {
"Hailu Hakka",
17038519,
"hak", -- often considered a Taiwanese lect but also spoken in [[Shanwei]], [[Guangdong]]
}
-- FIXME: Temporary.
m["hak-HK"] = {
"Hong Kong Hakka",
2675834,
"hak",
}
-- FIXME: Temporary.
m["hak-hui"] = {
"Huiyang Hakka",
16873881,
"hak",
}
-- FIXME: Temporary.
m["hak-hui-MY"] = {
"Malaysian Huiyang Hakka",
nil,
"hak-hui",
}
-- FIXME: Temporary. Similar to and possibly the parent of Sixian Hakka in Taiwan.
m["hak-mei"] = {
"Meixian Hakka",
839295,
"hak",
aliases = {"Moiyan Hakka", "Meizhou Hakka"},
}
-- FIXME: Temporary.
m["hak-six"] = {
"Sixian Hakka",
9668261,
"hak-TW",
}
-- FIXME: Temporary.
m["hak-TW"] = {
"Taiwanese Hakka",
2391532,
"hak",
}
-- FIXME: Temporary.
m["hak-zha"] = {
"Zhao'an Hakka",
6703311,
"hak",
aliases = {"Zhangzhou Hakka"},
}
-- Southern Min varieties --
m["nan-anx"] = {
"Anxi Hokkien",
97064149,
"nan-qua",
}
m["nan-cha"] = {
"Changtai Hokkien",
nil,
"nan-zha",
}
m["nan-hou"] = {
"Houlu Min",
19855492,
"nan-dat",
}
m["nan-hui"] = {
"Hui'an Hokkien",
16241797,
"nan-qua",
}
m["nan-jin"] = {
"Jinjiang Hokkien",
11089375,
"nan-qua",
}
m["nan-kin"] = {
"Kinmenese Hokkien",
56278342,
"nan-xia",
aliases = {"Kinmen Hokkien"},
}
m["nan-med"] = {
"Medan Hokkien",
6805114,
"nan-zha",
}
m["nan-pen"] = {
"Penang Hokkien",
11120689,
"nan-zha",
}
m["nan-hbl-PH"] = {
"Philippine Hokkien",
3236692,
"nan-qua",
}
m["nan-qia"] = {
"Qianlu Min",
19842517,
"nan-dat",
}
m["nan-qua"] = {
"Quanzhou Hokkien",
2251677,
"nan-hbl",
aliases = {"Chinchew", "Choanchew"},
}
-- FIXME: Temporary? Derived from both Quanzhou and Zhangzhou Hokkien.
m["nan-hbl-SG"] = {
"Singapore Hokkien",
3846528,
"nan-hbl",
}
m["nan-spm"] = {
"Southern Malaysian Hokkien",
7570322,
"nan-qua",
aliases = {"Southern Malaysia Hokkien", "Southern Peninsular Malaysian Hokkien", "Southern Peninsular Malaysia Hokkien"}
}
m["nan-hbl-TW"] = {
"Taiwanese Hokkien",
36778,
"nan-hbl",
}
m["nan-ton"] = {
"Tong'an Hokkien",
nil,
"nan-xia",
}
m["nan-xia"] = {
"Xiamen Hokkien",
68744,
"nan-hbl",
aliases = {"Amoy", "Amoyese", "Amoynese", "Xiamenese"},
}
m["nan-yon"] = {
"Yongchun Hokkien",
65118728,
"nan-qua",
}
m["nan-zha"] = {
"Zhangzhou Hokkien",
8070492,
"nan-hbl",
aliases = {"Changchew", "Chiangchew", "Changchow"},
}
m["nan-zho"] = {
"Zhao'an Hokkien",
-- NOTE(review): this is the same Wikidata ID as the one given for "Yongchun Hokkien" (nan-yon) in this
-- file; one of the two is presumably a copy-paste error -- TODO confirm against Wikidata.
65118728,
"nan-zha",
aliases = {"Zhao'an", "Chawan", "Chawan Hokkien"},
}
m["nan-zhp"] = {
"Zhangping Hokkien",
15937822,
"nan-zha",
}
------------- Other Min varieties -------------
-- FIXME: Temporary. Affiliation within Min uncertain; some combination of Eastern and Southern.
m["zhx-zho"] = {
"Zhongshan Min",
8070958,
"zh",
}
------------- Other Chinese varieties -------------
-- FIXME: Temporary. Affiliation within Chinese uncertain; possibly Yue.
m["zhx-dan"] = {
"Danzhou Chinese",
2578935,
"zh",
}
------------- Chinese romanization varieties -------------
-- [[Wiktionary:Information desk/2022/June#Etymology Coding Issue]]
-- [[Wiktionary:Grease pit/2022/June#Transliteration Systems in Etymologies 2]]
m["cmn-pinyin"] = {
"Hanyu Pinyin",
42222,
"cmn",
aliases = {"Pinyin"},
}
m["cmn-tongyong"] = {
"Tongyong Pinyin",
700739,
"cmn",
}
m["cmn-wadegiles"] = {
"Wade–Giles",
208442,
"cmn",
aliases = {"Wade-Giles", "Wade Giles"},
}
m["zh-postal"] = {
"Postal Romanization",
151868,
"zh",
}
-- Chinese cyrillization
m["cmn-palladius"] = {
"Palladius",
1234239,
"cmn",
aliases = {"Palladius system"},
}
-----------------------------------------------------
-- Tibetic varieties --
-----------------------------------------------------
m["adx"] = {
"Amdo Tibetan",
56509,
"bo",
}
m["kbg"] = {
"Khamba",
12952626,
"bo",
}
m["khg"] = {
"Khams Tibetan",
56601,
"bo",
}
m["tsk"] = {
"Tseku",
11159532,
"bo",
}
----------------------------------------------------------------------------------------------------------------------
-- Tai-Kadai varieties --
----------------------------------------------------------------------------------------------------------------------
m["th-old"] = {
"Old Thai",
nil,
"tai-swe-pro",
wikipedia_article = "Thai language#Old Thai",
}
m["th-suk"] = {
"Sukhothai Old Thai", -- 1238-1438. Cannot use "Sukhothai Thai" as Sukhothai is the current city and "Sukhothai Thai" is a lect.
nil,
"th-old",
aliases = {"Sukhothai Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
m["th-ayu"] = {
"Ayutthaya Old Thai", -- 1351-1767. Cannot use "Ayutthaya Thai" as Ayutthaya is the current city.
nil,
"th-old",
aliases = {"Ayutthaya Siamese"},
wikipedia_article = "Thai language#Old Thai",
}
--[[
m["th-new"] = {
"Hacked Thai", -- temporary for testing new translit/display methods
nil,
"th",
translit = "User:Benwing2/th-scraping-translit",
display_text = "User:Benwing2/th-scraping-translit",
strip_diacritics = "User:Benwing2/th-scraping-translit",
preprocess_links = "User:Benwing2/th-scraping-translit",
}
]]
m["tai-shz"] = {
"Shangsi Zhuang",
13216,
"za",
}
----------------------------------------------------------------------------------------------------------------------
-- Turkic varieties --
----------------------------------------------------------------------------------------------------------------------
m["trk-cmn-pro"] = {
"Proto-Common Turkic",
1126028,
"trk-pro",
}
m["trk-ogr-pro"] = {
"Proto-Oghur",
1422731,
"trk-pro",
family = "trk-ogr",
}
m["trk-bul-pro"] = {
"Proto-Bulgar",
nil,
"trk-ogr-pro",
}
m["trk-ogz-pro"] = {
"Proto-Oghuz",
494600,
"trk-pro",
family = "trk-ogz",
aliases = {"Southwestern Common Turkic"},
}
m["crh-dbj"] = {
"Dobrujan Tatar",
12811566,
"crh",
aliases = {"Romanian Tatar"},
}
m["cv-ana"] = {
"Anatri Chuvash",
nil,
"cv",
aliases = {"Anatri", "Lower Chuvash"},
}
m["cv-mid"] = {
"Middle Chuvash",
nil,
"cv",
ancestors = "cv-old",
}
m["cv-old"] = {
"Old Chuvash",
nil,
"cv",
ancestors = "xbo-vol",
}
m["cv-vir"] = {
"Viryal Chuvash",
4278332,
"cv",
aliases = {"Viryal", "Upper Chuvash"},
}
m["kjh-fyu"] = {
"Fuyu Kyrgyz",
2598963,
"kjh",
aliases = {"Fuyu Kirgiz", "Fuyu Kirghiz", "Manchurian Kyrgyz", "Manchurian Kirgiz", "Manchurian Kirghiz"},
}
m["klj-arg"] = {
"Arghu",
33455,
"klj",
ancestors = "trk-cmn-pro",
}
m["otk-kir"] = {
"Old Kirghiz",
83142,
"otk",
aliases = {"Yenisei Turkic", "Yenisei Kyrgyz"},
}
m["otk-ork"] = {
"Orkhon Turkic",
31295480,
"otk",
}
m["qwm-cum"] = {
"Cuman",
1075050,
"qwm",
aliases = {"Kuman", "Polovtsian", "Polovcian"},
}
m["qwm-arm"] = {
"Armeno-Kipchak",
2027503,
"qwm",
ancestors = "qwm-cum",
aliases = {"Xıpçaχ tili", "Tatarça"},
}
m["qwm-mam"] = {
"Mamluk-Kipchak",
4279942,
"qwm",
aliases = {"Mameluk-Kipchak"},
}
m["az-cls"] = {
"Classical Azerbaijani",
nil,
"az",
aliases = {"Classical Azeri"},
}
m["qxq"] = {
"Qashqai",
13192,
"az",
aliases = {"Qaşqay", "Qashqayi", "Kashkai", "Kashkay"},
}
m["tr-CY"] = {
"Cypriot Turkish",
7917392,
"tr",
}
m["uz-afg"] = {
-- NOTE: has ISO 639-3 code uzs assigned to it.
"Afghan Uzbek",
1066787,
"uz",
aliases = {"Southern Uzbek"},
translit = "uz-afg-translit",
}
m["xbo-dan"] = {
"Danube Bulgar",
nil,
"xbo",
}
m["xbo-vol"] = {
"Volga Bulgar",
nil,
"xbo",
}
----------------------------------------------------------------------------------------------------------------------
-- Uralic varieties --
----------------------------------------------------------------------------------------------------------------------
m["fiu-pro"] = {
"Proto-Finno-Ugric",
79890,
"urj-pro",
}
m["urj-fpr-pro"] = {
"Proto-Finno-Permic",
nil,
"urj-pro",
}
m["krl-nor"] = {
"North Karelian",
125501196,
"krl",
}
m["krl-sou"] = {
"South Karelian",
129812730,
"krl",
}
m["mns-eas"] = {
"Eastern Mansi",
30311755,
"mns-cen",
}
m["mns-wes"] = {
"Western Mansi",
30311756,
"mns-cen",
}
----------------------------------------------------------------------------------------------------------------------
-- Yeniseian varieties --
----------------------------------------------------------------------------------------------------------------------
m["qfa-yke-pro"] = {
"Proto-Ketic",
nil,
"qfa-yen-pro",
family = "qfa-yke",
}
m["qfa-yko-pro"] = {
"Proto-Kottic",
nil,
"qfa-yen-pro",
family = "qfa-yko",
}
m["qfa-yrn-pro"] = {
"Proto-Arinic",
nil,
"qfa-yen-pro",
family = "qfa-yrn",
}
m["qfa-ypm-pro"] = {
"Proto-Pumpokolic",
nil,
"qfa-yen-pro",
family = "qfa-ypm",
}
----------------------------------------------------------------------------------------------------------------------
-- Miscellaneous varieties --
----------------------------------------------------------------------------------------------------------------------
m["mul-tax"] = {
"taxonomic name",
522190,
"mul",
}
-----------------------------------------------------
-- Elamite varieties --
-----------------------------------------------------
m["elx-old"] = {
"Old Elamite",
nil,
"elx",
}
m["elx-mid"] = {
"Middle Elamite",
nil,
"elx",
}
m["elx-neo"] = {
"Neo-Elamite",
nil,
"elx",
}
m["elx-ach"] = {
"Achaemenid Elamite",
nil,
"elx",
}
-----------------------------------------------------
-- Substrates --
-----------------------------------------------------
-- Pre-Roman substrates
m["qsb-ibe"] = {
"Paleo-Hispanic",
246801,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Hispanic", "Paleohispanic", "Palaeohispanic", "Paleo-Iberian", "Palaeo-Iberian"},
}
m["qsb-bal"] = {
"Paleo-Balkan",
1815070,
"und",
family = "qfa-sub",
aliases = {"Palaeo-Balkan", "Paleobalkan", "Palaeobalkan"},
}
m["xaq"] = {
"Aquitanian",
500522,
"euq-pro",
family = "euq",
}
return require("Module:languages").finalizeData(m, "language", true)
7v4us8jkjasehjazm8pvntczij6rj8g
Module:bg-pronunciation
828
137952
234872
222988
2026-05-19T21:19:35Z
en>Kiril kovachev
0
The real reason this function is necessary is just to treat ў and Ў from the respelling as у and У. So, rather than this way of removing "breves" from the respelling, let us just replace ў/Ў with у/У.
234872
Scribunto
text/plain
local export = {}
local substring = mw.ustring.sub
local rsubn = mw.ustring.gsub
local rmatch = mw.ustring.match
local rsplit = mw.text.split
local rlen = mw.ustring.len
local U = require("Module:string/char")
local lang = require("Module:languages").getByCode("bg")
local script = require("Module:scripts").getByCode("Cyrl")
local ipa_module = "Module:IPA"
local audio_module = "Module:audio"
local headword_data_module = "Module:headword/data"
local homophones_module = "Module:homophones"
local hyphenation_module = "Module:hyphenation"
local parameters_module = "Module:parameters"
local rhymes_module = "Module:rhymes"
local table_module = "Module:table"
local tracking_module = "Module:debug/track"
-- Combining marks that may appear in the Cyrillic respelling.
local GRAVE = U(0x300) -- U+0300 combining grave accent; mapped to SECONDARY by phonetic_chars_map
local ACUTE = U(0x301) -- U+0301 combining acute accent; mapped to PRIMARY by phonetic_chars_map
local BREVE = U(0x306) -- U+0306 combining breve; used to recompose ў and й after NFD
-- Symbols used in the IPA output.
local PRIMARY = U(0x2C8) -- U+02C8 primary stress mark
local SECONDARY = U(0x2CC) -- U+02CC secondary stress mark
local TIE = U(0x361) -- U+0361 tie bar joining the two halves of an affricate
local FRONTED = U(0x31F) -- U+031F combining plus sign below, appended to vowels after ʃ ʒ ʲ j
local DOTUNDER = U(0x323) -- U+0323 combining dot below; in toIPA it marks а/я to be rendered with ɤ
local HYPH = U(0x2027) -- U+2027 hyphenation point; separator between syllables
local BREAK_MARKER = "." -- user-supplied forced syllable break in the input
-- IPA vowel symbols produced by toIPA, including the reduced vowels ɐ and o.
local vowels = "aɤɔuɛiɐo"
local vowels_c = "[" .. vowels .. "]"
-- IPA consonant symbols, plus the palatalization mark ʲ and the tie bar.
local cons = "bvɡdʒzjklɫwmnprstfxʃɣʲ" .. TIE
local cons_c = "[" .. cons .. "]"
-- Cyrillic letter classes used on un-transcribed text (count_vowels, hyphenate).
-- "#" is included as a consonant because hyphenate() temporarily replaces "дж" with "#".
local hcons_c = "[бвгджзйклмнпрстфхшщьчц#БВГДЖЗЙКЛМНПРСТФХШЩЬЧЦ=]"
local hvowels_c = "[аъоуеияѝюАЪОУЕИЯЍЮ]"
local capital_letters_c = "[БВГДЖЗЙКЛМНПРСТФХШЩЬЧЦАЪОУЕИЯЍЮ]"
-- The two IPA stress marks, as a plain string and as a character class.
local accents = PRIMARY .. SECONDARY
local accents_c = "[" .. accents .. "]"
-- Single (lowercase) characters that map to IPA sounds. toIPA() applies this table to every
-- character of the lowercased, NFD-normalized term; characters without an entry are left as they are.
-- The soft sign and the iotated vowels ю/я produce the palatalization mark ʲ, which toIPA later
-- turns into j after a vowel or at the start of a word.
local phonetic_chars_map = {
["а"] = "a",
["б"] = "b",
["в"] = "v",
["г"] = "ɡ",
["д"] = "d",
["е"] = "ɛ",
["ж"] = "ʒ",
["з"] = "z",
["и"] = "i",
["й"] = "j",
["к"] = "k",
["л"] = "l",
["м"] = "m",
["н"] = "n",
["о"] = "ɔ",
["п"] = "p",
["р"] = "r",
["с"] = "s",
["т"] = "t",
["у"] = "u",
["ў"] = "w",
["ф"] = "f",
["х"] = "x",
["ц"] = "t" .. TIE .. "s",
["ч"] = "t" .. TIE .. "ʃ",
["ш"] = "ʃ",
["щ"] = "ʃt",
["ъ"] = "ɤ",
["ь"] = "ʲ",
["ю"] = "ʲu",
["я"] = "ʲa",
-- Stress: combining accents in the respelling become IPA stress marks.
[GRAVE] = SECONDARY,
[ACUTE] = PRIMARY
}
-- Voiced obstruent -> voiceless counterpart. Applied by toIPA() to a run of voiced obstruents
-- standing before a voiceless obstruent or a word boundary ("#").
local devoicing = {
["b"] = "p", ["d"] = "t", ["ɡ"] = "k",
["z"] = "s", ["ʒ"] = "ʃ",
["v"] = "f"
}
-- Voiceless obstruent -> voiced counterpart. Applied by toIPA() to a run of voiceless obstruents
-- standing before one of b d ɡ z ʒ (note that v is not in that trigger set).
local voicing = {
["p"] = "b", ["t"] = "d", ["k"] = "ɡ",
["s"] = "z", ["ʃ"] = "ʒ", ["x"] = "ɣ",
["f"] = "v"
}
-- Prefixes where, if they occur at the beginning of the word and the stress is on the next syllable, we place the
-- syllable division directly after the prefix. For example, the default syllable-breaking algorithm would convert
-- безбра́чие to беˈзбрачие; but because it begins with без-, we convert it to безˈбрачие. Note that we don't (yet?)
-- convert измра́ to изˈмра instead of default измˈра, although we probably should.
--
-- Think twice before putting prefixes like на-, пре- and от- here, because of the existence of над-, пред-, and о-,
-- which are also prefixes.
--
-- The entries are spelled with the IPA symbols produced by phonetic_chars_map (e.g. "bɛz" for без-), because
-- toIPA() matches them against the term after it has been converted character by character.
local IPA_prefixes = {"bɛz", "vɤz", "vɤzproiz", "iz", "naiz", "poiz", "prɛvɤz", "proiz", "raz"}
-- Like rsubn(), but yields only the resulting string (the replacement count is dropped).
local function rsub(term, foo, bar)
	-- The extra parentheses truncate the multiple return values to the first one.
	return (rsubn(term, foo, bar))
end
-- Returns how many times `pattern` matches in `term`, i.e. the replacement count that
-- rsubn() reports when every match is replaced by the empty string.
local function count_matches(term, pattern)
	return (select(2, rsubn(term, pattern, "")))
end
-- Keeps applying rsub(term, foo, bar) until a pass leaves the string unchanged,
-- then returns that fixed point.
local function rsub_repeatedly(term, foo, bar)
	local before
	repeat
		before = term
		term = rsub(before, foo, bar)
	until term == before
	return term
end
-- Returns the single character of `str` at character position `index`
-- (positions are those of mw.ustring.sub, aliased above as `substring`).
local function char_at(str, index)
return substring(str, index, index)
end
-- Returns true if `str` begins with `substr` (compared character-wise, case-sensitively).
local function starts_with(str, substr)
return substring(str, 1, rlen(substr)) == substr
end
-- Number of Cyrillic vowel letters (as defined by hvowels_c) in `word`.
local function count_vowels(word)
return count_matches(word, hvowels_c)
end
-- Number of capital Cyrillic letters (as defined by capital_letters_c) in `word`.
local function count_capital_letters(word)
return count_matches(word, capital_letters_c)
end
-- Number of IPA stress marks (primary or secondary) in `ipa`.
local function count_accents(ipa)
return count_matches(ipa, accents_c)
end
-- Number of IPA vowel symbols (as defined by vowels_c) in `ipa`.
local function count_ipa_vowels(ipa)
return count_matches(ipa, vowels_c)
end
-- Strips pronunciation-only notation from a respelling so it can be shown as ordinary text.
--   text:         the respelling
--   remove_grave: if truthy, combining grave accents are removed as well
-- Always removes "." and the combining dot below, and replaces ў/Ў with у/У.
function export.remove_pron_notations(text, remove_grave)
	text = rsub(text, "[." .. DOTUNDER .. "]", "")
	text = rsub(rsub(text, "ў", "у"), "Ў", "У")
	if not remove_grave then
		-- Grave accents are kept (e.g. for the phonetic respelling).
		return text
	end
	-- Decompose so the grave is a separate combining character, drop it, then recompose.
	local decomposed = mw.ustring.toNFD(text)
	return mw.ustring.toNFC(rsub(decomposed, GRAVE, ""))
end
-- Converts a stress-marked Bulgarian respelling (Cyrillic) into an IPA string.
--   term:     the respelling; alternatively a table with an `args` field, in which case args[1] is
--             the respelling and args.endschwa the flag below.
--   endschwa: if truthy, a word-final "a" (optionally stressed and/or followed by "t") is rendered as ɤ.
-- Returns the IPA transcription without enclosing slashes/brackets.
-- Raises an error if the term contains a grave accent but no acute accent.
-- The substitutions below depend on each other's output; their order must be preserved.
function export.toIPA(term, endschwa)
if type(term) == "table" then -- called from a template or a bot
endschwa = term.args.endschwa
term = term.args[1]
end
local origterm = term
-- Work on lowercase, decomposed text so that accents are separate combining characters.
term = mw.ustring.toNFD(mw.ustring.lower(term))
term = rsub(term, "у" .. BREVE, "ў") -- recompose ў
term = rsub(term, "и" .. BREVE, "й") -- recompose й
if term:find(GRAVE) and not term:find(ACUTE) then
error("Use acute accent, not grave accent, for primary stress: " .. origterm)
end
-- allow DOTUNDER to signal same as endschwa=1
term = rsub(term, "а(" .. accents_c .. "?)" .. DOTUNDER, "ъ%1")
term = rsub(term, "я(" .. accents_c .. "?)" .. DOTUNDER, "ʲɤ%1")
-- Character-by-character conversion to IPA; characters without a mapping are kept.
term = rsub(term, ".", phonetic_chars_map)
-- Mark word boundaries
term = rsub(term, "(%s+)", "#%1#")
term = "#" .. term .. "#"
-- Convert verbal and definite endings
if endschwa then
term = rsub(term, "a(" .. PRIMARY .. "?t?#)", "ɤ%1")
end
-- Change ʲ to j after vowels or word-initially
term = rsub(term, "([" .. vowels .. "#]" .. accents_c .. "?)ʲ", "%1j")
-------------------- Move stress ---------------
-- At this point each stress mark follows its vowel; the steps below move it leftwards to the
-- start of the stressed syllable.
-- First, move leftwards over the vowel.
term = rsub(term, "(" .. vowels_c .. ")(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over j or soft sign.
term = rsub(term, "([jʲ])(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over a single consonant.
term = rsub(term, "(" .. cons_c .. ")(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over Cl/Cr combinations where C is an obstruent (NOTE: IPA ɡ).
term = rsub(term, "([bdɡptkxfv]" .. ")(" .. accents_c .. ")([rl])", "%2%1%3")
-- Then, move leftwards over kv/gv (NOTE: IPA ɡ).
term = rsub(term, "([kɡ]" .. ")(" .. accents_c .. ")(v)", "%2%1%3")
-- Then, move leftwards over sC combinations, where C is a stop or resonant (NOTE: IPA ɡ).
term = rsub(term, "([sz]" .. ")(" .. accents_c .. ")([bdɡptkvlrmn])", "%2%1%3")
-- Then, move leftwards over affricates not followed by a consonant.
term = rsub(term, "([td]" .. TIE .. "?)(" .. accents_c .. ")([szʃʒ][" .. vowels .. "ʲ])", "%2%1%3")
-- If we ended up in the middle of a tied affricate, move to its right.
term = rsub(term, "(" .. TIE .. ")(" .. accents_c .. ")(" .. cons_c .. ")", "%1%3%2")
-- Then, move leftwards over any remaining consonants at the beginning of a word.
term = rsub(term, "#(" .. cons_c .. "*)(" .. accents_c .. ")", "#%2%1")
-- Then correct for known prefixes.
for _, prefix in ipairs(IPA_prefixes) do
-- Split the prefix into its leading part and its run of final consonants.
local prefix_prefix, prefix_final_cons = rmatch(prefix, "^(.-)(" .. cons_c .. "*)$")
if prefix_final_cons then
-- Check for accent moved too far to the left into a prefix, e.g. безбрачие accented as беˈзбрачие instead
-- of безˈбрачие
term = rsub(term, "#(" .. prefix_prefix .. ")(" .. accents_c .. ")(" .. prefix_final_cons .. ")", "#%1%3%2")
end
end
-- If the previous substitution resulted in a stress occurring immediately after a consonant
-- but before a palatalizer mark, then put the stress before the consonant.
term = rsub(term, "(" .. cons_c .. ")" .. "(" .. accents_c .. ")" .. "ʲ", "%2%1ʲ")
-- Finally, if there is an explicit syllable boundary in the cluster of consonants where the stress is, put it there.
-- First check for accent to the right of the explicit syllable boundary.
term = rsub(term, "(" .. cons_c .. "*)%.(" .. cons_c .. "*)(" .. accents_c .. ")(" .. cons_c .. "*)", "%1%3%2%4")
-- Then check for accent to the left of the explicit syllable boundary.
term = rsub(term, "(" .. cons_c .. "*)(" .. accents_c .. ")(" .. cons_c .. "*)%.(" .. cons_c .. "*)", "%1%3%2%4")
-- Finally, remove any remaining syllable boundaries.
term = rsub(term, "%.", "")
-------------------- Vowel reduction (in unstressed syllables) ---------------
-- Maps each full vowel in `vowel` to its reduced counterpart (a, ɤ -> ɐ; ɔ, u -> o).
local function reduce_vowel(vowel)
return rsub(vowel, "[aɔɤu]", { ["a"] = "ɐ", ["ɔ"] = "o", ["ɤ"] = "ɐ", ["u"] = "o" })
end
-- Reduce all vowels before the stress, except if the word has no accent at all. (FIXME: This is presumably
-- intended for single-syllable words without accents, but if the word is multisyllabic without accents,
-- presumably all vowels should be reduced.)
-- NOTE: the vowel count below is taken over the whole original term, not per word.
term = rsub(term, "(#[^#" .. accents .. "]*)(.-#)", function(a, b)
if count_vowels(origterm) <= 1 then
return a .. b
else
return reduce_vowel(a) .. b
end
end)
-- Reduce all vowels after the accent except the first vowel after the accent mark (which is stressed).
term = rsub(term, "(" .. accents_c .. "[^aɛiɔuɤ#]*[aɛiɔuɤ])([^#" .. accents .. "]*)", function(a, b)
return a .. reduce_vowel(b)
end)
-------------------- Vowel assimilation to adjacent consonants (fronting/raising) ---------------
term = rsub(term, "([ʃʒʲj])([aouɤ])", "%1%2" .. FRONTED)
-- Hard l
-- (every l not followed by ʲ, ɛ or i becomes ɫ; repeated so that consecutive l's are all handled)
term = rsub_repeatedly(term, "l([^ʲɛi])", "ɫ%1")
-- Voicing assimilation
-- Devoice a run of voiced obstruents before a voiceless obstruent or a word boundary ...
term = rsub(term, "([bdɡzʒv" .. TIE .. "]*)(" .. accents_c .. "?[ptksʃfx#])", function(a, b)
return rsub(a, ".", devoicing) .. b end)
-- ... and voice a run of voiceless obstruents before a voiced obstruent.
term = rsub(term, "([ptksʃfx" .. TIE .. "]*)(" .. accents_c .. "?[bdɡzʒ])", function(a, b)
return rsub(a, ".", voicing) .. b end)
-- Nasal place assimilation: n -> ŋ before velars, m -> ɱ before labiodentals.
term = rsub(term, "n(" .. accents_c .. "?[ɡk]+)", "ŋ%1")
term = rsub(term, "m(" .. accents_c .. "?[fv]+)", "ɱ%1")
-- Sibilant assimilation
term = rsub(term, "[sz](" .. accents_c .. "?[td]?" .. TIE .. "?)([ʃʒ])", "%2%1%2")
-- Reduce consonant clusters
-- (drops t/d between a sibilant and one of t d k n m l; a stress mark in the cluster ends up
-- in front of the sibilant)
term = rsub(term, "([szʃʒ])[td](" .. accents_c .. "?)([tdknml])", "%2%1%3")
-- Strip hashes
term = rsub(term, "#", "")
return term
end
----Syllabification code----
-- Authorship: Chernorizets
-- Lua port: Kiril Kovachev
-- Builds a lookup set from a list: every value found in `t` becomes a key mapped to true.
local function set_of(t)
	local members = {}
	for _, item in pairs(t) do
		members[item] = true
	end
	return members
end

-- Membership test for sets built by set_of(). Returns true only if `value` is stored
-- with the exact value true; anything else (absent, or another value) gives false.
local function in_set(set, value)
	if set[value] == true then
		return true
	end
	return false
end
-- Classification of letters by phonetic category
-- All sets contain lowercase letters only; callers lowercase their input before testing.
-- NOTE(review): "ѝ" is counted as a vowel by hvowels_c (used in count_vowels) but is not in
-- vowels_syllab -- presumably harmless, but confirm this is intended.
local vowels_syllab = set_of {"а", "ъ", "о", "у", "е", "и", "ю", "я"}
local sonorants = set_of { "л", "м", "н", "р", "й", "ў"}
local stops = set_of {"б", "п", "г", "к", "д", "т"}
local fricatives = set_of {"в", "ф", "ж", "ш", "з", "с", "х"}
local affricates = set_of {"ч", "ц"}
-- The predicates below each take a single (lowercase) character.
local function is_vowel(ch)
return in_set(vowels_syllab, ch)
end
-- The soft sign only marks palatalization; get_sonority_model() skips it.
local function is_palatalizer(ch)
return ch == "ь"
end
local function is_sonorant(ch)
return in_set(sonorants, ch)
end
local function is_stop(ch)
return in_set(stops, ch)
end
local function is_fricative(ch)
return in_set(fricatives, ch)
end
local function is_affricate(ch)
return in_set(affricates, ch)
end
--[[
Sonority objects
A sonority object describes one sound of a word. It is a table with two fields:
	rank (int):        position of the sound in the sonority hierarchy
	                   (see get_sonority_rank);
	first_index (int): index, within the word, of the first letter that spells the sound.
A sound written with two letters (such as the affricate "дж") counts as one unit
for sonority purposes, so only the index of its first letter is recorded.
--]]
local function new_sonority(rank, first_index)
	return { rank = rank, first_index = first_index }
end
-- Sonority rank of a single lowercase letter:
--   1 = fricative, 2 = stop or affricate, 3 = sonorant, 4 = vowel, 0 = anything else.
local function get_sonority_rank(ch)
	if is_fricative(ch) then
		return 1
	elseif is_stop(ch) or is_affricate(ch) then
		return 2
	elseif is_sonorant(ch) then
		return 3
	elseif is_vowel(ch) then
		return 4
	else
		return 0
	end
end
-- Builds the sonority model of word[start_idx .. end_idx - 1]: a list
-- {[1] = sonority object, [2] = sonority object, ...} in left-to-right order
-- (see new_sonority for the layout of each object). The word is lowercased first.
local function get_sonority_model(word, start_idx, end_idx)
	local model = {}
	word = mw.ustring.lower(word)
	local pos = start_idx
	while pos < end_idx do
		local letter = char_at(word, pos)
		if letter == "щ" then
			-- One letter spelling two sounds (ш + т): emit both, sharing the same index.
			table.insert(model, new_sonority(get_sonority_rank("ш"), pos))
			table.insert(model, new_sonority(get_sonority_rank("т"), pos))
		elseif letter == "д" then
			-- 'д' may start the two-letter affricate 'дж' (the only digraph handled here).
			-- At the end of the range there is no next letter to look at.
			local following = (pos == end_idx - 1 and " ") or char_at(word, pos + 1)
			if following == "ж" then
				table.insert(model, new_sonority(2, pos)) -- 2 = affricate sonority rank
				pos = pos + 1 -- consume the 'ж' as well
			else
				table.insert(model, new_sonority(get_sonority_rank("д"), pos))
			end
		elseif not is_palatalizer(letter) then
			-- 'ь' is left out entirely since it doesn't change the sonority.
			table.insert(model, new_sonority(get_sonority_rank(letter), pos))
		end
		pos = pos + 1
	end
	return model
end
-- Forced breaks: the user may put BREAK_MARKER into the input to dictate a syllable break.
-- Looks for the first marker at or after range_start and returns its position if it lies
-- before range_end; returns -1 if the range is empty or no such marker exists.
-- word: string; range_start and range_end: integer character positions in word
local function find_forced_break(word, range_start, range_end)
	if range_start >= range_end then
		return -1
	end
	-- Plain (non-pattern) search, so "." is matched literally.
	local marker_pos = mw.ustring.find(word, BREAK_MARKER, range_start, true)
	if marker_pos == nil or marker_pos >= range_end then
		return -1
	end
	return marker_pos
end

-- Removes every "." (forced-break marker) from `segment`.
local function strip_forced_breaks(segment)
	return rsub(segment, "[.]", "")
end
---- Morphological prefix handling
--[[
This code brings morphological prefix awareness to syllabification.
This is necessary, because following the principle of rising sonority
alone fails to determine syllable boundaries correctly in some cases
— that is, when certain prefixes should be kept together as a first syllable.
]]
--[[
Affected prefixes. Each of them ends in a consonant that can be followed
by another consonant of a higher sonority in some words. In such cases,
naive syllable breaking would chop off the prefix's last consonant, and
glue it to the onset of the next syllable.
Entries are lowercase; find_separation_points() lowercases the word and tests
every entry (not just the first one that matches), so compound prefixes and
their shorter components can both contribute a separation point.
]]
local prefixes = {
-- без- family
"без",
-- из- family
"безиз", "наиз", "поиз", "произ", "преиз", "неиз", "из",
-- въз- family
"безвъз", "превъз", "невъз", "въз",
-- раз- family
"безраз", "предраз", "пораз", "нараз", "прераз", "нераз", "раз",
-- от- family
"неот", "поот", "от",
-- ending in fricatives
"екс", "таз", "дис",
-- ending in stops
"пред"
}
-- Returns true if, in `word`, the final consonant of `prefix` is immediately followed by a
-- consonant of strictly higher sonority rank. Only in that case would plain rising-sonority
-- syllabification pull the prefix's last consonant into the next syllable.
-- prefix, word: strings; `word` is expected to start with `prefix`.
local function followed_by_higher_sonority_cons(prefix, word)
	prefix = mw.ustring.lower(prefix)
	word = mw.ustring.lower(word)
	local prefix_len = rlen(prefix)
	local prefix_last_char = char_at(prefix, prefix_len)
	local first_char_after_prefix = char_at(word, prefix_len + 1)
	-- Prefixes followed by vowels do, in fact, get broken up.
	if is_vowel(first_char_after_prefix) then return false end
	return get_sonority_rank(prefix_last_char) < get_sonority_rank(first_char_after_prefix)
end

--[[
Finds the separation points between morphological prefixes and the rest
of the word.
word: the word to check for prefixes
Returns a list (possibly empty) with one entry per matching prefix. Each entry
is the 1-based index of the first character after that prefix. A prefix only
counts as matching if the word starts with it and the boundary is not already
handled correctly by the sonority model (see followed_by_higher_sonority_cons).
Entries appear in the order in which the prefixes are listed in `prefixes`.
]]
local function find_separation_points(word)
	local separation_points = {}
	word = mw.ustring.lower(word)
	-- ipairs, not pairs: `prefixes` is an ordered list and the order of the result
	-- determines which separation point a caller sees first.
	for _, prefix in ipairs(prefixes) do
		if starts_with(word, prefix) and followed_by_higher_sonority_cons(prefix, word) then
			table.insert(separation_points, rlen(prefix) + 1)
		end
	end
	return separation_points
end
---- Main syllabification code
--[[
Context objects bundle the data shared by the syllabification helpers:
{
	word (string): the word being syllabified,
	prefix_separation_points (table[int]): result of find_separation_points(word)
}
]]
local function new_context(word, pos)
	return { word = word, prefix_separation_points = pos }
end
--[[
Consonant clusters that exhibit rising sonority, but should be
broken up regardless to produce natural-sounding syllables.
The breakpoint for clusters of 3 or more consonants can vary –
here we provide a zero-based offset within the cluster for each.
The next syllable starts at (index of the cluster's first letter) + offset,
so an offset of 1 leaves the first consonant with the preceding syllable.
A cluster only applies when it is the entire run of letters between two vowels
(see fixup_syllable_onset).
]]
local sonority_exception_break = {
["км"] = 1, ["гм"] = 1, ["дм"] = 1, ["вм"] = 1,
["зм"] = 1, ["цм"] = 1, ["чм"] = 1,
["дн"] = 1, ["вн"] = 1, ["тн"] = 1, ["чн"] = 1,
["кн"] = 1, ["гн"] = 1, ["цн"] = 1,
["зд"] = 1, ["зч"] = 1, ["зц"] = 1,
["вк"] = 1, ["вг"] = 1, ["дл"] = 1, ["жд"] = 1,
["згн"] = 1, ["здн"] = 2, ["вдж"] = 1
}
-- Clusters that are never broken up: when one of these is the entire run of letters between
-- two vowels, the whole cluster becomes the onset of the next syllable.
local sonority_exception_keep = {
"ств", "св", "вс"
}
-- Returns `word` prepared for syllabification; nil becomes the empty string.
-- NOTE(review): the two patterns below use regex-style "\s" and a trailing "^". In Lua patterns
-- the whitespace class is "%s" and the end anchor is "$", so as written these patterns look for a
-- literal backslash followed by "s" and do not strip whitespace. Do not "fix" this in isolation:
-- tokenize_words() leaves the delimiter (space or hyphen) attached to the end of each token and
-- export.syllabify() re-joins the results with "", so actually trimming here would remove the
-- spaces between words from the output.
local function normalize_word(word)
if word == nil then return "" end
word = rsub(rsub(word, "^\\s+", ""), "\\s+^", "") -- Strip spaces
return word
end
-- Cleans up one syllable for output: forced-break markers are removed and the
-- respelling letter ў/Ў is written as plain у/У.
local function normalize_syllable(syllable)
	local cleaned = strip_forced_breaks(syllable)
	return rsub(rsub(cleaned, "ў", "у"), "Ў", "У")
end
-- Scans a sonority model (non-empty list of sonority objects, left to right) for the first
-- sound whose rank does not rise above the rank of the sound before it.
-- Returns the first_index of that sound, i.e. the tentative start of the next syllable.
-- If sonority rises throughout, the whole cluster belongs to the next syllable and the
-- first_index of the first sound is returned.
local function find_rising_sonority_break(sonorities)
	local prev_rank = -1
	-- ipairs, not pairs: the scan must visit the sounds strictly in list order, and the
	-- traversal order of pairs is not specified.
	for _, curr in ipairs(sonorities) do
		if curr.rank <= prev_rank then
			-- Found a break.
			return curr.first_index
		end
		prev_rank = curr.rank
	end
	-- There was no rising sonority break. Start syllable at first index.
	return sonorities[1].first_index
end
-- Case-insensitively checks whether the characters str[start_idx .. end_idx - 1]
-- are exactly `substr`. The lengths must agree, so a partial overlap does not count.
local function matches(str, substr, start_idx, end_idx)
	local span = end_idx - start_idx
	if span ~= rlen(substr) then
		return false
	end
	str = mw.ustring.lower(str)
	substr = mw.ustring.lower(substr)
	for offset = 0, span - 1 do
		if char_at(str, start_idx + offset) ~= char_at(substr, offset + 1) then
			return false
		end
	end
	return true
end
-- Applies the exceptions to the rising-sonority rule for the consonant cluster between two
-- vowels and returns the index at which the next syllable starts.
-- ctx: context object
-- left_vowel, right_vowel: integer indices of the vowels surrounding the cluster
-- sonority_break: integer, the onset suggested by find_rising_sonority_break; used as the
--                 fallback when no exception applies
local function fixup_syllable_onset(ctx, left_vowel, sonority_break, right_vowel)
	local word = mw.ustring.lower(ctx.word)
	local cluster_start = left_vowel + 1

	-- 'щр' is a syllable onset when in front of a vowel.
	-- 'щ' + any other sonorant technically follows rising sonority too, but syllables
	-- like щнV, щлV etc. are unnatural and incorrect, so there only the sonorant
	-- starts the next syllable.
	if char_at(word, right_vowel - 2) == "щ" then
		local penult = char_at(word, right_vowel - 1)
		if penult == "р" then
			return right_vowel - 2
		elseif is_sonorant(penult) then
			return right_vowel - 1
		end
	end

	-- Clusters that must stay together: the onset is the beginning of the cluster.
	for _, cluster in pairs(sonority_exception_keep) do
		if matches(word, cluster, cluster_start, right_vowel) then
			return cluster_start
		end
	end

	-- Clusters that must be split even though they obey rising sonority.
	for cluster, offset in pairs(sonority_exception_break) do
		if matches(word, cluster, cluster_start, right_vowel) then
			return cluster_start + offset
		end
	end

	-- A morphological prefix boundary inside the cluster takes precedence over the
	-- sonority-based break.
	for _, pos in pairs(ctx.prefix_separation_points) do
		if pos > left_vowel and pos < right_vowel then
			return pos
		end
	end

	return sonority_break
end
-- Determines where the syllable containing right_vowel starts, given the previous vowel.
-- ctx: context object
-- left_vowel, right_vowel: integer indices of two consecutive vowels in ctx.word
-- Returns the index of the first character of the new syllable.
local function find_next_syllable_onset(ctx, left_vowel, right_vowel)
	local cluster_start = left_vowel + 1
	local n_cons = right_vowel - cluster_start

	-- Adjacent vowels: the new syllable starts on the right vowel itself.
	if n_cons == 0 then
		return right_vowel
	end

	-- A user-supplied break marker between the vowels wins; the syllable starts right after it.
	local break_pos = find_forced_break(ctx.word, cluster_start, right_vowel)
	if break_pos ~= -1 then
		return break_pos + 1
	end

	-- A single consonant between two vowels starts the new syllable.
	if n_cons == 1 then
		return cluster_start
	end

	-- Two or more consonants: take the point (if any) where sonority stops rising as the
	-- tentative onset, then let the exception rules adjust it to avoid
	-- unnatural-sounding syllables.
	local sonority_break = find_rising_sonority_break(
		get_sonority_model(ctx.word, cluster_start, right_vowel)
	)
	return fixup_syllable_onset(ctx, left_vowel, sonority_break, right_vowel)
end
-- Removes the combining acute, grave and dot-below marks from `term`.
local function deaccent(term)
	local marks_c = "[" .. ACUTE .. GRAVE .. DOTUNDER .. "]"
	return rsub(term, marks_c, "")
end

-- Like deaccent(), but additionally writes the respelling letter ў/Ў as plain у/У.
local function deaccent_all(term)
	return deaccent(rsub(rsub(term, "ў", "у"), "Ў", "У"))
end
-- Splits a word into syllables.
-- Returns a list (table) of strings which, concatenated, give back `word`.
local function syllabify_poly(word)
	local syllables = {}
	local ctx = new_context(word, find_separation_points(word))
	local prev_vowel = -1 -- index of the last vowel seen; -1 until the first one
	local prev_onset = 1 -- index at which the syllable currently being built starts

	for i = 1, rlen(word) do
		if is_vowel(mw.ustring.lower(char_at(word, i))) then
			if prev_vowel ~= -1 then
				-- Not the first vowel: somewhere between the previous vowel and this
				-- one there is a syllable break, and the first character after the
				-- break starts a new syllable.
				local next_onset = find_next_syllable_onset(ctx, prev_vowel, i)
				table.insert(syllables, substring(word, prev_onset, next_onset - 1))
				prev_onset = next_onset
			end
			prev_vowel = i
		end
	end

	-- Whatever remains after the last break is the final syllable.
	table.insert(syllables, substring(word, prev_onset))
	return syllables
end
-- Syllabifies a single word and returns its syllables joined by HYPH.
-- Returns "" for nil or empty input. A word with at most one vowel is a single syllable.
function export.syllabify_word(word)
	local norm = normalize_word(word)
	if rlen(norm) == 0 then
		return ""
	end

	local syllables
	if count_vowels(norm) <= 1 then
		syllables = {norm}
	else
		syllables = syllabify_poly(norm)
	end

	-- Strip break markers and respelling-only letters from each syllable.
	local cleaned = {}
	for idx, syllable in pairs(syllables) do
		cleaned[idx] = normalize_syllable(syllable)
	end
	return table.concat(cleaned, HYPH)
end
-- Cuts `term` into tokens after every space or hyphen. The delimiter stays attached to the
-- end of the token it terminates, so concatenating the tokens reproduces `term`.
-- The last token (possibly empty) is whatever follows the final delimiter.
local function tokenize_words(term)
	local tokens = {}
	local token_start = 1
	local total = rlen(term)
	for pos = 1, total do
		local ch = char_at(term, pos)
		if ch == " " or ch == "-" then
			tokens[#tokens + 1] = substring(term, token_start, pos)
			token_start = pos + 1
		end
	end
	tokens[#tokens + 1] = substring(term, token_start, total)
	return tokens
end
-- Syllabify a whole term (possibly several words joined by spaces or hyphens).
-- Accent marks are stripped first; each token from tokenize_words() is syllabified on its
-- own and the results are concatenated back in their original order.
function export.syllabify(term)
    term = deaccent(term)
    local pieces = {}
    -- ipairs, not pairs: the tokens form a sequence and the output depends on their order,
    -- which pairs() does not guarantee.
    for _, word in ipairs(tokenize_words(term)) do
        pieces[#pieces + 1] = export.syllabify_word(word)
    end
    return table.concat(pieces, "")
end
---Hyphenation
-- Hyphenate a word from its existing syllabification.
-- `syllabification` is a string whose syllables are separated by HYPH. The result is the same
-- text after accent removal, with some HYPH break points shifted or deleted by the
-- substitutions below. Each substitution is re-applied until it no longer changes the string.
function export.hyphenate(syllabification)
-- Source: http://logic.fmi.uni-sofia.bg/hyphenation/hyph-bg.html#hyphenation-rules-between-1983-and-2012
-- Also note: the rules from 2012 onward, which encode the modern standard, are entirely
-- backwards-compatible with the previous standard. Thus our code can generate valid 2012
-- hyphenations despite only explicitly implementing the older (1983) rules.
---Pre-processing----
local word = deaccent(syllabification)
-- Replace lowercase "дж" (right after a break, word-finally, or word-initially) with the
-- placeholder "#". hcons_c accepts "#", so the rules below treat the digraph as one consonant.
word = rsub_repeatedly(word, HYPH .. "дж", HYPH .. "#")
word = rsub_repeatedly(word, "дж$", "#")
word = rsub_repeatedly(word, "^дж", "#")
-- vowel + break + consonant + one or more consonants (ь excluded from the trailing run):
-- move the break so that it falls after the first consonant.
word = rsub_repeatedly(word, "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hcons_c .. ")(" .. rsub(hcons_c, "[ьЬ]", "") .. "+)", "%1%2" .. HYPH .. "%3")
-- consonant (other than й) + one or more consonants + break:
-- move the break so that it falls directly after the first consonant.
word = rsub_repeatedly(word, "(" .. rsub(hcons_c, "[йЙ]", "") .. ")(" .. hcons_c .. "+)" .. HYPH, "%1" .. HYPH .. "%2")
-- Delete a break that would leave a single vowel alone at the start of the word ...
word = rsub_repeatedly(word, "^(" .. hvowels_c .. ")" .. HYPH, "%1")
-- ... or alone at the end of the word.
word = rsub_repeatedly(word, HYPH .. "(" .. hvowels_c .. ")$", "%1")
-- vowel + break + vowel + break + vowel: drop the first break so the middle vowel is not isolated.
word = rsub_repeatedly(word, "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hvowels_c .. ")", "%1%2" .. HYPH .. "%3")
-- break + vowel + break + consonant: drop the second break, attaching the lone vowel to what follows.
word = rsub_repeatedly(word, HYPH .. "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hcons_c .. ")", HYPH .. "%1%2")
-- Restore the digraph from its placeholder.
word = rsub_repeatedly(word, "#", "дж")
return word
end
-- Hyphenate a raw word in one step: syllabify it, then hyphenate that syllabification
-- (used in the test suite).
function export.hyphenate_total(word)
    return export.hyphenate(export.syllabify(word))
end
-- Build the bold annotation prefix shown before an IPA line.
-- `ann` of "1" or "y" means "use the term itself" (pronunciation notations and grave
-- accents removed); any other truthy value is shown verbatim; no `ann` gives "".
local function get_anntext(term, ann)
    if not ann then
        return ""
    end
    local shown = ann
    if ann == "1" or ann == "y" then
        -- remove secondary stress annotations
        shown = export.remove_pron_notations(term, true)
    end
    return "'''" .. shown .. "''': "
end
-- Wikitext captions passed to the hyphenation formatter; each links to the matching
-- section of Appendix:Bulgarian hyphenation as a superscript "key".
local HYPHENATION_LABEL = "Hyphenation<sup>([[Appendix:Bulgarian hyphenation#Hyphenation|key]])</sup>"
local SYLLABIFICATION_LABEL = "Syllabification<sup>([[Appendix:Bulgarian hyphenation#Syllabification|key]])</sup>"
-- Render a HYPH-separated string as wikitext via the hyphenation module.
-- `label` overrides the caption; it defaults to HYPHENATION_LABEL.
local function format_hyphenation(hyphenation, label)
    -- remove grave/acute accent, then split into the individual parts
    local parts = rsplit(deaccent(hyphenation), HYPH)
    local caption = label or HYPHENATION_LABEL
    return require(hyphenation_module).format_hyphenations({
        lang = lang,
        hyphs = { { hyph = parts } },
        sc = script,
        caption = caption,
    })
end
-- Same rendering as format_hyphenation(), but captioned as a syllabification.
local function format_syllabification(syllabification)
    local caption = SYLLABIFICATION_LABEL
    return format_hyphenation(syllabification, caption)
end
-- Display syllabification and hyphenation: one line when they coincide, two lines otherwise.
-- `indentation` is the number of "*" characters placed before the second line.
-- A value of "-" for either item suppresses that item.
-- Users must put a * (or **) before the template usage.
local function render_bg_hyph(term, indentation, syllabification, hyphenation)
    syllabification = syllabification or export.syllabify(term)
    hyphenation = hyphenation or export.hyphenate(syllabification)
    local show_syllabification = syllabification ~= "-"

    if syllabification == hyphenation then
        if show_syllabification then
            return format_syllabification(syllabification)
        end
        return ""
    end

    local syllabification_text = format_syllabification(syllabification)
    local hyphenation_text = format_hyphenation(hyphenation)

    if hyphenation == "-" then
        if show_syllabification then
            return syllabification_text
        end
        return ""
    end
    if not show_syllabification then
        return hyphenation_text
    end
    return syllabification_text .. "\n" .. mw.ustring.rep("*", indentation) .. " " .. hyphenation_text
end
-- Entry point to {{bg-hyph}}
-- Parameter 1 is the term (defaults to a sample word in the Template namespace, otherwise
-- to the page title); `indent` is the bullet depth for the second line (default 1).
function export.show_hyphenation(frame)
    local spec = {
        [1] = {},
        ["indent"] = { type = "number" },
    }
    local current_title = mw.title.getCurrentTitle()
    local args = require(parameters_module).process(frame:getParent().args, spec)
    local term = args[1]
    if not term then
        if current_title.nsText == "Template" then
            term = "при́мер"
        else
            term = current_title.text
        end
    end
    return render_bg_hyph(term, args["indent"] or 1)
end
-- Extract the rhyme from an IPA transcription.
-- Scans `ipa` backwards for the last stress mark and returns the tail of the string that
-- starts at the stressed vowel, or, for words stressed on an open final syllable, at the
-- consonant (or affricate) before it. If no stress mark exists, a rhyme is still produced
-- when the transcription contains exactly one vowel; otherwise nil is returned.
function export.get_rhymes(ipa)
-- The FRONTED diacritic is dropped before scanning.
ipa = rsub(ipa, FRONTED, "")
local length = rlen(ipa)
local i = length
-- Number of vowels met so far while walking backwards from the end.
local vowels_seen = 0
-- True once a consonant has been met before any vowel, i.e. the word ends in a consonant.
local final_consonant_found = false
-- March until accent is found
while i > 0 do
-- Track vowel or final consonant if found
if vowels_seen == 0 and rmatch(char_at(ipa, i), cons_c) then
final_consonant_found = true
end
if rmatch(char_at(ipa, i), vowels_c) then
vowels_seen = vowels_seen + 1
end
if rmatch(char_at(ipa, i), accents_c) then
-- Note whether the string ends in vowel + accent + vowel
local final_vowel_cluster = rmatch(ipa, vowels_c .. accents_c .. vowels_c .. "$")
-- March until the vowel first following the accent is found
while i <= length and not rmatch(char_at(ipa, i), vowels_c) do
i = i + 1
end
-- March back if only a single word-final vowel was previously spotted –
-- this corresponds to final-syllable-stressed words, whose rhyme
-- needs to include a consonant according to Bulgarian rhyming rules.
if vowels_seen <= 1 and not final_consonant_found and not final_vowel_cluster then
-- Walk left to the nearest consonant symbol; the palatalization mark ʲ does not count.
while i > 1 and not rmatch(char_at(ipa, i), rsub(cons_c, "ʲ", "")) do
i = i - 1
end
-- Account for affricates (note: this can only occur in
-- consonant-rhyme, i.e. final-stressed words)
if i > 1 and char_at(ipa, i-1) == TIE then
-- If a tie is present, there must be a letter before it as well.
i = i - 2
elseif i > 1 and char_at(ipa, i) == "ʒ" and char_at(ipa, i-1) == "d" then
-- Treat [dʒ] sequence as an affricate – this can have some edge cases.
-- In future, the module should distinguish [d.ʒ] and [d͡ʒ].
i = i - 1
end
end
return substring(ipa, i)
end
i = i - 1
end
-- No stress mark anywhere: only single-vowel transcriptions get a rhyme.
local n_vowels = count_ipa_vowels(ipa)
if n_vowels == 1 then
i = length
if rmatch(char_at(ipa, i), cons_c) then
-- Ends in a consonant: the rhyme starts at the vowel.
while i > 1 and not rmatch(char_at(ipa, i), vowels_c) do
i = i - 1
end
else
-- Does not end in a consonant: walk left to the nearest consonant symbol (ʲ excluded).
while i > 1 and not rmatch(char_at(ipa, i), rsub(cons_c, "ʲ", "")) do
i = i - 1
end
end
-- Include the first half of an affricate joined by a tie bar.
if i > 1 and char_at(ipa, i - 1) == TIE then
i = i - 2
end
return substring(ipa, i)
end
return nil
end
-- Render one IPA transcription as wikitext, wrapped in narrow-transcription brackets,
-- with optional qualifiers (q, qq) and accent labels (a, aa).
local function format_ipa(ipa, q, qq, a, aa)
    local bracketed = "[" .. ipa .. "]"
    return require(ipa_module).format_IPA_full({
        lang = lang,
        items = {{ pron = bracketed }},
        q = q,
        qq = qq,
        a = a,
        aa = aa,
    })
end
-- Template entry point that renders a single IPA line, optionally preceded by an annotation.
-- The term comes from parameter 1, then `pagename`, then a sample word (Template namespace)
-- or the page name from the headword data module.
function export.show(frame)
    local spec = {
        [1] = {},
        ["endschwa"] = { type = "boolean" },
        ["ann"] = {},
        ["q"] = { type = "qualifier" },
        ["qq"] = { type = "qualifier" },
        ["a"] = { type = "labels" },
        ["aa"] = { type = "labels" },
        ["pagename"] = {},
    }
    local args = require(parameters_module).process(frame:getParent().args, spec)

    local term = args[1] or args.pagename
    if not term then
        if mw.title.getCurrentTitle().nsText == "Template" then
            term = "при́мер"
        else
            term = mw.loadData(headword_data_module).pagename
        end
    end

    local ipa = export.toIPA(term, args.endschwa)
    local ipa_text = format_ipa(ipa, args.q, args.qq, args.a, args.aa)
    local anntext = get_anntext(term, args.ann)

    -- Terms with a lack of stress despite not being monosyllabic
    local is_polysyllabic = count_vowels(term) > 1
    if is_polysyllabic and count_accents(ipa) == 0 then
        require(tracking_module)("bg-IPA/no stress")
    end

    return anntext .. ipa_text
end
-- Convert a rhyme suffix, its syllable counts and optional qualifiers/labels to wikitext.
-- `l` and `ll` are forwarded to the rhymes module as its `a` and `aa` fields.
local function format_rhymes(rhyme_suffix, syllable_counts, q, qq, l, ll)
    local entry = {rhyme = rhyme_suffix, num_syl = syllable_counts, q = q, qq = qq, a = l, aa = ll}
    local data = {
        lang = lang,
        rhymes = { entry },
    }
    return require(rhymes_module).format_rhymes(data)
end
-- Entry point for {{bg-rhymes}}
-- Parameters: 1 = term (falls back to `pagename`, then a sample word in the Template
-- namespace, then the page name); `s` = manual syllable count(s); `q`/`qq` = qualifiers;
-- `a`/`aa` = labels; `endschwa` = forwarded to toIPA().
function export.show_rhymes(frame)
    local params = {
        [1] = {},
        ["pagename"] = {},
        -- Declared so that args.endschwa below can actually carry a value. It was read
        -- but never declared, so it was always nil (same declaration as in export.show).
        ["endschwa"] = { type = "boolean" },
        ["s"] = { sublist = true, type = "number", },
        ["q"] = { type = "qualifier", },
        ["qq"] = { type = "qualifier", },
        ["a"] = { type = "labels", },
        ["aa"] = { type = "labels", },
    }
    local args = require(parameters_module).process(frame:getParent().args, params)
    local term = args[1] or args.pagename or mw.title.getCurrentTitle().nsText == "Template" and "при́мер" or
        mw.loadData(headword_data_module).pagename
    local ipa = export.toIPA(term, args.endschwa)
    local rhymes = export.get_rhymes(ipa)
    -- Without a manual count, the number of vowel letters in the term is the syllable count.
    local syllable_counts = args.s or {count_vowels(term)}
    return format_rhymes(rhymes, syllable_counts, args.q, args.qq, args.a, args.aa)
end
-- Matches patterns such as: Bg-къща.ogg<Sofia>,
-- with capture groups [1]="Bg-къща.ogg", [2]="Sofia"
-- (format_audio_list splits capture [2] on commas into a list of accent labels)
local accent_qualifier_pattern = "(.-)<(.+)>"
-- Matches speaker profiles, i.e. a shorthand for representing a given
-- speaker and the properties of their audio.
-- Captures: [1] text before the separator, [2] the separator (":" or "~", may be empty),
-- [3] text after the separator. Capture [1] is lazy, so a bare "[NAME]" produces
-- [1]="" and [3]="NAME"; format_audio_list swaps them back in that case.
local speaker_profile_pattern = "%[([^:~]-)([:~]?)([^:~]*)%]"
-- Profile definitions and their rendering functions, both taken from the same submodule.
local speaker_profiles = require("Module:bg-pronunciation/speaker profiles").speaker_profiles
local audio_functions = require("Module:bg-pronunciation/speaker profiles").audio_functions
-- Return a list of audio formatted as wikitext.
-- `list` is a "#"-separated string of audio specs (or nil). Each spec is either a speaker
-- profile shorthand such as [NAME], [NAME:file] or [NAME~suffix], or a plain file name
-- optionally followed by <label,label,...>.
-- Returns two values: the list of rendered audio strings (in spec order) and a boolean
-- that is true when some speaker-profile renderer produced nothing, meaning the caller
-- should request audio.
local function format_audio_list(list, ipa, pagename, corresponding_respelling)
    local request_rfap = false
    if list == nil then
        return {}, request_rfap
    end
    local audios = {}
    -- Audio list is separated by # symbols. ipairs keeps the specs in the order given;
    -- pairs() does not guarantee any order.
    for _, spec in ipairs(rsplit(list, "#")) do
        -- Try to match speaker profile
        local speaker_profile_name, separator, term_override = rmatch(spec, speaker_profile_pattern)
        -- The lazy first capture leaves a bare "[NAME]" in the third capture; move it back.
        if speaker_profile_name == "" and term_override ~= "" then
            speaker_profile_name = term_override
            term_override = nil
        end
        if speaker_profile_name then
            local speaker_profile = speaker_profiles[speaker_profile_name]
            if not speaker_profile then
                error("Speaker profile named '" .. speaker_profile_name .. "' does not exist")
            end
            -- Track uses of a particular speaker profile
            require(tracking_module)("bg-pr/speaker-profile/" .. speaker_profile_name)
            -- E.g. [ABC~2] on page="човек" is equivalent to: [ABC:човек-2].
            if separator == "~" then
                term_override = mw.loadData(headword_data_module).pagename .. "-" .. term_override
            end
            -- An explicit but empty override ("[ABC:]") means "use the respelling".
            if term_override == "" then
                term_override = corresponding_respelling
            end
            local renderer_name = speaker_profile["renderer"]
            local renderer = audio_functions[renderer_name]
            if not renderer then
                -- Fail with a readable message instead of "attempt to index a nil value".
                error("Speaker profile named '" .. speaker_profile_name .. "' uses unknown renderer '" ..
                    tostring(renderer_name) .. "'")
            end
            local filename = term_override or pagename
            local rendered = renderer.display(speaker_profile, filename, {ipa=ipa})
            if rendered then
                table.insert(audios, rendered)
            else
                request_rfap = true
            end
        else
            -- Attempt to match qualifiers; if none given, then the entire spec is simply interpreted as a file name.
            local filename, accents_string = rmatch(spec, accent_qualifier_pattern)
            filename = filename or spec
            local accents_list = accents_string and rsplit(accents_string, ",") or nil
            table.insert(audios,
                require(audio_module).format_audio({
                    lang = lang,
                    file = filename,
                    a = accents_list,
                })
            )
        end
    end
    return audios, request_rfap
end
-- Render a list of homophone terms as wikitext via the homophones module.
-- The terms are displayed in the order given.
local function format_homophones(homophones_list)
    local homophones_data = {}
    -- ipairs, not pairs: the list is a sequence and its order is shown to the reader.
    for idx, hmp in ipairs(homophones_list) do
        homophones_data[idx] = { term = hmp }
    end
    return require(homophones_module).format_homophones({
        lang = lang,
        homophones = homophones_data,
    })
end
-- Entry point for {{bg-pr}}
-- Renders, for every respelling in parameter 1, an IPA line plus audio, rhymes, homophones,
-- syllabification and hyphenation. A property whose value is identical on every
-- pronunciation line is shown once at the end; otherwise it is shown indented under each line.
function export.show_all(frame)
    local params = {
        [1] = { list = true, disallow_holes = true},
        ["q"] = { list = true, type = "qualifier", allow_holes=true },
        ["qq"] = { list = true, type = "qualifier", allow_holes=true },
        ["l"] = { list = true, type = "labels", allow_holes=true },
        ["ll"] = { list = true, type = "labels", allow_holes=true },
        ["ann"] = { list = true, allow_holes=true, separate_no_index = true },
        ["audio"] = { list = true, allow_holes=true },
        ["a"] = { alias_of = "audio", list = true, allow_holes=true },
        ["rhymes"] = { list = true, separate_no_index = true, allow_holes=true },
        ["s"] = { list = true, type = "number", separate_no_index = true, allow_holes=true },
        ["syllabification"] = { list = true, separate_no_index = true, allow_holes=true },
        ["syl"] = { alias_of = "syllabification", list = true, separate_no_index = true, allow_holes=true },
        ["hyphenation"] = { list = true, separate_no_index = true, allow_holes=true },
        ["hyph"] = { alias_of = "hyphenation", list = true, separate_no_index = true, allow_holes=true },
        ["homophones"] = { list = true, allow_holes=true },
        ["hs"] = { list = true, separate_no_index = true, allow_holes=true}, -- Hyphenation and syllabification override at once
        ["hmp"] = { alias_of = "homophones", list = true, allow_holes=true },
        ["endreduce"] = { list = true, allow_holes=true },
        ["endschwa"] = { alias_of = "endreduce", list = true, allow_holes=true },
        ["raw"] = { list = true, allow_holes=true },
        ["pagename"] = {},
    }
    local args = require(parameters_module).process(frame:getParent().args, params)
    local pagename = args.pagename or mw.title.getCurrentTitle().nsText == "Template" and "при́мер" or
        mw.loadData(headword_data_module).pagename
    -- Ensure at least one pronunciation line present (unlikely to be desired in the case of multisyllabic words, though)
    if #args[1] == 0 then
        args[1] = {pagename}
    end

    -- Returns the hyphenation for a term if one is given by the user,
    -- or automatically generate one from the respelling if it meets the criteria:
    --[[
    - must have more than one vowel
    - the respelling given must be the same as the page title (when accents
    are removed)
    --]]
    -- Special values of `given`: "+" forces generation from the respelling, "#" forces
    -- generation from the page name; any other value is used as-is with "." turned into HYPH.
    -- The result "-" means "nothing to display".
    local syllabify = export.syllabify
    local function hyphenate(x) return export.hyphenate(export.syllabify(x)) end
    local function deal_with_hyph_syl_respellings(given, respelling, hyphenate_or_syllabify)
        if given == "+" then
            return hyphenate_or_syllabify(respelling)
        elseif given == "#" then
            return hyphenate_or_syllabify(pagename)
        elseif given then
            return rsub(given, "%.", HYPH)
        elseif count_vowels(respelling) == 1 or rsub(deaccent_all(respelling), "%.", "") ~= pagename then
            return "-"
        else
            return hyphenate_or_syllabify(respelling)
        end
    end

    -- Return nil if a rhyme should not be added based on the term.
    --[[ The current rules are:
    - if a manual override is given by the user, that will be the rhyme regardless
    - if no override is given and the term contains a space or hyphen, return nil
    - if there is no space and hyphen, but there is more than 1 capital letter,
    then the term will be diagnosed as an abbreviation, and nil will be returned
    (this logic will help to keep rhymes for names, e.g. Петър)
    - if there is more than 1 accent mark (primary or secondary combined)
    in the IPA, then nil is returned
    - if all the above guards fail, the module will generate a rhyme
    (despite appearances, this will actually be most words anyway)
    --]]
    local function deal_with_rhymes(override, ipa)
        if override then
            return override
        end
        if count_capital_letters(pagename) > 1 then
            return nil
        end
        if count_accents(ipa) > 1 then
            return nil
        end
        if rmatch(ipa, "[ %-]") or rmatch(pagename, "[ %-]") then
            return nil
        end
        return export.get_rhymes(ipa)
    end

    -- Track whether an audio file has been included using a speaker profile but doesn't yet exist; automatically {{rfap}} if so.
    local request_rfap = false

    -- Build up wikitext output for each pronunciation line.
    -- ipairs is used for every ordered list in this function: the output order (and the
    -- one-to-one correspondence between respellings and pronunciation_lines) depends on
    -- it, and pairs() does not guarantee any order.
    local pronunciation_lines = {}
    for i, respelling in ipairs(args[1]) do
        local q = args.q[i]
        local qq = args.qq[i]
        local l = args.l[i]
        local ll = args.ll[i]
        local num_syllables = args.s.default or args.s[i] or count_vowels(respelling)
        local ipa = args.raw[i] or export.toIPA(respelling, args.endreduce[i])
        local audio, request_rfap_local = format_audio_list(args.audio.default or args.audio[i], ipa, pagename, respelling)
        local rhymes = deal_with_rhymes(args.rhymes.default or args.rhymes[i], ipa) or "-"
        local homophones = args.homophones[i] and rsplit(args.homophones[i], "#")
        -- `hs` overrides syllabification and hyphenation at once. The per-line value is
        -- args.hs[i]; the previous code read args.hs[1] on every line, so hs2=, hs3=, ...
        -- were silently ignored and hs1= leaked onto all lines.
        local hs = args.hs.default or args.hs[i]
        local syllabification = deal_with_hyph_syl_respellings(hs or args.syllabification.default or args.syllabification[i], respelling, syllabify)
        local hyphenation = deal_with_hyph_syl_respellings(hs or args.hyphenation.default or args.hyphenation[i], respelling, hyphenate)
        local ann = args.ann.default or args.ann[i]
        table.insert(pronunciation_lines, {
            term = respelling,
            q = q,
            qq = qq,
            l = l,
            ll = ll,
            num_syllables = num_syllables,
            ipa = ipa,
            audio = audio,
            rhymes = rhymes,
            homophones = homophones,
            syllabification = syllabification,
            hyphenation = hyphenation,
            ann = ann,
        })
        if args.rhymes[i] then
            require(tracking_module)("bg-pr/manual rhyme")
            if export.get_rhymes(ipa) ~= args.rhymes[i] then
                -- Manual rhyme actually changes the displayed rhyme
                require(tracking_module)("bg-pr/rhyme override discrepancy")
            end
        end
        if request_rfap_local then
            request_rfap = true
        end
        -- Terms with a lack of stress despite not being monosyllabic
        if count_vowels(respelling) > 1 and count_accents(ipa) == 0 then
            require(tracking_module)("bg-pr/no stress")
        end
    end

    -- This function is used to check whether all pronunciation lines have the same value for
    -- a particular property. If they do, then that property should only be rendered once,
    -- underneath each IPA.
    -- If the properties are different, then each IPA should have that property value specified
    -- indented underneath it, e.g. multiple IPAs with different audio files should have
    -- their audios indented beneath each IPA.
    -- Returns the first line's value and a boolean telling whether all lines agree.
    local function all_the_same(property, eq) -- `eq` allows the notion of "the_same" to be overridden
        eq = eq or function(a, b) return a == b end -- Use "==" as default definition of equality
        local first = pronunciation_lines[1][property]
        for _, pronunciation_line in ipairs(pronunciation_lines) do
            if not eq(pronunciation_line[property], first) then
                return first, false
            end
        end
        return first, true
    end

    -- Render overall output as text
    local output_lines = {}
    -- Check whether values for each property are all the same,
    -- in which case they can all be merged at the end of the template,
    -- instead of being duplicated per-pronunciation-line.
    local first_hyphenation, all_hyphenations_the_same = all_the_same("hyphenation")
    local first_syllabification, all_syllabifications_the_same = all_the_same("syllabification")
    local first_rhyme, all_rhymes_the_same = all_the_same("rhymes")
    local first_homophones, all_homophones_the_same = all_the_same("homophones", require(table_module).deepEquals)
    local first_audio, all_audio_the_same = all_the_same("audio", require(table_module).deepEquals)

    -- Generate text for each pronunciation line.
    for _, pronunciation_line in ipairs(pronunciation_lines) do
        -- Unpack data
        local ipa = pronunciation_line["ipa"]
        local term = pronunciation_line["term"]
        local ann = pronunciation_line["ann"]
        local q = pronunciation_line["q"]
        local qq = pronunciation_line["qq"]
        local l = pronunciation_line["l"]
        local ll = pronunciation_line["ll"]
        local audios = pronunciation_line["audio"]
        local rhymes = pronunciation_line["rhymes"]
        local homophones = pronunciation_line["homophones"]
        local hyphenation = pronunciation_line["hyphenation"]
        local syllabification = pronunciation_line["syllabification"]
        local ipa_text = format_ipa(ipa, q, qq, l, ll)
        local ann_text = get_anntext(term, ann)
        local out = {"* " .. ann_text .. ipa_text}
        if audios and not all_audio_the_same then
            for _, audio in ipairs(audios) do
                table.insert(out, "** " .. audio)
            end
        end
        if rhymes ~= "-" and not all_rhymes_the_same then
            local num_syllables = pronunciation_line["num_syllables"]
            local rhymes_text = format_rhymes(rhymes, {num_syllables})
            table.insert(out, "** " .. rhymes_text)
        end
        if homophones and not all_homophones_the_same then
            local homophones_text = format_homophones(homophones)
            table.insert(out, "** " .. homophones_text)
        end
        local syllabification_text = format_syllabification(syllabification)
        if syllabification == hyphenation and syllabification ~= "-" then
            if not (all_hyphenations_the_same and all_syllabifications_the_same) then
                table.insert(out, "** " .. syllabification_text)
            end
        else
            local hyphenation_text = format_hyphenation(hyphenation)
            if not all_syllabifications_the_same and syllabification ~= "-" then
                table.insert(out, "** " .. syllabification_text)
            end
            if not all_hyphenations_the_same and hyphenation ~= "-" then
                table.insert(out, "** " .. hyphenation_text)
            end
        end
        -- Produce output for one pronunciation line at a time
        table.insert(output_lines, table.concat(out, "\n"))
    end

    -- Group audios all together if they are all identical
    if all_audio_the_same and first_audio then
        for _, audio in ipairs(first_audio) do
            table.insert(output_lines, "* " .. audio)
        end
    end

    -- Group rhymes all together if they are all identical
    if all_rhymes_the_same and first_rhyme ~= "-" then
        -- Take all syllable counts for all pronunciation lines
        -- to inform the syllable count of the rhyme.
        local num_syllables = {}
        for _, line in ipairs(pronunciation_lines) do
            table.insert(num_syllables, line["num_syllables"])
        end
        local rhymes_text = format_rhymes(first_rhyme, num_syllables)
        table.insert(output_lines, "* " .. rhymes_text)
    end

    -- Group homophones all together if they are all identical
    if all_homophones_the_same and first_homophones then
        local homophones_text = format_homophones(first_homophones)
        table.insert(output_lines, "* " .. homophones_text)
    end

    -- If some hyphenations or syllabifications are absent, then the outermost text should not include these,
    -- rather they should have been appended to the relevant pronunciations lines above.
    if all_hyphenations_the_same and all_syllabifications_the_same and first_hyphenation == first_syllabification and first_hyphenation ~= "-" then
        local syllabification_text = format_syllabification(first_hyphenation)
        table.insert(output_lines, "* " .. syllabification_text)
    elseif first_hyphenation ~= first_syllabification then
        if all_syllabifications_the_same and first_syllabification ~= "-" then
            local syllabification_text = format_syllabification(first_syllabification)
            table.insert(output_lines, "* " .. syllabification_text)
        end
        if all_hyphenations_the_same and first_hyphenation ~= "-" then
            local hyphenation_text = format_hyphenation(first_hyphenation)
            table.insert(output_lines, "* " .. hyphenation_text)
        end
    end

    if request_rfap then
        table.insert(output_lines, frame:preprocess("{{rfap|bg}}"))
    end
    return table.concat(output_lines, "\n")
end
return export
3infwrt3y6rxhu8biiaakk2o27agf6i
234873
234872
2026-05-24T09:38:22Z
Lee
19
[[:en:Module:bg-pronunciation]] වෙතින් එක් සංශෝධනයක්
234872
Scribunto
text/plain
-- Table of functions exported by this module.
local export = {}
-- Short aliases for the Unicode-aware string helpers provided by Scribunto.
local substring = mw.ustring.sub
local rsubn = mw.ustring.gsub
local rmatch = mw.ustring.match
local rsplit = mw.text.split
local rlen = mw.ustring.len
-- U(codepoint) builds a string from a code point; it is used for the constants below.
local U = require("Module:string/char")
-- Language (Bulgarian) and script (Cyrillic) objects handed to the formatting modules.
local lang = require("Module:languages").getByCode("bg")
local script = require("Module:scripts").getByCode("Cyrl")
-- Names of modules that are only require()d / loadData()ed at the point of use.
local ipa_module = "Module:IPA"
local audio_module = "Module:audio"
local headword_data_module = "Module:headword/data"
local homophones_module = "Module:homophones"
local hyphenation_module = "Module:hyphenation"
local parameters_module = "Module:parameters"
local rhymes_module = "Module:rhymes"
local table_module = "Module:table"
local tracking_module = "Module:debug/track"
-- Combining marks used in respellings (grave, acute, breve, dot below) ...
local GRAVE = U(0x300)
local ACUTE = U(0x301)
local BREVE = U(0x306)
-- ... and characters used in the IPA output (stress marks, tie bar, "fronted" diacritic).
local PRIMARY = U(0x2C8)
local SECONDARY = U(0x2CC)
local TIE = U(0x361)
local FRONTED = U(0x31F)
local DOTUNDER = U(0x323)
-- U+2027 is the separator placed between syllables / hyphenation parts.
local HYPH = U(0x2027)
local BREAK_MARKER = "."
-- IPA vowel and consonant symbols, plus the bracketed character classes built from them.
-- Note that the consonant set also contains the palatalization mark and the tie bar.
local vowels = "aɤɔuɛiɐo"
local vowels_c = "[" .. vowels .. "]"
local cons = "bvɡdʒzjklɫwmnprstfxʃɣʲ" .. TIE
local cons_c = "[" .. cons .. "]"
-- Cyrillic consonant / vowel letter classes (both cases) used on spellings rather than IPA.
-- The consonant class additionally accepts "#" and "=".
-- NOTE(review): "#" and "=" are presumably single-character placeholders for digraphs — confirm against the hyphenation code.
local hcons_c = "[бвгджзйклмнпрстфхшщьчц#БВГДЖЗЙКЛМНПРСТФХШЩЬЧЦ=]"
local hvowels_c = "[аъоуеияѝюАЪОУЕИЯЍЮ]"
local capital_letters_c = "[БВГДЖЗЙКЛМНПРСТФХШЩЬЧЦАЪОУЕИЯЍЮ]"
-- Primary and secondary IPA stress marks, as a string and as a character class.
local accents = PRIMARY .. SECONDARY
local accents_c = "[" .. accents .. "]"
-- Single (lowercase, decomposed) characters that map to IPA sounds.
-- Used as a replacement table: every character of the term is looked up here, and
-- characters without an entry are left unchanged.
-- The affricates ц and ч are written with a tie bar; the soft sign and the letters ю/я
-- produce the palatalization mark ʲ; the grave and acute combining accents become the
-- secondary and primary stress marks respectively.
local phonetic_chars_map = {
["а"] = "a",
["б"] = "b",
["в"] = "v",
["г"] = "ɡ",
["д"] = "d",
["е"] = "ɛ",
["ж"] = "ʒ",
["з"] = "z",
["и"] = "i",
["й"] = "j",
["к"] = "k",
["л"] = "l",
["м"] = "m",
["н"] = "n",
["о"] = "ɔ",
["п"] = "p",
["р"] = "r",
["с"] = "s",
["т"] = "t",
["у"] = "u",
["ў"] = "w",
["ф"] = "f",
["х"] = "x",
["ц"] = "t" .. TIE .. "s",
["ч"] = "t" .. TIE .. "ʃ",
["ш"] = "ʃ",
["щ"] = "ʃt",
["ъ"] = "ɤ",
["ь"] = "ʲ",
["ю"] = "ʲu",
["я"] = "ʲa",
[GRAVE] = SECONDARY,
[ACUTE] = PRIMARY
}
-- Maps each voiced obstruent symbol to its voiceless counterpart.
-- NOTE(review): presumably applied for word-final / assimilatory devoicing — the code that uses it is outside this view.
local devoicing = {
["b"] = "p", ["d"] = "t", ["ɡ"] = "k",
["z"] = "s", ["ʒ"] = "ʃ",
["v"] = "f"
}
-- Maps each voiceless obstruent symbol to its voiced counterpart.
-- Not an exact inverse of `devoicing`: "x" maps to "ɣ", which has no entry above.
local voicing = {
["p"] = "b", ["t"] = "d", ["k"] = "ɡ",
["s"] = "z", ["ʃ"] = "ʒ", ["x"] = "ɣ",
["f"] = "v"
}
-- Prefixes where, if they occur at the beginning of the word and the stress is on the next syllable, we place the
-- syllable division directly after the prefix. For example, the default syllable-breaking algorithm would convert
-- безбра́чие to беˈзбрачие; but because it begins with без-, we convert it to безˈбрачие. Note that we don't (yet?)
-- convert измра́ to изˈмра instead of default измˈра, although we probably should.
--
-- Think twice before putting prefixes like на-, пре- and от- here, because of the existence of над-, пред-, and о-,
-- which are also prefixes.
--
-- The entries are spelled with IPA symbols (the output alphabet of phonetic_chars_map), not Cyrillic letters.
local IPA_prefixes = {"bɛz", "vɤz", "vɤzproiz", "iz", "naiz", "poiz", "prɛvɤz", "proiz", "raz"}
-- Wrapper around rsubn() that yields only the substituted string, dropping the match count.
local function rsub(term, foo, bar)
    -- The extra parentheses truncate the call to its first return value.
    return (rsubn(term, foo, bar))
end
-- Count how many times `pattern` matches in `term` (the second return value of rsubn()).
local function count_matches(term, pattern)
    -- select(2, ...) skips the substituted string; the parentheses keep a single value.
    return (select(2, rsubn(term, pattern, "")))
end
-- Keep applying the same rsub() substitution until the string stops changing,
-- then return the stable result.
local function rsub_repeatedly(term, foo, bar)
    local previous
    repeat
        previous = term
        term = rsub(previous, foo, bar)
    until term == previous
    return term
end
-- Return the single character of `str` at character position `index`.
local function char_at(str, index)
    local ch = substring(str, index, index)
    return ch
end
-- True when `str` begins with `substr` (compared by characters, not bytes).
local function starts_with(str, substr)
    local prefix_length = rlen(substr)
    local head = substring(str, 1, prefix_length)
    return head == substr
end
-- Number of Cyrillic vowel letters (hvowels_c) in `word`.
local function count_vowels(word)
    local _, total = rsubn(word, hvowels_c, "")
    return total
end
-- Number of capital Cyrillic letters (capital_letters_c) in `word`.
local function count_capital_letters(word)
    local _, total = rsubn(word, capital_letters_c, "")
    return total
end
-- Number of primary and secondary stress marks (accents_c) in an IPA string.
local function count_accents(ipa)
    local _, total = rsubn(ipa, accents_c, "")
    return total
end
-- Number of IPA vowel symbols (vowels_c) in an IPA string.
local function count_ipa_vowels(ipa)
    local _, total = rsubn(ipa, vowels_c, "")
    return total
end
-- Strip respelling-only notation from `text`: full stops, dot-below marks, and the
-- letter ў/Ў (replaced by у/У). When `remove_grave` is truthy, grave accents are removed
-- too (annotations drop them; phonetic respellings may keep them).
function export.remove_pron_notations(text, remove_grave)
    local cleaned = rsub(text, "[." .. DOTUNDER .. "]", "")
    cleaned = rsub(cleaned, "ў", "у")
    cleaned = rsub(cleaned, "Ў", "У")
    if not remove_grave then
        return cleaned
    end
    -- Decompose so the grave is a separate combining character, delete it, recompose.
    local decomposed = mw.ustring.toNFD(cleaned)
    return mw.ustring.toNFC(rsub(decomposed, GRAVE, ""))
end
-- Convert a respelled term into a phonetic transcription string (without surrounding brackets).
--
-- term: either the respelling as a string, or a table with an `args` field (frame-like), in which case the
--       respelling is taken from args[1] and `endschwa` from args.endschwa.
-- endschwa: if truthy, a word-final "a" or "at" (optionally carrying the PRIMARY mark) is turned into "ɤ".
--
-- Raises an error if the term contains a grave accent but no acute accent.
--
-- The processing order matters: the term is lowercased and NFD-decomposed, mapped character by character through
-- phonetic_chars_map, wrapped in "#" word-boundary markers, then the stress mark is moved to the syllable boundary,
-- unstressed vowels are reduced, and finally consonant assimilations are applied before the "#" markers are removed.
function export.toIPA(term, endschwa)
if type(term) == "table" then -- called from a template or a bot
endschwa = term.args.endschwa
term = term.args[1]
end
-- Keep the untouched input for error messages and for the vowel count used in vowel reduction below.
local origterm = term
term = mw.ustring.toNFD(mw.ustring.lower(term))
term = rsub(term, "у" .. BREVE, "ў") -- recompose ў
term = rsub(term, "и" .. BREVE, "й") -- recompose й
if term:find(GRAVE) and not term:find(ACUTE) then
error("Use acute accent, not grave accent, for primary stress: " .. origterm)
end
-- allow DOTUNDER to signal same as endschwa=1
term = rsub(term, "а(" .. accents_c .. "?)" .. DOTUNDER, "ъ%1")
term = rsub(term, "я(" .. accents_c .. "?)" .. DOTUNDER, "ʲɤ%1")
-- Map every character through phonetic_chars_map (a table replacement).
term = rsub(term, ".", phonetic_chars_map)
-- Mark word boundaries
term = rsub(term, "(%s+)", "#%1#")
term = "#" .. term .. "#"
-- Convert verbal and definite endings
if endschwa then
term = rsub(term, "a(" .. PRIMARY .. "?t?#)", "ɤ%1")
end
-- Change ʲ to j after vowels or word-initially
term = rsub(term, "([" .. vowels .. "#]" .. accents_c .. "?)ʲ", "%1j")
-------------------- Move stress ---------------
-- First, move leftwards over the vowel.
term = rsub(term, "(" .. vowels_c .. ")(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over j or soft sign.
term = rsub(term, "([jʲ])(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over a single consonant.
term = rsub(term, "(" .. cons_c .. ")(" .. accents_c .. ")", "%2%1")
-- Then, move leftwards over Cl/Cr combinations where C is an obstruent (NOTE: IPA ɡ).
term = rsub(term, "([bdɡptkxfv]" .. ")(" .. accents_c .. ")([rl])", "%2%1%3")
-- Then, move leftwards over kv/gv (NOTE: IPA ɡ).
term = rsub(term, "([kɡ]" .. ")(" .. accents_c .. ")(v)", "%2%1%3")
-- Then, move leftwards over sC combinations, where C is a stop or resonant (NOTE: IPA ɡ).
term = rsub(term, "([sz]" .. ")(" .. accents_c .. ")([bdɡptkvlrmn])", "%2%1%3")
-- Then, move leftwards over affricates not followed by a consonant.
term = rsub(term, "([td]" .. TIE .. "?)(" .. accents_c .. ")([szʃʒ][" .. vowels .. "ʲ])", "%2%1%3")
-- If we ended up in the middle of a tied affricate, move to its right.
term = rsub(term, "(" .. TIE .. ")(" .. accents_c .. ")(" .. cons_c .. ")", "%1%3%2")
-- Then, move leftwards over any remaining consonants at the beginning of a word.
term = rsub(term, "#(" .. cons_c .. "*)(" .. accents_c .. ")", "#%2%1")
-- Then correct for known prefixes.
for _, prefix in ipairs(IPA_prefixes) do
-- Split the prefix into everything before its trailing consonant run and that consonant run itself.
local prefix_prefix, prefix_final_cons = rmatch(prefix, "^(.-)(" .. cons_c .. "*)$")
if prefix_final_cons then
-- Check for accent moved too far to the left into a prefix, e.g. безбрачие accented as беˈзбрачие instead
-- of безˈбрачие
term = rsub(term, "#(" .. prefix_prefix .. ")(" .. accents_c .. ")(" .. prefix_final_cons .. ")", "#%1%3%2")
end
end
-- If the previous substitution resulted in a stress occurring immediately after a consonant
-- but before a palatalizer mark, then put the stress before the consonant.
term = rsub(term, "(" .. cons_c .. ")" .. "(" .. accents_c .. ")" .. "ʲ", "%2%1ʲ")
-- Finally, if there is an explicit syllable boundary in the cluster of consonants where the stress is, put it there.
-- First check for accent to the right of the explicit syllable boundary.
term = rsub(term, "(" .. cons_c .. "*)%.(" .. cons_c .. "*)(" .. accents_c .. ")(" .. cons_c .. "*)", "%1%3%2%4")
-- Then check for accent to the left of the explicit syllable boundary.
term = rsub(term, "(" .. cons_c .. "*)(" .. accents_c .. ")(" .. cons_c .. "*)%.(" .. cons_c .. "*)", "%1%3%2%4")
-- Finally, remove any remaining syllable boundaries.
term = rsub(term, "%.", "")
-------------------- Vowel reduction (in unstressed syllables) ---------------
-- Map a, ɤ -> ɐ and ɔ, u -> o throughout the given string; other characters are left alone.
local function reduce_vowel(vowel)
return rsub(vowel, "[aɔɤu]", { ["a"] = "ɐ", ["ɔ"] = "o", ["ɤ"] = "ɐ", ["u"] = "o" })
end
-- Reduce all vowels before the stress, except if the word has no accent at all. (FIXME: This is presumably
-- intended for single-syllable words without accents, but if the word is multisyllabic without accents,
-- presumably all vowels should be reduced.)
-- Note that the check below counts the vowels of the whole original input, not of the individual word.
term = rsub(term, "(#[^#" .. accents .. "]*)(.-#)", function(a, b)
if count_vowels(origterm) <= 1 then
return a .. b
else
return reduce_vowel(a) .. b
end
end)
-- Reduce all vowels after the accent except the first vowel after the accent mark (which is stressed).
term = rsub(term, "(" .. accents_c .. "[^aɛiɔuɤ#]*[aɛiɔuɤ])([^#" .. accents .. "]*)", function(a, b)
return a .. reduce_vowel(b)
end)
-------------------- Vowel assimilation to adjacent consonants (fronting/raising) ---------------
term = rsub(term, "([ʃʒʲj])([aouɤ])", "%1%2" .. FRONTED)
-- Hard l
term = rsub_repeatedly(term, "l([^ʲɛi])", "ɫ%1")
-- Voicing assimilation
-- A run of voiced obstruents is devoiced before a voiceless obstruent or a word boundary ...
term = rsub(term, "([bdɡzʒv" .. TIE .. "]*)(" .. accents_c .. "?[ptksʃfx#])", function(a, b)
return rsub(a, ".", devoicing) .. b end)
-- ... and a run of voiceless obstruents is voiced before a voiced obstruent (v is not a trigger here).
term = rsub(term, "([ptksʃfx" .. TIE .. "]*)(" .. accents_c .. "?[bdɡzʒ])", function(a, b)
return rsub(a, ".", voicing) .. b end)
-- Nasal place assimilation: n -> ŋ before ɡ/k, m -> ɱ before f/v.
term = rsub(term, "n(" .. accents_c .. "?[ɡk]+)", "ŋ%1")
term = rsub(term, "m(" .. accents_c .. "?[fv]+)", "ɱ%1")
-- Sibilant assimilation
term = rsub(term, "[sz](" .. accents_c .. "?[td]?" .. TIE .. "?)([ʃʒ])", "%2%1%2")
-- Reduce consonant clusters
term = rsub(term, "([szʃʒ])[td](" .. accents_c .. "?)([tdknml])", "%2%1%3")
-- Strip hashes
term = rsub(term, "#", "")
return term
end
----Syllabification code----
-- Authorship: Chernorizets
-- Lua port: Kiril Kovachev
-- Build a set (value -> true) from the values stored in table `t`.
local function set_of(t)
	local members = {}
	local key, item = next(t)
	while key ~= nil do
		members[item] = true
		key, item = next(t, key)
	end
	return members
end
-- Membership test for sets built by set_of(): true only when the stored flag is exactly `true`.
local function in_set(set, value)
	local flag = set[value]
	return flag == true
end
-- Classification of letters by phonetic category
-- Only lowercase Cyrillic letters are listed; the callers visible in this section lowercase their input before
-- looking letters up. "щ", "ь" and the digraph "дж" are deliberately absent here: get_sonority_model() handles
-- them as special cases.
local vowels_syllab = set_of {"а", "ъ", "о", "у", "е", "и", "ю", "я"}
local sonorants = set_of { "л", "м", "н", "р", "й", "ў"}
local stops = set_of {"б", "п", "г", "к", "д", "т"}
local fricatives = set_of {"в", "ф", "ж", "ш", "з", "с", "х"}
local affricates = set_of {"ч", "ц"}
-- True if `ch` is listed in vowels_syllab.
local function is_vowel(ch)
	return vowels_syllab[ch] == true
end
-- True if `ch` is the soft sign "ь".
local function is_palatalizer(ch)
	local soft_sign = "ь"
	return ch == soft_sign
end
-- True if `ch` is listed in sonorants.
local function is_sonorant(ch)
	return sonorants[ch] == true
end
-- True if `ch` is listed in stops.
local function is_stop(ch)
	return stops[ch] == true
end
-- True if `ch` is listed in fricatives.
local function is_fricative(ch)
	return fricatives[ch] == true
end
-- True if `ch` is listed in affricates.
local function is_affricate(ch)
	return affricates[ch] == true
end
--[[
Sonority objects:
Sonority objects take the form of a table with the following attributes:
{
rank (int): the numerical value representing the position of the sound in the sonority hierarchy;
first_index (int): the index of the first letter that makes up the sound within the word.
The index of the first letter in a word with this sonority rank.
The affricates "дж" and "дз" are represented by two letters each, but
for sonority purposes they function as a "unit", hence we just need
the index of the first letter of the affricate.
}
--]]
-- Construct a sonority object holding a sonority rank and the index of the sound's first letter.
local function new_sonority(rank, first_index)
	local sonority = {}
	sonority.rank = rank
	sonority.first_index = first_index
	return sonority
end
-- Sonority rank of a single letter: fricative 1, stop or affricate 2, sonorant 3, vowel 4, anything else 0.
local function get_sonority_rank(ch)
	local rank = 0
	if is_fricative(ch) then
		rank = 1
	elseif is_stop(ch) or is_affricate(ch) then
		rank = 2
	elseif is_sonorant(ch) then
		rank = 3
	elseif is_vowel(ch) then
		rank = 4
	end
	return rank
end
-- Build the list of sonority objects for the letters of `word` in the half-open index range
-- [start_idx, end_idx). The result is a plain sequence: {[1] = sonority object, [2] = sonority object, ...}
-- (see new_sonority for the object layout).
local function get_sonority_model(word, start_idx, end_idx)
	local lowered = mw.ustring.lower(word)
	local model = {}
	local pos = start_idx
	while pos < end_idx do
		local letter = char_at(lowered, pos)
		-- How many letters this sound consumes; 2 only for the digraph 'дж'.
		local step = 1
		if letter == "щ" then
			-- One letter representing 2 sounds - decompose it; both share the same index.
			model[#model + 1] = new_sonority(get_sonority_rank("ш"), pos)
			model[#model + 1] = new_sonority(get_sonority_rank("т"), pos)
		elseif letter == "д" then
			-- Look one letter ahead (a space stands in when 'д' is the last letter of the range).
			local following = " "
			if pos ~= end_idx - 1 then
				following = char_at(lowered, pos + 1)
			end
			if following == "ж" then
				-- 'дж' counts as a single affricate (rank 2) anchored at the 'д'.
				model[#model + 1] = new_sonority(2, pos)
				step = 2
			else
				model[#model + 1] = new_sonority(get_sonority_rank("д"), pos)
			end
		elseif not is_palatalizer(letter) then
			-- 'ь' contributes nothing, since it doesn't change the sonority.
			model[#model + 1] = new_sonority(get_sonority_rank(letter), pos)
		end
		pos = pos + step
	end
	return model
end
-- Locate a user-supplied break marker (BREAK_MARKER, searched as plain text) in `word`.
-- The search starts at range_start; a hit at or beyond range_end does not count.
-- Returns the marker's index, or -1 if the range is empty or no marker lies inside it.
local function find_forced_break(word, range_start, range_end)
	if range_start >= range_end then
		return -1
	end
	local marker_pos = mw.ustring.find(word, BREAK_MARKER, range_start, true)
	if not marker_pos or marker_pos >= range_end then
		return -1
	end
	return marker_pos
end
-- Remove every "." from the segment.
local function strip_forced_breaks(segment)
	local stripped = rsub(segment, "[.]", "")
	return stripped
end
---- Morphological prefix handling
--[[
This code brings morphological prefix awareness to syllabification.
This is necessary, because following the principle of rising sonority
alone fails to determine syllable boundaries correctly in some cases
— that is, when certain prefixes should be kept together as a first syllable.
]]
--[[
Affected prefixes. Each of them ends in a consonant that can be followed
by another consonant of a higher sonority in some words. In such cases,
naive syllable breaking would chop off the prefix's last consonant, and
glue it to the onset of the next syllable.
]]
-- find_separation_points() tests every entry against the word, so a word may match more than one prefix
-- (e.g. both a compound prefix and a shorter prefix it begins with).
local prefixes = {
-- без- family
"без",
-- из- family
"безиз", "наиз", "поиз", "произ", "преиз", "неиз", "из",
-- въз- family
"безвъз", "превъз", "невъз", "въз",
-- раз- family
"безраз", "предраз", "пораз", "нараз", "прераз", "нераз", "раз",
-- от- family
"неот", "поот", "от",
-- ending in fricatives
"екс", "таз", "дис",
-- ending in stops
"пред"
}
--[[
Prefix separation points (computed by find_separation_points below, which uses
followed_by_higher_sonority_cons as its test).
A separation point is the 1-based index of the first character
after a morphological prefix.
word: the word to check for prefixes
Returns a list with one separation point per matching prefix whose final
consonant is followed by a consonant of higher sonority. The list is empty
if no prefix matches; other prefix boundaries are left to the sonority model.
]]
-- True if the character right after `prefix` in `word` is a non-vowel whose sonority rank is strictly higher
-- than that of the prefix's last character. Both arguments are strings and are compared in lowercase.
local function followed_by_higher_sonority_cons(prefix, word)
	local lc_prefix = mw.ustring.lower(prefix)
	local lc_word = mw.ustring.lower(word)
	local prefix_len = rlen(lc_prefix)
	local next_char = char_at(lc_word, prefix_len + 1)
	-- Prefixes followed by vowels do, in fact, get broken up.
	if is_vowel(next_char) then
		return false
	end
	local last_char = char_at(lc_prefix, prefix_len)
	return get_sonority_rank(next_char) > get_sonority_rank(last_char)
end
-- Collect, for every known prefix that `word` starts with and that is followed by a consonant of higher
-- sonority, the index of the first character after that prefix.
local function find_separation_points(word)
	local lowered = mw.ustring.lower(word)
	local points = {}
	for _, candidate in pairs(prefixes) do
		local applies = starts_with(lowered, candidate)
			and followed_by_higher_sonority_cons(candidate, lowered)
		if applies then
			points[#points + 1] = rlen(candidate) + 1
		end
	end
	return points
end
---- Main syllabification code
---Context objects:
--[[ encoded as a table like
{
word (string),
prefix_separation_points (table[int])
}
]]
-- Construct a context object pairing a word with its list of prefix separation points.
local function new_context(word, pos)
	local ctx = {}
	ctx.word = word
	ctx.prefix_separation_points = pos
	return ctx
end
--[[
Consonant clusters that exhibit rising sonority, but should be
broken up regardless to produce natural-sounding syllables.
The breakpoint for clusters of 3 or more consonants can vary –
here we provide a zero-based offset within the cluster for each.
]]
-- Keys are whole consonant clusters; the value is added to the index of the cluster's first letter by
-- fixup_syllable_onset() to obtain the onset of the next syllable.
local sonority_exception_break = {
["км"] = 1, ["гм"] = 1, ["дм"] = 1, ["вм"] = 1,
["зм"] = 1, ["цм"] = 1, ["чм"] = 1,
["дн"] = 1, ["вн"] = 1, ["тн"] = 1, ["чн"] = 1,
["кн"] = 1, ["гн"] = 1, ["цн"] = 1,
["зд"] = 1, ["зч"] = 1, ["зц"] = 1,
["вк"] = 1, ["вг"] = 1, ["дл"] = 1, ["жд"] = 1,
["згн"] = 1, ["здн"] = 2, ["вдж"] = 1
}
-- Clusters that are kept together: when the whole cluster between two vowels equals one of these,
-- fixup_syllable_onset() starts the next syllable at the beginning of the cluster.
local sonority_exception_keep = {
"ств", "св", "вс"
}
-- Returns "" for a nil word; otherwise passes the word through two substitutions that were meant to trim
-- leading and trailing whitespace.
-- NOTE(review): the patterns use regex-style "\s" and a trailing "^". In Lua pattern syntax the escape character
-- is "%" and the end anchor is "$", so (assuming rsubn() follows Lua/mw.ustring pattern rules) these only match
-- a literal backslash followed by "s" characters and in practice never fire. Do not simply switch to
-- "^%s+" / "%s+$": tokenize_words() keeps the trailing separator (space or hyphen) inside each token and
-- export.syllabify() joins the results with "", so real trimming here would drop the spaces between words.
local function normalize_word(word)
if word == nil then return "" end
word = rsub(rsub(word, "^\\s+", ""), "\\s+^", "") -- Strip spaces
return word
end
-- Clean a finished syllable for display: drop forced-break dots and fold ў/Ў into у/У.
local function normalize_syllable(syllable)
	local without_breaks = strip_forced_breaks(syllable)
	local folded = rsub(rsub(without_breaks, "ў", "у"), "Ў", "У")
	return folded
end
-- Find where a consonant cluster stops rising in sonority.
-- sonorities: non-empty sequence of sonority objects ({rank=..., first_index=...}) in word order.
-- Returns the first_index of the first object whose rank is not strictly greater than its predecessor's,
-- or the first_index of the first object if the ranks rise throughout.
local function find_rising_sonority_break(sonorities)
	local prev_rank = -1
	-- The scan is order-sensitive, so iterate with ipairs: the traversal order of pairs() is unspecified.
	for _, curr in ipairs(sonorities) do
		if curr.rank <= prev_rank then
			-- Found a break.
			return curr.first_index
		end
		prev_rank = curr.rank
	end
	-- There was no rising sonority break. Start syllable at first index.
	return sonorities[1].first_index
end
-- Case-insensitively check whether the slice of `str` covering [start_idx, end_idx) is exactly `substr`.
-- A slice whose length differs from that of `substr` never matches.
local function matches(str, substr, start_idx, end_idx)
	local span = end_idx - start_idx
	if span ~= rlen(substr) then
		return false
	end
	local haystack = mw.ustring.lower(str)
	local needle = mw.ustring.lower(substr)
	for offset = 0, span - 1 do
		if char_at(haystack, start_idx + offset) ~= char_at(needle, offset + 1) then
			return false
		end
	end
	return true
end
-- Adjust the tentative syllable onset found by the rising-sonority rule.
-- ctx: context object
-- left_vowel, right_vowel: integer indices of the vowels surrounding the consonant cluster
-- sonority_break: integer index of the tentative onset
-- Returns the index at which the next syllable starts. The checks are tried in order and the first hit wins.
local function fixup_syllable_onset(ctx, left_vowel, sonority_break, right_vowel)
	local lowered = mw.ustring.lower(ctx.word)
	local cluster_start = left_vowel + 1

	-- 'щр' is a syllable onset when in front of a vowel.
	-- 'щ' + another sonorant technically rises in sonority, but syllables like щнV, щлV are unnatural,
	-- so there the sonorant alone becomes the onset of the next syllable.
	if char_at(lowered, right_vowel - 2) == "щ" then
		local before_vowel = char_at(lowered, right_vowel - 1)
		if before_vowel == "р" then
			return right_vowel - 2
		elseif is_sonorant(before_vowel) then
			return right_vowel - 1
		end
	end

	-- Clusters that must stay together: the onset is the beginning of the cluster.
	for _, kept in pairs(sonority_exception_keep) do
		if matches(lowered, kept, cluster_start, right_vowel) then
			return cluster_start
		end
	end

	-- Clusters that are split even though they obey rising sonority.
	for broken, offset in pairs(sonority_exception_break) do
		if matches(lowered, broken, cluster_start, right_vowel) then
			return cluster_start + offset
		end
	end

	-- A morphological prefix boundary strictly between the two vowels overrides the sonority break.
	for _, point in pairs(ctx.prefix_separation_points) do
		if point > left_vowel and point < right_vowel then
			return point
		end
	end
	return sonority_break
end
-- Determine where the syllable containing the vowel at `right_vowel` begins.
-- ctx: context object
-- left_vowel, right_vowel: integer indices of two consecutive vowels
local function find_next_syllable_onset(ctx, left_vowel, right_vowel)
	local first_cons = left_vowel + 1
	local cluster_size = right_vowel - first_cons
	-- Adjacent vowels: the syllable starts on the right vowel itself.
	if cluster_size == 0 then
		return right_vowel
	end
	-- A forced break inside the cluster wins; the onset is the character after the marker.
	local forced = find_forced_break(ctx.word, first_cons, right_vowel)
	if forced ~= -1 then
		return forced + 1
	end
	-- A lone consonant between two vowels starts the syllable.
	if cluster_size == 1 then
		return first_cons
	end
	-- Two or more consonants: take the point where sonority stops rising as the tentative onset,
	-- then apply the exceptions that avoid unnatural-sounding syllables.
	local model = get_sonority_model(ctx.word, first_cons, right_vowel)
	local tentative = find_rising_sonority_break(model)
	return fixup_syllable_onset(ctx, left_vowel, tentative, right_vowel)
end
-- Remove ACUTE, GRAVE and DOTUNDER marks from `term`.
local function deaccent(term)
	local marks = "[" .. ACUTE .. GRAVE .. DOTUNDER .. "]"
	return rsub(term, marks, "")
end
-- Like deaccent(), but first folds ў/Ў into у/У.
local function deaccent_all(term)
	local folded = rsub(rsub(term, "ў", "у"), "Ў", "У")
	return deaccent(folded)
end
-- Split a word into syllables. Returns a list (table) of strings.
local function syllabify_poly(word)
	local ctx = new_context(word, find_separation_points(word))
	local pieces = {}
	local last_vowel = nil -- index of the most recent vowel, nil until the first one is seen
	local onset = 1 -- index where the syllable currently being collected starts
	for pos = 1, rlen(word) do
		if is_vowel(mw.ustring.lower(char_at(word, pos))) then
			if last_vowel ~= nil then
				-- Between the previous vowel and this one lies a syllable break; the first
				-- character after the break starts a new syllable.
				local next_onset = find_next_syllable_onset(ctx, last_vowel, pos)
				pieces[#pieces + 1] = substring(word, onset, next_onset - 1)
				onset = next_onset
			end
			last_vowel = pos
		end
	end
	-- Whatever remains forms the last syllable.
	pieces[#pieces + 1] = substring(word, onset)
	return pieces
end
-- Syllabify a single word and return its syllables joined with HYPH.
-- Returns "" for an empty (or nil) word; a word with at most one vowel is a single syllable.
function export.syllabify_word(word)
	local norm = normalize_word(word)
	if rlen(norm) == 0 then
		return ""
	end
	local syllables
	if count_vowels(norm) <= 1 then
		syllables = { norm }
	else
		syllables = syllabify_poly(norm)
	end
	local cleaned = {}
	for idx, syl in pairs(syllables) do
		cleaned[idx] = normalize_syllable(syl)
	end
	return table.concat(cleaned, HYPH)
end
-- Split `term` into tokens at "-" and " ". Each separator stays attached to the end of the token before it,
-- so concatenating the tokens reproduces the original term.
local function tokenize_words(term)
	local tokens = {}
	local total = rlen(term)
	local token_start = 1
	local pos = 1
	while pos <= total do
		local ch = char_at(term, pos)
		if ch == "-" or ch == " " then
			tokens[#tokens + 1] = substring(term, token_start, pos)
			token_start = pos + 1
		end
		pos = pos + 1
	end
	-- The tail after the last separator (possibly empty).
	tokens[#tokens + 1] = substring(term, token_start, total)
	return tokens
end
-- Syllabify a (possibly multi-word) term.
-- Accent marks are removed first; the term is then split at spaces and hyphens, each token is syllabified on its
-- own, and the results are concatenated in their original order. The separators travel inside the tokens
-- (see tokenize_words), which is why the pieces are joined with an empty string.
function export.syllabify(term)
	term = deaccent(term)
	local words = tokenize_words(term)
	local out = {}
	-- The output depends on token order, so iterate with ipairs: the traversal order of pairs() is unspecified.
	for _, word in ipairs(words) do
		table.insert(out, export.syllabify_word(word))
	end
	return table.concat(out, "")
end
---Hyphenation
-- Hyphenate a word from its existing syllabification
-- syllabification: string whose syllables are separated by HYPH.
-- Returns the string with the HYPH separators moved or removed by the substitutions below; each substitution is
-- repeated until it no longer changes the string, and their order matters.
-- NOTE(review): hvowels_c and hcons_c are defined outside this section; presumably they are character classes for
-- vowels and consonants respectively - confirm.
function export.hyphenate(syllabification)
-- Source: http://logic.fmi.uni-sofia.bg/hyphenation/hyph-bg.html#hyphenation-rules-between-1983-and-2012
-- Also note: the rules from 2012 onward, which encode the modern standard, are entirely
-- backwards-compatible with the previous standard. Thus our code can generate valid 2012
-- hyphenations despite only explicitly implementing the older (1983) rules.
---Pre-processing----
local word = deaccent(syllabification)
-- Temporarily replace "дж" right after a separator, at the end of the string and at the start of the string by
-- the single placeholder "#", so that it is not seen as two characters by the patterns below.
word = rsub_repeatedly(word, HYPH .. "дж", HYPH .. "#")
word = rsub_repeatedly(word, "дж$", "#")
word = rsub_repeatedly(word, "^дж", "#")
-- V-CC...  ->  VC-C...  (the characters after the moved one are matched with ь/Ь removed from hcons_c)
word = rsub_repeatedly(word, "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hcons_c .. ")(" .. rsub(hcons_c, "[ьЬ]", "") .. "+)", "%1%2" .. HYPH .. "%3")
-- CC...-  ->  C-C...  (the first character is matched with й/Й removed from hcons_c)
word = rsub_repeatedly(word, "(" .. rsub(hcons_c, "[йЙ]", "") .. ")(" .. hcons_c .. "+)" .. HYPH, "%1" .. HYPH .. "%2")
-- Remove the separator after a single string-initial vowel ...
word = rsub_repeatedly(word, "^(" .. hvowels_c .. ")" .. HYPH, "%1")
-- ... and the separator before a single string-final vowel.
word = rsub_repeatedly(word, HYPH .. "(" .. hvowels_c .. ")$", "%1")
-- V-V-V  ->  VV-V
word = rsub_repeatedly(word, "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hvowels_c .. ")", "%1%2" .. HYPH .. "%3")
-- -V-C  ->  -VC
word = rsub_repeatedly(word, HYPH .. "(" .. hvowels_c .. ")" .. HYPH .. "(" .. hcons_c .. ")", HYPH .. "%1%2")
-- Restore the "дж" placeholders.
word = rsub_repeatedly(word, "#", "дж")
return word
end
-- Convenience wrapper (used in the test suite): syllabify `word`, then hyphenate that syllabification.
function export.hyphenate_total(word)
	return export.hyphenate(export.syllabify(word))
end
-- Build the bolded annotation prefix shown before a pronunciation.
-- ann == "1" or "y": annotate with the term itself, stripped of pronunciation notation (including grave accents);
-- any other truthy ann: use it verbatim; no ann: return "".
local function get_anntext(term, ann)
	if not ann then
		return ""
	end
	local shown = ann
	if ann == "1" or ann == "y" then
		-- remove secondary stress annotations
		shown = export.remove_pron_notations(term, true)
	end
	return "'''" .. shown .. "''': "
end
-- Captions passed to the hyphenation formatter: format_hyphenation() uses HYPHENATION_LABEL unless another label
-- is given, and format_syllabification() passes SYLLABIFICATION_LABEL.
local HYPHENATION_LABEL = "Hyphenation<sup>([[Appendix:Bulgarian hyphenation#Hyphenation|key]])</sup>"
local SYLLABIFICATION_LABEL = "Syllabification<sup>([[Appendix:Bulgarian hyphenation#Syllabification|key]])</sup>"
-- Render a HYPH-separated hyphenation string through the hyphenation module.
-- label: optional caption; HYPHENATION_LABEL is used when it is omitted.
local function format_hyphenation(hyphenation, label)
	-- Accent marks are removed before the string is split into its parts.
	local parts = rsplit(deaccent(hyphenation), HYPH)
	local caption = label or HYPHENATION_LABEL
	local data = {
		lang = lang,
		hyphs = { { hyph = parts } },
		sc = script,
		caption = caption,
	}
	return require(hyphenation_module).format_hyphenations(data)
end
-- Render a syllabification: same formatting as a hyphenation, but captioned with SYLLABIFICATION_LABEL.
local function format_syllabification(syllabification)
	local label = SYLLABIFICATION_LABEL
	return format_hyphenation(syllabification, label)
end
-- Render syllabification and hyphenation: one line when they coincide, two lines otherwise.
-- indentation: number of "*" characters placed before the second line.
-- syllabification / hyphenation: optional overrides; each defaults to the automatically computed value, and the
-- value "-" suppresses the corresponding line.
-- Users must put a * (or **) before the template usage themselves.
local function render_bg_hyph(term, indentation, syllabification, hyphenation)
	syllabification = syllabification or export.syllabify(term)
	hyphenation = hyphenation or export.hyphenate(syllabification)

	if syllabification == hyphenation then
		if syllabification == "-" then
			return ""
		end
		return format_syllabification(syllabification)
	end

	-- Both texts are formatted up front, even if one of them ends up suppressed.
	local syllabification_text = format_syllabification(syllabification)
	local hyphenation_text = format_hyphenation(hyphenation)
	if hyphenation == "-" then
		-- The two values differ, so the syllabification is not "-" here.
		return syllabification_text
	end
	if syllabification == "-" then
		return hyphenation_text
	end
	return syllabification_text .. "\n" .. mw.ustring.rep("*", indentation) .. " " .. hyphenation_text
end
-- Entry point to {{bg-hyph}}
-- Parameter 1 is the term (defaulting to an example word in the Template namespace, else to the page title);
-- indent is the indentation level passed on to render_bg_hyph (default 1).
function export.show_hyphenation(frame)
	local params = {
		[1] = {},
		["indent"] = { type = "number" }
	}
	local title = mw.title.getCurrentTitle()
	local args = require(parameters_module).process(frame:getParent().args, params)
	local term = args[1]
	if not term then
		if title.nsText == "Template" then
			term = "при́мер"
		else
			term = title.text
		end
	end
	return render_bg_hyph(term, args["indent"] or 1)
end
-- Extract the rhyme (a suffix of the transcription) from an IPA string as produced by toIPA().
-- FRONTED marks are removed first. The string is scanned from its end towards its start:
--   * if an accent mark is found, the rhyme starts at the first vowel after it, or - for words stressed on a final
--     open syllable - at the consonant (or affricate) preceding that vowel;
--   * if no accent mark is found and the string has exactly one vowel, a rhyme is derived from that vowel;
--   * otherwise nil is returned.
function export.get_rhymes(ipa)
ipa = rsub(ipa, FRONTED, "")
local length = rlen(ipa)
local i = length
-- Number of vowels met so far while scanning from the right.
local vowels_seen = 0
-- Whether a consonant was met before (i.e. to the right of) any vowel.
local final_consonant_found = false
-- March until accent is found
while i > 0 do
-- Track vowel or final consonant if found
if vowels_seen == 0 and rmatch(char_at(ipa, i), cons_c) then
final_consonant_found = true
end
if rmatch(char_at(ipa, i), vowels_c) then
vowels_seen = vowels_seen + 1
end
if rmatch(char_at(ipa, i), accents_c) then
-- Note whether the string ends in vowel + accent + vowel
local final_vowel_cluster = rmatch(ipa, vowels_c .. accents_c .. vowels_c .. "$")
-- March until the vowel first following the accent is found
while i <= length and not rmatch(char_at(ipa, i), vowels_c) do
i = i + 1
end
-- March back if only a single word-final vowel was previously spotted –
-- this corresponds to final-syllable-stressed words, whose rhyme
-- needs to include a consonant according to Bulgarian rhyming rules.
if vowels_seen <= 1 and not final_consonant_found and not final_vowel_cluster then
-- The palatalisation mark ʲ is removed from the consonant pattern, so it does not stop the march.
while i > 1 and not rmatch(char_at(ipa, i), rsub(cons_c, "ʲ", "")) do
i = i - 1
end
-- Account for affricates (note: this can only occur in
-- consonant-rhyme, i.e. final-stressed words)
if i > 1 and char_at(ipa, i-1) == TIE then
-- If a tie is present, there must be a letter before it as well.
i = i - 2
elseif i > 1 and char_at(ipa, i) == "ʒ" and char_at(ipa, i-1) == "d" then
-- Treat [dʒ] sequence as an affricate – this can have some edge cases.
-- In future, the module should distinguish [d.ʒ] and [d͡ʒ].
i = i - 1
end
end
return substring(ipa, i)
end
i = i - 1
end
-- No accent mark anywhere: only strings with exactly one vowel get a rhyme.
local n_vowels = count_ipa_vowels(ipa)
if n_vowels == 1 then
i = length
if rmatch(char_at(ipa, i), cons_c) then
-- Ends in a consonant: the rhyme starts at the vowel.
while i > 1 and not rmatch(char_at(ipa, i), vowels_c) do
i = i - 1
end
else
-- Otherwise: the rhyme starts at the nearest consonant to the left (ʲ excluded).
while i > 1 and not rmatch(char_at(ipa, i), rsub(cons_c, "ʲ", "")) do
i = i - 1
end
end
-- Include the first half of a tied affricate.
if i > 1 and char_at(ipa, i - 1) == TIE then
i = i - 2
end
return substring(ipa, i)
end
return nil
end
-- Render one IPA transcription as wikitext, wrapped in narrow-transcription brackets, with optional
-- qualifiers (q, qq) and accent labels (a, aa).
local function format_ipa(ipa, q, qq, a, aa)
	local bracketed = "[" .. ipa .. "]"
	return require(ipa_module).format_IPA_full({
		lang = lang,
		items = { { pron = bracketed } },
		q = q,
		qq = qq,
		a = a,
		aa = aa,
	})
end
-- Template entry point: render the IPA transcription of a term, optionally preceded by an annotation.
-- The term is taken from parameter 1, else from pagename=, else an example word is used in the Template
-- namespace, else the page name from the headword data module.
function export.show(frame)
	local args = require(parameters_module).process(frame:getParent().args, {
		[1] = {},
		["endschwa"] = { type = "boolean" },
		["ann"] = {},
		["q"] = { type = "qualifier" },
		["qq"] = { type = "qualifier" },
		["a"] = { type = "labels" },
		["aa"] = { type = "labels" },
		["pagename"] = {},
	})

	local term = args[1] or args.pagename
	if not term then
		if mw.title.getCurrentTitle().nsText == "Template" then
			term = "при́мер"
		else
			term = mw.loadData(headword_data_module).pagename
		end
	end

	local ipa = export.toIPA(term, args.endschwa)
	local ipa_text = format_ipa(ipa, args.q, args.qq, args.a, args.aa)
	local anntext = get_anntext(term, args.ann)

	-- Track terms that lack a stress mark although they are not monosyllabic.
	local polysyllabic = count_vowels(term) > 1
	if polysyllabic and count_accents(ipa) == 0 then
		require(tracking_module)("bg-IPA/no stress")
	end

	return anntext .. ipa_text
end
-- Render a rhyme suffix, with its syllable counts and optional qualifiers (q, qq) and labels (l, ll),
-- as wikitext via the rhymes module.
local function format_rhymes(rhyme_suffix, syllable_counts, q, qq, l, ll)
	local entry = { rhyme = rhyme_suffix, num_syl = syllable_counts, q = q, qq = qq, a = l, aa = ll }
	local data = {
		lang = lang,
		rhymes = { entry },
	}
	return require(rhymes_module).format_rhymes(data)
end
-- Entry point for {{bg-rhymes}}
-- The term is taken from parameter 1, else from pagename=, else an example word is used in the Template
-- namespace, else the page name from the headword data module. s= overrides the syllable count(s), which
-- otherwise default to the number of vowels in the term.
function export.show_rhymes(frame)
	local params = {
		[1] = {},
		["pagename"] = {},
		-- Declared so that the args.endschwa read below can actually receive a value; without the declaration
		-- it was always nil. Same definition as in export.show.
		["endschwa"] = { type = "boolean" },
		["s"] = { sublist = true, type = "number", },
		["q"] = { type = "qualifier", },
		["qq"] = { type = "qualifier", },
		["a"] = { type = "labels", },
		["aa"] = { type = "labels", },
	}
	local args = require(parameters_module).process(frame:getParent().args, params)
	local term = args[1] or args.pagename or mw.title.getCurrentTitle().nsText == "Template" and "при́мер" or
		mw.loadData(headword_data_module).pagename
	local ipa = export.toIPA(term, args.endschwa)
	local rhymes = export.get_rhymes(ipa)
	local syllable_counts = args.s or {count_vowels(term)}
	return format_rhymes(rhymes, syllable_counts, args.q, args.qq, args.a, args.aa)
end
-- Matches patterns such as: Bg-къща.ogg<Sofia>,
-- with capture groups [1]="Bg-къща.ogg", [2]="Sofia"
local accent_qualifier_pattern = "(.-)<(.+)>"
-- Matches speaker profiles, i.e. a shorthand for representing a given
-- speaker and the properties of their audio
-- The captures are: the text before the separator, the separator itself (":" or "~", possibly empty), and the
-- text after it. Because the first capture is lazy and the separator is optional, a bare [NAME] yields an empty
-- first capture with NAME in the third one; format_audio_list() compensates for that.
local speaker_profile_pattern = "%[([^:~]-)([:~]?)([^:~]*)%]"
-- Both tables are fields of the same speaker-profiles data module.
local speaker_profiles = require("Module:bg-pronunciation/speaker profiles").speaker_profiles
local audio_functions = require("Module:bg-pronunciation/speaker profiles").audio_functions
-- Return a list of audio formatted as wikitext
-- list: string of audio specs separated by "#", or nil.
-- ipa, pagename, corresponding_respelling: context handed to speaker-profile renderers (see below).
-- Returns two values: the list of rendered audio items, and a boolean that is true when at least one speaker
-- profile renderer returned nothing. For a nil list the results are an empty table and false.
-- Raises an error if a spec names a speaker profile that does not exist.
local function format_audio_list(list, ipa, pagename, corresponding_respelling)
local request_rfap = false
if list == nil then
return {}, request_rfap
end
-- Audio list is separated by # symbols.
local file_specs = rsplit(list, "#")
local audios = {}
for _, spec in pairs(file_specs) do
-- Try to match speaker profile
local speaker_profile_name, separator, term_override = rmatch(spec, speaker_profile_pattern)
-- FIXME
-- For a bare [NAME] the pattern puts NAME into the third capture; move it to where it belongs.
if speaker_profile_name == "" and term_override ~= "" then
speaker_profile_name = term_override
term_override = nil
end
if speaker_profile_name then
local speaker_profile = speaker_profiles[speaker_profile_name]
if not speaker_profile then
error("Speaker profile named '" .. speaker_profile_name .. "' does not exist")
end
-- Track uses of a particular speaker profile
require(tracking_module)("bg-pr/speaker-profile/" .. speaker_profile_name)
-- E.g. [ABC~2] on page="човек" is equivalent to: [ABC:човек-2].
-- Note that this uses the page name from the headword data module, not the `pagename` argument.
if separator == "~" then
term_override = mw.loadData(headword_data_module).pagename .. "-" .. term_override
end
-- A separator with nothing after it (e.g. [ABC:]) selects the corresponding respelling.
if term_override == "" then
term_override = corresponding_respelling
end
local renderer_name = speaker_profile["renderer"]
local filename = term_override or pagename
local rendered = audio_functions[renderer_name].display(speaker_profile, filename, {ipa=ipa})
if rendered then
table.insert(audios, rendered)
else
-- The renderer produced nothing; report that to the caller through the second return value.
request_rfap = true
end
else
-- Attempt to match qualifiers; if none given, then the entire spec is simply interpreted as a file name.
local filename, accents_string = rmatch(spec, accent_qualifier_pattern)
filename = filename or spec
local accents_list = accents_string and rsplit(accents_string, ",") or nil
table.insert(audios,
require(audio_module).format_audio({
lang = lang,
file = filename,
a = accents_list,
})
)
end
end
return audios, request_rfap
end
-- Render a list of homophone terms as wikitext via the homophones module.
local function format_homophones(homophones_list)
	local entries = {}
	for _, homophone in pairs(homophones_list) do
		entries[#entries + 1] = { term = homophone }
	end
	local data = {
		lang = lang,
		homophones = entries,
	}
	return require(homophones_module).format_homophones(data)
end
-- Entry point for {{bg-pr}}.
--
-- Reads the invoking template's arguments from `frame:getParent().args`, builds one pronunciation
-- line per respelling given in parameter 1, and returns the wikitext of the whole pronunciation
-- section as a single string (lines joined with "\n").
--
-- Properties (audio, rhymes, homophones, syllabification, hyphenation) that are identical for all
-- pronunciation lines are rendered once at the end as top-level bullets ("* ..."); properties that
-- differ are rendered as nested bullets ("** ...") directly beneath the line they belong to.
function export.show_all(frame)
	local params = {
		[1] = { list = true, disallow_holes = true},
		["q"] = { list = true, type = "qualifier", allow_holes=true },
		["qq"] = { list = true, type = "qualifier", allow_holes=true },
		["l"] = { list = true, type = "labels", allow_holes=true },
		["ll"] = { list = true, type = "labels", allow_holes=true },
		["ann"] = { list = true, allow_holes=true, separate_no_index = true },
		["audio"] = { list = true, allow_holes=true },
		["a"] = { alias_of = "audio", list = true, allow_holes=true },
		["rhymes"] = { list = true, separate_no_index = true, allow_holes=true },
		["s"] = { list = true, type = "number", separate_no_index = true, allow_holes=true },
		["syllabification"] = { list = true, separate_no_index = true, allow_holes=true },
		["syl"] = { alias_of = "syllabification", list = true, separate_no_index = true, allow_holes=true },
		["hyphenation"] = { list = true, separate_no_index = true, allow_holes=true },
		["hyph"] = { alias_of = "hyphenation", list = true, separate_no_index = true, allow_holes=true },
		["homophones"] = { list = true, allow_holes=true },
		["hs"] = { list = true, separate_no_index = true, allow_holes=true}, -- Hyphenation and syllabification override at once
		["hmp"] = { alias_of = "homophones", list = true, allow_holes=true },
		["endreduce"] = { list = true, allow_holes=true },
		["endschwa"] = { alias_of = "endreduce", list = true, allow_holes=true },
		["raw"] = { list = true, allow_holes=true },
		["pagename"] = {},
	}
	local args = require(parameters_module).process(frame:getParent().args, params)

	-- Explicit |pagename= wins; on template pages a fixed example word is used; otherwise the
	-- page name comes from the headword data module.
	local pagename = args.pagename or mw.title.getCurrentTitle().nsText == "Template" and "при́мер" or
		mw.loadData(headword_data_module).pagename

	-- Ensure at least one pronunciation line present (unlikely to be desired in the case of multisyllabic words, though)
	if #args[1] == 0 then
		args[1] = {pagename}
	end

	-- Returns the hyphenation/syllabification for a term if one is given by the user,
	-- or automatically generates one from the respelling if it meets the criteria:
	--[[
	- must have more than one vowel
	- the respelling given must be the same as the page title (when accents
	are removed)
	--]]
	-- Special values of `given`: "+" forces generation from the respelling, "#" forces generation
	-- from the page name. Any other given value is used as-is with "." replaced by HYPH.
	-- Returns "-" when nothing should be shown.
	local syllabify = export.syllabify
	local function hyphenate(x) return export.hyphenate(export.syllabify(x)) end
	local function deal_with_hyph_syl_respellings(given, respelling, hyphenate_or_syllabify)
		if given == "+" then
			return hyphenate_or_syllabify(respelling)
		elseif given == "#" then
			return hyphenate_or_syllabify(pagename)
		elseif given then
			return rsub(given, "%.", HYPH)
		elseif count_vowels(respelling) == 1 or rsub(deaccent_all(respelling), "%.", "") ~= pagename then
			return "-"
		else
			return hyphenate_or_syllabify(respelling)
		end
	end

	-- Return nil if a rhyme should not be added based on the term.
	--[[ The current rules are:
	- if a manual override is given by the user, that will be the rhyme regardless
	- if no override is given and the term contains a space or hyphen, return nil
	- if there is no space and hyphen, but there is more than 1 capital letter,
	then the term will be diagnosed as an abbreviation, and nil will be returned
	(this logic will help to keep rhymes for names, e.g. Петър)
	- if there is more than 1 accent mark (primary or secondary combined)
	in the IPA, then nil is returned
	- if all the above guards fail, the module will generate a rhyme
	(despite appearances, this will actually be most words anyway)
	--]]
	local function deal_with_rhymes(override, ipa)
		if override then
			return override
		end
		if count_capital_letters(pagename) > 1 then
			return nil
		end
		if count_accents(ipa) > 1 then
			return nil
		end
		if rmatch(ipa, "[ %-]") or rmatch(pagename, "[ %-]") then
			return nil
		end
		return export.get_rhymes(ipa)
	end

	-- Track whether an audio file has been included using a speaker profile but doesn't yet exist; automatically {{rfap}} if so.
	local request_rfap = false

	-- Build up the data for each pronunciation line.
	-- args[1] is a hole-free sequence (disallow_holes), so ipairs() visits every respelling in order
	-- and `i` matches the index used by the parallel per-line parameters (q1=, audio2=, ...).
	local pronunciation_lines = {}
	for i, respelling in ipairs(args[1]) do
		local q = args.q[i]
		local qq = args.qq[i]
		local l = args.l[i]
		local ll = args.ll[i]
		local num_syllables = args.s.default or args.s[i] or count_vowels(respelling)
		local ipa = args.raw[i] or export.toIPA(respelling, args.endreduce[i])
		local audio, request_rfap_local = format_audio_list(args.audio.default or args.audio[i], ipa, pagename, respelling)
		local rhymes = deal_with_rhymes(args.rhymes.default or args.rhymes[i], ipa) or "-"
		local homophones = args.homophones[i] and rsplit(args.homophones[i], "#")
		-- |hs= (no index) applies to every line; |hsN= applies to line N only. It overrides both
		-- syllabification and hyphenation, taking priority over their individual parameters.
		local hs = args.hs.default or args.hs[i]
		local syllabification = deal_with_hyph_syl_respellings(hs or args.syllabification.default or args.syllabification[i], respelling, syllabify)
		local hyphenation = deal_with_hyph_syl_respellings(hs or args.hyphenation.default or args.hyphenation[i], respelling, hyphenate)
		local ann = args.ann.default or args.ann[i]

		table.insert(pronunciation_lines, {
			term = respelling,
			q = q,
			qq = qq,
			l = l,
			ll = ll,
			num_syllables = num_syllables,
			ipa = ipa,
			audio = audio,
			rhymes = rhymes,
			homophones = homophones,
			syllabification = syllabification,
			hyphenation = hyphenation,
			ann = ann,
		})

		if args.rhymes[i] then
			require(tracking_module)("bg-pr/manual rhyme")
			if export.get_rhymes(ipa) ~= args.rhymes[i] then
				-- Manual rhyme actually changes the displayed rhyme
				require(tracking_module)("bg-pr/rhyme override discrepancy")
			end
		end

		if request_rfap_local then
			request_rfap = true
		end

		-- Terms with a lack of stress despite not being monosyllabic
		if count_vowels(respelling) > 1 and count_accents(ipa) == 0 then
			require(tracking_module)("bg-pr/no stress")
		end
	end

	-- This function is used to check whether all pronunciation lines have the same value for
	-- a particular property. If they do, then that property should only be rendered once,
	-- underneath each IPA.
	-- If the properties are different, then each IPA should have that property value specified
	-- indented underneath it, e.g. multiple IPAs with different audio files should have
	-- their audios indented beneath each IPA.
	-- Returns the first line's value for the property, and a boolean saying whether all lines agree.
	local function all_the_same(property, eq) -- `eq` allows the notion of "the_same" to be overridden
		eq = eq or function(a, b) return a == b end -- Use "==" as default definition of equality
		local first = pronunciation_lines[1][property]
		for _, pronunciation_line in ipairs(pronunciation_lines) do
			if not eq(pronunciation_line[property], first) then
				return first, false
			end
		end
		return first, true
	end

	-- Render overall output as text
	local output_lines = {}

	-- Check whether values for each property are all the same,
	-- in which case they can all be merged at the end of the template,
	-- instead of being duplicated per-pronunciation-line.
	local first_hyphenation, all_hyphenations_the_same = all_the_same("hyphenation")
	local first_syllabification, all_syllabifications_the_same = all_the_same("syllabification")
	local first_rhyme, all_rhymes_the_same = all_the_same("rhymes")
	local first_homophones, all_homophones_the_same = all_the_same("homophones", require(table_module).deepEquals)
	local first_audio, all_audio_the_same = all_the_same("audio", require(table_module).deepEquals)

	-- Generate text for each pronunciation line.
	for _, pronunciation_line in ipairs(pronunciation_lines) do
		-- Unpack data
		local ipa = pronunciation_line["ipa"]
		local term = pronunciation_line["term"]
		local ann = pronunciation_line["ann"]
		local q = pronunciation_line["q"]
		local qq = pronunciation_line["qq"]
		local l = pronunciation_line["l"]
		local ll = pronunciation_line["ll"]
		local audios = pronunciation_line["audio"]
		local rhymes = pronunciation_line["rhymes"]
		local homophones = pronunciation_line["homophones"]
		local hyphenation = pronunciation_line["hyphenation"]
		local syllabification = pronunciation_line["syllabification"]

		local ipa_text = format_ipa(ipa, q, qq, l, ll)
		local ann_text = get_anntext(term, ann)
		local out = {"* " .. ann_text .. ipa_text}

		if audios and not all_audio_the_same then
			for _, audio in ipairs(audios) do
				table.insert(out, "** " .. audio)
			end
		end

		-- "-" is the sentinel for "no rhyme to display".
		if rhymes ~= "-" and not all_rhymes_the_same then
			local num_syllables = pronunciation_line["num_syllables"]
			local rhymes_text = format_rhymes(rhymes, {num_syllables})
			table.insert(out, "** " .. rhymes_text)
		end

		if homophones and not all_homophones_the_same then
			local homophones_text = format_homophones(homophones)
			table.insert(out, "** " .. homophones_text)
		end

		-- When syllabification and hyphenation coincide, only the syllabification text is shown.
		local syllabification_text = format_syllabification(syllabification)
		if syllabification == hyphenation and syllabification ~= "-" then
			if not (all_hyphenations_the_same and all_syllabifications_the_same) then
				table.insert(out, "** " .. syllabification_text)
			end
		else
			local hyphenation_text = format_hyphenation(hyphenation)
			if not all_syllabifications_the_same and syllabification ~= "-" then
				table.insert(out, "** " .. syllabification_text)
			end
			if not all_hyphenations_the_same and hyphenation ~= "-" then
				table.insert(out, "** " .. hyphenation_text)
			end
		end

		-- Produce output for one pronunciation line at a time
		table.insert(output_lines, table.concat(out, "\n"))
	end

	-- Group audios all together if they are all identical
	if all_audio_the_same and first_audio then
		for _, audio in ipairs(first_audio) do
			table.insert(output_lines, "* " .. audio)
		end
	end

	-- Group rhymes all together if they are all identical
	if all_rhymes_the_same and first_rhyme ~= "-" then
		-- Take all syllable counts for all pronunciation lines
		-- to inform the syllable count of the rhyme.
		local num_syllables = {}
		for _, line in ipairs(pronunciation_lines) do
			table.insert(num_syllables, line["num_syllables"])
		end
		local rhymes_text = format_rhymes(first_rhyme, num_syllables)
		table.insert(output_lines, "* " .. rhymes_text)
	end

	-- Group homophones all together if they are all identical
	if all_homophones_the_same and first_homophones then
		local homophones_text = format_homophones(first_homophones)
		table.insert(output_lines, "* " .. homophones_text)
	end

	-- If some hyphenations or syllabifications are absent, then the outermost text should not include these,
	-- rather they should have been appended to the relevant pronunciations lines above.
	if all_hyphenations_the_same and all_syllabifications_the_same and first_hyphenation == first_syllabification and first_hyphenation ~= "-" then
		local syllabification_text = format_syllabification(first_hyphenation)
		table.insert(output_lines, "* " .. syllabification_text)
	elseif first_hyphenation ~= first_syllabification then
		if all_syllabifications_the_same and first_syllabification ~= "-" then
			local syllabification_text = format_syllabification(first_syllabification)
			table.insert(output_lines, "* " .. syllabification_text)
		end
		if all_hyphenations_the_same and first_hyphenation ~= "-" then
			local hyphenation_text = format_hyphenation(first_hyphenation)
			table.insert(output_lines, "* " .. hyphenation_text)
		end
	end

	-- A speaker-profile audio was requested but could not be rendered: ask for a recording.
	if request_rfap then
		table.insert(output_lines, frame:preprocess("{{rfap|bg}}"))
	end

	return table.concat(output_lines, "\n")
end
return export
3infwrt3y6rxhu8biiaakk2o27agf6i
Module:bg-pronunciation/testcases
828
137954
234880
222992
2025-12-30T19:10:43Z
en>Kiril kovachev
0
Add accents to hyphenation test cases as well
234880
Scribunto
text/plain
local tests = require("Module:UnitTests")
local m_pron = require("Module:bg-pronunciation")
local rhymes_module = "Module:rhymes"
local Bulgarian = require("Module:languages").getByCode("bg")
local Cyrillic = require("Module:scripts").getByCode("Cyrl")
-- Build a full link to `term`, using the module-level Bulgarian language and Cyrillic script objects.
local function link(term)
	local link_data = { term = term, lang = Bulgarian, sc = Cyrillic }
	return require("Module:links").full_link(link_data)
end
-- Wrap an IPA transcription in a <span class="IPA"> element for display.
local function tag_IPA(IPA)
	local open_tag, close_tag = '<span class="IPA">', '</span>'
	return open_tag .. IPA .. close_tag
end
-- Return the argument unchanged; used as a no-op display function.
local function identity(value)
	return value
end
local display_hyphenation = identity
local display_syllabification = identity
-- Display a rhyme by passing {"bg", ipa} to `show_row` of the rhymes module.
local function display_rhymes(ipa)
	local row_args = {"bg", ipa}
	return require(rhymes_module).show_row(row_args)
end
-- Check that `m_pron.toIPA(term, endschwa)` yields `expected`.
-- The row label is a link to the term with pronunciation notations removed, followed by the
-- respelling (when it differs from the normalized term) and a note when `endschwa` is set.
function tests:check_output_ipa(term, expected, endschwa)
	local normalized_term = m_pron.remove_pron_notations(term)
	local label = link(normalized_term)
	if term ~= normalized_term then
		label = label .. " (respelled " .. term .. ")"
	end
	if endschwa then
		label = label .. ", endschwa=true"
	end
	local actual = m_pron.toIPA(term, endschwa)
	tests:equals(label, actual, expected, { display = tag_IPA })
end
-- Check that `m_pron.hyphenate_total(term)` yields `expected`, where every "." in `expected`
-- is first replaced by the hyphenation point "‧".
function tests:check_output_hyphenation(term, expected)
	local label = link(term)
	local actual = m_pron.hyphenate_total(term)
	-- Only the first return value of gsub (the string) is kept.
	local wanted = mw.ustring.gsub(expected, "[.]", "‧")
	tests:equals(label, actual, wanted, { display = display_hyphenation })
end
-- Check that `m_pron.syllabify(term)` yields `expected`, where every "." in `expected`
-- is first replaced by the syllable separator "‧".
function tests:check_output_syllabification(term, expected)
	local label = link(term)
	local actual = m_pron.syllabify(term)
	-- Only the first return value of gsub (the string) is kept.
	local wanted = mw.ustring.gsub(expected, "[.]", "‧")
	tests:equals(label, actual, wanted, { display = display_syllabification })
end
-- Check that the rhyme derived from the IPA of `term` equals `expected`.
-- `term` is either a respelling string or a table whose `args[1]` holds the respelling; the row
-- label links to the respelling with the combining dot below removed.
function tests:check_output_rhymes(term, expected)
	local respelling = type(term) == "table" and term.args[1] or term
	local label = link(respelling:gsub("̣", ""))
	local actual = m_pron.get_rhymes(m_pron.toIPA(term))
	tests:equals(label, actual, expected, { display = display_rhymes })
end
-- IPA test cases. Each entry is { respelling, expected IPA [, endschwa] }; the list is handed to
-- `self:iterate` together with the name of the checker method "check_output_ipa"
-- (presumably each entry is unpacked into that method's arguments -- confirm in Module:UnitTests).
function tests:test_ipa()
local list = {
{ "къ́ща", "ˈkɤʃtɐ" },
{ "сгъстя́ се", "zɡɐˈstʲɤ̟ sɛ", true },
{ "сгъстя̣́ се", "zɡɐˈstʲɤ̟ sɛ"},
{ "а̀бдики́ращ", "ˌabdiˈkirɐʃt" },
{ "безшу́мен", "bɛʃˈʃu̟mɛn" },
{ "щастли́в", "ʃtɐˈslif" },
{ "народността́", "nɐrodnoˈsta" },
{ "я", "ja̟" },
{ "юг", "ju̟k" },
{ "яйце́", "jɐjˈt͡sɛ" },
{ "изя́м", "iˈzʲa̟m"}, -- not morphological, but seemingly necessary to avoid a palatalization-initial syllable.
{ "учи́лище", "oˈt͡ʃiliʃtɛ" },
{ "чорбаджи́я", "t͡ʃo̟rbɐˈdʒijɐ" },
{ "уби́йца", "oˈbijt͡sɐ" },
{ "безбра́чие", "bɛzˈbrat͡ʃiɛ" },
{ "из.мра́", "izˈmra" },
{ "сала́та", "sɐˈɫatɐ" },
{ "шега́", "ʃɛˈɡa" },
{ "жена́", "ʒɛˈna" },
{ "инти́мен", "inˈtimɛn" },
{ "посо́лство", "poˈsɔɫstvo" },
{ "ъ́гъл", "ˈɤɡɐɫ"},
{ "усу́квам", "oˈsukvɐm"},
{ "ле́ща", "ˈlɛʃtɐ" },
{ "липа́", "liˈpa" },
{ "океа́н", "okɛˈan" },
{ "меки́ца", "mɛˈkit͡sɐ" },
{ "ла́гер", "ˈɫaɡɛr" },
{ "маги́я", "mɐˈɡijɐ" },
{ "хем", "xɛm" },
{ "химн", "ximn"},
{ "тулу́п", "toˈɫup"},
{ "жа̀р-пти́ца", "ˌʒa̟r-pˈtit͡sɐ" },
{ "в о́фис", "f ˈɔfis" },
{ "във Фра́нция", "vɐf ˈfrant͡sijɐ" },
{ "ня́колко", "ˈnʲa̟koɫko" },
{ "в Япо́ния", "f jɐˈpɔnijɐ" },
{ "автоплу́г", "ɐftoˈpɫuk" }, --ʊ in previous module
{ "ўе́бса́йт", "ˈwɛpˈsajt" },
{ "ўе́лски", "ˈwɛɫski" },
{ "ўе́стърн", "ˈwɛstɐrn" },
{ "О́ўен", "ˈɔwɛn" },
{ "но́ўхаў", "ˈnɔwxɐw" },
{ "Джо́ўзеф", "ˈdʒɔwzɛf" },
{ "бо́ўлинг", "ˈbɔwliŋk" },
{ "даўнло́ўд", "dɐwnˈɫɔwt" },
{ "ўи́ски", "ˈwiski" },
{ "ўи́кенд", "ˈwikɛnt" },
{ "Ўо́рўик", "ˈwɔrwik" },
{ "Хе́лоўин", "ˈxɛɫowin" },
}
--[[
Additions take this form –
{ "word with acutes", "IPA" },
{ "", "" },
Make sure to include the comma, or the module will return an error.
]]
self:iterate(list, "check_output_ipa")
end
-- Hyphenation test cases. Each entry is { term, expected hyphenation }, with "." marking the
-- expected break points; `check_output_hyphenation` converts each "." to "‧" before comparing.
function tests:test_hyphenation()
local list = {
{ "височина́", "ви.со.чи.на" },
{ "сестра́", "сес.тра" },
{ "пле́нник", "плен.ник" },
{ "преодоле́я", "пре.одо.лея" },
{ "маои́зъм", "мао.изъм" },
{ "ма́йка", "май.ка" },
{ "а́йс.берг", "айс.берг" },
{ "майо́р", "ма.йор" },
{ "фризьо́р", "фри.зьор" },
{ "суджу́к", "су.джук" },
{ "над.живе́я", "над.жи.вея" },
{ "сестра́", "сес.тра" },
{ "поту́ри", "по.ту.ри"},
{ "слани́на", "сла.ни.на"},
{ "пра́жа", "пра.жа"},
{ "спринцо́вка", "сприн.цов.ка"},
{ "пъ́ржа", "пър.жа"},
{ "я́ркост", "яр.кост"},
{ "рало", "ра.ло"},
{ "бели́ло", "бе.ли.ло"},
{ "шеви́ца", "ше.ви.ца"},
{ "дои́ло", "до.ило"},
{ "нача́ло", "на.ча.ло"},
{ "хи́трост", "хит.рост"},
{ "хи́тър", "хи.тър"},
{ "шеви́ца", "ше.ви.ца"},
{ "вдлъ́бна", "вдлъб.на"},
{ "разма́хам", "раз.ма.хам"},
{ "у́кор", "укор"},
{ "упори́т", "упо.рит"},
{ "о́сем", "осем"},
{ "оце́нка", "оцен.ка"},
{ "ле́я", "лея"},
{ "а́з", "аз"}, -- test out accenting monosyllables just for extra rigor
{ "тя́", "тя"},
{ "е́", "е"},
{ "ме́н", "мен"},
{ "стра́ст", "страст"},
{ "пръст", "пръст"},
{ "шофьо́р", "шо.фьор" },
{ "фотьо́йл", "фо.тьойл" },
{ "бельо́", "бе.льо" },
{ "шедьо́вър", "ше.дьо.вър" },
{ "ме́ниджър", "ме.ни.джър" },
{ "джудже́", "джу.дже" },
{ "жа́р-пти́ца", "жар-пти.ца"},
{ "мора́лно-нра́вствен", "мо.рал.но-нрав.ствен" },
{ "кандида́т-студе́нт", "кан.ди.дат-сту.дент" },
{ "мини́стър-председа́тел", "ми.нис.тър-пред.се.да.тел" },
{ "член-кореспонде́нт", "член-ко.рес.пон.дент" },
{ "би́знес администра́ция", "биз.нес ад.ми.нис.тра‧ция" }, -- NOTE: already contains a literal "‧" (unaffected by the "." replacement)
{ "е́кшън геро́й", "ек.шън ге.рой" },
{ "те́нис ко́рт", "те.нис корт" },
{ "заме́стник мини́стър-председа́тел", "за.мес.тник ми.нис.тър-пред.се.да.тел" },
{ "заме́стник нача́лник-управле́ние", "за.мес.тник на.чал.ник-уп.рав.ле.ние" },
{ "SIM ка́рта", "SIM кар.та" },
{ "VIP зо́на", "VIP зо.на" }
}
--[[
Additions take this form –
{ "word (with no accent required)", "expected hyphenation" },
{ "", "" },
Make sure to include the comma, or the module will return an error.
]]
self:iterate(list, "check_output_hyphenation")
end
-- Syllabification test cases, grouped by the phenomenon being exercised. The list is handed to
-- `self:iterate` together with the name of the checker method "check_output_syllabification",
-- which converts each "." in the expected value to "‧" before comparing.
function tests:test_syllabification()
-- Left side of elements: input to the function, which may include dots (.) for manual syllable division
-- Right side of elements: expected output, with syllable breaks indicated with a dot
local list = {
-- 1. Single-letter words
{ "а", "а" },
{ "в", "в" },
{ "е", "е" },
{ "и", "и" },
{ "ѝ", "ѝ" },
{ "о", "о" },
{ "с", "с" },
{ "у", "у" },
-- 2. Simple monosyllabic words
{ "аз", "аз" },
{ "ти", "ти" },
{ "той", "той" },
{ "тя", "тя" },
{ "във", "във" },
{ "със", "със" },
-- 3. More complex monosyllabic words
{ "принц", "принц" },
{ "спринт", "спринт" },
{ "глист", "глист" },
{ "скункс", "скункс" },
-- 4. Single consonant between two vowels: 3-letter words
{ "ами́", "а.ми" },
{ "ала́", "а.ла" },
{ "ако́", "а.ко" },
{ "уви́", "у.ви" },
{ "или́", "и.ли" },
-- 5. Single consonant between two vowels: stops and fricatives
{ "саламу́ра", "са.ла.му.ра" },
{ "бараба́н", "ба.ра.бан" },
{ "сполу́ка", "спо.лу.ка" },
{ "ща́вя", "ща.вя" },
{ "стри́на", "стри.на" },
{ "кога́то", "ко.га.то" },
{ "изя́м", "и.зям" },
-- 6. Single consonant between two vowels: щ, and single-letter affricates
{ "стари́цата", "ста.ри.ца.та" },
{ "полу́чените", "по.лу.че.ни.те" },
{ "подоба́ващите", "по.до.ба.ва.щи.те" },
{ "обуча́ващите", "о.бу.ча.ва.щи.те" },
-- 7. Single consonant between two vowels: дж
{ "джудже́", "джу.дже" },
{ "суджу́к", "су.джук" },
{ "дамаджа́на", "да.ма.джа.на" },
{ "джа́джите", "джа.джи.те" },
-- 8. Single consonant between two vowels: й
{ "койо́т", "ко.йот" },
{ "майоне́за", "ма.йо.не.за" },
{ "пейорати́вен", "пе.йо.ра.ти.вен" },
{ "майо́р", "ма.йор" },
-- 9. Single consonant between two vowels: morphological prefixes get split
{ "бези́менен", "бе.зи.ме.нен" },
{ "изопача́вам", "и.зо.па.ча.вам" },
{ "оти́вам", "о.ти.вам" },
{ "разора́н", "ра.зо.ран" },
-- 10. Single consonant between two vowels: palatalized by ь
{ "бульо́н", "бу.льон" },
{ "фризьо́р", "фри.зьор" },
{ "шедьо́вър", "ше.дьо.вър" },
{ "гьозу́м", "гьо.зум" },
{ "ликьо́р", "ли.кьор" },
-- 11. Zero consonants between two vowels: at most one elsewhere in word
{ "воа́л", "во.ал" },
{ "маои́зъм", "ма.о.и.зъм" },
{ "фее́рия", "фе.е.ри.я" },
{ "воайо́р", "во.а.йор" },
{ "миока́рд", "ми.о.кард" },
{ "кьо́поолу", "кьо.по.о.лу" },
{ "аятола́х", "а.я.то.лах" },
{ "ава́рия", "а.ва.ри.я" },
{ "пози́ции", "по.зи.ци.и" },
{ "хазя́и", "ха.зя.и" },
{ "дерибе́и", "де.ри.бе.и" },
{ "преодоле́я", "пре.о.до.ле.я" },
-- 12. Two or more consonants between two vowels: щр
{ "нащре́к", "на.щрек" },
{ "поощря́вам", "по.о.щря.вам" },
{ "защрихо́вам", "за.щри.хо.вам" },
{ "поощри́телен", "по.о.щри.те.лен" },
{ "изщра́кване", "из.щрак.ва.не" },
{ "Ва́йерщра̀с", "Ва.йер.щрас" },
{ "Кьо́нигщра̀се", "Кьо.ниг.щра.се" },
-- 13. Two or more consonants between two vowels: щ + other sonorant before vowel
{ "о́бщност", "общ.ност" },
{ "всъ́щност", "всъщ.ност" },
{ "помо́щник", "по.мощ.ник" },
{ "чорапога́щник", "чо.ра.по.гащ.ник" },
{ "но́щница", "нощ.ни.ца" },
{ "чудо́вищност", "чу.до.вищ.ност" },
{ "немощливо", "не.мощ.ли.во" }, -- correct stress?
{ "съобща́вам", "съ.об.ща.вам" },
{ "въобще́", "въ.об.ще" },
-- 14. Two or more consonants between two vowels: дж affricate present
{ "ма́нджа", "ман.джа" },
{ "калайджи́я", "ка.лай.джи.я" },
{ "авджи́я", "ав.джи.я" },
{ "изджва́ка", "из.джва.ка" },
-- 15. Two or more consonants between two vowels: adjacent sonorants or stops
{ "пле́нник", "плен.ник" },
{ "ма́йка", "май.ка" },
{ "про̀фаши́стки", "про.фа.шист.ки" },
{ "гле́дка", "глед.ка" },
{ "кра́чка", "крач.ка" },
{ "це́дка", "цед.ка" },
-- 16a. Two consonants between two vowels: other
{ "звезда́", "звез.да" },
{ "спринцо́вка", "сприн.цов.ка" },
{ "бъ́рзо", "бър.зо" },
{ "ма́лко", "мал.ко" },
{ "по́сле", "по.сле" },
{ "па́ртия", "пар.ти.я" },
{ "гла́нцов", "глан.цов" },
{ "пе́пелник", "пе.пел.ник" },
{ "пи́лци", "пил.ци" },
{ "аншоа́", "ан.шо.а" },
{ "ядро́", "я.дро" },
-- 16b. As above, testing clusters чн, цм, цн, чм
{ "ирони́чност", "и.ро.нич.ност"},
{ "профилакти́чна", "про.фи.лак.тич.на"},
{ "бо́цна", "боц.на"},
{ "спе́цна", "спец.на"},
{ "бичме́", "бич.ме"},
{ "кръ́чма", "кръч.ма"},
{ "бо́цман", "боц.ман"},
{ "сачма́", "сач.ма"},
{ "Ри́чмънд", "Рич.мънд"},
{ "ми́чман", "мич.ман"},
{ "разче́ша", "раз.че.ша"},
{ "пе́цма", "пец.ма"}, -- Probably not a real word
-- 17. Complex consonant clusters: general
{ "сестра́", "се.стра" },
{ "ца́рство", "цар.ство" },
{ "нра́вствен", "нрав.ствен" },
{ "ма́ндраджия", "ман.дра.джи.я" },
{ "мизансце́н", "ми.зан.сцен" },
{ "стра́нство", "стран.ство" },
{ "простра́нство", "про.стран.ство" },
{ "ро́бство", "роб.ство" },
{ "транспо́рт", "тран.спорт" },
-- 18. Consonant cluster not split: св
{ "посви́кна", "по.свик.на" },
-- 19. Forced syllable breaks: when absent
{ "скръ́ндза", "скрън.дза" },
{ "годзи́ла", "год.зи.ла" },
{ "камика́дзе", "ка.ми.кад.зе" },
{ "надживе́я", "на.джи.ве.я" },
-- 20. Forced syllable breaks: when present
{ "скръ́н.дза", "скрън.дза" },
{ "го.дзи́ла", "го.дзи.ла" },
{ "камика́.дзе", "ка.ми.ка.дзе" },
{ "над.живе́я", "над.жи.ве.я" },
-- 21. Morphological prefix handling: без- + equal sonority
{ "безси́лен", "без.си.лен" },
{ "безшу́мен", "без.шу.мен" },
{ "безвъзвра́тен", "без.въз.вра.тен" },
{ "безхабе́рен", "без.ха.бе.рен" },
{ "безстра́шен", "без.стра.шен" },
{ "безхле́бна", "без.хле.бна" },
{ "безвре́мие", "без.вре.ми.е" },
-- 22. Morphological prefix handling: без- + higher sonority
{ "безме́рен", "без.ме.рен" },
{ "безли́чен", "без.ли.чен" },
{ "безнака́зан", "без.на.ка.зан" },
{ "безразбо́рен", "без.раз.бо.рен" },
{ "безде́тен", "без.де.тен" },
{ "безпардо́нен", "без.пар.до.нен" },
{ "безтеле́сен", "без.те.ле.сен" },
{ "безгла́в", "без.глав" },
{ "безче́стен", "без.че.стен" },
{ "безпризо́рен", "без.при.зо.рен" },
{ "безгре́шен", "без.гре.шен" },
{ "безкра́ен", "без.кра.ен" },
{ "безбре́жен", "без.бре.жен" },
{ "бе́здна", "безд.на" },
-- 23. Morphological prefix handling: из- + equal sonority
{ "изхвъ́рлям", "из.хвър.лям" },
{ "изсте́на", "из.сте.на" },
{ "и́звор", "из.вор" },
{ "изво́звам", "из.воз.вам" },
{ "извла́ча", "из.вла.ча" },
{ "изхра́чване", "из.храч.ва.не" },
{ "изшму́гна", "из.шмуг.на" },
{ "изживя́ното", "из.жи.вя.но.то" },
-- 24. Morphological prefix handling: из- + higher sonority
{ "изнена́да", "из.не.на.да" },
{ "излъ́гах", "из.лъ.гах" },
{ "измя́на", "из.мя.на" },
{ "и́зрод", "из.род" },
{ "изтрезви́телно", "из.трез.ви.тел.но" },
{ "изпростя́вял", "из.про.стя.вял" },
{ "изклю́чвам", "из.ключ.вам" },
{ "избли́за", "из.бли.за" },
-- 25. Morphological prefix handling: над- + equal/lower sonority
{ "надсло́в", "над.слов" },
{ "надхвъ́рлен", "над.хвър.лен" },
{ "надви́квам", "над.вик.вам" },
{ "надве́", "над.ве" },
{ "надгро́бен", "над.гро.бен" },
{ "на́дпис", "над.пис" },
{ "надценя́вам", "над.це.ня.вам" },
{ "надделе́я", "над.де.ле.я" },
-- 26. Morphological prefix handling: над- + higher sonority
{ "над.ра́ствам", "над.ра.ствам" },
{ "надмо́щие", "над.мо.щи.е" },
{ "ненадми́нат", "не.над.ми.нат" },
{ "безнадзо́рен", "без.над.зо.рен" },
{ "на́дница", "над.ни.ца" },
{ "надме́нност", "над.мен.ност" },
{ "на.длъ́ж", "на.длъж" },
{ "надробе́н", "на.дро.бен" },
{ "надръ́нкам", "на.дрън.кам" },
{ "надра́скам", "на.дра.скам" },
{ "надру́сам", "на.дру.сам" },
{ "надра́н", "на.дран" },
-- 27. Morphological prefix handling: под- + equal/lower sonority
{ "подстрека́тел", "под.стре.ка.тел" },
{ "подхо́д", "под.ход" },
{ "подви́жен", "под.ви.жен" },
{ "подзагла́вие", "под.за.гла.ви.е" },
{ "подкла́ждам", "под.клаж.дам" },
{ "подбо́р", "под.бор" },
{ "подпи́рам", "под.пи.рам" },
{ "подценя́вам", "под.це.ня.вам" },
-- 28. Morphological prefix handling: под- + higher sonority
{ "подновя́вам", "под.но.вя.вам" },
{ "подма́мвам", "под.мам.вам" },
{ "по́длост", "под.лост" },
{ "под.разделе́ние", "под.раз.де.ле.ни.е" },
{ "подро́бен", "по.дро.бен" },
{ "подража́вам", "по.дра.жа.вам" },
{ "подре́мя", "по.дре.мя" },
{ "подру́сам", "по.дру.сам" },
-- 29. Multiple prefixes
{ "безизра́зен", "бе.зиз.ра.зен" },
{ "безизра́зност", "бе.зиз.ра.зност" },
{ "безвъзме́зден", "без.въз.мез.ден" },
{ "безвъзду́шен", "без.въз.ду.шен" },
{ "безразли́чен", "без.раз.ли.чен" },
{ "безразбо́рност", "без.раз.бор.ност" },
{ "безпредме́тен", "без.пред.ме.тен" },
{ "поизпра́вя", "по.из.пра.вя" },
{ "поизмъ́ча", "по.из.мъ.ча" },
{ "поизгла́дя", "по.из.гла.дя" },
{ "произноше́ние", "про.из.но.ше.ни.е" },
{ "произти́ча", "про.из.ти.ча" },
{ "наизми́слил", "на.из.ми.слил" },
{ "наизле́злите", "на.из.ле.зли.те" },
{ "предразположе́ние", "пред.раз.по.ло.же.ни.е" },
{ "преразгле́ждане", "пре.раз.глеж.да.не" },
{ "преразпределе́ние", "пре.раз.пре.де.ле.ни.е" },
{ "прера́зказ", "пре.раз.каз" },
{ "превъзмо́гна", "пре.въз.мог.на" },
{ "превъзпита́ние", "пре.въз.пи.та.ни.е" },
{ "преизда́вам", "пре.из.да.вам" },
{ "преизби́рам", "пре.из.би.рам" },
{ "невъзмо́жен", "не.въз.мо.жен" },
{ "невъзпи́тан", "не.въз.пи.тан" },
{ "неизбе́жен", "не.из.бе.жен" },
{ "неизме́нност", "не.из.мен.ност" },
{ "неразде́лен", "не.раз.де.лен" },
{ "неразположе́ние", "не.раз.по.ло.же.ни.е" },
{ "поразми́сля", "по.раз.ми.сля" },
{ "пораздру́сам", "по.раз.дру.сам" },
{ "наразка́зах", "на.раз.ка.зах" },
{ "наразлепи́л", "на.раз.ле.пил" },
{ "неотло́жен", "не.от.ло.жен" },
{ "неотмени́м", "не.от.ме.ним" },
{ "поотло́жа", "по.от.ло.жа" },
{ "поотми́на", "по.от.ми.на" },
-- 30. Loanwords with /w/ as a consonant: default spelling with 'у'
{ "уе́лски", "у.ел.ски" },
{ "уе́бсайт", "у.еб.сайт" },
{ "уе́стърн", "у.е.стърн" },
{ "О́уен", "О.у.ен" },
{ "но́уха̀у", "но.у.ха.у" },
{ "Джо́узеф", "Джо.у.зеф" },
{ "бо́улинг", "бо.у.линг" },
{ "да̀унло́уд", "да.ун.ло.уд" },
{ "уи́ски", "у.и.ски" },
{ "уи́кенд", "у.и.кенд" },
{ "Уо́руик", "У.о.ру.ик" },
{ "Хе́лоуин", "Хе.ло.у.ин" },
-- 31. Loanwords with /w/ as a consonant: alternative spelling with 'ў'
{ "ўе́лски", "уел.ски" },
{ "ўе́бсайт", "уеб.сайт" },
{ "ўе́стърн", "уе.стърн" },
{ "О́ўен", "О.уен" },
{ "но́ўха̀ў", "ноу.хау" },
{ "Джо́ўзеф", "Джоу.зеф" },
{ "бо́ўлинг", "боу.линг" },
{ "да̀ўн.ло́ўд", "даун.лоуд" },
{ "ўи́ски", "уи.ски" },
{ "ўи́кенд", "уи.кенд" },
{ "Ўо́рўик", "Уор.уик" },
{ "Хе́лоўин", "Хе.ло.уин" },
{ "ўи́нд.сърфинг", "уинд.сър.финг" },
-- 32. Multiple-word terms with hyphens or spaces
{ "ра́зни хо́ра-ра́зни вку́сове", "раз.ни хо.ра-раз.ни вку.со.ве", },
{ "акуше́р-гинеколо́г", "а.ку.шер-ги.не.ко.лог" },
{ "на́й-напре́д", "най-на.пред" },
{ "ампер-ча́с", "ам.пер-час" },
{ "га́-га́", "га-га" }, -- no-op
{ "пи́-пи́", "пи-пи" },
{ "Гвине́я-Биса́у", "Гви.не.я-Би.са.у" },
{ "ша́м-фъстъ́к", "шам-фъ.стък" },
{ "вълна́-уби́ец", "въл.на-у.би.ец" },
{ "акуше́р-гинеколо́г", "а.ку.шер-ги.не.ко.лог" },
{ "по́-добре́ къ́сно, отко́лкото ни́кога", "по-до.бре къ.сно, от.кол.ко.то ни.ко.га" },
{ "зени́тно-раке́тен", "зе.нит.но-ра.ке.тен" },
{ "го́ре-до́лу", "го.ре-до.лу" },
{ "на́й-по́сле", "най-по.сле" },
{ "чик-чири́к", "чик-чи.рик" },
{ "сре́ден ро́д", "сре.ден род" },
{ "божа́ кра́вичка", "бо.жа кра.вич.ка" },
{ "Съедине́ни америка́нски ща́ти", "Съ.е.ди.не.ни а.ме.ри.кан.ски ща.ти" },
{ "от мла́дих до ста́рих", "от мла.дих до ста.рих" },
{ "со кро́тце, со бла́го и со ма́лко кюте́к", "со крот.це, со бла.го и со мал.ко кю.тек" }
}
--[[
Additions take this form –
{ "word (with no accent required)", "expected syllabification" },
{ "", "" },
Make sure to include the comma, or the module will return an error.
]]
self:iterate(list, "check_output_syllabification")
end
-- Rhyme test cases. Each entry is { term, expected rhyme }; the list is handed to `self:iterate`
-- together with the name of the checker method "check_output_rhymes". A term is either a plain
-- respelling string or a table built by `make_args` (used when extra arguments such as `endschwa`
-- accompany the respelling).
function tests:test_rhymes()
-- Wrap an argument table as { args = tbl }; `check_output_rhymes` reads the respelling from
-- `term.args[1]` (presumably `m_pron.toIPA` accepts this frame-like shape -- confirm there).
local function make_args(tbl)
return { args=tbl }
end
local list = {
-- Words rhyming in -am
{"грам", "am"},
{"прям", "am"},
{"сам", "am"},
{"едва́м", "am"},
{"хипопота́м", "am"},
-- Words rhyming in -it͡ʃɛn
{"ли́чен", "it͡ʃɛn"},
{"графи́чен", "it͡ʃɛn"},
{"психи́чен", "it͡ʃɛn"},
{"ритми́чен", "it͡ʃɛn"},
{"цини́чен", "it͡ʃɛn"},
{"части́чен", "it͡ʃɛn"},
{"себи́чен", "it͡ʃɛn"},
{"категори́чен", "it͡ʃɛn"},
{"мелоди́чен", "it͡ʃɛn"},
{"микроскопи́чен", "it͡ʃɛn"},
{"етимологи́чен", "it͡ʃɛn"},
{"епидемиологи́чен", "it͡ʃɛn"},
-- Words rhyming in -ɔf
{"зов", "ɔf"},
{"нов", "ɔf"},
{"оф", "ɔf"},
{"карто́ф", "ɔf"},
{"пищо́в", "ɔf"},
{"Цветко́в", "ɔf"},
{"Попо́в", "ɔf"},
{"Свищо́в", "ɔf"},
{"надсло́в", "ɔf"},
{"апостро́ф", "ɔf"},
{"полугото́в", "ɔf"},
-- Words rhyming in -ɛnɐ
{"вселе́на", "ɛnɐ"},
{"Еле́на", "ɛnɐ"},
-- Words rhyming in -ɛtɐ
{"ге́та", "ɛtɐ"},
{"че́та", "ɛtɐ"},
{"баре́та", "ɛtɐ"},
{"касе́та", "ɛtɐ"},
{"соле́та", "ɛtɐ"},
{"раке́та", "ɛtɐ"},
{"каре́та", "ɛtɐ"},
-- Words rhyming in -ɛt͡ʃkɐ
{"кле́чка", "ɛt͡ʃkɐ"},
{"пе́чка", "ɛt͡ʃkɐ"},
{"апте́чка", "ɛt͡ʃkɐ"},
{"пресе́чка", "ɛt͡ʃkɐ"},
{"юрде́чка", "ɛt͡ʃkɐ"},
{"буболе́чка", "ɛt͡ʃkɐ"},
-- Words rhyming in -ɤn
{"вън", "ɤn"},
{"звън", "ɤn"},
{"мрън", "ɤn"},
{"трън", "ɤn"},
{"сън", "ɤn"},
{"алтъ́н", "ɤn"},
{"сакъ́н", "ɤn"},
{"насъ́н", "ɤn"},
{"гръмотръ́н", "ɤn"},
-- Words rhyming in -un
{"хун", "un"},
{"басту́н", "un"},
{"Перу́н", "un"},
{"харпу́н", "un"},
{"шогу́н", "un"},
{"сапу́н", "un"},
{"саму́н", "un"},
{"Непту́н", "un"},
{"Камеру́н", "un"},
{"опеку́н", "un"},
-- Words rhyming in -urɐ
{"му́ра", "urɐ"},
{"су́ра", "urɐ"},
{"брошу́ра", "urɐ"},
{"култу́ра", "urɐ"},
{"фризу́ра", "urɐ"},
{"мату́ра", "urɐ"},
{"цезу́ра", "urɐ"},
{"агенту́ра", "urɐ"},
{"армату́ра", "urɐ"},
{"саламу́ра", "urɐ"},
{"архитекту́ра", "urɐ"},
{"аквакулту́ра", "urɐ"},
{"агрикулту́ра", "urɐ"},
-- Words rhyming in -va
{"два", "va"},
{"брава́", "va"},
{"трева́", "va"},
{"глава́", "va"},
{"това́", "va"},
{"едва́", "va"},
{"баклава́", "va"},
{"затова́", "va"},
{"тетива́", "va"},
-- Words rhyming in -a
{"боа́", "a"},
{"Беноа́", "a"},
{"аншоа́", "a"},
{"амплоа́", "a"},
{"Франсоа́", "a"},
{"буржоа́", "a"},
{"Делакроа́", "a"},
-- Words ending in the -та definite article stressed
{make_args{"света́", endschwa=1}, "tɤ"},
{make_args{"съвестта́", endschwa=1}, "tɤ"},
{make_args{"песента́", endschwa=1}, "tɤ"},
{make_args{"областта́", endschwa=1}, "tɤ"},
{make_args{"болестта́", endschwa=1}, "tɤ"},
{make_args{"мъдростта́", endschwa=1}, "tɤ"},
{make_args{"разсъдливостта́", endschwa=1}, "tɤ"},
-- Verbs ending in a stressed а/я
{make_args{"боля́", endschwa=1}, "lʲɤ"},
{make_args{"бедя́", endschwa=1}, "dʲɤ"},
{make_args{"бумтя́", endschwa=1}, "tʲɤ"},
{make_args{"вися́", endschwa=1}, "sʲɤ"},
{make_args{"бода́", endschwa=1}, "dɤ"},
{make_args{"веда́", endschwa=1}, "dɤ"},
{make_args{"възпроизведа́", endschwa=1}, "dɤ"},
{make_args{"зда", endschwa=1}, "dɤ"},
{make_args{"бера́", endschwa=1}, "rɤ"},
{make_args{"възпра́", endschwa=1}, "rɤ"},
{make_args{"вра", endschwa=1}, "rɤ"},
{make_args{"навра́", endschwa=1}, "rɤ"},
{make_args{"буя́", endschwa=1}, "jɤ"},
{make_args{"доя́", endschwa=1}, "jɤ"},
{make_args{"безпокоя́", endschwa=1}, "jɤ"},
{make_args{"греба́", endschwa=1}, "bɤ"},
{make_args{"измета́", endschwa=1}, "tɤ"},
{make_args{"лежа́", endschwa=1}, "ʒɤ"},
{make_args{"държа́", endschwa=1}, "ʒɤ"},
{make_args{"дължа́", endschwa=1}, "ʒɤ"},
{make_args{"кова́", endschwa=1}, "vɤ"},
-- Words ending in an affricate followed by a stressed vowel
{make_args{"дередже́"}, "dʒɛ"}, -- "d͡ʒ might be preferable, but this is the current IPA and it seems to be acceptable"
{make_args{"коскоджа́"}, "dʒa"},
{make_args{"хвърча́", endschwa=1}, "t͡ʃɤ"},
{make_args{"хълца́", endschwa=1}, "t͡sɤ"}, -- fake word for illustration
}
self:iterate(list, "check_output_rhymes")
end
return tests
pr8zva8fsaklmq688jnra5ky261xyl3
234881
234880
2026-05-24T09:40:42Z
Lee
19
[[:en:Module:bg-pronunciation/testcases]] වෙතින් එක් සංශෝධනයක්
234880
Scribunto
text/plain
local tests = require("Module:UnitTests")
local m_pron = require("Module:bg-pronunciation")
local rhymes_module = "Module:rhymes"
local Bulgarian = require("Module:languages").getByCode("bg")
local Cyrillic = require("Module:scripts").getByCode("Cyrl")
-- Build a full link to `term`, using the module-level Bulgarian language and Cyrillic script objects.
local function link(term)
	local link_data = { term = term, lang = Bulgarian, sc = Cyrillic }
	return require("Module:links").full_link(link_data)
end
-- Wrap an IPA transcription in a <span class="IPA"> element for display.
local function tag_IPA(IPA)
	local open_tag, close_tag = '<span class="IPA">', '</span>'
	return open_tag .. IPA .. close_tag
end
-- Return the argument unchanged; used as a no-op display function.
local function identity(value)
	return value
end
local display_hyphenation = identity
local display_syllabification = identity
-- Display a rhyme by passing {"bg", ipa} to `show_row` of the rhymes module.
local function display_rhymes(ipa)
	local row_args = {"bg", ipa}
	return require(rhymes_module).show_row(row_args)
end
-- Compare m_pron.toIPA(term, endschwa) with `expected`.
-- The row label is a link to the term with pronunciation notations removed;
-- the respelling and the endschwa flag are appended when they apply.
function tests:check_output_ipa(term, expected, endschwa)
	local normalized_term = m_pron.remove_pron_notations(term)

	local label = link(normalized_term)
	if term ~= normalized_term then
		label = label .. " (respelled " .. term .. ")"
	end
	if endschwa then
		label = label .. ", endschwa=true"
	end

	local actual = m_pron.toIPA(term, endschwa)
	tests:equals(label, actual, expected, { display = tag_IPA })
end
-- Compare m_pron.hyphenate_total(term) with `expected`, where every "." in
-- `expected` is first replaced by the hyphenation point "‧".
function tests:check_output_hyphenation(term, expected)
	local label = link(term)
	local actual = m_pron.hyphenate_total(term)
	-- Assigning to a single local keeps only the substituted string and drops
	-- gsub's replacement count.
	local expected_with_points = mw.ustring.gsub(expected, "[.]", "‧")
	tests:equals(label, actual, expected_with_points, { display = display_hyphenation })
end
-- Compare m_pron.syllabify(term) with `expected`, where every "." in
-- `expected` is first replaced by the hyphenation point "‧".
function tests:check_output_syllabification(term, expected)
	local label = link(term)
	local actual = m_pron.syllabify(term)
	-- Assigning to a single local keeps only the substituted string and drops
	-- gsub's replacement count.
	local expected_with_points = mw.ustring.gsub(expected, "[.]", "‧")
	tests:equals(label, actual, expected_with_points, { display = display_syllabification })
end
-- Compare the rhyme derived from m_pron.toIPA(term) with `expected`.
-- `term` is either a plain string or a table with an `args` field (as built by
-- make_args in test_rhymes); in the latter case args[1] is used for the label.
function tests:check_output_rhymes(term, expected)
	local headword = term
	if type(term) == "table" then
		headword = term.args[1] or term
	end
	-- Remove the combining dot below from the label; the outer parentheses
	-- drop gsub's replacement count.
	local label = link((headword:gsub("̣", "")))
	local actual = m_pron.get_rhymes(m_pron.toIPA(term))
	tests:equals(label, actual, expected, { display = display_rhymes })
end
-- IPA test rows: { input, expected IPA [, endschwa] }.
-- The rows are handed to self:iterate together with the name of the checker
-- method, check_output_ipa.
function tests:test_ipa()
	--[[
	Additions take this form –
		{ "word with acutes", "IPA" },
		{ "", "" },
	Make sure to include the comma, or the module will return an error.
	]]
	local cases = {
		{ "къ́ща", "ˈkɤʃtɐ" },
		{ "сгъстя́ се", "zɡɐˈstʲɤ̟ sɛ", true },
		{ "сгъстя̣́ се", "zɡɐˈstʲɤ̟ sɛ"},
		{ "а̀бдики́ращ", "ˌabdiˈkirɐʃt" },
		{ "безшу́мен", "bɛʃˈʃu̟mɛn" },
		{ "щастли́в", "ʃtɐˈslif" },
		{ "народността́", "nɐrodnoˈsta" },
		{ "я", "ja̟" },
		{ "юг", "ju̟k" },
		{ "яйце́", "jɐjˈt͡sɛ" },
		{ "изя́м", "iˈzʲa̟m"}, -- not morphological, but seemingly necessary to avoid a palatalization-initial syllable.
		{ "учи́лище", "oˈt͡ʃiliʃtɛ" },
		{ "чорбаджи́я", "t͡ʃo̟rbɐˈdʒijɐ" },
		{ "уби́йца", "oˈbijt͡sɐ" },
		{ "безбра́чие", "bɛzˈbrat͡ʃiɛ" },
		{ "из.мра́", "izˈmra" },
		{ "сала́та", "sɐˈɫatɐ" },
		{ "шега́", "ʃɛˈɡa" },
		{ "жена́", "ʒɛˈna" },
		{ "инти́мен", "inˈtimɛn" },
		{ "посо́лство", "poˈsɔɫstvo" },
		{ "ъ́гъл", "ˈɤɡɐɫ"},
		{ "усу́квам", "oˈsukvɐm"},
		{ "ле́ща", "ˈlɛʃtɐ" },
		{ "липа́", "liˈpa" },
		{ "океа́н", "okɛˈan" },
		{ "меки́ца", "mɛˈkit͡sɐ" },
		{ "ла́гер", "ˈɫaɡɛr" },
		{ "маги́я", "mɐˈɡijɐ" },
		{ "хем", "xɛm" },
		{ "химн", "ximn"},
		{ "тулу́п", "toˈɫup"},
		{ "жа̀р-пти́ца", "ˌʒa̟r-pˈtit͡sɐ" },
		{ "в о́фис", "f ˈɔfis" },
		{ "във Фра́нция", "vɐf ˈfrant͡sijɐ" },
		{ "ня́колко", "ˈnʲa̟koɫko" },
		{ "в Япо́ния", "f jɐˈpɔnijɐ" },
		{ "автоплу́г", "ɐftoˈpɫuk" }, --ʊ in previous module
		{ "ўе́бса́йт", "ˈwɛpˈsajt" },
		{ "ўе́лски", "ˈwɛɫski" },
		{ "ўе́стърн", "ˈwɛstɐrn" },
		{ "О́ўен", "ˈɔwɛn" },
		{ "но́ўхаў", "ˈnɔwxɐw" },
		{ "Джо́ўзеф", "ˈdʒɔwzɛf" },
		{ "бо́ўлинг", "ˈbɔwliŋk" },
		{ "даўнло́ўд", "dɐwnˈɫɔwt" },
		{ "ўи́ски", "ˈwiski" },
		{ "ўи́кенд", "ˈwikɛnt" },
		{ "Ўо́рўик", "ˈwɔrwik" },
		{ "Хе́лоўин", "ˈxɛɫowin" },
	}
	self:iterate(cases, "check_output_ipa")
end
-- Hyphenation test rows: { input, expected hyphenation }.
-- Breaks in the expected value are written with "."; check_output_hyphenation
-- converts them to the hyphenation point "‧" before comparing.
-- Each input appears only once in the list.
function tests:test_hyphenation()
	local list = {
		{ "височина́", "ви.со.чи.на" },
		{ "сестра́", "сес.тра" },
		{ "пле́нник", "плен.ник" },
		{ "преодоле́я", "пре.одо.лея" },
		{ "маои́зъм", "мао.изъм" },
		{ "ма́йка", "май.ка" },
		{ "а́йс.берг", "айс.берг" },
		{ "майо́р", "ма.йор" },
		{ "фризьо́р", "фри.зьор" },
		{ "суджу́к", "су.джук" },
		{ "над.живе́я", "над.жи.вея" },
		{ "поту́ри", "по.ту.ри"},
		{ "слани́на", "сла.ни.на"},
		{ "пра́жа", "пра.жа"},
		{ "спринцо́вка", "сприн.цов.ка"},
		{ "пъ́ржа", "пър.жа"},
		{ "я́ркост", "яр.кост"},
		{ "рало", "ра.ло"},
		{ "бели́ло", "бе.ли.ло"},
		{ "шеви́ца", "ше.ви.ца"},
		{ "дои́ло", "до.ило"},
		{ "нача́ло", "на.ча.ло"},
		{ "хи́трост", "хит.рост"},
		{ "хи́тър", "хи.тър"},
		{ "вдлъ́бна", "вдлъб.на"},
		{ "разма́хам", "раз.ма.хам"},
		{ "у́кор", "укор"},
		{ "упори́т", "упо.рит"},
		{ "о́сем", "осем"},
		{ "оце́нка", "оцен.ка"},
		{ "ле́я", "лея"},
		{ "а́з", "аз"}, -- test out accenting monosyllables just for extra rigor
		{ "тя́", "тя"},
		{ "е́", "е"},
		{ "ме́н", "мен"},
		{ "стра́ст", "страст"},
		{ "пръст", "пръст"},
		{ "шофьо́р", "шо.фьор" },
		{ "фотьо́йл", "фо.тьойл" },
		{ "бельо́", "бе.льо" },
		{ "шедьо́вър", "ше.дьо.вър" },
		{ "ме́ниджър", "ме.ни.джър" },
		{ "джудже́", "джу.дже" },
		{ "жа́р-пти́ца", "жар-пти.ца"},
		{ "мора́лно-нра́вствен", "мо.рал.но-нрав.ствен" },
		{ "кандида́т-студе́нт", "кан.ди.дат-сту.дент" },
		{ "мини́стър-председа́тел", "ми.нис.тър-пред.се.да.тел" },
		{ "член-кореспонде́нт", "член-ко.рес.пон.дент" },
		-- The last break below is already written as "‧"; the "." → "‧"
		-- substitution in check_output_hyphenation leaves it untouched.
		{ "би́знес администра́ция", "биз.нес ад.ми.нис.тра‧ция" },
		{ "е́кшън геро́й", "ек.шън ге.рой" },
		{ "те́нис ко́рт", "те.нис корт" },
		{ "заме́стник мини́стър-председа́тел", "за.мес.тник ми.нис.тър-пред.се.да.тел" },
		{ "заме́стник нача́лник-управле́ние", "за.мес.тник на.чал.ник-уп.рав.ле.ние" },
		{ "SIM ка́рта", "SIM кар.та" },
		{ "VIP зо́на", "VIP зо.на" },
	}
	--[[
	Additions take this form –
		{ "word (with no accent required)", "expected hyphenation" },
		{ "", "" },
	Make sure to include the comma, or the module will return an error.
	]]
	self:iterate(list, "check_output_hyphenation")
end
-- Syllabification test rows, grouped by the phenomenon they exercise.
-- Breaks in the expected value are written with "."; check_output_syllabification
-- converts them to the hyphenation point "‧" before comparing.
-- Each input appears only once in the list.
function tests:test_syllabification()
	-- Left side of elements: input to the function, which may include dots (.) for manual syllable division
	-- Right side of elements: expected output, with syllable breaks indicated with a dot
	local list = {
		-- 1. Single-letter words
		{ "а", "а" },
		{ "в", "в" },
		{ "е", "е" },
		{ "и", "и" },
		{ "ѝ", "ѝ" },
		{ "о", "о" },
		{ "с", "с" },
		{ "у", "у" },
		-- 2. Simple monosyllabic words
		{ "аз", "аз" },
		{ "ти", "ти" },
		{ "той", "той" },
		{ "тя", "тя" },
		{ "във", "във" },
		{ "със", "със" },
		-- 3. More complex monosyllabic words
		{ "принц", "принц" },
		{ "спринт", "спринт" },
		{ "глист", "глист" },
		{ "скункс", "скункс" },
		-- 4. Single consonant between two vowels: 3-letter words
		{ "ами́", "а.ми" },
		{ "ала́", "а.ла" },
		{ "ако́", "а.ко" },
		{ "уви́", "у.ви" },
		{ "или́", "и.ли" },
		-- 5. Single consonant between two vowels: stops and fricatives
		{ "саламу́ра", "са.ла.му.ра" },
		{ "бараба́н", "ба.ра.бан" },
		{ "сполу́ка", "спо.лу.ка" },
		{ "ща́вя", "ща.вя" },
		{ "стри́на", "стри.на" },
		{ "кога́то", "ко.га.то" },
		{ "изя́м", "и.зям" },
		-- 6. Single consonant between two vowels: щ, and single-letter affricates
		{ "стари́цата", "ста.ри.ца.та" },
		{ "полу́чените", "по.лу.че.ни.те" },
		{ "подоба́ващите", "по.до.ба.ва.щи.те" },
		{ "обуча́ващите", "о.бу.ча.ва.щи.те" },
		-- 7. Single consonant between two vowels: дж
		{ "джудже́", "джу.дже" },
		{ "суджу́к", "су.джук" },
		{ "дамаджа́на", "да.ма.джа.на" },
		{ "джа́джите", "джа.джи.те" },
		-- 8. Single consonant between two vowels: й
		{ "койо́т", "ко.йот" },
		{ "майоне́за", "ма.йо.не.за" },
		{ "пейорати́вен", "пе.йо.ра.ти.вен" },
		{ "майо́р", "ма.йор" },
		-- 9. Single consonant between two vowels: morphological prefixes get split
		{ "бези́менен", "бе.зи.ме.нен" },
		{ "изопача́вам", "и.зо.па.ча.вам" },
		{ "оти́вам", "о.ти.вам" },
		{ "разора́н", "ра.зо.ран" },
		-- 10. Single consonant between two vowels: palatalized by ь
		{ "бульо́н", "бу.льон" },
		{ "фризьо́р", "фри.зьор" },
		{ "шедьо́вър", "ше.дьо.вър" },
		{ "гьозу́м", "гьо.зум" },
		{ "ликьо́р", "ли.кьор" },
		-- 11. Zero consonants between two vowels: at most one elsewhere in word
		{ "воа́л", "во.ал" },
		{ "маои́зъм", "ма.о.и.зъм" },
		{ "фее́рия", "фе.е.ри.я" },
		{ "воайо́р", "во.а.йор" },
		{ "миока́рд", "ми.о.кард" },
		{ "кьо́поолу", "кьо.по.о.лу" },
		{ "аятола́х", "а.я.то.лах" },
		{ "ава́рия", "а.ва.ри.я" },
		{ "пози́ции", "по.зи.ци.и" },
		{ "хазя́и", "ха.зя.и" },
		{ "дерибе́и", "де.ри.бе.и" },
		{ "преодоле́я", "пре.о.до.ле.я" },
		-- 12. Two or more consonants between two vowels: щр
		{ "нащре́к", "на.щрек" },
		{ "поощря́вам", "по.о.щря.вам" },
		{ "защрихо́вам", "за.щри.хо.вам" },
		{ "поощри́телен", "по.о.щри.те.лен" },
		{ "изщра́кване", "из.щрак.ва.не" },
		{ "Ва́йерщра̀с", "Ва.йер.щрас" },
		{ "Кьо́нигщра̀се", "Кьо.ниг.щра.се" },
		-- 13. Two or more consonants between two vowels: щ + other sonorant before vowel
		{ "о́бщност", "общ.ност" },
		{ "всъ́щност", "всъщ.ност" },
		{ "помо́щник", "по.мощ.ник" },
		{ "чорапога́щник", "чо.ра.по.гащ.ник" },
		{ "но́щница", "нощ.ни.ца" },
		{ "чудо́вищност", "чу.до.вищ.ност" },
		{ "немощливо", "не.мощ.ли.во" }, -- correct stress?
		{ "съобща́вам", "съ.об.ща.вам" },
		{ "въобще́", "въ.об.ще" },
		-- 14. Two or more consonants between two vowels: дж affricate present
		{ "ма́нджа", "ман.джа" },
		{ "калайджи́я", "ка.лай.джи.я" },
		{ "авджи́я", "ав.джи.я" },
		{ "изджва́ка", "из.джва.ка" },
		-- 15. Two or more consonants between two vowels: adjacent sonorants or stops
		{ "пле́нник", "плен.ник" },
		{ "ма́йка", "май.ка" },
		{ "про̀фаши́стки", "про.фа.шист.ки" },
		{ "гле́дка", "глед.ка" },
		{ "кра́чка", "крач.ка" },
		{ "це́дка", "цед.ка" },
		-- 16a. Two consonants between two vowels: other
		{ "звезда́", "звез.да" },
		{ "спринцо́вка", "сприн.цов.ка" },
		{ "бъ́рзо", "бър.зо" },
		{ "ма́лко", "мал.ко" },
		{ "по́сле", "по.сле" },
		{ "па́ртия", "пар.ти.я" },
		{ "гла́нцов", "глан.цов" },
		{ "пе́пелник", "пе.пел.ник" },
		{ "пи́лци", "пил.ци" },
		{ "аншоа́", "ан.шо.а" },
		{ "ядро́", "я.дро" },
		-- 16b. As above, testing clusters чн, цм, цн, чм
		{ "ирони́чност", "и.ро.нич.ност"},
		{ "профилакти́чна", "про.фи.лак.тич.на"},
		{ "бо́цна", "боц.на"},
		{ "спе́цна", "спец.на"},
		{ "бичме́", "бич.ме"},
		{ "кръ́чма", "кръч.ма"},
		{ "бо́цман", "боц.ман"},
		{ "сачма́", "сач.ма"},
		{ "Ри́чмънд", "Рич.мънд"},
		{ "ми́чман", "мич.ман"},
		{ "разче́ша", "раз.че.ша"},
		{ "пе́цма", "пец.ма"}, -- Probably not a real word
		-- 17. Complex consonant clusters: general
		{ "сестра́", "се.стра" },
		{ "ца́рство", "цар.ство" },
		{ "нра́вствен", "нрав.ствен" },
		{ "ма́ндраджия", "ман.дра.джи.я" },
		{ "мизансце́н", "ми.зан.сцен" },
		{ "стра́нство", "стран.ство" },
		{ "простра́нство", "про.стран.ство" },
		{ "ро́бство", "роб.ство" },
		{ "транспо́рт", "тран.спорт" },
		-- 18. Consonant cluster not split: св
		{ "посви́кна", "по.свик.на" },
		-- 19. Forced syllable breaks: when absent
		{ "скръ́ндза", "скрън.дза" },
		{ "годзи́ла", "год.зи.ла" },
		{ "камика́дзе", "ка.ми.кад.зе" },
		{ "надживе́я", "на.джи.ве.я" },
		-- 20. Forced syllable breaks: when present
		{ "скръ́н.дза", "скрън.дза" },
		{ "го.дзи́ла", "го.дзи.ла" },
		{ "камика́.дзе", "ка.ми.ка.дзе" },
		{ "над.живе́я", "над.жи.ве.я" },
		-- 21. Morphological prefix handling: без- + equal sonority
		{ "безси́лен", "без.си.лен" },
		{ "безшу́мен", "без.шу.мен" },
		{ "безвъзвра́тен", "без.въз.вра.тен" },
		{ "безхабе́рен", "без.ха.бе.рен" },
		{ "безстра́шен", "без.стра.шен" },
		{ "безхле́бна", "без.хле.бна" },
		{ "безвре́мие", "без.вре.ми.е" },
		-- 22. Morphological prefix handling: без- + higher sonority
		{ "безме́рен", "без.ме.рен" },
		{ "безли́чен", "без.ли.чен" },
		{ "безнака́зан", "без.на.ка.зан" },
		{ "безразбо́рен", "без.раз.бо.рен" },
		{ "безде́тен", "без.де.тен" },
		{ "безпардо́нен", "без.пар.до.нен" },
		{ "безтеле́сен", "без.те.ле.сен" },
		{ "безгла́в", "без.глав" },
		{ "безче́стен", "без.че.стен" },
		{ "безпризо́рен", "без.при.зо.рен" },
		{ "безгре́шен", "без.гре.шен" },
		{ "безкра́ен", "без.кра.ен" },
		{ "безбре́жен", "без.бре.жен" },
		{ "бе́здна", "безд.на" },
		-- 23. Morphological prefix handling: из- + equal sonority
		{ "изхвъ́рлям", "из.хвър.лям" },
		{ "изсте́на", "из.сте.на" },
		{ "и́звор", "из.вор" },
		{ "изво́звам", "из.воз.вам" },
		{ "извла́ча", "из.вла.ча" },
		{ "изхра́чване", "из.храч.ва.не" },
		{ "изшму́гна", "из.шмуг.на" },
		{ "изживя́ното", "из.жи.вя.но.то" },
		-- 24. Morphological prefix handling: из- + higher sonority
		{ "изнена́да", "из.не.на.да" },
		{ "излъ́гах", "из.лъ.гах" },
		{ "измя́на", "из.мя.на" },
		{ "и́зрод", "из.род" },
		{ "изтрезви́телно", "из.трез.ви.тел.но" },
		{ "изпростя́вял", "из.про.стя.вял" },
		{ "изклю́чвам", "из.ключ.вам" },
		{ "избли́за", "из.бли.за" },
		-- 25. Morphological prefix handling: над- + equal/lower sonority
		{ "надсло́в", "над.слов" },
		{ "надхвъ́рлен", "над.хвър.лен" },
		{ "надви́квам", "над.вик.вам" },
		{ "надве́", "над.ве" },
		{ "надгро́бен", "над.гро.бен" },
		{ "на́дпис", "над.пис" },
		{ "надценя́вам", "над.це.ня.вам" },
		{ "надделе́я", "над.де.ле.я" },
		-- 26. Morphological prefix handling: над- + higher sonority
		{ "над.ра́ствам", "над.ра.ствам" },
		{ "надмо́щие", "над.мо.щи.е" },
		{ "ненадми́нат", "не.над.ми.нат" },
		{ "безнадзо́рен", "без.над.зо.рен" },
		{ "на́дница", "над.ни.ца" },
		{ "надме́нност", "над.мен.ност" },
		{ "на.длъ́ж", "на.длъж" },
		{ "надробе́н", "на.дро.бен" },
		{ "надръ́нкам", "на.дрън.кам" },
		{ "надра́скам", "на.дра.скам" },
		{ "надру́сам", "на.дру.сам" },
		{ "надра́н", "на.дран" },
		-- 27. Morphological prefix handling: под- + equal/lower sonority
		{ "подстрека́тел", "под.стре.ка.тел" },
		{ "подхо́д", "под.ход" },
		{ "подви́жен", "под.ви.жен" },
		{ "подзагла́вие", "под.за.гла.ви.е" },
		{ "подкла́ждам", "под.клаж.дам" },
		{ "подбо́р", "под.бор" },
		{ "подпи́рам", "под.пи.рам" },
		{ "подценя́вам", "под.це.ня.вам" },
		-- 28. Morphological prefix handling: под- + higher sonority
		{ "подновя́вам", "под.но.вя.вам" },
		{ "подма́мвам", "под.мам.вам" },
		{ "по́длост", "под.лост" },
		{ "под.разделе́ние", "под.раз.де.ле.ни.е" },
		{ "подро́бен", "по.дро.бен" },
		{ "подража́вам", "по.дра.жа.вам" },
		{ "подре́мя", "по.дре.мя" },
		{ "подру́сам", "по.дру.сам" },
		-- 29. Multiple prefixes
		{ "безизра́зен", "бе.зиз.ра.зен" },
		{ "безизра́зност", "бе.зиз.ра.зност" },
		{ "безвъзме́зден", "без.въз.мез.ден" },
		{ "безвъзду́шен", "без.въз.ду.шен" },
		{ "безразли́чен", "без.раз.ли.чен" },
		{ "безразбо́рност", "без.раз.бор.ност" },
		{ "безпредме́тен", "без.пред.ме.тен" },
		{ "поизпра́вя", "по.из.пра.вя" },
		{ "поизмъ́ча", "по.из.мъ.ча" },
		{ "поизгла́дя", "по.из.гла.дя" },
		{ "произноше́ние", "про.из.но.ше.ни.е" },
		{ "произти́ча", "про.из.ти.ча" },
		{ "наизми́слил", "на.из.ми.слил" },
		{ "наизле́злите", "на.из.ле.зли.те" },
		{ "предразположе́ние", "пред.раз.по.ло.же.ни.е" },
		{ "преразгле́ждане", "пре.раз.глеж.да.не" },
		{ "преразпределе́ние", "пре.раз.пре.де.ле.ни.е" },
		{ "прера́зказ", "пре.раз.каз" },
		{ "превъзмо́гна", "пре.въз.мог.на" },
		{ "превъзпита́ние", "пре.въз.пи.та.ни.е" },
		{ "преизда́вам", "пре.из.да.вам" },
		{ "преизби́рам", "пре.из.би.рам" },
		{ "невъзмо́жен", "не.въз.мо.жен" },
		{ "невъзпи́тан", "не.въз.пи.тан" },
		{ "неизбе́жен", "не.из.бе.жен" },
		{ "неизме́нност", "не.из.мен.ност" },
		{ "неразде́лен", "не.раз.де.лен" },
		{ "неразположе́ние", "не.раз.по.ло.же.ни.е" },
		{ "поразми́сля", "по.раз.ми.сля" },
		{ "пораздру́сам", "по.раз.дру.сам" },
		{ "наразка́зах", "на.раз.ка.зах" },
		{ "наразлепи́л", "на.раз.ле.пил" },
		{ "неотло́жен", "не.от.ло.жен" },
		{ "неотмени́м", "не.от.ме.ним" },
		{ "поотло́жа", "по.от.ло.жа" },
		{ "поотми́на", "по.от.ми.на" },
		-- 30. Loanwords with /w/ as a consonant: default spelling with 'у'
		{ "уе́лски", "у.ел.ски" },
		{ "уе́бсайт", "у.еб.сайт" },
		{ "уе́стърн", "у.е.стърн" },
		{ "О́уен", "О.у.ен" },
		{ "но́уха̀у", "но.у.ха.у" },
		{ "Джо́узеф", "Джо.у.зеф" },
		{ "бо́улинг", "бо.у.линг" },
		{ "да̀унло́уд", "да.ун.ло.уд" },
		{ "уи́ски", "у.и.ски" },
		{ "уи́кенд", "у.и.кенд" },
		{ "Уо́руик", "У.о.ру.ик" },
		{ "Хе́лоуин", "Хе.ло.у.ин" },
		-- 31. Loanwords with /w/ as a consonant: alternative spelling with 'ў'
		{ "ўе́лски", "уел.ски" },
		{ "ўе́бсайт", "уеб.сайт" },
		{ "ўе́стърн", "уе.стърн" },
		{ "О́ўен", "О.уен" },
		{ "но́ўха̀ў", "ноу.хау" },
		{ "Джо́ўзеф", "Джоу.зеф" },
		{ "бо́ўлинг", "боу.линг" },
		{ "да̀ўн.ло́ўд", "даун.лоуд" },
		{ "ўи́ски", "уи.ски" },
		{ "ўи́кенд", "уи.кенд" },
		{ "Ўо́рўик", "Уор.уик" },
		{ "Хе́лоўин", "Хе.ло.уин" },
		{ "ўи́нд.сърфинг", "уинд.сър.финг" },
		-- 32. Multiple-word terms with hyphens or spaces
		{ "ра́зни хо́ра-ра́зни вку́сове", "раз.ни хо.ра-раз.ни вку.со.ве", },
		{ "акуше́р-гинеколо́г", "а.ку.шер-ги.не.ко.лог" },
		{ "на́й-напре́д", "най-на.пред" },
		{ "ампер-ча́с", "ам.пер-час" },
		{ "га́-га́", "га-га" }, -- no-op
		{ "пи́-пи́", "пи-пи" },
		{ "Гвине́я-Биса́у", "Гви.не.я-Би.са.у" },
		{ "ша́м-фъстъ́к", "шам-фъ.стък" },
		{ "вълна́-уби́ец", "въл.на-у.би.ец" },
		{ "по́-добре́ къ́сно, отко́лкото ни́кога", "по-до.бре къ.сно, от.кол.ко.то ни.ко.га" },
		{ "зени́тно-раке́тен", "зе.нит.но-ра.ке.тен" },
		{ "го́ре-до́лу", "го.ре-до.лу" },
		{ "на́й-по́сле", "най-по.сле" },
		{ "чик-чири́к", "чик-чи.рик" },
		{ "сре́ден ро́д", "сре.ден род" },
		{ "божа́ кра́вичка", "бо.жа кра.вич.ка" },
		{ "Съедине́ни америка́нски ща́ти", "Съ.е.ди.не.ни а.ме.ри.кан.ски ща.ти" },
		{ "от мла́дих до ста́рих", "от мла.дих до ста.рих" },
		{ "со кро́тце, со бла́го и со ма́лко кюте́к", "со крот.це, со бла.го и со мал.ко кю.тек" },
	}
	--[[
	Additions take this form –
		{ "word (with no accent required)", "expected syllabification" },
		{ "", "" },
	Make sure to include the comma, or the module will return an error.
	]]
	self:iterate(list, "check_output_syllabification")
end
-- Rhyme test rows: { input, expected rhyme }.
-- The input is either a plain string or, when extra named parameters such as
-- endschwa are needed, a table wrapped by make_args.
function tests:test_rhymes()
	-- Wrap a parameter table in an `args` field, the shape that
	-- check_output_rhymes reads when the input is a table.
	local function make_args(params)
		return { args = params }
	end

	local cases = {
		-- Words rhyming in -am
		{"грам", "am"},
		{"прям", "am"},
		{"сам", "am"},
		{"едва́м", "am"},
		{"хипопота́м", "am"},
		-- Words rhyming in -it͡ʃɛn
		{"ли́чен", "it͡ʃɛn"},
		{"графи́чен", "it͡ʃɛn"},
		{"психи́чен", "it͡ʃɛn"},
		{"ритми́чен", "it͡ʃɛn"},
		{"цини́чен", "it͡ʃɛn"},
		{"части́чен", "it͡ʃɛn"},
		{"себи́чен", "it͡ʃɛn"},
		{"категори́чен", "it͡ʃɛn"},
		{"мелоди́чен", "it͡ʃɛn"},
		{"микроскопи́чен", "it͡ʃɛn"},
		{"етимологи́чен", "it͡ʃɛn"},
		{"епидемиологи́чен", "it͡ʃɛn"},
		-- Words rhyming in -ɔf
		{"зов", "ɔf"},
		{"нов", "ɔf"},
		{"оф", "ɔf"},
		{"карто́ф", "ɔf"},
		{"пищо́в", "ɔf"},
		{"Цветко́в", "ɔf"},
		{"Попо́в", "ɔf"},
		{"Свищо́в", "ɔf"},
		{"надсло́в", "ɔf"},
		{"апостро́ф", "ɔf"},
		{"полугото́в", "ɔf"},
		-- Words rhyming in -ɛnɐ
		{"вселе́на", "ɛnɐ"},
		{"Еле́на", "ɛnɐ"},
		-- Words rhyming in -ɛtɐ
		{"ге́та", "ɛtɐ"},
		{"че́та", "ɛtɐ"},
		{"баре́та", "ɛtɐ"},
		{"касе́та", "ɛtɐ"},
		{"соле́та", "ɛtɐ"},
		{"раке́та", "ɛtɐ"},
		{"каре́та", "ɛtɐ"},
		-- Words rhyming in -ɛt͡ʃkɐ
		{"кле́чка", "ɛt͡ʃkɐ"},
		{"пе́чка", "ɛt͡ʃkɐ"},
		{"апте́чка", "ɛt͡ʃkɐ"},
		{"пресе́чка", "ɛt͡ʃkɐ"},
		{"юрде́чка", "ɛt͡ʃkɐ"},
		{"буболе́чка", "ɛt͡ʃkɐ"},
		-- Words rhyming in -ɤn
		{"вън", "ɤn"},
		{"звън", "ɤn"},
		{"мрън", "ɤn"},
		{"трън", "ɤn"},
		{"сън", "ɤn"},
		{"алтъ́н", "ɤn"},
		{"сакъ́н", "ɤn"},
		{"насъ́н", "ɤn"},
		{"гръмотръ́н", "ɤn"},
		-- Words rhyming in -un
		{"хун", "un"},
		{"басту́н", "un"},
		{"Перу́н", "un"},
		{"харпу́н", "un"},
		{"шогу́н", "un"},
		{"сапу́н", "un"},
		{"саму́н", "un"},
		{"Непту́н", "un"},
		{"Камеру́н", "un"},
		{"опеку́н", "un"},
		-- Words rhyming in -urɐ
		{"му́ра", "urɐ"},
		{"су́ра", "urɐ"},
		{"брошу́ра", "urɐ"},
		{"култу́ра", "urɐ"},
		{"фризу́ра", "urɐ"},
		{"мату́ра", "urɐ"},
		{"цезу́ра", "urɐ"},
		{"агенту́ра", "urɐ"},
		{"армату́ра", "urɐ"},
		{"саламу́ра", "urɐ"},
		{"архитекту́ра", "urɐ"},
		{"аквакулту́ра", "urɐ"},
		{"агрикулту́ра", "urɐ"},
		-- Words rhyming in -va
		{"два", "va"},
		{"брава́", "va"},
		{"трева́", "va"},
		{"глава́", "va"},
		{"това́", "va"},
		{"едва́", "va"},
		{"баклава́", "va"},
		{"затова́", "va"},
		{"тетива́", "va"},
		-- Words rhyming in -a
		{"боа́", "a"},
		{"Беноа́", "a"},
		{"аншоа́", "a"},
		{"амплоа́", "a"},
		{"Франсоа́", "a"},
		{"буржоа́", "a"},
		{"Делакроа́", "a"},
		-- Words ending in the -та definite article stressed
		{make_args{"света́", endschwa=1}, "tɤ"},
		{make_args{"съвестта́", endschwa=1}, "tɤ"},
		{make_args{"песента́", endschwa=1}, "tɤ"},
		{make_args{"областта́", endschwa=1}, "tɤ"},
		{make_args{"болестта́", endschwa=1}, "tɤ"},
		{make_args{"мъдростта́", endschwa=1}, "tɤ"},
		{make_args{"разсъдливостта́", endschwa=1}, "tɤ"},
		-- Verbs ending in a stressed а/я
		{make_args{"боля́", endschwa=1}, "lʲɤ"},
		{make_args{"бедя́", endschwa=1}, "dʲɤ"},
		{make_args{"бумтя́", endschwa=1}, "tʲɤ"},
		{make_args{"вися́", endschwa=1}, "sʲɤ"},
		{make_args{"бода́", endschwa=1}, "dɤ"},
		{make_args{"веда́", endschwa=1}, "dɤ"},
		{make_args{"възпроизведа́", endschwa=1}, "dɤ"},
		{make_args{"зда", endschwa=1}, "dɤ"},
		{make_args{"бера́", endschwa=1}, "rɤ"},
		{make_args{"възпра́", endschwa=1}, "rɤ"},
		{make_args{"вра", endschwa=1}, "rɤ"},
		{make_args{"навра́", endschwa=1}, "rɤ"},
		{make_args{"буя́", endschwa=1}, "jɤ"},
		{make_args{"доя́", endschwa=1}, "jɤ"},
		{make_args{"безпокоя́", endschwa=1}, "jɤ"},
		{make_args{"греба́", endschwa=1}, "bɤ"},
		{make_args{"измета́", endschwa=1}, "tɤ"},
		{make_args{"лежа́", endschwa=1}, "ʒɤ"},
		{make_args{"държа́", endschwa=1}, "ʒɤ"},
		{make_args{"дължа́", endschwa=1}, "ʒɤ"},
		{make_args{"кова́", endschwa=1}, "vɤ"},
		-- Words ending in an affricate followed by a stressed vowel
		{make_args{"дередже́"}, "dʒɛ"}, -- "d͡ʒ might be preferable, but this is the current IPA and it seems to be acceptable"
		{make_args{"коскоджа́"}, "dʒa"},
		{make_args{"хвърча́", endschwa=1}, "t͡ʃɤ"},
		{make_args{"хълца́", endschwa=1}, "t͡sɤ"}, -- fake word for illustration
	}
	self:iterate(cases, "check_output_rhymes")
end
return tests
pr8zva8fsaklmq688jnra5ky261xyl3
Module:bg-pronunciation/documentation
828
137955
234874
222994
2025-08-21T19:34:08Z
en>Kiril kovachev
0
Add sentence on bg-pr
234874
wikitext
text/x-wiki
This module automatically converts Bulgarian orthography to a phonetic transcription in the International Phonetic Alphabet. It also generates hyphenations and syllabifications. All parts of a pronunciation section — the above together with audio and rhymes — can be generated at once using the <code>show_all</code> entry point.
===Testcases===
{{#invoke:bg-pronunciation/testcases|run_tests}}
===References===
*{{cite-book<!--
-->|bg<!--
-->|last=Тилков<!--
-->|first=Димитър<!--
-->|last2=Бояджиев<!--
-->|first2=Тодор<!--
-->|last3=Георгиева<!--
-->|first3=Елена<!--
-->|last4=Пенчев<!--
-->|first4=Йордан<!--
-->|last5=Станков<!--
-->|first5=Валентин<!--
-->|title=Граматика на съвременния български книжовен език<!--
-->|location=Sofia<!--
-->|publisher=ABAGAR<!--
-->|edition=3rd<!--
-->|year=1998<!--
-->|volume=1<!--
-->}}
s9a14tw14mlkixjxknfygfaq5xfh17q
234875
234874
2026-05-24T09:39:56Z
Lee
19
[[:en:Module:bg-pronunciation/documentation]] වෙතින් එක් සංශෝධනයක්
234874
wikitext
text/x-wiki
This module automatically converts Bulgarian orthography to a phonetic transcription in the International Phonetic Alphabet. It also generates hyphenations and syllabifications. All parts of a pronunciation section — the above together with audio and rhymes — can be generated at once using the <code>show_all</code> entry point.
===Testcases===
{{#invoke:bg-pronunciation/testcases|run_tests}}
===References===
*{{cite-book<!--
-->|bg<!--
-->|last=Тилков<!--
-->|first=Димитър<!--
-->|last2=Бояджиев<!--
-->|first2=Тодор<!--
-->|last3=Георгиева<!--
-->|first3=Елена<!--
-->|last4=Пенчев<!--
-->|first4=Йордан<!--
-->|last5=Станков<!--
-->|first5=Валентин<!--
-->|title=Граматика на съвременния български книжовен език<!--
-->|location=Sofia<!--
-->|publisher=ABAGAR<!--
-->|edition=3rd<!--
-->|year=1998<!--
-->|volume=1<!--
-->}}
s9a14tw14mlkixjxknfygfaq5xfh17q
Module:labels/data/lang/nds
828
143721
234825
2026-02-16T01:06:10Z
en>Benwing2
0
add DLS region info
234825
Scribunto
text/plain
-- Label data for the language code "nds" (per this page's title).
-- Each entry maps a canonical label name to a table of properties (aliases,
-- display text, Wikipedia link, region/country descriptions, category flags and
-- parent label). The finished table is passed through
-- require("Module:labels").finalize_data before being returned.
local labels = {}
-- German Low German varieties
labels["Brazilian Pomeranian"] = {
aliases = {"Eastern Pomeranian in Brazil", "East Pomeranian in Brazil", "Pomeranian in Brazil", "Brazilian Eastern Pomeranian"},
region = "the Eastern Pomeranian dialect in <country>",
country = "Brazil",
regional_categories = true,
parent = "Eastern Pomeranian",
}
labels["East Frisian"] = { -- for East Frisian dialectal Low German, not Frisian language
aliases = {"East Frisian Low Saxon", "East Frisian Low German", "Oostfreesch"},
Wikipedia = "East Frisian Low Saxon",
region = "East Frisia",
country = "Germany",
regional_categories = true,
parent = "German Low German",
}
labels["Eastern Pomeranian"] = {
aliases = {"Eastern Pomeranian Low German", "East Pomeranian Low German", "Eastern Pomeranian LG", "East Pomeranian LG", "East Pomeranian"},
display = "Eastern Pomeranian",
region = "the historical region of {{w|Eastern Pomerania}} (currently in [[Poland]]), as well as [[Brazil]] and the [[United States]]",
country = "Germany,Poland,Brazil,the [[United States]]",
regional_categories = true,
parent = "Pomeranian",
}
-- Top-level German variety: parent = true rather than another label's name.
labels["German Low German"] = {
aliases = {"GLG"},
Wikipedia = {"Low German", "German Low German dialects"},
region = "<country>",
country = "Germany,Poland,Brazil,the [[United States]]",
plain_categories = true,
parent = true,
}
labels["Hamburg"] = {
aliases = {"Hamburgisch"},
display = "Hamburgisch",
Wikipedia = "Hamburgisch dialect",
regional_categories = true,
parent = "Northern",
}
labels["Holstein"] = {
aliases = {"Holsteinisch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Low Prussian"] = {
Wikipedia = "Low Prussian dialect",
region = "{{w|East Prussia}}, {{w|West Prussia}}, and [[Danzig]]",
plain_categories = true,
parent = "German Low German",
country = "Germany,Poland",
}
labels["Märkisch"] = {
-- NOTE(review): the Wikipedia target is "Brandenburgisch dialect", while the
-- region and parent below describe a Westphalian variety -- confirm the target.
Wikipedia = "Brandenburgisch dialect",
region = "märkisches Sauerland (former [[w:County of Mark|County of Mark]]), [[Germany]]",
regional_categories = true,
parent = "Westphalian",
}
labels["Mecklenburg"] = {
aliases = {"Mecklenburg Low German", "Mecklenburgisch Low German", "Mecklenburgisch", "Mecklenburgish"},
display = "Mecklenburgisch",
Wikipedia = "Mecklenburgisch dialect",
regional_categories = true,
parent = "German Low German",
country = "Germany",
}
labels["Münsterland"] = {
aliases = {"Münster", "Münsterländisch", "Mönsterlannsch"},
Wikipedia = true,
regional_categories = true,
parent = "Westphalian",
}
labels["Northern"] = {
regional_categories = true,
region = "the states of [[Lower Saxony]], [[Bremen]], [[Schleswig-Holstein]] and [[Hamburg]] in northern [[Germany]]",
parent = "German Low German",
country = "Germany",
}
labels["Oldenburg"] = {
aliases = {"Bremen", "Breemsch", "Ollnborg", "Oldenborgsch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Paderbornisch"] = {
regional_categories = true,
region = "the city of [[Paderborn]] in eastern [[North Rhine-Westphalia]], [[Germany]]",
parent = "Westphalian",
}
labels["Pomeranian"] = {
aliases = {"Pomeranian Low German", "Pomeranian LG"},
region = "Pomerania",
Wikipedia = true,
regional_categories = true,
parent = "German Low German",
country = "Germany,Poland",
}
labels["Schleswig"] = {
aliases = {"Schleswigsch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Vest Recklinghausen"] = {
aliases = {"Vest Recklinghusen"},
Wikipedia = true,
regional_categories = true,
parent = "Westphalian",
extinct = true,
}
labels["Western Pomeranian"] = {
aliases = {"Western Pomeranian Low German", "West Pomeranian Low German", "Western Pomeranian LG", "West Pomeranian LG", "West Pomeranian"},
region = "{{w|Western Pomerania}}",
regional_categories = true,
-- NOTE(review): "Pomeranian Low German" appears in this file only as an alias
-- of the "Pomeranian" label, and "Eastern Pomeranian" uses parent = "Pomeranian".
-- Confirm that parents may be given as aliases; otherwise use "Pomeranian".
parent = "Pomeranian Low German",
country = "Germany",
}
labels["Westphalian"] = {
aliases = {"Westphalia"},
Wikipedia = "Westphalian language",
region = "Westphalia",
plain_categories = true, -- FIXME, rename to 'Westphalian Low German' to distinguish from 'Westphalian German'
parent = "German Low German",
country = "Germany",
}
-- Dutch Low Saxon varieties
labels["Achterhoeks"] = {
aliases = {"Achterhooks", "Achterhoek"},
Wikipedia = true,
region = "the {{w|Achterhoek}} in Eastern [[Netherlands]]",
plain_categories = true,
parent = "Dutch Low Saxon",
}
labels["Drents"] = {
aliases = {"Drèents", "Drenthe"},
Wikipedia = true,
region = "Drenthe",
plain_categories = true,
parent = "Dutch Low Saxon",
}
-- Top-level Dutch variety: parent = true rather than another label's name.
labels["Dutch Low Saxon"] = {
aliases = {"DLS"},
Wikipedia = true,
region = "<country>",
country = "the [[Netherlands]]",
plain_categories = true,
parent = true,
}
labels["Gronings"] = {
aliases = {"Grunnegs", "Grönnegs", "Groningen"},
Wikipedia = true,
region = "Groningen",
plain_categories = true,
parent = "Dutch Low Saxon",
}
labels["Sallands"] = {
aliases = {"Sallaans", "Salland"},
Wikipedia = true,
region = "{{w|Salland}}",
plain_categories = true,
parent = "Dutch Low Saxon",
}
labels["Stellingwerfs"] = {
aliases = {"Stellingwarfs", "Stellingwerf"},
Wikipedia = true,
region = "{{w|Ooststellingwerf}} and {{w|Weststellingwerf}} in [[Friesland]]",
plain_categories = true,
parent = "Dutch Low Saxon",
}
labels["Twents"] = {
aliases = {"Tweants", "Twente"},
Wikipedia = true,
region = "{{w|Twente}}",
plain_categories = true,
parent = "Dutch Low Saxon",
}
labels["Urkers"] = {
Wikipedia = "Urkers dialect",
region = "the former island of [[Urk]], on the west coast of [[Flevoland]] in the [[Netherlands]]",
-- Unlike the other entries, plain_categories is a string here, not `true`.
plain_categories = "Urkers Low German",
parent = "Dutch Low Saxon",
}
labels["Veluws"] = {
aliases = {"Veluwe"},
Wikipedia = true,
region = "the [[Veluwe]]",
plain_categories = true,
parent = "Dutch Low Saxon",
}
return require("Module:labels").finalize_data(labels)
6yqtd1a3kaabh2vvzrufv6mrcq2n9ti
234826
234366
2026-05-24T08:06:50Z
Lee
19
[[:en:Module:labels/data/lang/nds]] වෙතින් එක් සංශෝධනයක්
234366
Scribunto
text/plain
local labels = {}
-- German Low German varieties
labels["Brazilian Pomeranian"] = {
aliases = {"Eastern Pomeranian in Brazil", "East Pomeranian in Brazil", "Pomeranian in Brazil", "Brazilian Eastern Pomeranian"},
region = "the Eastern Pomeranian dialect in <country>",
country = "Brazil",
regional_categories = true,
parent = "Eastern Pomeranian",
}
labels["East Frisian"] = { -- for East Frisian dialectal Low German, not Frisian language
aliases = {"East Frisian Low Saxon", "East Frisian Low German", "Oostfreesch"},
Wikipedia = "East Frisian Low Saxon",
region = "East Frisia",
country = "Germany",
regional_categories = true,
parent = "German Low German",
}
labels["Eastern Pomeranian"] = {
aliases = {"Eastern Pomeranian Low German", "East Pomeranian Low German", "Eastern Pomeranian LG", "East Pomeranian LG", "East Pomeranian"},
display = "Eastern Pomeranian",
region = "the historical region of {{w|Eastern Pomerania}} (currently in [[Poland]]), as well as [[Brazil]] and the [[United States]]",
country = "Germany,Poland,Brazil,the [[United States]]",
regional_categories = true,
parent = "Pomeranian",
}
labels["German Low German"] = {
aliases = {"GLG"},
Wikipedia = {"Low German", "German Low German dialects"},
region = "<country>",
country = "Germany,Poland,Brazil,the [[United States]]",
plain_categories = true,
parent = true,
}
labels["Hamburg"] = {
aliases = {"Hamburgisch"},
display = "Hamburgisch",
Wikipedia = "Hamburgisch dialect",
regional_categories = true,
parent = "Northern",
}
labels["Holstein"] = {
aliases = {"Holsteinisch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Low Prussian"] = {
Wikipedia = "Low Prussian dialect",
region = "{{w|East Prussia}}, {{w|West Prussia}}, and [[Danzig]]",
plain_categories = true,
parent = "German Low German",
country = "Germany,Poland",
}
labels["Märkisch"] = {
Wikipedia = "Brandenburgisch dialect",
region = "märkisches Sauerland (former [[w:County of Mark|County of Mark]]), [[Germany]]",
regional_categories = true,
parent = "Westphalian",
}
labels["Mecklenburg"] = {
aliases = {"Mecklenburg Low German", "Mecklenburgisch Low German", "Mecklenburgisch", "Mecklenburgish"},
display = "Mecklenburgisch",
Wikipedia = "Mecklenburgisch dialect",
regional_categories = true,
parent = "German Low German",
country = "Germany",
}
labels["Münsterland"] = {
aliases = {"Münster", "Münsterländisch", "Mönsterlannsch"},
Wikipedia = true,
regional_categories = true,
parent = "Westphalian",
}
labels["Northern"] = {
regional_categories = true,
region = "the states of [[Lower Saxony]], [[Bremen]], [[Schleswig-Holstein]] and [[Hamburg]] in northern [[Germany]]",
parent = "German Low German",
country = "Germany",
}
labels["Oldenburg"] = {
aliases = {"Bremen", "Breemsch", "Ollnborg", "Oldenborgsch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Paderbornisch"] = {
regional_categories = true,
region = "the city of [[Paderborn]] in eastern [[North Rhine-Westphalia]], [[Germany]]",
parent = "Westphalian",
}
labels["Pomeranian"] = {
aliases = {"Pomeranian Low German", "Pomeranian LG"},
region = "Pomerania",
Wikipedia = true,
regional_categories = true,
parent = "German Low German",
country = "Germany,Poland",
}
labels["Schleswig"] = {
aliases = {"Schleswigsch"},
Wikipedia = true,
regional_categories = true,
parent = "Northern",
}
labels["Vest Recklinghausen"] = {
aliases = {"Vest Recklinghusen"},
Wikipedia = true,
regional_categories = true,
parent = "Westphalian",
extinct = true,
}
labels["Western Pomeranian"] = {
aliases = {"Western Pomeranian Low German", "West Pomeranian Low German", "Western Pomeranian LG", "West Pomeranian LG", "West Pomeranian"},
region = "{{w|Western Pomerania}}",
regional_categories = true,
parent = "Pomeranian Low German",
country = "Germany",
}
-- Westphalian group; several lects above ("Münsterland", "Paderbornisch", "Vest Recklinghausen")
-- name it as their parent. Unlike most German varieties here it uses `plain_categories`.
labels["Westphalian"] = {
	aliases = {
		"Westphalia",
	},
	Wikipedia = "Westphalian language",
	region = "Westphalia",
	-- FIXME, rename to 'Westphalian Low German' to distinguish from 'Westphalian German'
	plain_categories = true,
	parent = "German Low German",
	country = "Germany",
}
-- Dutch Low Saxon varieties
-- Every lect below names "Dutch Low Saxon" as its parent and uses `plain_categories`.

labels["Achterhoeks"] = {
	aliases = {
		"Achterhooks",
		"Achterhoek",
	},
	Wikipedia = true,
	region = "the {{w|Achterhoek}} in Eastern [[Netherlands]]",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

labels["Drents"] = {
	aliases = {
		"Drèents",
		"Drenthe",
	},
	Wikipedia = true,
	region = "Drenthe",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

-- The group label itself: `parent = true` instead of naming another label, and the region is
-- given as the "<country>" placeholder alongside an explicit `country` value.
labels["Dutch Low Saxon"] = {
	aliases = {
		"DLS",
	},
	Wikipedia = true,
	region = "<country>",
	country = "the [[Netherlands]]",
	plain_categories = true,
	parent = true,
}

labels["Gronings"] = {
	aliases = {
		"Grunnegs",
		"Grönnegs",
		"Groningen",
	},
	Wikipedia = true,
	region = "Groningen",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

labels["Sallands"] = {
	aliases = {
		"Sallaans",
		"Salland",
	},
	Wikipedia = true,
	region = "{{w|Salland}}",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

labels["Stellingwerfs"] = {
	aliases = {
		"Stellingwarfs",
		"Stellingwerf",
	},
	Wikipedia = true,
	region = "{{w|Ooststellingwerf}} and {{w|Weststellingwerf}} in [[Friesland]]",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

labels["Twents"] = {
	aliases = {
		"Tweants",
		"Twente",
	},
	Wikipedia = true,
	region = "{{w|Twente}}",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

-- Here `plain_categories` is a string rather than `true`.
labels["Urkers"] = {
	Wikipedia = "Urkers dialect",
	region = "the former island of [[Urk]], on the west coast of [[Flevoland]] in the [[Netherlands]]",
	plain_categories = "Urkers Low German",
	parent = "Dutch Low Saxon",
}

labels["Veluws"] = {
	aliases = {
		"Veluwe",
	},
	Wikipedia = true,
	region = "the [[Veluwe]]",
	plain_categories = true,
	parent = "Dutch Low Saxon",
}

-- The module's return value is whatever Module:labels' finalize_data produces from `labels`.
local labels_module = require("Module:labels")
return labels_module.finalize_data(labels)
6yqtd1a3kaabh2vvzrufv6mrcq2n9ti
Module:category tree/lang/ine-bsl-pro
828
143899
234765
2026-04-23T09:55:16Z
en>Mellohi!
0
234765
Scribunto
text/plain
-- Hand-written category labels for this language; the stem-class labels are added further down.
local labels = {
	--------------------------------- Nouns/Pronouns/Numerals --------------------------------

	["consonant-stem nouns"] = {
		description = "{{{langname}}} consonant-stem nouns, deriving from Proto-Indo-European consonant-stem nouns.",
		additional = "These nouns are differentiated by the presence of a stem-final consonant.",
		breadcrumb = "consonant-stem",
		parents = {"nouns by inflection type"},
	},

	-- Umbrella category for the three accent-paradigm categories that follow.
	["nouns by accent paradigm"] = {
		description = "{{{langname}}} nouns categorized by accent position patterns across their paradigm.",
		breadcrumb = "by accent paradigm",
		parents = {"nouns by inflection type"},
	},

	["nouns with fixed accent"] = {
		description = "{{{langname}}} nouns with accent fixed on the first syllable throughout their declension.",
		parents = {"nouns by accent paradigm"},
	},

	["nouns with mobile accent"] = {
		description = "{{{langname}}} nouns with accent fixed on the last syllable in some forms of their declension, but not all forms.",
		parents = {"nouns by accent paradigm"},
	},

	["nouns with unspecified accent"] = {
		description = "{{{langname}}} nouns with accent without a specified accent pattern.",
		parents = {"nouns by accent paradigm"},
	},
}
--[=[
Noun declension specifications. The top-level key is the stem class, and the value is an object containing properties of
the stem class. If the stem class contains the word 'GENDER' in it, it expands into labels both for a parent category
that subsumes several genders (obtained by removing the word 'GENDER' and following whitespace) as well as
gender-specific children categories (obtained by replacing the word 'GENDER' with the genders specified in the
`possible_genders` field). The stem class can contain literal Latin-script text (e.g. suffixes), which will be
italicized in breadcrumbs and titles. The fields of the property object for a given stem class are as follows:
* `gender`: The description of the gender(s) of the stem class. If preceded by ~, the description is preceded by
"most commonly". This appears in the `additional` field of the label properties. It is not used in gender-specific
children categories; instead the gender of that category is used.
* `possible_genders`: The possible genders this class occurs in. If this is specified, the word 'GENDER' must occur in
the stem class, and gender-specific variants of the stem class (with GENDER replaced by the possible genders) are
handled along with a parent category subsuming all genders.
* `breadcrumb`: The breadcrumb for the category, appearing in the trail of breadcrumbs at the top of the page. If this
stem has gender-specific variants, the breadcrumb specified here is used only for the parent category, while the
gender-specific child categories use the gender as the breadcrumb. If not specified, it defaults to `sortkey`. If that
is also not specified, or if the breadcrumb has the value "+", the stem class (without the word 'GENDER') is used.
(Use "+" when a sortkey is specified but the stem class should be used as the breadcrumb.)
* `parent`: The parent category or categories. If specified, the actual category label is formed by appending the part
of speech (e.g. "nouns"). Defaults to "POS by inflection type" where POS is the part of speech. Note that
gender-specific child categories do not use this, but always have the gender-subsuming parent stem class category as
their parent.
* `sortkey`: The sort key used for sorting this category among its parent's children. Defaults to the stem class
(without the word 'GENDER'). Note that gender-specific child categories do not use this, but always use the gender
as the sort key.
]=]
-- Stem-class specifications for noun declensions, keyed by stem class. Keys containing the word
-- 'GENDER' also carry `possible_genders`; see the block comment above for the field meanings.
local noun_decls = {
	["GENDER <o>-stem"] = {
		gender = "masculine or neuter",
		possible_genders = {"masculine", "neuter"},
		-- The endings cited are Proto-Indo-European, so they are linked with the PIE code
		-- (ine-pro); the previous cel-pro (Proto-Celtic) code did not match the sentence.
		addl = "These nouns derive from Proto-Indo-European thematic nouns ending in {{m|ine-pro|*-os}} (masculine) and {{m|ine-pro|*-om}} " ..
			"(neuter).",
	},
	["<ā>-stem"] = {
		gender = "feminine",
	},
	["<ī>-stem"] = {
		gender = "feminine",
	},
	["GENDER <i>-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
	["GENDER <u>-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
	-- The next four classes are filed under the consonant-stem parent.
	["<r>-stem"] = {
		gender = "masculine or feminine",
		parent = "consonant-stem",
	},
	["neuter <s>-stem"] = {
		gender = "neuter",
		parent = "consonant-stem",
	},
	["GENDER <n>-stem"] = {
		gender = "masculine or neuter",
		possible_genders = {"masculine", "neuter"},
		parent = "consonant-stem",
	},
	["<ū>-stem"] = {
		gender = "masculine or feminine",
		parent = "consonant-stem",
	},
	-- No explicit `parent` here, so the documented default applies.
	["GENDER consonant-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
}
-- Hand the stem-class table to the shared category-tree helper. `labels` is passed in,
-- presumably so the helper can add the generated stem-class entries to it (confirm in
-- Module:category tree/utilities). No principal parts are specified for nouns.
local category_tree_utilities = require("Module:category tree/utilities")

category_tree_utilities.add_inflection_labels({
	labels = labels,
	pos = "noun",
	stem_classes = noun_decls,
	principal_parts = {},
})

-- Export the label table under the LABELS key.
return { LABELS = labels }
9tmqb20ziq9ha8tx4p46ti6ihjj0nnn
234766
234765
2026-05-24T02:17:22Z
Lee
19
[[:en:Module:category_tree/lang/ine-bsl-pro]] වෙතින් එක් සංශෝධනයක්
234765
Scribunto
text/plain
-- Hand-written category labels for this language; the stem-class labels are added further down.
local labels = {
	--------------------------------- Nouns/Pronouns/Numerals --------------------------------

	["consonant-stem nouns"] = {
		description = "{{{langname}}} consonant-stem nouns, deriving from Proto-Indo-European consonant-stem nouns.",
		additional = "These nouns are differentiated by the presence of a stem-final consonant.",
		breadcrumb = "consonant-stem",
		parents = {"nouns by inflection type"},
	},

	-- Umbrella category for the three accent-paradigm categories that follow.
	["nouns by accent paradigm"] = {
		description = "{{{langname}}} nouns categorized by accent position patterns across their paradigm.",
		breadcrumb = "by accent paradigm",
		parents = {"nouns by inflection type"},
	},

	["nouns with fixed accent"] = {
		description = "{{{langname}}} nouns with accent fixed on the first syllable throughout their declension.",
		parents = {"nouns by accent paradigm"},
	},

	["nouns with mobile accent"] = {
		description = "{{{langname}}} nouns with accent fixed on the last syllable in some forms of their declension, but not all forms.",
		parents = {"nouns by accent paradigm"},
	},

	["nouns with unspecified accent"] = {
		description = "{{{langname}}} nouns with accent without a specified accent pattern.",
		parents = {"nouns by accent paradigm"},
	},
}
--[=[
Noun declension specifications. The top-level key is the stem class, and the value is an object containing properties of
the stem class. If the stem class contains the word 'GENDER' in it, it expands into labels both for a parent category
that subsumes several genders (obtained by removing the word 'GENDER' and following whitespace) as well as
gender-specific children categories (obtained by replacing the word 'GENDER' with the genders specified in the
`possible_genders` field). The stem class can contain literal Latin-script text (e.g. suffixes), which will be
italicized in breadcrumbs and titles. The fields of the property object for a given stem class are as follows:
* `gender`: The description of the gender(s) of the stem class. If preceded by ~, the description is preceded by
"most commonly". This appears in the `additional` field of the label properties. It is not used in gender-specific
children categories; instead the gender of that category is used.
* `possible_genders`: The possible genders this class occurs in. If this is specified, the word 'GENDER' must occur in
the stem class, and gender-specific variants of the stem class (with GENDER replaced by the possible genders) are
handled along with a parent category subsuming all genders.
* `breadcrumb`: The breadcrumb for the category, appearing in the trail of breadcrumbs at the top of the page. If this
stem has gender-specific variants, the breadcrumb specified here is used only for the parent category, while the
gender-specific child categories use the gender as the breadcrumb. If not specified, it defaults to `sortkey`. If that
is also not specified, or if the breadcrumb has the value "+", the stem class (without the word 'GENDER') is used.
(Use "+" when a sortkey is specified but the stem class should be used as the breadcrumb.)
* `parent`: The parent category or categories. If specified, the actual category label is formed by appending the part
of speech (e.g. "nouns"). Defaults to "POS by inflection type" where POS is the part of speech. Note that
gender-specific child categories do not use this, but always have the gender-subsuming parent stem class category as
their parent.
* `sortkey`: The sort key used for sorting this category among its parent's children. Defaults to the stem class
(without the word 'GENDER'). Note that gender-specific child categories do not use this, but always use the gender
as the sort key.
]=]
-- Stem-class specifications for noun declensions, keyed by stem class. Keys containing the word
-- 'GENDER' also carry `possible_genders`; see the block comment above for the field meanings.
local noun_decls = {
	["GENDER <o>-stem"] = {
		gender = "masculine or neuter",
		possible_genders = {"masculine", "neuter"},
		-- The endings cited are Proto-Indo-European, so they are linked with the PIE code
		-- (ine-pro); the previous cel-pro (Proto-Celtic) code did not match the sentence.
		addl = "These nouns derive from Proto-Indo-European thematic nouns ending in {{m|ine-pro|*-os}} (masculine) and {{m|ine-pro|*-om}} " ..
			"(neuter).",
	},
	["<ā>-stem"] = {
		gender = "feminine",
	},
	["<ī>-stem"] = {
		gender = "feminine",
	},
	["GENDER <i>-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
	["GENDER <u>-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
	-- The next four classes are filed under the consonant-stem parent.
	["<r>-stem"] = {
		gender = "masculine or feminine",
		parent = "consonant-stem",
	},
	["neuter <s>-stem"] = {
		gender = "neuter",
		parent = "consonant-stem",
	},
	["GENDER <n>-stem"] = {
		gender = "masculine or neuter",
		possible_genders = {"masculine", "neuter"},
		parent = "consonant-stem",
	},
	["<ū>-stem"] = {
		gender = "masculine or feminine",
		parent = "consonant-stem",
	},
	-- No explicit `parent` here, so the documented default applies.
	["GENDER consonant-stem"] = {
		gender = "masculine, feminine or neuter",
		possible_genders = {"masculine or feminine", "neuter"},
	},
}
-- Hand the stem-class table to the shared category-tree helper. `labels` is passed in,
-- presumably so the helper can add the generated stem-class entries to it (confirm in
-- Module:category tree/utilities). No principal parts are specified for nouns.
local category_tree_utilities = require("Module:category tree/utilities")

category_tree_utilities.add_inflection_labels({
	labels = labels,
	pos = "noun",
	stem_classes = noun_decls,
	principal_parts = {},
})

-- Export the label table under the LABELS key.
return { LABELS = labels }
9tmqb20ziq9ha8tx4p46ti6ihjj0nnn
Module:category tree/lang/egy
828
143900
234767
2026-03-02T00:20:43Z
en>Fenakhay
0
Created page with "local labels = {} local lang = require("Module:languages").getByCode("egy") labels["terms with reconstructed IPA pronunciation"] = { description = "Egyptian terms with [[Appendix:Egyptian pronunciation|reconstructed]] pronunciation in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].", breadcrumb = "reconstructed IPA", parents = {"terms with IPA pronunciation"}, } labels["terms with reconstructed Old Egyptian IPA pronunciation"] = { descrip..."
234767
Scribunto
text/plain
-- Category labels for Egyptian terms with reconstructed IPA pronunciation.
-- The former `local lang = require("Module:languages").getByCode("egy")` was never read anywhere
-- in this module, so it has been dropped; it only made every load pull in Module:languages.
local labels = {}

-- Umbrella category; each stage-specific category below names it as its parent.
labels["terms with reconstructed IPA pronunciation"] = {
	description = "Egyptian terms with [[Appendix:Egyptian pronunciation|reconstructed]] pronunciation in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "reconstructed IPA",
	parents = {"terms with IPA pronunciation"},
}

-- Stage-specific categories, in chronological order of the stages their descriptions cite.
labels["terms with reconstructed Old Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Old Egyptian|Old Egyptian]] stage (c. 2500 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Old Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Middle Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Middle Egyptian language|Middle Egyptian]] stage (c. 1700 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Middle Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Amarna-period Late Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Late Egyptian language|Amarna-period Late Egyptian]] stage (c. 1350 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Amarna-period Late Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Late Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Late Egyptian language|Late Egyptian]] stage (c. 800 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Late Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}
-- Export the label table under the LABELS key.
return { LABELS = labels }
ehyky6uqex07d90hdyd6wa0ejll7o5n
234768
234767
2026-05-24T02:17:45Z
Lee
19
[[:en:Module:category_tree/lang/egy]] වෙතින් එක් සංශෝධනයක්
234767
Scribunto
text/plain
-- Category labels for Egyptian terms with reconstructed IPA pronunciation.
-- The former `local lang = require("Module:languages").getByCode("egy")` was never read anywhere
-- in this module, so it has been dropped; it only made every load pull in Module:languages.
local labels = {}

-- Umbrella category; each stage-specific category below names it as its parent.
labels["terms with reconstructed IPA pronunciation"] = {
	description = "Egyptian terms with [[Appendix:Egyptian pronunciation|reconstructed]] pronunciation in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "reconstructed IPA",
	parents = {"terms with IPA pronunciation"},
}

-- Stage-specific categories, in chronological order of the stages their descriptions cite.
labels["terms with reconstructed Old Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Old Egyptian|Old Egyptian]] stage (c. 2500 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Old Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Middle Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Middle Egyptian language|Middle Egyptian]] stage (c. 1700 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Middle Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Amarna-period Late Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Late Egyptian language|Amarna-period Late Egyptian]] stage (c. 1350 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Amarna-period Late Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}

labels["terms with reconstructed Late Egyptian IPA pronunciation"] = {
	description = "Egyptian terms with pronunciation in the [[w:Late Egyptian language|Late Egyptian]] stage (c. 800 BCE) in the [[w:International Phonetic Alphabet|International Phonetic Alphabet]].",
	breadcrumb = "Late Egyptian IPA",
	parents = {"terms with reconstructed IPA pronunciation"},
}
-- Export the label table under the LABELS key.
return { LABELS = labels }
ehyky6uqex07d90hdyd6wa0ejll7o5n
ප්රවර්ගය:යෙදුම්, Macedonian පරිවර්තන සහිත
14
143901
234770
2026-05-24T02:19:35Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:යෙදුම්, Macedonian පරිවර්තන සහිත]] සිට [[ප්රවර්ගය:යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234770
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත]]
2jex0btz3tsgotj236bg1h1mi8bgwv9
234771
234770
2026-05-24T02:19:44Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234771
wikitext
text/x-wiki
{{category redirect|යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත}}
2dvarf1449nktzh7xmnrm19cwawx3d0
ප්රවර්ගය:Terms with මැසඩෝනියානු translations
14
143902
234772
2026-05-24T02:19:54Z
Pinthura
2424
සේවා: මෘදු ප්රවර්ග යළියොමුවක් නිර්මාණය.
234772
wikitext
text/x-wiki
{{category redirect|යෙදුම්, මැසඩෝනියානු පරිවර්තන සහිත}}
2dvarf1449nktzh7xmnrm19cwawx3d0
ප්රවර්ගය:කලාපීය ප්රොටෝ-බටහිර ජර්මානු
14
143903
234773
2023-09-19T00:17:00Z
en>Benwing2
0
234773
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234774
234773
2026-05-24T07:44:44Z
Lee
19
[[:en:Category:Regional_Proto-West_Germanic]] වෙතින් එක් සංශෝධනයක්
234773
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234777
234774
2026-05-24T07:46:04Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Regional Proto-West Germanic]] සිට [[ප්රවර්ගය:කලාපීය ප්රොටෝ-බටහිර ජර්මානු]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234773
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234781
234777
2026-05-24T07:46:24Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234781
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Regional Proto-West Germanic]]
j80s5ftcg6evvwt204hyvdpc2rgly0z
ප්රවර්ගය:ප්රොටෝ-බටහිර ජර්මානු ප්රභේද
14
143904
234775
2023-09-24T06:14:39Z
en>WingerBot
0
Created page with "{{auto cat}}"
234775
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234776
234775
2026-05-24T07:45:13Z
Lee
19
[[:en:Category:Varieties_of_Proto-West_Germanic]] වෙතින් එක් සංශෝධනයක්
234775
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234779
234776
2026-05-24T07:46:14Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Proto-West Germanic]] සිට [[ප්රවර්ගය:ප්රොටෝ-බටහිර ජර්මානු ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234775
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234782
234779
2026-05-24T07:46:34Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234782
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Varieties of Proto-West Germanic]]
4kux0qpi3tpe7yfqhub775h5kbh6hri
ප්රවර්ගය:Regional Proto-West Germanic
14
143905
234778
2026-05-24T07:46:05Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Regional Proto-West Germanic]] සිට [[ප්රවර්ගය:කලාපීය ප්රොටෝ-බටහිර ජර්මානු]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234778
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:කලාපීය ප්රොටෝ-බටහිර ජර්මානු]]
mrci5lvvxgzowrg4dtttj0oxb2z6njq
234783
234778
2026-05-24T07:46:44Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234783
wikitext
text/x-wiki
{{category redirect|කලාපීය ප්රොටෝ-බටහිර ජර්මානු}}
0o4mg0zmxfmytvxqumvrky0lqttrly7
ප්රවර්ගය:Varieties of Proto-West Germanic
14
143906
234780
2026-05-24T07:46:15Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Proto-West Germanic]] සිට [[ප්රවර්ගය:ප්රොටෝ-බටහිර ජර්මානු ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234780
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:ප්රොටෝ-බටහිර ජර්මානු ප්රභේද]]
e4kl75inu3ugwjwyvug3icsxzdh87bv
234784
234780
2026-05-24T07:46:54Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234784
wikitext
text/x-wiki
{{category redirect|ප්රොටෝ-බටහිර ජර්මානු ප්රභේද}}
o3wkv3x6os293lp84xiewup3f8ci1d6
ප්රවර්ගය:කලාපීය Proto-West Germanic
14
143907
234785
2026-05-24T07:47:04Z
Pinthura
2424
සේවා: මෘදු ප්රවර්ග යළියොමුවක් නිර්මාණය.
234785
wikitext
text/x-wiki
{{category redirect|කලාපීය ප්රොටෝ-බටහිර ජර්මානු}}
0o4mg0zmxfmytvxqumvrky0lqttrly7
ප්රවර්ගය:Proto-West Germanic ප්රභේද
14
143908
234786
2026-05-24T07:47:14Z
Pinthura
2424
සේවා: මෘදු ප්රවර්ග යළියොමුවක් නිර්මාණය.
234786
wikitext
text/x-wiki
{{category redirect|ප්රොටෝ-බටහිර ජර්මානු ප්රභේද}}
o3wkv3x6os293lp84xiewup3f8ci1d6
ප්රවර්ගය:Regional ප්රොටෝ-බටහිර ජර්මානු
14
143909
234787
2026-05-24T07:47:24Z
Pinthura
2424
සේවා: මෘදු ප්රවර්ග යළියොමුවක් නිර්මාණය.
234787
wikitext
text/x-wiki
{{category redirect|කලාපීය ප්රොටෝ-බටහිර ජර්මානු}}
0o4mg0zmxfmytvxqumvrky0lqttrly7
ප්රවර්ගය:Varieties of ප්රොටෝ-බටහිර ජර්මානු
14
143910
234788
2026-05-24T07:47:34Z
Pinthura
2424
සේවා: මෘදු ප්රවර්ග යළියොමුවක් නිර්මාණය.
234788
wikitext
text/x-wiki
{{category redirect|ප්රොටෝ-බටහිර ජර්මානු ප්රභේද}}
o3wkv3x6os293lp84xiewup3f8ci1d6
ප්රවර්ගය:යෙදුම්, Classical Chinese පරිවර්තන සහිත
14
143911
234789
2026-02-11T05:24:44Z
en>WingerBot
0
WingerBot moved page [[Category:Terms with Literary Chinese translations]] to [[Category:Terms with Classical Chinese translations]] without leaving a redirect: Literary Chinese -> Classical Chinese in categories per [[Wiktionary:Language_treatment_requests#merge_"Literary_Chinese"_and_"Literary_Chinese"]]
234789
wikitext
text/x-wiki
{{auto cat}}
[[Category:Terms with Chinese translations]]
bzkn14qnyjhiywj9ezm45vgiu3yzttk
234790
234789
2026-05-24T07:52:18Z
Lee
19
[[:en:Category:Terms_with_Classical_Chinese_translations]] වෙතින් එක් සංශෝධනයක්
234789
wikitext
text/x-wiki
{{auto cat}}
[[Category:Terms with Chinese translations]]
bzkn14qnyjhiywj9ezm45vgiu3yzttk
234800
234790
2026-05-24T07:56:05Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Terms with Classical Chinese translations]] සිට [[ප්රවර්ගය:යෙදුම්, Classical Chinese පරිවර්තන සහිත]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234789
wikitext
text/x-wiki
{{auto cat}}
[[Category:Terms with Chinese translations]]
bzkn14qnyjhiywj9ezm45vgiu3yzttk
234810
234800
2026-05-24T07:56:55Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234810
wikitext
text/x-wiki
{{auto cat}}
[[Category:Terms with Chinese translations]]
[[en:Category:Terms with Classical Chinese translations]]
2wvwr92qpokd7orih0rtukwc9zx1xag
ප්රවර්ගය:Classical Chinese ප්රවේශ නඩත්තුව
14
143912
234791
2026-02-11T05:23:59Z
en>WingerBot
0
WingerBot moved page [[Category:Literary Chinese entry maintenance]] to [[Category:Classical Chinese entry maintenance]] without leaving a redirect: Literary Chinese -> Classical Chinese in categories per [[Wiktionary:Language_treatment_requests#merge_"Literary_Chinese"_and_"Literary_Chinese"]]
234791
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234792
234791
2026-05-24T07:52:30Z
Lee
19
[[:en:Category:Classical_Chinese_entry_maintenance]] වෙතින් එක් සංශෝධනයක්
234791
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234802
234792
2026-05-24T07:56:15Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Classical Chinese entry maintenance]] සිට [[ප්රවර්ගය:Classical Chinese ප්රවේශ නඩත්තුව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234791
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234811
234802
2026-05-24T07:57:05Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234811
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Classical Chinese entry maintenance]]
ss7r8sv87fq1ezeuraec100afutba79
ප්රවර්ගය:Classical Chinese භාෂාව
14
143913
234793
2026-02-11T05:24:00Z
en>WingerBot
0
WingerBot moved page [[Category:Literary Chinese language]] to [[Category:Classical Chinese language]] without leaving a redirect: Literary Chinese -> Classical Chinese in categories per [[Wiktionary:Language_treatment_requests#merge_"Literary_Chinese"_and_"Literary_Chinese"]]
234793
wikitext
text/x-wiki
{{auto cat|China|Japan}}
qi8t3qss0y9h8k5zidvehhbl94rq5kc
234794
234793
2026-05-24T07:52:50Z
Lee
19
[[:en:Category:Classical_Chinese_language]] වෙතින් එක් සංශෝධනයක්
234793
wikitext
text/x-wiki
{{auto cat|China|Japan}}
qi8t3qss0y9h8k5zidvehhbl94rq5kc
234804
234794
2026-05-24T07:56:25Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Classical Chinese language]] සිට [[ප්රවර්ගය:Classical Chinese භාෂාව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234793
wikitext
text/x-wiki
{{auto cat|China|Japan}}
qi8t3qss0y9h8k5zidvehhbl94rq5kc
234812
234804
2026-05-24T07:57:14Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234812
wikitext
text/x-wiki
{{auto cat|China|Japan}}
[[en:Category:Classical Chinese language]]
2n7lf2d2pgqplwxaxlp3owt8kiux3ou
ප්රවර්ගය:Terms with East Circassian translations
14
143914
234795
2026-05-24T07:55:03Z
Lee
19
නිර්මාණය
234795
wikitext
text/x-wiki
{{category redirect|යෙදුම්, East Circassian පරිවර්තන සහිත}}
fwedn0jslosihozxtomjthuvndh8kpr
ප්රවර්ගය:East Circassian ප්රවේශ නඩත්තුව
14
143915
234796
2026-02-15T02:47:33Z
en>WingerBot
0
WingerBot moved page [[Category:Kabardian entry maintenance]] to [[Category:East Circassian entry maintenance]] without leaving a redirect: Kabardian -> East Circassian per [[Wiktionary:Language_treatment_requests#Circassian_renames]] and [[Wiktionary:Beer_parlour/2026/February#preparing_to_rename_Adyghe_->_West_Circassian,_Kabardian_->_East_Circassian]]
234796
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234797
234796
2026-05-24T07:55:22Z
Lee
19
[[:en:Category:East_Circassian_entry_maintenance]] වෙතින් එක් සංශෝධනයක්
234796
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234806
234797
2026-05-24T07:56:35Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:East Circassian entry maintenance]] සිට [[ප්රවර්ගය:East Circassian ප්රවේශ නඩත්තුව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234796
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234813
234806
2026-05-24T07:57:25Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234813
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:East Circassian entry maintenance]]
1ohyw4gkjtcakkevararpwgq21ewp32
ප්රවර්ගය:East Circassian භාෂාව
14
143916
234798
2026-02-15T02:47:43Z
en>WingerBot
0
WingerBot moved page [[Category:Kabardian language]] to [[Category:East Circassian language]] without leaving a redirect: Kabardian -> East Circassian per [[Wiktionary:Language_treatment_requests#Circassian_renames]] and [[Wiktionary:Beer_parlour/2026/February#preparing_to_rename_Adyghe_->_West_Circassian,_Kabardian_->_East_Circassian]]
234798
wikitext
text/x-wiki
{{auto cat|Russia|Turkey|the Caucasus}}
mkdpn361n74nqkj8tby76vyx4ssit1d
234799
234798
2026-05-24T07:55:46Z
Lee
19
[[:en:Category:East_Circassian_language]] වෙතින් එක් සංශෝධනයක්
234798
wikitext
text/x-wiki
{{auto cat|Russia|Turkey|the Caucasus}}
mkdpn361n74nqkj8tby76vyx4ssit1d
234808
234799
2026-05-24T07:56:45Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:East Circassian language]] සිට [[ප්රවර්ගය:East Circassian භාෂාව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234798
wikitext
text/x-wiki
{{auto cat|Russia|Turkey|the Caucasus}}
mkdpn361n74nqkj8tby76vyx4ssit1d
234814
234808
2026-05-24T07:57:35Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234814
wikitext
text/x-wiki
{{auto cat|Russia|Turkey|the Caucasus}}
[[en:Category:East Circassian language]]
dtp0hemsvzvxa4x8hfmyom9mfjyat29
ප්රවර්ගය:Terms with Classical Chinese translations
14
143917
234801
2026-05-24T07:56:05Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Terms with Classical Chinese translations]] සිට [[ප්රවර්ගය:යෙදුම්, Classical Chinese පරිවර්තන සහිත]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234801
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:යෙදුම්, Classical Chinese පරිවර්තන සහිත]]
iv5k8269am7dh9dqm4v113mxg6r2yn0
234815
234801
2026-05-24T07:57:45Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234815
wikitext
text/x-wiki
{{category redirect|යෙදුම්, Classical Chinese පරිවර්තන සහිත}}
1aqqstm2q5e11yuge5xct0d7q68stcd
ප්රවර්ගය:Classical Chinese entry maintenance
14
143918
234803
2026-05-24T07:56:15Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Classical Chinese entry maintenance]] සිට [[ප්රවර්ගය:Classical Chinese ප්රවේශ නඩත්තුව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234803
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:Classical Chinese ප්රවේශ නඩත්තුව]]
36hnx0vhop679duugb26xm9muluu9ov
234816
234803
2026-05-24T07:57:55Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234816
wikitext
text/x-wiki
{{category redirect|Classical Chinese ප්රවේශ නඩත්තුව}}
r7jrfvzw4omab60shajizle43j2h0oa
ප්රවර්ගය:Classical Chinese language
14
143919
234805
2026-05-24T07:56:25Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Classical Chinese language]] සිට [[ප්රවර්ගය:Classical Chinese භාෂාව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234805
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:Classical Chinese භාෂාව]]
rkyh1jgtbuekix0klj6eyil2ve448ty
234817
234805
2026-05-24T07:58:05Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234817
wikitext
text/x-wiki
{{category redirect|Classical Chinese භාෂාව}}
2bosq82crs4prrhf4ld24b86ktl04gi
ප්රවර්ගය:East Circassian entry maintenance
14
143920
234807
2026-05-24T07:56:35Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:East Circassian entry maintenance]] සිට [[ප්රවර්ගය:East Circassian ප්රවේශ නඩත්තුව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234807
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:East Circassian ප්රවේශ නඩත්තුව]]
le8nt19ksb4nz0fj7zkqt1y2za3vlip
234818
234807
2026-05-24T07:58:15Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234818
wikitext
text/x-wiki
{{category redirect|East Circassian ප්රවේශ නඩත්තුව}}
agervhs494fx9wkley3aywvxrn82pa4
ප්රවර්ගය:East Circassian language
14
143921
234809
2026-05-24T07:56:45Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:East Circassian language]] සිට [[ප්රවර්ගය:East Circassian භාෂාව]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234809
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:East Circassian භාෂාව]]
mcf53u0c1e7s6philbvxfr09f56k41i
234819
234809
2026-05-24T07:58:25Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234819
wikitext
text/x-wiki
{{category redirect|East Circassian භාෂාව}}
4x45jjrgyyuxadwvvmkjndcjes0zhiz
ප්රවර්ගය:German Low German භාෂාව
14
143922
234823
2026-05-24T08:04:46Z
Lee
19
Lee විසින් [[ප්රවර්ගය:German Low German භාෂාව]] සිට [[ප්රවර්ගය:German Low German]] වෙත පිටුව ගෙන යන ලදී
234823
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:German Low German]]
1e1rlkzkugnfaxdymvff2akorcxuyjn
234824
234823
2026-05-24T08:06:16Z
Pinthura
2424
රොබෝ: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම
234824
wikitext
text/x-wiki
{{category redirect|German Low German}}
ffg204r6n0j3rzr58d6r2092wlysq5s
ප්රවර්ගය:Literary Chinese
14
143923
234839
2026-02-12T02:26:19Z
en>Benwing2
0
234839
wikitext
text/x-wiki
{{auto cat|lect=1|verb=written|prep=from|the 2nd century AD until the 20th century as a [[literary language]] that continued the Classical Chinese of the 5th century BC to the 2nd century AD|othercat=Old Chinese lemmas,Middle Chinese lemmas|noreg=1|type=extinct}}
hba1nrk18fvwvzsnz0yemv93fwq9ms3
234840
234839
2026-05-24T09:09:32Z
Lee
19
[[:en:Category:Literary_Chinese]] වෙතින් එක් සංශෝධනයක්
234839
wikitext
text/x-wiki
{{auto cat|lect=1|verb=written|prep=from|the 2nd century AD until the 20th century as a [[literary language]] that continued the Classical Chinese of the 5th century BC to the 2nd century AD|othercat=Old Chinese lemmas,Middle Chinese lemmas|noreg=1|type=extinct}}
hba1nrk18fvwvzsnz0yemv93fwq9ms3
ප්රවර්ගය:Classical Chinese ප්රභේද
14
143924
234841
2026-02-11T05:24:49Z
en>WingerBot
0
WingerBot moved page [[Category:Varieties of Literary Chinese]] to [[Category:Varieties of Classical Chinese]] without leaving a redirect: Literary Chinese -> Classical Chinese in categories per [[Wiktionary:Language_treatment_requests#merge_"Literary_Chinese"_and_"Literary_Chinese"]]
234841
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234842
234841
2026-05-24T09:10:03Z
Lee
19
[[:en:Category:Varieties_of_Classical_Chinese]] වෙතින් එක් සංශෝධනයක්
234841
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234843
234842
2026-05-24T09:10:35Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Classical Chinese]] සිට [[ප්රවර්ගය:Classical Chinese ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234841
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234845
234843
2026-05-24T09:10:45Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234845
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Varieties of Classical Chinese]]
t5i99gh9bdrw0w5esugwmi4u792pzax
ප්රවර්ගය:Varieties of Classical Chinese
14
143925
234844
2026-05-24T09:10:36Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Classical Chinese]] සිට [[ප්රවර්ගය:Classical Chinese ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234844
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:Classical Chinese ප්රභේද]]
d3o0ba8n1mhvv578u0pdleo7itib221
234846
234844
2026-05-24T09:10:55Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234846
wikitext
text/x-wiki
{{category redirect|Classical Chinese ප්රභේද}}
tvawgy940esvmb6k705cu0avmpof971
ප්රවර්ගය:කලාපීය Low German
14
143926
234847
2026-02-14T00:03:15Z
en>Benwing2
0
234847
wikitext
text/x-wiki
{{wp|Low German dialects,Dutch Low Saxon dialects}}
{{auto cat}}
og2j6n5266o4oj6rsz5a19cwjhl06lx
234848
234847
2026-05-24T09:12:33Z
Lee
19
[[:en:Category:Regional_Low_German]] වෙතින් එක් සංශෝධනයක්
234847
wikitext
text/x-wiki
{{wp|Low German dialects,Dutch Low Saxon dialects}}
{{auto cat}}
og2j6n5266o4oj6rsz5a19cwjhl06lx
234851
234848
2026-05-24T09:13:02Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Regional Low German]] සිට [[ප්රවර්ගය:කලාපීය Low German]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234847
wikitext
text/x-wiki
{{wp|Low German dialects,Dutch Low Saxon dialects}}
{{auto cat}}
og2j6n5266o4oj6rsz5a19cwjhl06lx
234855
234851
2026-05-24T09:13:22Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234855
wikitext
text/x-wiki
{{wp|Low German dialects,Dutch Low Saxon dialects}}
{{auto cat}}
[[en:Category:Regional Low German]]
qegom2f2fazrttxbdze0as06xp3hjct
234859
234855
2026-05-24T09:14:02Z
Pinthura
2424
සේවා: auto cat භාවිතය පරික්ෂාව
234859
wikitext
text/x-wiki
{{auto cat}}{{wp|Low German dialects,Dutch Low Saxon dialects}}
[[en:Category:Regional Low German]]
3v1l30sec32607uc7zdsbuk1vbb2hjj
ප්රවර්ගය:Low German ප්රභේද
14
143927
234849
2023-09-24T06:13:01Z
en>WingerBot
0
Created page with "{{auto cat}}"
234849
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234850
234849
2026-05-24T09:12:47Z
Lee
19
[[:en:Category:Varieties_of_Low_German]] වෙතින් එක් සංශෝධනයක්
234849
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234853
234850
2026-05-24T09:13:13Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Low German]] සිට [[ප්රවර්ගය:Low German ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234849
wikitext
text/x-wiki
{{auto cat}}
eomzlm5v4j7ond1phrju7cnue91g5qx
234856
234853
2026-05-24T09:13:33Z
Pinthura
2424
සේවා: ඉංග්රීසි ව්යාපෘතිය වෙත සබැඳියක් එක් කිරීම.
234856
wikitext
text/x-wiki
{{auto cat}}
[[en:Category:Varieties of Low German]]
l0uhfi6cf0amn1mfacmm4uvyare03s5
ප්රවර්ගය:Regional Low German
14
143928
234852
2026-05-24T09:13:03Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Regional Low German]] සිට [[ප්රවර්ගය:කලාපීය Low German]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234852
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:කලාපීය Low German]]
ekc34qvrnjfj4cw9bd2rp9qe6t4s679
234857
234852
2026-05-24T09:13:42Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234857
wikitext
text/x-wiki
{{category redirect|කලාපීය Low German}}
cryom19lxax7ce05al42zgd1vfrxcgj
ප්රවර්ගය:Varieties of Low German
14
143929
234854
2026-05-24T09:13:13Z
Pinthura
2424
Pinthura විසින් [[ප්රවර්ගය:Varieties of Low German]] සිට [[ප්රවර්ගය:Low German ප්රභේද]] වෙත පිටුව ගෙන යන ලදී: සේවා: නව ප්රවර්ග නාමය වෙත ගෙනයාම.
234854
wikitext
text/x-wiki
#යළියොමුව [[:ප්රවර්ගය:Low German ප්රභේද]]
b8fwpgurxzjakla9wox8y3atnuzp843
234858
234854
2026-05-24T09:13:52Z
Pinthura
2424
සේවා: යළියොමුව, මෘදු ප්රවර්ග යළියොමුවක් බවට හැරවීම.
234858
wikitext
text/x-wiki
{{category redirect|Low German ප්රභේද}}
sui0fs1hijmzproluy1tjij54pf60wy
Module:Syrc-stripdiacritics
828
143930
234860
2025-12-21T06:15:36Z
en>Benwing2
0
"entry name" as a concept is going away in favor of "strip diacritics" + logical-to-physical
234860
Scribunto
text/plain
local export = {}

local char = mw.ustring.char
local ugsub = mw.ustring.gsub

-- One character class covering every mark that gets removed:
--   U+0303 tilde, U+0304 macron, U+0307 dot above, U+0308 diaeresis,
--   U+0323 dot below, U+032E breve below, U+0330 tilde below,
--   U+0331 macron below, U+0711 superscript aleph, and the range
--   U+0730..U+074A (pthaha, zqapha, rbasa, zlama, hbasa, esasa, rwaha,
--   feminine dot, qushshaya).
local DIACRITICS = "["
	.. char(0x303, 0x304, 0x307, 0x308, 0x323, 0x32E, 0x330, 0x331, 0x711)
	.. char(0x730) .. "-" .. char(0x74A)
	.. "]"

-- Returns `text` with all of the marks above deleted.
-- `lang` and `sc` are accepted but not used by this module.
function export.stripDiacritics(text, lang, sc)
	-- Keep only the string result; gsub also returns a match count.
	local stripped = ugsub(text, DIACRITICS, "")
	return stripped
end

return export
jcojgzqvqt2iz9x51ey9emjp4vbm7b7
234861
234860
2026-05-24T09:31:09Z
Lee
19
[[:en:Module:Syrc-stripdiacritics]] වෙතින් එක් සංශෝධනයක්
234860
Scribunto
text/plain
local export = {}

local char = mw.ustring.char
local ugsub = mw.ustring.gsub

-- One character class covering every mark that gets removed:
--   U+0303 tilde, U+0304 macron, U+0307 dot above, U+0308 diaeresis,
--   U+0323 dot below, U+032E breve below, U+0330 tilde below,
--   U+0331 macron below, U+0711 superscript aleph, and the range
--   U+0730..U+074A (pthaha, zqapha, rbasa, zlama, hbasa, esasa, rwaha,
--   feminine dot, qushshaya).
local DIACRITICS = "["
	.. char(0x303, 0x304, 0x307, 0x308, 0x323, 0x32E, 0x330, 0x331, 0x711)
	.. char(0x730) .. "-" .. char(0x74A)
	.. "]"

-- Returns `text` with all of the marks above deleted.
-- `lang` and `sc` are accepted but not used by this module.
function export.stripDiacritics(text, lang, sc)
	-- Keep only the string result; gsub also returns a match count.
	local stripped = ugsub(text, DIACRITICS, "")
	return stripped
end

return export
jcojgzqvqt2iz9x51ey9emjp4vbm7b7
Module:Syrc-stripdiacritics/testcases/documentation
828
143931
234862
2025-12-21T06:17:51Z
en>Benwing2
0
"entry name" as a concept is going away in favor of "strip diacritics" + logical-to-physical
234862
wikitext
text/x-wiki
{{#invoke:Syrc-stripdiacritics/testcases|run_tests|differs_at=true}}
ks2w8fxjz2qqmt7j6iye5o8um2o82zc
234863
234862
2026-05-24T09:31:37Z
Lee
19
[[:en:Module:Syrc-stripdiacritics/testcases/documentation]] වෙතින් එක් සංශෝධනයක්
234862
wikitext
text/x-wiki
{{#invoke:Syrc-stripdiacritics/testcases|run_tests|differs_at=true}}
ks2w8fxjz2qqmt7j6iye5o8um2o82zc
Module:Syrc-stripdiacritics/testcases
828
143932
234864
2025-12-21T06:15:16Z
en>Benwing2
0
"entry name" as a concept is going away in favor of "strip diacritics" + logical-to-physical
234864
Scribunto
text/plain
local tests = require("Module:UnitTests")
local stripDiacritics = require("Module:Syrc-stripdiacritics").stripDiacritics
-- Wraps `text` in a bare <span> element. The result is what the test below
-- passes as the first argument of self:equals.
local function tag(text)
	local opening, closing = "<span>", "</span>"
	return opening .. text .. closing
end
-- Checks stripDiacritics against a fixed list of Syriac-script words.
function tests:test_stripDiacritics()
	-- Each entry is { input with diacritics, expected stripped output }.
	local cases = {
		-- common words
		{ "ܠܹܗ", "ܠܗ" },
		{ "ܡ̣ܢ", "ܡܢ" },
		{ "ܠܗܘܿܢ", "ܠܗܘܢ" },
		{ "ܒܸܬ", "ܒܬ" },
		{ "ܝܠܹܗ", "ܝܠܗ" },
		{ "ܣܵܒܵܒ", "ܣܒܒ" },
		{ "ܐܝܼܢܵܐ", "ܐܝܢܐ" },
		{ "ܠܹܐ", "ܠܐ" },
		{ "ܟܹܐ", "ܟܐ" },
		{ "ܠܝܼ", "ܠܝ" },
		{ "ܠܵܐ", "ܠܐ" },
		{ "ܓܵܘ", "ܓܘ" },
		{ "ܝܼܫܘܿܥ", "ܝܫܘܥ" },
		{ "ܗ̇ܘ", "ܗܘ" },
		{ "ܐܵܗܵܐ", "ܐܗܐ" },
		-- { "", "" },
		-- edge cases
		{ "ܐܲܩܠܵܐ", "ܐܩܠܐ" },
		{ "ܬܸܦ̮ܠܵܐ", "ܬܦܠܐ" },
		{ "ܓ̰ܵܘܹܓ̰", "ܓܘܓ" },
		{ "ܡܲܕܢ̱ܚܵܐ", "ܡܕܢܚܐ" },
		{ "ܡܲܩܕ̄ܫܵܐ", "ܡܩܕܫܐ" },
		{ "ܫ̃", "ܫ" },
	}

	-- Callback handed to self:iterate; presumably invoked once per entry
	-- with the entry's two strings (behaviour of Module:UnitTests, not
	-- visible here).
	local function check(self, input, expected)
		self:equals(tag(input), stripDiacritics(input), expected)
	end

	self:iterate(cases, check)
end

return tests
s01wdhmzcn734mx7vroc9fnqalrzie6
234865
234864
2026-05-24T09:31:43Z
Lee
19
[[:en:Module:Syrc-stripdiacritics/testcases]] වෙතින් එක් සංශෝධනයක්
234864
Scribunto
text/plain
local tests = require("Module:UnitTests")
local stripDiacritics = require("Module:Syrc-stripdiacritics").stripDiacritics
-- Wraps `text` in a bare <span> element. The result is what the test below
-- passes as the first argument of self:equals.
local function tag(text)
	local opening, closing = "<span>", "</span>"
	return opening .. text .. closing
end
-- Checks stripDiacritics against a fixed list of Syriac-script words.
function tests:test_stripDiacritics()
	-- Each entry is { input with diacritics, expected stripped output }.
	local cases = {
		-- common words
		{ "ܠܹܗ", "ܠܗ" },
		{ "ܡ̣ܢ", "ܡܢ" },
		{ "ܠܗܘܿܢ", "ܠܗܘܢ" },
		{ "ܒܸܬ", "ܒܬ" },
		{ "ܝܠܹܗ", "ܝܠܗ" },
		{ "ܣܵܒܵܒ", "ܣܒܒ" },
		{ "ܐܝܼܢܵܐ", "ܐܝܢܐ" },
		{ "ܠܹܐ", "ܠܐ" },
		{ "ܟܹܐ", "ܟܐ" },
		{ "ܠܝܼ", "ܠܝ" },
		{ "ܠܵܐ", "ܠܐ" },
		{ "ܓܵܘ", "ܓܘ" },
		{ "ܝܼܫܘܿܥ", "ܝܫܘܥ" },
		{ "ܗ̇ܘ", "ܗܘ" },
		{ "ܐܵܗܵܐ", "ܐܗܐ" },
		-- { "", "" },
		-- edge cases
		{ "ܐܲܩܠܵܐ", "ܐܩܠܐ" },
		{ "ܬܸܦ̮ܠܵܐ", "ܬܦܠܐ" },
		{ "ܓ̰ܵܘܹܓ̰", "ܓܘܓ" },
		{ "ܡܲܕܢ̱ܚܵܐ", "ܡܕܢܚܐ" },
		{ "ܡܲܩܕ̄ܫܵܐ", "ܡܩܕܫܐ" },
		{ "ܫ̃", "ܫ" },
	}

	-- Callback handed to self:iterate; presumably invoked once per entry
	-- with the entry's two strings (behaviour of Module:UnitTests, not
	-- visible here).
	local function check(self, input, expected)
		self:equals(tag(input), stripDiacritics(input), expected)
	end

	self:iterate(cases, check)
end

return tests
s01wdhmzcn734mx7vroc9fnqalrzie6
Module:Syrc-stripdiacritics/documentation
828
143933
234866
2025-12-21T05:39:02Z
en>Benwing2
0
Benwing2 moved page [[Module:Syrc-entryname/documentation]] to [[Module:Syrc-stripdiacritics/documentation]]: "entry name" as concept is going away, replaced by "strip diacritics" + logical-to-physical
234866
wikitext
text/x-wiki
{{strip diacritics module documentation}}
4ee7ih8ihukb9zn2x59k8le2phktzzx
234867
234866
2026-05-24T09:31:51Z
Lee
19
[[:en:Module:Syrc-stripdiacritics/documentation]] වෙතින් එක් සංශෝධනයක්
234866
wikitext
text/x-wiki
{{strip diacritics module documentation}}
4ee7ih8ihukb9zn2x59k8le2phktzzx
Module:sga-sortkey
828
143934
234868
2024-04-27T09:38:02Z
en>SurjectionBot
0
Protected "[[Module:sga-sortkey]]": (bot) automatically protect highly visible templates/modules (reference score: 1999+ >= 1000) ([Edit=Allow only autoconfirmed users] (indefinite) [Move=Allow only autoconfirmed users] (indefinite))
234868
Scribunto
text/plain
local export = {}

local ustring = mw.ustring

-- Character class of what is deleted from the decomposed text: the combining
-- acute accent (U+0301) and the hyphen (a trailing "-" in a set is literal).
local STRIP_CLASS = "[" .. ustring.char(0x0301) .. "-" .. "]"

-- Single-character substitutions, applied before the class above is stripped.
local substitutions = {
	["æ"] = "e",
}

-- Builds the sort key for `text`: decompose and lowercase, drop one leading
-- "h", apply the substitutions, delete acute accents and hyphens, then
-- recompose and uppercase. `lang` and `sc` are accepted but not used.
function export.makeSortKey(text, lang, sc)
	local key = ustring.lower(ustring.toNFD(text))
	key = ustring.gsub(key, "^h", "")
	key = ustring.gsub(key, ".", substitutions)
	-- Decompose again before stripping, as the original pipeline does.
	key = ustring.toNFD(key)
	key = ustring.gsub(key, STRIP_CLASS, "")
	return ustring.upper(ustring.toNFC(key))
end

return export
g8l1xcks9sd0qwhtd9kkgbbwzg9ahpf
234869
234868
2026-05-24T09:33:19Z
Lee
19
[[:en:Module:sga-sortkey]] වෙතින් එක් සංශෝධනයක්
234868
Scribunto
text/plain
local export = {}

local ustring = mw.ustring

-- Character class of what is deleted from the decomposed text: the combining
-- acute accent (U+0301) and the hyphen (a trailing "-" in a set is literal).
local STRIP_CLASS = "[" .. ustring.char(0x0301) .. "-" .. "]"

-- Single-character substitutions, applied before the class above is stripped.
local substitutions = {
	["æ"] = "e",
}

-- Builds the sort key for `text`: decompose and lowercase, drop one leading
-- "h", apply the substitutions, delete acute accents and hyphens, then
-- recompose and uppercase. `lang` and `sc` are accepted but not used.
function export.makeSortKey(text, lang, sc)
	local key = ustring.lower(ustring.toNFD(text))
	key = ustring.gsub(key, "^h", "")
	key = ustring.gsub(key, ".", substitutions)
	-- Decompose again before stripping, as the original pipeline does.
	key = ustring.toNFD(key)
	key = ustring.gsub(key, STRIP_CLASS, "")
	return ustring.upper(ustring.toNFC(key))
end

return export
g8l1xcks9sd0qwhtd9kkgbbwzg9ahpf
Module:sga-sortkey/documentation
828
143935
234870
2025-11-09T14:46:05Z
en>Santi2222
0
Created page with "{{sortkey module documentation}}"
234870
wikitext
text/x-wiki
{{sortkey module documentation}}
3pw08nb331a76oaibaa62cali7uojmw
234871
234870
2026-05-24T09:33:54Z
Lee
19
[[:en:Module:sga-sortkey/documentation]] වෙතින් එක් සංශෝධනයක්
234870
wikitext
text/x-wiki
{{sortkey module documentation}}
3pw08nb331a76oaibaa62cali7uojmw
Module:bg-pronunciation/speaker profiles
828
143936
234876
2026-02-16T00:32:47Z
en>Kiril kovachev
0
Allow viewing a list of each speaker profile's usages
234876
Scribunto
text/plain
local export = {}
-- Name of the module that renders audio; format_audio requires it only when
-- a file is actually going to be displayed.
local audio_module = "Module:audio"
-- Language object for Bulgarian ("bg"), passed as `lang` to the audio module.
local lang = require("Module:languages").getByCode("bg")
-- Registry of recognized audio speakers, keyed by a short profile code.
-- Fields of each profile:
--   user     - username of the speaker (linked as [[User:...]] by show_data)
--   prefix   - text that precedes the term in the speaker's audio filenames
--   suffix   - text that follows the term in the speaker's audio filenames
--   renderer - code name of a display function; the values used below all
--              match keys of export.audio_functions (the lookup itself is
--              presumably done by the calling module - not visible here)
--   comments - optional free-text note, listed by show_data when present
export.speaker_profiles = {
["KK"] = {
user = "Kiril kovachev",
prefix = "LL-Q7918 (bul)-Kiril kovachev-",
suffix = ".wav",
renderer = "dark-l"
},
["KK2"] = {
user = "Kiril kovachev",
prefix = "LL-Q7918 (bul)-Kiril kovachev-",
suffix = ".wav",
renderer = "standard",
comments = "This profile is for when I want to mark that I haven't used l-vocalization in a given audio like I usually do."
},
["PC"] = {
user = "SixtyShips",
prefix = "LL-Q7918 (bul)-SixtyShips-",
suffix = ".wav",
renderer = "standard"
},
["SP"] = {
user = "SixtyShips",
prefix = "LL-Q7918 (bul)-SixtyShips-",
suffix = ".wav",
renderer = "moesian",
comments = "This profile is used when I want to pronounce local dialect words, especially typical for Ruse dialect."
},
-- Add yourself here!
-- * Uncomment the code below starting from ["KK"]... (i.e., remove the dashes).
-- * Replace "KK" below with a short name to represent your profile.
-- * Change the "user =" property to your username.
-- * Change "prefix =" and "suffix =" to the beginning and ending of
--   your typical audio filenames; e.g., mine are usually
--   LL-Q7918 (bul)-Kiril kovachev-(page name).wav
--   ... so ".wav" is the suffix and "LL-Q7918 (bul)-Kiril kovachev-" is
--   the prefix. The audio's actual name will be inserted between these two
--   automatically.
-- * Change "renderer =" to the code name of one of the display functions
--   defined in export.audio_functions below: "plain", "standard", "dark-l"
--   or "moesian". Use "dark-l" if you have l-vocalization in your accent,
--   otherwise "standard" for Standard Bulgarian.
--   If you speak a variety that none of these covers, a new display
--   function should be added to represent it.
-- ["KK"] = {
-- user = "Kiril kovachev",
-- prefix = "LL-Q7918 (bul)-Kiril kovachev-",
-- suffix = ".wav",
-- renderer = "dark-l"
-- },
}
-- Renders the audio file named prefix .. name .. suffix, or returns nil when
-- that file cannot be shown.
--   prefix, suffix - filename parts taken from a speaker profile
--   name           - the term placed between them
--   accents        - list of accent labels handed to the audio module as `a`,
--                    or nil for no labels
-- Returns whatever Module:audio's format_audio returns, or nil if the title is
-- invalid or the file does not exist.
local function format_audio(prefix, suffix, name, accents)
	local filename = prefix .. name .. suffix
	-- mw.title.new returns nil for text that is not a valid title (for
	-- example a term containing "[" or "|"); indexing that nil would abort
	-- the whole invocation, so treat it the same as a missing file.
	local title = mw.title.new("Media:" .. filename)
	if not (title and title.exists) then
		return nil
	end
	return require(audio_module).format_audio({
		lang = lang,
		file = filename,
		a = accents
	})
end
-- Registry of display functions, keyed by internal code name. Every entry
-- has a human-readable `name` and `description` (both listed by show_data)
-- and a `display` function called as display(profile, term_override, extras)
-- that returns the result of format_audio for the profile's prefix/suffix.
local display_functions = {}

-- Audio with no accent labels.
display_functions["plain"] = {
	name = "Unlabelled audio",
	description = "This display function simply shows the audio, no extra features such as accent labels. Can be used if you don't care about displaying extra information to readers.",
	display = function(profile, term, _)
		return format_audio(profile.prefix, profile.suffix, term, nil)
	end,
}

-- Audio always labelled "Standard Bulgarian".
display_functions["standard"] = {
	name = "Standard accent",
	description = "This display function simply displays the given audio with the \"Standard Bulgarian\" label before it. This can be used to indicate that your speech is completely standard in all recordings.",
	display = function(profile, term, _)
		local labels = {"Standard Bulgarian"}
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

-- "Standard Bulgarian", plus "l-vocalization" when extras.ipa contains "ɫ".
display_functions["dark-l"] = {
	name = "Standard accent with L-vocalization",
	description = "This display function displays the given audio with the \"Standard Bulgarian\" label before it, but also detects whether the word (based on its IPA) ought to contain an instance of l-vocalization, as is common in younger Bulgarian speakers. Using this display method, the template will figure out whether this label is necessary or not per-entry, but will only display \"Standard Bulgarian\" by itself if it's not.",
	display = function(profile, term, extras)
		local transcription = extras.ipa
		local labels = {"Standard Bulgarian"}
		if mw.ustring.find(transcription, "ɫ") then
			labels[#labels + 1] = "l-vocalization"
		end
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

-- Audio always labelled "Moesian".
display_functions["moesian"] = {
	name = "Moesian dialects",
	description = "This display function will provide the label 'Moesian' alongside the audio.",
	display = function(profile, term, _)
		local labels = {"Moesian"}
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

export.audio_functions = display_functions
-- Returns the keys of `tbl` as an array in ascending order. pairs() visits
-- keys in an unspecified order, so listings built from it directly would
-- come out in arbitrary order.
local function sorted_keys(tbl)
	local keys = {}
	for key in pairs(tbl) do
		keys[#keys + 1] = key
	end
	table.sort(keys)
	return keys
end

-- Builds the wikitext overview of all speaker profiles and display functions
-- (used on the documentation page through {{#invoke:...|show_data}}).
--   frame - the invoking frame; only frame:preprocess is used
-- Returns the preprocessed wikitext. Both lists are sorted by key so that
-- the page renders in a stable, alphabetical order.
function export.show_data(frame)
	local lines = {"==Available speaker profiles=="}
	local function add(line)
		lines[#lines + 1] = line
	end

	for _, code in ipairs(sorted_keys(export.speaker_profiles)) do
		local profile = export.speaker_profiles[code]
		add("* Profile name: '''" .. code .. "'''")
		add("** User: [[User:" .. profile.user .. "|" .. profile.user .. "]]")
		add("** Prefix: <code>" .. profile.prefix .. "</code>")
		add("** Suffix: <code>" .. profile.suffix .. "</code>")
		add("** Display function: <code>" .. profile.renderer .. "</code>")
		add("** Entries: [[Special:WhatLinksHere/Wiktionary:Tracking/bg-pr/speaker-profile/" .. code .. "|list]]")
		-- `comments` is optional in a profile.
		if profile.comments then
			add("** Comments: " .. profile.comments)
		end
	end

	-- Blank line so the next heading starts a new block of wikitext.
	add("")
	add("==Available display functions==")
	for _, name in ipairs(sorted_keys(export.audio_functions)) do
		local displayer = export.audio_functions[name]
		add("* Display function name: '''" .. displayer.name .. "'''")
		add("** Internal code name: <code>" .. name .. "</code>")
		add("** Description: " .. displayer.description)
	end

	return frame:preprocess(table.concat(lines, "\n"))
end

return export
2434dr0mpr5lt05vg4w2p6ogyrsdf54
234877
234876
2026-05-24T09:40:13Z
Lee
19
[[:en:Module:bg-pronunciation/speaker_profiles]] වෙතින් එක් සංශෝධනයක්
234876
Scribunto
text/plain
local export = {}
-- Name of the module that renders audio; format_audio requires it only when
-- a file is actually going to be displayed.
local audio_module = "Module:audio"
-- Language object for Bulgarian ("bg"), passed as `lang` to the audio module.
local lang = require("Module:languages").getByCode("bg")
-- Registry of recognized audio speakers, keyed by a short profile code.
-- Fields of each profile:
--   user     - username of the speaker (linked as [[User:...]] by show_data)
--   prefix   - text that precedes the term in the speaker's audio filenames
--   suffix   - text that follows the term in the speaker's audio filenames
--   renderer - code name of a display function; the values used below all
--              match keys of export.audio_functions (the lookup itself is
--              presumably done by the calling module - not visible here)
--   comments - optional free-text note, listed by show_data when present
export.speaker_profiles = {
["KK"] = {
user = "Kiril kovachev",
prefix = "LL-Q7918 (bul)-Kiril kovachev-",
suffix = ".wav",
renderer = "dark-l"
},
["KK2"] = {
user = "Kiril kovachev",
prefix = "LL-Q7918 (bul)-Kiril kovachev-",
suffix = ".wav",
renderer = "standard",
comments = "This profile is for when I want to mark that I haven't used l-vocalization in a given audio like I usually do."
},
["PC"] = {
user = "SixtyShips",
prefix = "LL-Q7918 (bul)-SixtyShips-",
suffix = ".wav",
renderer = "standard"
},
["SP"] = {
user = "SixtyShips",
prefix = "LL-Q7918 (bul)-SixtyShips-",
suffix = ".wav",
renderer = "moesian",
comments = "This profile is used when I want to pronounce local dialect words, especially typical for Ruse dialect."
},
-- Add yourself here!
-- * Uncomment the code below starting from ["KK"]... (i.e., remove the dashes).
-- * Replace "KK" below with a short name to represent your profile.
-- * Change the "user =" property to your username.
-- * Change "prefix =" and "suffix =" to the beginning and ending of
--   your typical audio filenames; e.g., mine are usually
--   LL-Q7918 (bul)-Kiril kovachev-(page name).wav
--   ... so ".wav" is the suffix and "LL-Q7918 (bul)-Kiril kovachev-" is
--   the prefix. The audio's actual name will be inserted between these two
--   automatically.
-- * Change "renderer =" to the code name of one of the display functions
--   defined in export.audio_functions below: "plain", "standard", "dark-l"
--   or "moesian". Use "dark-l" if you have l-vocalization in your accent,
--   otherwise "standard" for Standard Bulgarian.
--   If you speak a variety that none of these covers, a new display
--   function should be added to represent it.
-- ["KK"] = {
-- user = "Kiril kovachev",
-- prefix = "LL-Q7918 (bul)-Kiril kovachev-",
-- suffix = ".wav",
-- renderer = "dark-l"
-- },
}
-- Renders the audio file named prefix .. name .. suffix, or returns nil when
-- that file cannot be shown.
--   prefix, suffix - filename parts taken from a speaker profile
--   name           - the term placed between them
--   accents        - list of accent labels handed to the audio module as `a`,
--                    or nil for no labels
-- Returns whatever Module:audio's format_audio returns, or nil if the title is
-- invalid or the file does not exist.
local function format_audio(prefix, suffix, name, accents)
	local filename = prefix .. name .. suffix
	-- mw.title.new returns nil for text that is not a valid title (for
	-- example a term containing "[" or "|"); indexing that nil would abort
	-- the whole invocation, so treat it the same as a missing file.
	local title = mw.title.new("Media:" .. filename)
	if not (title and title.exists) then
		return nil
	end
	return require(audio_module).format_audio({
		lang = lang,
		file = filename,
		a = accents
	})
end
-- Registry of display functions, keyed by internal code name. Every entry
-- has a human-readable `name` and `description` (both listed by show_data)
-- and a `display` function called as display(profile, term_override, extras)
-- that returns the result of format_audio for the profile's prefix/suffix.
local display_functions = {}

-- Audio with no accent labels.
display_functions["plain"] = {
	name = "Unlabelled audio",
	description = "This display function simply shows the audio, no extra features such as accent labels. Can be used if you don't care about displaying extra information to readers.",
	display = function(profile, term, _)
		return format_audio(profile.prefix, profile.suffix, term, nil)
	end,
}

-- Audio always labelled "Standard Bulgarian".
display_functions["standard"] = {
	name = "Standard accent",
	description = "This display function simply displays the given audio with the \"Standard Bulgarian\" label before it. This can be used to indicate that your speech is completely standard in all recordings.",
	display = function(profile, term, _)
		local labels = {"Standard Bulgarian"}
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

-- "Standard Bulgarian", plus "l-vocalization" when extras.ipa contains "ɫ".
display_functions["dark-l"] = {
	name = "Standard accent with L-vocalization",
	description = "This display function displays the given audio with the \"Standard Bulgarian\" label before it, but also detects whether the word (based on its IPA) ought to contain an instance of l-vocalization, as is common in younger Bulgarian speakers. Using this display method, the template will figure out whether this label is necessary or not per-entry, but will only display \"Standard Bulgarian\" by itself if it's not.",
	display = function(profile, term, extras)
		local transcription = extras.ipa
		local labels = {"Standard Bulgarian"}
		if mw.ustring.find(transcription, "ɫ") then
			labels[#labels + 1] = "l-vocalization"
		end
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

-- Audio always labelled "Moesian".
display_functions["moesian"] = {
	name = "Moesian dialects",
	description = "This display function will provide the label 'Moesian' alongside the audio.",
	display = function(profile, term, _)
		local labels = {"Moesian"}
		return format_audio(profile.prefix, profile.suffix, term, labels)
	end,
}

export.audio_functions = display_functions
-- Returns the keys of `tbl` as an array in ascending order. pairs() visits
-- keys in an unspecified order, so listings built from it directly would
-- come out in arbitrary order.
local function sorted_keys(tbl)
	local keys = {}
	for key in pairs(tbl) do
		keys[#keys + 1] = key
	end
	table.sort(keys)
	return keys
end

-- Builds the wikitext overview of all speaker profiles and display functions
-- (used on the documentation page through {{#invoke:...|show_data}}).
--   frame - the invoking frame; only frame:preprocess is used
-- Returns the preprocessed wikitext. Both lists are sorted by key so that
-- the page renders in a stable, alphabetical order.
function export.show_data(frame)
	local lines = {"==Available speaker profiles=="}
	local function add(line)
		lines[#lines + 1] = line
	end

	for _, code in ipairs(sorted_keys(export.speaker_profiles)) do
		local profile = export.speaker_profiles[code]
		add("* Profile name: '''" .. code .. "'''")
		add("** User: [[User:" .. profile.user .. "|" .. profile.user .. "]]")
		add("** Prefix: <code>" .. profile.prefix .. "</code>")
		add("** Suffix: <code>" .. profile.suffix .. "</code>")
		add("** Display function: <code>" .. profile.renderer .. "</code>")
		add("** Entries: [[Special:WhatLinksHere/Wiktionary:Tracking/bg-pr/speaker-profile/" .. code .. "|list]]")
		-- `comments` is optional in a profile.
		if profile.comments then
			add("** Comments: " .. profile.comments)
		end
	end

	-- Blank line so the next heading starts a new block of wikitext.
	add("")
	add("==Available display functions==")
	for _, name in ipairs(sorted_keys(export.audio_functions)) do
		local displayer = export.audio_functions[name]
		add("* Display function name: '''" .. displayer.name .. "'''")
		add("** Internal code name: <code>" .. name .. "</code>")
		add("** Description: " .. displayer.description)
	end

	return frame:preprocess(table.concat(lines, "\n"))
end

return export
2434dr0mpr5lt05vg4w2p6ogyrsdf54
Module:bg-pronunciation/speaker profiles/documentation
828
143937
234878
2025-08-20T14:35:36Z
en>Kiril kovachev
0
Create entry
234878
wikitext
text/x-wiki
This module contains the registry of "speakers" of audio used in the template {{template|bg-pr}}. This template allows users to specify audio by using a string such as "[UN]", where 'UN' is an abbreviation found inside this module that represents a particular user's way of recording audio.
This module allows you to specify the typical file name structure of the audio files you record, as well as the rules used to automatically render those details onto the page.
The details one has control over are:
* The prefix that a user's audio files typically have, e.g. "Bg-" for files like "Bg-крава.ogg";
* The suffix that a user's audio files typically have, e.g. ".ogg" for the same example above;
* The choice of how to render the information; see below for supported ways.
In order to add yourself to the module, you can create a new field in the "speaker_profiles" table, filling in the required details. Using speaker profiles works best if you always use a particular naming convention for your files, which is especially easy using [[lingualibre:|Lingua Libre]].
{{#invoke:bg-pronunciation/speaker profiles|show_data}}
kf6zz626xiepltdkyleo29jbfepsxna
234879
234878
2026-05-24T09:40:19Z
Lee
19
[[:en:Module:bg-pronunciation/speaker_profiles/documentation]] වෙතින් එක් සංශෝධනයක්
234878
wikitext
text/x-wiki
This module contains the registry of "speakers" of audio used in the template {{template|bg-pr}}. This template allows users to specify audio by using a string such as "[UN]", where 'UN' is an abbreviation found inside this module that represents a particular user's way of recording audio.
This module allows you to specify the typical file name structure of the audio files you record, as well as the rules used to automatically render those details onto the page.
The details one has control over are:
* The prefix that a user's audio files typically have, e.g. "Bg-" for files like "Bg-крава.ogg";
* The suffix that a user's audio files typically have, e.g. ".ogg" for the same example above;
* The choice of how to render the information; see below for supported ways.
In order to add yourself to the module, you can create a new field in the "speaker_profiles" table, filling in the required details. Using speaker profiles works best if you always use a particular naming convention for your files, which is especially easy using [[lingualibre:|Lingua Libre]].
{{#invoke:bg-pronunciation/speaker profiles|show_data}}
kf6zz626xiepltdkyleo29jbfepsxna
ප්රවර්ගය:Dutch Low Saxon
14
143938
234888
2026-02-13T23:51:28Z
en>Benwing2
0
Created page with "{{auto cat|lect=1|<country>|country=the Netherlands}}"
234888
wikitext
text/x-wiki
{{auto cat|lect=1|<country>|country=the Netherlands}}
5goqrs207hth3xhll57cy37c4e3ml4j
234889
234888
2026-05-24T09:47:57Z
Lee
19
[[:en:Category:Dutch_Low_Saxon]] වෙතින් එක් සංශෝධනයක්
234888
wikitext
text/x-wiki
{{auto cat|lect=1|<country>|country=the Netherlands}}
5goqrs207hth3xhll57cy37c4e3ml4j