# @wikimedia/language-data
# Version:
# Language data and utilities.
# 912 lines (908 loc) • 31.7 kB
# YAML
# Language entries, keyed by language code.
#
# Each value takes one of two forms:
#   code: [script, [regions], autonym]
#     script  - ISO 15924 script code; each one is also listed under
#               scriptgroups
#     regions - one or more region codes from regiongroups
#     autonym - the name of the language, written in the language itself
#   code: [target]
#     a redirect to the entry stored under the code "target"
languages:
  aa: [Latn, [AF], Qafár af]
  aae: [Latn, [EU], arbërisht]
  ab: [Cyrl, [EU], аԥсшәа]
  abe: [Latn, [AM], Wôbanakiôdwawôgan]
  abr: [Latn, [AF], Abron]
  abs: [Latn, [AS], Bahasa Ambon]
  ace: [Latn, [AS, PA], Acèh]
  acf: [Latn, [AM], Kwéyòl Sent Lisi]
  acm: [Arab, [ME], عراقي]
  acq: [Arab, [ME, AF], تعزية-عدنية]
  ada: [Latn, [AF], Dangme]
  ady: [Cyrl, [EU, ME], адыгабзэ]
  ady-cyrl: [ady]
  ady-latn: [Latn, [EU, ME], Adygabze]
  aeb: [aeb-arab]
  aeb-arab: [Arab, [AF], تونسي]
  aeb-latn: [Latn, [AF], Tûnsî]
  af: [Latn, [AF], Afrikaans]
  agq: [Latn, [AF], aghɨ̂m]
  ahr: [Deva, [AS], अहिराणी]
  aii: [Syrc, [ME], ܣܘܪܝܬ]
  ajg: [Latn, [AF], ajagbe]
  # The code ajp was deprecated by ISO and merged into apc:
  # https://iso639-3.sil.org/code/ajp
  ajp: [apc]
  ajp-arab: [apc]
  ajp-latn: [apc-latn]
  akz: [Latn, [AM], Albaamo innaaɬiilka]
  ale: [Latn, [AM, AS], unangam tunuu]
  ale-cyrl: [Cyrl, [AS], унаӈам тунуу]
  aln: [Latn, [EU], Gegë]
  als: [sq]
  alt: [Cyrl, [EU, AS], алтай тил]
  am: [Ethi, [AF], አማርኛ]
  ami: [Latn, [AS], Pangcah]
  an: [Latn, [EU], aragonés]
  ang: [Latn, [EU], Ænglisc]
  ann: [Latn, [AF], Obolo]
  anp: [Deva, [AS], अंगिका]
  apc: [Arab, [ME], شامي]
  apc-arab: [apc]
  apc-latn: [Latn, [ME], šāmi]
  apw: [Latn, [AM], "Ndee biyati'"]
  ar: [Arab, [AF, ME], العربية]
  arc: [Syrc, [ME], ܐܪܡܝܐ]
  arn: [Latn, [AM], mapudungun]
  aro: [Latn, [AM], Araona]
  arq: [Arab, [AF, ME], جازايرية]
  ars: [Arab, [ME], نجدي]
  ary: [Arab, [AF, ME], الدارجة]
  ary-arab: [ary]
  ary-latn: [Latn, [AF, ME], ed-dārija]
  arz: [Arab, [AF, ME], مصرى]
  as: [Beng, [AS], অসমীয়া]
  ase: [Sgnw, [AM], American Sign Language]
  ast: [Latn, [EU], asturianu]
  atj: [Latn, [AM], atikamekw]
  atv: [Cyrl, [EU, AS], тÿндÿк алтай тил]
  av: [Cyrl, [EU], авар]
  avk: [Latn, [WW], Kotava]
  awa: [Deva, [AS], अवधी]
  ay: [Latn, [AM], Aymar aru]
  # The Latin script is the default in the North Azerbaijani Wikipedia,
  # which uses the macro code 'az'. Its own standard code is 'azj'.
  # The Arabic script is the default in the South Azerbaijani Wikipedia,
  # which correctly uses the code 'azb'.
  # CLDR uses az-latn and az-arab.
  az: [az-latn]
  az-arab: [Arab, [AS, ME], تۆرکجه]
  az-cyrl: [Cyrl, [EU, ME], азәрбајҹанҹа]
  az-latn: [Latn, [EU, ME], azərbaycanca]
  azb: [az-arab]
  azj: [az-latn]
  ba: [Cyrl, [EU], башҡортса]
  # The common modern default.
  ban: [Latn, [AS, PA], Bali]
  # For support in webfonts.
  ban-bali: [Bali, [AS, PA], ᬩᬮᬶ]
  bar: [Latn, [EU], Boarisch]
  bas: [Latn, [AF], ɓasaá]
  bat-smg: [sgs]
  bbc: [bbc-latn]
  bbc-batk: [Batk, [AS], ᯅᯖᯂ᯲ ᯖᯬᯅ]
  bbc-latn: [Latn, [AS], Batak Toba]
  bcc: [Arab, [AS, ME], جهلسری بلوچی]
  bci: [Latn, [AF], wawle]
  bcl: [Latn, [AS], Bikol Central]
  bdr: [Latn, [AS], Bajau Sama]
  be: [Cyrl, [EU], беларуская]
  be-tarask: [Cyrl, [EU], беларуская (тарашкевіца)]
  be-x-old: [be-tarask]
  bem: [Latn, [AF], IciBemba]
  bew: [Latn, [AS], Betawi]
  bfa: [Latn, [AF], Bari]
  bfq: [Taml, [AS], படகா]
  bft: [Arab, [AS], بلتی]
  bg: [Cyrl, [EU], български]
  bgc: [Deva, [AS], हरियाणवी]
  bgn: [Arab, [AS, ME], روچ کپتین بلوچی]
  # FIXME - currently says Bhojpuri, but it's a macrolanguage.
  bh: [bho]
  bho: [Deva, [AS], भोजपुरी]
  bi: [Latn, [PA], Bislama]
  bin: [Latn, [AF], Ẹdo]
  bjn: [Latn, [AS], Banjar]
  bkm: [Latn, [AF], Itaŋikom]
  blc: [Latn, [AM], ItNuxalkmc]
  blk: [Mymr, [AS], ပအိုဝ်ႏဘာႏသာႏ]
  bm: [Latn, [AF], bamanankan]
  bn: [Beng, [AS], বাংলা]
  bnn: [Latn, [AS], bunun]
  bo: [Tibt, [AS], བོད་ཡིག]
  bol: [Latn, [AF], bòo pìkkà]
  bom: [Latn, [AF], bèrom]
  bpy: [Beng, [AS], বিষ্ণুপ্রিয়া মণিপুরী]
  bqi: [Arab, [AS, ME], بختیاری]
  br: [Latn, [EU], brezhoneg]
  brh: [Latn, [ME, AS], Bráhuí]
  brx: [Deva, [AS], "बर'"]
  bs: [Latn, [EU], bosanski]
  btm: [Latn, [AS], Mandailing]
  bto: [Latn, [AS], Iriga Bicolano]
  bug: [Latn, [AS, PA], Basa Ugi]
  bug-bugi: [Bugi, [AS, PA], ᨅᨔ ᨕᨘᨁᨗ]
  bug-latn: [bug]
  bum: [Latn, [AF], bulu]
  bwr: [Latn, [AF], bura]
  bxr: [Cyrl, [AS], буряад]
  byn: [Ethi, [AF], ብሊን]
  bzj: [Latn, [AM], Bileez Kriol]
  bzs: [Sgnw, [AM], Língua brasileira de sinais]
  ca: [Latn, [EU], català]
  cak: [Latn, [AM], Kaqchikel]
  cbk: [Latn, [AS], Chavacano de Zamboanga]
  cbk-zam: [cbk]
  ccp: [Cakm, [AS], 𑄌𑄋𑄴𑄟𑄳𑄦]
  # FIXME cdo will be modified later to split to Latin and Chinese more cleanly
  cdo: [Latn, [AS], 閩東語 / Mìng-dĕ̤ng-ngṳ̄]
  cdo-hani: [Hani, [AS], 閩東語(漢字)]
  cdo-latn: [Latn, [AS], Mìng-dĕ̤ng-ngṳ̄ Bàng-uâ-cê]
  ce: [Cyrl, [EU], нохчийн]
  ceb: [Latn, [AS], Cebuano]
  ch: [Latn, [PA], Chamoru]
  # FIXME chm is actually a macro language that includes
  # mhr and mrj, but CLDR Territory-Language information
  # uses chm instead of mhr, so for practical reasons
  # it should redirect there.
  # A better fix would be this:
  # https://phabricator.wikimedia.org/T136164
  chm: [mhr]
  chn: [Latn, [AM], chinuk wawa]
  cho: [Latn, [AM], Chahta anumpa]
  chr: [Cher, [AM], ᏣᎳᎩ]
  chy: [Latn, [AM], Tsetsêhestâhese]
  ciw: [Latn, [AM], Anishinaabemowin]
  cjk: [Latn, [AF], cokwe]
  cjy: [Hant, [AS], 晉語]
  cjy-hans: [Hans, [AS], 晋语(简化字)]
  cjy-hant: [Hant, [AS], 晉語(正字)]
  ckb: [Arab, [ME], کوردی]
  ckt: [Cyrl, [AS], ԓыгъоравэтԓьэн]
  cnh: [Latn, [AS], Lai holh]
  cnr: [cnr-latn]
  cnr-cyrl: [Cyrl, [EU], црногорски]
  cnr-latn: [Latn, [EU], crnogorski]
  co: [Latn, [EU], corsu]
  cop: [Copt, [AF, ME], ϯⲙⲉⲧⲣⲉⲙⲛ̀ⲭⲏⲙⲓ]
  cps: [Latn, [AS], Capiceño]
  cpx: [Hant, [AS], 莆仙語 / Pó-sing-gṳ̂]
  cpx-hans: [Hans, [AS], 莆仙语(简体)]
  cpx-hant: [Hant, [AS], 莆仙語(繁體)]
  cpx-latn: [Latn, [AS], Pó-sing-gṳ̂ (Báⁿ-uā-ci̍)]
  cr: [Cans, [AM], ᓀᐦᐃᔭᐍᐏᐣ]
  cr-cans: [cr]
  cr-latn: [Latn, [AM], Nēhiyawēwin]
  crh: [Latn, [EU], qırımtatarca]
  crh-cyrl: [Cyrl, [EU], къырымтатарджа]
  crh-latn: [crh]
  crh-ro: [Latn, [EU], tatarşa]
  cs: [Latn, [EU], čeština]
  csb: [Latn, [EU], kaszëbsczi]
  # FIXME: which script to prefer?..
  cu: [Cyrl, [EU], словѣньскъ / ⰔⰎⰑⰂⰡⰐⰠⰔⰍⰟ]
  cv: [Cyrl, [EU], чӑвашла]
  cy: [Latn, [EU], Cymraeg]
  da: [Latn, [EU], dansk]
  dag: [Latn, [AF], dagbanli]
  dar: [Cyrl, [EU], дарган]
  ddn: [Latn, [AF], dendi]
  de: [Latn, [EU], Deutsch]
  de-at: [Latn, [EU], Österreichisches Deutsch]
  de-ch: [Latn, [EU], Schweizer Hochdeutsch]
  de-formal: [Latn, [EU], Deutsch (Sie-Form)]
  dga: [Latn, [AF], Dagaare]
  # In ISO 639, it refers to Rek Dinka. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Dinka.
  dik: [din]
  din: [Latn, [AF], Thuɔŋjäŋ]
  diq: [Latn, [EU, AS], Zazaki]
  doi: [Deva, [AS], डोगरी]
  dsb: [Latn, [EU], dolnoserbski]
  dtp: [Latn, [AS], Dusun Bundu-liwan]
  dty: [Deva, [AS], डोटेली]
  dv: [Thaa, [AS], ދިވެހިބަސް]
  dyu: [Latn, [AF], Julakan]
  dz: [Tibt, [AS], ཇོང་ཁ]
  ee: [Latn, [AF], eʋegbe]
  efi: [Latn, [AF], efịk]
  egl: [Latn, [EU], Emiliàn]
  ekp: [Latn, [AF], ẹkpeye]
  el: [Grek, [EU], Ελληνικά]
  elm: [Latn, [AF], Eleme]
  eml: [Latn, [EU], emiliàn e rumagnòl]
  en: [Latn, [EU, AM, AF, ME, AS, PA, WW], English]
  en-ca: [Latn, [AM], Canadian English]
  en-gb: [Latn, [EU, AS, PA], British English]
  en-simple: [Latn, [WW], Simple English]
  en-us: [Latn, [AM], American English]
  eo: [Latn, [WW], Esperanto]
  es: [Latn, [EU, AM, AF, WW, PA], español]
  es-419: [Latn, [AM], español de América Latina]
  es-formal: [Latn, [EU, AM, AF, WW], español (formal)]
  es-ni: [Latn, [AM], español nicaragüense]
  esu: [Latn, [AM], "Yup'ik"]
  et: [Latn, [EU], eesti]
  eu: [Latn, [EU], euskara]
  ext: [Latn, [EU], estremeñu]
  eya: [Latn, [AM], I·ya·q]
  fa: [Arab, [AS, ME], فارسی]
  fan: [Latn, [AF], Faŋ]
  fat: [Latn, [AF], mfantse]
  fax: [Latn, [EU], Fala]
  ff: [Latn, [AF], Fulfulde]
  fi: [Latn, [EU], suomi]
  fil: [tl]
  fit: [Latn, [EU], meänkieli]
  fiu-vro: [vro]
  fj: [Latn, [PA], Na Vosa Vakaviti]
  fkv: [Latn, [EU], kvääni]
  fo: [Latn, [EU], føroyskt]
  fon: [Latn, [AF], fɔ̀ngbè]
  fr: [Latn, [EU, AM, WW], français]
  frc: [Latn, [AM], français cadien]
  frp: [Latn, [EU], arpetan]
  frr: [Latn, [EU], Nordfriisk]
  fuf: [Latn, [AF], Fuuta Jalon]
  fur: [Latn, [EU], furlan]
  # In ISO 639, it refers to Nigerian Fula. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Fula.
  fuv: [ff]
  fvr: [Latn, [AF], poor’íŋ belé’ŋ]
  fy: [Latn, [EU], Frysk]
  ga: [Latn, [EU], Gaeilge]
  gaa: [Latn, [AF], Ga]
  gag: [Latn, [EU], Gagauz]
  gah: [Latn, [AS], Alekano]
  gan: [Hant, [AS], 贛語]
  gan-hans: [Hans, [AS], 赣语(简体)]
  gan-hant: [Hant, [AS], 贛語(繁體)]
  # In ISO 639, it refers to West Central Oromo. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Oromo.
  gaz: [om]
  gbm: [Deva, [AS], गढ़वळि]
  gbz: [Latn, [AS], Dari-e Mazdeyasnā]
  gcf: [Latn, [AM], kréyòl Gwadloup]
  gcr: [Latn, [AM], kriyòl gwiyannen]
  gd: [Latn, [EU], Gàidhlig]
  gez: [Ethi, [AF], ግዕዝ]
  gl: [Latn, [EU], galego]
  gld: [Cyrl, [AS], на̄ни]
  glk: [Arab, [AS, ME], گیلکی]
  gn: [Latn, [AM], "Avañe'ẽ"]
  gom: [gom-deva]
  gom-deva: [Deva, [AS], गोंयची कोंकणी]
  gom-latn: [Latn, [AS], Gõychi Konknni]
  gor: [Latn, [AS], Bahasa Hulontalo]
  got: [Goth, [EU], 𐌲𐌿𐍄𐌹𐍃𐌺]
  gpe: [Latn, [AF], Ghanaian Pidgin]
  grc: [Grek, [EU], Ἀρχαία ἑλληνικὴ]
  gsw: [Latn, [EU], Alemannisch]
  gu: [Gujr, [AS], ગુજરાતી]
  guc: [Latn, [AM], wayuunaiki]
  gum: [Latn, [AM], Namtrik]
  gur: [Latn, [AF], farefare]
  guw: [Latn, [AF], gungbe]
  gv: [Latn, [EU], Gaelg]
  # CLDR uses ha for Latin script and ha-arab for Arabic script.
  # Latin is more common and is used in Wikipedia.
  ha: [Latn, [AF], Hausa]
  ha-arab: [Arab, [AF], هَوُسَ]
  ha-latn: [ha]
  hai: [Latn, [AM], X̱aat Kíl]
  hak: [Latn, [AS], Hak-kâ-fa]
  hak-hans: [Hans, [AS], 客家语(简体)]
  hak-hant: [Hant, [AS], 客家語(繁體)]
  haw: [Latn, [AM, PA], Hawaiʻi]
  he: [Hebr, [ME], עברית]
  hi: [Deva, [AS], हिन्दी]
  hif: [Latn, [PA, AS], Fiji Hindi]
  hif-deva: [Deva, [AS], फ़ीजी हिन्दी]
  hif-latn: [hif]
  hil: [Latn, [AS], Ilonggo]
  hke: [Latn, [AF], kihunde]
  hne: [Deva, [AS], छत्तीसगढ़ी]
  hno: [Arab, [AS], ہندکو]
  ho: [Latn, [PA], Hiri Motu]
  hoc: [Wara, [AS], 𑢹𑣉𑣉]
  hr: [Latn, [EU], hrvatski]
  hrx: [Latn, [AM], Hunsrik]
  hsb: [Latn, [EU], hornjoserbsce]
  hsn: [Hans, [AS], 湘语]
  ht: [Latn, [AM], Kreyòl ayisyen]
  hu: [Latn, [EU], magyar]
  hu-formal: [Latn, [EU], Magyar (magázó)]
  hy: [Armn, [EU, ME], հայերեն]
  hyw: [Armn, [EU, ME], Արեւմտահայերէն]
  hz: [Latn, [AF], Otsiherero]
  ia: [Latn, [WW], interlingua]
  iba: [Latn, [AS, PA], Jaku Iban]
  ibb: [Latn, [AF], ibibio]
  id: [Latn, [AS, PA], Bahasa Indonesia]
  ie: [Latn, [WW], Interlingue]
  ig: [Latn, [AF], Igbo]
  igb: [Latn, [AF], Ebira]
  igl: [Latn, [AF], Igala]
  ii: [Yiii, [AS], ꆇꉙ]
  ik: [Latn, [AM], Iñupiatun]
  ike-cans: [Cans, [AM], ᐃᓄᒃᑎᑐᑦ]
  ike-latn: [Latn, [AM], inuktitut]
  ilo: [Latn, [AS], Ilokano]
  inh: [Cyrl, [EU], гӀалгӀай]
  io: [Latn, [WW], Ido]
  is: [Latn, [EU], íslenska]
  ish: [Latn, [AF], awain]
  isv: [isv-latn]
  isv-cyrl: [Cyrl, [EU], меджусловјанскы]
  isv-latn: [Latn, [EU], medžuslovjansky]
  it: [Latn, [EU], italiano]
  iu: [ike-cans]
  izh: [Latn, [EU], ižoran keel]
  ja: [Jpan, [AS], 日本語]
  jac: [Latn, [AM], Abꞌxubꞌal Poptiꞌ]
  jam: [Latn, [AM], Patois]
  jbo: [Latn, [WW], lojban]
  jdt: [jdt-cyrl]
  jdt-cyrl: [Cyrl, [EU, AS], жугьури]
  jje: [Kore, [AS], 제주말]
  jut: [Latn, [EU], jysk]
  jv: [Latn, [AS, PA], Jawa]
  # For support in webfonts.
  jv-java: [Java, [AS, PA], ꦗꦮ]
  ka: [Geor, [EU], ქართული]
  kaa: [Latn, [AS], Qaraqalpaqsha]
  # Can also be Tfng, but the Wikipedia is mostly Latn
  kab: [Latn, [AF, EU], Taqbaylit]
  kac: [Latn, [AS], Jinghpaw]
  kai: [Latn, [AF], Karai-karai]
  kam: [Latn, [AF], kĩkamba]
  kbd: [Cyrl, [EU, ME], адыгэбзэ]
  kbd-cyrl: [kbd]
  kbd-latn: [Latn, [EU], Qabardjajəbza]
  kbp: [Latn, [AF], Kabɩyɛ]
  kcg: [Latn, [AF], Tyap]
  kck: [Latn, [AF], tjikalanga]
  kea: [Latn, [AF], kabuverdianu]
  ken: [Latn, [AF], kɛ́nyáŋ]
  kg: [Latn, [AF], Kongo]
  kge: [Latn, [AS, PA], Basa Kumoring]
  kge-arab: [Arab, [AS, PA], باس كوموريڠ]
  kgp: [Latn, [AM], Kaingáng]
  khk: [mn]
  khw: [Arab, [ME, AS], کھوار]
  ki: [Latn, [AF], Gĩkũyũ]
  kip: [Deva, [AS], शेषी पाङ]
  kiu: [Latn, [EU, ME], Kırmancki]
  kj: [Latn, [AF], Kwanyama]
  kjh: [Cyrl, [AS], хакас]
  kjp: [Mymr, [AS], ဖၠုံလိက်]
  kk: [kk-cyrl]
  kk-arab: [Arab, [EU, AS], قازاقشا (تٶتە)]
  kk-cn: [kk-arab]
  kk-cyrl: [Cyrl, [EU, AS], қазақша]
  kk-kz: [kk-cyrl]
  kk-latn: [Latn, [EU, AS, ME], qazaqşa]
  kk-tr: [kk-latn]
  kl: [Latn, [AM, EU], kalaallisut]
  km: [Khmr, [AS], ភាសាខ្មែរ]
  kmb: [Latn, [AF], kimbundu]
  kmr: [ku-latn]
  kn: [Knda, [AS], ಕನ್ನಡ]
  # In ISO 639, it refers to Central Kanuri. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Kanuri.
  knc: [kr]
  knn: [Deva, [AS], महाराष्ट्रीय कोंकणी]
  ko: [Kore, [AS], 한국어]
  ko-kp: [Kore, [AS], 조선말]
  koi: [Cyrl, [EU], перем коми]
  koy: [Latn, [AM], "Denaakkenaageʼ"]
  kr: [Latn, [AF], kanuri]
  krc: [Cyrl, [EU], къарачай-малкъар]
  kri: [Latn, [AF], Krio]
  krj: [Latn, [AS], Kinaray-a]
  krl: [Latn, [EU], Karjala]
  ks: [ks-arab]
  ks-arab: [Arab, [AS], کٲشُر]
  ks-deva: [Deva, [AS], कॉशुर]
  ksf: [Latn, [AF], Bafia]
  ksh: [Latn, [EU], Ripoarisch]
  ksw: [Mymr, [AS], စှီၤ]
  # CLDR uses ku-latn and ku-arab. Latin is more common and is used in Wikipedia.
  ku: [ku-latn]
  # Note: The first word here is the same as the name of ckb.
  # It should probably be made less ambiguous.
  ku-arab: [Arab, [EU, ME], کوردی (عەرەبی)]
  ku-latn: [Latn, [EU, ME], kurdî]
  kum: [Cyrl, [EU], къумукъ]
  kus: [Latn, [AF], Kʋsaal]
  kv: [Cyrl, [EU], коми]
  kw: [Latn, [EU], kernowek]
  ky: [Cyrl, [AS], кыргызча]
  la: [Latn, [EU], Latina]
  lad: [lad-latn]
  lad-hebr: [Hebr, [ME, EU, AM], לאדינו]
  lad-latn: [Latn, [ME, EU, AM], Ladino]
  lag: [Latn, [AF], Kilaangi]
  lb: [Latn, [EU], Lëtzebuergesch]
  lbe: [Cyrl, [EU], лакку]
  ldn: [Latn, [WW], Láadan]
  lez: [Cyrl, [EU], лезги]
  lfn: [Latn, [WW], Lingua Franca Nova]
  lg: [Latn, [AF], Luganda]
  li: [Latn, [EU], Limburgs]
  lij: [Latn, [EU], Ligure]
  lij-mc: [Latn, [EU], munegascu]
  liv: [Latn, [EU], Līvõ kēļ]
  lki: [Arab, [AS, ME], لەکی]
  lkt: [Latn, [AM], Lakȟótiyapi]
  lld: [Latn, [EU], Ladin]
  lmo: [Latn, [EU], lombard]
  ln: [Latn, [AF], lingála]
  lo: [Laoo, [AS], ລາວ]
  loz: [Latn, [AF], Silozi]
  lrc: [Arab, [AS, ME], لۊری شومالی]
  lt: [Latn, [EU], lietuvių]
  ltg: [Latn, [EU], latgaļu]
  lua: [Latn, [AF], ciluba]
  lud: [Latn, [EU], lüüdi]
  lue: [Latn, [AF], chiluvale]
  luo: [Latn, [AF], dholuo]
  lus: [Latn, [AS], Mizo ţawng]
  lut: [Latn, [AM], dxʷləšucid]
  luz: [Arab, [ME], لئری دوٙمینی]
  lv: [Latn, [EU], latviešu]
  lvs: [lv]
  lzh: [Hant, [AS], 文言]
  # Also Geor, but the incubator is in Latn
  lzz: [Latn, [EU, ME], Lazuri]
  mad: [Latn, [AS], Madhurâ]
  mag: [Deva, [AS], मगही]
  mai: [Deva, [AS], मैथिली]
  mak: [Latn, [AS, PA], Mangkasarak]
  mak-bugi: [Bugi, [AS, PA], ᨆᨀᨔᨑ]
  map-bms: [Latn, [AS], Basa Banyumasan]
  mcn: [Latn, [AF], vùn màsànà]
  mdf: [Cyrl, [EU], мокшень]
  mey: [Arab, [AF], الحسانية]
  mfe: [Latn, [AM], Morisyen]
  mg: [Latn, [AF], Malagasy]
  mh: [Latn, [PA], Ebon]
  mhr: [Cyrl, [EU], олык марий]
  mi: [Latn, [PA], Māori]
  mic: [Latn, [AM], "Mi'kmaq"]
  min: [Latn, [AS], Minangkabau]
  miq: [Latn, [AM], Mískitu]
  mk: [Cyrl, [EU], македонски]
  ml: [Mlym, [AS, ME], മലയാളം]
  mn: [Cyrl, [AS], монгол]
  mn-cyrl: [mn]
  mn-mong: [mvf]
  mnc: [Mong, [AS], ᠮᠠᠨᠵᡠ ᡤᡳᠰᡠᠨ]
  mnc-latn: [Latn, [AS], Manju gisun]
  mni: [Mtei, [AS], ꯃꯤꯇꯩ ꯂꯣꯟ]
  mni-beng: [Beng, [AS], মেইতেই লোন্]
  mnw: [Mymr, [AS], ဘာသာမန်]
  mo: [Cyrl, [EU], молдовеняскэ]
  moe: [Latn, [AM], innu-aimun]
  mos: [Latn, [AF], moore]
  mr: [Deva, [AS, ME], मराठी]
  mrh: [Latn, [AS], Mara]
  mrj: [Cyrl, [EU], кырык мары]
  mrv: [Latn, [PA], Magareva]
  ms: [Latn, [AS], Bahasa Melayu]
  ms-arab: [Arab, [AS], بهاس ملايو]
  mt: [Latn, [EU], Malti]
  mui: [Latn, [AS], Baso Palembang]
  mus: [Latn, [AM], Mvskoke]
  mvf: [Mong, [AS], ᠮᠣᠩᠭᠣᠯ]
  mwl: [Latn, [EU], Mirandés]
  mwv: [Latn, [AS], Behase Mentawei]
  mww: [mww-latn]
  mww-latn: [Latn, [AS], Hmoob Dawb]
  my: [Mymr, [AS], မြန်မာဘာသာ]
  myv: [Cyrl, [EU], эрзянь]
  mzn: [Arab, [ME, AS], مازِرونی]
  na: [Latn, [PA], Dorerin Naoero]
  nah: [Latn, [AM], Nāhuatl]
  nan: [Latn, [AS], 閩南語 / Bân-lâm-gú]
  nan-hani: [Hani, [AS], 閩南語(漢字)]
  nan-hans: [Hans, [AS], 闽南语(简化汉字)]
  nan-hant: [Hant, [AS], 閩南語(傳統漢字)]
  nan-latn: [Latn, [AS], Bân-lâm-gú (Lô-má-jī)]
  nan-latn-pehoeji: [Latn, [AS], Bân-lâm-gú (Pe̍h-ōe-jī)]
  nan-latn-tailo: [Latn, [AS], Bân-lâm-gú (Tâi-lô)]
  nap: [Latn, [EU], Napulitano]
  nb: [Latn, [EU], norsk (bokmål)]
  nd: [Latn, [AF], siNdebele saseNyakatho]
  nds: [Latn, [EU], Plattdüütsch]
  nds-nl: [Latn, [EU], Nedersaksisch]
  ne: [Deva, [AS], नेपाली]
  new: [Deva, [AS], नेपाल भाषा]
  ng: [Latn, [AF], Oshiwambo]
  nia: [Latn, [AS], Li Niha]
  nit: [Telu, [AS], కొలామి]
  niu: [Latn, [PA], ko e vagahau Niuē]
  njo: [Latn, [AS], Ao]
  nl: [Latn, [EU, AM], Nederlands]
  nl-informal: [Latn, [EU, AM], Nederlands (informeel)]
  nmz: [Latn, [AF], nawdm]
  nn: [Latn, [EU], norsk (nynorsk)]
  nn-hognorsk: [Latn, [EU], norsk (høgnorsk)]
  # There's also nb for Bokmål and nn for Nynorsk
  # The key is quoted because YAML 1.1 parsers read a bare no as boolean false.
  "no": [Latn, [EU], norsk]
  nod: [Lana, [AS], ᨣᩴᩤᨾᩮᩥᩬᨦ]
  nod-thai: [Thai, [AS], คำเมือง]
  nog: [Cyrl, [EU], ногайша]
  nov: [Latn, [WW], Novial]
  npi: [ne]
  nqo: [Nkoo, [AF], ߒߞߏ]
  nr: [Latn, [AF], isiNdebele seSewula]
  nrf-gg: [Latn, [EU], Guernésiais]
  nrf-je: [Latn, [EU], Jèrriais]
  nrm: [Latn, [EU], Nouormand]
  nso: [Latn, [AF], Sesotho sa Leboa]
  nup: [Latn, [AF], Nupe]
  nus: [Latn, [AF], Thok Naath]
  nv: [Latn, [AM], Diné bizaad]
  ny: [Latn, [AF], Chi-Chewa]
  nyn: [Latn, [AF], runyankore]
  nyo: [Latn, [AF], Orunyoro]
  nys: [Latn, [PA], Nyungar]
  nzi: [Latn, [AF], Nzema]
  oc: [Latn, [EU], occitan]
  ojb: [Latn, [AM], Ojibwemowin]
  oka: [Latn, [AM], n̓səl̓xcin̓]
  olo: [Latn, [EU], livvinkarjala]
  om: [Latn, [AF], Oromoo]
  ood: [Latn, [AM], "ʼOʼodham ha-ñeʼokĭ"]
  or: [Orya, [AS], ଓଡ଼ିଆ]
  ory: [or]
  os: [Cyrl, [EU], ирон]
  osi: [Latn, [AS], Using]
  ota: [Arab, [AS, EU], لسان عثمانى]
  ovd: [Latn, [EU], övdalsk]
  pa: [pa-guru]
  pa-guru: [Guru, [AS], ਪੰਜਾਬੀ]
  pag: [Latn, [AS], Pangasinan]
  pam: [Latn, [AS], Kapampangan]
  pap: [Latn, [AM], Papiamentu]
  pap-aw: [Latn, [AM], Papiamento]
  pbb: [Latn, [AM], Nasa Yuwe]
  # In ISO 639, it refers to Southern Pashto. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Pashto.
  pbt: [ps]
  pcd: [Latn, [EU], Picard]
  pcm: [Latn, [AF], Naijá]
  pdc: [Latn, [EU, AM], Deitsch]
  pdt: [Latn, [EU, AM], Plautdietsch]
  pes: [fa]
  pey: [Latn, [EU, PA, AS], Petjoh]
  pfl: [Latn, [EU], Pälzisch]
  phr: [Arab, [AS], پوٹھواری]
  pi: [Deva, [AS], पालि]
  pih: [Latn, [PA], Norfuk / Pitkern]
  pis: [Latn, [PA], Pijin]
  piu: [Latn, [PA], Pintupi-Luritja]
  pjt: [Latn, [PA], Pitjantjatjara]
  pko: [Latn, [AF], Pökoot]
  pl: [Latn, [EU], polski]
  plt: [mg]
  pms: [Latn, [EU], Piemontèis]
  pnb: [Arab, [AS, ME], پنجابی]
  pnt: [Grek, [EU], Ποντιακά]
  pov: [Latn, [AF], guinensi]
  ppl: [Latn, [AM], Nawat]
  prg: [Latn, [EU], Prūsiskan]
  prs: [Arab, [AS, ME], دری]
  ps: [Arab, [AS, ME], پښتو]
  pt: [Latn, [EU, AM, AS, PA, AF, WW], português]
  pt-br: [Latn, [AM], português do Brasil]
  pwn: [Latn, [AS], pinayuanan]
  qu: [Latn, [AM], Runa Simi]
  quc: [Latn, [AM], "K'iche'"]
  qug: [Latn, [AM], Runa shimi]
  # In ISO 639, it refers to Chanka Quechua. It may
  # be changed like that here, too, but for
  # now, redirect it to macro Quechua.
  quy: [qu]
  qwh: [Latn, [AM], anqash qichwa]
  rag: [Latn, [AF], Lologooli]
  rap: [Latn, [PA, AM], arero rapa nui]
  rcf: [Latn, [AF], Kreol Réyoné]
  rej: [Latn, [AS, PA], Jang]
  rgn: [Latn, [EU], Rumagnôl]
  rhg: [Rohg, [AS], 𐴌𐴟𐴇𐴥𐴝𐴚𐴒𐴙𐴝]
  rif: [Latn, [AF], Tarifit]
  rki: [Mymr, [AS], ရခိုင်]
  rm: [Latn, [EU], rumantsch]
  rm-puter: [Latn, [EU], puter]
  rm-rumgr: [Latn, [EU], rumantsch grischun]
  rm-surmiran: [Latn, [EU], surmiran]
  rm-sursilv: [Latn, [EU], sursilvan]
  rm-sutsilv: [Latn, [EU], sutsilvan]
  rm-vallader: [Latn, [EU], vallader]
  rmc: [Latn, [EU], romaňi čhib]
  # Also known as Fíntika Rómma
  rmf: [Latn, [EU], kaalengo tšimb]
  rmy: [Latn, [EU], Romani]
  rn: [Latn, [AF], ikirundi]
  ro: [Latn, [EU], română]
  roa-rup: [rup]
  roa-tara: [Latn, [EU], tarandíne]
  rsk: [Cyrl, [EU], руски]
  rtm: [Latn, [PA], Faeag Rotuma]
  ru: [Cyrl, [EU, AS, ME], русский]
  rue: [Cyrl, [EU], русиньскый]
  rup: [Latn, [EU], armãneashti]
  ruq: [Cyrl, [EU], Влахесте]
  ruq-cyrl: [ruq]
  # FIXME: broken autonym
  ruq-grek: [Grek, [EU], Megleno-Romanian (Greek script)]
  ruq-latn: [Latn, [EU], Vlăheşte]
  rut: [Cyrl, [EU], мыхаӀбишды]
  rw: [Latn, [AF], Ikinyarwanda]
  # Bug: 60815
  rwr: [Deva, [AS], मारवाड़ी]
  ryu: [Jpan, [AS], うちなーぐち]
  sa: [Deva, [AS], संस्कृतम्]
  sah: [Cyrl, [EU, AS], саха тыла]
  sat: [Olck, [AS], ᱥᱟᱱᱛᱟᱲᱤ]
  saz: [Saur, [AS], ꢱꣃꢬꢵꢯ꣄ꢡ꣄ꢬꢵ]
  sc: [Latn, [EU], sardu]
  scn: [Latn, [EU], sicilianu]
  sco: [Latn, [EU], Scots]
  sd: [Arab, [AS], سنڌي]
  sdc: [Latn, [EU], Sassaresu]
  sdh: [Arab, [ME], کوردی خوارگ]
  se: [Latn, [EU], davvisámegiella]
  se-fi: [Latn, [EU], davvisámegiella (Suoma bealde)]
  se-no: [Latn, [EU], davvisámegiella (Norgga bealde)]
  se-se: [Latn, [EU], davvisámegiella (Ruoŧa bealde)]
  sei: [Latn, [AM], Cmique Itom]
  ses: [Latn, [AF], Koyraboro Senni]
  sg: [Latn, [AF], Sängö]
  sgs: [Latn, [EU], žemaitėška]
  sh: [Latn, [EU], srpskohrvatski / српскохрватски]
  sh-cyrl: [Cyrl, [EU], српскохрватски]
  sh-latn: [Latn, [EU], srpskohrvatski]
  shi: [shi-latn]
  shi-latn: [Latn, [AF], Taclḥit]
  shi-tfng: [Tfng, [AF], ⵜⴰⵛⵍⵃⵉⵜ]
  shn: [Mymr, [AS], လိၵ်ႈတႆး]
  shy: [shy-latn]
  shy-latn: [Latn, [AF], tacawit]
  si: [Sinh, [AS], සිංහල]
  simple: [en-simple]
  sjd: [Cyrl, [EU], кӣллт са̄мь кӣлл]
  sje: [Latn, [EU], bidumsámegiella]
  sjo: [Mong, [AS], ᠰᡞᠪᡝ ᡤᡞᠰᡠᠨ]
  sju: [Latn, [EU], ubmejesámiengiälla]
  sk: [Latn, [EU], slovenčina]
  skr: [skr-arab]
  skr-arab: [Arab, [AS], سرائیکی]
  sl: [Latn, [EU], slovenščina]
  sli: [Latn, [EU], Schläsch]
  slr: [Latn, [AS], Salırça]
  sly: [Latn, [AS], Bahasa Selayar]
  sm: [Latn, [PA], Gagana Samoa]
  sma: [Latn, [EU], åarjelsaemien]
  smj: [Latn, [EU], julevsámegiella]
  smn: [Latn, [EU], anarâškielâ]
  sms: [Latn, [EU], nuõrttsääʹmǩiõll]
  sn: [Latn, [AF], chiShona]
  so: [Latn, [AF], Soomaaliga]
  son: [Latn, [AF], soŋay]
  sq: [Latn, [EU], shqip]
  sr: [sr-cyrl]
  sr-cyrl: [Cyrl, [EU], српски]
  sr-ec: [sr-cyrl]
  sr-el: [sr-latn]
  sr-latn: [Latn, [EU], srpski]
  srn: [Latn, [AM, EU], Sranantongo]
  sro: [Latn, [EU], sardu campidanesu]
  srq: [Latn, [AM], mbia cheë]
  ss: [Latn, [AF], SiSwati]
  st: [Latn, [AF], Sesotho]
  stq: [Latn, [EU], Seeltersk]
  sty: [Cyrl, [EU, AS], себертатар]
  su: [Latn, [AS], Sunda]
  sv: [Latn, [EU], svenska]
  sw: [Latn, [AF], Kiswahili]
  swb: [Latn, [AF], Shikomoro]
  swh: [sw]
  sxu: [Latn, [EU], Säggssch]
  syc: [Syrc, [ME], ܣܘܪܝܝܐ]
  syl: [Sylo, [AS], ꠍꠤꠟꠐꠤ]
  syl-beng: [Beng, [AS], সিলেটি]
  syl-sylo: [syl]
  szl: [Latn, [EU], ślůnski]
  szy: [Latn, [AS], Sakizaya]
  ta: [Taml, [AS], தமிழ்]
  # This is initially added for Wikimedia MinT, which outputs Tifinagh.
  # Perhaps some day it can be changed to Latin as default.
  taq: [taq-tfng]
  taq-latn: [Latn, [AF], təmajəq]
  taq-tfng: [Tfng, [AF], ⵜⴰⵎⴰⵌⴰⵆ]
  tay: [Latn, [AS], Tayal]
  tcy: [Knda, [AS], ತುಳು]
  tdd: [Tale, [AS], ᥖᥭᥰ ᥖᥬᥲ ᥑᥨᥒᥰ]
  te: [Telu, [AS], తెలుగు]
  tet: [Latn, [AS, PA], tetun]
  tg: [tg-cyrl]
  tg-cyrl: [Cyrl, [AS], тоҷикӣ]
  tg-latn: [Latn, [AS], tojikī]
  th: [Thai, [AS], ไทย]
  ti: [Ethi, [AF], ትግርኛ]
  tig: [Ethi, [AF], ትግረ]
  tk: [Latn, [AS], Türkmençe]
  tkr: [Cyrl, [AS], цӀаӀхна миз]
  tl: [Latn, [AS], Tagalog]
  tly: [Latn, [EU, AS, ME], tolışi]
  tly-cyrl: [Cyrl, [EU, AS, ME], толыши]
  tmr: [Hebr, [ME, EU, AM], ארמית בבלית]
  tn: [Latn, [AF], Setswana]
  to: [Latn, [PA], lea faka-Tonga]
  toi: [Latn, [AF], chitonga]
  tok: [Latn, [WW], toki pona]
  tokipona: [tok]
  tpi: [Latn, [PA, AS], Tok Pisin]
  tr: [Latn, [EU, ME], Türkçe]
  trp: [Latn, [AS], Kokborok]
  tru: [Latn, [AS], Ṫuroyo]
  trv: [Latn, [AS], Seediq]
  trw: [Arab, [AS], توروالی]
  ts: [Latn, [AF], Xitsonga]
  tsd: [Grek, [EU], Τσακωνικά]
  tsg: [Latn, [AS], Sinūg]
  tt: [Cyrl, [EU], татарча]
  tt-cyrl: [tt]
  tt-latn: [Latn, [EU], tatarça]
  ttj: [Latn, [AF], Orutooro]
  ttt: [Cyrl, [AS], Tati]
  tum: [Latn, [AF], chiTumbuka]
  tw: [Latn, [AF], Twi]
  twd: [Latn, [EU], Tweants]
  ty: [Latn, [PA], reo tahiti]
  tyv: [Cyrl, [AS], тыва дыл]
  tzl: [Latn, [WW], Talossan]
  tzm: [Tfng, [AF], ⵜⴰⵎⴰⵣⵉⵖⵜ]
  udm: [Cyrl, [EU], удмурт]
  # CLDR uses ug-arab, ug-latn and ug-cyrl.
  # Arabic seems to have the largest number of users and is the main script in the Wikipedia.
  ug: [ug-arab]
  ug-arab: [Arab, [AS], ئۇيغۇرچە]
  ug-cyrl: [Cyrl, [AS], уйғурчә]
  ug-latn: [Latn, [AS], uyghurche]
  uk: [Cyrl, [EU], українська]
  umb: [Latn, [AF], umbundu]
  umu: [Latn, [AM], Huluníixsuwaakan]
  ur: [Arab, [AS, ME], اردو]
  uz: [Latn, [AS], oʻzbekcha]
  uz-cyrl: [Cyrl, [AS], ўзбекча]
  uz-latn: [uz]
  uzn: [uz]
  vai: [Vaii, [AF], ꕙꔤ]
  ve: [Latn, [AF], Tshivenda]
  vec: [Latn, [EU, AM], vèneto]
  vep: [Latn, [EU], vepsän kel’]
  vi: [Latn, [AS], Tiếng Việt]
  vls: [Latn, [EU], West-Vlams]
  vmf: [Latn, [EU], Mainfränkisch]
  vmw: [Latn, [AF], emakhuwa]
  vo: [Latn, [WW], Volapük]
  vot: [Latn, [EU], Vaďďa]
  vro: [Latn, [EU], võro]
  wa: [Latn, [EU], walon]
  wal: [Latn, [AF], wolaytta]
  war: [Latn, [AS], Winaray]
  wls: [Latn, [PA], "Faka'uvea"]
  wlx: [Latn, [AF], waale]
  wo: [Latn, [AF], Wolof]
  wsg: [Telu, [AS], గోండి]
  wuu: [Hani, [AS], 吴语]
  wuu-hans: [Hans, [AS], 吴语(简体)]
  wuu-hant: [Hant, [AS], 吳語(正體)]
  xal: [Cyrl, [EU], хальмг]
  xh: [Latn, [AF], isiXhosa]
  xmf: [Geor, [EU], მარგალური]
  xmm: [Latn, [AS, PA], Manado]
  xsy: [Latn, [AS], SaiSiyat]
  ydd: [yi]
  yi: [Hebr, [ME, EU, AM], ייִדיש]
  yo: [Latn, [AF], Yorùbá]
  yoi: [Jpan, [AS], 与那国物言]
  yrk: [Cyrl, [AS], ненэцяʼ вада]
  yrl: [Latn, [AM], Nhẽẽgatú]
  yua: [Latn, [AM], "Maaya T'aan"]
  yue: [Hant, [AS], 粵語]
  yue-hans: [Hans, [AS], 粵语(简体)]
  yue-hant: [Hant, [AS], 粵語(繁體)]
  za: [Latn, [AS], Vahcuengh]
  zea: [Latn, [EU], Zeêuws]
  zgh: [Tfng, [AF], ⵜⴰⵎⴰⵣⵉⵖⵜ ⵜⴰⵏⴰⵡⴰⵢⵜ]
  zgh-latn: [Latn, [AF], tamaziɣt tanawayt]
  zh: [Hani, [AS, PA, AM, WW], 中文]
  zh-cdo: [cdo]
  zh-classical: [lzh]
  zh-cn: [Hans, [AS], 中文(中国大陆)]
  zh-hans: [Hans, [AS, PA, AM, WW], 中文(简体)]
  zh-hant: [Hant, [AS, PA, AM, WW], 中文(繁體)]
  zh-hk: [Hant, [AS], 中文(香港)]
  zh-min-nan: [nan]
  zh-mo: [Hant, [AS], 中文(澳門)]
  zh-my: [Hans, [AS], 中文(马来西亚)]
  zh-sg: [Hans, [AS], 中文(新加坡)]
  zh-tw: [Hant, [AS], 中文(臺灣)]
  zh-yue: [yue]
  zsm: [ms]
  zu: [Latn, [AF], isiZulu]
  zun: [Latn, [AM], "Shiwi'ma"]
# All the supported scripts, grouped logically.
#
# The codes are ISO 15924 script codes, taken from
# http://unicode.org/iso15924/iso15924-codes.html .
#
# The classification is roughly based on http://www.unicode.org/charts/
# with some practical corrections.
#
# The order of the groups affects display. Pau Giner suggested the order;
# the rationale is to keep the largest groups apart from one another,
# which improves discoverability.
#
# The group name "Other" is reserved.
scriptgroups:
  # It's hard to find a better place for Goth except the Latin group.
  Latin: [Latn, Goth]
  # Greek is probably different enough from Latin and Cyrillic, but user testing
  # may prove otherwise.
  Greek: [Grek]
  WestCaucasian: [Armn, Geor]
  Arabic: [Arab]
  # Maybe MiddleEastern can be unified with Arabic.
  # Maybe Thaana can be moved here from SouthAsian.
  # Maybe it can be unified with African.
  MiddleEastern: [Hebr, Syrc]
  African: [Copt, Ethi, Nkoo, Tfng, Vaii]
  # India, Nepal, Bangladesh, Sri-Lanka, Bhutan, Maldives.
  #
  # Thaana (Thaa, the script of Maldives) is here, even though it's RTL,
  # because it's closer geographically to India. Maybe it should be moved
  # to MiddleEastern or to Arabic, if that would be easier to users.
  #
  # Tibetan (Tibt) is here, even though it's classified as "Central Asian" by
  # Unicode, because linguistically and geographically it's closely related to
  # the Brahmic family.
  SouthAsian: [Beng, Cakm, Deva, Gujr, Guru, Knda, Mlym, Mtei, Olck, Orya, Rohg, Saur, Sinh, Sylo, Taml, Telu, Tibt, Thaa, Wara]
  Cyrillic: [Cyrl]
  CJK: [Hani, Hans, Hant, Kore, Jpan, Yiii]
  SouthEastAsian: [Bali, Batk, Bugi, Java, Khmr, Laoo, Lana, Mymr, Thai, Tale]
  Mongolian: [Mong]
  SignWriting: [Sgnw]
  NativeAmerican: [Cher, Cans]
  # Undetermined script
  Special: [Zyyy]
# Script codes of the scripts that are written right-to-left (RTL).
rtlscripts:
  [Arab, Hebr, Syrc, Nkoo, Rohg, Thaa]
# Region codes, each mapped to a group number.
# The numbers are also used in HTML id attributes
# NOTE(review): several codes share a number (WW/SP, EU/ME/AF, AS/PA), so the
# number appears to identify a display group rather than one region - confirm.
regiongroups:
  # Worldwide, international
  WW: 1
  # Special languages. To be shown near Worldwide when relevant.
  SP: 1
  # America
  AM: 2
  # Europe
  EU: 3
  # Middle East
  ME: 3
  # Africa
  AF: 3
  # Asia
  AS: 4
  # Pacific
  PA: 4