Added autonyms directly to langdb.yaml

* Can add languages not in MW
* Can get rid of foo / bar names which include different scripts
* Can get rid of directionality marks
* PHP scripts to generate the jquery.uls.data.js is now independent of
  mediawiki and moved the scripts to lib/jquery.uls/data
* No pretty printing for the jquery.uls.data.js and added a 'do not edit' comment.
* Related changes in RL module definition and example html

Change-Id: I9a360dbdec4e9312aa5c76f801424ff95a8550d6
This commit is contained in:
Niklas Laxström
2012-08-12 19:28:23 +00:00
committed by Gerrit Code Review
parent 7414184593
commit 23763bd247
10 changed files with 579 additions and 1460 deletions

View File

@@ -0,0 +1,551 @@
languages:
aa: [Latn, [AF], Qafár af]
ab: [Cyrl, [EU], Аҧсшәа]
ace: [Latn, [AS, PA], Acèh]
ady-cyrl: [Cyrl, [EU], Адыгэбзэ]
ady-latn: [Latn, [EU], Adygabze]
ady: [[Cyrl, Latn], [EU], [Адыгэбзэ, Adygabze]]
aeb: [Arab, [AF], زَوُن]
af: [Latn, [AF], Afrikaans]
ahr: [Deva, [AS], अहिराणी]
ak: [Latn, [AF], Akan]
akz: [Latn, [NA], Albaamo innaaɬiilka]
aln: [Latn, [EU], Gegë]
am: [Ethi, [AF], አማርኛ]
an: [Latn, [EU], aragonés]
ang: [Latn, [EU], Ænglisc]
anp: [Deva, [AS], अङ्गिका]
ar: [Arab, [ME], العربية]
arc: [Syrc, [ME], ܐܪܡܝܐ]
arn: [Latn, [SA], mapudungun]
aro: [Latn, [LA], Araona]
arq: [Latn, [AF], Dziri]
ary: [Latn, [ME], Maġribi]
arz: [Arab, [ME], مصرى]
as: [Beng, [AS], অসমীয়া]
ase: [Sgnw, [NA], American sign language]
ast: [Latn, [EU], asturianu]
av: [Cyrl, [EU], авар]
avk: [Latn, [WW], Kotava]
ay: [Latn, [SA], Aymar aru]
# also Arab, and in the past - Cyrl
az: [Latn, [EU, ME], azərbaycanca]
ba: [Cyrl, [EU], башҡортса]
bar: [Latn, [EU], Boarisch]
bbc-latn: [Latn, [AS], Batak Toba]
# FIXME
bbc: [Batk, [AS], Batak Toba/Batak autonym unknown]
bcc: [Arab, [AS, ME], بلوچی مکرانی]
bcl: [Latn, [AS], Bikol Central]
# FIXME: which is the correct code?
be-tarask: [Cyrl, [EU], беларуская (тарашкевіца)]
be-x-old: [Cyrl, [EU], беларуская (тарашкевіца)]
be: [Cyrl, [EU], беларуская]
bew: [Latn, [AS], Bahasa Betawi]
bfq: [Taml, [AS], படகா]
bg: [Cyrl, [EU], български]
bh: [Deva, [AS], भोजपुरी]
bho: [Deva, [AS], भोजपुरी]
bi: [Latn, [PA], Bislama]
bjn: [Latn, [AS], Bahasa Banjar]
bm: [Latn, [AF], bamanankan]
bn: [Beng, [AS], বাংলা]
bo: [Tibt, [AS], བོད་ཡིག]
bpy: [Beng, [AS], বিষ্ণুপ্রিয়া মণিপুরী]
bqi: [Arab, [ME], بختياري]
br: [Latn, [EU], brezhoneg]
brh: [Latn, [ME, AS], Bráhuí]
bs: [Latn, [EU], bosanski]
bto: [Latn, [AS], Iriga Bicolano]
bug: [Bugi, [AS], ᨅᨔ ᨕᨘᨁᨗ]
bxr: [Cyrl, [AS], буряад]
ca: [Latn, [EU], català]
cbk-zam: [Latn, [AS], Chavacano de Zamboanga]
cdo: [Latn, [AS], Mìng-dĕ̤ng-ngṳ̄]
ce: [Cyrl, [EU], нохчийн]
ceb: [Latn, [AS], Cebuano]
ch: [Latn, [PA], Chamoru]
cho: [Latn, [NA], Choctaw]
chr: [Cher, [NA], ᏣᎳᎩ]
chy: [Latn, [NA], Tsetsêhestâhese]
ckb: [Arab, [ME], کوردی]
co: [Latn, [EU], corsu]
cps: [Latn, [AS], Capiceño]
cr-cans: [Cans, [NA], ᓀᐦᐃᔭᐍᐏᐣ]
cr-latn: [Latn, [NA], Nēhiyawēwin]
cr: [[Latn, Cans], [NA], [Nēhiyawēwin, ᓀᐦᐃᔭᐍᐏᐣ]]
crh-cyrl: [Cyrl, [EU], къырымтатарджа (Кирилл)]
crh-latn: [Latn, [EU], qırımtatarca (Latin)]
# Latn is default, Cyrl is common IRL
crh: [[Curl, Latn], [EU], [къырымтатарджа, qırımtatarca]]
cs: [Latn, [EU], česky]
csb: [Latn, [EU], kaszëbsczi]
# FIXME: what script?
cu: [Cyrl, [EU], словѣ́ньскъ / ⰔⰎⰑⰂⰡⰐⰠⰔⰍⰟ]
cv: [Cyrl, [EU], Чӑвашла]
cy: [Latn, [EU], Cymraeg]
da: [Latn, [EU], dansk]
de-at: [Latn, [EU], Österreichisches Deutsch]
de-ch: [Latn, [EU], Schweizer Hochdeutsch]
de-formal: [Latn, [EU], Deutsch (Sie-Form)]
de: [Latn, [EU], Deutsch]
diq: [Latn, [EU, AS], Zazaki]
dsb: [Latn, [EU], dolnoserbski]
dtp: [Latn, [AS], Dusun Bundu-liwan]
dv: [Thaa, [AS], ދިވެހިބަސް]
dz: [Tibt, [AS], ཇོང་ཁ]
ee: [Latn, [AF], eʋegbe]
egl: [Latn, [EU], Emiliàn]
el: [Grek, [EU], Ελληνικά]
eml: [Latn, [EU], emiliàn e rumagnòl]
en-ca: [Latn, [NA], Canadian English]
en-gb: [Latn, [EU, AS, AU], British English]
# world?
en: [Latn, [EU, NA, AU, AF, ME, AS, PA, WW], English]
eo: [Latn, [WW], Esperanto]
es-419: [Latn, [LA], espanol de America Latina]
# world?
es-formal: [Latn, [EU, NA, LA, SA, AF, WW], Español (formal)]
# world?
es: [Latn, [EU, NA, LA, SA, AF, WW], español]
esu: [Latn, [NA], "Yup'ik"]
et: [Latn, [EU], eesti]
eu: [Latn, [EU], euskara]
ext: [Latn, [EU], estremeñu]
fa: [Arab, [ME], فارسی]
ff: [Latn, [AF], Fulfulde]
fi: [Latn, [EU], suomi]
fit: [Latn, [EU], meänkieli]
fj: [Latn, [PA], Na Vosa Vakaviti]
fo: [Latn, [EU], føroyskt]
fr: [Latn, [EU], français]
frc: [Latn, [EU], français cadien]
frp: [Latn, [EU], arpetan]
frr: [Latn, [EU], Nordfriisk]
fur: [Latn, [EU], furlan]
fy: [Latn, [EU], Frysk]
ga: [Latn, [EU], Gaeilge]
gag: [Latn, [EU], Gagauz]
gah: [Latn, [AS], Alekano]
gan-hans: [Hans, [AS], 赣语(简体)]
gan-hant: [Hant, [AS], 贛語(繁體)]
gan: [Hant, [AS], 贛語]
gbz: [Latn, [AS], Dari]
gcf: [Latn, [LA], Guadeloupean Creole French]
gd: [Latn, [EU], Gàidhlig]
gl: [Latn, [EU], galego]
glk: [Arab, [ME], گیلکی]
gn: [Latn, [LA], "Avañe'ẽ"]
gom-deva: [Deva, [AS], कोंकणी]
gom-latn: [Latn, [AS], Konknni]
gom: [[Deva, Latn], [AS], [कोंकणी, Konknni]]
# hmph??
got: [Goth, [EU], 𐌲𐌿𐍄𐌹𐍃𐌺]
grc: [Grek, [EU], Ἀρχαία ἑλληνικὴ]
gsw: [Latn, [EU], Alemannisch]
gu: [Gujr, [AS], ગુજરાતી]
guc: [Latn, [LA], Wayúu]
gur: [Latn, [AF], Gurenɛ]
gv: [Latn, [EU], Gaelg]
# The name in Names.php is Arabic, but everything else is Latn
ha: [Latn, [AF], هَوُسَ]
hak: [Latn, [AS], Hak-kâ-fa]
haw: [Latn, [NA, PA], Hawai`i]
he: [Hebr, [ME], עברית]
# Or maybe world?
hi: [Deva, [AS], हिन्दी]
hif-deva: [Deva, [AS], फ़ीजी हिन्दी]
hif-latn: [Latn, [PA, AU, AS], Fiji Hindi]
hif: [[Deva, Latn[, [PA, AU, AS], [फ़ीजी हिन्दी, Fiji Hindi]]
hil: [Latn, [AS], Ilonggo]
hne: [Deva, [AS], छत्तीसगढ़ी]
ho: [Latn, [PA], Hiri Motu]
hr: [Latn, [EU], hrvatski]
hsb: [Latn, [EU], hornjoserbsce]
hsn: [Hans, [AS], 湘语]
# Haitian Creole. North America, right?
ht: [Latn, [NA], Kreyòl ayisyen]
hu-formal: [Latn, [EU], Magyar (magázó)]
hu: [Latn, [EU], magyar]
hy: [Armn, [EU, ME], Հայերեն]
hz: [Latn, [AF], Otsiherero]
ia: [Latn, [WW], interlingua]
id: [Latn, [AS], Bahasa Indonesia]
ie: [Latn, [WW], Interlingue]
ig: [Latn, [AF], Igbo]
ii: [Yiii, [AS], ꆇꉙ]
ik: [Latn, [NA], Iñupiak]
ike-cans: [Cans, [NA], ᐃᓄᒃᑎᑐᑦ]
ike-latn: [Latn, [NA], inuktitut]
ike: [[Cans, Latn], [NA], [ᐃᓄᒃᑎᑐᑦ, inuktitut]]
ilo: [Latn, [AS], Ilokano]
inh: [Cyrl, [EU], ГӀалгӀай]
io: [Latn, [WW], Ido]
is: [Latn, [EU], íslenska]
it: [Latn, [EU], italiano]
# FIXME: relation to ike?
iu: [Cans, [NA], ᐃᓄᒃᑎᑐᑦ/inuktitut]
ja: [Jpan, [AS], 日本語]
jam: [Latn, [NA], Patois]
jbo: [Latn, [WW], Lojban]
jut: [Latn, [EU], jysk]
# also in the Javanese script (Java), but the Wikipedia is in Latn
jv: [Latn, [AS, PA], Basa Jawa]
ka: [Geor, [EU], ქართული]
kaa: [Latn, [AS], Qaraqalpaqsha]
# Can also be Tfng, but the Wikipedia is mostly Latn
kab: [Latn, [AF, EU], Taqbaylit]
kbd-cyrl: [Cyrl, [EU, ME], Адыгэбзэ]
kbd-latn: [Latn, [EU], Qabardjajəbza]
kbd: [Cyrl, [EU, ME], Адыгэбзэ]
kea: [Latn, [AF], Kabuverdianu]
kg: [Latn, [AF], Kongo]
kgp: [Latn, [LA], Kaingáng]
khw: [Arab, [ME, AS], کھوار]
ki: [Latn, [AF], Gĩkũyũ]
kiu: [Latn, [EU, ME], Kırmancki]
kj: [Latn, [AF], Kwanyama]
kk-arab: [Arab, [EU, AS], قازاقشا (تٴوتە)]
kk-cn: [Arab, [EU, AS, ME], قازاقشا (جۇنگو)]
kk-cyrl: [Cyrl, [EU, AS], қазақша (кирил)]
kk-kz: [Cyrl, [EU, AS], қазақша (Қазақстан)]
kk-latn: [Latn, [EU, AS, ME], qazaqşa (latın)]
kk-tr: [Latn, [EU, AS, ME], qazaqşa (Türkïya)]
kk: [[Arab, Cyrl, Latn] [EU, AS], [قازاقشا, қазақша, qazaqşa]]
kl: [Latn, [NA, EU], kalaallisut]
km: [Khmr, [AS], ភាសាខ្មែរ]
kn: [Knda, [AS], ಕನ್ನಡ]
# Here Hang may be even more appropriate, because kp has more resistance to Han
ko-kp: [Kore, [AS], 한국어 (조선)]
# Kore is an alias for Hangul+Han. Maybe Hang is more appropriate?
ko: [Kore, [AS], 한국어]
koi: [Cyrl, [EU], Перем Коми]
kr: [Latn, [AF], Kanuri]
krc: [Cyrl, [EU], къарачай-малкъар]
kri: [Latn, [AF], Krio]
krj: [Latn, [ME, EU], Kinaray-a]
krl: [Latn, [EU], Karjala]
ks-arab: [Arab, [AS], کٲشُر]
ks-deva: [Deva, [AS], कॉशुर]
# Just because it's the current default in the Wikipedia. Deva may be needed, too.
ks: [[Deva, Arab], [AS], [कॉशुर, کٲشُر]]
ksf: [Latn, [AF], Bafia]
ksh: [Latn, [EU], Ripoarisch]
ku-arab: [Arab, [EU, ME], كوردي (عەرەبی)]
ku-latn: [Latn, [EU, ME], Kurdî (latînî)]
ku: [[Arab, Latn], [EU, ME], [كوردي , Kurdî]]
kv: [Cyrl, [EU], коми]
kw: [Latn, [EU], kernowek]
ky: [Cyrl, [AS], Кыргызча]
la: [Latn, [EU], Latina]
# Most identified with Turkey, Bulgaria, Greece, Spain and Israel,
# but also spoken in Latin America and elsewhere.
# Wikipedia is mostly in Latn, but also in Hebr. (Comparable to az.)
lad: [Latn, [ME, EU, LA], Ladino]
lb: [Latn, [EU], Lëtzebuergesch]
lbe: [Cyrl, [EU], лакку]
lez: [Cyrl, [EU], лезги]
lfn: [Latn, [WW], Lingua Franca Nova]
lg: [Latn, [AF], Luganda]
li: [Latn, [EU], Limburgs]
lij: [Latn, [EU], Ligure]
liv: [Latn, [EU], Līvõ kēļ]
lld: [Latn, [EU], Ladin]
lmo: [Latn, [EU], lumbaart]
ln: [Latn, [AF], lingála]
lo: [Laoo, [AS], ລາວ]
loz: [Latn, [AF], Silozi]
lt: [Latn, [EU], lietuvių]
ltg: [Latn, [EU], latgaļu]
lus: [Latn, [AS], Mizo ţawng]
lv: [Latn, [EU], latviešu]
lzh: [Hant, [AS], 文言]
# Also Geor, but the incubator is in Latn
lzz: [Latn, [EU, ME], Lazuri]
mai: [Deva, [AS], मैथिली]
map-bms: [Latn, [AS], Basa Banyumasan]
mdf: [Cyrl, [EU], мокшень]
mfe: [Latn, [LA], Morisyen]
mg: [Latn, [AF], Malagasy]
mh: [Latn, [PA], Ebon]
mhr: [Cyrl, [EU], олык марий]
mi: [Latn, [PA, AU], Māori]
mic: [Latn, [NA], "Mi'kmaq"]
min: [Latn, [AS], Baso Minangkabau]
mk: [Cyrl, [EU], македонски]
ml: [Mlym, [AS, ME], മലയാളം]
# Hmm, can also have Mong some day in some way
mn: [Cyrl, [AS], монгол]
mnc: [Mong, [AS], ᠮᠠᠨᠵᡠ ᡤᡳᠰᡠᠨ]
mni: [Beng, [AS], মেইতেই লোন্]
mnw: [Mymr, [AS], ဘာသာ မန်]
mo: [Cyrl, [EU], молдовеняскэ]
mr: [Deva, [AS, ME], मराठी]
mrj: [Cyrl, [EU], кырык мары]
ms: [Latn, [AS], Bahasa Melayu]
mt: [Latn, [EU], Malti]
mui: [Latn, [AS], Musi]
mus: [Latn, [NA], Mvskoke]
mwl: [Latn, [EU], Mirandés]
mwv: [Latn, [AS], Behase Mentawei]
my: [Mymr, [AS], မြန်မာဘာသာ]
myv: [Cyrl, [EU], эрзянь]
mzn: [Arab, [ME, AS], مازِرونی]
na: [Latn, [PA, AU], Dorerin Naoero]
nah: [Latn, [NA, LA], Nāhuatl]
nan: [Latn, [AS], Bân-lâm-gú]
nap: [Latn, [EU], Nnapulitano]
nb: [Latn, [EU], norsk (bokmål)]
nds-nl: [Latn, [EU], Nedersaksisch]
nds: [Latn, [EU], Plattdüütsch]
ne: [Deva, [AS], नेपाली]
new: [Deva, [AS], नेपाल भाषा]
ng: [Latn, [AF], Oshiwambo]
niu: [Latn, [PA], ko e vagahau Niuē]
njo: [Latn, [AS], Ao]
nl-informal: [Latn, [EU, SA], Nederlands (informeel)]
nl: [Latn, [EU, SA], Nederlands]
nn: [Latn, [EU], norsk (nynorsk)]
"no": [Latn, [EU]]
nov: [Latn, [WW], Novial]
nqo: [Nkoo, [AF], ߒߞߏ]
nrm: [Latn, [EU], Nouormand]
nso: [Latn, [AF], Sesotho sa Leboa]
nv: [Latn, [NA], Diné bizaad]
ny: [Latn, [AF], Chi-Chewa]
oc: [Latn, [EU], occitan]
om: [Latn, [AF], Oromoo]
or: [Orya, [AS], ଓଡ଼ିଆ]
os: [Cyrl, [EU], Ирон]
pa: [Guru, [AS], ਪੰਜਾਬੀ]
pag: [Latn, [AS], Pangasinan]
pam: [Latn, [AS], Kapampangan]
pap: [Latn, [LA], Papiamentu]
pcd: [Latn, [EU], Picard]
pdc: [Latn, [EU, NA, SA], Deitsch]
pdt: [Latn, [EU, NA, SA], Plautdietsch]
pfl: [Latn, [EU], Pälzisch]
pi: [Deva, [AS], पाळि]
pih: [Latn, [PA], Norfuk / Pitkern]
pis: [Latn, [PA], Pijin]
pko: [Latn, [AF], Pökoot]
pl: [Latn, [EU], polski]
pms: [Latn, [EU], Piemontèis]
pnb: [Arab, [AS, ME], پنجابی]
pnt: [Grek, [EU], Ποντιακά]
ppl: [Latn, [LA], Nawat]
prg: [Latn, [EU], Prūsiskan]
pru: [Latn, [EU], Prūsiskan]
ps: [Arab, [AS, ME], پښتو]
pt-br: [Latn, [SA, LA], português do Brasil]
# world?
pt: [Latn, [EU, LA, AS, PA, AF], português]
qu: [Latn, [SA], Runa Simi]
qug: [Latn, [SA], Runa shimi]
rap: [Latn, [LA], arero rapa nui]
rgn: [Latn, [EU], Rumagnôl]
rif: [Latn, [AF], Tarifit]
rki: [Mymr, [AS], ရခိုင်]
rm: [Latn, [EU], rumantsch]
rmy: [Latn, [EU], Romani]
rn: [Latn, [AF], Kirundi]
ro: [Latn, [EU], română]
roa-rup: [Latn, [EU], Armãneashce]
roa-tara: [Latn, [EU], tarandíne]
rtm: [Latn, [PA], Faeag Rotuma]
# world?
ru: [Cyrl, [EU, AS, ME], русский]
rue: [Cyrl, [EU], русиньскый]
rup: [Latn, [EU], Armãneashce]
ruq: [Latn, [EU], Vlăheşte]
ruq-cyrl: [Cyrl, [EU], Влахесте]
# FIXME: broken autonym
ruq-grek: [Grek, [EU], Megleno-Romanian (Greek script)]
ruq-latn: [Latn, [EU], Vlăheşte]
rw: [Latn, [AF], Kinyarwanda]
ryu: [Kana, [AS], ʔucināguci]
sa: [Deva, [AS], संस्कृतम्]
# Russian Far East - Europe, Asia, or both?
sah: [Cyrl, [EU, AS], саха тыла]
# Currently Latn, potentially Olck
sat: [Latn, [AS], Santali]
saz: [Saur, [AS], ꢱꣃꢬꢵꢯ꣄ꢡ꣄ꢬꢵ]
sc: [Latn, [EU], sardu]
scn: [Latn, [EU], sicilianu]
sco: [Latn, [EU], Scots]
sd: [Arab, [AS], سنڌي]
sdc: [Latn, [EU], Sassaresu]
se: [Latn, [EU], sámegiella]
sei: [Latn, [NA, LA], Cmique Itom]
sg: [Latn, [AF], Sängö]
sgs: [Latn, [EU], žemaitėška]
sh-cyrl: [Cyrl, [EU], српскохрватски]
sh-latn: [Latn, [EU], srpskohrvatski]
sh: [[Latn, Cyrl], [EU], [srpskohrvatski, српскохрватски]]
shi-latn: [Latn, [AF], Tašlḥiyt]
shi-tfng: [Tfng, [AF], ⵜⴰⵛⵍⵃⵉⵜ]
shi: [[Latn, Tfng], [AF], [Tašlḥiyt, ⵜⴰⵛⵍⵃⵉⵜ]]
shn: [Mymr, [AS], လိၵ်ႈတႆး]
si: [Sinh, [AS], සිංහල]
simple: [Latn, [WW], Simple English]
sk: [Latn, [EU], slovenčina]
sl: [Latn, [EU], slovenščina]
sli: [Latn, [EU], Schläsch]
slr: [Latn, [AS], Salırça]
sly: [Latn, [AS], Bahasa Selayar]
sm: [Latn, [PA], Gagana Samoa]
sma: [Latn, [EU], Åarjelsaemien]
sn: [Latn, [AF], chiShona]
so: [Latn, [AF], Soomaaliga]
sq: [Latn, [EU], shqip]
sr-ec: [Cyrl, [EU], српски (ћирилица)]
sr-el: [Latn, [EU], srpski (latinica)]
sr: [[Cyrl, Latn], [EU], [српски, srpski]]
srn: [Latn, [SA, NA, EU], Sranantongo]
ss: [Latn, [AF], SiSwati]
st: [Latn, [AF], Sesotho]
stq: [Latn, [EU], Seeltersk]
su: [Latn, [AS], Basa Sunda]
sv: [Latn, [EU], svenska]
sw: [Latn, [AF], Kiswahili]
swb: [Latn, [AF], Shikomoro]
sxu: [Latn, [EU], Säggssch]
szl: [Latn, [EU], ślůnski]
ta: [Taml, [AS], தமிழ்]
tcy: [Knda, [AS], ತುಳು]
te: [Telu, [AS], తెలుగు]
tet: [Latn, [AS, PA], tetun]
tg-cyrl: [Cyrl, [AS], тоҷикӣ]
tg-latn: [Latn, [AS], tojikī]
tg: [Cyrl, [AS], тоҷикӣ]
th: [Thai, [AS], ไทย]
ti: [Ethi, [AF], ትግርኛ]
tk: [Latn, [AS], Türkmençe]
tkr: [Cyrl, [AS], ЦӀаьхна миз]
tl: [Latn, [AS], Tagalog]
# A very complicated case. Names.php is Cyrl. In TWN they argue about Cyrl, Latn, and Arab. I can't find reliable external sources. --Amir
tly: [Cyrl, [EU, AS, ME], толышә зывон]
tn: [Latn, [AF], Setswana]
to: [Latn, [PA], lea faka-Tonga]
tokipona: [Latn, [WW], Toki Pona]
tpi: [Latn, [PA, AS], Tok Pisin]
tr: [Latn, [EU, ME], Türkçe]
trp: [Latn, [AS], Kokborok (Tripuri)]
tru: [Latn, [AS], Ṫuroyo]
ts: [Latn, [AF], Xitsonga]
tsd: [Grek, [EU], Τσακωνικά]
tt-cyrl: [Cyrl, [EU], татарча]
tt-latn: [Latn, [EU], tatarça]
tt: [[Cyrl, Latn] [EU], [татарча, tatarça]]
ttt: [Cyrl, [AS], Tati]
tum: [Latn, [AF], chiTumbuka]
tw: [Latn, [AF], Twi]
twd: [Latn, [EU], Tweants]
ty: [Latn, [PA], Reo Mā`ohi]
tyv: [Cyrl, [AS], тыва дыл]
tzm: [Tfng, [AF], ⵜⴰⵎⴰⵣⵉⵖⵜ]
udm: [Cyrl, [EU], удмурт]
ug-arab: [Arab, [AS], ئۇيغۇرچە]
ug-latn: [Latn, [AS], Uyghurche]
ug: [[Arab, Latn], [AS], [ئۇيغۇرچە, Uyghurche]]
uk: [Cyrl, [EU], українська]
ur: [Arab, [AS, ME], اردو]
uz: [Latn, [AS], oʻzbekcha]
ve: [Latn, [AF], Tshivenda]
vec: [Latn, [EU], vèneto]
vep: [Latn, [EU], vepsän kel]
vi: [Latn, [AS], Tiếng Việt]
vls: [Latn, [EU], West-Vlams]
vmf: [Latn, [EU], Mainfränkisch]
vo: [Latn, [WW], Volapük]
vot: [Latn, [EU], Vaďďa]
vro: [Latn, [EU], Võro]
wa: [Latn, [EU], walon]
war: [Latn, [AS], Winaray]
wls: [Latn, [PA], "Faka'uvea"]
wo: [Latn, [AF], Wolof]
wuu: [Hans, [EU], 吴语]
xal: [Cyrl, [EU], хальмг]
xh: [Latn, [AF], isiXhosa]
xmf: [Geor, [EU], მარგალური]
ydd: [Hebr, [AS, EU], Eastern Yiddish]
yi: [Hebr, [ME, EU, NA, SA], ייִדיש]
yo: [Latn, [AF], Yorùbá]
yrk: [Cyrl, [AS], Ненэцяʼ вада]
yrl: [Latn, [LA], "ñe'engatú"]
yua: [Latn, [NA, LA], "Maaya T'aan"]
# world?
yue: [Hant, [AS], 粵語]
za: [Latn, [AS], Vahcuengh]
zea: [Latn, [EU], Zeêuws]
zh-classical: [Hant, [AS], 文言]
zh-cn: [Hans, [AS], 中文(中国大陆)]
zh-hans: [Hans, [AS], 中文(简体)]
zh-hant: [Hant, [AS], 中文(繁體)]
zh-hk: [Hant, [AS], 中文(香港)]
zh-min-nan: [Latn, [AS], Bân-lâm-gú]
zh-mo: [Hant, [AS], 中文(澳門)]
zh-my: [Hans, [AS], 中文(马来西亚)]
zh-sg: [Hans, [AS], 中文(新加坡)]
zh-tw: [Hant, [AS], 中文(台灣)]
zh-yue: [Hans, [AS], 粵語]
zh: [Hans, [AS], 中文]
zu: [Latn, [AF], isiZulu]
# The codes are taken from http://unicode.org/iso15924/iso15924-codes.html .
#
# The classification is roughly based on http://www.unicode.org/charts/
# with some practical corrections.
scriptgroups:
# Other is reserved
# Large groups, one script in each
Cyrillic: [Cyrl]
Arabic: [Arab]
# It's probalby different enough from Latin and Cyrillic, but user testing
# may prove otherwise.
Greek: [Grek]
# Couldn't find a better place for Goth.
Latin: [Latn, Goth]
WestCaucasian: [Armn, Geor]
# Maybe it can be unified with Arabic.
# Maybe Thaana can be moved here from SouthAsian.
# Maybe it can be unified with African.
MiddleEastern: [Hebr, Syrc]
African: [Ethi, Nkoo, Tfng]
# India, Nepal, Bangladesh, Sri-Lanka, Bhutan, Maldives.
#
# Thaana (Thaa, the script of Maldives) is here, even though it's RTL,
# because it's closer geographically to India. Maybe it should be moved
# to MiddleEastern or to Arabic, if that would be easier to users.
#
# Tibetan (Tibt) is here, even though it's classified as "Central Asian" by
# Unicode, because linguistically and geographically it's closely related to
# the Brahmic family.
SouthAsian: [Beng, Deva, Gujr, Guru, Knda, Mlym, Orya, Saur, Sinh, Taml, Telu, Tibt, Thaa]
SouthEastAsian: [Batk, Bugi, Java, Khmr, Laoo, Mymr, Thai]
Mongolian: [Mong]
SignWriting: [Sgnw]
CJK: [Hans, Hant, Kana, Kore, Jpan, Yiii]
NativeAmerican: [Cher, Cans]
regiongroups:
# north-america
NA: 1
# latin-america
LA: 1
# south-america
SA: 1
# europe
EU: 2
# middle-east
ME: 2
# africa
AF: 2
# asia
AS: 3
# pacific
PA: 3
# australia
AU: 3
# world wide, international
WW: 4