cb23d50f38
Routine update by running scripts, ignoring clang-format's extensive grumbles. Added notes to util/locale_database/'s README, on the need for that, and enumdata.py, on when to add entries. As usual, several new locales are also added, for existing languages, territories and scripts. [ChangeLog][QtCore][QLocale] Updated to new version of CLDR (the Unicode Consortium's Common Locale Data Repository) v37. Fixes: QTBUG-84669 Pick-to: 5.15 Change-Id: Ib76848bf4bd1219180faf46820077e8d8049a4e3 Reviewed-by: Mårten Nordheim <marten.nordheim@qt.io>
892 lines
45 KiB
Python
892 lines
45 KiB
Python
#!/usr/bin/env python
|
|
#############################################################################
|
|
##
|
|
## Copyright (C) 2020 The Qt Company Ltd.
|
|
## Contact: https://www.qt.io/licensing/
|
|
##
|
|
## This file is part of the test suite of the Qt Toolkit.
|
|
##
|
|
## $QT_BEGIN_LICENSE:GPL-EXCEPT$
|
|
## Commercial License Usage
|
|
## Licensees holding valid commercial Qt licenses may use this file in
|
|
## accordance with the commercial license agreement provided with the
|
|
## Software or, alternatively, in accordance with the terms contained in
|
|
## a written agreement between you and The Qt Company. For licensing terms
|
|
## and conditions see https://www.qt.io/terms-conditions. For further
|
|
## information use the contact form at https://www.qt.io/contact-us.
|
|
##
|
|
## GNU General Public License Usage
|
|
## Alternatively, this file may be used under the terms of the GNU
|
|
## General Public License version 3 as published by the Free Software
|
|
## Foundation with exceptions as appearing in the file LICENSE.GPL3-EXCEPT
|
|
## included in the packaging of this file. Please review the following
|
|
## information to ensure the GNU General Public License requirements will
|
|
## be met: https://www.gnu.org/licenses/gpl-3.0.html.
|
|
##
|
|
## $QT_END_LICENSE$
|
|
##
|
|
#############################################################################
|
|
|
|
# A run of cldr2qlocalexml.py will produce output reporting any
|
|
# language, script and country codes it sees, in data, for which it
|
|
# can find a name (taken always from en.xml) that could potentially be
|
|
# used. There is no point adding a mapping for such a code unless the
|
|
# CLDR's common/main/ contains an XML file for at least one locale
|
|
# that exerciss it.
|
|
|
|
# Each *_list reflects the current values of its enums in qlocale.h;
|
|
# if new xml language files are available in CLDR, these languages and
|
|
# countries need to be *appended* to this list (for compatibility
|
|
# between versions). Include any spaces present in names (scripts
|
|
# shall squish them out for the enum entries) in *_list, but use the
|
|
# squished forms of names in the *_aliases mappings.
|
|
|
|
### Qt 6: restore alphabetic order in each list.
|
|
|
|
language_list = {
|
|
0: ["AnyLanguage", " "],
|
|
1: ["C", " "],
|
|
2: ["Abkhazian", "ab"],
|
|
3: ["Oromo", "om"], # macrolanguage
|
|
4: ["Afar", "aa"],
|
|
5: ["Afrikaans", "af"],
|
|
6: ["Albanian", "sq"], # macrolanguage
|
|
7: ["Amharic", "am"],
|
|
8: ["Arabic", "ar"], # macrolanguage
|
|
9: ["Armenian", "hy"],
|
|
10: ["Assamese", "as"],
|
|
11: ["Aymara", "ay"], # macrolanguage
|
|
12: ["Azerbaijani", "az"], # macrolanguage
|
|
13: ["Bashkir", "ba"],
|
|
14: ["Basque", "eu"],
|
|
15: ["Bengali", "bn"],
|
|
16: ["Dzongkha", "dz"],
|
|
17: ["Bihari", "bh"],
|
|
18: ["Bislama", "bi"],
|
|
19: ["Breton", "br"],
|
|
20: ["Bulgarian", "bg"],
|
|
21: ["Burmese", "my"],
|
|
22: ["Belarusian", "be"],
|
|
23: ["Khmer", "km"],
|
|
24: ["Catalan", "ca"],
|
|
25: ["Chinese", "zh"], # macrolanguage
|
|
26: ["Corsican", "co"],
|
|
27: ["Croatian", "hr"],
|
|
28: ["Czech", "cs"],
|
|
29: ["Danish", "da"],
|
|
30: ["Dutch", "nl"],
|
|
31: ["English", "en"],
|
|
32: ["Esperanto", "eo"],
|
|
33: ["Estonian", "et"], # macrolanguage
|
|
34: ["Faroese", "fo"],
|
|
35: ["Fijian", "fj"],
|
|
36: ["Finnish", "fi"],
|
|
37: ["French", "fr"],
|
|
38: ["Western Frisian", "fy"],
|
|
39: ["Gaelic", "gd"],
|
|
40: ["Galician", "gl"],
|
|
41: ["Georgian", "ka"],
|
|
42: ["German", "de"],
|
|
43: ["Greek", "el"],
|
|
44: ["Greenlandic", "kl"],
|
|
45: ["Guarani", "gn"], # macrolanguage
|
|
46: ["Gujarati", "gu"],
|
|
47: ["Hausa", "ha"],
|
|
48: ["Hebrew", "he"],
|
|
49: ["Hindi", "hi"],
|
|
50: ["Hungarian", "hu"],
|
|
51: ["Icelandic", "is"],
|
|
52: ["Indonesian", "id"],
|
|
53: ["Interlingua", "ia"],
|
|
54: ["Interlingue", "ie"],
|
|
55: ["Inuktitut", "iu"], # macrolanguage
|
|
56: ["Inupiak", "ik"], # macrolanguage
|
|
57: ["Irish", "ga"],
|
|
58: ["Italian", "it"],
|
|
59: ["Japanese", "ja"],
|
|
60: ["Javanese", "jv"],
|
|
61: ["Kannada", "kn"],
|
|
62: ["Kashmiri", "ks"],
|
|
63: ["Kazakh", "kk"],
|
|
64: ["Kinyarwanda", "rw"],
|
|
65: ["Kirghiz", "ky"],
|
|
66: ["Korean", "ko"],
|
|
67: ["Kurdish", "ku"], # macrolanguage
|
|
68: ["Rundi", "rn"],
|
|
69: ["Lao", "lo"],
|
|
70: ["Latin", "la"],
|
|
71: ["Latvian", "lv"], # macrolanguage
|
|
72: ["Lingala", "ln"],
|
|
73: ["Lithuanian", "lt"],
|
|
74: ["Macedonian", "mk"],
|
|
75: ["Malagasy", "mg"], # macrolanguage
|
|
76: ["Malay", "ms"], # macrolanguage
|
|
77: ["Malayalam", "ml"],
|
|
78: ["Maltese", "mt"],
|
|
79: ["Maori", "mi"],
|
|
80: ["Marathi", "mr"],
|
|
81: ["Marshallese", "mh"],
|
|
82: ["Mongolian", "mn"], # macrolanguage
|
|
83: ["Nauru", "na"],
|
|
84: ["Nepali", "ne"], # macrolanguage
|
|
85: ["Norwegian Bokmal", "nb"],
|
|
86: ["Occitan", "oc"],
|
|
87: ["Oriya", "or"], # macrolanguage
|
|
88: ["Pashto", "ps"], # macrolanguage
|
|
89: ["Persian", "fa"], # macrolanguage
|
|
90: ["Polish", "pl"],
|
|
91: ["Portuguese", "pt"],
|
|
92: ["Punjabi", "pa"],
|
|
93: ["Quechua", "qu"], # macrolanguage
|
|
94: ["Romansh", "rm"],
|
|
95: ["Romanian", "ro"],
|
|
96: ["Russian", "ru"],
|
|
97: ["Samoan", "sm"],
|
|
98: ["Sango", "sg"],
|
|
99: ["Sanskrit", "sa"],
|
|
100: ["Serbian", "sr"],
|
|
101: ["Ossetic", "os"],
|
|
102: ["Southern Sotho", "st"],
|
|
103: ["Tswana", "tn"],
|
|
104: ["Shona", "sn"],
|
|
105: ["Sindhi", "sd"],
|
|
106: ["Sinhala", "si"],
|
|
107: ["Swati", "ss"],
|
|
108: ["Slovak", "sk"],
|
|
109: ["Slovenian", "sl"],
|
|
110: ["Somali", "so"],
|
|
111: ["Spanish", "es"],
|
|
112: ["Sundanese", "su"],
|
|
113: ["Swahili", "sw"], # macrolanguage
|
|
114: ["Swedish", "sv"],
|
|
115: ["Sardinian", "sc"], # macrolanguage
|
|
116: ["Tajik", "tg"],
|
|
117: ["Tamil", "ta"],
|
|
118: ["Tatar", "tt"],
|
|
119: ["Telugu", "te"],
|
|
120: ["Thai", "th"],
|
|
121: ["Tibetan", "bo"],
|
|
122: ["Tigrinya", "ti"],
|
|
123: ["Tongan", "to"],
|
|
124: ["Tsonga", "ts"],
|
|
125: ["Turkish", "tr"],
|
|
126: ["Turkmen", "tk"],
|
|
127: ["Tahitian", "ty"],
|
|
128: ["Uighur", "ug"],
|
|
129: ["Ukrainian", "uk"],
|
|
130: ["Urdu", "ur"],
|
|
131: ["Uzbek", "uz"], # macrolanguage
|
|
132: ["Vietnamese", "vi"],
|
|
133: ["Volapuk", "vo"],
|
|
134: ["Welsh", "cy"],
|
|
135: ["Wolof", "wo"],
|
|
136: ["Xhosa", "xh"],
|
|
137: ["Yiddish", "yi"], # macrolanguage
|
|
138: ["Yoruba", "yo"],
|
|
139: ["Zhuang", "za"], # macrolanguage
|
|
140: ["Zulu", "zu"],
|
|
141: ["Norwegian Nynorsk", "nn"],
|
|
142: ["Bosnian", "bs"],
|
|
143: ["Divehi", "dv"],
|
|
144: ["Manx", "gv"],
|
|
145: ["Cornish", "kw"],
|
|
146: ["Akan", "ak"], # macrolanguage
|
|
147: ["Konkani", "kok"],
|
|
148: ["Ga", "gaa"],
|
|
149: ["Igbo", "ig" ],
|
|
150: ["Kamba", "kam"],
|
|
151: ["Syriac", "syr"],
|
|
152: ["Blin", "byn"],
|
|
153: ["Geez", "gez"],
|
|
154: ["Koro", "kfo"],
|
|
155: ["Sidamo", "sid"],
|
|
156: ["Atsam", "cch"],
|
|
157: ["Tigre", "tig"],
|
|
158: ["Jju", "kaj"],
|
|
159: ["Friulian", "fur"],
|
|
160: ["Venda", "ve" ],
|
|
161: ["Ewe", "ee" ],
|
|
162: ["Walamo", "wal"],
|
|
163: ["Hawaiian", "haw"],
|
|
164: ["Tyap", "kcg"],
|
|
165: ["Nyanja", "ny" ],
|
|
166: ["Filipino", "fil"],
|
|
167: ["Swiss German", "gsw"],
|
|
168: ["Sichuan Yi", "ii" ],
|
|
169: ["Kpelle", "kpe"],
|
|
170: ["Low German", "nds"],
|
|
171: ["South Ndebele", "nr" ],
|
|
172: ["Northern Sotho", "nso"],
|
|
173: ["Northern Sami", "se" ],
|
|
174: ["Taroko", "trv"],
|
|
175: ["Gusii", "guz"],
|
|
176: ["Taita", "dav"],
|
|
177: ["Fulah", "ff"], # macrolanguage
|
|
178: ["Kikuyu", "ki"],
|
|
179: ["Samburu", "saq"],
|
|
180: ["Sena", "seh"],
|
|
181: ["North Ndebele", "nd"],
|
|
182: ["Rombo", "rof"],
|
|
183: ["Tachelhit", "shi"],
|
|
184: ["Kabyle", "kab"],
|
|
185: ["Nyankole", "nyn"],
|
|
186: ["Bena", "bez"],
|
|
187: ["Vunjo", "vun"],
|
|
188: ["Bambara", "bm"],
|
|
189: ["Embu", "ebu"],
|
|
190: ["Cherokee", "chr"],
|
|
191: ["Morisyen", "mfe"],
|
|
192: ["Makonde", "kde"],
|
|
193: ["Langi", "lag"],
|
|
194: ["Ganda", "lg"],
|
|
195: ["Bemba", "bem"],
|
|
196: ["Kabuverdianu", "kea"],
|
|
197: ["Meru", "mer"],
|
|
198: ["Kalenjin", "kln"],
|
|
199: ["Nama", "naq"],
|
|
200: ["Machame", "jmc"],
|
|
201: ["Colognian", "ksh"],
|
|
202: ["Masai", "mas"],
|
|
203: ["Soga", "xog"],
|
|
204: ["Luyia", "luy"],
|
|
205: ["Asu", "asa"],
|
|
206: ["Teso", "teo"],
|
|
207: ["Saho", "ssy"],
|
|
208: ["Koyra Chiini", "khq"],
|
|
209: ["Rwa", "rwk"],
|
|
210: ["Luo", "luo"],
|
|
211: ["Chiga", "cgg"],
|
|
212: ["Central Morocco Tamazight", "tzm"],
|
|
213: ["Koyraboro Senni", "ses"],
|
|
214: ["Shambala", "ksb"],
|
|
215: ["Bodo", "brx"],
|
|
216: ["Avaric", "av"],
|
|
217: ["Chamorro", "ch"],
|
|
218: ["Chechen", "ce"],
|
|
219: ["Church", "cu"], # macrolanguage
|
|
220: ["Chuvash", "cv"],
|
|
221: ["Cree", "cr"], # macrolanguage
|
|
222: ["Haitian", "ht"],
|
|
223: ["Herero", "hz"],
|
|
224: ["Hiri Motu", "ho"],
|
|
225: ["Kanuri", "kr"], # macrolanguage
|
|
226: ["Komi", "kv"], # macrolanguage
|
|
227: ["Kongo", "kg"], # macrolanguage
|
|
228: ["Kwanyama", "kj"],
|
|
229: ["Limburgish", "li"],
|
|
230: ["Luba Katanga", "lu"],
|
|
231: ["Luxembourgish", "lb"],
|
|
232: ["Navaho", "nv"],
|
|
233: ["Ndonga", "ng"],
|
|
234: ["Ojibwa", "oj"], # macrolanguage
|
|
235: ["Pali", "pi"], # macrolanguage
|
|
236: ["Walloon", "wa"],
|
|
237: ["Aghem", "agq"],
|
|
238: ["Basaa", "bas"],
|
|
239: ["Zarma", "dje"],
|
|
240: ["Duala", "dua"],
|
|
241: ["Jola Fonyi", "dyo"],
|
|
242: ["Ewondo", "ewo"],
|
|
243: ["Bafia", "ksf"],
|
|
244: ["Makhuwa Meetto", "mgh"],
|
|
245: ["Mundang", "mua"],
|
|
246: ["Kwasio", "nmg"],
|
|
247: ["Nuer", "nus"],
|
|
248: ["Sakha", "sah"],
|
|
249: ["Sangu", "sbp"],
|
|
250: ["Congo Swahili", "swc"],
|
|
251: ["Tasawaq", "twq"],
|
|
252: ["Vai", "vai"],
|
|
253: ["Walser", "wae"],
|
|
254: ["Yangben", "yav"],
|
|
255: ["Avestan", "ae"],
|
|
256: ["Asturian", "ast"],
|
|
257: ["Ngomba", "jgo"],
|
|
258: ["Kako", "kkj"],
|
|
259: ["Meta", "mgo"],
|
|
260: ["Ngiemboon", "nnh"],
|
|
261: ["Aragonese", "an"],
|
|
262: ["Akkadian", "akk"],
|
|
263: ["Ancient Egyptian", "egy"],
|
|
264: ["Ancient Greek", "grc"],
|
|
265: ["Aramaic", "arc"],
|
|
266: ["Balinese", "ban"],
|
|
267: ["Bamun", "bax"],
|
|
268: ["Batak Toba", "bbc"],
|
|
269: ["Buginese", "bug"],
|
|
270: ["Buhid", "bku"],
|
|
271: ["Carian", "xcr"],
|
|
272: ["Chakma", "ccp"],
|
|
273: ["Classical Mandaic", "myz"],
|
|
274: ["Coptic", "cop"],
|
|
275: ["Dogri", "doi"], # macrolanguage
|
|
276: ["Eastern Cham", "cjm"],
|
|
277: ["Eastern Kayah", "eky"],
|
|
278: ["Etruscan", "ett"],
|
|
279: ["Gothic", "got"],
|
|
280: ["Hanunoo", "hnn"],
|
|
281: ["Ingush", "inh"],
|
|
282: ["Large Flowery Miao", "hmd"],
|
|
283: ["Lepcha", "lep"],
|
|
284: ["Limbu", "lif"],
|
|
285: ["Lisu", "lis"],
|
|
286: ["Lu", "khb"],
|
|
287: ["Lycian", "xlc"],
|
|
288: ["Lydian", "xld"],
|
|
289: ["Mandingo", "man"], # macrolanguage
|
|
290: ["Manipuri", "mni"],
|
|
291: ["Meroitic", "xmr"],
|
|
292: ["Northern Thai", "nod"],
|
|
293: ["Old Irish", "sga"],
|
|
294: ["Old Norse", "non"],
|
|
295: ["Old Persian", "peo"],
|
|
296: ["Old Turkish", "otk"],
|
|
297: ["Pahlavi", "pal"],
|
|
298: ["Parthian", "xpr"],
|
|
299: ["Phoenician", "phn"],
|
|
300: ["Prakrit Language", "pra"],
|
|
301: ["Rejang", "rej"],
|
|
302: ["Sabaean", "xsa"],
|
|
303: ["Samaritan", "smp"],
|
|
304: ["Santali", "sat"],
|
|
305: ["Saurashtra", "saz"],
|
|
306: ["Sora", "srb"],
|
|
307: ["Sylheti", "syl"],
|
|
308: ["Tagbanwa", "tbw"],
|
|
309: ["Tai Dam", "blt"],
|
|
310: ["Tai Nua", "tdd"],
|
|
311: ["Ugaritic", "uga"],
|
|
312: ["Akoose", "bss"],
|
|
313: ["Lakota", "lkt"],
|
|
314: ["Standard Moroccan Tamazight", "zgh"],
|
|
315: ["Mapuche", "arn"],
|
|
316: ["Central Kurdish", "ckb"],
|
|
317: ["Lower Sorbian", "dsb"],
|
|
318: ["Upper Sorbian", "hsb"],
|
|
319: ["Kenyang", "ken"],
|
|
320: ["Mohawk", "moh"],
|
|
321: ["Nko", "nqo"],
|
|
322: ["Prussian", "prg"],
|
|
323: ["Kiche", "quc"],
|
|
324: ["Southern Sami", "sma"],
|
|
325: ["Lule Sami", "smj"],
|
|
326: ["Inari Sami", "smn"],
|
|
327: ["Skolt Sami", "sms"],
|
|
328: ["Warlpiri", "wbp"],
|
|
329: ["Manichaean Middle Persian", "xmn"],
|
|
330: ["Mende", "men"],
|
|
331: ["Ancient North Arabian", "xna"],
|
|
332: ["Linear A", "lab"],
|
|
333: ["Hmong Njua", "hnj"],
|
|
334: ["Ho", "hoc"],
|
|
335: ["Lezghian", "lez"],
|
|
336: ["Bassa", "bsq"],
|
|
337: ["Mono", "mru"],
|
|
338: ["Tedim Chin", "ctd"],
|
|
339: ["Maithili", "mai"],
|
|
340: ["Ahom", "aho"],
|
|
341: ["American Sign Language", "ase"],
|
|
342: ["Ardhamagadhi Prakrit", "pka"],
|
|
343: ["Bhojpuri", "bho"],
|
|
344: ["Hieroglyphic Luwian", "hlu"],
|
|
345: ["Literary Chinese", "lzh"],
|
|
346: ["Mazanderani", "mzn"],
|
|
347: ["Mru", "mro"],
|
|
348: ["Newari", "new"],
|
|
349: ["Northern Luri", "lrc"],
|
|
350: ["Palauan", "pau"],
|
|
351: ["Papiamento", "pap"],
|
|
352: ["Saraiki", "skr"],
|
|
353: ["Tokelau", "tkl"],
|
|
354: ["Tok Pisin", "tpi"],
|
|
355: ["Tuvalu", "tvl"],
|
|
356: ["Uncoded Languages", "mis"],
|
|
357: ["Cantonese", "yue"],
|
|
358: ["Osage", "osa"],
|
|
359: ["Tangut", "txg"],
|
|
360: ["Ido", "io"],
|
|
361: ["Lojban", "jbo"],
|
|
362: ["Sicilian", "scn"],
|
|
363: ["Southern Kurdish", "sdh"],
|
|
364: ["Western Balochi", "bgn"],
|
|
365: ["Cebuano", "ceb"],
|
|
366: ["Erzya", "myv"],
|
|
367: ["Chickasaw", "cic"],
|
|
368: ["Muscogee", "mus"],
|
|
369: ["Silesian", "szl"],
|
|
370: ["Nigerian Pidgin", "pcm"],
|
|
}
|
|
|
|
language_aliases = {
|
|
# Legacy - should disappear at some point:
|
|
'Norwegian': 'NorwegianBokmal',
|
|
'Moldavian': 'Romanian',
|
|
'SerboCroatian': 'Serbian',
|
|
'Tagalog': 'Filipino',
|
|
'Twi': 'Akan',
|
|
# Renamings:
|
|
'Afan': 'Oromo',
|
|
'Byelorussian': 'Belarusian',
|
|
'Bhutani': 'Dzongkha',
|
|
'Cambodian': 'Khmer',
|
|
'Kurundi': 'Rundi',
|
|
'RhaetoRomance': 'Romansh',
|
|
'Chewa': 'Nyanja',
|
|
'Frisian': 'WesternFrisian',
|
|
'Uigur': 'Uighur',
|
|
}
|
|
|
|
country_list = {
|
|
0: ["AnyCountry", "ZZ"],
|
|
1: ["Afghanistan", "AF"],
|
|
2: ["Albania", "AL"],
|
|
3: ["Algeria", "DZ"],
|
|
4: ["American Samoa", "AS"],
|
|
5: ["Andorra", "AD"],
|
|
6: ["Angola", "AO"],
|
|
7: ["Anguilla", "AI"],
|
|
8: ["Antarctica", "AQ"],
|
|
9: ["Antigua And Barbuda", "AG"],
|
|
10: ["Argentina", "AR"],
|
|
11: ["Armenia", "AM"],
|
|
12: ["Aruba", "AW"],
|
|
13: ["Australia", "AU"],
|
|
14: ["Austria", "AT"],
|
|
15: ["Azerbaijan", "AZ"],
|
|
16: ["Bahamas", "BS"],
|
|
17: ["Bahrain", "BH"],
|
|
18: ["Bangladesh", "BD"],
|
|
19: ["Barbados", "BB"],
|
|
20: ["Belarus", "BY"],
|
|
21: ["Belgium", "BE"],
|
|
22: ["Belize", "BZ"],
|
|
23: ["Benin", "BJ"],
|
|
24: ["Bermuda", "BM"],
|
|
25: ["Bhutan", "BT"],
|
|
26: ["Bolivia", "BO"],
|
|
27: ["Bosnia And Herzegowina", "BA"],
|
|
28: ["Botswana", "BW"],
|
|
29: ["Bouvet Island", "BV"],
|
|
30: ["Brazil", "BR"],
|
|
31: ["British Indian Ocean Territory", "IO"],
|
|
32: ["Brunei", "BN"],
|
|
33: ["Bulgaria", "BG"],
|
|
34: ["Burkina Faso", "BF"],
|
|
35: ["Burundi", "BI"],
|
|
36: ["Cambodia", "KH"],
|
|
37: ["Cameroon", "CM"],
|
|
38: ["Canada", "CA"],
|
|
39: ["Cape Verde", "CV"],
|
|
40: ["Cayman Islands", "KY"],
|
|
41: ["Central African Republic", "CF"],
|
|
42: ["Chad", "TD"],
|
|
43: ["Chile", "CL"],
|
|
44: ["China", "CN"],
|
|
45: ["Christmas Island", "CX"],
|
|
46: ["Cocos Islands", "CC"],
|
|
47: ["Colombia", "CO"],
|
|
48: ["Comoros", "KM"],
|
|
49: ["Congo Kinshasa", "CD"],
|
|
50: ["Congo Brazzaville", "CG"],
|
|
51: ["Cook Islands", "CK"],
|
|
52: ["Costa Rica", "CR"],
|
|
53: ["Ivory Coast", "CI"],
|
|
54: ["Croatia", "HR"],
|
|
55: ["Cuba", "CU"],
|
|
56: ["Cyprus", "CY"],
|
|
57: ["Czech Republic", "CZ"],
|
|
58: ["Denmark", "DK"],
|
|
59: ["Djibouti", "DJ"],
|
|
60: ["Dominica", "DM"],
|
|
61: ["Dominican Republic", "DO"],
|
|
62: ["East Timor", "TL"],
|
|
63: ["Ecuador", "EC"],
|
|
64: ["Egypt", "EG"],
|
|
65: ["El Salvador", "SV"],
|
|
66: ["Equatorial Guinea", "GQ"],
|
|
67: ["Eritrea", "ER"],
|
|
68: ["Estonia", "EE"],
|
|
69: ["Ethiopia", "ET"],
|
|
70: ["Falkland Islands", "FK"],
|
|
71: ["Faroe Islands", "FO"],
|
|
72: ["Fiji", "FJ"],
|
|
73: ["Finland", "FI"],
|
|
74: ["France", "FR"],
|
|
75: ["Guernsey", "GG"],
|
|
76: ["French Guiana", "GF"],
|
|
77: ["French Polynesia", "PF"],
|
|
78: ["French Southern Territories", "TF"],
|
|
79: ["Gabon", "GA"],
|
|
80: ["Gambia", "GM"],
|
|
81: ["Georgia", "GE"],
|
|
82: ["Germany", "DE"],
|
|
83: ["Ghana", "GH"],
|
|
84: ["Gibraltar", "GI"],
|
|
85: ["Greece", "GR"],
|
|
86: ["Greenland", "GL"],
|
|
87: ["Grenada", "GD"],
|
|
88: ["Guadeloupe", "GP"],
|
|
89: ["Guam", "GU"],
|
|
90: ["Guatemala", "GT"],
|
|
91: ["Guinea", "GN"],
|
|
92: ["Guinea Bissau", "GW"],
|
|
93: ["Guyana", "GY"],
|
|
94: ["Haiti", "HT"],
|
|
95: ["Heard And McDonald Islands", "HM"],
|
|
96: ["Honduras", "HN"],
|
|
97: ["Hong Kong", "HK"],
|
|
98: ["Hungary", "HU"],
|
|
99: ["Iceland", "IS"],
|
|
100: ["India", "IN"],
|
|
101: ["Indonesia", "ID"],
|
|
102: ["Iran", "IR"],
|
|
103: ["Iraq", "IQ"],
|
|
104: ["Ireland", "IE"],
|
|
105: ["Israel", "IL"],
|
|
106: ["Italy", "IT"],
|
|
107: ["Jamaica", "JM"],
|
|
108: ["Japan", "JP"],
|
|
109: ["Jordan", "JO"],
|
|
110: ["Kazakhstan", "KZ"],
|
|
111: ["Kenya", "KE"],
|
|
112: ["Kiribati", "KI"],
|
|
113: ["North Korea", "KP"],
|
|
114: ["South Korea", "KR"],
|
|
115: ["Kuwait", "KW"],
|
|
116: ["Kyrgyzstan", "KG"],
|
|
117: ["Laos", "LA"],
|
|
118: ["Latvia", "LV"],
|
|
119: ["Lebanon", "LB"],
|
|
120: ["Lesotho", "LS"],
|
|
121: ["Liberia", "LR"],
|
|
122: ["Libya", "LY"],
|
|
123: ["Liechtenstein", "LI"],
|
|
124: ["Lithuania", "LT"],
|
|
125: ["Luxembourg", "LU"],
|
|
126: ["Macau", "MO"],
|
|
127: ["Macedonia", "MK"],
|
|
128: ["Madagascar", "MG"],
|
|
129: ["Malawi", "MW"],
|
|
130: ["Malaysia", "MY"],
|
|
131: ["Maldives", "MV"],
|
|
132: ["Mali", "ML"],
|
|
133: ["Malta", "MT"],
|
|
134: ["Marshall Islands", "MH"],
|
|
135: ["Martinique", "MQ"],
|
|
136: ["Mauritania", "MR"],
|
|
137: ["Mauritius", "MU"],
|
|
138: ["Mayotte", "YT"],
|
|
139: ["Mexico", "MX"],
|
|
140: ["Micronesia", "FM"],
|
|
141: ["Moldova", "MD"],
|
|
142: ["Monaco", "MC"],
|
|
143: ["Mongolia", "MN"],
|
|
144: ["Montserrat", "MS"],
|
|
145: ["Morocco", "MA"],
|
|
146: ["Mozambique", "MZ"],
|
|
147: ["Myanmar", "MM"],
|
|
148: ["Namibia", "NA"],
|
|
149: ["Nauru", "NR"],
|
|
150: ["Nepal", "NP"],
|
|
151: ["Netherlands", "NL"],
|
|
152: ["Cura Sao", "CW"],
|
|
153: ["New Caledonia", "NC"],
|
|
154: ["New Zealand", "NZ"],
|
|
155: ["Nicaragua", "NI"],
|
|
156: ["Niger", "NE"],
|
|
157: ["Nigeria", "NG"],
|
|
158: ["Niue", "NU"],
|
|
159: ["Norfolk Island", "NF"],
|
|
160: ["Northern Mariana Islands", "MP"],
|
|
161: ["Norway", "NO"],
|
|
162: ["Oman", "OM"],
|
|
163: ["Pakistan", "PK"],
|
|
164: ["Palau", "PW"],
|
|
165: ["Palestinian Territories", "PS"],
|
|
166: ["Panama", "PA"],
|
|
167: ["Papua New Guinea", "PG"],
|
|
168: ["Paraguay", "PY"],
|
|
169: ["Peru", "PE"],
|
|
170: ["Philippines", "PH"],
|
|
171: ["Pitcairn", "PN"],
|
|
172: ["Poland", "PL"],
|
|
173: ["Portugal", "PT"],
|
|
174: ["Puerto Rico", "PR"],
|
|
175: ["Qatar", "QA"],
|
|
176: ["Reunion", "RE"],
|
|
177: ["Romania", "RO"],
|
|
178: ["Russia", "RU"],
|
|
179: ["Rwanda", "RW"],
|
|
180: ["Saint Kitts And Nevis", "KN"],
|
|
181: ["Saint Lucia", "LC"],
|
|
182: ["Saint Vincent And The Grenadines", "VC"],
|
|
183: ["Samoa", "WS"],
|
|
184: ["San Marino", "SM"],
|
|
185: ["Sao Tome And Principe", "ST"],
|
|
186: ["Saudi Arabia", "SA"],
|
|
187: ["Senegal", "SN"],
|
|
188: ["Seychelles", "SC"],
|
|
189: ["Sierra Leone", "SL"],
|
|
190: ["Singapore", "SG"],
|
|
191: ["Slovakia", "SK"],
|
|
192: ["Slovenia", "SI"],
|
|
193: ["Solomon Islands", "SB"],
|
|
194: ["Somalia", "SO"],
|
|
195: ["South Africa", "ZA"],
|
|
196: ["South Georgia And The South Sandwich Islands", "GS"],
|
|
197: ["Spain", "ES"],
|
|
198: ["Sri Lanka", "LK"],
|
|
199: ["Saint Helena", "SH"],
|
|
200: ["Saint Pierre And Miquelon", "PM"],
|
|
201: ["Sudan", "SD"],
|
|
202: ["Suriname", "SR"],
|
|
203: ["Svalbard And Jan Mayen Islands", "SJ"],
|
|
204: ["Swaziland", "SZ"],
|
|
205: ["Sweden", "SE"],
|
|
206: ["Switzerland", "CH"],
|
|
207: ["Syria", "SY"],
|
|
208: ["Taiwan", "TW"],
|
|
209: ["Tajikistan", "TJ"],
|
|
210: ["Tanzania", "TZ"],
|
|
211: ["Thailand", "TH"],
|
|
212: ["Togo", "TG"],
|
|
213: ["Tokelau", "TK"],
|
|
214: ["Tonga", "TO"],
|
|
215: ["Trinidad And Tobago", "TT"],
|
|
216: ["Tunisia", "TN"],
|
|
217: ["Turkey", "TR"],
|
|
218: ["Turkmenistan", "TM"],
|
|
219: ["Turks And Caicos Islands", "TC"],
|
|
220: ["Tuvalu", "TV"],
|
|
221: ["Uganda", "UG"],
|
|
222: ["Ukraine", "UA"],
|
|
223: ["United Arab Emirates", "AE"],
|
|
224: ["United Kingdom", "GB"],
|
|
225: ["United States", "US"],
|
|
226: ["United States Minor Outlying Islands", "UM"],
|
|
227: ["Uruguay", "UY"],
|
|
228: ["Uzbekistan", "UZ"],
|
|
229: ["Vanuatu", "VU"],
|
|
230: ["Vatican City State", "VA"],
|
|
231: ["Venezuela", "VE"],
|
|
232: ["Vietnam", "VN"],
|
|
233: ["British Virgin Islands", "VG"],
|
|
234: ["United States Virgin Islands", "VI"],
|
|
235: ["Wallis And Futuna Islands", "WF"],
|
|
236: ["Western Sahara", "EH"],
|
|
237: ["Yemen", "YE"],
|
|
238: ["Canary Islands", "IC"],
|
|
239: ["Zambia", "ZM"],
|
|
240: ["Zimbabwe", "ZW"],
|
|
241: ["Clipperton Island", "CP"],
|
|
242: ["Montenegro", "ME"],
|
|
243: ["Serbia", "RS"],
|
|
244: ["Saint Barthelemy", "BL"],
|
|
245: ["Saint Martin", "MF"],
|
|
246: ["Latin America", "419"],
|
|
247: ["Ascension Island", "AC"],
|
|
248: ["Aland Islands", "AX"],
|
|
249: ["Diego Garcia", "DG"],
|
|
250: ["Ceuta And Melilla", "EA"],
|
|
251: ["Isle Of Man", "IM"],
|
|
252: ["Jersey", "JE"],
|
|
253: ["Tristan Da Cunha", "TA"],
|
|
254: ["South Sudan", "SS"],
|
|
255: ["Bonaire", "BQ"],
|
|
256: ["Sint Maarten", "SX"],
|
|
257: ["Kosovo", "XK"],
|
|
258: ["European Union", "EU"],
|
|
259: ["Outlying Oceania", "QO"],
|
|
260: ["World", "001"],
|
|
261: ["Europe", "150"],
|
|
}
|
|
|
|
country_aliases = {
|
|
# Deprecated:
|
|
'Tokelau': 'TokelauCountry',
|
|
'Tuvalu': 'TuvaluCountry',
|
|
# Renamings:
|
|
'DemocraticRepublicOfCongo': 'CongoKinshasa',
|
|
'PeoplesRepublicOfCongo': 'CongoBrazzaville',
|
|
'DemocraticRepublicOfKorea': 'NorthKorea',
|
|
'RepublicOfKorea': 'SouthKorea',
|
|
'RussianFederation': 'Russia',
|
|
'SyrianArabRepublic': 'Syria',
|
|
'LatinAmericaAndTheCaribbean': 'LatinAmerica',
|
|
}
|
|
|
|
script_list = {
|
|
0: ["AnyScript", "Zzzz"],
|
|
1: ["Arabic", "Arab"],
|
|
2: ["Cyrillic", "Cyrl"],
|
|
3: ["Deseret", "Dsrt"],
|
|
4: ["Gurmukhi", "Guru"],
|
|
5: ["Simplified Han", "Hans"],
|
|
6: ["Traditional Han", "Hant"],
|
|
7: ["Latin", "Latn"],
|
|
8: ["Mongolian", "Mong"],
|
|
9: ["Tifinagh", "Tfng"],
|
|
10: ["Armenian", "Armn"],
|
|
11: ["Bengali", "Beng"],
|
|
12: ["Cherokee", "Cher"],
|
|
13: ["Devanagari", "Deva"],
|
|
14: ["Ethiopic", "Ethi"],
|
|
15: ["Georgian", "Geor"],
|
|
16: ["Greek", "Grek"],
|
|
17: ["Gujarati", "Gujr"],
|
|
18: ["Hebrew", "Hebr"],
|
|
19: ["Japanese", "Jpan"],
|
|
20: ["Khmer", "Khmr"],
|
|
21: ["Kannada", "Knda"],
|
|
22: ["Korean", "Kore"],
|
|
23: ["Lao", "Laoo"],
|
|
24: ["Malayalam", "Mlym"],
|
|
25: ["Myanmar", "Mymr"],
|
|
26: ["Oriya", "Orya"],
|
|
27: ["Tamil", "Taml"],
|
|
28: ["Telugu", "Telu"],
|
|
29: ["Thaana", "Thaa"],
|
|
30: ["Thai", "Thai"],
|
|
31: ["Tibetan", "Tibt"],
|
|
32: ["Sinhala", "Sinh"],
|
|
33: ["Syriac", "Syrc"],
|
|
34: ["Yi", "Yiii"],
|
|
35: ["Vai", "Vaii"],
|
|
36: ["Avestan", "Avst"],
|
|
37: ["Balinese", "Bali"],
|
|
38: ["Bamum", "Bamu"],
|
|
39: ["Batak", "Batk"],
|
|
40: ["Bopomofo", "Bopo"],
|
|
41: ["Brahmi", "Brah"],
|
|
42: ["Buginese", "Bugi"],
|
|
43: ["Buhid", "Buhd"],
|
|
44: ["Canadian Aboriginal", "Cans"],
|
|
45: ["Carian", "Cari"],
|
|
46: ["Chakma", "Cakm"],
|
|
47: ["Cham", "Cham"],
|
|
48: ["Coptic", "Copt"],
|
|
49: ["Cypriot", "Cprt"],
|
|
50: ["Egyptian Hieroglyphs", "Egyp"],
|
|
51: ["Fraser", "Lisu"],
|
|
52: ["Glagolitic", "Glag"],
|
|
53: ["Gothic", "Goth"],
|
|
54: ["Han", "Hani"],
|
|
55: ["Hangul", "Hang"],
|
|
56: ["Hanunoo", "Hano"],
|
|
57: ["Imperial Aramaic", "Armi"],
|
|
58: ["Inscriptional Pahlavi", "Phli"],
|
|
59: ["Inscriptional Parthian", "Prti"],
|
|
60: ["Javanese", "Java"],
|
|
61: ["Kaithi", "Kthi"],
|
|
62: ["Katakana", "Kana"],
|
|
63: ["Kayah Li", "Kali"],
|
|
64: ["Kharoshthi", "Khar"],
|
|
65: ["Lanna", "Lana"],
|
|
66: ["Lepcha", "Lepc"],
|
|
67: ["Limbu", "Limb"],
|
|
68: ["Linear B", "Linb"],
|
|
69: ["Lycian", "Lyci"],
|
|
70: ["Lydian", "Lydi"],
|
|
71: ["Mandaean", "Mand"],
|
|
72: ["Meitei Mayek", "Mtei"],
|
|
73: ["Meroitic", "Mero"],
|
|
74: ["Meroitic Cursive", "Merc"],
|
|
75: ["Nko", "Nkoo"],
|
|
76: ["New Tai Lue", "Talu"],
|
|
77: ["Ogham", "Ogam"],
|
|
78: ["Ol Chiki", "Olck"],
|
|
79: ["Old Italic", "Ital"],
|
|
80: ["Old Persian", "Xpeo"],
|
|
81: ["Old South Arabian", "Sarb"],
|
|
82: ["Orkhon", "Orkh"],
|
|
83: ["Osmanya", "Osma"],
|
|
84: ["Phags Pa", "Phag"],
|
|
85: ["Phoenician", "Phnx"],
|
|
86: ["Pollard Phonetic", "Plrd"],
|
|
87: ["Rejang", "Rjng"],
|
|
88: ["Runic", "Runr"],
|
|
89: ["Samaritan", "Samr"],
|
|
90: ["Saurashtra", "Saur"],
|
|
91: ["Sharada", "Shrd"],
|
|
92: ["Shavian", "Shaw"],
|
|
93: ["Sora Sompeng", "Sora"],
|
|
94: ["Cuneiform", "Xsux"],
|
|
95: ["Sundanese", "Sund"],
|
|
96: ["Syloti Nagri", "Sylo"],
|
|
97: ["Tagalog", "Tglg"],
|
|
98: ["Tagbanwa", "Tagb"],
|
|
99: ["Tai Le", "Tale"],
|
|
100: ["Tai Viet", "Tavt"],
|
|
101: ["Takri", "Takr"],
|
|
102: ["Ugaritic", "Ugar"],
|
|
103: ["Braille", "Brai"],
|
|
104: ["Hiragana", "Hira"],
|
|
105: ["Caucasian Albanian", "Aghb"],
|
|
106: ["Bassa Vah", "Bass"],
|
|
107: ["Duployan", "Dupl"],
|
|
108: ["Elbasan", "Elba"],
|
|
109: ["Grantha", "Gran"],
|
|
110: ["Pahawh Hmong", "Hmng"],
|
|
111: ["Khojki", "Khoj"],
|
|
112: ["Linear A", "Lina"],
|
|
113: ["Mahajani", "Mahj"],
|
|
114: ["Manichaean", "Mani"],
|
|
115: ["Mende Kikakui", "Mend"],
|
|
116: ["Modi", "Modi"],
|
|
117: ["Mro", "Mroo"],
|
|
118: ["Old North Arabian", "Narb"],
|
|
119: ["Nabataean", "Nbat"],
|
|
120: ["Palmyrene", "Palm"],
|
|
121: ["Pau Cin Hau", "Pauc"],
|
|
122: ["Old Permic", "Perm"],
|
|
123: ["Psalter Pahlavi", "Phlp"],
|
|
124: ["Siddham", "Sidd"],
|
|
125: ["Khudawadi", "Sind"],
|
|
126: ["Tirhuta", "Tirh"],
|
|
127: ["Varang Kshiti", "Wara"],
|
|
128: ["Ahom", "Ahom"],
|
|
129: ["Anatolian Hieroglyphs", "Hluw"],
|
|
130: ["Hatran", "Hatr"],
|
|
131: ["Multani", "Mult"],
|
|
132: ["Old Hungarian", "Hung"],
|
|
133: ["Sign Writing", "Sgnw"],
|
|
134: ["Adlam", "Adlm"],
|
|
135: ["Bhaiksuki", "Bhks"],
|
|
136: ["Marchen", "Marc"],
|
|
137: ["Newa", "Newa"],
|
|
138: ["Osage", "Osge"],
|
|
139: ["Tangut", "Tang"],
|
|
140: ["Han with Bopomofo", "Hanb"],
|
|
141: ["Jamo", "Jamo"],
|
|
}
|
|
|
|
script_aliases = {
|
|
# Renamings:
|
|
'SimplifiedChineseScript': 'SimplifiedHanScript',
|
|
'TraditionalChineseScript': 'TraditionalHanScript',
|
|
}
|
|
|
|
def countryCodeToId(code):
|
|
if not code:
|
|
return 0
|
|
for country_id in country_list:
|
|
if country_list[country_id][1] == code:
|
|
return country_id
|
|
return -1
|
|
|
|
def languageCodeToId(code):
|
|
if not code:
|
|
return 0
|
|
for language_id in language_list:
|
|
if language_list[language_id][1] == code:
|
|
return language_id
|
|
return -1
|
|
|
|
def scriptCodeToId(code):
|
|
if not code:
|
|
return 0
|
|
for script_id in script_list:
|
|
if script_list[script_id][1] == code:
|
|
return script_id
|
|
return -1
|