qt5base-lts/util/locale_database/enumdata.py
Edward Welbourne 3a1bc4bad5 Purge deprecated language and country codes from QLocale
Requires subsequent re-numbering of the enum tables to eliminate gaps,
before locale data can be regenerated. However, it will work with the
present locale data, since it merely loses the means to use some names
for which the available data was just the name and code. This implies
a transient issue of recognising some codes for which there is no
actual enum member; but relevant code will work as before, finding
nothing but the code and its name. This shall be resolved by a coming
BiC change to resort the language, country and script codes, changing
the numbering (almost) completely.

[ChangeLog][QtCore][QLocale] Various obsolete language and country
codes have been removed. Some lacked locale data, others were obsolete
aliases. All have been deprecated in 5.15.

Task-number: QTBUG-84669
Change-Id: I45fc76a5f2f6c3b0ea3c1bb61e917da984183783
Reviewed-by: Volker Hilsheimer <volker.hilsheimer@qt.io>
2020-10-29 10:44:38 +00:00

840 lines
42 KiB
Python

#!/usr/bin/env python
#############################################################################
##
## Copyright (C) 2020 The Qt Company Ltd.
## Contact: https://www.qt.io/licensing/
##
## This file is part of the test suite of the Qt Toolkit.
##
## $QT_BEGIN_LICENSE:GPL-EXCEPT$
## Commercial License Usage
## Licensees holding valid commercial Qt licenses may use this file in
## accordance with the commercial license agreement provided with the
## Software or, alternatively, in accordance with the terms contained in
## a written agreement between you and The Qt Company. For licensing terms
## and conditions see https://www.qt.io/terms-conditions. For further
## information use the contact form at https://www.qt.io/contact-us.
##
## GNU General Public License Usage
## Alternatively, this file may be used under the terms of the GNU
## General Public License version 3 as published by the Free Software
## Foundation with exceptions as appearing in the file LICENSE.GPL3-EXCEPT
## included in the packaging of this file. Please review the following
## information to ensure the GNU General Public License requirements will
## be met: https://www.gnu.org/licenses/gpl-3.0.html.
##
## $QT_END_LICENSE$
##
#############################################################################
# A run of cldr2qlocalexml.py will produce output reporting any
# language, script and country codes it sees, in data, for which it
# can find a name (taken always from en.xml) that could potentially be
# used. There is no point adding a mapping for such a code unless the
# CLDR's common/main/ contains an XML file for at least one locale
# that exerciss it.
# Each *_list reflects the current values of its enums in qlocale.h;
# if new xml language files are available in CLDR, these languages and
# countries need to be *appended* to this list (for compatibility
# between versions). Include any spaces present in names (scripts
# shall squish them out for the enum entries) in *_list, but use the
# squished forms of names in the *_aliases mappings.
### Qt 6: restore alphabetic order in each list.
language_list = {
0: ["AnyLanguage", " "],
1: ["C", " "],
2: ["Abkhazian", "ab"],
3: ["Oromo", "om"], # macrolanguage
4: ["Afar", "aa"],
5: ["Afrikaans", "af"],
6: ["Albanian", "sq"], # macrolanguage
7: ["Amharic", "am"],
8: ["Arabic", "ar"], # macrolanguage
9: ["Armenian", "hy"],
10: ["Assamese", "as"],
11: ["Aymara", "ay"], # macrolanguage
12: ["Azerbaijani", "az"], # macrolanguage
13: ["Bashkir", "ba"],
14: ["Basque", "eu"],
15: ["Bengali", "bn"],
16: ["Dzongkha", "dz"],
18: ["Bislama", "bi"],
19: ["Breton", "br"],
20: ["Bulgarian", "bg"],
21: ["Burmese", "my"],
22: ["Belarusian", "be"],
23: ["Khmer", "km"],
24: ["Catalan", "ca"],
25: ["Chinese", "zh"], # macrolanguage
26: ["Corsican", "co"],
27: ["Croatian", "hr"],
28: ["Czech", "cs"],
29: ["Danish", "da"],
30: ["Dutch", "nl"],
31: ["English", "en"],
32: ["Esperanto", "eo"],
33: ["Estonian", "et"], # macrolanguage
34: ["Faroese", "fo"],
35: ["Fijian", "fj"],
36: ["Finnish", "fi"],
37: ["French", "fr"],
38: ["Western Frisian", "fy"],
39: ["Gaelic", "gd"],
40: ["Galician", "gl"],
41: ["Georgian", "ka"],
42: ["German", "de"],
43: ["Greek", "el"],
44: ["Greenlandic", "kl"],
45: ["Guarani", "gn"], # macrolanguage
46: ["Gujarati", "gu"],
47: ["Hausa", "ha"],
48: ["Hebrew", "he"],
49: ["Hindi", "hi"],
50: ["Hungarian", "hu"],
51: ["Icelandic", "is"],
52: ["Indonesian", "id"],
53: ["Interlingua", "ia"],
54: ["Interlingue", "ie"],
55: ["Inuktitut", "iu"], # macrolanguage
56: ["Inupiak", "ik"], # macrolanguage
57: ["Irish", "ga"],
58: ["Italian", "it"],
59: ["Japanese", "ja"],
60: ["Javanese", "jv"],
61: ["Kannada", "kn"],
62: ["Kashmiri", "ks"],
63: ["Kazakh", "kk"],
64: ["Kinyarwanda", "rw"],
65: ["Kirghiz", "ky"],
66: ["Korean", "ko"],
67: ["Kurdish", "ku"], # macrolanguage
68: ["Rundi", "rn"],
69: ["Lao", "lo"],
70: ["Latin", "la"],
71: ["Latvian", "lv"], # macrolanguage
72: ["Lingala", "ln"],
73: ["Lithuanian", "lt"],
74: ["Macedonian", "mk"],
75: ["Malagasy", "mg"], # macrolanguage
76: ["Malay", "ms"], # macrolanguage
77: ["Malayalam", "ml"],
78: ["Maltese", "mt"],
79: ["Maori", "mi"],
80: ["Marathi", "mr"],
81: ["Marshallese", "mh"],
82: ["Mongolian", "mn"], # macrolanguage
83: ["Nauru", "na"],
84: ["Nepali", "ne"], # macrolanguage
85: ["Norwegian Bokmal", "nb"],
86: ["Occitan", "oc"],
87: ["Oriya", "or"], # macrolanguage
88: ["Pashto", "ps"], # macrolanguage
89: ["Persian", "fa"], # macrolanguage
90: ["Polish", "pl"],
91: ["Portuguese", "pt"],
92: ["Punjabi", "pa"],
93: ["Quechua", "qu"], # macrolanguage
94: ["Romansh", "rm"],
95: ["Romanian", "ro"],
96: ["Russian", "ru"],
97: ["Samoan", "sm"],
98: ["Sango", "sg"],
99: ["Sanskrit", "sa"],
100: ["Serbian", "sr"],
101: ["Ossetic", "os"],
102: ["Southern Sotho", "st"],
103: ["Tswana", "tn"],
104: ["Shona", "sn"],
105: ["Sindhi", "sd"],
106: ["Sinhala", "si"],
107: ["Swati", "ss"],
108: ["Slovak", "sk"],
109: ["Slovenian", "sl"],
110: ["Somali", "so"],
111: ["Spanish", "es"],
112: ["Sundanese", "su"],
113: ["Swahili", "sw"], # macrolanguage
114: ["Swedish", "sv"],
115: ["Sardinian", "sc"], # macrolanguage
116: ["Tajik", "tg"],
117: ["Tamil", "ta"],
118: ["Tatar", "tt"],
119: ["Telugu", "te"],
120: ["Thai", "th"],
121: ["Tibetan", "bo"],
122: ["Tigrinya", "ti"],
123: ["Tongan", "to"],
124: ["Tsonga", "ts"],
125: ["Turkish", "tr"],
126: ["Turkmen", "tk"],
127: ["Tahitian", "ty"],
128: ["Uighur", "ug"],
129: ["Ukrainian", "uk"],
130: ["Urdu", "ur"],
131: ["Uzbek", "uz"], # macrolanguage
132: ["Vietnamese", "vi"],
133: ["Volapuk", "vo"],
134: ["Welsh", "cy"],
135: ["Wolof", "wo"],
136: ["Xhosa", "xh"],
137: ["Yiddish", "yi"], # macrolanguage
138: ["Yoruba", "yo"],
139: ["Zhuang", "za"], # macrolanguage
140: ["Zulu", "zu"],
141: ["Norwegian Nynorsk", "nn"],
142: ["Bosnian", "bs"],
143: ["Divehi", "dv"],
144: ["Manx", "gv"],
145: ["Cornish", "kw"],
146: ["Akan", "ak"], # macrolanguage
147: ["Konkani", "kok"],
148: ["Ga", "gaa"],
149: ["Igbo", "ig" ],
150: ["Kamba", "kam"],
151: ["Syriac", "syr"],
152: ["Blin", "byn"],
153: ["Geez", "gez"],
154: ["Koro", "kfo"],
155: ["Sidamo", "sid"],
156: ["Atsam", "cch"],
157: ["Tigre", "tig"],
158: ["Jju", "kaj"],
159: ["Friulian", "fur"],
160: ["Venda", "ve" ],
161: ["Ewe", "ee" ],
162: ["Walamo", "wal"],
163: ["Hawaiian", "haw"],
164: ["Tyap", "kcg"],
165: ["Nyanja", "ny" ],
166: ["Filipino", "fil"],
167: ["Swiss German", "gsw"],
168: ["Sichuan Yi", "ii" ],
169: ["Kpelle", "kpe"],
170: ["Low German", "nds"],
171: ["South Ndebele", "nr" ],
172: ["Northern Sotho", "nso"],
173: ["Northern Sami", "se" ],
174: ["Taroko", "trv"],
175: ["Gusii", "guz"],
176: ["Taita", "dav"],
177: ["Fulah", "ff"], # macrolanguage
178: ["Kikuyu", "ki"],
179: ["Samburu", "saq"],
180: ["Sena", "seh"],
181: ["North Ndebele", "nd"],
182: ["Rombo", "rof"],
183: ["Tachelhit", "shi"],
184: ["Kabyle", "kab"],
185: ["Nyankole", "nyn"],
186: ["Bena", "bez"],
187: ["Vunjo", "vun"],
188: ["Bambara", "bm"],
189: ["Embu", "ebu"],
190: ["Cherokee", "chr"],
191: ["Morisyen", "mfe"],
192: ["Makonde", "kde"],
193: ["Langi", "lag"],
194: ["Ganda", "lg"],
195: ["Bemba", "bem"],
196: ["Kabuverdianu", "kea"],
197: ["Meru", "mer"],
198: ["Kalenjin", "kln"],
199: ["Nama", "naq"],
200: ["Machame", "jmc"],
201: ["Colognian", "ksh"],
202: ["Masai", "mas"],
203: ["Soga", "xog"],
204: ["Luyia", "luy"],
205: ["Asu", "asa"],
206: ["Teso", "teo"],
207: ["Saho", "ssy"],
208: ["Koyra Chiini", "khq"],
209: ["Rwa", "rwk"],
210: ["Luo", "luo"],
211: ["Chiga", "cgg"],
212: ["Central Morocco Tamazight", "tzm"],
213: ["Koyraboro Senni", "ses"],
214: ["Shambala", "ksb"],
215: ["Bodo", "brx"],
216: ["Avaric", "av"],
217: ["Chamorro", "ch"],
218: ["Chechen", "ce"],
219: ["Church", "cu"], # macrolanguage
220: ["Chuvash", "cv"],
221: ["Cree", "cr"], # macrolanguage
222: ["Haitian", "ht"],
223: ["Herero", "hz"],
224: ["Hiri Motu", "ho"],
225: ["Kanuri", "kr"], # macrolanguage
226: ["Komi", "kv"], # macrolanguage
227: ["Kongo", "kg"], # macrolanguage
228: ["Kwanyama", "kj"],
229: ["Limburgish", "li"],
230: ["Luba Katanga", "lu"],
231: ["Luxembourgish", "lb"],
232: ["Navaho", "nv"],
233: ["Ndonga", "ng"],
234: ["Ojibwa", "oj"], # macrolanguage
235: ["Pali", "pi"], # macrolanguage
236: ["Walloon", "wa"],
237: ["Aghem", "agq"],
238: ["Basaa", "bas"],
239: ["Zarma", "dje"],
240: ["Duala", "dua"],
241: ["Jola Fonyi", "dyo"],
242: ["Ewondo", "ewo"],
243: ["Bafia", "ksf"],
244: ["Makhuwa Meetto", "mgh"],
245: ["Mundang", "mua"],
246: ["Kwasio", "nmg"],
247: ["Nuer", "nus"],
248: ["Sakha", "sah"],
249: ["Sangu", "sbp"],
251: ["Tasawaq", "twq"],
252: ["Vai", "vai"],
253: ["Walser", "wae"],
254: ["Yangben", "yav"],
255: ["Avestan", "ae"],
256: ["Asturian", "ast"],
257: ["Ngomba", "jgo"],
258: ["Kako", "kkj"],
259: ["Meta", "mgo"],
260: ["Ngiemboon", "nnh"],
261: ["Aragonese", "an"],
262: ["Akkadian", "akk"],
263: ["Ancient Egyptian", "egy"],
264: ["Ancient Greek", "grc"],
265: ["Aramaic", "arc"],
266: ["Balinese", "ban"],
267: ["Bamun", "bax"],
268: ["Batak Toba", "bbc"],
269: ["Buginese", "bug"],
272: ["Chakma", "ccp"],
274: ["Coptic", "cop"],
275: ["Dogri", "doi"], # macrolanguage
279: ["Gothic", "got"],
281: ["Ingush", "inh"],
289: ["Mandingo", "man"], # macrolanguage
290: ["Manipuri", "mni"],
293: ["Old Irish", "sga"],
294: ["Old Norse", "non"],
295: ["Old Persian", "peo"],
297: ["Pahlavi", "pal"],
299: ["Phoenician", "phn"],
304: ["Santali", "sat"],
305: ["Saurashtra", "saz"],
309: ["Tai Dam", "blt"],
311: ["Ugaritic", "uga"],
312: ["Akoose", "bss"],
313: ["Lakota", "lkt"],
314: ["Standard Moroccan Tamazight", "zgh"],
315: ["Mapuche", "arn"],
316: ["Central Kurdish", "ckb"],
317: ["Lower Sorbian", "dsb"],
318: ["Upper Sorbian", "hsb"],
319: ["Kenyang", "ken"],
320: ["Mohawk", "moh"],
321: ["Nko", "nqo"],
322: ["Prussian", "prg"],
323: ["Kiche", "quc"],
324: ["Southern Sami", "sma"],
325: ["Lule Sami", "smj"],
326: ["Inari Sami", "smn"],
327: ["Skolt Sami", "sms"],
328: ["Warlpiri", "wbp"],
330: ["Mende", "men"],
335: ["Lezghian", "lez"],
339: ["Maithili", "mai"],
341: ["American Sign Language", "ase"],
343: ["Bhojpuri", "bho"],
345: ["Literary Chinese", "lzh"],
346: ["Mazanderani", "mzn"],
348: ["Newari", "new"],
349: ["Northern Luri", "lrc"],
350: ["Palauan", "pau"],
351: ["Papiamento", "pap"],
353: ["Tokelau", "tkl"],
354: ["Tok Pisin", "tpi"],
355: ["Tuvalu", "tvl"],
357: ["Cantonese", "yue"],
358: ["Osage", "osa"],
360: ["Ido", "io"],
361: ["Lojban", "jbo"],
362: ["Sicilian", "scn"],
363: ["Southern Kurdish", "sdh"],
364: ["Western Balochi", "bgn"],
365: ["Cebuano", "ceb"],
366: ["Erzya", "myv"],
367: ["Chickasaw", "cic"],
368: ["Muscogee", "mus"],
369: ["Silesian", "szl"],
370: ["Nigerian Pidgin", "pcm"],
}
language_aliases = {
# Renamings:
'Afan': 'Oromo',
'Byelorussian': 'Belarusian',
'Bhutani': 'Dzongkha',
'Cambodian': 'Khmer',
'Kurundi': 'Rundi',
'RhaetoRomance': 'Romansh',
'Chewa': 'Nyanja',
'Frisian': 'WesternFrisian',
'Uigur': 'Uighur',
}
country_list = {
0: ["AnyCountry", "ZZ"],
1: ["Afghanistan", "AF"],
2: ["Albania", "AL"],
3: ["Algeria", "DZ"],
4: ["American Samoa", "AS"],
5: ["Andorra", "AD"],
6: ["Angola", "AO"],
7: ["Anguilla", "AI"],
8: ["Antarctica", "AQ"],
9: ["Antigua And Barbuda", "AG"],
10: ["Argentina", "AR"],
11: ["Armenia", "AM"],
12: ["Aruba", "AW"],
13: ["Australia", "AU"],
14: ["Austria", "AT"],
15: ["Azerbaijan", "AZ"],
16: ["Bahamas", "BS"],
17: ["Bahrain", "BH"],
18: ["Bangladesh", "BD"],
19: ["Barbados", "BB"],
20: ["Belarus", "BY"],
21: ["Belgium", "BE"],
22: ["Belize", "BZ"],
23: ["Benin", "BJ"],
24: ["Bermuda", "BM"],
25: ["Bhutan", "BT"],
26: ["Bolivia", "BO"],
27: ["Bosnia And Herzegowina", "BA"],
28: ["Botswana", "BW"],
29: ["Bouvet Island", "BV"],
30: ["Brazil", "BR"],
31: ["British Indian Ocean Territory", "IO"],
32: ["Brunei", "BN"],
33: ["Bulgaria", "BG"],
34: ["Burkina Faso", "BF"],
35: ["Burundi", "BI"],
36: ["Cambodia", "KH"],
37: ["Cameroon", "CM"],
38: ["Canada", "CA"],
39: ["Cape Verde", "CV"],
40: ["Cayman Islands", "KY"],
41: ["Central African Republic", "CF"],
42: ["Chad", "TD"],
43: ["Chile", "CL"],
44: ["China", "CN"],
45: ["Christmas Island", "CX"],
46: ["Cocos Islands", "CC"],
47: ["Colombia", "CO"],
48: ["Comoros", "KM"],
49: ["Congo Kinshasa", "CD"],
50: ["Congo Brazzaville", "CG"],
51: ["Cook Islands", "CK"],
52: ["Costa Rica", "CR"],
53: ["Ivory Coast", "CI"],
54: ["Croatia", "HR"],
55: ["Cuba", "CU"],
56: ["Cyprus", "CY"],
57: ["Czech Republic", "CZ"],
58: ["Denmark", "DK"],
59: ["Djibouti", "DJ"],
60: ["Dominica", "DM"],
61: ["Dominican Republic", "DO"],
62: ["East Timor", "TL"],
63: ["Ecuador", "EC"],
64: ["Egypt", "EG"],
65: ["El Salvador", "SV"],
66: ["Equatorial Guinea", "GQ"],
67: ["Eritrea", "ER"],
68: ["Estonia", "EE"],
69: ["Ethiopia", "ET"],
70: ["Falkland Islands", "FK"],
71: ["Faroe Islands", "FO"],
72: ["Fiji", "FJ"],
73: ["Finland", "FI"],
74: ["France", "FR"],
75: ["Guernsey", "GG"],
76: ["French Guiana", "GF"],
77: ["French Polynesia", "PF"],
78: ["French Southern Territories", "TF"],
79: ["Gabon", "GA"],
80: ["Gambia", "GM"],
81: ["Georgia", "GE"],
82: ["Germany", "DE"],
83: ["Ghana", "GH"],
84: ["Gibraltar", "GI"],
85: ["Greece", "GR"],
86: ["Greenland", "GL"],
87: ["Grenada", "GD"],
88: ["Guadeloupe", "GP"],
89: ["Guam", "GU"],
90: ["Guatemala", "GT"],
91: ["Guinea", "GN"],
92: ["Guinea Bissau", "GW"],
93: ["Guyana", "GY"],
94: ["Haiti", "HT"],
95: ["Heard And McDonald Islands", "HM"],
96: ["Honduras", "HN"],
97: ["Hong Kong", "HK"],
98: ["Hungary", "HU"],
99: ["Iceland", "IS"],
100: ["India", "IN"],
101: ["Indonesia", "ID"],
102: ["Iran", "IR"],
103: ["Iraq", "IQ"],
104: ["Ireland", "IE"],
105: ["Israel", "IL"],
106: ["Italy", "IT"],
107: ["Jamaica", "JM"],
108: ["Japan", "JP"],
109: ["Jordan", "JO"],
110: ["Kazakhstan", "KZ"],
111: ["Kenya", "KE"],
112: ["Kiribati", "KI"],
113: ["North Korea", "KP"],
114: ["South Korea", "KR"],
115: ["Kuwait", "KW"],
116: ["Kyrgyzstan", "KG"],
117: ["Laos", "LA"],
118: ["Latvia", "LV"],
119: ["Lebanon", "LB"],
120: ["Lesotho", "LS"],
121: ["Liberia", "LR"],
122: ["Libya", "LY"],
123: ["Liechtenstein", "LI"],
124: ["Lithuania", "LT"],
125: ["Luxembourg", "LU"],
126: ["Macau", "MO"],
127: ["Macedonia", "MK"],
128: ["Madagascar", "MG"],
129: ["Malawi", "MW"],
130: ["Malaysia", "MY"],
131: ["Maldives", "MV"],
132: ["Mali", "ML"],
133: ["Malta", "MT"],
134: ["Marshall Islands", "MH"],
135: ["Martinique", "MQ"],
136: ["Mauritania", "MR"],
137: ["Mauritius", "MU"],
138: ["Mayotte", "YT"],
139: ["Mexico", "MX"],
140: ["Micronesia", "FM"],
141: ["Moldova", "MD"],
142: ["Monaco", "MC"],
143: ["Mongolia", "MN"],
144: ["Montserrat", "MS"],
145: ["Morocco", "MA"],
146: ["Mozambique", "MZ"],
147: ["Myanmar", "MM"],
148: ["Namibia", "NA"],
149: ["Nauru", "NR"],
150: ["Nepal", "NP"],
151: ["Netherlands", "NL"],
152: ["Cura Sao", "CW"],
153: ["New Caledonia", "NC"],
154: ["New Zealand", "NZ"],
155: ["Nicaragua", "NI"],
156: ["Niger", "NE"],
157: ["Nigeria", "NG"],
158: ["Niue", "NU"],
159: ["Norfolk Island", "NF"],
160: ["Northern Mariana Islands", "MP"],
161: ["Norway", "NO"],
162: ["Oman", "OM"],
163: ["Pakistan", "PK"],
164: ["Palau", "PW"],
165: ["Palestinian Territories", "PS"],
166: ["Panama", "PA"],
167: ["Papua New Guinea", "PG"],
168: ["Paraguay", "PY"],
169: ["Peru", "PE"],
170: ["Philippines", "PH"],
171: ["Pitcairn", "PN"],
172: ["Poland", "PL"],
173: ["Portugal", "PT"],
174: ["Puerto Rico", "PR"],
175: ["Qatar", "QA"],
176: ["Reunion", "RE"],
177: ["Romania", "RO"],
178: ["Russia", "RU"],
179: ["Rwanda", "RW"],
180: ["Saint Kitts And Nevis", "KN"],
181: ["Saint Lucia", "LC"],
182: ["Saint Vincent And The Grenadines", "VC"],
183: ["Samoa", "WS"],
184: ["San Marino", "SM"],
185: ["Sao Tome And Principe", "ST"],
186: ["Saudi Arabia", "SA"],
187: ["Senegal", "SN"],
188: ["Seychelles", "SC"],
189: ["Sierra Leone", "SL"],
190: ["Singapore", "SG"],
191: ["Slovakia", "SK"],
192: ["Slovenia", "SI"],
193: ["Solomon Islands", "SB"],
194: ["Somalia", "SO"],
195: ["South Africa", "ZA"],
196: ["South Georgia And The South Sandwich Islands", "GS"],
197: ["Spain", "ES"],
198: ["Sri Lanka", "LK"],
199: ["Saint Helena", "SH"],
200: ["Saint Pierre And Miquelon", "PM"],
201: ["Sudan", "SD"],
202: ["Suriname", "SR"],
203: ["Svalbard And Jan Mayen Islands", "SJ"],
204: ["Swaziland", "SZ"],
205: ["Sweden", "SE"],
206: ["Switzerland", "CH"],
207: ["Syria", "SY"],
208: ["Taiwan", "TW"],
209: ["Tajikistan", "TJ"],
210: ["Tanzania", "TZ"],
211: ["Thailand", "TH"],
212: ["Togo", "TG"],
213: ["Tokelau", "TK"],
214: ["Tonga", "TO"],
215: ["Trinidad And Tobago", "TT"],
216: ["Tunisia", "TN"],
217: ["Turkey", "TR"],
218: ["Turkmenistan", "TM"],
219: ["Turks And Caicos Islands", "TC"],
220: ["Tuvalu", "TV"],
221: ["Uganda", "UG"],
222: ["Ukraine", "UA"],
223: ["United Arab Emirates", "AE"],
224: ["United Kingdom", "GB"],
225: ["United States", "US"],
226: ["United States Minor Outlying Islands", "UM"],
227: ["Uruguay", "UY"],
228: ["Uzbekistan", "UZ"],
229: ["Vanuatu", "VU"],
230: ["Vatican City State", "VA"],
231: ["Venezuela", "VE"],
232: ["Vietnam", "VN"],
233: ["British Virgin Islands", "VG"],
234: ["United States Virgin Islands", "VI"],
235: ["Wallis And Futuna Islands", "WF"],
236: ["Western Sahara", "EH"],
237: ["Yemen", "YE"],
238: ["Canary Islands", "IC"],
239: ["Zambia", "ZM"],
240: ["Zimbabwe", "ZW"],
241: ["Clipperton Island", "CP"],
242: ["Montenegro", "ME"],
243: ["Serbia", "RS"],
244: ["Saint Barthelemy", "BL"],
245: ["Saint Martin", "MF"],
246: ["Latin America", "419"],
247: ["Ascension Island", "AC"],
248: ["Aland Islands", "AX"],
249: ["Diego Garcia", "DG"],
250: ["Ceuta And Melilla", "EA"],
251: ["Isle Of Man", "IM"],
252: ["Jersey", "JE"],
253: ["Tristan Da Cunha", "TA"],
254: ["South Sudan", "SS"],
255: ["Bonaire", "BQ"],
256: ["Sint Maarten", "SX"],
257: ["Kosovo", "XK"],
258: ["European Union", "EU"],
259: ["Outlying Oceania", "QO"],
260: ["World", "001"],
261: ["Europe", "150"],
}
country_aliases = {
# Renamings:
'DemocraticRepublicOfCongo': 'CongoKinshasa',
'PeoplesRepublicOfCongo': 'CongoBrazzaville',
'DemocraticRepublicOfKorea': 'NorthKorea',
'RepublicOfKorea': 'SouthKorea',
'RussianFederation': 'Russia',
'SyrianArabRepublic': 'Syria',
'LatinAmericaAndTheCaribbean': 'LatinAmerica',
}
script_list = {
0: ["AnyScript", "Zzzz"],
1: ["Arabic", "Arab"],
2: ["Cyrillic", "Cyrl"],
3: ["Deseret", "Dsrt"],
4: ["Gurmukhi", "Guru"],
5: ["Simplified Han", "Hans"],
6: ["Traditional Han", "Hant"],
7: ["Latin", "Latn"],
8: ["Mongolian", "Mong"],
9: ["Tifinagh", "Tfng"],
10: ["Armenian", "Armn"],
11: ["Bengali", "Beng"],
12: ["Cherokee", "Cher"],
13: ["Devanagari", "Deva"],
14: ["Ethiopic", "Ethi"],
15: ["Georgian", "Geor"],
16: ["Greek", "Grek"],
17: ["Gujarati", "Gujr"],
18: ["Hebrew", "Hebr"],
19: ["Japanese", "Jpan"],
20: ["Khmer", "Khmr"],
21: ["Kannada", "Knda"],
22: ["Korean", "Kore"],
23: ["Lao", "Laoo"],
24: ["Malayalam", "Mlym"],
25: ["Myanmar", "Mymr"],
26: ["Oriya", "Orya"],
27: ["Tamil", "Taml"],
28: ["Telugu", "Telu"],
29: ["Thaana", "Thaa"],
30: ["Thai", "Thai"],
31: ["Tibetan", "Tibt"],
32: ["Sinhala", "Sinh"],
33: ["Syriac", "Syrc"],
34: ["Yi", "Yiii"],
35: ["Vai", "Vaii"],
36: ["Avestan", "Avst"],
37: ["Balinese", "Bali"],
38: ["Bamum", "Bamu"],
39: ["Batak", "Batk"],
40: ["Bopomofo", "Bopo"],
41: ["Brahmi", "Brah"],
42: ["Buginese", "Bugi"],
43: ["Buhid", "Buhd"],
44: ["Canadian Aboriginal", "Cans"],
45: ["Carian", "Cari"],
46: ["Chakma", "Cakm"],
47: ["Cham", "Cham"],
48: ["Coptic", "Copt"],
49: ["Cypriot", "Cprt"],
50: ["Egyptian Hieroglyphs", "Egyp"],
51: ["Fraser", "Lisu"],
52: ["Glagolitic", "Glag"],
53: ["Gothic", "Goth"],
54: ["Han", "Hani"],
55: ["Hangul", "Hang"],
56: ["Hanunoo", "Hano"],
57: ["Imperial Aramaic", "Armi"],
58: ["Inscriptional Pahlavi", "Phli"],
59: ["Inscriptional Parthian", "Prti"],
60: ["Javanese", "Java"],
61: ["Kaithi", "Kthi"],
62: ["Katakana", "Kana"],
63: ["Kayah Li", "Kali"],
64: ["Kharoshthi", "Khar"],
65: ["Lanna", "Lana"],
66: ["Lepcha", "Lepc"],
67: ["Limbu", "Limb"],
68: ["Linear B", "Linb"],
69: ["Lycian", "Lyci"],
70: ["Lydian", "Lydi"],
71: ["Mandaean", "Mand"],
72: ["Meitei Mayek", "Mtei"],
73: ["Meroitic", "Mero"],
74: ["Meroitic Cursive", "Merc"],
75: ["Nko", "Nkoo"],
76: ["New Tai Lue", "Talu"],
77: ["Ogham", "Ogam"],
78: ["Ol Chiki", "Olck"],
79: ["Old Italic", "Ital"],
80: ["Old Persian", "Xpeo"],
81: ["Old South Arabian", "Sarb"],
82: ["Orkhon", "Orkh"],
83: ["Osmanya", "Osma"],
84: ["Phags Pa", "Phag"],
85: ["Phoenician", "Phnx"],
86: ["Pollard Phonetic", "Plrd"],
87: ["Rejang", "Rjng"],
88: ["Runic", "Runr"],
89: ["Samaritan", "Samr"],
90: ["Saurashtra", "Saur"],
91: ["Sharada", "Shrd"],
92: ["Shavian", "Shaw"],
93: ["Sora Sompeng", "Sora"],
94: ["Cuneiform", "Xsux"],
95: ["Sundanese", "Sund"],
96: ["Syloti Nagri", "Sylo"],
97: ["Tagalog", "Tglg"],
98: ["Tagbanwa", "Tagb"],
99: ["Tai Le", "Tale"],
100: ["Tai Viet", "Tavt"],
101: ["Takri", "Takr"],
102: ["Ugaritic", "Ugar"],
103: ["Braille", "Brai"],
104: ["Hiragana", "Hira"],
105: ["Caucasian Albanian", "Aghb"],
106: ["Bassa Vah", "Bass"],
107: ["Duployan", "Dupl"],
108: ["Elbasan", "Elba"],
109: ["Grantha", "Gran"],
110: ["Pahawh Hmong", "Hmng"],
111: ["Khojki", "Khoj"],
112: ["Linear A", "Lina"],
113: ["Mahajani", "Mahj"],
114: ["Manichaean", "Mani"],
115: ["Mende Kikakui", "Mend"],
116: ["Modi", "Modi"],
117: ["Mro", "Mroo"],
118: ["Old North Arabian", "Narb"],
119: ["Nabataean", "Nbat"],
120: ["Palmyrene", "Palm"],
121: ["Pau Cin Hau", "Pauc"],
122: ["Old Permic", "Perm"],
123: ["Psalter Pahlavi", "Phlp"],
124: ["Siddham", "Sidd"],
125: ["Khudawadi", "Sind"],
126: ["Tirhuta", "Tirh"],
127: ["Varang Kshiti", "Wara"],
128: ["Ahom", "Ahom"],
129: ["Anatolian Hieroglyphs", "Hluw"],
130: ["Hatran", "Hatr"],
131: ["Multani", "Mult"],
132: ["Old Hungarian", "Hung"],
133: ["Sign Writing", "Sgnw"],
134: ["Adlam", "Adlm"],
135: ["Bhaiksuki", "Bhks"],
136: ["Marchen", "Marc"],
137: ["Newa", "Newa"],
138: ["Osage", "Osge"],
139: ["Tangut", "Tang"],
140: ["Han with Bopomofo", "Hanb"],
141: ["Jamo", "Jamo"],
}
script_aliases = {
# Renamings:
'SimplifiedChineseScript': 'SimplifiedHanScript',
'TraditionalChineseScript': 'TraditionalHanScript',
}
def countryCodeToId(code):
if not code:
return 0
for country_id in country_list:
if country_list[country_id][1] == code:
return country_id
return -1
def languageCodeToId(code):
if not code:
return 0
for language_id in language_list:
if language_list[language_id][1] == code:
return language_id
return -1
def scriptCodeToId(code):
if not code:
return 0
for script_id in script_list:
if script_list[script_id][1] == code:
return script_id
return -1