scuffed-code/icu4c/data/root.txt

1164 lines
37 KiB
Plaintext
Raw Normal View History

// *******************************************************************************
// *
// * Copyright (C) 1997-2000, International Business Machines
// * Corporation and others. All Rights Reserved.
// *
// *******************************************************************************
// Date Name Description
// 11/17/99 aliu Added support for transliterators.
// Please search for 'DUP FIXME' - duplicate lang/country names commented out
root {
Version { "3" }
"%%EURO" { "Euro" } // Euro variant display name
"%%B" { "Bokm\u00e5l" } // Norwegian variant display name
"%%NY" { "Nynorsk" } // Norwegian variant display name
"%%AL" { "\u00C5land" } // Aland variant display name
// Collation data for the root bundle. Sequence is the empty string, so no
// rule text is supplied at this level.
// NOTE(review): Override "FALSE" presumably means locale rules extend rather
// than replace the default ordering -- confirm against the collator loader.
CollationElements {
Version { "1.0" }
Override { "FALSE" }
Sequence { "" }
}
// Formats for the display name of a locale, for a list of
// items, and for composing two items in a list into one item.
// The list patterns are used in the variant name and in the
// full display name.
//
// This is the language-neutral form of this resource.
//
LocaleNamePatterns {
{
"{0,choice,0#|1#{1}|2#{1} ({2})}", // Display name
"{0,choice,0#|1#{1}|2#{1},{2}|3#{1},{2},{3}}", // List
"{0},{1}" // List composition
}
}
//------------------------------------------------------------
// BEGIN Transliterator support
//------------------------------------------------------------
// See also icu/data/translit/index.txt
TransliteratorNamePattern {
// Format for the display name of a Transliterator.
// This is the language-neutral form of this resource.
"{0,choice,0#|1#{1}|2#{1}-{2}}" // Display name
}
//------------------------------------------------------------
// END Transliterator support
//------------------------------------------------------------
//------------------------------------------------------------
// BEGIN BreakIterator support
//------------------------------------------------------------
// default rules for finding character boundaries
CharacterBreakRules {
// ignore non-spacing marks and enclosing marks (since we never
// put a break before ignore characters, this keeps combining
// accents with the base characters they modify)
"$ignore=[[:Mn:][:Me:]];"
// other category definitions: the three classes of conjoining Hangul
// jamo, and the two halves of a surrogate pair
"choseong=[\u1100-\u115f];"
"jungseong=[\u1160-\u11a7];"
"jongseong=[\u11a8-\u11ff];"
"surr-hi=[\ud800-\udbff];"
"surr-lo=[\udc00-\udfff];"
// break after every character, except as follows:
".;"
// keep CRLF sequences together
"\r\n;"
// keep surrogate pairs together
"{surr-hi}{surr-lo};"
// keep Hangul syllables spelled out using conjoining jamo together
"{choseong}*{jungseong}*{jongseong}*;"
// various additions for Hindi support
"nukta=[\u093c];"
"danda=[\u0964\u0965];"
"virama=[\u094d];"
"devVowelSign=[\u093e-\u094c\u0962\u0963];"
"devConsonant=[\u0915-\u0939];"
"devNuktaConsonant=[\u0958-\u095f];"
"devCharEnd=[\u0902\u0903\u0951-\u0954];"
"zwj=[\u200d];"
// a consonant optionally followed by a nukta
"devCAMN=({devConsonant}{nukta}?);"
// either a character from devNuktaConsonant or a devCAMN
"devConsonant1=({devNuktaConsonant}|{devCAMN});"
// an optional "consonant, virama, optional zwj" prefix followed by a consonant
"devConjunct=(({devConsonant1}{virama}{zwj}?)?{devConsonant1});"
// keep a conjunct together with an optional vowel sign and an optional
// character from devCharEnd
"{devConjunct}{devVowelSign}?{devCharEnd}?;"
// keep a danda together with a following nukta
"{danda}{nukta};"
}
// default rules for finding word boundaries
WordBreakRules {
// ignore non-spacing marks, enclosing marks, and format characters,
// all of which should not influence the algorithm
"$ignore=[[:Mn:][:Me:][:Cf:]];"
// Hindi phrase separator, kanji, katakana, hiragana, CJK diacriticals,
// other letters, and digits
"danda=[\u0964\u0965];"
"kanji=[\u3005\u4e00-\u9fa5\uf900-\ufa2d];"
"kata=[\u3099-\u309c\u30a1-\u30fe];"
"hira=[\u3041-\u309e\u30fc];"
"let=[[[:L:][:Mc:]]-[{kanji}{kata}{hira}]];"
"dgt=[:N:];"
// punctuation that can occur in the middle of a word: currently
// dashes, apostrophes, quotation marks, and periods
"mid-word=[[:Pd:]\u00ad\u2027\\\"\\\'\\.];"
// punctuation that can occur in the middle of a number: currently
// apostrophes, quotation marks, periods, commas, and the Arabic
// decimal point
"mid-num=[\\\"\\\'\\,\u066b\\.];"
// punctuation that can occur at the beginning of a number: currently
// the period, the number sign, and all currency symbols except the cents sign
"pre-num=[[[:Sc:]-[\u00a2]]\\#\\.];"
// punctuation that can occur at the end of a number: currently
// the percent, per-thousand, per-ten-thousand, and Arabic percent
// signs, the cents sign, and the ampersand
"post-num=[\\%\\&\u00a2\u066a\u2030\u2031];"
// line separators: currently LF, FF, PS, and LS
"ls=[\n\u000c\u2028\u2029];"
// whitespace: all space separators and the tab character
"ws=[[:Zs:]\t];"
// a word is a sequence of letters that may contain internal
// punctuation, as long as it begins and ends with a letter and
// never contains two punctuation marks in a row
// (an optional trailing danda is also kept with the word)
"word=({let}+({mid-word}{let}+)*{danda}?);"
// a number is a sequence of digits that may contain internal
// punctuation, as long as it begins and ends with a digit and
// never contains two punctuation marks in a row.
"number=({dgt}+({mid-num}{dgt}+)*);"
// break after every character, with the following exceptions
// (this will cause punctuation marks that aren't considered
// part of words or numbers to be treated as words unto themselves)
".;"
// keep together any sequence of contiguous words and numbers
// (including just one of either), plus an optional trailing
// number-suffix character
"{word}?({number}{word})*({number}{post-num}?)?;"
// keep together any sequence of contiguous words and numbers
// that starts with a number-prefix character and a number,
// and may end with a number-suffix character
"{pre-num}({number}{word})*({number}{post-num}?)?;"
// keep together runs of whitespace (optionally with a single trailing
// line separator or CRLF sequence)
"{ws}*\r?{ls}?;"
// keep together runs of Katakana
"{kata}*;"
// keep together runs of Hiragana
"{hira}*;"
// keep together runs of Kanji
"{kanji}*;"
}
// default rules for determining legal line-breaking positions
LineBreakRules {
// ignore non-spacing marks, enclosing marks, and format characters
"$ignore=[[:Mn:][:Me:][:Cf:]];"
// Hindi phrase separators
"danda=[\u0964\u0965];"
// characters that always cause a break: ETX, tab, LF, FF, LS, and PS
"break=[\u0003\t\n\f\u2028\u2029];"
// characters that always prevent a break: the non-breaking space
// and similar characters
"nbsp=[\u00a0\u2007\u2011\ufeff];"
// whitespace: space separators and control characters, except for
// CR and the other characters mentioned above
"space=[[[:Zs:][:Cc:]]-[{nbsp}{break}\r]];"
// dashes: dash punctuation and the discretionary hyphen, except for
// non-breaking hyphens
"dash=[[[:Pd:]\u00ad]-[{nbsp}]];"
// characters that stick to a word if they precede it: currency symbols
// (except the cents sign) and starting punctuation
"pre-word=[[[:Sc:]-[\u00a2]][:Ps:]\\\"\\\'];"
// characters that stick to a word if they follow it: ending punctuation,
// other punctuation that usually occurs at the end of a sentence,
// small Kana characters, some CJK diacritics, etc.
"post-word=[[:Pe:]\\!\\\"\\\'\\%\\.\\,\\:\\;\\?\u00a2\u00b0\u066a\u2030-\u2034"
"\u2103\u2105\u2109\u3001\u3002\u3005\u3041\u3043\u3045\u3047\u3049\u3063"
"\u3083\u3085\u3087\u308e\u3099-\u309e\u30a1\u30a3\u30a5\u30a7\u30a9"
"\u30c3\u30e3\u30e5\u30e7\u30ee\u30f5\u30f6\u30fc-\u30fe\uff01\uff0c"
"\uff0e\uff1f];"
// Kanji: actually includes both Kanji and Kana, except for small Kana and
// CJK diacritics
"kanji=[[\u4e00-\u9fa5\uf900-\ufa2d\u3041-\u3094\u30a1-\u30fa]-[{post-word}{$ignore}]];"
// digits
"digit=[[:Nd:][:No:]];"
// punctuation that can occur in the middle of a number: periods and commas
"mid-num=[\\.\\,];"
// everything not mentioned above, plus the quote marks (which are both
// <pre-word>, <post-word>, and <char>)
// NOTE(review): the quote marks are also listed inside the negated set
// below, which reads as excluding them from char -- confirm which of the
// comment and the rule reflects the intended behavior.
"char=[^{break}{space}{dash}{kanji}{nbsp}{$ignore}{pre-word}{post-word}{mid-num}{danda}\r\\\"\\\'];"
// a "number" is a run of prefix characters and dashes, followed by one or
// more digits with isolated number-punctuation characters interspersed
"number=([{pre-word}{dash}]*{digit}+({mid-num}{digit}+)*);"
// the basic core of a word can be either a "number" as defined above, a single
// "Kanji" character, or a run of any number of not-explicitly-mentioned
// characters (this includes Latin letters)
"word-core=([{pre-word}{char}]*|{kanji}|{number});"
// a word may end with an optional suffix that can be either a run of one or
// more dashes or a run of word-suffix characters, followed by an optional
// run of whitespace
"word-suffix=(({dash}+|{post-word}*){space}*);"
// a word, thus, is an optional run of word-prefix characters, followed by
// a word core and a word suffix (the syntax of <word-core> and <word-suffix>
// actually allows either of them to match the empty string, putting a break
// between things like ")(" or "aaa(aaa")
"word=({pre-word}*{word-core}{word-suffix});"
// finally, the rule that does the work: Keep together any run of words that
// are joined by runs of one or more non-breaking characters (<nbsp>). Also
// keep a trailing line-break character or CRLF combination with the word.
// (line separators "win" over nbsp's)
"{word}({nbsp}+{word})*\r?{break}?;"
}
// default rules for finding sentence boundaries
SentenceBreakRules {
// ignore non-spacing marks, enclosing marks, and format characters
"$ignore=[[:Mn:][:Me:][:Cf:]];"
// lowercase letters
"lc=[:Ll:];"
// uppercase Latin letters
"ucLatin=[A-Z];"
// whitespace (line separators are treated as whitespace)
"space=[\t\r\f\n\u2028[:Zs:]];"
// punctuation which may occur at the beginning of a sentence: "starting
// punctuation" and quotation marks
"start=[[:Ps:]\\\"\\\'];"
// punctuation which may occur at the end of a sentence: "ending punctuation"
// and quotation marks
"end=[[:Pe:]\\\"\\\'];"
// digits
"digit=[:N:];"
// characters that unambiguously signal the end of a sentence
"term=[\\!\\?\u3002\uff01\uff1f];"
// periods, which MAY signal the end of a sentence
"period=[\\.\uff0e];"
// characters that may occur at the beginning of a sentence: basically anything
// not mentioned above (lowercase letters and digits are specifically excluded)
"sent-start=[^{lc}{ucLatin}{space}{start}{end}{digit}{term}{period}\u2029{$ignore}];"
// Hindi phrase separator
"danda=[\u0964\u0965];"
// always break sentences after paragraph separators
".*?\u2029?;"
// always break after a danda, if it's followed by whitespace
".*?{danda}{space}*;"
// if you see a period, skip over additional periods, ending punctuation,
// and whitespace, and if the next character is a paragraph separator,
// break after the paragraph separator
".*?{period}[{period}{end}]*{space}*\u2029;"
// if you see a period, skip over additional periods and ending punctuation,
// followed by optional whitespace, followed by optional starting punctuation,
// and if the next character is something that can start a sentence
// (basically, a capital letter), then put the sentence break between the
// whitespace and the opening punctuation
".*?{period}[{period}{end}]*{space}*/({start}*{sent-start}|{start}+{ucLatin});"
// same as above, except that there's a sentence break before a Latin capital
// letter only if there's at least one space after the period
".*?{period}[{period}{end}]*{space}+/{ucLatin};"
// if you see a sentence-terminating character, skip over any additional
// terminators, periods, or ending punctuation, followed by any whitespace,
// followed by a SINGLE optional paragraph separator, and put the break there
".*?{term}[{term}{period}{end}]*{space}*\u2029?;"
// The following rules are here to aid in backwards iteration. The automatically
// generated backwards state table will rewind to the beginning of the
// paragraph all the time (or all the way to the beginning of the document
// if the document doesn't use the Unicode PS character) because the only
// unambiguous character pairs are those involving paragraph separators.
// These specify a few more unambiguous breaking situations.
// if you see a sentence-starting character or an uppercase Latin letter,
// followed by an optional run of starting punctuation (remember, we're
// iterating backwards), followed by a run of at least one whitespace
// character, followed by an optional run of ending punctuation, followed
// by a period, this is a safe place to turn around
"![{sent-start}{ucLatin}]{start}*{space}+{end}*{period};"
// if you see a letter or a digit, followed by an optional run of
// starting punctuation, followed by an optional run of whitespace,
// followed by an optional run of ending punctuation, followed by
// a sentence terminator, this is a safe place to turn around
"![{sent-start}{lc}{digit}]{start}*{space}*{end}*{term};"
}
//------------------------------------------------------------
// END BreakIterator support
//------------------------------------------------------------
// Day-period markers, AM first and PM second.
AmPmMarkers {
"AM",
"PM",
}
Countries {
AF { "Afghanistan" }
AL { "Albania" }
DZ { "Algeria" }
AD { "Andorra" }
AO { "Angola" }
AI { "Anguilla" }
AR { "Argentina" }
AM { "Armenia" }
AW { "Aruba" }
AU { "Australia" }
AT { "Austria" }
AZ { "Azerbaijan" }
BS { "Bahamas" }
BH { "Bahrain" }
BD { "Bangladesh" }
BB { "Barbados" }
BY { "Belarus" }
BE { "Belgium" }
BZ { "Belize" }
BJ { "Benin" }
BM { "Bermuda" }
BT { "Bhutan" }
BO { "Bolivia" }
BA { "Bosnia and Herzegovina" }
BW { "Botswana" }
BR { "Brazil" }
BN { "Brunei" }
BG { "Bulgaria" }
BF { "Burkina Faso" }
BI { "Burundi" }
KH { "Cambodia" }
CM { "Cameroon" }
CA { "Canada" }
CV { "Cape Verde" }
CF { "Central African Republic" }
TD { "Chad" }
CL { "Chile" }
CN { "China" }
CO { "Colombia" }
KM { "Comoros" }
CG { "Congo" }
CR { "Costa Rica" }
CI { "C\u00F4te d'Ivoire" }
HR { "Croatia" }
CU { "Cuba" }
CY { "Cyprus" }
CZ { "Czech Republic" }
DK { "Denmark" }
DJ { "Djibouti" }
DM { "Dominica" }
DO { "Dominican Republic" }
TP { "East Timor" }
EC { "Ecuador" }
EG { "Egypt" }
SV { "El Salvador" }
GQ { "Equatorial Guinea" }
ER { "Eritrea" }
EE { "Estonia" }
ET { "Ethiopia" }
FJ { "Fiji" }
FI { "Finland" }
FO { "Faroe Islands" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
FR { "France" }
GF { "French Guiana" }
GL { "Greenland" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
PF { "French Polynesia" }
TF { "French Southern Territories" }
GA { "Gabon" }
GM { "Gambia" }
GE { "Georgia" }
DE { "Germany" }
GH { "Ghana" }
GR { "Greece" }
GP { "Guadeloupe" }
GT { "Guatemala" }
GN { "Guinea" }
GW { "Guinea-Bissau" }
GY { "Guyana" }
HT { "Haiti" }
HN { "Honduras" }
HK { "Hong Kong" }
HU { "Hungary" }
IS { "Iceland" }
IN { "India" }
ID { "Indonesia" }
IR { "Iran" }
IQ { "Iraq" }
IE { "Ireland" }
IL { "Israel" }
IT { "Italy" }
JM { "Jamaica" }
JP { "Japan" }
JO { "Jordan" }
KZ { "Kazakhstan" }
KE { "Kenya" }
KI { "Kiribati" }
KP { "North Korea" }
KR { "South Korea" }
KW { "Kuwait" }
KG { "Kyrgyzstan" }
LA { "Laos" }
LV { "Latvia" }
LB { "Lebanon" }
LS { "Lesotho" }
LR { "Liberia" }
LY { "Libya" }
LI { "Liechtenstein" }
LT { "Lithuania" }
LU { "Luxembourg" }
MK { "Macedonia" }
MG { "Madagascar" }
MY { "Malaysia" }
ML { "Mali" }
MT { "Malta" }
MQ { "Martinique" }
MR { "Mauritania" }
MU { "Mauritius" }
YT { "Mayotte" }
MX { "Mexico" }
FM { "Micronesia" }
MD { "Moldova" }
MC { "Monaco" }
MN { "Mongolia" }
MS { "Montserrat" }
MA { "Morocco" }
MZ { "Mozambique" }
MM { "Myanmar" }
NA { "Namibia" }
NP { "Nepal" }
NL { "Netherlands" }
AN { "Netherlands Antilles" }
NC { "New Caledonia" }
NZ { "New Zealand" }
NI { "Nicaragua" }
NE { "Niger" }
NG { "Nigeria" }
NU { "Niue" }
NO { "Norway" }
OM { "Oman" }
PK { "Pakistan" }
PA { "Panama" }
PG { "Papua New Guinea" }
PY { "Paraguay" }
PE { "Peru" }
PH { "Philippines" }
PL { "Poland" }
PT { "Portugal" }
PR { "Puerto Rico" }
QA { "Qatar" }
RO { "Romania" }
RU { "Russia" }
RW { "Rwanda" }
SA { "Saudi Arabia" }
SN { "Senegal" }
SP { "Serbia" }
SC { "Seychelles" }
SL { "Sierra Leone" }
SG { "Singapore" }
SK { "Slovakia" }
SI { "Slovenia" }
SO { "Somalia" }
ZA { "South Africa" }
ES { "Spain" }
LK { "Sri Lanka" }
SD { "Sudan" }
SR { "Suriname" }
SZ { "Swaziland" }
SE { "Sweden" }
CH { "Switzerland" }
SY { "Syria" }
TW { "Taiwan" }
TJ { "Tajikistan" }
TZ { "Tanzania" }
TH { "Thailand" }
TG { "Togo" }
TK { "Tokelau" }
TO { "Tonga" }
TT { "Trinidad and Tobago" }
TN { "Tunisia" }
TR { "Turkey" }
TM { "Turkmenistan" }
UG { "Uganda" }
UA { "Ukraine" }
AE { "United Arab Emirates" }
GB { "United Kingdom" }
US { "United States" }
UY { "Uruguay" }
UZ { "Uzbekistan" }
VU { "Vanuatu" }
VA { "Vatican" }
VE { "Venezuela" }
VN { "Vietnam" }
VG { "British Virgin Islands" }
VI { "U.S. Virgin Islands" }
EH { "Western Sahara" }
YE { "Yemen" }
YU { "Yugoslavia" }
ZR { "Zaire" }
ZM { "Zambia" }
ZW { "Zimbabwe" }
}
// Currency strings for the root bundle: the generic currency sign U+00A4,
// the code "XXX", and an empty third entry.
// NOTE(review): the slots are positional; presumably currency symbol,
// international currency code, and monetary decimal separator -- confirm
// against the code that reads this array.
CurrencyElements {
"\u00A4",
"XXX",
"",
}
// Two positional calendar parameters, both "1" here.
// NOTE(review): presumably the first day of the week and the minimal number
// of days in the first week -- confirm against the Calendar loader.
DateTimeElements {
"1",
"1",
}
// Date and time format patterns. Judging by the pattern letters, the first
// four entries format a time of day (most to least detailed; the first two
// are identical), the next four format a calendar date (most to least
// detailed), and the last entry joins two pre-formatted pieces.
// NOTE(review): which of {0} and {1} is the date and which is the time is
// not visible here -- confirm against the DateFormat loader.
DateTimePatterns {
"h:mm:ss a z",
"h:mm:ss a z",
"h:mm:ss a",
"h:mm a",
"EEEE, MMMM d, yyyy",
"MMMM d, yyyy",
"MMM d, yyyy",
"M/d/yy",
"{1} {0}",
}
// Abbreviated weekday names, starting with Sunday.
DayAbbreviations {
"Sun",
"Mon",
"Tue",
"Wed",
"Thu",
"Fri",
"Sat",
}
// Full weekday names, starting with Sunday.
DayNames {
"Sunday",
"Monday",
"Tuesday",
"Wednesday",
"Thursday",
"Friday",
"Saturday",
}
// Era names, "BC" first and "AD" second.
Eras {
"BC",
"AD",
}
Languages {
aa { "Afar" }
ab { "Abkhazian" }
ace { "Achinese" }
ach { "Acoli" }
ada { "Adangme" }
ae { "Avestan" }
af { "Afrikaans" }
afa { "Afro-Asiatic (Other)" }
afh { "Afrihili" }
aka { "Akan" }
akk { "Akkadian" }
ale { "Aleut" }
alg { "Algonquian Languages" }
am { "Amharic" }
ang { "English, Old (ca.450-1100)" }
apa { "Apache Languages"}
ar { "Arabic" }
arc { "Aramaic" }
arn { "Araucanian" }
arp { "Arapaho" }
art { "Artificial (Other)" }
arw { "Arawak" }
as { "Assamese" }
ath { "Athapaskan Languages" }
aus { "Australian Languages" }
ava { "Avaric" }
awa { "Awadhi" }
ay { "Aymara" }
az { "Azerbaijani" }
ba { "Bashkir" }
bad { "Banda" }
bai { "Bamileke Languages" }
bal { "Baluchi" }
bam { "Bambara" }
ban { "Balinese" }
bas { "Basa" }
bat { "Baltic (Other)" }
be { "Belarusian" }
bej { "Beja" }
bem { "Bemba" }
ber { "Berber" }
bg { "Bulgarian" }
bh { "Bihari" }
bho { "Bhojpuri" }
bi { "Bislama" }
bik { "Bikol" }
bin { "Bini" }
bla { "Siksika" }
bn { "Bengali" }
bnt { "Bantu" }
bo { "Tibetan" }
br { "Breton" }
bra { "Braj" }
bs { "Bosnian"}
btk { "Batak" }
bua { "Buriat" }
bug { "Buginese" }
ca { "Catalan" }
cad { "Caddo" }
cai { "Central American Indian (Other)" }
car { "Carib" }
cau { "Caucasian (Other)" }
ce { "Chechen" }
ceb { "Cebuano" }
cel { "Celtic (Other)" }
ch { "Chamorro" }
chb { "Chibcha" }
chg { "Chagatai" }
chk { "Chuukese" }
chm { "Mari" }
chn { "Chinook Jargon" }
cho { "Choctaw" }
chp { "Chipewyan" }
chr { "Cherokee" }
chy { "Cheyenne" }
cmc { "Chamic Languages" }
co { "Corsican" }
cop { "Coptic" }
cpe { "Creoles and Pidgins, English-based (Other)" }
cpf { "Creoles and Pidgins, French-based (Other)" }
cre { "Cree" }
crp { "Creoles and Pidgins (Other)" }
cs { "Czech" }
cu { "Church Slavic" }
cus { "Cushitic (Other)" }
cv { "Chuvash" }
cy { "Welsh" }
da { "Danish" }
dak { "Dakota" }
day { "Dayak" }
de { "German" }
del { "Delaware" }
den { "Slave" }
dgr { "Dogrib" }
din { "Dinka" }
div { "Divehi" }
doi { "Dogri" }
dra { "Dravidian (Other)" }
dua { "Duala" }
dum { "Dutch, Middle (ca. 1050-1350)" }
dyu { "Dyula" }
dz { "Bhutani" }
dzo { "Dzongkha" }
efi { "Efik" }
egy { "Egyptian (Ancient)" }
eka { "Ekajuk" }
el { "Greek" } // Modern (1453-)
elx { "Elamite" }
en { "English" }
enm { "English, Middle (1100-1500)" }
eo { "Esperanto" }
es { "Spanish" }
et { "Estonian" }
eu { "Basque" }
ewe { "Ewe" }
ewo { "Ewondo" }
fa { "Persian" }
fan { "Fang" }
fat { "Fanti" }
fi { "Finnish" }
fiu { "Finno-Ugrian" }
fj { "Fiji" }
fo { "Faeroese" }
fon { "Fon" }
fr { "French" }
frm { "French, Middle (ca.1400-1600)" }
fro { "French, Old (842-ca.1400)" }
ful { "Fulah" }
fur { "Friulian" }
fy { "Frisian" }
ga { "Irish" }
gaa { "Ga" }
gay { "Gayo" }
gba {"Gbaya" }
gd { "Scots Gaelic" }
gem { "Germanic (Other)" }
gil { "Gilbertese" }
gl { "Gallegan" }
gla { "Gaelic (Scots)" }
gmh { "German, Middle High (ca.1050-1500)" }
gn { "Guarani" }
goh { "German, Old High (ca.750-1050)" }
gon { "Gondi" }
gor { "Gorontalo" }
got { "Gothic" }
grb { "Grebo" }
grc { "Greek, Ancient (to 1453)" }
gu { "Gujarati" }
gv { "Manx" }
gwi { "Gwich'in" }
hai { "Haida" }
hau { "Hausa" }
haw { "Hawaiian" }
he { "Hebrew" }
hi { "Hindi" }
him { "Himachali" }
hit { "Hittite" }
hmn { "Hmong" }
ho { "Hiri Motu" }
hr { "Croatian" }
hu { "Hungarian" }
hup { "Hupa" }
hy { "Armenian" }
hz { "Herero" }
ia { "Interlingua" }
iba { "Iban" }
ibo { "Igbo" }
id { "Indonesian" }
ie { "Interlingue" }
ijo { "Ijo" }
ik { "Inupiak" }
ilo { "Iloko" }
inc { "Indic (Other)" }
ine { "Indo-European" }
ira { "Iranian" }
iro { "Iroquoian Languages" }
is { "Icelandic" }
it { "Italian" }
iu { "Inuktitut" }
iw { "Hebrew" }
ja { "Japanese" }
jpr { "Judeo-Persian" }
jrb { "Judeo-Arabic" }
jw { "Javanese" }
ka { "Georgian" }
kaa { "Kara-Kalpak" }
kab { "Kabyle" }
kac { "Kachin" }
kam { "Kamba" }
kar { "Karen" }
kau { "Kanuri" }
kaw { "Kawi" }
kha { "Khasi" }
khi { "Khoisan" }
kho { "Khotanese" }
ki { "Kikuyu" }
kk { "Kazakh" }
kl { "Kalaallisut" }
km { "Khmer" }
kmb { "Kimbundu" }
kn { "Kannada" }
ko { "Korean" }
kok { "Konkani" }
kon { "Kongo" }
kos { "Kosrean" }
kpe { "Kpelle" }
kro { "Kru" }
kru { "Kurukh" }
ks { "Kashmiri" }
ku { "Kurdish" }
kum { "Kumyk" }
kut { "Kutenai" }
kv { "Komi" }
kw { "Cornish" }
ky { "Kirghiz" }
la { "Latin" }
lad { "Ladino" }
lah { "Lahnda" }
lam { "Lamba" }
lb { "Letzeburgesch" }
lez { "Lezghian" }
lin { "Lingala" }
lit { "Lithuanian" }
ln { "Lingala" }
lo { "Lao" }
lol { "Mongo" }
loz { "Lozi" }
lt { "Lithuanian" }
lua { "Luba-Lulua" }
lub { "Luba-Katanga" }
lug { "Ganda" }
lui { "Luiseno" }
lun { "Lunda" }
luo { "Luo" }
lus { "Lushai" }
lv { "Latvian (Lettish)" }
mad { "Madurese" }
mag { "Magahi" }
mai { "Maithili" }
mak { "Makasar" }
man { "Mandingue" }
map { "Austronesian" }
mas { "Masai" }
mdr { "Mandar" }
men { "Mende" }
mg { "Malagasy" }
mga { "Irish, Middle (900-1200)" }
mh { "Marshall"}
mi { "Maori" }
mic { "Mic-Mac" }
min { "Minangkabau" }
mis { "Miscellaneous Languages" }
mk { "Macedonian" }
mkh { "Mon-Khmer (Other)" }
ml { "Malayalam" }
mn { "Mongolian" }
mnc { "Manchu" }
mni { "Manipuri" }
mno { "Manobo Languages" }
mo { "Moldavian" }
moh { "Mohawk" }
mos { "Mossi" }
mr { "Marathi" }
ms { "Malay" }
mt { "Maltese" }
mul { "Multiple Languages" }
mun { "Munda Languages" }
mus { "Creek" }
mwr { "Marwari" }
my { "Burmese" }
myn { "Mayan" }
na { "Nauru" }
nah { "Nahuatl" }
nai { "North American Indian (Other)" }
nb { "Norwegian Bokm\u00e5l" }
nd { "Ndebele, North" }
nds { "Low German; Low Saxon" }
ne { "Nepali" }
new { "Newari" }
ng { "Ndonga" }
nia { "Nias" }
nic { "Niger-Kordofanian" }
niu { "Niuean" }
nl { "Dutch" }
nn { "Norwegian Nynorsk" }
no { "Norwegian" }
non { "Norse, Old" }
nr { "Ndebele, South" }
nso { "Sotho, Northern" }
nub { "Nubian Languages" }
nv {"Navajo"}
ny { "Chichewa; Nyanja" }
nym { "Nyamwezi" }
nyo { "Nyoro" }
nzi { "Nzima" }
oc { "Proven\u00E7al; Occitan (post 1500)"}
oji { "Ojibwa" }
om { "Oromo (Afan)" }
or { "Oriya" }
os { "Ossetic" }
osa { "Osage" }
ota { "Turkish (Ottoman Empire)" }
oto { "Otomian Languages" }
pa { "Punjabi" }
paa { "Papuan (Other)" }
pag { "Pangasinan" }
pal { "Pahlavi" }
pam { "Pampanga" }
pap { "Papiamento" }
pau { "Palauan" }
peo { "Persian, Old (ca.600-400 B.C.)" }
phi { "Philippine (Other)" }
phn { "Phoenician" }
pi { "Pali" }
pl { "Polish" }
pon { "Pohnpeian" }
pra { "Prakrit Languages" }
pro { "Proven\u00E7al, Old (to 1500)" }
ps { "Pashto (Pushto)" }
pt { "Portuguese" }
qu { "Quechua" }
raj { "Rajasthani" }
rap { "Rapanui" }
rar { "Rarotongan" }
rm { "Rhaeto-Romance" }
rn { "Rundi" }
ro { "Romanian" }
roa { "Romance (Other)" }
rom { "Romany" }
ru { "Russian" }
rw { "Kinyarwanda" }
sa { "Sanskrit" }
sad { "Sandawe" }
sah { "Yakut" }
sai { "South American Indian (Other)" }
sal { "Salishan" }
sam { "Samaritan" }
sas { "Sasak" }
sat { "Santali" }
sc { "Sardinian" }
sco { "Scots" }
sd { "Sindhi" }
se { "Northern Sami" }
// http://lcweb.loc.gov/standards/iso639-2/englangn.html
// should provide the correct language code soon
// se { "Sami Languages" } // DUP FIXME
sel { "Selkup" }
sem { "Semitic" }
sg { "Sango" }
sga { "Irish, Old (to 900)" }
sgn { "Sign Languages" }
sh { "Serbo-Croatian" }
shn { "Shan" }
si { "Sinhalese" }
sid { "Sidamo" }
sio { "Siouan Languages" }
sit { "Sino-Tibetan (Other)" }
sk { "Slovak" }
sl { "Slovenian" }
sm { "Samoan" }
sn { "Shona" }
snk { "Soninke" }
so { "Somali" }
sog { "Sogdian" }
son { "Songhai" }
sq { "Albanian" }
sr { "Serbian" }
srr { "Serer" }
ss { "Swati" }
ssa { "Nilo-Saharan" }
st { "Sotho, Southern" }
su { "Sundanese" }
suk { "Sukuma" }
sus { "Susu" }
sux { "Sumerian"}
sv { "Swedish" }
sw { "Swahili" }
syr { "Syriac" }
ta { "Tamil" }
tai { "Tai (Other)" }
te { "Telugu" }
tem { "Timne" }
ter { "Tereno" }
tet { "Tetum" }
tg { "Tajik" }
th { "Thai" }
tig { "Tigre" }
tir { "Tigrinya" }
tiv { "Tiv" }
tk { "Turkmen" }
tl { "Tagalog" }
tli { "Tlingit" }
tmh { "Tamashek" }
tn { "Tswana" }
tog { "Tonga (Nyasa)" }
ton { "Tongan (Tonga Islands)" }
tr { "Turkish" }
ts { "Tsonga" }
tsi { "Tsimshian" }
tt { "Tatar" }
tum { "Tumbuka" }
tur { "Turkish" }
tut { "Altaic (Other)" }
tvl { "Tuvalu" }
tw { "Twi" }
ty { "Tahitian" }
tyv { "Tuvinian" }
ug { "Uighur" }
uga { "Ugaritic" }
uk { "Ukrainian" }
umb { "Umbundu" }
und { "Undetermined" }
ur { "Urdu" }
uz { "Uzbek" }
vai { "Vai" }
ven { "Venda" }
vi { "Vietnamese" }
vo { "Volapuk" }
vot { "Votic" }
wak { "Wakashan Languages" }
wal { "Walamo" }
war { "Waray" }
was { "Washo" }
wen { "Sorbian Languages" }
wo { "Wolof" }
xh { "Xhosa" }
yao { "Yao" }
yap { "Yapese" }
yi { "Yiddish" }
yor { "Yoruba" }
ypk { "Yupik Languages" }
za { "Zhuang" }
zap { "Zapotec" }
zen { "Zenaga" }
zh { "Chinese" }
znd { "Zande" }
zu { "Zulu" }
zun { "Zuni" }
}
LocaleID { "0000" }
LocaleString { "en" }
// Abbreviated month names, January through December, followed by an empty
// thirteenth entry.
// NOTE(review): the empty entry is presumably a placeholder for a
// thirteenth month slot -- confirm against the code that reads this array.
MonthAbbreviations {
"Jan",
"Feb",
"Mar",
"Apr",
"May",
"Jun",
"Jul",
"Aug",
"Sep",
"Oct",
"Nov",
"Dec",
"",
}
// Full month names, January through December, followed by an empty
// thirteenth entry.
// NOTE(review): the empty entry is presumably a placeholder for a
// thirteenth month slot -- confirm against the code that reads this array.
MonthNames {
"January",
"February",
"March",
"April",
"May",
"June",
"July",
"August",
"September",
"October",
"November",
"December",
"",
}
// Symbols used when formatting numbers; the array has eleven positional slots.
// NOTE(review): presumably, in order: decimal separator, grouping separator,
// pattern separator, percent, zero digit, digit placeholder, minus sign,
// exponent, per-mille, infinity, and not-a-number -- confirm against the
// code that reads this array.
NumberElements {
".",
",",
";",
"%",
"0",
"#",
"-",
"E",
"\u2030",
"\u221E",
"\uFFFD",
}
// Number format patterns: a plain decimal pattern, a pattern containing the
// currency sign U+00A4, and a percent pattern. The first two give two
// sub-patterns separated by ";", the second one prefixed with "-".
// NOTE(review): presumably the positive and negative forms -- confirm
// against the NumberFormat documentation.
NumberPatterns {
"#,##0.###;-#,##0.###",
"\u00A4 #,##0.00;-\u00A4 #,##0.00",
"#,##0%",
}
ShortCountry { "" }
ShortLanguage { "eng" }
// NOTE(review): presumably the localized date/time pattern letters, in the
// positional order the date formatter expects -- confirm before reordering.
localPatternChars { "GyMdkHmsSEDFwWahKzYe" }
// Display strings for time zones, one six-element row per zone. Judging by
// the contents, each row holds: a zone ID, the long standard-time name, the
// short standard-time name, the long daylight-time name, the short
// daylight-time name, and a city name.
// The Phoenix and Indianapolis rows repeat the standard-time strings in the
// daylight-time slots.
// NOTE(review): the short names "AST"/"ADT" appear in both the Halifax row
// and the Anchorage row, so these abbreviations do not identify a single
// zone -- confirm this is acceptable for code that parses short zone names.
zoneStrings {
{
"PST",
"Pacific Standard Time",
"PST",
"Pacific Daylight Time",
"PDT",
"San Francisco",
}
{
"MST",
"Mountain Standard Time",
"MST",
"Mountain Daylight Time",
"MDT",
"Denver",
}
{
"PNT",
"Mountain Standard Time",
"MST",
"Mountain Standard Time",
"MST",
"Phoenix",
}
{
"CST",
"Central Standard Time",
"CST",
"Central Daylight Time",
"CDT",
"Chicago",
}
{
"EST",
"Eastern Standard Time",
"EST",
"Eastern Daylight Time",
"EDT",
"New York",
}
{
"IET",
"Eastern Standard Time",
"EST",
"Eastern Standard Time",
"EST",
"Indianapolis",
}
{
"PRT",
"Atlantic Standard Time",
"AST",
"Atlantic Daylight Time",
"ADT",
"Halifax",
}
{
"HST",
"Hawaii Standard Time",
"HST",
"Hawaii Daylight Time",
"HDT",
"Honolulu",
}
{
"AST",
"Alaska Standard Time",
"AST",
"Alaska Daylight Time",
"ADT",
"Anchorage",
}
}
}