00e92f1e03
X-SVN-Rev: 4818
1167 lines
37 KiB
Plaintext
1167 lines
37 KiB
Plaintext
// *******************************************************************************
|
|
// *
|
|
// * Copyright (C) 1997-2001, International Business Machines
|
|
// * Corporation and others. All Rights Reserved.
|
|
// *
|
|
// *******************************************************************************
|
|
// Date Name Description
|
|
// 11/17/99 aliu Added support for transliterators.
|
|
|
|
// Please search for 'DUP FIXME' - duplicate lang/country names commented out
|
|
|
|
|
|
|
|
root {
|
|
Version { "3.1.1" }
|
|
"%%EURO" { "Euro" } // Euro variant display name
|
|
"%%B" { "Bokm\u00e5l" } // Norwegian variant display name
|
|
"%%NY" { "Nynorsk" } // Norwegian variant display name
|
|
"%%AL" { "\u00C5land" } // Aland variant display name
|
|
"%%UCARULES" { "UCARules.txt"} // UCARules
|
|
// no collation elements any more
|
|
// CollationElements {
|
|
// Version { "1.0" }
|
|
// Override { "FALSE" }
|
|
// Sequence { "" }
|
|
// }
|
|
// Formats for the display name of a locale, for a list of
|
|
// items, and for composing two items in a list into one item.
|
|
// The list patterns are used in the variant name and in the
|
|
// full display name.
|
|
//
|
|
// This is the language-neutral form of this resource.
|
|
//
|
|
LocaleNamePatterns {
|
|
{
|
|
"{0,choice,0#|1#{1}|2#{1} ({2})}", // Display name
|
|
"{0,choice,0#|1#{1}|2#{1},{2}|3#{1},{2},{3}}", // List
|
|
"{0},{1}" // List composition
|
|
}
|
|
}
|
|
|
|
//------------------------------------------------------------
|
|
// BEGIN Transliterator support
|
|
//------------------------------------------------------------
|
|
|
|
// See also icu/data/translit/index.txt
|
|
|
|
TransliteratorNamePattern {
|
|
// Format for the display name of a Transliterator.
|
|
// This is the language-neutral form of this resource.
|
|
"{0,choice,0#|1#{1}|2#{1}-{2}}" // Display name
|
|
}
|
|
|
|
//------------------------------------------------------------
|
|
// END Transliterator support
|
|
//------------------------------------------------------------
|
|
|
|
//------------------------------------------------------------
|
|
// BEGIN BreakIterator support
|
|
//------------------------------------------------------------
|
|
|
|
CharacterBreakRules {
|
|
// ignore non-spacing marks and enclosing marks (since we never
|
|
// put a break before ignore characters, this keeps combining
|
|
// accents with the base characters they modify)
|
|
"$ignore=[[:Mn:][:Me:]];"
|
|
|
|
// other category definitions
|
|
"choseong=[\u1100-\u115f];"
|
|
"jungseong=[\u1160-\u11a7];"
|
|
"jongseong=[\u11a8-\u11ff];"
|
|
"surr-hi=[\ud800-\udbff];"
|
|
"surr-lo=[\udc00-\udfff];"
|
|
|
|
// break after every character, except as follows:
|
|
".;"
|
|
|
|
// keep CRLF sequences together
|
|
"\r\n;"
|
|
|
|
// keep surrogate pairs together
|
|
"{surr-hi}{surr-lo};"
|
|
|
|
// keep Hangul syllables spelled out using conjoining jamo together
|
|
"{choseong}*{jungseong}*{jongseong}*;"
|
|
|
|
// various additions for Hindi support
|
|
"nukta=[\u093c];"
|
|
"danda=[\u0964\u0965];"
|
|
"virama=[\u094d];"
|
|
"devVowelSign=[\u093e-\u094c\u0962\u0963];"
|
|
"devConsonant=[\u0915-\u0939];"
|
|
"devNuktaConsonant=[\u0958-\u095f];"
|
|
"devCharEnd=[\u0902\u0903\u0951-\u0954];"
|
|
"zwj=[\u200d];"
|
|
|
|
"devCAMN=({devConsonant}{nukta}?);"
|
|
"devConsonant1=({devNuktaConsonant}|{devCAMN});"
|
|
"devConjunct=(({devConsonant1}{virama}{zwj}?)?{devConsonant1});"
|
|
|
|
"{devConjunct}{devVowelSign}?{devCharEnd}?;"
|
|
"{danda}{nukta};"
|
|
}
|
|
|
|
// default rules for finding word boundaries
|
|
WordBreakRules {
|
|
// ignore non-spacing marks, enclosing marks, and format characters,
|
|
// all of which should not influence the algorithm
|
|
"$ignore=[[:Mn:][:Me:][:Cf:]];"
|
|
|
|
// Hindi phrase separator, kanji, katakana, hiragana, CJK diacriticals,
|
|
// other letters, and digits
|
|
"danda=[\u0964\u0965];"
|
|
"kanji=[\u3005\u4e00-\u9fa5\uf900-\ufa2d];"
|
|
"kata=[\u3099-\u309c\u30a1-\u30fe];"
|
|
"hira=[\u3041-\u309e\u30fc];"
|
|
"let=[[[:L:][:Mc:]]-[{kanji}{kata}{hira}]];"
|
|
"dgt=[:N:];"
|
|
|
|
// punctuation that can occur in the middle of a word: currently
|
|
// dashes, apostrophes, quotation marks, and periods
|
|
"mid-word=[[:Pd:]\u00ad\u2027\\\"\\\'\\.];"
|
|
|
|
// punctuation that can occur in the middle of a number: currently
|
|
// apostrophes, qoutation marks, periods, commas, and the Arabic
|
|
// decimal point
|
|
"mid-num=[\\\"\\\'\\,\u066b\\.];"
|
|
|
|
// punctuation that can occur at the beginning of a number: currently
|
|
// the period, the number sign, and all currency symbols except the cents sign
|
|
"pre-num=[[[:Sc:]-[\u00a2]]\\#\\.];"
|
|
|
|
// punctuation that can occur at the end of a number: currently
|
|
// the percent, per-thousand, per-ten-thousand, and Arabic percent
|
|
// signs, the cents sign, and the ampersand
|
|
"post-num=[\\%\\&\u00a2\u066a\u2030\u2031];"
|
|
|
|
// line separators: currently LF, FF, PS, and LS
|
|
"ls=[\n\u000c\u2028\u2029];"
|
|
|
|
// whitespace: all space separators and the tab character
|
|
"ws=[[:Zs:]\t];"
|
|
|
|
// a word is a sequence of letters that may contain internal
|
|
// punctuation, as long as it begins and ends with a letter and
|
|
// never contains two punctuation marks in a row
|
|
"word=({let}+({mid-word}{let}+)*{danda}?);"
|
|
|
|
// a number is a sequence of digits that may contain internal
|
|
// punctuation, as long as it begins and ends with a digit and
|
|
// never contains two punctuation marks in a row.
|
|
"number=({dgt}+({mid-num}{dgt}+)*);"
|
|
|
|
// break after every character, with the following exceptions
|
|
// (this will cause punctuation marks that aren't considered
|
|
// part of words or numbers to be treated as words unto themselves)
|
|
".;"
|
|
|
|
// keep together any sequence of contiguous words and numbers
|
|
// (including just one of either), plus an optional trailing
|
|
// number-suffix character
|
|
"{word}?({number}{word})*({number}{post-num}?)?;"
|
|
|
|
// keep together and sequence of contiguous words and numbers
|
|
// that starts with a number-prefix character and a number,
|
|
// and may end with a number-suffix character
|
|
"{pre-num}({number}{word})*({number}{post-num}?)?;"
|
|
|
|
// keep together runs of whitespace (optionally with a single trailing
|
|
// line separator or CRLF sequence)
|
|
"{ws}*\r?{ls}?;"
|
|
|
|
// keep together runs of Katakana
|
|
"{kata}*;"
|
|
|
|
// keep together runs of Hiragana
|
|
"{hira}*;"
|
|
|
|
// keep together runs of Kanji
|
|
"{kanji}*;"
|
|
}
|
|
|
|
// default rules for determining legal line-breaking positions
|
|
LineBreakRules {
|
|
// ignore non-spacing marks, enclosing marks, and format characters
|
|
"$ignore=[[:Mn:][:Me:][:Cf:]];"
|
|
|
|
// Hindi phrase separators
|
|
"danda=[\u0964\u0965];"
|
|
|
|
// characters that always cause a break: ETX, tab, LF, FF, LS, and PS
|
|
"break=[\u0003\t\n\f\u2028\u2029];"
|
|
|
|
// characters that always prevent a break: the non-breaking space
|
|
// and similar characters
|
|
"nbsp=[\u00a0\u2007\u2011\ufeff];"
|
|
|
|
// whitespace: space separators and control characters, except for
|
|
// CR and the other characters mentioned above
|
|
"space=[[[:Zs:][:Cc:]]-[{nbsp}{break}\r]];"
|
|
|
|
// dashes: dash punctuation and the discretionary hyphen, except for
|
|
// non-breaking hyphens
|
|
"dash=[[[:Pd:]\u00ad]-[{nbsp}]];"
|
|
|
|
// characters that stick to a word if they precede it: currency symbols
|
|
// (except the cents sign) and starting punctuation
|
|
"pre-word=[[[:Sc:]-[\u00a2]][:Ps:]\\\"\\\'];"
|
|
|
|
// characters that stick to a word if they follow it: ending punctuation,
|
|
// other punctuation that usually occurs at the end of a sentence,
|
|
// small Kana characters, some CJK diacritics, etc.
|
|
"post-word=[[:Pe:]\\!\\\"\\\'\\%\\.\\,\\:\\;\\?\u00a2\u00b0\u066a\u2030-\u2034"
|
|
"\u2103\u2105\u2109\u3001\u3002\u3005\u3041\u3043\u3045\u3047\u3049\u3063"
|
|
"\u3083\u3085\u3087\u308e\u3099-\u309e\u30a1\u30a3\u30a5\u30a7\u30a9"
|
|
"\u30c3\u30e3\u30e5\u30e7\u30ee\u30f5\u30f6\u30fc-\u30fe\uff01\uff0c"
|
|
"\uff0e\uff1f];"
|
|
|
|
// Kanji: actually includes both Kanji and Kana, except for small Kana and
|
|
// CJK diacritics
|
|
"kanji=[[\u4e00-\u9fa5\uf900-\ufa2d\u3041-\u3094\u30a1-\u30fa]-[{post-word}{$ignore}]];"
|
|
|
|
// digits
|
|
"digit=[[:Nd:][:No:]];"
|
|
|
|
// punctuation that can occur in the middle of a number: periods and commas
|
|
"mid-num=[\\.\\,];"
|
|
|
|
// everything not mentioned above, plus the quote marks (which are both
|
|
// <pre-word>, <post-word>, and <char>)
|
|
"char=[^{break}{space}{dash}{kanji}{nbsp}{$ignore}{pre-word}{post-word}{mid-num}{danda}\r\\\"\\\'];"
|
|
|
|
// a "number" is a run of prefix characters and dashes, followed by one or
|
|
// more digits with isolated number-punctuation characters interspersed
|
|
"number=([{pre-word}{dash}]*{digit}+({mid-num}{digit}+)*);"
|
|
|
|
// the basic core of a word can be either a "number" as defined above, a single
|
|
// "Kanji" character, or a run of any number of not-explicitly-mentioned
|
|
// characters (this includes Latin letters)
|
|
"word-core=([{pre-word}{char}]*|{kanji}|{number});"
|
|
|
|
// a word may end with an optional suffix that be either a run of one or
|
|
// more dashes or a run of word-suffix characters, followed by an optional
|
|
// run of whitespace
|
|
"word-suffix=(({dash}+|{post-word}*){space}*);"
|
|
|
|
// a word, thus, is an optional run of word-prefix characters, followed by
|
|
// a word core and a word suffix (the syntax of <word-core> and <word-suffix>
|
|
// actually allows either of them to match the empty string, putting a break
|
|
// between things like ")(" or "aaa(aaa"
|
|
"word=({pre-word}*{word-core}{word-suffix});"
|
|
|
|
// finally, the rule that does the work: Keep together any run of words that
|
|
// are joined by runs of one of more non-spacing mark. Also keep a trailing
|
|
// line-break character or CRLF combination with the word. (line separators
|
|
// "win" over nbsp's)
|
|
"{word}({nbsp}+{word})*\r?{break}?;"
|
|
}
|
|
|
|
// default rules for finding sentence boundaries
|
|
SentenceBreakRules {
|
|
// ignore non-spacing marks, enclosing marks, and format characters
|
|
"$ignore=[[:Mn:][:Me:][:Cf:]];"
|
|
|
|
// lowercase letters
|
|
"lc=[:Ll:];"
|
|
|
|
// uppercase Latin letters
|
|
"ucLatin=[A-Z];"
|
|
|
|
// whitespace (line separators are treated as whitespace)
|
|
"space=[\t\r\f\n\u2028[:Zs:]];"
|
|
|
|
// punctuation which may occur at the beginning of a sentence: "starting
|
|
// punctuation" and quotation marks
|
|
"start=[[:Ps:]\\\"\\\'];"
|
|
|
|
// punctuation with may occur at the end of a sentence: "ending punctuation"
|
|
// and quotation marks
|
|
"end=[[:Pe:]\\\"\\\'];"
|
|
|
|
// digits
|
|
"digit=[:N:];"
|
|
|
|
// characters that unambiguously signal the end of a sentence
|
|
"term=[\\!\\?\u3002\uff01\uff1f];"
|
|
|
|
// periods, which MAY signal the end of a sentence
|
|
"period=[\\.\uff0e];"
|
|
|
|
// characters that may occur at the beginning of a sentence: basically anything
|
|
// not mentioned above (lowercase letters and digits are specifically excluded)
|
|
"sent-start=[^{lc}{ucLatin}{space}{start}{end}{digit}{term}{period}\u2029{$ignore}];"
|
|
|
|
// Hindi phrase separator
|
|
"danda=[\u0964\u0965];"
|
|
|
|
// always break sentences after paragraph separators
|
|
".*?\u2029?;"
|
|
|
|
// always break after a danda, if it's followed by whitespace
|
|
".*?{danda}{space}*;"
|
|
|
|
// if you see a period, skip over additional periods and ending punctuation
|
|
// and if the next character is a paragraph separator, break after the
|
|
// paragraph separator
|
|
".*?{period}[{period}{end}]*{space}*\u2029;"
|
|
|
|
// if you see a period, skip over additional periods and ending punctuation,
|
|
// followed by optional whitespace, followed by optional starting punctuation,
|
|
// and if the next character is something that can start a sentence
|
|
// (basically, a capital letter), then put the sentence break between the
|
|
// whitespace and the opening punctuation
|
|
".*?{period}[{period}{end}]*{space}*/({start}*{sent-start}|{start}+{ucLatin});"
|
|
|
|
// same as above, except that there's a sentence break before a Latin capital
|
|
// letter only if there's at least one space after the period
|
|
".*?{period}[{period}{end}]*{space}+/{ucLatin};"
|
|
|
|
// if you see a sentence-terminating character, skip over any additional
|
|
// terminators, periods, or ending punctuation, followed by any whitespace,
|
|
// followed by a SINGLE optional paragraph separator, and put the break there
|
|
".*?{term}[{term}{period}{end}]*{space}*\u2029?;"
|
|
|
|
// The following rules are here to aid in backwards iteration. The automatically
|
|
// generated backwards state table will rewind to the beginning of the
|
|
// paragraph all the time (or all the way to the beginning of the document
|
|
// if the document doesn't use the Unicode PS character) because the only
|
|
// unambiguous character pairs are those involving paragraph separators.
|
|
// These specify a few more unambiguous breaking situations.
|
|
|
|
// if you see a sentence-starting character, followed by starting punctuation
|
|
// (remember, we're iterating backwards), followed by an optional run of
|
|
// whitespace, followed by an optional run of ending punctuation, followed
|
|
// by a period, this is a safe place to turn around
|
|
"![{sent-start}{ucLatin}]{start}*{space}+{end}*{period};"
|
|
|
|
// if you see a letter or a digit, followed by an optional run of
|
|
// starting punctuation, followed by an optional run of whitespace,
|
|
// followed by an optional run of ending punctuation, followed by
|
|
// a sentence terminator, this is a safe place to turn around
|
|
"![{sent-start}{lc}{digit}]{start}*{space}*{end}*{term};"
|
|
}
|
|
|
|
//------------------------------------------------------------
|
|
// END BreakIterator support
|
|
//------------------------------------------------------------
|
|
|
|
AmPmMarkers {
|
|
"AM",
|
|
"PM",
|
|
}
|
|
Countries {
|
|
AF { "Afghanistan" }
|
|
AL { "Albania" }
|
|
DZ { "Algeria" }
|
|
AD { "Andorra" }
|
|
AO { "Angola" }
|
|
AI { "Anguilla" }
|
|
AR { "Argentina" }
|
|
AM { "Armenia" }
|
|
AW { "Aruba" }
|
|
AU { "Australia" }
|
|
AT { "Austria" }
|
|
AZ { "Azerbaijan" }
|
|
BS { "Bahamas" }
|
|
BH { "Bahrain" }
|
|
BD { "Bangladesh" }
|
|
BB { "Barbados" }
|
|
BY { "Belarus" }
|
|
BE { "Belgium" }
|
|
BZ { "Belize" }
|
|
BJ { "Benin" }
|
|
BM { "Bermuda" }
|
|
BT { "Bhutan" }
|
|
BO { "Bolivia" }
|
|
BA { "Bosnia and Herzegovina" }
|
|
BW { "Botswana" }
|
|
BR { "Brazil" }
|
|
BN { "Brunei" }
|
|
BG { "Bulgaria" }
|
|
BF { "Burkina Faso" }
|
|
BI { "Burundi" }
|
|
KH { "Cambodia" }
|
|
CM { "Cameroon" }
|
|
CA { "Canada" }
|
|
CV { "Cape Verde" }
|
|
CF { "Central African Republic" }
|
|
TD { "Chad" }
|
|
CL { "Chile" }
|
|
CN { "China" }
|
|
CO { "Colombia" }
|
|
KM { "Comoros" }
|
|
CG { "Congo" }
|
|
CR { "Costa Rica" }
|
|
CI { "C\u00F4te d'Ivoire" }
|
|
HR { "Croatia" }
|
|
CU { "Cuba" }
|
|
CY { "Cyprus" }
|
|
CZ { "Czech Republic" }
|
|
DK { "Denmark" }
|
|
DJ { "Djibouti" }
|
|
DM { "Dominica" }
|
|
DO { "Dominican Republic" }
|
|
TP { "East Timor" }
|
|
EC { "Ecuador" }
|
|
EG { "Egypt" }
|
|
SV { "El Salvador" }
|
|
GQ { "Equatorial Guinea" }
|
|
ER { "Eritrea" }
|
|
EE { "Estonia" }
|
|
ET { "Ethiopia" }
|
|
FJ { "Fiji" }
|
|
FI { "Finland" }
|
|
FO { "Faroe Islands" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
|
|
FR { "France" }
|
|
GF { "French Guiana" }
|
|
GL { "Greenland" } // http://www.din.de/gremien/nas/nabd/iso3166ma/codlstp1/en_listp1.html
|
|
PF { "French Polynesia" }
|
|
TF { "French Southern Territories" }
|
|
GA { "Gabon" }
|
|
GM { "Gambia" }
|
|
GE { "Georgia" }
|
|
DE { "Germany" }
|
|
GH { "Ghana" }
|
|
GR { "Greece" }
|
|
GP { "Guadeloupe" }
|
|
GT { "Guatemala" }
|
|
GN { "Guinea" }
|
|
GW { "Guinea-Bissau" }
|
|
GY { "Guyana" }
|
|
HT { "Haiti" }
|
|
HN { "Honduras" }
|
|
HK { "Hong Kong" }
|
|
HU { "Hungary" }
|
|
IS { "Iceland" }
|
|
IN { "India" }
|
|
ID { "Indonesia" }
|
|
IR { "Iran" }
|
|
IQ { "Iraq" }
|
|
IE { "Ireland" }
|
|
IL { "Israel" }
|
|
IT { "Italy" }
|
|
JM { "Jamaica" }
|
|
JP { "Japan" }
|
|
JO { "Jordan" }
|
|
KZ { "Kazakhstan" }
|
|
KE { "Kenya" }
|
|
KI { "Kiribati" }
|
|
KP { "North Korea" }
|
|
KR { "South Korea" }
|
|
KW { "Kuwait" }
|
|
KG { "Kyrgyzstan" }
|
|
LA { "Laos" }
|
|
LV { "Latvia" }
|
|
LB { "Lebanon" }
|
|
LS { "Lesotho" }
|
|
LR { "Liberia" }
|
|
LY { "Libya" }
|
|
LI { "Liechtenstein" }
|
|
LT { "Lithuania" }
|
|
LU { "Luxembourg" }
|
|
MK { "Macedonia" }
|
|
MG { "Madagascar" }
|
|
MY { "Malaysia" }
|
|
ML { "Mali" }
|
|
MT { "Malta" }
|
|
MQ { "Martinique" }
|
|
MR { "Mauritania" }
|
|
MU { "Mauritius" }
|
|
YT { "Mayotte" }
|
|
MX { "Mexico" }
|
|
FM { "Micronesia" }
|
|
MD { "Moldova" }
|
|
MC { "Monaco" }
|
|
MN { "Mongolia" }
|
|
MS { "Montserrat" }
|
|
MA { "Morocco" }
|
|
MZ { "Mozambique" }
|
|
MM { "Myanmar" }
|
|
NA { "Namibia" }
|
|
NP { "Nepal" }
|
|
NL { "Netherlands" }
|
|
AN { "Netherlands Antilles" }
|
|
NC { "New Caledonia" }
|
|
NZ { "New Zealand" }
|
|
NI { "Nicaragua" }
|
|
NE { "Niger" }
|
|
NG { "Nigeria" }
|
|
NU { "Niue" }
|
|
NO { "Norway" }
|
|
OM { "Oman" }
|
|
PK { "Pakistan" }
|
|
PA { "Panama" }
|
|
PG { "Papua New Guinea" }
|
|
PY { "Paraguay" }
|
|
PE { "Peru" }
|
|
PH { "Philippines" }
|
|
PL { "Poland" }
|
|
PT { "Portugal" }
|
|
PR { "Puerto Rico" }
|
|
QA { "Qatar" }
|
|
RO { "Romania" }
|
|
RU { "Russia" }
|
|
RW { "Rwanda" }
|
|
SA { "Saudi Arabia" }
|
|
SN { "Senegal" }
|
|
SP { "Serbia" }
|
|
SC { "Seychelles" }
|
|
SL { "Sierra Leone" }
|
|
SG { "Singapore" }
|
|
SK { "Slovakia" }
|
|
SI { "Slovenia" }
|
|
SO { "Somalia" }
|
|
ZA { "South Africa" }
|
|
ES { "Spain" }
|
|
LK { "Sri Lanka" }
|
|
SD { "Sudan" }
|
|
SR { "Suriname" }
|
|
SZ { "Swaziland" }
|
|
SE { "Sweden" }
|
|
CH { "Switzerland" }
|
|
SY { "Syria" }
|
|
TW { "Taiwan" }
|
|
TJ { "Tajikistan" }
|
|
TZ { "Tanzania" }
|
|
TH { "Thailand" }
|
|
TG { "Togo" }
|
|
TK { "Tokelau" }
|
|
TO { "Tonga" }
|
|
TT { "Trinidad and Tobago" }
|
|
TN { "Tunisia" }
|
|
TR { "Turkey" }
|
|
TM { "Turkmenistan" }
|
|
UG { "Uganda" }
|
|
UA { "Ukraine" }
|
|
AE { "United Arab Emirates" }
|
|
GB { "United Kingdom" }
|
|
US { "United States" }
|
|
UY { "Uruguay" }
|
|
UZ { "Uzbekistan" }
|
|
VU { "Vanuatu" }
|
|
VA { "Vatican" }
|
|
VE { "Venezuela" }
|
|
VN { "Vietnam" }
|
|
VG { "British Virgin Islands" }
|
|
VI { "U.S. Virgin Islands" }
|
|
EH { "Western Sahara" }
|
|
YE { "Yemen" }
|
|
YU { "Yugoslavia" }
|
|
ZR { "Zaire" }
|
|
ZM { "Zambia" }
|
|
ZW { "Zimbabwe" }
|
|
}
|
|
CurrencyElements {
|
|
"\u00A4",
|
|
"XXX",
|
|
"",
|
|
}
|
|
DateTimeElements {
|
|
"1",
|
|
"1",
|
|
}
|
|
DateTimePatterns {
|
|
"h:mm:ss a z",
|
|
"h:mm:ss a z",
|
|
"h:mm:ss a",
|
|
"h:mm a",
|
|
"EEEE, MMMM d, yyyy",
|
|
"MMMM d, yyyy",
|
|
"MMM d, yyyy",
|
|
"M/d/yy",
|
|
"{1} {0}",
|
|
}
|
|
DayAbbreviations {
|
|
"Sun",
|
|
"Mon",
|
|
"Tue",
|
|
"Wed",
|
|
"Thu",
|
|
"Fri",
|
|
"Sat",
|
|
}
|
|
DayNames {
|
|
"Sunday",
|
|
"Monday",
|
|
"Tuesday",
|
|
"Wednesday",
|
|
"Thursday",
|
|
"Friday",
|
|
"Saturday",
|
|
}
|
|
Eras {
|
|
"BC",
|
|
"AD",
|
|
}
|
|
Languages {
|
|
aa { "Afar" }
|
|
ab { "Abkhazian" }
|
|
ace { "Achinese" }
|
|
ach { "Acoli" }
|
|
ada { "Adangme" }
|
|
ae { "Avestan" }
|
|
af { "Afrikaans" }
|
|
afa { "Afro-Asiatic (Other)" }
|
|
afh { "Afrihili" }
|
|
aka { "Akan" }
|
|
akk { "Akkadien" }
|
|
ale { "Aleut" }
|
|
alg { "Algonquian Languages" }
|
|
am { "Amharic" }
|
|
ang { "English, Old (ca.450-1100)" }
|
|
apa { "Apache Languages"}
|
|
ar { "Arabic" }
|
|
arc { "Aramaic" }
|
|
arn { "Araucanian" }
|
|
arp { "Arapaho" }
|
|
art { "Artificial (Other)" }
|
|
arw { "Arawak" }
|
|
as { "Assamese" }
|
|
ath { "Athapaskan Languages" }
|
|
aus { "Australian Languages" }
|
|
ava { "Avaric" }
|
|
awa { "Awadhi" }
|
|
ay { "Aymara" }
|
|
az { "Azerbaijani" }
|
|
ba { "Bashkir" }
|
|
bad { "Banda" }
|
|
bai { "Bamileke Languages" }
|
|
bal { "Baluuchi" }
|
|
bam { "Bambara" }
|
|
ban { "Balinese" }
|
|
bas { "Basa" }
|
|
bat { "Baltic (Other)" }
|
|
be { "Belarusian" }
|
|
bej { "Beja" }
|
|
bem { "Bemba" }
|
|
ber { "Beber" }
|
|
bg { "Bulgarian" }
|
|
bh { "Bihari" }
|
|
bho { "Bhojpuri" }
|
|
bi { "Bislama" }
|
|
bik { "Bikol" }
|
|
bin { "Bini" }
|
|
bla { "Siksika" }
|
|
bn { "Bengali" }
|
|
bnt { "Bantu" }
|
|
bo { "Tibetan" }
|
|
br { "Brenton" }
|
|
bra { "Braj" }
|
|
bs { "Bosnian"}
|
|
btk { "Batak" }
|
|
bua { "Buriat" }
|
|
bug { "Buginese" }
|
|
ca { "Catalan" }
|
|
cad { "Caddo" }
|
|
cai { "Central American Indian (Other)" }
|
|
car { "Carib" }
|
|
cau { "Caucasian (Other) " }
|
|
ce { "Chechen" }
|
|
ceb { "Cebuano" }
|
|
cel { "Celtic (Other)" }
|
|
ch { "Chamorro" }
|
|
chb { "Chibcha" }
|
|
chg { "Chagatai" }
|
|
chk { "Chuukese" }
|
|
chm { "Mari" }
|
|
chn { "Chinook Jargon" }
|
|
cho { "Choctaw" }
|
|
chp { "Chipewyan" }
|
|
chr { "Cherokee" }
|
|
chy { "Cheyenne" }
|
|
cmc { "Chamic Languages" }
|
|
co { "Corsican" }
|
|
cop { "Coptic" }
|
|
cpe { "Creoles and Pidgins, English-based (Other)" }
|
|
cpf { "Creoles and Pidgins, French-based (Other)" }
|
|
cre { "Cree" }
|
|
crp { "Creoles and Pidgins (Other)" }
|
|
cs { "Czech" }
|
|
cu { "Church Slavic" }
|
|
cus { "Cushitic (Other)" }
|
|
cv { "Chuvash" }
|
|
cy { "Welsh" }
|
|
da { "Danish" }
|
|
dak { "Dakota" }
|
|
day { "Dayak" }
|
|
de { "German" }
|
|
del { "Delaware" }
|
|
den { "Slave" }
|
|
dgr { "Dogrib" }
|
|
din { "Dinka" }
|
|
div { "Divehi" }
|
|
doi { "Dogri" }
|
|
dra { "Dravidian (Other)" }
|
|
dua { "Duala" }
|
|
dum { "Dutch, Middle (ca. 1050-1350)" }
|
|
dyu { "Dyula" }
|
|
dz { "Bhutani" }
|
|
dzo { "Dzongkha" }
|
|
efi { "Efik" }
|
|
egy { "Egyptian (Ancient)" }
|
|
eka { "Ekajuk" }
|
|
el { "Greek" } // Modern (1453-)
|
|
elx { "Elamite" }
|
|
en { "English" }
|
|
enm { "English, Middle( 1100 -1500)" }
|
|
eo { "Esperanto" }
|
|
es { "Spanish" }
|
|
et { "Estonian" }
|
|
eu { "Basque" }
|
|
ewe { "Ewe" }
|
|
ewo { "Ewondo" }
|
|
fa { "Persian" }
|
|
fan { "Fang" }
|
|
fat { "Fanti" }
|
|
fi { "Finnish" }
|
|
fiu { "Finno - Ugrian" }
|
|
fj { "Fiji" }
|
|
fo { "Faeroese" }
|
|
fon { "Fon" }
|
|
fr { "French" }
|
|
frm { "French, Middle (ca.1400-1600)" }
|
|
fro { "French, Old (842-ca.1400)" }
|
|
ful { "Fulah" }
|
|
fur { "Friulian" }
|
|
fy { "Frisian" }
|
|
ga { "Irish" }
|
|
gaa { "Ga" }
|
|
gay { "Gayo" }
|
|
gba {"Gbaya" }
|
|
gd { "Scots Gaelic" }
|
|
gem { "Germanic (Other)" }
|
|
gil { "Gilbertese" }
|
|
gl { "Gallegan" }
|
|
gla { "Gaelic (Scots)" }
|
|
gmh { "German, Middle High (ca.1050-1500)" }
|
|
gn { "Guarani" }
|
|
goh { " German, Old High (ca.750-1050)" }
|
|
gon { "Gondi" }
|
|
gor { "Gorontalo" }
|
|
got { "Gothic" }
|
|
grb { "Gerbo" }
|
|
grc { "Greek, Ancient (to 1453)" }
|
|
gu { "Gujarati" }
|
|
gv { "Manx" }
|
|
gwi { "Gwich'in" }
|
|
hai { "Haida" }
|
|
hau { "Hausa" }
|
|
haw { "Hawaiian" }
|
|
he { "Hebrew" }
|
|
hi { "Hindi" }
|
|
him { "Himachali" }
|
|
hit { "Hittite" }
|
|
hmn { "Hmong" }
|
|
ho { "Hiri Motu" }
|
|
hr { "Croatian" }
|
|
hu { "Hungarian" }
|
|
hup { "Hupa" }
|
|
hy { "Armenian" }
|
|
hz { "Herero" }
|
|
ia { "Interlingua" }
|
|
iba { "Iban" }
|
|
ibo { "Igbo" }
|
|
id { "Indonesian" }
|
|
ie { "Interlingue" }
|
|
ijo { "Ijo" }
|
|
ik { "Inupiak" }
|
|
ilo { "Iloko" }
|
|
inc { "Indic (Other)" }
|
|
ine { "Indo-European" }
|
|
ira { "Iranian " }
|
|
iro { "Iroguoian Languages" }
|
|
is { "Icelandic" }
|
|
it { "Italian" }
|
|
iu { "Inukitut" }
|
|
iw { "Hebrew" }
|
|
ja { "Japanese" }
|
|
jpr { "Judeo-Persian" }
|
|
jrb { "Judeo-Arabic" }
|
|
jw { "Javanese" }
|
|
ka { "Georgian" }
|
|
kaa { "Kara-Kalpak" }
|
|
kab { "Kabyle" }
|
|
kac { "Kachin" }
|
|
kam { "Kamba" }
|
|
kar { "Karen" }
|
|
kau { "Kanuri" }
|
|
kaw { "Kawi" }
|
|
kha { "Khasi" }
|
|
khi { "Khoisan" }
|
|
kho { "Khotanese" }
|
|
ki { "Kikuyu" }
|
|
kk { "Kazakh" }
|
|
kl { "Kalaallisut" }
|
|
km { "Khmer" }
|
|
kmb { "Kimbundu" }
|
|
kn { "Kannada" }
|
|
ko { "Korean" }
|
|
kok { "Konkani" }
|
|
kon { "Kongo" }
|
|
kos { "Kosrean" }
|
|
kpe { "Kpelle" }
|
|
kro { "Kru" }
|
|
kru { "Kuruckh" }
|
|
ks { "Kashmiri" }
|
|
ku { "Kurdish" }
|
|
kum { "Kumyk" }
|
|
kut { "Kutenai" }
|
|
kv { "Komi" }
|
|
kw { "Cornish" }
|
|
ky { "Kirghiz" }
|
|
la { "Latin" }
|
|
lad { "Ladino" }
|
|
lah { "Lahnda" }
|
|
lam { "Lamba" }
|
|
lb { "Letzeburgesch" }
|
|
lez { "Lezghian" }
|
|
lin { "Lingala" }
|
|
lit { "Lithuanian" }
|
|
ln { "Lingala" }
|
|
lo { "Lao" }
|
|
lol { "Mongo" }
|
|
loz { "Lozi" }
|
|
lt { "Lithuanian" }
|
|
lua { "Luba-Lulua" }
|
|
lub { "Luba-Katanga" }
|
|
lug { "Ganda" }
|
|
lui { "Luiseeno" }
|
|
lun { "Lunda" }
|
|
luo { "Lua" }
|
|
lus { "Lushai" }
|
|
lv { "Latvian (Lettish)" }
|
|
mad { "Madurese" }
|
|
mag { "Magahi" }
|
|
mai { "Maithili" }
|
|
mak { "Makasar" }
|
|
man { "Mandingue" }
|
|
map { "Austronesian" }
|
|
mas { "Masai" }
|
|
mdr { "Mandar" }
|
|
men { "Mende" }
|
|
mg { "Malagasy" }
|
|
mga { "Irish, Middle (900-1200)" }
|
|
mh { "Marshall"}
|
|
mi { "Maori" }
|
|
mic { "Mic-Mac" }
|
|
min { "Minangkabau" }
|
|
mis { "Miscellaneous Languages" }
|
|
mk { "Macedonian" }
|
|
mkh { "Mon-Khmer (Ohter)" }
|
|
ml { "Malayalam" }
|
|
mn { "Mongolian" }
|
|
mnc { "Manchu" }
|
|
mni { "Manipuri" }
|
|
mno { "Manobo Languages" }
|
|
mo { "Moldavian" }
|
|
moh { "Mohawk" }
|
|
mos { "Mossi" }
|
|
mr { "Marathi" }
|
|
ms { "Malay" }
|
|
mt { "Maltese" }
|
|
mul { "Multiple Languages" }
|
|
mun { "Munda Languages" }
|
|
mus { "Creek" }
|
|
mwr { "Marwari" }
|
|
my { "Burmese" }
|
|
myn { "Mayan" }
|
|
na { "Nauru" }
|
|
nah { "Nahuatl" }
|
|
nai { "North American Indian (Ohter)" }
|
|
nb { "Norwegian Bokm\u00e5l" }
|
|
nd { "Ndebele, North" }
|
|
nds { "Low German; Low Saxon" }
|
|
ne { "Nepali" }
|
|
new { "Newari" }
|
|
ng { "Ndonga" }
|
|
nia { "Nias" }
|
|
nic { "Niger - Kordofanian" }
|
|
niu { "Niuean" }
|
|
nl { "Dutch" }
|
|
nn { "Norwegian Nynorsk" }
|
|
no { "Norwegian" }
|
|
non { "Norse, Old" }
|
|
nr { "Ndebele, South" }
|
|
nso { "Sotho, Northern" }
|
|
nub { "Nubian Languages" }
|
|
nv {"Navajo"}
|
|
ny { " Chichewa; Nyanja" }
|
|
nym { "Nyamwezi" }
|
|
nyo { "Nyoro" }
|
|
nzi { "Nzima" }
|
|
oc { "Proven\u00E7al; Occitan (post 1500)"}
|
|
oji { "Ojibwa" }
|
|
om { "Oromo (Afan)" }
|
|
or { "Oriya" }
|
|
os { "Ossetic" }
|
|
osa { "Osage" }
|
|
ota { "Turkish (Ottoman Empire)" }
|
|
oto { "Otomian Languages" }
|
|
pa { "Punjabi" }
|
|
paa { "Papuan (Ohter)" }
|
|
pag { "Pangasinan" }
|
|
pal { "Pahlavi" }
|
|
pam { "pampamga" }
|
|
pap { "Papiamento" }
|
|
pau { "Palauan" }
|
|
peo { "Persian Old (ca.600-400 B.C.)" }
|
|
phi { "Philippine (Other)" }
|
|
phn { "Phoenician" }
|
|
pi { "Pali" }
|
|
pl { "Polish" }
|
|
pon { "Pohnpeian" }
|
|
pra { "Prakrit Languages" }
|
|
pro { "Proven\u00E7al, Old (to 1500)" }
|
|
ps { "Pashto (Pushto)" }
|
|
pt { "Portuguese" }
|
|
qu { "Quechua" }
|
|
raj { "Rajastani" }
|
|
rap { "Rapanui" }
|
|
rar { "Rarotongan" }
|
|
rm { "Rhaeto-Romance" }
|
|
rn { "Rundi" }
|
|
ro { "Romanian" }
|
|
roa { "Romance (Other)" }
|
|
rom { "Romany" }
|
|
ru { "Russian" }
|
|
rw { "Kinyarwanda" }
|
|
sa { "Sanskrit" }
|
|
sad { "Sandawe" }
|
|
sah { "Yakut" }
|
|
sai { "South American Indian (Ohter)" }
|
|
sal { "Salishan" }
|
|
sam { "Samritan" }
|
|
sas { "Saska" }
|
|
sat { "Santali" }
|
|
sc { "Sardinian" }
|
|
sco { "Scots" }
|
|
sd { "Sindhi" }
|
|
se { "Northern Sami" }
|
|
// http://lcweb.loc.gov/standards/iso639-2/englangn.html
|
|
// should provide the correct language code soon
|
|
// se { "Sami Languages" } // DUP FIXME
|
|
sel { "Selkup" }
|
|
sem { "Semitic" }
|
|
sg { "Sango" }
|
|
sga { "Irish, Old (to 900)" }
|
|
sgn { "Sign Languages" }
|
|
sh { "Serbo-Croatian" }
|
|
shn { "Shan" }
|
|
si { "Sinhalese" }
|
|
sid { "Sidamo" }
|
|
sio { "Siouan Languages" }
|
|
sit { "Sino-Tibetan (Other)" }
|
|
sk { "Slovak" }
|
|
sl { "Slovenian" }
|
|
sm { "Samoan" }
|
|
sn { "Shona" }
|
|
snk { "Soninke" }
|
|
so { "Somali" }
|
|
sog { "Sogdien" }
|
|
son { "Songhai" }
|
|
sq { "Albanian" }
|
|
sr { "Serbian" }
|
|
srr { "Serer" }
|
|
ss { "Swati" }
|
|
ssa { "Nilo-Saharam" }
|
|
st { "Sotho, Southern" }
|
|
su { "Sundanese" }
|
|
suk { "Sukuma" }
|
|
sus { "Susu" }
|
|
sux { "Sumerian"}
|
|
sv { "Swedish" }
|
|
sw { "Swahili" }
|
|
syr { "Syriac" }
|
|
ta { "Tamil" }
|
|
tai { "Tai (Other)" }
|
|
te { "Telugu" }
|
|
tem { "Timne" }
|
|
ter { "Tereno" }
|
|
tet { "Tetum" }
|
|
tg { "Tajik" }
|
|
th { "Thai" }
|
|
tig { "Tigre" }
|
|
tir { "Tigrinya" }
|
|
tiv { "Tiv" }
|
|
tk { "Turkmen" }
|
|
tl { "Tagalog" }
|
|
tli { "Tlingit" }
|
|
tmh { "Tamashek" }
|
|
tn { "Tswana" }
|
|
tog { "Tonga (Nyasa)" }
|
|
ton { "Tongan (Tonga Islands)" }
|
|
tr { "Turkish" }
|
|
ts { "Tsonga" }
|
|
tsi { "Tsimshian" }
|
|
tt { "Tatar" }
|
|
tum { "Tumbuka" }
|
|
tur { "Turkish" }
|
|
tut { "Altaic (Other)" }
|
|
tvl { "Tuvalu" }
|
|
tw { "Twi" }
|
|
ty { "Tahitian" }
|
|
tyv { "Tuvinian" }
|
|
ug { "Uighur" }
|
|
uga { "Ugaritic" }
|
|
uk { "Ukrainian" }
|
|
umb { "Umbundu" }
|
|
und { "Undetermined" }
|
|
ur { "Urdu" }
|
|
uz { "Uzbek" }
|
|
vai { "Vai" }
|
|
ven { "Venda" }
|
|
vi { "Vietnamese" }
|
|
vo { "Volapuk" }
|
|
vot { "Votic" }
|
|
wak { "Wakashan Languages" }
|
|
wal { "Walamo" }
|
|
war { "Waray" }
|
|
was { "Washo" }
|
|
wen { "Sorbian Languages" }
|
|
wo { "Wolof" }
|
|
xh { "Xhosa" }
|
|
yao { "Yao" }
|
|
yap { "Yapese" }
|
|
yi { "Yiddish" }
|
|
yor { "Yoruba" }
|
|
ypk { "Yupik Languages" }
|
|
za { "Zhuang" }
|
|
zap { "Zapotec" }
|
|
zen { "Zenaga" }
|
|
zh { "Chinese" }
|
|
znd { "Zande" }
|
|
zu { "Zulu" }
|
|
zun { "Zuni" }
|
|
}
|
|
LocaleID { "0000" }
|
|
LocaleString { "en" }
|
|
MonthAbbreviations {
|
|
"Jan",
|
|
"Feb",
|
|
"Mar",
|
|
"Apr",
|
|
"May",
|
|
"Jun",
|
|
"Jul",
|
|
"Aug",
|
|
"Sep",
|
|
"Oct",
|
|
"Nov",
|
|
"Dec",
|
|
"",
|
|
}
|
|
MonthNames {
|
|
"January",
|
|
"February",
|
|
"March",
|
|
"April",
|
|
"May",
|
|
"June",
|
|
"July",
|
|
"August",
|
|
"September",
|
|
"October",
|
|
"November",
|
|
"December",
|
|
"",
|
|
}
|
|
NumberElements {
|
|
".",
|
|
",",
|
|
";",
|
|
"%",
|
|
"0",
|
|
"#",
|
|
"-",
|
|
"E",
|
|
"\u2030",
|
|
"\u221E",
|
|
"\uFFFD",
|
|
}
|
|
NumberPatterns {
|
|
"#,##0.###;-#,##0.###",
|
|
"\u00A4 #,##0.00;-\u00A4 #,##0.00",
|
|
"#,##0%",
|
|
"#E0"
|
|
}
|
|
ShortCountry { "" }
|
|
ShortLanguage { "eng" }
|
|
localPatternChars { "GyMdkHmsSEDFwWahKzYe" }
|
|
zoneStrings {
|
|
{
|
|
"PST",
|
|
"Pacific Standard Time",
|
|
"PST",
|
|
"Pacific Daylight Time",
|
|
"PDT",
|
|
"San Francisco",
|
|
}
|
|
{
|
|
"MST",
|
|
"Mountain Standard Time",
|
|
"MST",
|
|
"Mountain Daylight Time",
|
|
"MDT",
|
|
"Denver",
|
|
}
|
|
{
|
|
"PNT",
|
|
"Mountain Standard Time",
|
|
"MST",
|
|
"Mountain Standard Time",
|
|
"MST",
|
|
"Phoenix",
|
|
}
|
|
{
|
|
"CST",
|
|
"Central Standard Time",
|
|
"CST",
|
|
"Central Daylight Time",
|
|
"CDT",
|
|
"Chicago",
|
|
}
|
|
{
|
|
"EST",
|
|
"Eastern Standard Time",
|
|
"EST",
|
|
"Eastern Daylight Time",
|
|
"EDT",
|
|
"New York",
|
|
}
|
|
{
|
|
"IET",
|
|
"Eastern Standard Time",
|
|
"EST",
|
|
"Eastern Standard Time",
|
|
"EST",
|
|
"Indianapolis",
|
|
}
|
|
{
|
|
"PRT",
|
|
"Atlantic Standard Time",
|
|
"AST",
|
|
"Atlantic Daylight Time",
|
|
"ADT",
|
|
"Halifax",
|
|
}
|
|
{
|
|
"HST",
|
|
"Hawaii Standard Time",
|
|
"HST",
|
|
"Hawaii Daylight Time",
|
|
"HDT",
|
|
"Honolulu",
|
|
}
|
|
{
|
|
"AST",
|
|
"Alaska Standard Time",
|
|
"AST",
|
|
"Alaska Daylight Time",
|
|
"ADT",
|
|
"Anchorage",
|
|
}
|
|
}
|
|
}
|
|
|