scuffed-code/icu4c/data/th.txt
Ram Viswanadha b376a4453b ICU-899 Add locale script mapping support
X-SVN-Rev: 5200
2001-07-09 15:20:03 +00:00

249 lines
9.9 KiB
Plaintext

// *******************************************************************************
// *
// * Copyright (C) 1999-2001, International Business Machines
// * Corporation and others. All Rights Reserved.
// *
// *******************************************************************************
th {
BreakDictionaryData:import { "thaidict.brk" }
AmPmMarkers {
"\u0E01\u0E48\u0E2D\u0E19\u0E40\u0E17\u0E35\u0E48\u0E22\u0E07",
"\u0E2B\u0E25\u0E31\u0E07\u0E40\u0E17\u0E35\u0E48\u0E22\u0E07",
}
Version{ "1.1.1" }
// -------------------- ibm.597 --------------------
//
// First put in all of the consonants, after Z
//
CollationElements {
Version { "2.0" }
Sequence { "[normalization on]& Z "
"< \u0E01 " // KO KAI
"< \u0E02 " // KHO KHAI
"< \u0E03 " // KHO KHUAT
"< \u0E04 " // KHO KHWAI
"< \u0E05 " // KHO KHON
"< \u0E06 " // KHO RAKHANG
"< \u0E07 " // NGO NGU
"< \u0E08 " // CHO CHAN
"< \u0E09 " // CHO CHING
"< \u0E0A " // CHO CHANG
"< \u0E0B " // SO SO
"< \u0E0C " // CHO CHOE
"< \u0E0D " // YO YING
"< \u0E0E " // DO CHADA
"< \u0E0F " // TO PATAK
"< \u0E10 " // THO THAN
"< \u0E11 " // THO NANGMONTHO
"< \u0E12 " // THO PHUTHAO
"< \u0E13 " // NO NEN
"< \u0E14 " // DO DEK
"< \u0E15 " // TO TAO
"< \u0E16 " // THO THUNG
"< \u0E17 " // THO THAHAN
"< \u0E18 " // THO THONG
"< \u0E19 " // NO NU
"< \u0E1A " // BO BAIMAI
"< \u0E1B " // PO PLA
"< \u0E1C " // PHO PHUNG
"< \u0E1D " // FO FA
"< \u0E1E " // PHO PHAN
"< \u0E1F " // FO FAN
"< \u0E20 " // PHO SAMPHAO
"< \u0E21 " // MO MA
"< \u0E22 " // YO YAK
"< \u0E23 " // RO RUA
"< \u0E24 " // RU
"< \u0E24\u0E45 " // See the comment below on LAKKHANGYAO
"< \u0E25 " // LO LING
"< \u0E26 " // LU
"< \u0E26\u0E45 " // See the comment below on LAKKHANGYAO
"< \u0E27 " // WO WAEN
"< \u0E28 " // SO SALA
"< \u0E29 " // SO RUSI
"< \u0E2A " // SO SUA
"< \u0E2B " // HO HIP
"< \u0E2C " // LO CHULA
"< \u0E2D " // O ANG
"< \u0E2E " // HO NOKHUK
//
// Normal vowels
//
"< \u0E30 " // SARA A
"< \u0E31 " // MAI HAN-AKAT
"< \u0E32 " // SARA AA
// Normalizer will decompose this character to \u0e4d\u0e32.
// This is a Bad Thing, because we want the separate
// characters to sort differently than this individual one.
// Since there's no public way to set the decomposition to be
// used when creating a collator, there's no way around this
// right now. It's best to go ahead and leave the character
// in, because it occurs this way a lot more often than it
// occurs as separate characters.
"< \u0E33 " // SARA AM
"< \u0E34 " // SARA I
"< \u0E35 " // SARA II
"< \u0E36 " // SARA UE
"< \u0E37 " // SARA UEE
"< \u0E38 " // SARA U
"< \u0E39 " // SARA UU
//
// Preceding vowels
//
"< \u0E40 " // SARA E
"< \u0E41 " // SARA AE
"< \u0E42 " // SARA O
"< \u0E43 " // SARA AI MAIMUAN
"< \u0E44 " // SARA AI MAIMALAI
//
// Digits
//
"< \u0E50 " // DIGIT ZERO
"< \u0E51 " // DIGIT ONE
"< \u0E52 " // DIGIT TWO
"< \u0E53 " // DIGIT THREE
"< \u0E54 " // DIGIT FOUR
"< \u0E55 " // DIGIT FIVE
"< \u0E56 " // DIGIT SIX
"< \u0E57 " // DIGIT SEVEN
"< \u0E58 " // DIGIT EIGHT
"< \u0E59 " // DIGIT NINE
// Sorta tonal marks, but maybe not really
"< \u0E4D " // NIKHAHIT
// Thai symbols are supposed to sort "after white space". I'm
// treating this as making them sort just after the normal
// Latin-1 symbols, which are in turn after the white space.
"&'\u007d'" // right-brace
"< \u0E2F " // PAIYANNOI (ellipsis, abbreviation)
"< \u0E46 " // MAIYAMOK
"< \u0E4F " // FONGMAN
"< \u0E5A " // ANGKHANKHU
"< \u0E5B " // KHOMUT
"< \u0E3F " // CURRENCY SYMBOL BAHT
// These symbols are supposed to be "after all characters"
"< \u0E4E " // YAMAKKAN
// This rare symbol also comes after all characters. But when it is
// used in combination with RU and LU, the combination is treated as
// a separate letter, ala "CH" sorting after "C" in traditional Spanish.
// see above.
"< \u0E45 " // LAKKHANGYAO
// Tonal marks are primary ignorables but are treated as secondary
// differences
"& \u0301 " // acute accent
"; \u0E47 " // MAITAIKHU
"; \u0E48 " // MAI EK
"; \u0E49 " // MAI THO
"; \u0E4A " // MAI TRI
"; \u0E4B " // MAI CHATTAWA
"; \u0E4C " // THANTHAKHAT
// These are supposed to be ignored, so I'm treating them as controls
"& \u0001 "
"= \u0E3A " // PHINTHU
"= '.' " // period
}
}
Countries {
TH { "\u0E1B\u0E23\u0E30\u0E40\u0E17\u0E28\u0E44\u0E17\u0E22" }
}
DateTimePatterns {
"H' \u0E19\u0E32\u0E2C\u0E34\u0E01\u0E32 'm' \u0E19\u0E32\u0E17\u0E35 'ss' \u0E27"
"\u0E34\u0E19\u0E32\u0E17\u0E35'",
"H' \u0E19\u0E32\u0E2C\u0E34\u0E01\u0E32 'm' \u0E19\u0E32\u0E17\u0E35'",
"H:mm:ss",
"H:mm",
"EEEE'\u0E17\u0E35\u0E48 'd MMMM G yyyy",
"d MMMM yyyy",
"d MMM yyyy",
"d/M/yyyy",
"{1}, {0}",
}
DayAbbreviations {
"\u0E2D\u0E32.",
"\u0E08.",
"\u0E2D.",
"\u0E1E.",
"\u0E1E\u0E24.",
"\u0E28.",
"\u0E2A.",
}
DayNames {
"\u0E27\u0E31\u0E19\u0E2D\u0E32\u0E17\u0E34\u0E15\u0E22\u0E4C",
"\u0E27\u0E31\u0E19\u0E08\u0E31\u0E19\u0E17\u0E23\u0E4C",
"\u0E27\u0E31\u0E19\u0E2D\u0E31\u0E07\u0E04\u0E32\u0E23",
"\u0E27\u0E31\u0E19\u0E1E\u0E38\u0E18",
"\u0E27\u0E31\u0E19\u0E1E\u0E24\u0E2B\u0E31\u0E2A\u0E1A\u0E14\u0E35",
"\u0E27\u0E31\u0E19\u0E28\u0E38\u0E01\u0E23\u0E4C",
"\u0E27\u0E31\u0E19\u0E40\u0E2A\u0E32\u0E23\u0E4C",
}
Eras {
"\u0E1B\u0E35\u0E01\u0E48\u0E2D\u0E19\u0E04\u0E23\u0E34\u0E2A\u0E15\u0E4C\u0E01\u0E32"
"\u0E25\u0E17\u0E35\u0E48",
"\u0E04.\u0E28.",
}
Languages {
th { "\u0E44\u0E17\u0E22" }
}
LocaleID { "1e" }
LocaleString { "th" }
MonthAbbreviations {
"\u0E21.\u0E04.",
"\u0E01.\u0E1E.",
"\u0E21\u0E35.\u0E04.",
"\u0E40\u0E21.\u0E22.",
"\u0E1E.\u0E04.",
"\u0E21\u0E34.\u0E22.",
"\u0E01.\u0E04.",
"\u0E2A.\u0E04.",
"\u0E01.\u0E22.",
"\u0E15.\u0E04.",
"\u0E1E.\u0E22.",
"\u0E18.\u0E04.",
"",
}
MonthNames {
"\u0E21\u0E01\u0E23\u0E32\u0E04\u0E21",
"\u0E01\u0E38\u0E21\u0E20\u0E32\u0E1E\u0E31\u0E19\u0E18\u0E4C",
"\u0E21\u0E35\u0E19\u0E32\u0E04\u0E21",
"\u0E40\u0E21\u0E29\u0E32\u0E22\u0E19",
"\u0E1E\u0E24\u0E29\u0E20\u0E32\u0E04\u0E21",
"\u0E21\u0E34\u0E16\u0E38\u0E19\u0E32\u0E22\u0E19",
"\u0E01\u0E23\u0E01\u0E0E\u0E32\u0E04\u0E21",
"\u0E2A\u0E34\u0E07\u0E2B\u0E32\u0E04\u0E21",
"\u0E01\u0E31\u0E19\u0E22\u0E32\u0E22\u0E19",
"\u0E15\u0E38\u0E25\u0E32\u0E04\u0E21",
"\u0E1E\u0E24\u0E28\u0E08\u0E34\u0E01\u0E32\u0E22\u0E19",
"\u0E18\u0E31\u0E19\u0E27\u0E32\u0E04\u0E21",
"",
}
ShortLanguage { "tha" }
localPatternChars { "GanjkHmsSEDFwWxhKzAe" }
zoneStrings {
{
"THA",
"Thailand Time",
"THA",
"Thailand Time",
"THA",
"Bangkok",
}
}
LocaleScript{
"Thai", // Script Name
"Thai" // ISO 15924 Name
}
}