From 58814385b682dda1e1091fe07126ca9fc7a450f2 Mon Sep 17 00:00:00 2001 From: Ram Viswanadha Date: Sat, 16 Mar 2002 03:49:01 +0000 Subject: [PATCH] ICU-1775 Add data for exemplar characters X-SVN-Rev: 8069 --- icu4c/source/data/locales/af.txt | 1 + icu4c/source/data/locales/am.txt | 1 + icu4c/source/data/locales/ar.txt | 1 + icu4c/source/data/locales/az.txt | 1 + icu4c/source/data/locales/be.txt | 2 +- icu4c/source/data/locales/bg.txt | 1 + icu4c/source/data/locales/bn.txt | 1 + icu4c/source/data/locales/ca.txt | 1 + icu4c/source/data/locales/cs.txt | 1 + icu4c/source/data/locales/da.txt | 1 + icu4c/source/data/locales/de.txt | 2 +- icu4c/source/data/locales/div.txt | 4 +- icu4c/source/data/locales/el.txt | 1 + icu4c/source/data/locales/eo.txt | 2 +- icu4c/source/data/locales/es.txt | 3 +- icu4c/source/data/locales/et.txt | 1 + icu4c/source/data/locales/eu.txt | 2 + icu4c/source/data/locales/fa.txt | 1 + icu4c/source/data/locales/fi.txt | 1 + icu4c/source/data/locales/fo.txt | 1 + icu4c/source/data/locales/fr.txt | 1 + icu4c/source/data/locales/ga.txt | 1 + icu4c/source/data/locales/gl.txt | 2 + icu4c/source/data/locales/gu.txt | 3 +- icu4c/source/data/locales/he.txt | 2 +- icu4c/source/data/locales/hi.txt | 1 + icu4c/source/data/locales/hr.txt | 1 + icu4c/source/data/locales/hu.txt | 1 + icu4c/source/data/locales/hy.txt | 1 + icu4c/source/data/locales/is.txt | 1 + icu4c/source/data/locales/it.txt | 1 + icu4c/source/data/locales/ja.txt | 973 ++++++++++++++-------------- icu4c/source/data/locales/ka.txt | 1 + icu4c/source/data/locales/kk.txt | 4 +- icu4c/source/data/locales/kl.txt | 2 + icu4c/source/data/locales/kn.txt | 1 + icu4c/source/data/locales/ko.txt | 11 + icu4c/source/data/locales/kok.txt | 1 + icu4c/source/data/locales/ky.txt | 3 +- icu4c/source/data/locales/lt.txt | 1 + icu4c/source/data/locales/lv.txt | 1 + icu4c/source/data/locales/mk.txt | 1 + icu4c/source/data/locales/mn.txt | 2 + icu4c/source/data/locales/mr.txt | 1 + icu4c/source/data/locales/mt.txt | 2 + icu4c/source/data/locales/nb.txt | 2 + icu4c/source/data/locales/nl.txt | 1 + icu4c/source/data/locales/nn.txt | 2 +- icu4c/source/data/locales/pa.txt | 2 + icu4c/source/data/locales/pl.txt | 1 + icu4c/source/data/locales/pt.txt | 1 + icu4c/source/data/locales/ro.txt | 1 + icu4c/source/data/locales/root.txt | 2 +- icu4c/source/data/locales/ru.txt | 1 + icu4c/source/data/locales/sa.txt | 4 +- icu4c/source/data/locales/sh.txt | 1 + icu4c/source/data/locales/sk.txt | 1 + icu4c/source/data/locales/sl.txt | 1 + icu4c/source/data/locales/sq.txt | 1 + icu4c/source/data/locales/sr.txt | 1 + icu4c/source/data/locales/sv.txt | 3 +- icu4c/source/data/locales/syr.txt | 1 + icu4c/source/data/locales/ta.txt | 1 + icu4c/source/data/locales/te.txt | 3 +- icu4c/source/data/locales/th.txt | 2 +- icu4c/source/data/locales/ti.txt | 2 + icu4c/source/data/locales/tr.txt | 1 + icu4c/source/data/locales/tt.txt | 4 +- icu4c/source/data/locales/uk.txt | 1 + icu4c/source/data/locales/ur.txt | 4 +- icu4c/source/data/locales/uz.txt | 3 +- icu4c/source/data/locales/vi.txt | 2 + icu4c/source/data/locales/zh.txt | 31 + icu4c/source/data/locales/zh_TW.txt | 49 +- 74 files changed, 675 insertions(+), 502 deletions(-) diff --git a/icu4c/source/data/locales/af.txt b/icu4c/source/data/locales/af.txt index 00e9b589be..8e446e826e 100644 --- a/icu4c/source/data/locales/af.txt +++ b/icu4c/source/data/locales/af.txt @@ -73,6 +73,7 @@ af { // "\ufffd", // } LocaleID:int { 0x36 } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00e8 \u00e2 \u00ea \u00ee \u00f4 \u00fb \u00eb \u00ef \u00f6]" } // LocaleScript{ // "Latn", // ISO 15924 Name // } diff --git a/icu4c/source/data/locales/am.txt b/icu4c/source/data/locales/am.txt index 0b15186182..abcd03a053 100644 --- a/icu4c/source/data/locales/am.txt +++ b/icu4c/source/data/locales/am.txt @@ -59,6 +59,7 @@ am { LocaleScript { "Ethi", } + ExemplarCharacters{"[:Ethi:]"} Eras { "\u12D3/\u12D3", "\u12D3/\u121D" diff --git a/icu4c/source/data/locales/ar.txt b/icu4c/source/data/locales/ar.txt index 328ff9f615..9d18934153 100644 --- a/icu4c/source/data/locales/ar.txt +++ b/icu4c/source/data/locales/ar.txt @@ -137,4 +137,5 @@ ar { LocaleScript:array { "Arab" } + ExemplarCharacters{"[\u0621 \u0627-\u063A \u0641-\u064A\u0651 \u0653-\u0655 \u0670-\u06B7 \u06BA-\u06BE \u06C1 \u06C3-\u06CE \u06D0-\u06D2]"} } diff --git a/icu4c/source/data/locales/az.txt b/icu4c/source/data/locales/az.txt index 651d1a8bb9..a73ab911ca 100644 --- a/icu4c/source/data/locales/az.txt +++ b/icu4c/source/data/locales/az.txt @@ -82,4 +82,5 @@ az{ } } LocaleScript:array{ "CYRL" } + ExemplarCharacters { "[\u0430-\u0438 \u043a-\u0445 \u0447 \u0448 \u044b \u0458 \u0493 \u049d \u04af \u04b9 \u04bb \u04d9 \u04e9]" } } diff --git a/icu4c/source/data/locales/be.txt b/icu4c/source/data/locales/be.txt index 8b76a09215..70e2a1a116 100644 --- a/icu4c/source/data/locales/be.txt +++ b/icu4c/source/data/locales/be.txt @@ -111,5 +111,5 @@ be { LocaleScript{ "Cyrl", // Abbreviation } - + ExemplarCharacters { "[\u0430-\u0437 \u0439-\u0448 \u044b-\u044f \u2019\u0451\u0456\u045e {\u0434\u0436} {\u0434\u0437}]" } } diff --git a/icu4c/source/data/locales/bg.txt b/icu4c/source/data/locales/bg.txt index aee90fe46c..120cdd9ea0 100644 --- a/icu4c/source/data/locales/bg.txt +++ b/icu4c/source/data/locales/bg.txt @@ -144,4 +144,5 @@ bg { LocaleScript{ "Cyrl", // Abbreviation } + ExemplarCharacters { "[\u0430-\u044c \u044e\u044f\u0463\u046b]" } } diff --git a/icu4c/source/data/locales/bn.txt b/icu4c/source/data/locales/bn.txt index 5ab100d5c7..724bc79a4a 100644 --- a/icu4c/source/data/locales/bn.txt +++ b/icu4c/source/data/locales/bn.txt @@ -63,4 +63,5 @@ bn { LocaleScript:array{ "Beng" } + ExemplarCharacters{"[:Beng:]"} } diff --git a/icu4c/source/data/locales/ca.txt b/icu4c/source/data/locales/ca.txt index 82686544a2..7e6f857387 100644 --- a/icu4c/source/data/locales/ca.txt +++ b/icu4c/source/data/locales/ca.txt @@ -105,5 +105,6 @@ ca { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e9 \u00ed \u00f3 \u00fa \u00e0 \u00e8 \u00f2 \u00ef \u00fc \u0140 \u00e7 \u00f1]" } } diff --git a/icu4c/source/data/locales/cs.txt b/icu4c/source/data/locales/cs.txt index 190a43563e..5a0dd1b3c8 100644 --- a/icu4c/source/data/locales/cs.txt +++ b/icu4c/source/data/locales/cs.txt @@ -113,4 +113,5 @@ cs { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00fd \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u011b \u016f \u010d \u010f \u0148 \u0159 \u0161 \u0165 \u017e]" } } diff --git a/icu4c/source/data/locales/da.txt b/icu4c/source/data/locales/da.txt index de0d783684..f801ef5273 100644 --- a/icu4c/source/data/locales/da.txt +++ b/icu4c/source/data/locales/da.txt @@ -115,4 +115,5 @@ da { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e6 \u00e5 \u00f8 \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00fd]" } } diff --git a/icu4c/source/data/locales/de.txt b/icu4c/source/data/locales/de.txt index f35217029b..db3e69638e 100644 --- a/icu4c/source/data/locales/de.txt +++ b/icu4c/source/data/locales/de.txt @@ -517,7 +517,7 @@ de { // LocaleScript{ // "Latn", // ISO 15924 Name // } - + ExemplarCharacters { "[a-z \u00e4 \u00f6 \u00fc \u00df]" } //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/div.txt b/icu4c/source/data/locales/div.txt index c8b9e1e396..0c5cb9f9b8 100644 --- a/icu4c/source/data/locales/div.txt +++ b/icu4c/source/data/locales/div.txt @@ -87,8 +87,8 @@ div { LocaleScript:array { "THAA" } - - CollationElements { + ExemplarCharacters { "[:Thaa:]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/el.txt b/icu4c/source/data/locales/el.txt index e3a3414af8..a05aad9007 100644 --- a/icu4c/source/data/locales/el.txt +++ b/icu4c/source/data/locales/el.txt @@ -185,6 +185,7 @@ el { LocaleScript:array { "Grek" // ISO 15924 Name } + ExemplarCharacters{"[\u03ac-\u03ce]"} //------------------------------------------------------------ // Rule Based Number Format Support diff --git a/icu4c/source/data/locales/eo.txt b/icu4c/source/data/locales/eo.txt index 13f192ebcb..6973c72bc2 100644 --- a/icu4c/source/data/locales/eo.txt +++ b/icu4c/source/data/locales/eo.txt @@ -135,7 +135,7 @@ eo { // LocaleScript{ // "Latn", // ISO 15924 Name // } - + ExemplarCharacters { "[a-z \u016d \u0109 \u011d \u0125 \u0135 \u015d]" } //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/es.txt b/icu4c/source/data/locales/es.txt index 5419e77271..c3db684258 100644 --- a/icu4c/source/data/locales/es.txt +++ b/icu4c/source/data/locales/es.txt @@ -269,7 +269,8 @@ es { // LocaleScript{ // "Latn", // ISO 15924 Name // } - + ExemplarCharacters { "[a-z \u00f1 \u00e1 \u00e9 \u00ed \u00f3 \u00fa]" } + //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/et.txt b/icu4c/source/data/locales/et.txt index 80a8c8a992..20ad6079f4 100644 --- a/icu4c/source/data/locales/et.txt +++ b/icu4c/source/data/locales/et.txt @@ -110,4 +110,5 @@ et { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00f5 \u00e4 \u00f6 \u00fc \u0161 \u017e]" } } diff --git a/icu4c/source/data/locales/eu.txt b/icu4c/source/data/locales/eu.txt index bb181ea110..42f70f876c 100644 --- a/icu4c/source/data/locales/eu.txt +++ b/icu4c/source/data/locales/eu.txt @@ -70,6 +70,8 @@ eu { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00f1 \u00e7]" } + // /**************** Info Below is needed ****************/ // CollationElements{} // Countries{} diff --git a/icu4c/source/data/locales/fa.txt b/icu4c/source/data/locales/fa.txt index 572053979c..0fc6fbe59d 100644 --- a/icu4c/source/data/locales/fa.txt +++ b/icu4c/source/data/locales/fa.txt @@ -72,6 +72,7 @@ fa { LocaleScript:array { "Arab" // ISO 15924 Name } + ExemplarCharacters{"[\u06F0\u06F9 \u0621-\u063A \u0640-\u0648 \u064A-\u0652 \u067E \u0686 \u0698 \u06A9 \u06AF \u06CC]"} // /**************** Info Below is needed ****************/ // Countries{} // Eras{} diff --git a/icu4c/source/data/locales/fi.txt b/icu4c/source/data/locales/fi.txt index 83123917d6..85bdb5e210 100644 --- a/icu4c/source/data/locales/fi.txt +++ b/icu4c/source/data/locales/fi.txt @@ -217,6 +217,7 @@ fi { "GMT", } } + ExemplarCharacters { "[a-z \u00e4 \u00f6]" } // LocaleScript{ // "Latn", // ISO 15924 Name // } diff --git a/icu4c/source/data/locales/fo.txt b/icu4c/source/data/locales/fo.txt index 3c8331e3ed..932f9786b3 100644 --- a/icu4c/source/data/locales/fo.txt +++ b/icu4c/source/data/locales/fo.txt @@ -70,4 +70,5 @@ fo { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e6 \u00ed \u00f0 \u00f3 \u00f8 \u00fa \u00fd]" } } diff --git a/icu4c/source/data/locales/fr.txt b/icu4c/source/data/locales/fr.txt index 16d341d17a..d3629d52d4 100644 --- a/icu4c/source/data/locales/fr.txt +++ b/icu4c/source/data/locales/fr.txt @@ -386,6 +386,7 @@ fr { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e9 \u00e8 \u00f9 \u00e7 \u00e0 \u00e2 \u00ea \u00ee \u00f4 \u00fb \u00e6 \u0153 \u00eb \u00ef \u00fc \u00ff]" } // http://www.elections.ca/gen_info/backgrounders/ec90815_f.html // http://lcweb.loc.gov/standards/iso639-2/frenchlangn.html diff --git a/icu4c/source/data/locales/ga.txt b/icu4c/source/data/locales/ga.txt index 525e33a632..f89f1f1c95 100644 --- a/icu4c/source/data/locales/ga.txt +++ b/icu4c/source/data/locales/ga.txt @@ -70,4 +70,5 @@ ga{ // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00f3 \u00fa]" } } diff --git a/icu4c/source/data/locales/gl.txt b/icu4c/source/data/locales/gl.txt index ed941bffcf..b32562faa0 100644 --- a/icu4c/source/data/locales/gl.txt +++ b/icu4c/source/data/locales/gl.txt @@ -71,6 +71,8 @@ gl { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00fc \u00f1]" } + // /**************** Info Below is needed ****************/ // CollationElements{} // Countries{} diff --git a/icu4c/source/data/locales/gu.txt b/icu4c/source/data/locales/gu.txt index 1e3dbb28f8..fe68927937 100644 --- a/icu4c/source/data/locales/gu.txt +++ b/icu4c/source/data/locales/gu.txt @@ -79,7 +79,8 @@ gu { "\ufffd", } LocaleScript:array { "Gujr" } - CollationElements { + ExemplarCharacters { "[:Gujr:]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/he.txt b/icu4c/source/data/locales/he.txt index a618b55f59..928332d59a 100644 --- a/icu4c/source/data/locales/he.txt +++ b/icu4c/source/data/locales/he.txt @@ -98,7 +98,7 @@ he { LocaleScript:array { "Hebr" // ISO 15924 Name } - + ExemplarCharacters{"[:Hebr:]"} //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/hi.txt b/icu4c/source/data/locales/hi.txt index 61869d61a7..d53191f059 100644 --- a/icu4c/source/data/locales/hi.txt +++ b/icu4c/source/data/locales/hi.txt @@ -333,5 +333,6 @@ hi { LocaleScript:array { "Deva" // ISO 15924 Name } + ExemplarCharacters{"[:Deva:]"} } diff --git a/icu4c/source/data/locales/hr.txt b/icu4c/source/data/locales/hr.txt index b3343aaec0..fb89ecb6a0 100644 --- a/icu4c/source/data/locales/hr.txt +++ b/icu4c/source/data/locales/hr.txt @@ -106,6 +106,7 @@ hr { "GMT", } } + ExemplarCharacters { "[a-p r-v z \u0111 \u0107 \u010d \u017e \u0161 {lj} {nj} {d\u017e}]" } // LocaleScript:array { // "Latn" // ISO 15924 Name // } diff --git a/icu4c/source/data/locales/hu.txt b/icu4c/source/data/locales/hu.txt index 0a6b3392d1..8b05ea4e7c 100644 --- a/icu4c/source/data/locales/hu.txt +++ b/icu4c/source/data/locales/hu.txt @@ -115,4 +115,5 @@ hu { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00f6 \u00fc \u0151 \u0171]" } } diff --git a/icu4c/source/data/locales/hy.txt b/icu4c/source/data/locales/hy.txt index fdd296b02a..ddbbe2c1c8 100644 --- a/icu4c/source/data/locales/hy.txt +++ b/icu4c/source/data/locales/hy.txt @@ -76,6 +76,7 @@ hy{ LocaleScript{ "Armn", // Script Name } + ExemplarCharacters{"[:Armn:]"} Countries{ AM { "\u0540\u0561\u0575\u0561\u057D\u057F\u0561\u0576\u056B\u0020" "\u0540\u0561\u0576\u0580\u0561\u057A\u0565\u057F\u0578\u0582\u0569" diff --git a/icu4c/source/data/locales/is.txt b/icu4c/source/data/locales/is.txt index c5b4068729..f1ea3be5c5 100644 --- a/icu4c/source/data/locales/is.txt +++ b/icu4c/source/data/locales/is.txt @@ -105,4 +105,5 @@ is { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00fd \u00f6 \u00e6 \u00f0 \u00fe]" } } diff --git a/icu4c/source/data/locales/it.txt b/icu4c/source/data/locales/it.txt index 09eaa066cd..490b910a49 100644 --- a/icu4c/source/data/locales/it.txt +++ b/icu4c/source/data/locales/it.txt @@ -114,6 +114,7 @@ it { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e9 \u00f3 \u00e0 \u00e8 \u00ec \u00f2 \u00ed \u00fa \u00f9 \u00ef]" } //------------------------------------------------------------ // Rule Based Number Format Support diff --git a/icu4c/source/data/locales/ja.txt b/icu4c/source/data/locales/ja.txt index 999b5c344e..2a2a6a640d 100644 --- a/icu4c/source/data/locales/ja.txt +++ b/icu4c/source/data/locales/ja.txt @@ -17,588 +17,588 @@ ja { Sequence { "[strength 4][hiraganaQ on]" - "&\u30FD=\u30FD=\u309D" // KATAKANA ITERATION MARK + "&\u30FD = \u30FD = \u309D" // KATAKANA ITERATION MARK // Rules for treating length mark "&[before 3]\u30A1" //KATAKANA LETTER SMALL A - "<<<\u30A1|\u30FC=\uFF67|\u30FC=\u3041|\u30FC" // A - "=\u30A2|\u30FC=\uFF71|\u30FC=\u3042|\u30FC" // A - "=\u30AB|\u30FC=\uFF76|\u30FC=\u304B|\u30FC" // KA - "=\u30AC|\u30FC=\u304C|\u30FC" // GA - "=\u30B5|\u30FC=\uFF7B|\u30FC=\u3055|\u30FC" // SA - "=\u30B6|\u30FC=\u3056|\u30FC" // ZA - "=\u30BF|\u30FC=\uFF80|\u30FC=\u305F|\u30FC" // TA - "=\u30C0|\u30FC=\u3060|\u30FC" // DA - "=\u30CA|\u30FC=\uFF85|\u30FC=\u306A|\u30FC" // NA - "=\u30CF|\u30FC=\uFF8A|\u30FC=\u306F|\u30FC" // HA - "=\u30D0|\u30FC=\u3070|\u30FC" // BA - "=\u30D1|\u30FC=\u3071|\u30FC" // PA - "=\u30DE|\u30FC=\uFF8F|\u30FC=\u307E|\u30FC" // MA - "=\u30E3|\u30FC=\uFF6C|\u30FC=\u3083|\u30FC" // YA - "=\u30E4|\u30FC=\uFF94|\u30FC=\u3084|\u30FC" // YA - "=\u30E9|\u30FC=\uFF97|\u30FC=\u3089|\u30FC" // RA - "=\u30EE|\u30FC=\u308E|\u30FC" // WA - "=\u30EF|\u30FC=\uFF9C|\u30FC=\u308F|\u30FC" // WA - "=\u30F5|\u30FC" // KA - "=\u30F7|\u30FC" // VA + "<<< \u30A1|\u30FC = \uFF67|\u30FC = \u3041|\u30FC" // A + "= \u30A2|\u30FC = \uFF71|\u30FC = \u3042|\u30FC" // A + "= \u30AB|\u30FC = \uFF76|\u30FC = \u304B|\u30FC" // KA + "= \u30AC|\u30FC = \u304C|\u30FC" // GA + "= \u30B5|\u30FC = \uFF7B|\u30FC = \u3055|\u30FC" // SA + "= \u30B6|\u30FC = \u3056|\u30FC" // ZA + "= \u30BF|\u30FC = \uFF80|\u30FC = \u305F|\u30FC" // TA + "= \u30C0|\u30FC = \u3060|\u30FC" // DA + "= \u30CA|\u30FC = \uFF85|\u30FC = \u306A|\u30FC" // NA + "= \u30CF|\u30FC = \uFF8A|\u30FC = \u306F|\u30FC" // HA + "= \u30D0|\u30FC = \u3070|\u30FC" // BA + "= \u30D1|\u30FC = \u3071|\u30FC" // PA + "= \u30DE|\u30FC = \uFF8F|\u30FC = \u307E|\u30FC" // MA + "= \u30E3|\u30FC = \uFF6C|\u30FC = \u3083|\u30FC" // YA + "= \u30E4|\u30FC = \uFF94|\u30FC = \u3084|\u30FC" // YA + "= \u30E9|\u30FC = \uFF97|\u30FC = \u3089|\u30FC" // RA + "= \u30EE|\u30FC = \u308E|\u30FC" // WA + "= \u30EF|\u30FC = \uFF9C|\u30FC = \u308F|\u30FC" // WA + "= \u30F5|\u30FC" // KA + "= \u30F7|\u30FC" // VA "&[before 3]\u30A3" //KATAKANA LETTER SMALL I - "<<<\u30A3|\u30FC=\uFF68|\u30FC=\u3043|\u30FC" // I - "=\u30A4|\u30FC=\uFF72|\u30FC=\u3044|\u30FC" // I - "=\u30AD|\u30FC=\uFF77|\u30FC=\u304D|\u30FC" // KI - "=\u30AE|\u30FC=\u304E|\u30FC" // GI - "=\u30B7|\u30FC=\uFF7C|\u30FC=\u3057|\u30FC" // SI - "=\u30B8|\u30FC=\u3058|\u30FC" // ZI - "=\u30C1|\u30FC=\uFF81|\u30FC=\u3061|\u30FC" // TI - "=\u30C2|\u30FC=\u3062|\u30FC" // DI - "=\u30CB|\u30FC=\uFF86|\u30FC=\u306B|\u30FC" // NI - "=\u30D2|\u30FC=\uFF8B|\u30FC=\u3072|\u30FC" // HI - "=\u30D3|\u30FC=\u3073|\u30FC" // BI - "=\u30D4|\u30FC=\u3074|\u30FC" // PI - "=\u30DF|\u30FC=\uFF90|\u30FC=\u307F|\u30FC" // MI - "=\u30EA|\u30FC=\uFF98|\u30FC=\u308A|\u30FC" // RI - "=\u30F0|\u30FC=\u3090|\u30FC" // WI - "=\u30F8|\u30FC" // VI + "<<< \u30A3|\u30FC = \uFF68|\u30FC = \u3043|\u30FC" // I + "= \u30A4|\u30FC = \uFF72|\u30FC = \u3044|\u30FC" // I + "= \u30AD|\u30FC = \uFF77|\u30FC = \u304D|\u30FC" // KI + "= \u30AE|\u30FC = \u304E|\u30FC" // GI + "= \u30B7|\u30FC = \uFF7C|\u30FC = \u3057|\u30FC" // SI + "= \u30B8|\u30FC = \u3058|\u30FC" // ZI + "= \u30C1|\u30FC = \uFF81|\u30FC = \u3061|\u30FC" // TI + "= \u30C2|\u30FC = \u3062|\u30FC" // DI + "= \u30CB|\u30FC = \uFF86|\u30FC = \u306B|\u30FC" // NI + "= \u30D2|\u30FC = \uFF8B|\u30FC = \u3072|\u30FC" // HI + "= \u30D3|\u30FC = \u3073|\u30FC" // BI + "= \u30D4|\u30FC = \u3074|\u30FC" // PI + "= \u30DF|\u30FC = \uFF90|\u30FC = \u307F|\u30FC" // MI + "= \u30EA|\u30FC = \uFF98|\u30FC = \u308A|\u30FC" // RI + "= \u30F0|\u30FC = \u3090|\u30FC" // WI + "= \u30F8|\u30FC" // VI "&[before 3]\u30A5" //KATAKANA LETTER SMALL U - "<<<\u30A5|\u30FC=\uFF69|\u30FC=\u3045|\u30FC" // U - "=\u30A6|\u30FC=\uFF73|\u30FC=\u3046|\u30FC" // U - "=\u30AF|\u30FC=\uFF78|\u30FC=\u304F|\u30FC" // KU - "=\u30B0|\u30FC=\u3050|\u30FC" // GU - "=\u30B9|\u30FC=\uFF7D|\u30FC=\u3059|\u30FC" // SU - "=\u30BA|\u30FC=\u305A|\u30FC" // ZU - "=\u30C3|\u30FC=\uFF6F|\u30FC=\u3063|\u30FC" // TU - "=\u30C4|\u30FC=\uFF82|\u30FC=\u3064|\u30FC" // TU - "=\u30C5|\u30FC=\u3065|\u30FC" // DU - "=\u30CC|\u30FC=\uFF87|\u30FC=\u306C|\u30FC" // NU - "=\u30D5|\u30FC=\uFF8C|\u30FC=\u3075|\u30FC" // HU - "=\u30D6|\u30FC=\u3076|\u30FC" // BU - "=\u30D7|\u30FC=\u3077|\u30FC" // PU - "=\u30E0|\u30FC=\uFF91|\u30FC=\u3080|\u30FC" // MU - "=\u30E5|\u30FC=\uFF6D|\u30FC=\u3085|\u30FC" // YU - "=\u30E6|\u30FC=\uFF95|\u30FC=\u3086|\u30FC" // YU - "=\u30EB|\u30FC=\uFF99|\u30FC=\u308B|\u30FC" // RU - "=\u30F4|\u30FC=\u3094|\u30FC" // VU + "<<< \u30A5|\u30FC = \uFF69|\u30FC = \u3045|\u30FC" // U + "= \u30A6|\u30FC = \uFF73|\u30FC = \u3046|\u30FC" // U + "= \u30AF|\u30FC = \uFF78|\u30FC = \u304F|\u30FC" // KU + "= \u30B0|\u30FC = \u3050|\u30FC" // GU + "= \u30B9|\u30FC = \uFF7D|\u30FC = \u3059|\u30FC" // SU + "= \u30BA|\u30FC = \u305A|\u30FC" // ZU + "= \u30C3|\u30FC = \uFF6F|\u30FC = \u3063|\u30FC" // TU + "= \u30C4|\u30FC = \uFF82|\u30FC = \u3064|\u30FC" // TU + "= \u30C5|\u30FC = \u3065|\u30FC" // DU + "= \u30CC|\u30FC = \uFF87|\u30FC = \u306C|\u30FC" // NU + "= \u30D5|\u30FC = \uFF8C|\u30FC = \u3075|\u30FC" // HU + "= \u30D6|\u30FC = \u3076|\u30FC" // BU + "= \u30D7|\u30FC = \u3077|\u30FC" // PU + "= \u30E0|\u30FC = \uFF91|\u30FC = \u3080|\u30FC" // MU + "= \u30E5|\u30FC = \uFF6D|\u30FC = \u3085|\u30FC" // YU + "= \u30E6|\u30FC = \uFF95|\u30FC = \u3086|\u30FC" // YU + "= \u30EB|\u30FC = \uFF99|\u30FC = \u308B|\u30FC" // RU + "= \u30F4|\u30FC = \u3094|\u30FC" // VU "&[before 3]\u30A7" //KATAKANA LETTER SMALL E - "<<<\u30A7|\u30FC=\uFF6A|\u30FC=\u3047|\u30FC" // E - "=\u30A8|\u30FC=\uFF74|\u30FC=\u3048|\u30FC" // E - "=\u30B1|\u30FC=\uFF79|\u30FC=\u3051|\u30FC" // KE - "=\u30B2|\u30FC=\u3052|\u30FC" // GE - "=\u30BB|\u30FC=\uFF7E|\u30FC=\u305B|\u30FC" // SE - "=\u30BC|\u30FC=\u305C|\u30FC" // ZE - "=\u30C6|\u30FC=\uFF83|\u30FC=\u3066|\u30FC" // TE - "=\u30C7|\u30FC=\u3067|\u30FC" // DE - "=\u30CD|\u30FC=\uFF88|\u30FC=\u306D|\u30FC" // NE - "=\u30D8|\u30FC=\uFF8D|\u30FC=\u3078|\u30FC" // HE - "=\u30D9|\u30FC=\u3079|\u30FC" // BE - "=\u30DA|\u30FC=\u307A|\u30FC" // PE - "=\u30E1|\u30FC=\uFF92|\u30FC=\u3081|\u30FC" // ME - "=\u30EC|\u30FC=\uFF9A|\u30FC=\u308C|\u30FC" // RE - "=\u30F1|\u30FC=\u3091|\u30FC" // WE - "=\u30F6|\u30FC" // KE - "=\u30F9|\u30FC" // VE + "<<< \u30A7|\u30FC = \uFF6A|\u30FC = \u3047|\u30FC" // E + "= \u30A8|\u30FC = \uFF74|\u30FC = \u3048|\u30FC" // E + "= \u30B1|\u30FC = \uFF79|\u30FC = \u3051|\u30FC" // KE + "= \u30B2|\u30FC = \u3052|\u30FC" // GE + "= \u30BB|\u30FC = \uFF7E|\u30FC = \u305B|\u30FC" // SE + "= \u30BC|\u30FC = \u305C|\u30FC" // ZE + "= \u30C6|\u30FC = \uFF83|\u30FC = \u3066|\u30FC" // TE + "= \u30C7|\u30FC = \u3067|\u30FC" // DE + "= \u30CD|\u30FC = \uFF88|\u30FC = \u306D|\u30FC" // NE + "= \u30D8|\u30FC = \uFF8D|\u30FC = \u3078|\u30FC" // HE + "= \u30D9|\u30FC = \u3079|\u30FC" // BE + "= \u30DA|\u30FC = \u307A|\u30FC" // PE + "= \u30E1|\u30FC = \uFF92|\u30FC = \u3081|\u30FC" // ME + "= \u30EC|\u30FC = \uFF9A|\u30FC = \u308C|\u30FC" // RE + "= \u30F1|\u30FC = \u3091|\u30FC" // WE + "= \u30F6|\u30FC" // KE + "= \u30F9|\u30FC" // VE "&[before 3]\u30A9" //KATAKANA LETTER SMALL O - "<<<\u30A9|\u30FC=\uFF6B|\u30FC=\u3049|\u30FC" // O - "=\u30AA|\u30FC=\uFF75|\u30FC=\u304A|\u30FC" // O - "=\u30B3|\u30FC=\uFF7A|\u30FC=\u3053|\u30FC" // KO - "=\u30B4|\u30FC=\u3054|\u30FC" // GO - "=\u30BD|\u30FC=\uFF7F|\u30FC=\u305D|\u30FC" // SO - "=\u30BE|\u30FC=\u305E|\u30FC" // ZO - "=\u30C8|\u30FC=\uFF84|\u30FC=\u3068|\u30FC" // TO - "=\u30C9|\u30FC=\u3069|\u30FC" // DO - "=\u30CE|\u30FC=\uFF89|\u30FC=\u306E|\u30FC" // NO - "=\u30DB|\u30FC=\uFF8E|\u30FC=\u307B|\u30FC" // HO - "=\u30DC|\u30FC=\u307C|\u30FC" // BO - "=\u30DD|\u30FC=\u307D|\u30FC" // PO - "=\u30E2|\u30FC=\uFF93|\u30FC=\u3082|\u30FC" // MO - "=\u30E7|\u30FC=\uFF6E|\u30FC=\u3087|\u30FC" // YO - "=\u30E8|\u30FC=\uFF96|\u30FC=\u3088|\u30FC" // YO - "=\u30ED|\u30FC=\uFF9B|\u30FC=\u308D|\u30FC" // RO - "=\u30F2|\u30FC=\uFF66|\u30FC=\u3092|\u30FC" // WO - "=\u30FA|\u30FC" // VO + "<<< \u30A9|\u30FC = \uFF6B|\u30FC = \u3049|\u30FC" // O + "= \u30AA|\u30FC = \uFF75|\u30FC = \u304A|\u30FC" // O + "= \u30B3|\u30FC = \uFF7A|\u30FC = \u3053|\u30FC" // KO + "= \u30B4|\u30FC = \u3054|\u30FC" // GO + "= \u30BD|\u30FC = \uFF7F|\u30FC = \u305D|\u30FC" // SO + "= \u30BE|\u30FC = \u305E|\u30FC" // ZO + "= \u30C8|\u30FC = \uFF84|\u30FC = \u3068|\u30FC" // TO + "= \u30C9|\u30FC = \u3069|\u30FC" // DO + "= \u30CE|\u30FC = \uFF89|\u30FC = \u306E|\u30FC" // NO + "= \u30DB|\u30FC = \uFF8E|\u30FC = \u307B|\u30FC" // HO + "= \u30DC|\u30FC = \u307C|\u30FC" // BO + "= \u30DD|\u30FC = \u307D|\u30FC" // PO + "= \u30E2|\u30FC = \uFF93|\u30FC = \u3082|\u30FC" // MO + "= \u30E7|\u30FC = \uFF6E|\u30FC = \u3087|\u30FC" // YO + "= \u30E8|\u30FC = \uFF96|\u30FC = \u3088|\u30FC" // YO + "= \u30ED|\u30FC = \uFF9B|\u30FC = \u308D|\u30FC" // RO + "= \u30F2|\u30FC = \uFF66|\u30FC = \u3092|\u30FC" // WO + "= \u30FA|\u30FC" // VO // Rules for treating iteration mark "&[before 3]\u30A2" //KATAKANA LETTER A - "<<<\u30A2|\u30FD=\uFF71|\u30FD=\u3042|\u309D" - "=\u30A1|\u30FD=\uFF67|\u30FD=\u3041|\u309D" + "<<< \u30A2|\u30FD = \uFF71|\u30FD = \u3042|\u309D" + "= \u30A1|\u30FD = \uFF67|\u30FD = \u3041|\u309D" "&[before 3]\u30A4" //KATAKANA LETTER I - "<<<\u30A4|\u30FD=\uFF72|\u30FD=\u3044|\u309D" - "=\u30A3|\u30FD=\uFF68|\u30FD=\u3043|\u309D" + "<<< \u30A4|\u30FD = \uFF72|\u30FD = \u3044|\u309D" + "= \u30A3|\u30FD = \uFF68|\u30FD = \u3043|\u309D" "&[before 3]\u30A6" //KATAKANA LETTER U - "<<<\u30A6|\u30FD=\uFF73|\u30FD=\u3046|\u309D" - "=\u30A5|\u30FD=\uFF69|\u30FD=\u3045|\u309D" - "=\u30F4|\u30FD=\u3094|\u309D" - "=\u30A6|\u30FE/\u3099=\uFF73|\u30FE/\u3099=\u3046|\u309E/\u3099" - "=\u30A5|\u30FE/\u3099=\uFF69|\u30FE/\u3099=\u3045|\u309E/\u3099" - "=\u30F4|\u30FE/\u3099=\u3094|\u309E/\u3099" + "<<< \u30A6|\u30FD = \uFF73|\u30FD = \u3046|\u309D" + "= \u30A5|\u30FD = \uFF69|\u30FD = \u3045|\u309D" + "= \u30F4|\u30FD = \u3094|\u309D" + "= \u30A6|\u30FE/\u3099 = \uFF73|\u30FE/\u3099 = \u3046|\u309E/\u3099" + "= \u30A5|\u30FE/\u3099 = \uFF69|\u30FE/\u3099 = \u3045|\u309E/\u3099" + "= \u30F4|\u30FE/\u3099 = \u3094|\u309E/\u3099" "&[before 3]\u30A8" //KATAKANA LETTER E - "<<<\u30A8|\u30FD=\uFF74|\u30FD=\u3048|\u309D" - "=\u30A7|\u30FD=\uFF6A|\u30FD=\u3047|\u309D" + "<<< \u30A8|\u30FD = \uFF74|\u30FD = \u3048|\u309D" + "= \u30A7|\u30FD = \uFF6A|\u30FD = \u3047|\u309D" "&[before 3]\u30AA" //KATAKANA LETTER O - "<<<\u30AA|\u30FD=\uFF75|\u30FD=\u304A|\u309D" - "=\u30A9|\u30FD=\uFF6B|\u30FD=\u3049|\u309D" + "<<< \u30AA|\u30FD = \uFF75|\u30FD = \u304A|\u309D" + "= \u30A9|\u30FD = \uFF6B|\u30FD = \u3049|\u309D" "&[before 3]\u30AB" //KATAKANA LETTER KA - "<<<\u30AB|\u30FD=\uFF76|\u30FD=\u304B|\u309D" - "=\u30F5|\u30FD" + "<<< \u30AB|\u30FD = \uFF76|\u30FD = \u304B|\u309D" + "= \u30F5|\u30FD" "&[before 3]\u30AC" //KATAKANA LETTER GA - "<<<\u30AC|\u30FD=\u304C|\u309D" + "<<< \u30AC|\u30FD = \u304C|\u309D" "&[before 3]\u30AD" //KATAKANA LETTER KI - "<<<\u30AD|\u30FD=\uFF77|\u30FD=\u304D|\u309D" - "=\u30AE|\u30FD=\u304E|\u309D" - "=\u30AD|\u30FE/\u3099=\uFF77|\u30FE/\u3099=\u304D|\u309E/\u3099" - "=\u30AE|\u30FE/\u3099=\u304E|\u309E/\u3099" + "<<< \u30AD|\u30FD = \uFF77|\u30FD = \u304D|\u309D" + "= \u30AE|\u30FD = \u304E|\u309D" + "= \u30AD|\u30FE/\u3099 = \uFF77|\u30FE/\u3099 = \u304D|\u309E/\u3099" + "= \u30AE|\u30FE/\u3099 = \u304E|\u309E/\u3099" "&[before 3]\u30AF" //KATAKANA LETTER KU - "<<<\u30AF|\u30FD=\uFF78|\u30FD=\u304F|\u309D" - "=\u30B0|\u30FD=\u3050|\u309D" - "=\u30AF|\u30FE/\u3099=\uFF78|\u30FE/\u3099=\u304F|\u309E/\u3099" - "=\u30B0|\u30FE/\u3099=\u3050|\u309E/\u3099" + "<<< \u30AF|\u30FD = \uFF78|\u30FD = \u304F|\u309D" + "= \u30B0|\u30FD = \u3050|\u309D" + "= \u30AF|\u30FE/\u3099 = \uFF78|\u30FE/\u3099 = \u304F|\u309E/\u3099" + "= \u30B0|\u30FE/\u3099 = \u3050|\u309E/\u3099" "&[before 3]\u30B1" //KATAKANA LETTER KE - "<<<\u30B1|\u30FD=\uFF79|\u30FD=\u3051|\u309D" - "=\u30F6|\u30FD" + "<<< \u30B1|\u30FD = \uFF79|\u30FD = \u3051|\u309D" + "= \u30F6|\u30FD" "&[before 3]\u30B2" //KATAKANA LETTER GE - "<<<\u30B2|\u30FD=\u3052|\u309D" + "<<< \u30B2|\u30FD = \u3052|\u309D" "&[before 3]\u30B3" //KATAKANA LETTER KO - "<<<\u30B3|\u30FD=\uFF7A|\u30FD=\u3053|\u309D" - "=\u30B4|\u30FD=\u3054|\u309D" - "=\u30B3|\u30FE/\u3099=\uFF7A|\u30FE/\u3099=\u3053|\u309E/\u3099" - "=\u30B4|\u30FE/\u3099=\u3054|\u309E/\u3099" + "<<< \u30B3|\u30FD = \uFF7A|\u30FD = \u3053|\u309D" + "= \u30B4|\u30FD = \u3054|\u309D" + "= \u30B3|\u30FE/\u3099 = \uFF7A|\u30FE/\u3099 = \u3053|\u309E/\u3099" + "= \u30B4|\u30FE/\u3099 = \u3054|\u309E/\u3099" "&[before 3]\u30B5" //KATAKANA LETTER SA - "<<<\u30B5|\u30FD=\uFF7B|\u30FD=\u3055|\u309D" - "=\u30B6|\u30FD=\u3056|\u309D" - "=\u30B5|\u30FE/\u3099=\uFF7B|\u30FE/\u3099=\u3055|\u309E/\u3099" - "=\u30B6|\u30FE/\u3099=\u3056|\u309E/\u3099" + "<<< \u30B5|\u30FD = \uFF7B|\u30FD = \u3055|\u309D" + "= \u30B6|\u30FD = \u3056|\u309D" + "= \u30B5|\u30FE/\u3099 = \uFF7B|\u30FE/\u3099 = \u3055|\u309E/\u3099" + "= \u30B6|\u30FE/\u3099 = \u3056|\u309E/\u3099" "&[before 3]\u30B7" //KATAKANA LETTER SI - "<<<\u30B7|\u30FD=\uFF7C|\u30FD=\u3057|\u309D" - "=\u30B8|\u30FD=\u3058|\u309D" - "=\u30B7|\u30FE/\u3099=\uFF7C|\u30FE/\u3099=\u3057|\u309E/\u3099" - "=\u30B8|\u30FE/\u3099=\u3058|\u309E/\u3099" + "<<< \u30B7|\u30FD = \uFF7C|\u30FD = \u3057|\u309D" + "= \u30B8|\u30FD = \u3058|\u309D" + "= \u30B7|\u30FE/\u3099 = \uFF7C|\u30FE/\u3099 = \u3057|\u309E/\u3099" + "= \u30B8|\u30FE/\u3099 = \u3058|\u309E/\u3099" "&[before 3]\u30B9" //KATAKANA LETTER SU - "<<<\u30B9|\u30FD=\uFF7D|\u30FD=\u3059|\u309D" - "=\u30BA|\u30FD=\u305A|\u309D" - "=\u30B9|\u30FE/\u3099=\uFF7D|\u30FE/\u3099=\u3059|\u309E/\u3099" - "=\u30BA|\u30FE/\u3099=\u305A|\u309E/\u3099" + "<<< \u30B9|\u30FD = \uFF7D|\u30FD = \u3059|\u309D" + "= \u30BA|\u30FD = \u305A|\u309D" + "= \u30B9|\u30FE/\u3099 = \uFF7D|\u30FE/\u3099 = \u3059|\u309E/\u3099" + "= \u30BA|\u30FE/\u3099 = \u305A|\u309E/\u3099" "&[before 3]\u30BB" //KATAKANA LETTER SE - "<<<\u30BB|\u30FD=\uFF7E|\u30FD=\u305B|\u309D" - "=\u30BC|\u30FD=\u305C|\u309D" - "=\u30BB|\u30FE/\u3099=\uFF7E|\u30FE/\u3099=\u305B|\u309E/\u3099" - "=\u30BC|\u30FE/\u3099=\u305C|\u309E/\u3099" + "<<< \u30BB|\u30FD = \uFF7E|\u30FD = \u305B|\u309D" + "= \u30BC|\u30FD = \u305C|\u309D" + "= \u30BB|\u30FE/\u3099 = \uFF7E|\u30FE/\u3099 = \u305B|\u309E/\u3099" + "= \u30BC|\u30FE/\u3099 = \u305C|\u309E/\u3099" "&[before 3]\u30BD" //KATAKANA LETTER SO - "<<<\u30BD|\u30FD=\uFF7F|\u30FD=\u305D|\u309D" - "=\u30BE|\u30FD=\u305E|\u309D" - "=\u30BD|\u30FE/\u3099=\uFF7F|\u30FE/\u3099=\u305D|\u309E/\u3099" - "=\u30BE|\u30FE/\u3099=\u305E|\u309E/\u3099" + "<<< \u30BD|\u30FD = \uFF7F|\u30FD = \u305D|\u309D" + "= \u30BE|\u30FD = \u305E|\u309D" + "= \u30BD|\u30FE/\u3099 = \uFF7F|\u30FE/\u3099 = \u305D|\u309E/\u3099" + "= \u30BE|\u30FE/\u3099 = \u305E|\u309E/\u3099" "&[before 3]\u30BF" //KATAKANA LETTER TA - "<<<\u30BF|\u30FD=\uFF80|\u30FD=\u305F|\u309D" - "=\u30C0|\u30FD=\u3060|\u309D" - "=\u30BF|\u30FE/\u3099=\uFF80|\u30FE/\u3099=\u305F|\u309E/\u3099" - "=\u30C0|\u30FE/\u3099=\u3060|\u309E/\u3099" + "<<< \u30BF|\u30FD = \uFF80|\u30FD = \u305F|\u309D" + "= \u30C0|\u30FD = \u3060|\u309D" + "= \u30BF|\u30FE/\u3099 = \uFF80|\u30FE/\u3099 = \u305F|\u309E/\u3099" + "= \u30C0|\u30FE/\u3099 = \u3060|\u309E/\u3099" "&[before 3]\u30C1" //KATAKANA LETTER TI - "<<<\u30C1|\u30FD=\uFF81|\u30FD=\u3061|\u309D" - "=\u30C2|\u30FD=\u3062|\u309D" - "=\u30C1|\u30FE/\u3099=\uFF81|\u30FE/\u3099=\u3061|\u309E/\u3099" - "=\u30C2|\u30FE/\u3099=\u3062|\u309E/\u3099" + "<<< \u30C1|\u30FD = \uFF81|\u30FD = \u3061|\u309D" + "= \u30C2|\u30FD = \u3062|\u309D" + "= \u30C1|\u30FE/\u3099 = \uFF81|\u30FE/\u3099 = \u3061|\u309E/\u3099" + "= \u30C2|\u30FE/\u3099 = \u3062|\u309E/\u3099" "&[before 3]\u30C4" //KATAKANA LETTER TU - "<<<\u30C4|\u30FD=\uFF82|\u30FD=\u3064|\u309D" - "=\u30C3|\u30FD=\uFF6F|\u30FD=\u3063|\u309D" - "=\u30C5|\u30FD=\u3065|\u309D" - "=\u30C4|\u30FE/\u3099=\uFF82|\u30FE/\u3099=\u3064|\u309E/\u3099" - "=\u30C5|\u30FE/\u3099=\u3065|\u309E/\u3099" - "=\u30C4|\u30FD=\uFF82|\u30FD=\u3064|\u309D" - "=\u30C3|\u30FE/\u3099=\uFF6F|\u30FE/\u3099=\u3063|\u309E/\u3099" - "=\u30C4|\u30FE/\u3099=\uFF82|\u30FE/\u3099=\u3064|\u309E/\u3099" + "<<< \u30C4|\u30FD = \uFF82|\u30FD = \u3064|\u309D" + "= \u30C3|\u30FD = \uFF6F|\u30FD = \u3063|\u309D" + "= \u30C5|\u30FD = \u3065|\u309D" + "= \u30C4|\u30FE/\u3099 = \uFF82|\u30FE/\u3099 = \u3064|\u309E/\u3099" + "= \u30C5|\u30FE/\u3099 = \u3065|\u309E/\u3099" + "= \u30C4|\u30FD = \uFF82|\u30FD = \u3064|\u309D" + "= \u30C3|\u30FE/\u3099 = \uFF6F|\u30FE/\u3099 = \u3063|\u309E/\u3099" + "= \u30C4|\u30FE/\u3099 = \uFF82|\u30FE/\u3099 = \u3064|\u309E/\u3099" "&[before 3]\u30C6" //KATAKANA LETTER TE - "<<<\u30C6|\u30FD=\uFF83|\u30FD=\u3066|\u309D" - "=\u30C7|\u30FD=\u3067|\u309D" - "=\u30C6|\u30FE/\u3099=\uFF83|\u30FE/\u3099=\u3066|\u309E/\u3099" - "=\u30C7|\u30FE/\u3099=\u3067|\u309E/\u3099" + "<<< \u30C6|\u30FD = \uFF83|\u30FD = \u3066|\u309D" + "= \u30C7|\u30FD = \u3067|\u309D" + "= \u30C6|\u30FE/\u3099 = \uFF83|\u30FE/\u3099 = \u3066|\u309E/\u3099" + "= \u30C7|\u30FE/\u3099 = \u3067|\u309E/\u3099" "&[before 3]\u30C8" //KATAKANA LETTER TO - "<<<\u30C8|\u30FD=\uFF84|\u30FD=\u3068|\u309D" - "=\u30C9|\u30FD=\u3069|\u309D" - "=\u30C8|\u30FE/\u3099=\uFF84|\u30FE/\u3099=\u3068|\u309E/\u3099" - "=\u30C9|\u30FE/\u3099=\u3069|\u309E/\u3099" + "<<< \u30C8|\u30FD = \uFF84|\u30FD = \u3068|\u309D" + "= \u30C9|\u30FD = \u3069|\u309D" + "= \u30C8|\u30FE/\u3099 = \uFF84|\u30FE/\u3099 = \u3068|\u309E/\u3099" + "= \u30C9|\u30FE/\u3099 = \u3069|\u309E/\u3099" "&[before 3]\u30CA" //KATAKANA LETTER NA - "<<<\u30CA|\u30FD=\uFF85|\u30FD=\u306A|\u309D" + "<<< \u30CA|\u30FD = \uFF85|\u30FD = \u306A|\u309D" "&[before 3]\u30CB" //KATAKANA LETTER NI - "<<<\u30CB|\u30FD=\uFF86|\u30FD=\u306B|\u309D" + "<<< \u30CB|\u30FD = \uFF86|\u30FD = \u306B|\u309D" "&[before 3]\u30CC" //KATAKANA LETTER NU - "<<<\u30CC|\u30FD=\uFF87|\u30FD=\u306C|\u309D" + "<<< \u30CC|\u30FD = \uFF87|\u30FD = \u306C|\u309D" "&[before 3]\u30CD" //KATAKANA LETTER NE - "<<<\u30CD|\u30FD=\uFF88|\u30FD=\u306D|\u309D" + "<<< \u30CD|\u30FD = \uFF88|\u30FD = \u306D|\u309D" "&[before 3]\u30CE" //KATAKANA LETTER NO - "<<<\u30CE|\u30FD=\uFF89|\u30FD=\u306E|\u309D" + "<<< \u30CE|\u30FD = \uFF89|\u30FD = \u306E|\u309D" "&[before 3]\u30CF" //KATAKANA LETTER HA - "<<<\u30CF|\u30FD=\uFF8A|\u30FD=\u306F|\u309D" - "=\u30D0|\u30FD=\u3070|\u309D" - "=\u30CF|\u30FE/\u3099=\uFF8A|\u30FE/\u3099=\u306F|\u309E/\u3099" - "=\u30D0|\u30FE/\u3099=\u3070|\u309E/\u3099" - "=\u30D1|\u30FD=\u3071|\u309D" - "=\u30D1|\u30FE/\u3099=\u3071|\u309E/\u3099" + "<<< \u30CF|\u30FD = \uFF8A|\u30FD = \u306F|\u309D" + "= \u30D0|\u30FD = \u3070|\u309D" + "= \u30CF|\u30FE/\u3099 = \uFF8A|\u30FE/\u3099 = \u306F|\u309E/\u3099" + "= \u30D0|\u30FE/\u3099 = \u3070|\u309E/\u3099" + "= \u30D1|\u30FD = \u3071|\u309D" + "= \u30D1|\u30FE/\u3099 = \u3071|\u309E/\u3099" "&[before 3]\u30D2" //KATAKANA LETTER HI - "<<<\u30D2|\u30FD=\uFF8B|\u30FD=\u3072|\u309D" - "=\u30D3|\u30FD=\u3073|\u309D" - "=\u30D2|\u30FE/\u3099=\uFF8B|\u30FE/\u3099=\u3072|\u309E/\u3099" - "=\u30D3|\u30FE/\u3099=\u3073|\u309E/\u3099" - "=\u30D4|\u30FD=\u3074|\u309D" - "=\u30D4|\u30FE/\u3099=\u3074|\u309E/\u3099" + "<<< \u30D2|\u30FD = \uFF8B|\u30FD = \u3072|\u309D" + "= \u30D3|\u30FD = \u3073|\u309D" + "= \u30D2|\u30FE/\u3099 = \uFF8B|\u30FE/\u3099 = \u3072|\u309E/\u3099" + "= \u30D3|\u30FE/\u3099 = \u3073|\u309E/\u3099" + "= \u30D4|\u30FD = \u3074|\u309D" + "= \u30D4|\u30FE/\u3099 = \u3074|\u309E/\u3099" "&[before 3]\u30D5" //KATAKANA LETTER HU - "<<<\u30D5|\u30FD=\uFF8C|\u30FD=\u3075|\u309D" - "=\u30D6|\u30FD=\u3076|\u309D" - "=\u30D5|\u30FE/\u3099=\uFF8C|\u30FE/\u3099=\u3075|\u309E/\u3099" - "=\u30D6|\u30FE/\u3099=\u3076|\u309E/\u3099" - "=\u30D7|\u30FD=\u3077|\u309D" - "=\u30D7|\u30FE/\u3099=\u3077|\u309E/\u3099" + "<<< \u30D5|\u30FD = \uFF8C|\u30FD = \u3075|\u309D" + "= \u30D6|\u30FD = \u3076|\u309D" + "= \u30D5|\u30FE/\u3099 = \uFF8C|\u30FE/\u3099 = \u3075|\u309E/\u3099" + "= \u30D6|\u30FE/\u3099 = \u3076|\u309E/\u3099" + "= \u30D7|\u30FD = \u3077|\u309D" + "= \u30D7|\u30FE/\u3099 = \u3077|\u309E/\u3099" "&[before 3]\u30D8" //KATAKANA LETTER HE - "<<<\u30D8|\u30FD=\uFF8D|\u30FD=\u3078|\u309D" - "=\u30D9|\u30FD=\u3079|\u309D" - "=\u30D8|\u30FE/\u3099=\uFF8D|\u30FE/\u3099=\u3078|\u309E/\u3099" - "=\u30D9|\u30FE/\u3099=\u3079|\u309E/\u3099" - "=\u30DA|\u30FD=\u307A|\u309D" - "=\u30DA|\u30FE/\u3099=\u307A|\u309E/\u3099" + "<<< \u30D8|\u30FD = \uFF8D|\u30FD = \u3078|\u309D" + "= \u30D9|\u30FD = \u3079|\u309D" + "= \u30D8|\u30FE/\u3099 = \uFF8D|\u30FE/\u3099 = \u3078|\u309E/\u3099" + "= \u30D9|\u30FE/\u3099 = \u3079|\u309E/\u3099" + "= \u30DA|\u30FD = \u307A|\u309D" + "= \u30DA|\u30FE/\u3099 = \u307A|\u309E/\u3099" "&[before 3]\u30DB" //KATAKANA LETTER HO - "<<<\u30DB|\u30FD=\uFF8E|\u30FD=\u307B|\u309D" - "=\u30DC|\u30FD=\u307C|\u309D" - "=\u30DB|\u30FE/\u3099=\uFF8E|\u30FE/\u3099=\u307B|\u309E/\u3099" - "=\u30DC|\u30FE/\u3099=\u307C|\u309E/\u3099" - "=\u30DD|\u30FD=\u307D|\u309D" - "=\u30DD|\u30FE/\u3099=\u307D|\u309E/\u3099" + "<<< \u30DB|\u30FD = \uFF8E|\u30FD = \u307B|\u309D" + "= \u30DC|\u30FD = \u307C|\u309D" + "= \u30DB|\u30FE/\u3099 = \uFF8E|\u30FE/\u3099 = \u307B|\u309E/\u3099" + "= \u30DC|\u30FE/\u3099 = \u307C|\u309E/\u3099" + "= \u30DD|\u30FD = \u307D|\u309D" + "= \u30DD|\u30FE/\u3099 = \u307D|\u309E/\u3099" "&[before 3]\u30DE" //KATAKANA LETTER MA - "<<<\u30DE|\u30FD=\uFF8F|\u30FD=\u307E|\u309D" + "<<< \u30DE|\u30FD = \uFF8F|\u30FD = \u307E|\u309D" "&[before 3]\u30DF" //KATAKANA LETTER MI - "<<<\u30DF|\u30FD=\uFF90|\u30FD=\u307F|\u309D" + "<<< \u30DF|\u30FD = \uFF90|\u30FD = \u307F|\u309D" "&[before 3]\u30E0" //KATAKANA LETTER MU - "<<<\u30E0|\u30FD=\uFF91|\u30FD=\u3080|\u309D" + "<<< \u30E0|\u30FD = \uFF91|\u30FD = \u3080|\u309D" "&[before 3]\u30E1" //KATAKANA LETTER ME - "<<<\u30E1|\u30FD=\uFF92|\u30FD=\u3081|\u309D" + "<<< \u30E1|\u30FD = \uFF92|\u30FD = \u3081|\u309D" "&[before 3]\u30E2" //KATAKANA LETTER MO - "<<<\u30E2|\u30FD=\uFF93|\u30FD=\u3082|\u309D" + "<<< \u30E2|\u30FD = \uFF93|\u30FD = \u3082|\u309D" "&[before 3]\u30E4" //KATAKANA LETTER YA - "<<<\u30E4|\u30FD=\uFF94|\u30FD=\u3084|\u309D" - "=\u30E3|\u30FD=\uFF6C|\u30FD=\u3083|\u309D" + "<<< \u30E4|\u30FD = \uFF94|\u30FD = \u3084|\u309D" + "= \u30E3|\u30FD = \uFF6C|\u30FD = \u3083|\u309D" "&[before 3]\u30E6" //KATAKANA LETTER YU - "<<<\u30E6|\u30FD=\uFF95|\u30FD=\u3086|\u309D" - "=\u30E5|\u30FD=\uFF6D|\u30FD=\u3085|\u309D" + "<<< \u30E6|\u30FD = \uFF95|\u30FD = \u3086|\u309D" + "= \u30E5|\u30FD = \uFF6D|\u30FD = \u3085|\u309D" "&[before 3]\u30E8" //KATAKANA LETTER YO - "<<<\u30E8|\u30FD=\uFF96|\u30FD=\u3088|\u309D" - "=\u30E7|\u30FD=\uFF6E|\u30FD=\u3087|\u309D" + "<<< \u30E8|\u30FD = \uFF96|\u30FD = \u3088|\u309D" + "= \u30E7|\u30FD = \uFF6E|\u30FD = \u3087|\u309D" "&[before 3]\u30E9" //KATAKANA LETTER RA - "<<<\u30E9|\u30FD=\uFF97|\u30FD=\u3089|\u309D" + "<<< \u30E9|\u30FD = \uFF97|\u30FD = \u3089|\u309D" "&[before 3]\u30EA" //KATAKANA LETTER RI - "<<<\u30EA|\u30FD=\uFF98|\u30FD=\u308A|\u309D" + "<<< \u30EA|\u30FD = \uFF98|\u30FD = \u308A|\u309D" "&[before 3]\u30EB" //KATAKANA LETTER RU - "<<<\u30EB|\u30FD=\uFF99|\u30FD=\u308B|\u309D" + "<<< \u30EB|\u30FD = \uFF99|\u30FD = \u308B|\u309D" "&[before 3]\u30EC" //KATAKANA LETTER RE - "<<<\u30EC|\u30FD=\uFF9A|\u30FD=\u308C|\u309D" + "<<< \u30EC|\u30FD = \uFF9A|\u30FD = \u308C|\u309D" "&[before 3]\u30ED" //KATAKANA LETTER RO - "<<<\u30ED|\u30FD=\uFF9B|\u30FD=\u308D|\u309D" + "<<< \u30ED|\u30FD = \uFF9B|\u30FD = \u308D|\u309D" "&[before 3]\u30EF" //KATAKANA LETTER WA - "<<<\u30EF|\u30FD=\uFF9C|\u30FD=\u308F|\u309D" - "=\u30EE|\u30FD=\u308E|\u309D" - "=\u30F7|\u30FD" - "=\u30EF|\u30FE/\u3099=\uFF9C|\u30FE/\u3099=\u308F|\u309E/\u3099" - "=\u30F7|\u30FE/\u3099" - "=\u30EE|\u30FE/\u3099=\u308E|\u309E/\u3099" + "<<< \u30EF|\u30FD = \uFF9C|\u30FD = \u308F|\u309D" + "= \u30EE|\u30FD = \u308E|\u309D" + "= \u30F7|\u30FD" + "= \u30EF|\u30FE/\u3099 = \uFF9C|\u30FE/\u3099 = \u308F|\u309E/\u3099" + "= \u30F7|\u30FE/\u3099" + "= \u30EE|\u30FE/\u3099 = \u308E|\u309E/\u3099" "&[before 3]\u30F0" //KATAKANA LETTER WI - "<<<\u30F0|\u30FD=\u3090|\u309D" - "=\u30F8|\u30FD" - "=\u30F0|\u30FE/\u3099=\u3090|\u309E/\u3099" - "=\u30F8|\u30FE/\u3099" + "<<< \u30F0|\u30FD = \u3090|\u309D" + "= \u30F8|\u30FD" + "= \u30F0|\u30FE/\u3099 = \u3090|\u309E/\u3099" + "= \u30F8|\u30FE/\u3099" "&[before 3]\u30F1" //KATAKANA LETTER WE - "<<<\u30F1|\u30FD=\u3091|\u309D" - "=\u30F9|\u30FD" - "=\u30F1|\u30FE/\u3099=\u3091|\u309E/\u3099" - "=\u30F9|\u30FE/\u3099" + "<<< \u30F1|\u30FD = \u3091|\u309D" + "= \u30F9|\u30FD" + "= \u30F1|\u30FE/\u3099 = \u3091|\u309E/\u3099" + "= \u30F9|\u30FE/\u3099" "&[before 3]\u30F2" //KATAKANA LETTER WO - "<<<\u30F2|\u30FD=\uFF66|\u30FD=\u3092|\u309D" - "=\u30FA|\u30FD" - "=\u30F2|\u30FE/\u3099=\uFF66|\u30FE/\u3099=\u3092|\u309E/\u3099" - "=\u30FA|\u30FE/\u3099" + "<<< \u30F2|\u30FD = \uFF66|\u30FD = \u3092|\u309D" + "= \u30FA|\u30FD" + "= \u30F2|\u30FE/\u3099 = \uFF66|\u30FE/\u3099 = \u3092|\u309E/\u3099" + "= \u30FA|\u30FE/\u3099" "&[before 3]\u30F3" //KATAKANA LETTER N - "<<<\u30F3|\u30FD=\uFF9D|\u30FD=\u3093|\u309D" + "<<< \u30F3|\u30FD = \uFF9D|\u30FD = \u3093|\u309D" // Equaling Katakana, Hiragana and compatibility - "&\u30A1=\u30A1=\u3041=\uFF67" // KATAKANA LETTER SMALL A - "&\u30A2=\u30A2=\u3042=\uFF71" // KATAKANA LETTER A - "&\u30A3=\u30A3=\u3043=\uFF68" // KATAKANA LETTER SMALL I - "&\u30A4=\u30A4=\u3044=\uFF72" // KATAKANA LETTER I - "&\u30A5=\u30A5=\u3045=\uFF69" // KATAKANA LETTER SMALL U - "&\u30A6=\u30A6=\u3046=\uFF73" // KATAKANA LETTER U - "&\u30A7=\u30A7=\u3047=\uFF6A" // KATAKANA LETTER SMALL E - "&\u30A8=\u30A8=\u3048=\uFF74" // KATAKANA LETTER E - "&\u30A9=\u30A9=\u3049=\uFF6B" // KATAKANA LETTER SMALL O - "&\u30AA=\u30AA=\u304A=\uFF75" // KATAKANA LETTER O - "&\u30AB=\u30AB=\u304B=\uFF76" // KATAKANA LETTER KA - "&\u30AD=\u30AD=\u304D=\uFF77" // KATAKANA LETTER KI - "&\u30AF=\u30AF=\u304F=\uFF78" // KATAKANA LETTER KU - "&\u30B1=\u30B1=\u3051=\uFF79" // KATAKANA LETTER KE - "&\u30B3=\u30B3=\u3053=\uFF7A" // KATAKANA LETTER KO - "&\u30B5=\u30B5=\u3055=\uFF7B" // KATAKANA LETTER SA - "&\u30B7=\u30B7=\u3057=\uFF7C" // KATAKANA LETTER SI - "&\u30B9=\u30B9=\u3059=\uFF7D" // KATAKANA LETTER SU - "&\u30BB=\u30BB=\u305B=\uFF7E" // KATAKANA LETTER SE - "&\u30BD=\u30BD=\u305D=\uFF7F" // KATAKANA LETTER SO - "&\u30BF=\u30BF=\u305F=\uFF80" // KATAKANA LETTER TA - "&\u30C1=\u30C1=\u3061=\uFF81" // KATAKANA LETTER TI - "&\u30C3=\u30C3=\u3063=\uFF6F" // KATAKANA LETTER SMALL TU - "&\u30C4=\u30C4=\u3064=\uFF82" // KATAKANA LETTER TU - "&\u30C6=\u30C6=\u3066=\uFF83" // KATAKANA LETTER TE - "&\u30C8=\u30C8=\u3068=\uFF84" // KATAKANA LETTER TO - "&\u30CA=\u30CA=\u306A=\uFF85" // KATAKANA LETTER NA - "&\u30CB=\u30CB=\u306B=\uFF86" // KATAKANA LETTER NI - "&\u30CC=\u30CC=\u306C=\uFF87" // KATAKANA LETTER NU - "&\u30CD=\u30CD=\u306D=\uFF88" // KATAKANA LETTER NE - "&\u30CE=\u30CE=\u306E=\uFF89" // KATAKANA LETTER NO - "&\u30CF=\u30CF=\u306F=\uFF8A" // KATAKANA LETTER HA - "&\u30D2=\u30D2=\u3072=\uFF8B" // KATAKANA LETTER HI - "&\u30D5=\u30D5=\u3075=\uFF8C" // KATAKANA LETTER HU - "&\u30D8=\u30D8=\u3078=\uFF8D" // KATAKANA LETTER HE - "&\u30DB=\u30DB=\u307B=\uFF8E" // KATAKANA LETTER HO - "&\u30DE=\u30DE=\u307E=\uFF8F" // KATAKANA LETTER MA - "&\u30DF=\u30DF=\u307F=\uFF90" // KATAKANA LETTER MI - "&\u30E0=\u30E0=\u3080=\uFF91" // KATAKANA LETTER MU - "&\u30E1=\u30E1=\u3081=\uFF92" // KATAKANA LETTER ME - "&\u30E2=\u30E2=\u3082=\uFF93" // KATAKANA LETTER MO - "&\u30E3=\u30E3=\u3083=\uFF6C" // KATAKANA LETTER SMALL YA - "&\u30E4=\u30E4=\u3084=\uFF94" // KATAKANA LETTER YA - "&\u30E5=\u30E5=\u3085=\uFF6D" // KATAKANA LETTER SMALL YU - "&\u30E6=\u30E6=\u3086=\uFF95" // KATAKANA LETTER YU - "&\u30E7=\u30E7=\u3087=\uFF6E" // KATAKANA LETTER SMALL YO - "&\u30E8=\u30E8=\u3088=\uFF96" // KATAKANA LETTER YO - "&\u30E9=\u30E9=\u3089=\uFF97" // KATAKANA LETTER RA - "&\u30EA=\u30EA=\u308A=\uFF98" // KATAKANA LETTER RI - "&\u30EB=\u30EB=\u308B=\uFF99" // KATAKANA LETTER RU - "&\u30EC=\u30EC=\u308C=\uFF9A" // KATAKANA LETTER RE - "&\u30ED=\u30ED=\u308D=\uFF9B" // KATAKANA LETTER RO - "&\u30EE=\u30EE=\u308E" // KATAKANA LETTER SMALL WA - "&\u30EF=\u30EF=\u308F=\uFF9C" // KATAKANA LETTER WA - "&\u30F0=\u30F0=\u3090" // KATAKANA LETTER WI - "&\u30F1=\u30F1=\u3091" // KATAKANA LETTER WE - "&\u30F2=\u30F2=\u3092=\uFF66" // KATAKANA LETTER WO - "&\u30F3=\u30F3=\u3093=\uFF9D" // KATAKANA LETTER N - "&\u30F5=\u30F5" // KATAKANA LETTER SMALL KA - "&\u30F6=\u30F6" // KATAKANA LETTER SMALL KE - "&\u30FC=\u30FC" // KATAKANA - HIRAGANA LENGTH MARK - "&\u3099=\u3099" - "&\u309A=\u309A" + "&\u30A1 = \u30A1 = \u3041 = \uFF67" // KATAKANA LETTER SMALL A + "&\u30A2 = \u30A2 = \u3042 = \uFF71" // KATAKANA LETTER A + "&\u30A3 = \u30A3 = \u3043 = \uFF68" // KATAKANA LETTER SMALL I + "&\u30A4 = \u30A4 = \u3044 = \uFF72" // KATAKANA LETTER I + "&\u30A5 = \u30A5 = \u3045 = \uFF69" // KATAKANA LETTER SMALL U + "&\u30A6 = \u30A6 = \u3046 = \uFF73" // KATAKANA LETTER U + "&\u30A7 = \u30A7 = \u3047 = \uFF6A" // KATAKANA LETTER SMALL E + "&\u30A8 = \u30A8 = \u3048 = \uFF74" // KATAKANA LETTER E + "&\u30A9 = \u30A9 = \u3049 = \uFF6B" // KATAKANA LETTER SMALL O + "&\u30AA = \u30AA = \u304A = \uFF75" // KATAKANA LETTER O + "&\u30AB = \u30AB = \u304B = \uFF76" // KATAKANA LETTER KA + "&\u30AD = \u30AD = \u304D = \uFF77" // KATAKANA LETTER KI + "&\u30AF = \u30AF = \u304F = \uFF78" // KATAKANA LETTER KU + "&\u30B1 = \u30B1 = \u3051 = \uFF79" // KATAKANA LETTER KE + "&\u30B3 = \u30B3 = \u3053 = \uFF7A" // KATAKANA LETTER KO + "&\u30B5 = \u30B5 = \u3055 = \uFF7B" // KATAKANA LETTER SA + "&\u30B7 = \u30B7 = \u3057 = \uFF7C" // KATAKANA LETTER SI + "&\u30B9 = \u30B9 = \u3059 = \uFF7D" // KATAKANA LETTER SU + "&\u30BB = \u30BB = \u305B = \uFF7E" // KATAKANA LETTER SE + "&\u30BD = \u30BD = \u305D = \uFF7F" // KATAKANA LETTER SO + "&\u30BF = \u30BF = \u305F = \uFF80" // KATAKANA LETTER TA + "&\u30C1 = \u30C1 = \u3061 = \uFF81" // KATAKANA LETTER TI + "&\u30C3 = \u30C3 = \u3063 = \uFF6F" // KATAKANA LETTER SMALL TU + "&\u30C4 = \u30C4 = \u3064 = \uFF82" // KATAKANA LETTER TU + "&\u30C6 = \u30C6 = \u3066 = \uFF83" // KATAKANA LETTER TE + "&\u30C8 = \u30C8 = \u3068 = \uFF84" // KATAKANA LETTER TO + "&\u30CA = \u30CA = \u306A = \uFF85" // KATAKANA LETTER NA + "&\u30CB = \u30CB = \u306B = \uFF86" // KATAKANA LETTER NI + "&\u30CC = \u30CC = \u306C = \uFF87" // KATAKANA LETTER NU + "&\u30CD = \u30CD = \u306D = \uFF88" // KATAKANA LETTER NE + "&\u30CE = \u30CE = \u306E = \uFF89" // KATAKANA LETTER NO + "&\u30CF = \u30CF = \u306F = \uFF8A" // KATAKANA LETTER HA + "&\u30D2 = \u30D2 = \u3072 = \uFF8B" // KATAKANA LETTER HI + "&\u30D5 = \u30D5 = \u3075 = \uFF8C" // KATAKANA LETTER HU + "&\u30D8 = \u30D8 = \u3078 = \uFF8D" // KATAKANA LETTER HE + "&\u30DB = \u30DB = \u307B = \uFF8E" // KATAKANA LETTER HO + "&\u30DE = \u30DE = \u307E = \uFF8F" // KATAKANA LETTER MA + "&\u30DF = \u30DF = \u307F = \uFF90" // KATAKANA LETTER MI + "&\u30E0 = \u30E0 = \u3080 = \uFF91" // KATAKANA LETTER MU + "&\u30E1 = \u30E1 = \u3081 = \uFF92" // KATAKANA LETTER ME + "&\u30E2 = \u30E2 = \u3082 = \uFF93" // KATAKANA LETTER MO + "&\u30E3 = \u30E3 = \u3083 = \uFF6C" // KATAKANA LETTER SMALL YA + "&\u30E4 = \u30E4 = \u3084 = \uFF94" // KATAKANA LETTER YA + "&\u30E5 = \u30E5 = \u3085 = \uFF6D" // KATAKANA LETTER SMALL YU + "&\u30E6 = \u30E6 = \u3086 = \uFF95" // KATAKANA LETTER YU + "&\u30E7 = \u30E7 = \u3087 = \uFF6E" // KATAKANA LETTER SMALL YO + "&\u30E8 = \u30E8 = \u3088 = \uFF96" // KATAKANA LETTER YO + "&\u30E9 = \u30E9 = \u3089 = \uFF97" // KATAKANA LETTER RA + "&\u30EA = \u30EA = \u308A = \uFF98" // KATAKANA LETTER RI + "&\u30EB = \u30EB = \u308B = \uFF99" // KATAKANA LETTER RU + "&\u30EC = \u30EC = \u308C = \uFF9A" // KATAKANA LETTER RE + "&\u30ED = \u30ED = \u308D = \uFF9B" // KATAKANA LETTER RO + "&\u30EE = \u30EE = \u308E" // KATAKANA LETTER SMALL WA + "&\u30EF = \u30EF = \u308F = \uFF9C" // KATAKANA LETTER WA + "&\u30F0 = \u30F0 = \u3090" // KATAKANA LETTER WI + "&\u30F1 = \u30F1 = \u3091" // KATAKANA LETTER WE + "&\u30F2 = \u30F2 = \u3092 = \uFF66" // KATAKANA LETTER WO + "&\u30F3 = \u30F3 = \u3093 = \uFF9D" // KATAKANA LETTER N + "&\u30F5 = \u30F5" // KATAKANA LETTER SMALL KA + "&\u30F6 = \u30F6" // KATAKANA LETTER SMALL KE + "&\u30FC = \u30FC" // KATAKANA - HIRAGANA LENGTH MARK + "&\u3099 = \u3099" + "&\u309A = \u309A" // Equaling normal and halfwidth/fullwidth characters "&' '=\u3000" // IDEOGRAPHIC SPACE - "&'\u0020'='\uFFE3'" // SPACE - "&'\u0021'='\uFF01'" // EXCLAMATION MARK - "&'\u0022'='\uFF02'" // QUOTATION MARK - "&'\u0023'='\uFF03'" // NUMBER SIGN - "&'\u0024'='\uFF04'" // DOLLAR SIGN - "&'\u0025'='\uFF05'" // PERCENT SIGN - "&'\u0026'='\uFF06'" // AMPERSAND - "&''='\uFF07'" // APOSTROPHE - "&'\u0028'='\uFF08'" // LEFT PARENTHESIS - "&'\u0029'='\uFF09'" // RIGHT PARENTHESIS - "&'\u002A'='\uFF0A'" // ASTERISK - "&'\u002B'='\uFF0B'" // PLUS SIGN - "&'\u002C'='\uFF0C'" // COMMA - "&'\u002D'='\uFF0D'" // HYPHEN-MINUS - "&'\u002E'='\uFF0E'" // FULL STOP - "&'\u002F'='\uFF0F'" // SOLIDUS - "&'\u0030'='\uFF10'" // DIGIT ZERO - "&'\u0031'='\uFF11'" // DIGIT ONE - "&'\u0032'='\uFF12'" // DIGIT TWO - "&'\u0033'='\uFF13'" // DIGIT THREE - "&'\u0034'='\uFF14'" // DIGIT FOUR - "&'\u0035'='\uFF15'" // DIGIT FIVE - "&'\u0036'='\uFF16'" // DIGIT SIX - "&'\u0037'='\uFF17'" // DIGIT SEVEN - "&'\u0038'='\uFF18'" // DIGIT EIGHT - "&'\u0039'='\uFF19'" // DIGIT NINE - "&'\u003A'='\uFF1A'" // COLON - "&'\u003B'='\uFF1B'" // SEMICOLON - "&'\u003C'='\uFF1C'" // LESS-THAN SIGN - "&'\u003D'='\uFF1D'" // EQUALS SIGN - "&'\u003E'='\uFF1E'" // GREATER-THAN SIGN - "&'\u003F'='\uFF1F'" // QUESTION MARK - "&'\u0040'='\uFF20'" // COMMERCIAL AT - "&'\u0041'='\uFF21'" // LATIN CAPITAL LETTER A - "&'\u0042'='\uFF22'" // LATIN CAPITAL LETTER B - "&'\u0043'='\uFF23'" // LATIN CAPITAL LETTER C - "&'\u0044'='\uFF24'" // LATIN CAPITAL LETTER D - "&'\u0045'='\uFF25'" // LATIN CAPITAL LETTER E - "&'\u0046'='\uFF26'" // LATIN CAPITAL LETTER F - "&'\u0047'='\uFF27'" // LATIN CAPITAL LETTER G - "&'\u0048'='\uFF28'" // LATIN CAPITAL LETTER H - "&'\u0049'='\uFF29'" // LATIN CAPITAL LETTER I - "&'\u004A'='\uFF2A'" // LATIN CAPITAL LETTER J - "&'\u004B'='\uFF2B'" // LATIN CAPITAL LETTER K - "&'\u004C'='\uFF2C'" // LATIN CAPITAL LETTER L - "&'\u004D'='\uFF2D'" // LATIN CAPITAL LETTER M - "&'\u004E'='\uFF2E'" // LATIN CAPITAL LETTER N - "&'\u004F'='\uFF2F'" // LATIN CAPITAL LETTER O - "&'\u0050'='\uFF30'" // LATIN CAPITAL LETTER P - "&'\u0051'='\uFF31'" // LATIN CAPITAL LETTER Q - "&'\u0052'='\uFF32'" // LATIN CAPITAL LETTER R - "&'\u0053'='\uFF33'" // LATIN CAPITAL LETTER S - "&'\u0054'='\uFF34'" // LATIN CAPITAL LETTER T - "&'\u0055'='\uFF35'" // LATIN CAPITAL LETTER U - "&'\u0056'='\uFF36'" // LATIN CAPITAL LETTER V - "&'\u0057'='\uFF37'" // LATIN CAPITAL LETTER W - "&'\u0058'='\uFF38'" // LATIN CAPITAL LETTER X - "&'\u0059'='\uFF39'" // LATIN CAPITAL LETTER Y - "&'\u005A'='\uFF3A'" // LATIN CAPITAL LETTER Z - "&'\u005B'='\uFF3B'" // LEFT SQUARE BRACKET - "&'\u005C'='\uFF3C'" // REVERSE SOLIDUS - "&'\u005D'='\uFF3D'" // RIGHT SQUARE BRACKET - "&'\u005E'='\uFF3E'" // CIRCUMFLEX ACCENT - "&'\u005F'='\uFF3F'" // LOW LINE - "&'\u0060'='\uFF40'" // GRAVE ACCENT - "&'\u0061'='\uFF41'" // LATIN SMALL LETTER A - "&'\u0062'='\uFF42'" // LATIN SMALL LETTER B - "&'\u0063'='\uFF43'" // LATIN SMALL LETTER C - "&'\u0064'='\uFF44'" // LATIN SMALL LETTER D - "&'\u0065'='\uFF45'" // LATIN SMALL LETTER E - "&'\u0066'='\uFF46'" // LATIN SMALL LETTER F - "&'\u0067'='\uFF47'" // LATIN SMALL LETTER G - "&'\u0068'='\uFF48'" // LATIN SMALL LETTER H - "&'\u0069'='\uFF49'" // LATIN SMALL LETTER I - "&'\u006A'='\uFF4A'" // LATIN SMALL LETTER J - "&'\u006B'='\uFF4B'" // LATIN SMALL LETTER K - "&'\u006C'='\uFF4C'" // LATIN SMALL LETTER L - "&'\u006D'='\uFF4D'" // LATIN SMALL LETTER M - "&'\u006E'='\uFF4E'" // LATIN SMALL LETTER N - "&'\u006F'='\uFF4F'" // LATIN SMALL LETTER O - "&'\u0070'='\uFF50'" // LATIN SMALL LETTER P - "&'\u0071'='\uFF51'" // LATIN SMALL LETTER Q - "&'\u0072'='\uFF52'" // LATIN SMALL LETTER R - "&'\u0073'='\uFF53'" // LATIN SMALL LETTER S - "&'\u0074'='\uFF54'" // LATIN SMALL LETTER T - "&'\u0075'='\uFF55'" // LATIN SMALL LETTER U - "&'\u0076'='\uFF56'" // LATIN SMALL LETTER V - "&'\u0077'='\uFF57'" // LATIN SMALL LETTER W - "&'\u0078'='\uFF58'" // LATIN SMALL LETTER X - "&'\u0079'='\uFF59'" // LATIN SMALL LETTER Y - "&'\u007A'='\uFF5A'" // LATIN SMALL LETTER Z - "&'\u007B'='\uFF5B'" // LEFT CURLY BRACKET - "&'\u007C'='\uFF5C'" // VERTICAL LINE - "&'\u007D'='\uFF5D'" // RIGHT CURLY BRACKET - "&'\u007E'='\uFF5E'" // TILDE - "&'\u00A2'='\uFFE0'" // CENT SIGN - "&'\u00A3'='\uFFE1'" // POUND SIGN - "&'\u00A5'='\uFFE5'" // YEN SIGN - "&'\u00A6'='\uFFE4'" // BROKEN BAR - "&'\u00AC'='\uFFE2'" // NOT SIGN - "&'\u1100'='\uFFA1'" // HANGUL CHOSEONG KIYEOK - "&'\u1101'='\uFFA2'" // HANGUL CHOSEONG SSANGKIYEOK - "&'\u1102'='\uFFA4'" // HANGUL CHOSEONG NIEUN - "&'\u1103'='\uFFA7'" // HANGUL CHOSEONG TIKEUT - "&'\u1104'='\uFFA8'" // HANGUL CHOSEONG SSANGTIKEUT - "&'\u1105'='\uFFA9'" // HANGUL CHOSEONG RIEUL - "&'\u1106'='\uFFB1'" // HANGUL CHOSEONG MIEUM - "&'\u1107'='\uFFB2'" // HANGUL CHOSEONG PIEUP - "&'\u1108'='\uFFB3'" // HANGUL CHOSEONG SSANGPIEUP - "&'\u1109'='\uFFB5'" // HANGUL CHOSEONG SIOS - "&'\u110A'='\uFFB6'" // HANGUL CHOSEONG SSANGSIOS - "&'\u110B'='\uFFB7'" // HANGUL CHOSEONG IEUNG - "&'\u110C'='\uFFB8'" // HANGUL CHOSEONG CIEUC - "&'\u110D'='\uFFB9'" // HANGUL CHOSEONG SSANGCIEUC - "&'\u110E'='\uFFBA'" // HANGUL CHOSEONG CHIEUCH - "&'\u110F'='\uFFBB'" // HANGUL CHOSEONG KHIEUKH - "&'\u1110'='\uFFBC'" // HANGUL CHOSEONG THIEUTH - "&'\u1111'='\uFFBD'" // HANGUL CHOSEONG PHIEUPH - "&'\u1112'='\uFFBE'" // HANGUL CHOSEONG HIEUH - "&'\u111A'='\uFFB0'" // HANGUL CHOSEONG RIEUL-HIEUH - "&'\u1121'='\uFFB4'" // HANGUL CHOSEONG PIEUP-SIOS - "&'\u1160'='\uFFA0'" // HANGUL JUNGSEONG FILLER - "&'\u1161'='\uFFC2'" // HANGUL JUNGSEONG A - "&'\u1162'='\uFFC3'" // HANGUL JUNGSEONG AE - "&'\u1163'='\uFFC4'" // HANGUL JUNGSEONG YA - "&'\u1164'='\uFFC5'" // HANGUL JUNGSEONG YAE - "&'\u1165'='\uFFC6'" // HANGUL JUNGSEONG EO - "&'\u1166'='\uFFC7'" // HANGUL JUNGSEONG E - "&'\u1167'='\uFFCA'" // HANGUL JUNGSEONG YEO - "&'\u1168'='\uFFCB'" // HANGUL JUNGSEONG YE - "&'\u1169'='\uFFCC'" // HANGUL JUNGSEONG O - "&'\u116A'='\uFFCD'" // HANGUL JUNGSEONG WA - "&'\u116B'='\uFFCE'" // HANGUL JUNGSEONG WAE - "&'\u116C'='\uFFCF'" // HANGUL JUNGSEONG OE - "&'\u116D'='\uFFD2'" // HANGUL JUNGSEONG YO - "&'\u116E'='\uFFD3'" // HANGUL JUNGSEONG U - "&'\u116F'='\uFFD4'" // HANGUL JUNGSEONG WEO - "&'\u1170'='\uFFD5'" // HANGUL JUNGSEONG WE - "&'\u1171'='\uFFD6'" // HANGUL JUNGSEONG WI - "&'\u1172'='\uFFD7'" // HANGUL JUNGSEONG YU - "&'\u1173'='\uFFDA'" // HANGUL JUNGSEONG EU - "&'\u1174'='\uFFDB'" // HANGUL JUNGSEONG YI - "&'\u1175'='\uFFDC'" // HANGUL JUNGSEONG I - "&'\u11AA'='\uFFA3'" // HANGUL JONGSEONG KIYEOK-SIOS - "&'\u11AC'='\uFFA5'" // HANGUL JONGSEONG NIEUN-CIEUC - "&'\u11AD'='\uFFA6'" // HANGUL JONGSEONG NIEUN-HIEUH - "&'\u11B0'='\uFFAA'" // HANGUL JONGSEONG RIEUL-KIYEOK - "&'\u11B1'='\uFFAB'" // HANGUL JONGSEONG RIEUL-MIEUM - "&'\u11B2'='\uFFAC'" // HANGUL JONGSEONG RIEUL-PIEUP - "&'\u11B3'='\uFFAD'" // HANGUL JONGSEONG RIEUL-SIOS - "&'\u11B4'='\uFFAE'" // HANGUL JONGSEONG RIEUL-THIEUTH - "&'\u11B5'='\uFFAF'" // HANGUL JONGSEONG RIEUL-PHIEUPH - "&'\u20A9'='\uFFE6'" // WON SIGN - "&'\u2190'='\uFFE9'" // LEFTWARDS ARROW - "&'\u2191'='\uFFEA'" // UPWARDS ARROW - "&'\u2192'='\uFFEB'" // RIGHTWARDS ARROW - "&'\u2193'='\uFFEC'" // DOWNWARDS ARROW - "&'\u2502'='\uFFE8'" // BOX DRAWINGS LIGHT VERTICAL - "&'\u25A0'='\uFFED'" // BLACK SQUARE - "&'\u25CB'='\uFFEE'" // WHITE CIRCLE - "&'\u3001'='\uFF64'" // IDEOGRAPHIC COMMA - "&'\u3002'='\uFF61'" // IDEOGRAPHIC FULL STOP - "&'\u300C'='\uFF62'" // LEFT CORNER BRACKET - "&'\u300D'='\uFF63'" // RIGHT CORNER BRACKET + "&'\u0020' = '\uFFE3'" // SPACE + "&'\u0021' = '\uFF01'" // EXCLAMATION MARK + "&'\u0022' = '\uFF02'" // QUOTATION MARK + "&'\u0023' = '\uFF03'" // NUMBER SIGN + "&'\u0024' = '\uFF04'" // DOLLAR SIGN + "&'\u0025' = '\uFF05'" // PERCENT SIGN + "&'\u0026' = '\uFF06'" // AMPERSAND + "&'' = '\uFF07'" // APOSTROPHE + "&'\u0028' = '\uFF08'" // LEFT PARENTHESIS + "&'\u0029' = '\uFF09'" // RIGHT PARENTHESIS + "&'\u002A' = '\uFF0A'" // ASTERISK + "&'\u002B' = '\uFF0B'" // PLUS SIGN + "&'\u002C' = '\uFF0C'" // COMMA + "&'\u002D' = '\uFF0D'" // HYPHEN-MINUS + "&'\u002E' = '\uFF0E'" // FULL STOP + "&'\u002F' = '\uFF0F'" // SOLIDUS + "&'\u0030' = '\uFF10'" // DIGIT ZERO + "&'\u0031' = '\uFF11'" // DIGIT ONE + "&'\u0032' = '\uFF12'" // DIGIT TWO + "&'\u0033' = '\uFF13'" // DIGIT THREE + "&'\u0034' = '\uFF14'" // DIGIT FOUR + "&'\u0035' = '\uFF15'" // DIGIT FIVE + "&'\u0036' = '\uFF16'" // DIGIT SIX + "&'\u0037' = '\uFF17'" // DIGIT SEVEN + "&'\u0038' = '\uFF18'" // DIGIT EIGHT + "&'\u0039' = '\uFF19'" // DIGIT NINE + "&'\u003A' = '\uFF1A'" // COLON + "&'\u003B' = '\uFF1B'" // SEMICOLON + "&'\u003C' = '\uFF1C'" // LESS-THAN SIGN + "&'\u003D' = '\uFF1D'" // EQUALS SIGN + "&'\u003E' = '\uFF1E'" // GREATER-THAN SIGN + "&'\u003F' = '\uFF1F'" // QUESTION MARK + "&'\u0040' = '\uFF20'" // COMMERCIAL AT + "&'\u0041' = '\uFF21'" // LATIN CAPITAL LETTER A + "&'\u0042' = '\uFF22'" // LATIN CAPITAL LETTER B + "&'\u0043' = '\uFF23'" // LATIN CAPITAL LETTER C + "&'\u0044' = '\uFF24'" // LATIN CAPITAL LETTER D + "&'\u0045' = '\uFF25'" // LATIN CAPITAL LETTER E + "&'\u0046' = '\uFF26'" // LATIN CAPITAL LETTER F + "&'\u0047' = '\uFF27'" // LATIN CAPITAL LETTER G + "&'\u0048' = '\uFF28'" // LATIN CAPITAL LETTER H + "&'\u0049' = '\uFF29'" // LATIN CAPITAL LETTER I + "&'\u004A' = '\uFF2A'" // LATIN CAPITAL LETTER J + "&'\u004B' = '\uFF2B'" // LATIN CAPITAL LETTER K + "&'\u004C' = '\uFF2C'" // LATIN CAPITAL LETTER L + "&'\u004D' = '\uFF2D'" // LATIN CAPITAL LETTER M + "&'\u004E' = '\uFF2E'" // LATIN CAPITAL LETTER N + "&'\u004F' = '\uFF2F'" // LATIN CAPITAL LETTER O + "&'\u0050' = '\uFF30'" // LATIN CAPITAL LETTER P + "&'\u0051' = '\uFF31'" // LATIN CAPITAL LETTER Q + "&'\u0052' = '\uFF32'" // LATIN CAPITAL LETTER R + "&'\u0053' = '\uFF33'" // LATIN CAPITAL LETTER S + "&'\u0054' = '\uFF34'" // LATIN CAPITAL LETTER T + "&'\u0055' = '\uFF35'" // LATIN CAPITAL LETTER U + "&'\u0056' = '\uFF36'" // LATIN CAPITAL LETTER V + "&'\u0057' = '\uFF37'" // LATIN CAPITAL LETTER W + "&'\u0058' = '\uFF38'" // LATIN CAPITAL LETTER X + "&'\u0059' = '\uFF39'" // LATIN CAPITAL LETTER Y + "&'\u005A' = '\uFF3A'" // LATIN CAPITAL LETTER Z + "&'\u005B' = '\uFF3B'" // LEFT SQUARE BRACKET + "&'\u005C' = '\uFF3C'" // REVERSE SOLIDUS + "&'\u005D' = '\uFF3D'" // RIGHT SQUARE BRACKET + "&'\u005E' = '\uFF3E'" // CIRCUMFLEX ACCENT + "&'\u005F' = '\uFF3F'" // LOW LINE + "&'\u0060' = '\uFF40'" // GRAVE ACCENT + "&'\u0061' = '\uFF41'" // LATIN SMALL LETTER A + "&'\u0062' = '\uFF42'" // LATIN SMALL LETTER B + "&'\u0063' = '\uFF43'" // LATIN SMALL LETTER C + "&'\u0064' = '\uFF44'" // LATIN SMALL LETTER D + "&'\u0065' = '\uFF45'" // LATIN SMALL LETTER E + "&'\u0066' = '\uFF46'" // LATIN SMALL LETTER F + "&'\u0067' = '\uFF47'" // LATIN SMALL LETTER G + "&'\u0068' = '\uFF48'" // LATIN SMALL LETTER H + "&'\u0069' = '\uFF49'" // LATIN SMALL LETTER I + "&'\u006A' = '\uFF4A'" // LATIN SMALL LETTER J + "&'\u006B' = '\uFF4B'" // LATIN SMALL LETTER K + "&'\u006C' = '\uFF4C'" // LATIN SMALL LETTER L + "&'\u006D' = '\uFF4D'" // LATIN SMALL LETTER M + "&'\u006E' = '\uFF4E'" // LATIN SMALL LETTER N + "&'\u006F' = '\uFF4F'" // LATIN SMALL LETTER O + "&'\u0070' = '\uFF50'" // LATIN SMALL LETTER P + "&'\u0071' = '\uFF51'" // LATIN SMALL LETTER Q + "&'\u0072' = '\uFF52'" // LATIN SMALL LETTER R + "&'\u0073' = '\uFF53'" // LATIN SMALL LETTER S + "&'\u0074' = '\uFF54'" // LATIN SMALL LETTER T + "&'\u0075' = '\uFF55'" // LATIN SMALL LETTER U + "&'\u0076' = '\uFF56'" // LATIN SMALL LETTER V + "&'\u0077' = '\uFF57'" // LATIN SMALL LETTER W + "&'\u0078' = '\uFF58'" // LATIN SMALL LETTER X + "&'\u0079' = '\uFF59'" // LATIN SMALL LETTER Y + "&'\u007A' = '\uFF5A'" // LATIN SMALL LETTER Z + "&'\u007B' = '\uFF5B'" // LEFT CURLY BRACKET + "&'\u007C' = '\uFF5C'" // VERTICAL LINE + "&'\u007D' = '\uFF5D'" // RIGHT CURLY BRACKET + "&'\u007E' = '\uFF5E'" // TILDE + "&'\u00A2' = '\uFFE0'" // CENT SIGN + "&'\u00A3' = '\uFFE1'" // POUND SIGN + "&'\u00A5' = '\uFFE5'" // YEN SIGN + "&'\u00A6' = '\uFFE4'" // BROKEN BAR + "&'\u00AC' = '\uFFE2'" // NOT SIGN + "&'\u1100' = '\uFFA1'" // HANGUL CHOSEONG KIYEOK + "&'\u1101' = '\uFFA2'" // HANGUL CHOSEONG SSANGKIYEOK + "&'\u1102' = '\uFFA4'" // HANGUL CHOSEONG NIEUN + "&'\u1103' = '\uFFA7'" // HANGUL CHOSEONG TIKEUT + "&'\u1104' = '\uFFA8'" // HANGUL CHOSEONG SSANGTIKEUT + "&'\u1105' = '\uFFA9'" // HANGUL CHOSEONG RIEUL + "&'\u1106' = '\uFFB1'" // HANGUL CHOSEONG MIEUM + "&'\u1107' = '\uFFB2'" // HANGUL CHOSEONG PIEUP + "&'\u1108' = '\uFFB3'" // HANGUL CHOSEONG SSANGPIEUP + "&'\u1109' = '\uFFB5'" // HANGUL CHOSEONG SIOS + "&'\u110A' = '\uFFB6'" // HANGUL CHOSEONG SSANGSIOS + "&'\u110B' = '\uFFB7'" // HANGUL CHOSEONG IEUNG + "&'\u110C' = '\uFFB8'" // HANGUL CHOSEONG CIEUC + "&'\u110D' = '\uFFB9'" // HANGUL CHOSEONG SSANGCIEUC + "&'\u110E' = '\uFFBA'" // HANGUL CHOSEONG CHIEUCH + "&'\u110F' = '\uFFBB'" // HANGUL CHOSEONG KHIEUKH + "&'\u1110' = '\uFFBC'" // HANGUL CHOSEONG THIEUTH + "&'\u1111' = '\uFFBD'" // HANGUL CHOSEONG PHIEUPH + "&'\u1112' = '\uFFBE'" // HANGUL CHOSEONG HIEUH + "&'\u111A' = '\uFFB0'" // HANGUL CHOSEONG RIEUL-HIEUH + "&'\u1121' = '\uFFB4'" // HANGUL CHOSEONG PIEUP-SIOS + "&'\u1160' = '\uFFA0'" // HANGUL JUNGSEONG FILLER + "&'\u1161' = '\uFFC2'" // HANGUL JUNGSEONG A + "&'\u1162' = '\uFFC3'" // HANGUL JUNGSEONG AE + "&'\u1163' = '\uFFC4'" // HANGUL JUNGSEONG YA + "&'\u1164' = '\uFFC5'" // HANGUL JUNGSEONG YAE + "&'\u1165' = '\uFFC6'" // HANGUL JUNGSEONG EO + "&'\u1166' = '\uFFC7'" // HANGUL JUNGSEONG E + "&'\u1167' = '\uFFCA'" // HANGUL JUNGSEONG YEO + "&'\u1168' = '\uFFCB'" // HANGUL JUNGSEONG YE + "&'\u1169' = '\uFFCC'" // HANGUL JUNGSEONG O + "&'\u116A' = '\uFFCD'" // HANGUL JUNGSEONG WA + "&'\u116B' = '\uFFCE'" // HANGUL JUNGSEONG WAE + "&'\u116C' = '\uFFCF'" // HANGUL JUNGSEONG OE + "&'\u116D' = '\uFFD2'" // HANGUL JUNGSEONG YO + "&'\u116E' = '\uFFD3'" // HANGUL JUNGSEONG U + "&'\u116F' = '\uFFD4'" // HANGUL JUNGSEONG WEO + "&'\u1170' = '\uFFD5'" // HANGUL JUNGSEONG WE + "&'\u1171' = '\uFFD6'" // HANGUL JUNGSEONG WI + "&'\u1172' = '\uFFD7'" // HANGUL JUNGSEONG YU + "&'\u1173' = '\uFFDA'" // HANGUL JUNGSEONG EU + "&'\u1174' = '\uFFDB'" // HANGUL JUNGSEONG YI + "&'\u1175' = '\uFFDC'" // HANGUL JUNGSEONG I + "&'\u11AA' = '\uFFA3'" // HANGUL JONGSEONG KIYEOK-SIOS + "&'\u11AC' = '\uFFA5'" // HANGUL JONGSEONG NIEUN-CIEUC + "&'\u11AD' = '\uFFA6'" // HANGUL JONGSEONG NIEUN-HIEUH + "&'\u11B0' = '\uFFAA'" // HANGUL JONGSEONG RIEUL-KIYEOK + "&'\u11B1' = '\uFFAB'" // HANGUL JONGSEONG RIEUL-MIEUM + "&'\u11B2' = '\uFFAC'" // HANGUL JONGSEONG RIEUL-PIEUP + "&'\u11B3' = '\uFFAD'" // HANGUL JONGSEONG RIEUL-SIOS + "&'\u11B4' = '\uFFAE'" // HANGUL JONGSEONG RIEUL-THIEUTH + "&'\u11B5' = '\uFFAF'" // HANGUL JONGSEONG RIEUL-PHIEUPH + "&'\u20A9' = '\uFFE6'" // WON SIGN + "&'\u2190' = '\uFFE9'" // LEFTWARDS ARROW + "&'\u2191' = '\uFFEA'" // UPWARDS ARROW + "&'\u2192' = '\uFFEB'" // RIGHTWARDS ARROW + "&'\u2193' = '\uFFEC'" // DOWNWARDS ARROW + "&'\u2502' = '\uFFE8'" // BOX DRAWINGS LIGHT VERTICAL + "&'\u25A0' = '\uFFED'" // BLACK SQUARE + "&'\u25CB' = '\uFFEE'" // WHITE CIRCLE + "&'\u3001' = '\uFF64'" // IDEOGRAPHIC COMMA + "&'\u3002' = '\uFF61'" // IDEOGRAPHIC FULL STOP + "&'\u300C' = '\uFF62'" // LEFT CORNER BRACKET + "&'\u300D' = '\uFF63'" // RIGHT CORNER BRACKET // Kanji, positioned over the top "& [top] " @@ -1742,6 +1742,17 @@ ja { } } LocaleScript{ "Kana","Hira", "Hani" } + + ExemplarCharacters{ + "[\u3041-\u307C \u308F-\u3092 " "\u30A1-\u30DC \u30F7-\u30FA \u30FC " + "\u4E14-\u4E19 \u4ED4-\u4ED9 \u5021-\u5026 " + "\u5BC2-\u5BC7 \u6291-\u6298 \u62C5-\u62CA " + "\u723A-\u7240 \u7A3B-\u7A40 \u8105-\u810A " + "\u8301-\u8306 \u91DA-\u91DF \u9ECC-\u9ED2 " + "\uCD3B \uCDCD \uFF61 \uFF66 \uFF73 " + "\uFF76-\uFF84 \uFF8A-\uFF8E \uFF9C]" + } + //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ @@ -1764,24 +1775,24 @@ ja { SpelloutRules { "%financial:\n" - " \u96f6; \u58f1; \u5f10; \u53c2; \u56db; \u4f0d; \u516d; \u4e03; \u516b; \u4e5d;\n" - " \u62fe[>>];\n" - " 20: <<\u62fe[>>];\n" - " 100: <<\u767e[>>];\n" - " 1000: <<\u5343[>>];\n" - " 10,000: <<\u4e07[>>];\n" - " 100,000,000: <<\u5104[>>];\n" - " 1,000,000,000,000: <<\u5146[>>];\n" - " 10,000,000,000,000,000: =#,##0=;\n" + " \u96f6; \u58f1; \u5f10; \u53c2; \u56db; \u4f0d; \u516d; \u4e03; \u516b; \u4e5d;\n" + " \u62fe[>>];\n" + " 20: <<\u62fe[>>];\n" + " 100: <<\u767e[>>];\n" + " 1000: <<\u5343[>>];\n" + " 10,000: <<\u4e07[>>];\n" + " 100,000,000: <<\u5104[>>];\n" + " 1,000,000,000,000: <<\u5146[>>];\n" + " 10,000,000,000,000,000: =#,##0=;\n" "%traditional:\n" - " \u96f6; \u4e00; \u4e8c; \u4e09; \u56db; \u4e94; \u516d; \u4e03; \u516b; \u4e5d;\n" - " \u5341[>>];\n" - " 20: <<\u5341[>>];\n" - " 100: <<\u767e[>>];\n" - " 1000: <<\u5343[>>];\n" - " 10,000: <<\u4e07[>>];\n" - " 100,000,000: <<\u5104[>>];\n" - " 1,000,000,000,000: <<\u5146[>>];\n" - " 10,000,000,000,000,000: =#,##0=;" + " \u96f6; \u4e00; \u4e8c; \u4e09; \u56db; \u4e94; \u516d; \u4e03; \u516b; \u4e5d;\n" + " \u5341[>>];\n" + " 20: <<\u5341[>>];\n" + " 100: <<\u767e[>>];\n" + " 1000: <<\u5343[>>];\n" + " 10,000: <<\u4e07[>>];\n" + " 100,000,000: <<\u5104[>>];\n" + " 1,000,000,000,000: <<\u5146[>>];\n" + " 10,000,000,000,000,000: =#,##0=;" } } diff --git a/icu4c/source/data/locales/ka.txt b/icu4c/source/data/locales/ka.txt index 498138fef7..378c1352f0 100644 --- a/icu4c/source/data/locales/ka.txt +++ b/icu4c/source/data/locales/ka.txt @@ -75,6 +75,7 @@ ka{ "\ufffd", } LocaleScript:array { "Geor" } + ExemplarCharacters { "[:Geor:]" } CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/kk.txt b/icu4c/source/data/locales/kk.txt index 263fa8a49c..2df19d01cb 100644 --- a/icu4c/source/data/locales/kk.txt +++ b/icu4c/source/data/locales/kk.txt @@ -79,8 +79,8 @@ kk{ "\u221E", "\uFFFD", } - LocaleScript:array{ "Cyrl" } - + LocaleScript{ "Cyrl" } + ExemplarCharacters { "[\u0430-\u0448 \u044b \u044d \u0451]" } CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/kl.txt b/icu4c/source/data/locales/kl.txt index 3a80e19119..74f57bebc3 100644 --- a/icu4c/source/data/locales/kl.txt +++ b/icu4c/source/data/locales/kl.txt @@ -67,6 +67,8 @@ kl{ "\u221e", "\ufffd", } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00fa \u00e2 \u00ea \u00ee \u00f4 \u00fb \u00e6 \u00e5 \u00f8 \u00e3 \u0129 \u0169 \u0138]" } + // LocaleScript{ // "Latn", // ISO 15924 Name // } diff --git a/icu4c/source/data/locales/kn.txt b/icu4c/source/data/locales/kn.txt index 6e96fd76be..fd43d79566 100644 --- a/icu4c/source/data/locales/kn.txt +++ b/icu4c/source/data/locales/kn.txt @@ -89,6 +89,7 @@ kn { // "\ufffd", // } LocaleScript:array { "Knda" } + ExemplarCharacters { "[:Knda:]" } CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/ko.txt b/icu4c/source/data/locales/ko.txt index 295f18bd93..d02409196f 100644 --- a/icu4c/source/data/locales/ko.txt +++ b/icu4c/source/data/locales/ko.txt @@ -2243,4 +2243,15 @@ ko { } } LocaleScript{ "Hang", "Hani" } + ExemplarCharacters{ + "[\u3041-\u3093 \u30A1-\u30F6 \u3131-\u318E " + "\uC5C4-\uC5CA \uC5FC-\uC601 \uC751-\uC758 " + "\u4ED4-\u4ED9 \u4F59-\u4F5E \u5143-\u5149 \u5167-\u516E " + "\u5236-\u523B \u540C-\u5411 \u5B95-\u5B9C \u5BC2-\u5BC7 \u5BE4-\u5BE9 " + "\u6664-\u6669 \u67CF-\u67D4 \u6B61-\u6B66 \u701A-\u701F \u795A-\u7960 " + "\u8105-\u810A \u8CA7-\u8CAC \u8CBF-\u8CC4 \u8FAD-\u8FB2 \u901D-\u9023 " + "\u907F-\u9084 \u9149-\u914E \u91CB-\u91D1 \uAC10-\uAC17 \uBCCF-\uBCD5]" + + + } } diff --git a/icu4c/source/data/locales/kok.txt b/icu4c/source/data/locales/kok.txt index 96621539c1..67dbfe3631 100644 --- a/icu4c/source/data/locales/kok.txt +++ b/icu4c/source/data/locales/kok.txt @@ -238,6 +238,7 @@ kok { LocaleScript:array { "Deva" // ISO 15924 Name } + ExemplarCharacters{ "[:Deva:]" } // CollationElements { // "" // } diff --git a/icu4c/source/data/locales/ky.txt b/icu4c/source/data/locales/ky.txt index ccb76b79fc..9e2d044795 100644 --- a/icu4c/source/data/locales/ky.txt +++ b/icu4c/source/data/locales/ky.txt @@ -74,7 +74,8 @@ ky{ "\u221e", "\ufffd", } - LocaleScript:array{ "Goer" } + LocaleScript:array{ "Cyrl" } + ExemplarCharacters { "[\u0430-\u0448 \u0456 \u0454 \u0457 \u0491]" } CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/lt.txt b/icu4c/source/data/locales/lt.txt index b0e8228767..6c7db41f53 100644 --- a/icu4c/source/data/locales/lt.txt +++ b/icu4c/source/data/locales/lt.txt @@ -109,4 +109,5 @@ lt { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u0105 \u0119 \u012f \u0173 \u0117 \u016b \u010d \u0161 \u017e]" } } diff --git a/icu4c/source/data/locales/lv.txt b/icu4c/source/data/locales/lv.txt index 4e9e148db3..c01ab333bb 100644 --- a/icu4c/source/data/locales/lv.txt +++ b/icu4c/source/data/locales/lv.txt @@ -106,6 +106,7 @@ lv { "GMT", } } + ExemplarCharacters { "[a-z \u0101 \u0113 \u012b \u014d \u016b \u0123 \u0137 \u013c \u0146 \u0157 \u010d \u0161 \u017e]" } // LocaleScript{ // "Latn", // ISO 15924 Name // } diff --git a/icu4c/source/data/locales/mk.txt b/icu4c/source/data/locales/mk.txt index 7db3b50ee1..358b8782ce 100644 --- a/icu4c/source/data/locales/mk.txt +++ b/icu4c/source/data/locales/mk.txt @@ -139,4 +139,5 @@ mk { LocaleScript{ "Cyrl", // ISO 15924 Name } + ExemplarCharacters { "[\u0430-\u0438 \u043a-\u0448 \u0450 \u0453 \u0455 \u0458 \u0459 \u045a \u045c \u045d \u045f]" } } diff --git a/icu4c/source/data/locales/mn.txt b/icu4c/source/data/locales/mn.txt index a905525409..8a28a70b0a 100644 --- a/icu4c/source/data/locales/mn.txt +++ b/icu4c/source/data/locales/mn.txt @@ -74,6 +74,8 @@ mn{ "\u221e", "\ufffd", } + + ExemplarCharacters { "[\u0430-\u0448 \u0456 \u0454 \u0457 \u0491]" } LocaleScript:array{ "Cyrl" } CollationElements { Version { "1.0" } diff --git a/icu4c/source/data/locales/mr.txt b/icu4c/source/data/locales/mr.txt index 0873479182..cbb4a2d345 100644 --- a/icu4c/source/data/locales/mr.txt +++ b/icu4c/source/data/locales/mr.txt @@ -246,6 +246,7 @@ mr { LocaleScript:array { "Deva" // ISO 15924 Name } + ExemplarCharacters{"[[:Deva:]-[\u0958-\u095f]]"} } diff --git a/icu4c/source/data/locales/mt.txt b/icu4c/source/data/locales/mt.txt index 363cc4bb12..9d13fb039f 100644 --- a/icu4c/source/data/locales/mt.txt +++ b/icu4c/source/data/locales/mt.txt @@ -803,6 +803,8 @@ mt { // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[[a-z \u00e0 \u00ec \u00f9 \u00e8 \u00f2 {\u0063\u002e} {\u0068\u002f} {\u0067\u002e} {\u0067\u0068\u002f} {\u007a\u002e}]-[\u0063\u0079]]" } + // Spellout rules. Experimental. SpelloutRules { diff --git a/icu4c/source/data/locales/nb.txt b/icu4c/source/data/locales/nb.txt index 86c21f450b..2879a1e4b6 100644 --- a/icu4c/source/data/locales/nb.txt +++ b/icu4c/source/data/locales/nb.txt @@ -116,4 +116,6 @@ nb { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e6 \u00e5 \u00f8 \u00e9 \u00f3 \u00f4 \u00e0 \u00fc \u01ce]" } + } diff --git a/icu4c/source/data/locales/nl.txt b/icu4c/source/data/locales/nl.txt index c51ea073f1..020713299b 100644 --- a/icu4c/source/data/locales/nl.txt +++ b/icu4c/source/data/locales/nl.txt @@ -103,6 +103,7 @@ nl { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00e4 \u00eb \u00ef \u00f6 \u00fc \u0133]" } //------------------------------------------------------------ // Rule Based Number Format Support diff --git a/icu4c/source/data/locales/nn.txt b/icu4c/source/data/locales/nn.txt index 30873c7b0d..68203185fb 100644 --- a/icu4c/source/data/locales/nn.txt +++ b/icu4c/source/data/locales/nn.txt @@ -112,7 +112,7 @@ nn{ "fredag", "laurdag", } - + ExemplarCharacters { "[a-z \u00e6 \u00e5 \u00f8 \u00e9 \u00f3 \u00f4 \u00e0 \u00fc \u01ce]" } LocaleID:int { 0x814 } // LocaleScript{ // "Latn", // ISO 15924 Name diff --git a/icu4c/source/data/locales/pa.txt b/icu4c/source/data/locales/pa.txt index 78d9a4022a..deaff9e6b9 100644 --- a/icu4c/source/data/locales/pa.txt +++ b/icu4c/source/data/locales/pa.txt @@ -86,6 +86,8 @@ pa { "#E0", } LocaleScript:array { "Guru" } + + ExemplarCharacters { "[:Guru:]" } CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/pl.txt b/icu4c/source/data/locales/pl.txt index d3668b0805..05b677d325 100644 --- a/icu4c/source/data/locales/pl.txt +++ b/icu4c/source/data/locales/pl.txt @@ -117,4 +117,5 @@ pl { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00f3 \u0105 \u0119 \u0107 \u0144 \u015b \u017a \u0142 \u017c]" } } diff --git a/icu4c/source/data/locales/pt.txt b/icu4c/source/data/locales/pt.txt index 0bef344eb8..0146dd19e2 100644 --- a/icu4c/source/data/locales/pt.txt +++ b/icu4c/source/data/locales/pt.txt @@ -225,4 +225,5 @@ pt { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e3 \u00f5 \u00e7 \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00e0 \u00e2 \u00ea \u00f4 \u00fc \u00f2]" } } diff --git a/icu4c/source/data/locales/ro.txt b/icu4c/source/data/locales/ro.txt index aa618b2377..6b5a3c0458 100644 --- a/icu4c/source/data/locales/ro.txt +++ b/icu4c/source/data/locales/ro.txt @@ -109,4 +109,5 @@ ro { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e2 \u00ee \u0103 \u015f \u0163]" } } diff --git a/icu4c/source/data/locales/root.txt b/icu4c/source/data/locales/root.txt index e2bd5e3e2d..9b4fde0087 100644 --- a/icu4c/source/data/locales/root.txt +++ b/icu4c/source/data/locales/root.txt @@ -1274,7 +1274,7 @@ root { DurationRules { "=#,##0=;\n" } - + ExemplarCharacters{"[a-z]"} Scripts { ARAB { "Arabic" } ARMN { "Armenian" } diff --git a/icu4c/source/data/locales/ru.txt b/icu4c/source/data/locales/ru.txt index 77532c2049..dfb2e2faf7 100644 --- a/icu4c/source/data/locales/ru.txt +++ b/icu4c/source/data/locales/ru.txt @@ -291,6 +291,7 @@ ru { LocaleScript:array { "Cyrl" // ISO 15924 Name } + ExemplarCharacters { "[\u0430-\u044f \u0451 \u0456 \u0463 \u0473 \u0475]" } //------------------------------------------------------------ // Rule Based Number Format Support diff --git a/icu4c/source/data/locales/sa.txt b/icu4c/source/data/locales/sa.txt index 2c483b1e2a..6f88c7704a 100644 --- a/icu4c/source/data/locales/sa.txt +++ b/icu4c/source/data/locales/sa.txt @@ -84,8 +84,10 @@ sa { "##,##,##0%", "#E0", } + LocaleScript:array{ "Deva" } - CollationElements { + ExemplarCharacters { "[[[:Deva:][\u0951-\u0954]]-[\u0958-\u095f]]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/sh.txt b/icu4c/source/data/locales/sh.txt index f32489c80c..332c65b925 100644 --- a/icu4c/source/data/locales/sh.txt +++ b/icu4c/source/data/locales/sh.txt @@ -361,4 +361,5 @@ sh { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-p r-v z \u0111 \u0107 \u010d \u017e \u0161 {lj} {nj} {d\u017e}]" } } diff --git a/icu4c/source/data/locales/sk.txt b/icu4c/source/data/locales/sk.txt index 20b79e789a..4f6b634729 100644 --- a/icu4c/source/data/locales/sk.txt +++ b/icu4c/source/data/locales/sk.txt @@ -110,4 +110,5 @@ sk { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00fd \u00e1 \u00e9 \u00ed \u00f3 \u00fa \u00e4 \u00f4 \u013a \u0155 \u010d \u010f \u013e \u0148 \u0161 \u0165 \u017e]" } } diff --git a/icu4c/source/data/locales/sl.txt b/icu4c/source/data/locales/sl.txt index 0cea35c3df..81c7ae0b31 100644 --- a/icu4c/source/data/locales/sl.txt +++ b/icu4c/source/data/locales/sl.txt @@ -111,4 +111,5 @@ sl { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-p r-v z \u010d \u0161 \u017e]" } } diff --git a/icu4c/source/data/locales/sq.txt b/icu4c/source/data/locales/sq.txt index 2e314fbded..e17c291bde 100644 --- a/icu4c/source/data/locales/sq.txt +++ b/icu4c/source/data/locales/sq.txt @@ -111,4 +111,5 @@ sq { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00eb \u00e7]" } } diff --git a/icu4c/source/data/locales/sr.txt b/icu4c/source/data/locales/sr.txt index 9dca218996..1c1b7f0274 100644 --- a/icu4c/source/data/locales/sr.txt +++ b/icu4c/source/data/locales/sr.txt @@ -383,4 +383,5 @@ sr { LocaleScript:array { "Cyrl" // ISO 15924 Name } + ExemplarCharacters { "[\u0430-\u0438 \u043a-\u0448 \u0452 \u0458 \u0459 \u045a \u045b \u045f]" } } diff --git a/icu4c/source/data/locales/sv.txt b/icu4c/source/data/locales/sv.txt index 744d32c766..c884c23789 100644 --- a/icu4c/source/data/locales/sv.txt +++ b/icu4c/source/data/locales/sv.txt @@ -209,7 +209,8 @@ sv { // LocaleScript{ // "Latn", // ISO 15924 Name // } - + ExemplarCharacters { "[a-z \u00e4 \u00f6 \u00e5 \u00e1 \u00e9 \u00eb \u00fc]" } + //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/syr.txt b/icu4c/source/data/locales/syr.txt index ff2f703c9e..01f4233df7 100644 --- a/icu4c/source/data/locales/syr.txt +++ b/icu4c/source/data/locales/syr.txt @@ -76,6 +76,7 @@ syr{ // "\ufffd", // } LocaleScript:array { "Syrc" } + ExemplarCharacters{ "[:Syrc:]"} CollationElements { Version { "1.0" } Sequence { diff --git a/icu4c/source/data/locales/ta.txt b/icu4c/source/data/locales/ta.txt index e6d2e694ad..d05fda7b01 100644 --- a/icu4c/source/data/locales/ta.txt +++ b/icu4c/source/data/locales/ta.txt @@ -254,5 +254,6 @@ ta { LocaleScript:array { "Taml" // ISO 15924 Name } + ExemplarCharacters{"[:Taml:]"} } diff --git a/icu4c/source/data/locales/te.txt b/icu4c/source/data/locales/te.txt index b64c9376ba..edbf57002e 100644 --- a/icu4c/source/data/locales/te.txt +++ b/icu4c/source/data/locales/te.txt @@ -4,7 +4,7 @@ // * Corporation and others. All Rights Reserved. // * // *************************************************************************** -// $Revision: 1.11 $ +// $Revision: 1.12 $ // // Telugu Locale. Data by Ram [ram@jtcsv.com] @@ -78,6 +78,7 @@ te { LocaleScript{ "Telu", // ISO 15924 Name } + ExemplarCharacters{"[:Telu:]"} // /**************** Info Below is needed ****************/ // Countries{} // Eras{} diff --git a/icu4c/source/data/locales/th.txt b/icu4c/source/data/locales/th.txt index d4f5021e30..8963fde170 100644 --- a/icu4c/source/data/locales/th.txt +++ b/icu4c/source/data/locales/th.txt @@ -579,7 +579,7 @@ th { LocaleScript{ "Thai", // Script Name } - + ExemplarCharacters { "[:Thai:]" } //------------------------------------------------------------ // Rule Based Number Format Support //------------------------------------------------------------ diff --git a/icu4c/source/data/locales/ti.txt b/icu4c/source/data/locales/ti.txt index 36de27e880..8b081e25f9 100644 --- a/icu4c/source/data/locales/ti.txt +++ b/icu4c/source/data/locales/ti.txt @@ -66,5 +66,7 @@ ti{ ER { "\u12A4\u122D\u1275\u122B" } ET { "\u12A2\u1275\u12EE\u1335\u12EB" } } + LocaleScript{ "Ethi", } + ExemplarCharacters{"[:Ethi:]"} } diff --git a/icu4c/source/data/locales/tr.txt b/icu4c/source/data/locales/tr.txt index 76ca5ed75c..3e1adab2be 100644 --- a/icu4c/source/data/locales/tr.txt +++ b/icu4c/source/data/locales/tr.txt @@ -114,4 +114,5 @@ tr { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters { "[a-z \u00e2 \u00ee \u00fb \u00f6 \u00fc \u0131 \u00e7 \u015f \u011f]" } } diff --git a/icu4c/source/data/locales/tt.txt b/icu4c/source/data/locales/tt.txt index 52f5184a82..d9a4044900 100644 --- a/icu4c/source/data/locales/tt.txt +++ b/icu4c/source/data/locales/tt.txt @@ -74,7 +74,9 @@ tt{ "\ufffd", } LocaleScript:array { "Cyrl" } - CollationElements { + + ExemplarCharacters { "[\u0430-\u044f \u0451 \u0456 \u0463 \u0473 \u0475]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/uk.txt b/icu4c/source/data/locales/uk.txt index d99ded1a94..8d89310112 100644 --- a/icu4c/source/data/locales/uk.txt +++ b/icu4c/source/data/locales/uk.txt @@ -144,4 +144,5 @@ uk { LocaleScript:array { "Cyrl" // ISO 15924 Name } + ExemplarCharacters { "[\u0430-\u0449 \u044e \u044f \u0454 \u0456 \u0457 \u0491]" } } diff --git a/icu4c/source/data/locales/ur.txt b/icu4c/source/data/locales/ur.txt index bb43209aa2..60141cc1d3 100644 --- a/icu4c/source/data/locales/ur.txt +++ b/icu4c/source/data/locales/ur.txt @@ -74,7 +74,9 @@ ur{ // "\ufffd", // } LocaleScript:array { "Arab" } - CollationElements { + + ExemplarCharacters { "[:Arab:]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/uz.txt b/icu4c/source/data/locales/uz.txt index 5a99115203..ffe175feef 100644 --- a/icu4c/source/data/locales/uz.txt +++ b/icu4c/source/data/locales/uz.txt @@ -75,7 +75,8 @@ uz{ "\ufffd", } LocaleScript:array { "Cyrl" } - CollationElements { + ExemplarCharacters { "[\u0430-\u044f \u0451 \u0456 \u0463 \u0473 \u0475]" } + CollationElements { Version { "1.0" } Sequence { "[normalization on]" diff --git a/icu4c/source/data/locales/vi.txt b/icu4c/source/data/locales/vi.txt index e9a6880aae..1951c68a69 100644 --- a/icu4c/source/data/locales/vi.txt +++ b/icu4c/source/data/locales/vi.txt @@ -95,4 +95,6 @@ vi { // LocaleScript{ // "Latn", // ISO 15924 Name // } + ExemplarCharacters{ "[a-z \u1EA0-\u1Ef9 \u0111 \u01A1 \u00E0-\u00E3 \u00E8-\u00EA \u00EC \u00ED \u00F2-\u00F5 \u00F9 \u00FA \u00FD \u0103 \u0129 \u0169 \u01B0 +]" } } diff --git a/icu4c/source/data/locales/zh.txt b/icu4c/source/data/locales/zh.txt index df96018ff1..55d525a558 100644 --- a/icu4c/source/data/locales/zh.txt +++ b/icu4c/source/data/locales/zh.txt @@ -1175,4 +1175,35 @@ zh { } } LocaleScript:array { "Hani" } + ExemplarCharacters{ + "[\u4E07-\u4E0E \u4E18-\u4E1E \u4E4B-\u4E50 \u4E5C-\u4E61 \u4EA4-\u4EA9 " + " \u4EBF-\u4EC7 \u4ED3-\u4ED9 \u4F57-\u4F60 \u4FA5-\u4FAA \u5173-\u5179 " + " \u51F8-\u51FD \u5216-\u521B \u5236-\u523B \u529D-\u52A3 \u52A8-\u52AD " + " \u535E-\u5364 \u53C8-\u53CD \u53E8-\u53F3 \u540C-\u5413 \u5452-\u5459 " + " \u54A6-\u54AD \u54CC-\u54D5 \u54E5-\u54EA \u56DD-\u56E2 \u574C-\u5751 " + " \u575A-\u5761 \u5A03-\u5A09 \u5B57-\u5B5D \u5B97-\u5B9E \u5BA0-\u5BA6 " + " \u5C38-\u5C42 \u5C96-\u5C9C \u5E18-\u5E1D \u5EFE-\u5F04 \u5F87-\u5F8C " + " \u5FFD-\u6006 \u6025-\u602B \u6067-\u606D \u6078-\u607D \u60EB-\u60F0 " + " \u620A-\u6212 \u6269-\u6270 \u62C4-\u62CA \u62D6-\u62DC \u631D-\u6325 " + " \u634B-\u6350 \u65EC-\u65F1 \u6652-\u6657 \u67CF-\u67D4 \u6807-\u680C " + " \u6840-\u6846 \u6860-\u6869 \u6B62-\u6B67 \u6BD2-\u6BD7 \u6C5B-\u6C61 " + " \u6DA6-\u6DAB \u72EC-\u72F4 \u75AE-\u75B5 \u76CD-\u76D2 \u77FD-\u7802 " + " \u7837-\u783C \u795A-\u7960 \u7BA6-\u7BAD \u7E9F-\u7EAD \u7EB5-\u7EBA " + " \u7EBD-\u7ED5 \u7ED7-\u7EE3 \u7EE5-\u7EEB \u7EED-\u7EF8 \u7EFA-\u7F09 " + " \u7F11-\u7F1D \u7F1F-\u7F36 \u8014-\u8019 \u8025-\u802A \u80BC-\u80C4 " + " \u80D9-\u80DE \u80E7-\u80ED \u80EF-\u80F4 \u810D-\u8114 \u8179-\u8180 " + " \u8233-\u8239 \u82A8-\u82B1 \u82CA-\u82CF \u8301-\u8309 \u8363-\u836F " + " \u8537-\u853D \u8679-\u8682 \u89C4-\u89CC \u8BA0-\u8BAB \u8BB2-\u8BBA " + " \u8BBC-\u8BC6 \u8BC8-\u8BCF \u8BD1-\u8BE9 \u8BEB-\u8C08 \u8C0A-\u8C1D " + " \u8C1F-\u8C37 \u8D21-\u8D50 \u8D58-\u8D5E \u8F6B-\u8F7F \u8F81-\u8F8B " + " \u8F93-\u8F9C \u9000-\u9006 \u901D-\u9022 \u9149-\u9150 \u9174-\u9179 " + " \u9485-\u9490 \u9499-\u94C6 \u94C8-\u94CE \u94DB-\u94E5 \u94E7-\u94FA " + " \u94FC-\u951B \u9521-\u9526 \u9528-\u9532 \u9534-\u953C \u954C-\u9554 " + " \u9561-\u956D \u95ED-\u95FE \u9600-\u9606 \u9608-\u9612 \u9631-\u9636 " + " \u9644-\u9649 \u9875-\u988A \u989A-\u98A2 \u9967-\u9972 \u998F-\u9999 " + " \u9A6C-\u9A71 \u9A73-\u9A82 \u9A9A-\u9AA5 \u9C9E-\u9CA9 \u9CB0-\u9CB8 " + " \u9CCA-\u9CD0 \u9CD3-\u9CD9 \u9E28-\u9E2D \u9E35-\u9E3A \u9E41-\u9E4C " + " \u9E66-\u9E6D \u9F83-\u9F8C]" + + } } diff --git a/icu4c/source/data/locales/zh_TW.txt b/icu4c/source/data/locales/zh_TW.txt index f63f597559..34a4ea2c7b 100644 --- a/icu4c/source/data/locales/zh_TW.txt +++ b/icu4c/source/data/locales/zh_TW.txt @@ -1343,5 +1343,52 @@ zh_TW { "GMT", } } - LocaleScript { "Hani" , "Bopo" } + LocaleScript { "Hani" , "Bopo" } + ExemplarCharacters{ + "[\u3005-\u3015 \u3041-\u3093 \u30A1-\u30F6 \u3105-\u3129 " + " \u4E07-\u4E11 \u4F4C-\u4F64 \u4F73-\u4F89 \u4FD6-\u4FE1 " + " \u5011-\u501C \u5045-\u504F \u505A-\u5065 \u50AC-\u50B8 " + " \u5102-\u510C \u53E8-\u53F3 \u5406-\u5412 \u5424-\u542E " + " \u54A5-\u54B1 \u54BA-\u54C9 \u552C-\u5539 \u55C2-\u55D6 " + " \u5668-\u5674 \u57F0-\u57FD \u5804-\u580E \u582C-\u5839 " + " \u5879-\u5883 \u597B-\u5985 \u59CA-\u59D4 \u5AAE-\u5AC2 " + " \u5AD5-\u5AE3 \u5BDE-\u5BEC \u5C07-\u5C12 \u5C9F-\u5CB1 " + " \u5D30-\u5D3A \u5E66-\u5E70 \u5ED1-\u5EE3 \u6009-\u6017 " + " \u6024-\u602F \u6062-\u6070 \u60B4-\u60C1 \u60C3-\u60CF " + " \u60F0-\u60FC \u6144-\u614F \u61A7-\u61B6 \u61F5-\u6201 " + " \u62C6-\u62D4 \u62EB-\u6303 \u6340-\u6351 \u639B-\u63A5 " + " \u63A7-\u63B1 \u63C2-\u63D0 \u641E-\u6428 \u6572-\u657C " + " \u6602-\u6615 \u676F-\u677F \u67C8-\u67D4 \u67E9-\u67F8 " + " \u68A7-\u68B5 \u68EE-\u68FD \u690A-\u6915 \u6956-\u6960 " + " \u69A3-\u69B1 \u6BC3-\u6BCD \u6BFB-\u6C06 \u6C80-\u6C90 " + " \u6CB6-\u6CC7 \u6D07-\u6D12 \u6D27-\u6D42 \u6D5E-\u6D6A " + " \u6D74-\u6D80 \u6D82-\u6D8E \u6DCF-\u6DE6 \u6DE8-\u6DF7 " + " \u6E2B-\u6E36 \u6E5A-\u6E69 \u6E9B-\u6EA7 \u6EBC-\u6ED6 " + " \u6F29-\u6F33 \u6FA0-\u6FB4 \u715C-\u716A \u71BC-\u71CB " + " \u72F6-\u7301 \u737A-\u738B \u7403-\u740D \u7428-\u7436 " + " \u74D4-\u74E6 \u7528-\u7533 \u75B8-\u75C2 \u75EF-\u7601 " + " \u7619-\u7629 \u7731-\u773E \u7765-\u776F \u7799-\u77A3 " + " \u7825-\u7835 \u7923-\u792D \u7B2A-\u7B35 \u7B44-\u7B52 " + " \u7BD8-\u7BEB \u7D00-\u7D22 \u7D38-\u7D47 \u7DB7-\u7DC2 " + " \u7E08-\u7E17 \u7E1A-\u7E25 \u7E2D-\u7E49 \u7E50-\u7E5A " + " \u7E72-\u7E7E \u7FB5-\u7FC3 \u7FE8-\u7FF5 \u80D4-\u80DE " + " \u814A-\u8155 \u82B3-\u82BE \u8331-\u833C \u8347-\u8354 " + " \u8386-\u8390 \u83BF-\u83CC \u83DB-\u83E5 \u8409-\u8413 " + " \u842F-\u843D \u8497-\u84A2 \u84C9-\u84D4 \u8523-\u8531 " + " \u8560-\u856E \u8580-\u8591 \u8598-\u85A4 \u86B3-\u86C9 " + " \u8700-\u870E \u8720-\u872A \u874C-\u876F \u87B2-\u87C0 " + " \u87DB-\u87E8 \u88D4-\u88DF \u8910-\u891A \u8929-\u8933 " + " \u8956-\u8964 \u8AED-\u8AF8 \u8B0D-\u8B1E \u8B4E-\u8B5A " + " \u8C45-\u8C50 \u8CB2-\u8CC5 \u8CDC-\u8CE8 \u8D8C-\u8D96 " + " \u8E0F-\u8E27 \u8E59-\u8E67 \u8E84-\u8E8E \u8F4D-\u8F5B " + " \u8FFA-\u9006 \u9019-\u9024 \u9072-\u9088 \u90F9-\u9109 " + " \u9116-\u9124 \u9126-\u9136 \u9143-\u9150 \u9199-\u91A3 " + " \u91AA-\u91B5 \u9248-\u9254 \u9293-\u929D \u92A0-\u92AC " + " \u92C0-\u92D3 \u931D-\u932B \u93F5-\u9400 \u9409-\u9416 " + " \u946D-\u9478 \u96BF-\u96CE \u96D2-\u96DF \u9722-\u972C " + " \u977A-\u9785 \u97FD-\u9808 \u9927-\u9933 \u99AB-\u99B5 " + " \u99CB-\u99D9 \u9D96-\u9DA4 \u9DB1-\u9DBC \u9DD5-\u9DDF " + " \u9DFD-\u9E07 \u9F28-\u9F38]" + + } }