From 7f88594d99d29441df8a6fdea08c4c7433de99d6 Mon Sep 17 00:00:00 2001 From: Ram Viswanadha Date: Thu, 4 Oct 2001 01:34:53 +0000 Subject: [PATCH] ICU-1255 Indic Transliteration rules fixes X-SVN-Rev: 6039 --- icu4c/data/Bengali_InterIndic.txt | 190 ++++---- icu4c/data/Devanagari_InterIndic.txt | 232 +++++----- icu4c/data/Gujarati_InterIndic.txt | 165 ++++--- icu4c/data/Gurmukhi_InterIndic.txt | 159 ++++--- icu4c/data/InterIndic_Bengali.txt | 203 +++++---- icu4c/data/InterIndic_Devanagari.txt | 226 +++++----- icu4c/data/InterIndic_Gujarati.txt | 203 +++++---- icu4c/data/InterIndic_Gurmukhi.txt | 203 +++++---- icu4c/data/InterIndic_Kannada.txt | 203 +++++---- icu4c/data/InterIndic_Latin.txt | 414 ++++++++++++++++++ icu4c/data/InterIndic_Malayalam.txt | 203 +++++---- icu4c/data/InterIndic_Oriya.txt | 203 +++++---- icu4c/data/InterIndic_Tamil.txt | 203 +++++---- icu4c/data/InterIndic_Telugu.txt | 203 +++++---- icu4c/data/Kannada_InterIndic.txt | 169 ++++--- icu4c/data/Latin_InterIndic.txt | 336 ++++++++++++++ icu4c/data/Malayalam_InterIndic.txt | 165 ++++--- icu4c/data/Oriya_InterIndic.txt | 167 ++++--- icu4c/data/Tamil_InterIndic.txt | 131 +++--- icu4c/data/Telugu_InterIndic.txt | 169 ++++--- icu4c/data/resfiles.mk | 38 +- icu4c/data/translit_index.txt | 30 +- icu4c/source/data/locales/resfiles.mk | 38 +- icu4c/source/data/translit/translit_index.txt | 30 +- 24 files changed, 2548 insertions(+), 1735 deletions(-) create mode 100644 icu4c/data/InterIndic_Latin.txt create mode 100644 icu4c/data/Latin_InterIndic.txt diff --git a/icu4c/data/Bengali_InterIndic.txt b/icu4c/data/Bengali_InterIndic.txt index ae42fe72a4..164da2d9e5 100644 --- a/icu4c/data/Bengali_InterIndic.txt +++ b/icu4c/data/Bengali_InterIndic.txt @@ -1,17 +1,11 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- -// THIS IS A MACHINE-GENERATED FILE -// Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Bengali_InterIndic.utf8.txt -// Date: Thu Mar 1 20:03:54 2001 -//-------------------------------------------------------------------- // Bengali_InterIndic -Bengali_InterIndic { +Bengali-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,97 +15,97 @@ Bengali_InterIndic { //-------------------------------------------------------------------- // Bengali-InterIndic - -"ঁ>\uE001;" // SIGN CANDRABINDU -"ং>\uE002;" // SIGN ANUSVARA -"ঃ>\uE003;" // SIGN VISARGA -"অ>\uE005;" // LETTER A -"আ>\uE006;" // LETTER AA -"ই>\uE007;" // LETTER I -"ঈ>\uE008;" // LETTER II -"উ>\uE009;" // LETTER U -"ঊ>\uE00A;" // LETTER UU -"ঋ>\uE00B;" // LETTER VOCALIC R -"ঌ>\uE00C;" // LETTER VOCALIC L -"এ>\uE081;" // LETTER E -"ঐ>\uE010;" // LETTER AI -"ও>\uE082;" // LETTER O -"ঔ>\uE014;" // LETTER AU -"ক>\uE015;" // LETTER KA -"খ>\uE016;" // LETTER KHA -"গ>\uE017;" // LETTER GA -"ঘ>\uE018;" // LETTER GHA -"ঙ>\uE019;" // LETTER NGA -"চ>\uE01A;" // LETTER CA -"ছ>\uE01B;" // LETTER CHA -"জ>\uE01C;" // LETTER JA -"ঝ>\uE01D;" // LETTER JHA -"ঞ>\uE01E;" // LETTER NYA -"ট>\uE01F;" // LETTER TTA -"ঠ>\uE020;" // LETTER TTHA -"ড>\uE021;" // LETTER DDA -"ঢ>\uE022;" // LETTER DDHA -"ণ>\uE023;" // LETTER NNA -"ত>\uE024;" // LETTER TA -"থ>\uE025;" // LETTER THA -"দ>\uE026;" // LETTER DA -"ধ>\uE027;" // LETTER DHA -"ন>\uE028;" // LETTER NA -"প>\uE02A;" // LETTER PA -"ফ>\uE02B;" // LETTER PHA -"ব>\uE02C;" // LETTER BA -"ভ>\uE02D;" // LETTER BHA -"ম>\uE02E;" // LETTER MA -"য>\uE02F;" // LETTER YA -"র>\uE030;" // LETTER RA -"ল>\uE032;" // LETTER LA -"শ>\uE036;" // LETTER SHA -"ষ>\uE037;" // LETTER SSA -"স>\uE038;" // LETTER SA -"হ>\uE039;" // LETTER HA -"়>\uE03C;" // SIGN NUKTA -"া>\uE03E;" // VOWEL SIGN AA 
-"ি>\uE03F;" // VOWEL SIGN I -"ী>\uE040;" // VOWEL SIGN II -"ু>\uE041;" // VOWEL SIGN U -"ূ>\uE042;" // VOWEL SIGN UU -"ৃ>\uE043;" // VOWEL SIGN VOCALIC R -"ৄ>\uE044;" // VOWEL SIGN VOCALIC RR -"ে>\uE084;" // VOWEL SIGN E -"ৈ>\uE048;" // VOWEL SIGN AI -"ো>\uE085;" // VOWEL SIGN O -"ৌ>\uE04C;" // VOWEL SIGN AU -"্>\uE04D;" // SIGN VIRAMA -"ৗ>\uE057;" // AU LENGTH MARK -"ড়>\uE083;" // LETTER RRA -"ঢ়>\uE05D;" // LETTER RHA -"য়>\uE05F;" // LETTER YYA -"ৠ>\uE060;" // LETTER VOCALIC RR -"ৡ>\uE061;" // LETTER VOCALIC LL -"ৢ>\uE062;" // VOWEL SIGN VOCALIC L -"ৣ>\uE063;" // VOWEL SIGN VOCALIC LL -"০>\uE066;" // DIGIT ZERO -"১>\uE067;" // DIGIT ONE -"২>\uE068;" // DIGIT TWO -"৩>\uE069;" // DIGIT THREE -"৪>\uE06A;" // DIGIT FOUR -"৫>\uE06B;" // DIGIT FIVE -"৬>\uE06C;" // DIGIT SIX -"৭>\uE06D;" // DIGIT SEVEN -"৮>\uE06E;" // DIGIT EIGHT -"৯>\uE06F;" // DIGIT NINE -// ৰ>; // UNMAPPED Bengali-InterIndic: LETTER RA WITH MIDDLE DIAGONAL -// ৱ>; // UNMAPPED Bengali-InterIndic: LETTER RA WITH LOWER DIAGONAL -// ৲>; // UNMAPPED Bengali-InterIndic: RUPEE MARK -// ৳>; // UNMAPPED Bengali-InterIndic: RUPEE SIGN -// ৴>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR ONE -// ৵>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR TWO -// ৶>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR THREE -// ৷>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR FOUR -// ৸>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR -// ৹>; // UNMAPPED Bengali-InterIndic: CURRENCY DENOMINATOR SIXTEEN -"৺>\uE080;" // ISSHAR - +":: NFD (NFC) ;" +"\u0981>\ue001;" // SIGN CANDRABINDU +"\u0982>\ue002;" // SIGN ANUSVARA +"\u0983>\ue003;" // SIGN VISARGA +"\u0985>\ue005;" // LETTER A +"\u0986>\ue006;" // LETTER AA +"\u0987>\ue007;" // LETTER I +"\u0988>\ue008;" // LETTER II +"\u0989>\ue009;" // LETTER U +"\u098a>\ue00a;" // LETTER UU +"\u098b>\ue00b;" // LETTER VOCALIC R +"\u098c>\ue00c;" // LETTER VOCALIC L +"\u098f>\ue00f;" // LETTER E +"\u0990>\ue010;" // LETTER AI 
+"\u0993>\ue013;" // LETTER O +"\u0994>\ue014;" // LETTER AU +"\u0995>\ue015;" // LETTER KA +"\u0996>\ue016;" // LETTER KHA +"\u0997>\ue017;" // LETTER GA +"\u0998>\ue018;" // LETTER GHA +"\u0999>\ue019;" // LETTER NGA +"\u099a>\ue01a;" // LETTER CA +"\u099b>\ue01b;" // LETTER CHA +"\u099c>\ue01c;" // LETTER JA +"\u099d>\ue01d;" // LETTER JHA +"\u099e>\ue01e;" // LETTER NYA +"\u099f>\ue01f;" // LETTER TTA +"\u09a0>\ue020;" // LETTER TTHA +"\u09a1>\ue021;" // LETTER DDA +"\u09a2>\ue022;" // LETTER DDHA +"\u09a3>\ue023;" // LETTER NNA +"\u09a4>\ue024;" // LETTER TA +"\u09a5>\ue025;" // LETTER THA +"\u09a6>\ue026;" // LETTER DA +"\u09a7>\ue027;" // LETTER DHA +"\u09a8>\ue028;" // LETTER NA +"\u09aa>\ue02a;" // LETTER PA +"\u09ab>\ue02b;" // LETTER PHA +"\u09ac>\ue02c;" // LETTER BA +"\u09ad>\ue02d;" // LETTER BHA +"\u09ae>\ue02e;" // LETTER MA +"\u09af>\ue02f;" // LETTER YA +"\u09b0>\ue030;" // LETTER RA +"\u09b2>\ue032;" // LETTER LA +"\u09b6>\ue036;" // LETTER SHA +"\u09b7>\ue037;" // LETTER SSA +"\u09b8>\ue038;" // LETTER SA +"\u09b9>\ue039;" // LETTER HA +"\u09bc>\ue03c;" // SIGN NUKTA +"\u09be>\ue03e;" // VOWEL SIGN AA +"\u09bf>\ue03f;" // VOWEL SIGN I +"\u09c0>\ue040;" // VOWEL SIGN II +"\u09c1>\ue041;" // VOWEL SIGN U +"\u09c2>\ue042;" // VOWEL SIGN UU +"\u09c3>\ue043;" // VOWEL SIGN VOCALIC R +"\u09c4>\ue044;" // VOWEL SIGN VOCALIC RR +"\u09c7>\ue047;" // VOWEL SIGN E +"\u09c8>\ue048;" // VOWEL SIGN AI +"\u09cb>\ue04b;" // VOWEL SIGN O +"\u09cc>\ue04c;" // VOWEL SIGN AU +"\u09cd>\ue04d;" // SIGN VIRAMA +"\u09d7>\ue057;" // AU LENGTH MARK +"\u09dc>\ue053;" // LETTER RRA +"\u09dd>\ue05d;" // LETTER RHA +"\u09df>\ue05f;" // LETTER YYA +"\u09e0>\ue060;" // LETTER VOCALIC RR +"\u09e1>\ue061;" // LETTER VOCALIC LL +"\u09e2>\ue062;" // VOWEL SIGN VOCALIC L +"\u09e3>\ue063;" // VOWEL SIGN VOCALIC LL +"\u09e6>\ue066;" // DIGIT ZERO +"\u09e7>\ue067;" // DIGIT ONE +"\u09e8>\ue068;" // DIGIT TWO +"\u09e9>\ue069;" // DIGIT THREE +"\u09ea>\ue06a;" // DIGIT FOUR 
+"\u09eb>\ue06b;" // DIGIT FIVE +"\u09ec>\ue06c;" // DIGIT SIX +"\u09ed>\ue06d;" // DIGIT SEVEN +"\u09ee>\ue06e;" // DIGIT EIGHT +"\u09ef>\ue06f;" // DIGIT NINE +// \u09f0>; // UNMAPPED Bengali-InterIndic: LETTER RA WITH MIDDLE DIAGONAL +// \u09f1>; // UNMAPPED Bengali-InterIndic: LETTER RA WITH LOWER DIAGONAL +// \u09f2>; // UNMAPPED Bengali-InterIndic: RUPEE MARK +// \u09f3>; // UNMAPPED Bengali-InterIndic: RUPEE SIGN +// \u09f4>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR ONE +// \u09f5>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR TWO +// \u09f6>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR THREE +// \u09f7>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR FOUR +// \u09f8>; // UNMAPPED Bengali-InterIndic: CURRENCY NUMERATOR ONE LESS THAN THE DENOMINATOR +// \u09f9>; // UNMAPPED Bengali-InterIndic: CURRENCY DENOMINATOR SIXTEEN +"\u09fa>\ue070;" // ISSHAR + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Devanagari_InterIndic.txt b/icu4c/data/Devanagari_InterIndic.txt index 92f3c37375..faa1492e74 100644 --- a/icu4c/data/Devanagari_InterIndic.txt +++ b/icu4c/data/Devanagari_InterIndic.txt @@ -1,17 +1,11 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- -// THIS IS A MACHINE-GENERATED FILE -// Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Devanagari_InterIndic.utf8.txt -// Date: Thu Mar 1 20:03:54 2001 -//-------------------------------------------------------------------- // Devanagari_InterIndic -Devanagari_InterIndic { +Devanagari-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,112 +15,124 @@ Devanagari_InterIndic { //-------------------------------------------------------------------- // Devanagari-InterIndic + ":: NFD (NFC) ;" + //Rules for Decomposed characters + "\u0928\u093c > \ue029;" //\u0929 + "\u0930\u093c > \ue031;" //\u0932 + "\u0933\u093c > \ue034;" //\u0934 + "\u0915\u093c > \ue058;" //\u0958 LETTER QA (For Urdu) + "\u0916\u093c > \ue059;" //\u0959 LETTER KHHA (For Urdu) + "\u0917\u093c > \ue05a;" //\u095a LETTER GHHA (For Urdu) + "\u091c\u093c > \ue05b;" //\u095b LETTER ZA (For Urdu) + "\u0921\u093c > \ue05c;" //\u095c LETTER DDDHA (pronounced RRA) + "\u0922\u093c > \ue05d;" //\u095d LETTER RHA (pronounced RRHA) + "\u092b\u093c > \ue05e;" //\u095e LETTER FA + "\u092f\u093c > \ue05f;" //\u095f LETTER YYA -"ँ>\uE001;" // SIGN CANDRABINDU -"ं>\uE002;" // SIGN ANUSVARA -"ः>\uE003;" // SIGN VISARGA -"अ>\uE005;" // LETTER A -"आ>\uE006;" // LETTER AA -"इ>\uE007;" // LETTER I -"ई>\uE008;" // LETTER II -"उ>\uE009;" // LETTER U -"ऊ>\uE00A;" // LETTER UU -"ऋ>\uE00B;" // LETTER VOCALIC R -"ऌ>\uE00C;" // LETTER VOCALIC L -// ऍ>; // UNMAPPED Devanagari-InterIndic: LETTER CANDRA E -// ऎ>; // UNMAPPED Devanagari-InterIndic: LETTER SHORT E -"ए>\uE081;" // LETTER E -"ऐ>\uE010;" // LETTER AI -// ऑ>; // UNMAPPED Devanagari-InterIndic: LETTER CANDRA O -// ऒ>; // UNMAPPED Devanagari-InterIndic: LETTER SHORT O -"ओ>\uE082;" // LETTER O -"औ>\uE014;" // LETTER AU -"क>\uE015;" // LETTER KA -"ख>\uE016;" // 
LETTER KHA -"ग>\uE017;" // LETTER GA -"घ>\uE018;" // LETTER GHA -"ङ>\uE019;" // LETTER NGA -"च>\uE01A;" // LETTER CA -"छ>\uE01B;" // LETTER CHA -"ज>\uE01C;" // LETTER JA -"झ>\uE01D;" // LETTER JHA -"ञ>\uE01E;" // LETTER NYA -"ट>\uE01F;" // LETTER TTA -"ठ>\uE020;" // LETTER TTHA -"ड>\uE021;" // LETTER DDA -"ढ>\uE022;" // LETTER DDHA -"ण>\uE023;" // LETTER NNA -"त>\uE024;" // LETTER TA -"थ>\uE025;" // LETTER THA -"द>\uE026;" // LETTER DA -"ध>\uE027;" // LETTER DHA -"न>\uE028;" // LETTER NA -"ऩ>\uE029;" // LETTER NNNA -"प>\uE02A;" // LETTER PA -"फ>\uE02B;" // LETTER PHA -"ब>\uE02C;" // LETTER BA -"भ>\uE02D;" // LETTER BHA -"म>\uE02E;" // LETTER MA -"य>\uE02F;" // LETTER YA -"र>\uE030;" // LETTER RA -"ऱ>\uE083;" // LETTER RRA -"ल>\uE032;" // LETTER LA -"ळ>\uE033;" // LETTER LLA -"ऴ>\uE034;" // LETTER LLLA -"व>\uE035;" // LETTER VA -"श>\uE036;" // LETTER SHA -"ष>\uE037;" // LETTER SSA -"स>\uE038;" // LETTER SA -"ह>\uE039;" // LETTER HA -"़>\uE03C;" // SIGN NUKTA -"ऽ>\uE03D;" // SIGN AVAGRAHA -"ा>\uE03E;" // VOWEL SIGN AA -"ि>\uE03F;" // VOWEL SIGN I -"ी>\uE040;" // VOWEL SIGN II -"ु>\uE041;" // VOWEL SIGN U -"ू>\uE042;" // VOWEL SIGN UU -"ृ>\uE043;" // VOWEL SIGN VOCALIC R -"ॄ>\uE044;" // VOWEL SIGN VOCALIC RR -"ॅ>\uE045;" // VOWEL SIGN CANDRA E -// ॆ>; // UNMAPPED Devanagari-InterIndic: VOWEL SIGN SHORT E -"े>\uE084;" // VOWEL SIGN E -"ै>\uE048;" // VOWEL SIGN AI -"ॉ>\uE049;" // VOWEL SIGN CANDRA O -// ॊ>; // UNMAPPED Devanagari-InterIndic: VOWEL SIGN SHORT O -"ो>\uE085;" // VOWEL SIGN O -"ौ>\uE04C;" // VOWEL SIGN AU -"्>\uE04D;" // SIGN VIRAMA -"ॐ>\uE050;" // OM -// ॑>; // UNMAPPED Devanagari-InterIndic: STRESS SIGN UDATTA -// ॒>; // UNMAPPED Devanagari-InterIndic: STRESS SIGN ANUDATTA -// ॓>; // UNMAPPED Devanagari-InterIndic: GRAVE ACCENT -// ॔>; // UNMAPPED Devanagari-InterIndic: ACUTE ACCENT -// क़>; // UNMAPPED Devanagari-InterIndic: LETTER QA -"ख़>\uE059;" // LETTER KHHA -"ग़>\uE05A;" // LETTER GHHA -"ज़>\uE05B;" // LETTER ZA -// ड़>; // UNMAPPED 
Devanagari-InterIndic: LETTER DDDHA -"ढ़>\uE05D;" // LETTER RHA -"फ़>\uE05E;" // LETTER FA -"य़>\uE05F;" // LETTER YYA -"ॠ>\uE060;" // LETTER VOCALIC RR -"ॡ>\uE061;" // LETTER VOCALIC LL -"ॢ>\uE062;" // VOWEL SIGN VOCALIC L -"ॣ>\uE063;" // VOWEL SIGN VOCALIC LL -// ।>; // UNMAPPED Devanagari-InterIndic: DANDA -// ॥>; // UNMAPPED Devanagari-InterIndic: DOUBLE DANDA -"०>\uE066;" // DIGIT ZERO -"१>\uE067;" // DIGIT ONE -"२>\uE068;" // DIGIT TWO -"३>\uE069;" // DIGIT THREE -"४>\uE06A;" // DIGIT FOUR -"५>\uE06B;" // DIGIT FIVE -"६>\uE06C;" // DIGIT SIX -"७>\uE06D;" // DIGIT SEVEN -"८>\uE06E;" // DIGIT EIGHT -"९>\uE06F;" // DIGIT NINE -// ॰>; // UNMAPPED Devanagari-InterIndic: ABBREVIATION SIGN - -// eof + "\u0901>\ue001;" // SIGN CANDRABINDU + "\u0902>\ue002;" // SIGN ANUSVARA + "\u0903>\ue003;" // SIGN VISARGA + "\u0905>\ue005;" // LETTER A + "\u0906>\ue006;" // LETTER AA + "\u0907>\ue007;" // LETTER I + "\u0908>\ue008;" // LETTER II + "\u0909>\ue009;" // LETTER U + "\u090a>\ue00a;" // LETTER UU + "\u090b>\ue00b;" // LETTER VOCALIC R + "\u090c>\ue00c;" // LETTER VOCALIC L + "\u090d>\ue00d;" // LETTER CANDRA E (For representing English sounds) +//"\u090e>\ue00e;" // UNMAPPED LETTER SHORT E(For Southern Scripts) + "\u090f>\ue00f;" // LETTER E + "\u0910>\ue010;" // LETTER AI + "\u0911>\ue011;" // LETTER CANDRA O (For representing English sounds) +//"\u0912>\ue012;" // UNMAPPED LETTER SHORT O (For Southern Scripts) + "\u0913>\ue013;" // LETTER O + "\u0914>\ue014;" // LETTER AU + "\u0915>\ue015;" // LETTER KA + "\u0916>\ue016;" // LETTER KHA + "\u0917>\ue017;" // LETTER GA + "\u0918>\ue018;" // LETTER GHA + "\u0919>\ue019;" // LETTER NGA + "\u091a>\ue01a;" // LETTER CA + "\u091b>\ue01b;" // LETTER CHA + "\u091c>\ue01c;" // LETTER JA + "\u091d>\ue01d;" // LETTER JHA + "\u091e>\ue01e;" // LETTER NYA + "\u091f>\ue01f;" // LETTER TTA + "\u0920>\ue020;" // LETTER TTHA + "\u0921>\ue021;" // LETTER DDA + "\u0922>\ue022;" // LETTER DDHA + "\u0923>\ue023;" // LETTER NNA + 
"\u0924>\ue024;" // LETTER TA + "\u0925>\ue025;" // LETTER THA + "\u0926>\ue026;" // LETTER DA + "\u0927>\ue027;" // LETTER DHA + "\u0928>\ue028;" // LETTER NA + "\u0929>\ue029;" // LETTER NNNA + "\u092a>\ue02a;" // LETTER PA + "\u092b>\ue02b;" // LETTER PHA + "\u092c>\ue02c;" // LETTER BA + "\u092d>\ue02d;" // LETTER BHA + "\u092e>\ue02e;" // LETTER MA + "\u092f>\ue02f;" // LETTER YA + "\u0930>\ue030;" // LETTER RA + //"\u0931>\ue031;" // UNMAPPED LETTER RRA (Eyelash RA for Southern scripts) + "\u0932>\ue032;" // LETTER LA + "\u0933>\ue033;" // LETTER LLA + //"\u0934>\ue034;" // UNMAPPED LETTER LLLA (LLLA for Southern scripts) + "\u0935>\ue035;" // LETTER VA + "\u0936>\ue036;" // LETTER SHA + "\u0937>\ue037;" // LETTER SSA + "\u0938>\ue038;" // LETTER SA + "\u0939>\ue039;" // LETTER HA + "\u093c>\ue03c;" // SIGN NUKTA + "\u093d>\ue03d;" // SIGN AVAGRAHA + "\u093e>\ue03e;" // VOWEL SIGN AA + "\u093f>\ue03f;" // VOWEL SIGN I + "\u0940>\ue040;" // VOWEL SIGN II + "\u0941>\ue041;" // VOWEL SIGN U + "\u0942>\ue042;" // VOWEL SIGN UU + "\u0943>\ue043;" // VOWEL SIGN VOCALIC R + "\u0944>\ue044;" // VOWEL SIGN VOCALIC RR + "\u0945>\ue045;" // VOWEL SIGN CANDRA E +//"\u0946>\ue046;" // UNMAPPED VOWEL SIGN SHORT E + "\u0947>\ue047;" // VOWEL SIGN E + "\u0948>\ue048;" // VOWEL SIGN AI + "\u0949>\ue049;" // VOWEL SIGN CANDRA O +//"\u094a>\ue04a;" // UNMAPPED VOWEL SIGN SHORT O + "\u094b>\ue04b;" // VOWEL SIGN O + "\u094c>\ue04c;" // VOWEL SIGN AU + "\u094d>\ue04d;" // SIGN VIRAMA + "\u0950>\ue050;" // OM +// "\u0951>;" // UNMAPPED STRESS SIGN UDATTA +// "\u0952>;" // UNMAPPED STRESS SIGN ANUDATTA +// "\u0953>;" // UNMAPPED GRAVE ACCENT +// "\u0954>;" // UNMAPPED ACUTE ACCENT + "\u0958>\ue058;" // LETTER QA (For Urdu) + "\u0959>\ue059;" // LETTER KHHA (For Urdu) + "\u095a>\ue05a;" // LETTER GHHA (For Urdu) + "\u095b>\ue05b;" // LETTER ZA (For Urdu) + "\u095c>\ue05c;" // LETTER DDDHA (pronounced RRA) + "\u095d>\ue05d;" // LETTER RHA (pronounced RRHA) + "\u095e>\ue05e;" // 
LETTER FA + "\u095f>\ue05f;" // LETTER YYA + "\u0960>\ue060;" // LETTER VOCALIC RR + "\u0961>\ue061;" // LETTER VOCALIC LL + "\u0962>\ue062;" // VOWEL SIGN VOCALIC L + "\u0963>\ue063;" // VOWEL SIGN VOCALIC LL +// "\u0964>;" // UNMAPPED Devanagari-InterIndic: DANDA +// "\u0965>;" // UNMAPPED Devanagari-InterIndic: DOUBLE DANDA + "\u0966>\ue066;" // DIGIT ZERO + "\u0967>\ue067;" // DIGIT ONE + "\u0968>\ue068;" // DIGIT TWO + "\u0969>\ue069;" // DIGIT THREE + "\u096a>\ue06a;" // DIGIT FOUR + "\u096b>\ue06b;" // DIGIT FIVE + "\u096c>\ue06c;" // DIGIT SIX + "\u096d>\ue06d;" // DIGIT SEVEN + "\u096e>\ue06e;" // DIGIT EIGHT + "\u096f>\ue06f;" // DIGIT NINE +// "\u0970>;" // UNMAPPED Devanagari-InterIndic: ABBREVIATION SIGN + ":: NFC (NFD) ;" } } diff --git a/icu4c/data/Gujarati_InterIndic.txt b/icu4c/data/Gujarati_InterIndic.txt index 8f9a7ad5c5..631d9ce2d6 100644 --- a/icu4c/data/Gujarati_InterIndic.txt +++ b/icu4c/data/Gujarati_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Gujarati_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Gujarati_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:54 2001 //-------------------------------------------------------------------- // Gujarati_InterIndic -Gujarati_InterIndic { +Gujarati-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,86 +20,86 @@ Gujarati_InterIndic { //-------------------------------------------------------------------- // Gujarati-InterIndic - -"ઁ>\uE001;" // SIGN CANDRABINDU -"ં>\uE002;" // SIGN ANUSVARA -"ઃ>\uE003;" // SIGN VISARGA -"અ>\uE005;" // LETTER A -"આ>\uE006;" // LETTER AA -"ઇ>\uE007;" // LETTER I -"ઈ>\uE008;" // LETTER II -"ઉ>\uE009;" // LETTER U -"ઊ>\uE00A;" // LETTER UU -"ઋ>\uE00B;" // LETTER VOCALIC R -// ઍ>; // UNMAPPED Gujarati-InterIndic: VOWEL CANDRA E -"એ>\uE081;" // LETTER E -"ઐ>\uE010;" // LETTER AI -// ઑ>; // UNMAPPED Gujarati-InterIndic: VOWEL CANDRA O -"ઓ>\uE082;" // LETTER O -"ઔ>\uE014;" // LETTER AU -"ક>\uE015;" // LETTER KA -"ખ>\uE016;" // LETTER KHA -"ગ>\uE017;" // LETTER GA -"ઘ>\uE018;" // LETTER GHA -"ઙ>\uE019;" // LETTER NGA -"ચ>\uE01A;" // LETTER CA -"છ>\uE01B;" // LETTER CHA -"જ>\uE01C;" // LETTER JA -"ઝ>\uE01D;" // LETTER JHA -"ઞ>\uE01E;" // LETTER NYA -"ટ>\uE01F;" // LETTER TTA -"ઠ>\uE020;" // LETTER TTHA -"ડ>\uE021;" // LETTER DDA -"ઢ>\uE022;" // LETTER DDHA -"ણ>\uE023;" // LETTER NNA -"ત>\uE024;" // LETTER TA -"થ>\uE025;" // LETTER THA -"દ>\uE026;" // LETTER DA -"ધ>\uE027;" // LETTER DHA -"ન>\uE028;" // LETTER NA -"પ>\uE02A;" // LETTER PA -"ફ>\uE02B;" // LETTER PHA -"બ>\uE02C;" // LETTER BA -"ભ>\uE02D;" // LETTER BHA -"મ>\uE02E;" // LETTER MA -"ય>\uE02F;" // LETTER YA -"ર>\uE030;" // LETTER 
RA -"લ>\uE032;" // LETTER LA -"ળ>\uE033;" // LETTER LLA -"વ>\uE035;" // LETTER VA -"શ>\uE036;" // LETTER SHA -"ષ>\uE037;" // LETTER SSA -"સ>\uE038;" // LETTER SA -"હ>\uE039;" // LETTER HA -"઼>\uE03C;" // SIGN NUKTA -"ઽ>\uE03D;" // SIGN AVAGRAHA -"ા>\uE03E;" // VOWEL SIGN AA -"િ>\uE03F;" // VOWEL SIGN I -"ી>\uE040;" // VOWEL SIGN II -"ુ>\uE041;" // VOWEL SIGN U -"ૂ>\uE042;" // VOWEL SIGN UU -"ૃ>\uE043;" // VOWEL SIGN VOCALIC R -"ૄ>\uE044;" // VOWEL SIGN VOCALIC RR -"ૅ>\uE045;" // VOWEL SIGN CANDRA E -"ે>\uE084;" // VOWEL SIGN E -"ૈ>\uE048;" // VOWEL SIGN AI -"ૉ>\uE049;" // VOWEL SIGN CANDRA O -"ો>\uE085;" // VOWEL SIGN O -"ૌ>\uE04C;" // VOWEL SIGN AU -"્>\uE04D;" // SIGN VIRAMA -"ૐ>\uE050;" // OM -"ૠ>\uE060;" // LETTER VOCALIC RR -"૦>\uE066;" // DIGIT ZERO -"૧>\uE067;" // DIGIT ONE -"૨>\uE068;" // DIGIT TWO -"૩>\uE069;" // DIGIT THREE -"૪>\uE06A;" // DIGIT FOUR -"૫>\uE06B;" // DIGIT FIVE -"૬>\uE06C;" // DIGIT SIX -"૭>\uE06D;" // DIGIT SEVEN -"૮>\uE06E;" // DIGIT EIGHT -"૯>\uE06F;" // DIGIT NINE - +":: NFD (NFC) ;" +"\u0a81>\ue001;" // SIGN CANDRABINDU +"\u0a82>\ue002;" // SIGN ANUSVARA +"\u0a83>\ue003;" // SIGN VISARGA +"\u0a85>\ue005;" // LETTER A +"\u0a86>\ue006;" // LETTER AA +"\u0a87>\ue007;" // LETTER I +"\u0a88>\ue008;" // LETTER II +"\u0a89>\ue009;" // LETTER U +"\u0a8a>\ue00a;" // LETTER UU +"\u0a8b>\ue00b;" // LETTER VOCALIC R +// \u0a8d>; // UNMAPPED Gujarati-InterIndic: VOWEL CANDRA E +"\u0a8f>\ue00f;" // LETTER E +"\u0a90>\ue010;" // LETTER AI +// \u0a91>; // UNMAPPED Gujarati-InterIndic: VOWEL CANDRA O +"\u0a93>\ue013;" // LETTER O +"\u0a94>\ue014;" // LETTER AU +"\u0a95>\ue015;" // LETTER KA +"\u0a96>\ue016;" // LETTER KHA +"\u0a97>\ue017;" // LETTER GA +"\u0a98>\ue018;" // LETTER GHA +"\u0a99>\ue019;" // LETTER NGA +"\u0a9a>\ue01a;" // LETTER CA +"\u0a9b>\ue01b;" // LETTER CHA +"\u0a9c>\ue01c;" // LETTER JA +"\u0a9d>\ue01d;" // LETTER JHA +"\u0a9e>\ue01e;" // LETTER NYA +"\u0a9f>\ue01f;" // LETTER TTA +"\u0aa0>\ue020;" // LETTER TTHA +"\u0aa1>\ue021;" 
// LETTER DDA +"\u0aa2>\ue022;" // LETTER DDHA +"\u0aa3>\ue023;" // LETTER NNA +"\u0aa4>\ue024;" // LETTER TA +"\u0aa5>\ue025;" // LETTER THA +"\u0aa6>\ue026;" // LETTER DA +"\u0aa7>\ue027;" // LETTER DHA +"\u0aa8>\ue028;" // LETTER NA +"\u0aaa>\ue02a;" // LETTER PA +"\u0aab>\ue02b;" // LETTER PHA +"\u0aac>\ue02c;" // LETTER BA +"\u0aad>\ue02d;" // LETTER BHA +"\u0aae>\ue02e;" // LETTER MA +"\u0aaf>\ue02f;" // LETTER YA +"\u0ab0>\ue030;" // LETTER RA +"\u0ab2>\ue032;" // LETTER LA +"\u0ab3>\ue033;" // LETTER LLA +"\u0ab5>\ue035;" // LETTER VA +"\u0ab6>\ue036;" // LETTER SHA +"\u0ab7>\ue037;" // LETTER SSA +"\u0ab8>\ue038;" // LETTER SA +"\u0ab9>\ue039;" // LETTER HA +"\u0abc>\ue03c;" // SIGN NUKTA +"\u0abd>\ue03d;" // SIGN AVAGRAHA +"\u0abe>\ue03e;" // VOWEL SIGN AA +"\u0abf>\ue03f;" // VOWEL SIGN I +"\u0ac0>\ue040;" // VOWEL SIGN II +"\u0ac1>\ue041;" // VOWEL SIGN U +"\u0ac2>\ue042;" // VOWEL SIGN UU +"\u0ac3>\ue043;" // VOWEL SIGN VOCALIC R +"\u0ac4>\ue044;" // VOWEL SIGN VOCALIC RR +"\u0ac5>\ue045;" // VOWEL SIGN CANDRA E +"\u0ac7>\ue047;" // VOWEL SIGN E +"\u0ac8>\ue048;" // VOWEL SIGN AI +"\u0ac9>\ue049;" // VOWEL SIGN CANDRA O +"\u0acb>\ue04b;" // VOWEL SIGN O +"\u0acc>\ue04c;" // VOWEL SIGN AU +"\u0acd>\ue04d;" // SIGN VIRAMA +"\u0ad0>\ue050;" // OM +"\u0ae0>\ue060;" // LETTER VOCALIC RR +"\u0ae6>\ue066;" // DIGIT ZERO +"\u0ae7>\ue067;" // DIGIT ONE +"\u0ae8>\ue068;" // DIGIT TWO +"\u0ae9>\ue069;" // DIGIT THREE +"\u0aea>\ue06a;" // DIGIT FOUR +"\u0aeb>\ue06b;" // DIGIT FIVE +"\u0aec>\ue06c;" // DIGIT SIX +"\u0aed>\ue06d;" // DIGIT SEVEN +"\u0aee>\ue06e;" // DIGIT EIGHT +"\u0aef>\ue06f;" // DIGIT NINE + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Gurmukhi_InterIndic.txt b/icu4c/data/Gurmukhi_InterIndic.txt index 1c307cff38..6c57bef851 100644 --- a/icu4c/data/Gurmukhi_InterIndic.txt +++ b/icu4c/data/Gurmukhi_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright 
(c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Gurmukhi_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Gurmukhi_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:54 2001 //-------------------------------------------------------------------- // Gurmukhi_InterIndic -Gurmukhi_InterIndic { +Gurmukhi-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,83 +20,83 @@ Gurmukhi_InterIndic { //-------------------------------------------------------------------- // Gurmukhi-InterIndic - -"ਂ>\uE001;" // REMAP (indicExceptions.txt): ਁ>ਂ = SIGN CANDRABINDU>SIGN BINDI -"ਅ>\uE005;" // LETTER A -"ਆ>\uE006;" // LETTER AA -"ਇ>\uE007;" // LETTER I -"ਈ>\uE008;" // LETTER II -"ਉ>\uE009;" // LETTER U -"ਊ>\uE00A;" // LETTER UU -"ਏ>\uE00F;" // LETTER EE -"ਐ>\uE010;" // LETTER AI -"ਓ>\uE013;" // LETTER OO -"ਔ>\uE014;" // LETTER AU -"ਕ>\uE015;" // LETTER KA -"ਖ>\uE016;" // LETTER KHA -"ਗ>\uE017;" // LETTER GA -"ਘ>\uE018;" // LETTER GHA -"ਙ>\uE019;" // LETTER NGA -"ਚ>\uE01A;" // LETTER CA -"ਛ>\uE01B;" // LETTER CHA -"ਜ>\uE01C;" // LETTER JA -"ਝ>\uE01D;" // LETTER JHA -"ਞ>\uE01E;" // LETTER NYA -"ਟ>\uE01F;" // LETTER TTA -"ਠ>\uE020;" // LETTER TTHA -"ਡ>\uE021;" // LETTER DDA -"ਢ>\uE022;" // LETTER DDHA -"ਣ>\uE023;" // LETTER NNA -"ਤ>\uE024;" // LETTER TA -"ਥ>\uE025;" // LETTER THA -"ਦ>\uE026;" // LETTER DA -"ਧ>\uE027;" // LETTER DHA -"ਨ>\uE028;" // LETTER NA -"ਪ>\uE02A;" // LETTER PA -"ਫ>\uE02B;" // LETTER PHA -"ਬ>\uE02C;" // LETTER BA -"ਭ>\uE02D;" // LETTER BHA -"ਮ>\uE02E;" // LETTER MA -"ਯ>\uE02F;" // LETTER YA -"ਰ>\uE030;" // LETTER RA -"ਲ>\uE032;" // LETTER LA -"ਲ਼>\uE033;" // LETTER LLA 
-"ਵ>\uE035;" // LETTER VA -"ਸ਼>\uE036;" // LETTER SHA -"ਸ>\uE038;" // LETTER SA -"ਹ>\uE039;" // LETTER HA -"਼>\uE03C;" // SIGN NUKTA -"ਾ>\uE03E;" // VOWEL SIGN AA -"ਿ>\uE03F;" // VOWEL SIGN I -"ੀ>\uE040;" // VOWEL SIGN II -"ੁ>\uE041;" // VOWEL SIGN U -"ੂ>\uE042;" // VOWEL SIGN UU -"ੇ>\uE047;" // VOWEL SIGN EE -"ੈ>\uE048;" // VOWEL SIGN AI -"ੋ>\uE04B;" // VOWEL SIGN OO -"ੌ>\uE04C;" // VOWEL SIGN AU -"੍>\uE04D;" // SIGN VIRAMA -"ਖ਼>\uE059;" // LETTER KHHA -"ਗ਼>\uE05A;" // LETTER GHHA -"ਜ਼>\uE05B;" // LETTER ZA -"ੜ>\uE083;" // LETTER RRA -"ਫ਼>\uE05E;" // LETTER FA -"੦>\uE066;" // DIGIT ZERO -"੧>\uE067;" // DIGIT ONE -"੨>\uE068;" // DIGIT TWO -"੩>\uE069;" // DIGIT THREE -"੪>\uE06A;" // DIGIT FOUR -"੫>\uE06B;" // DIGIT FIVE -"੬>\uE06C;" // DIGIT SIX -"੭>\uE06D;" // DIGIT SEVEN -"੮>\uE06E;" // DIGIT EIGHT -"੯>\uE06F;" // DIGIT NINE -// ੰ>; // UNMAPPED Gurmukhi-InterIndic: TIPPI -// ੱ>; // UNMAPPED Gurmukhi-InterIndic: ADDAK -// ੲ>; // UNMAPPED Gurmukhi-InterIndic: IRI -// ੳ>; // UNMAPPED Gurmukhi-InterIndic: URA -// ੴ>; // UNMAPPED Gurmukhi-InterIndic: EK ONKAR - +":: NFD (NFC) ;" +"\u0a02>\ue001;" // REMAP (indicExceptions.txt): \u0a01>\u0a02 = SIGN CANDRABINDU>SIGN BINDI +"\u0a05>\ue005;" // LETTER A +"\u0a06>\ue006;" // LETTER AA +"\u0a07>\ue007;" // LETTER I +"\u0a08>\ue008;" // LETTER II +"\u0a09>\ue009;" // LETTER U +"\u0a0a>\ue00a;" // LETTER UU +"\u0a0f>\ue00f;" // LETTER EE +"\u0a10>\ue010;" // LETTER AI +"\u0a13>\ue013;" // LETTER OO +"\u0a14>\ue014;" // LETTER AU +"\u0a15>\ue015;" // LETTER KA +"\u0a16>\ue016;" // LETTER KHA +"\u0a17>\ue017;" // LETTER GA +"\u0a18>\ue018;" // LETTER GHA +"\u0a19>\ue019;" // LETTER NGA +"\u0a1a>\ue01a;" // LETTER CA +"\u0a1b>\ue01b;" // LETTER CHA +"\u0a1c>\ue01c;" // LETTER JA +"\u0a1d>\ue01d;" // LETTER JHA +"\u0a1e>\ue01e;" // LETTER NYA +"\u0a1f>\ue01f;" // LETTER TTA +"\u0a20>\ue020;" // LETTER TTHA +"\u0a21>\ue021;" // LETTER DDA +"\u0a22>\ue022;" // LETTER DDHA +"\u0a23>\ue023;" // LETTER NNA +"\u0a24>\ue024;" // LETTER 
TA +"\u0a25>\ue025;" // LETTER THA +"\u0a26>\ue026;" // LETTER DA +"\u0a27>\ue027;" // LETTER DHA +"\u0a28>\ue028;" // LETTER NA +"\u0a2a>\ue02a;" // LETTER PA +"\u0a2b>\ue02b;" // LETTER PHA +"\u0a2c>\ue02c;" // LETTER BA +"\u0a2d>\ue02d;" // LETTER BHA +"\u0a2e>\ue02e;" // LETTER MA +"\u0a2f>\ue02f;" // LETTER YA +"\u0a30>\ue030;" // LETTER RA +"\u0a32>\ue032;" // LETTER LA +"\u0a33>\ue033;" // LETTER LLA +"\u0a35>\ue035;" // LETTER VA +"\u0a36>\ue036;" // LETTER SHA +"\u0a38>\ue038;" // LETTER SA +"\u0a39>\ue039;" // LETTER HA +"\u0a3c>\ue03c;" // SIGN NUKTA +"\u0a3e>\ue03e;" // VOWEL SIGN AA +"\u0a3f>\ue03f;" // VOWEL SIGN I +"\u0a40>\ue040;" // VOWEL SIGN II +"\u0a41>\ue041;" // VOWEL SIGN U +"\u0a42>\ue042;" // VOWEL SIGN UU +"\u0a47>\ue047;" // VOWEL SIGN EE +"\u0a48>\ue048;" // VOWEL SIGN AI +"\u0a4b>\ue04b;" // VOWEL SIGN OO +"\u0a4c>\ue04c;" // VOWEL SIGN AU +"\u0a4d>\ue04d;" // SIGN VIRAMA +"\u0a59>\ue059;" // LETTER KHHA +"\u0a5a>\ue05a;" // LETTER GHHA +"\u0a5b>\ue05b;" // LETTER ZA +"\u0a5c>\ue05c;" // LETTER RRA +"\u0a5e>\ue05e;" // LETTER FA +"\u0a66>\ue066;" // DIGIT ZERO +"\u0a67>\ue067;" // DIGIT ONE +"\u0a68>\ue068;" // DIGIT TWO +"\u0a69>\ue069;" // DIGIT THREE +"\u0a6a>\ue06a;" // DIGIT FOUR +"\u0a6b>\ue06b;" // DIGIT FIVE +"\u0a6c>\ue06c;" // DIGIT SIX +"\u0a6d>\ue06d;" // DIGIT SEVEN +"\u0a6e>\ue06e;" // DIGIT EIGHT +"\u0a6f>\ue06f;" // DIGIT NINE +// \u0a70>; // UNMAPPED Gurmukhi-InterIndic: TIPPI +// \u0a71>; // UNMAPPED Gurmukhi-InterIndic: ADDAK +// \u0a72>; // UNMAPPED Gurmukhi-InterIndic: IRI +// \u0a73>; // UNMAPPED Gurmukhi-InterIndic: URA +// \u0a74>; // UNMAPPED Gurmukhi-InterIndic: EK ONKAR + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Bengali.txt b/icu4c/data/InterIndic_Bengali.txt index 23c8e0bc8b..86f17860a3 100644 --- a/icu4c/data/InterIndic_Bengali.txt +++ b/icu4c/data/InterIndic_Bengali.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- 
// Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Bengali.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Bengali.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Bengali -InterIndic_Bengali { +InterIndic-Bengali { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Bengali { //-------------------------------------------------------------------- // InterIndic-Bengali - -"\uE001>ঁ;" // SIGN CANDRABINDU -"\uE002>ং;" // SIGN ANUSVARA -"\uE003>ঃ;" // SIGN VISARGA -"\uE005>অ;" // LETTER A -"\uE006>আ;" // LETTER AA -"\uE007>ই;" // LETTER I -"\uE008>ঈ;" // LETTER II -"\uE009>উ;" // LETTER U -"\uE00A>ঊ;" // LETTER UU -"\uE00B>ঋ;" // LETTER VOCALIC R -"\uE00C>ঌ;" // LETTER VOCALIC L -// \uE00F>; // UNMAPPED InterIndic-Bengali: LETTER EE (এ = LETTER E) -"\uE010>ঐ;" // LETTER AI -// \uE013>; // UNMAPPED InterIndic-Bengali: LETTER OO (ও = LETTER O) -"\uE014>ঔ;" // LETTER AU -"\uE015>ক;" // LETTER KA -"\uE016>খ;" // LETTER KHA -"\uE017>গ;" // LETTER GA -"\uE018>ঘ;" // LETTER GHA -"\uE019>ঙ;" // LETTER NGA -"\uE01A>চ;" // LETTER CA -"\uE01B>ছ;" // LETTER CHA -"\uE01C>জ;" // LETTER JA -"\uE01D>ঝ;" // LETTER JHA -"\uE01E>ঞ;" // LETTER NYA -"\uE01F>ট;" // LETTER TTA -"\uE020>ঠ;" // LETTER TTHA -"\uE021>ড;" // LETTER DDA -"\uE022>ঢ;" // LETTER DDHA -"\uE023>ণ;" // LETTER NNA -"\uE024>ত;" // LETTER TA -"\uE025>থ;" // LETTER THA -"\uE026>দ;" // LETTER DA -"\uE027>ধ;" // LETTER DHA -"\uE028>ন;" // LETTER NA -"\uE029>ন;" // REMAP (indicExceptions.txt): ঩>ন = LETTER 
NNNA>LETTER NA -"\uE02A>প;" // LETTER PA -"\uE02B>ফ;" // LETTER PHA -"\uE02C>ব;" // LETTER BA -"\uE02D>ভ;" // LETTER BHA -"\uE02E>ম;" // LETTER MA -"\uE02F>য;" // LETTER YA -"\uE030>র;" // LETTER RA -"\uE032>ল;" // LETTER LA -"\uE033>ল;" // REMAP (indicExceptions.txt): ঳>ল = LETTER LLA>LETTER LA -"\uE034>ল;" // REMAP (indicExceptions.txt): ঴>ল = LETTER LLLA>LETTER LA -"\uE035>ব;" // REMAP (indicExceptions.txt): ঵>ব = LETTER VA>LETTER BA -"\uE036>শ;" // LETTER SHA -"\uE037>ষ;" // LETTER SSA -"\uE038>স;" // LETTER SA -"\uE039>হ;" // LETTER HA -"\uE03C>়;" // SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Bengali: SIGN AVAGRAHA -"\uE03E>া;" // VOWEL SIGN AA -"\uE03F>ি;" // VOWEL SIGN I -"\uE040>ী;" // VOWEL SIGN II -"\uE041>ু;" // VOWEL SIGN U -"\uE042>ূ;" // VOWEL SIGN UU -"\uE043>ৃ;" // VOWEL SIGN VOCALIC R -"\uE044>ৄ;" // VOWEL SIGN VOCALIC RR -"\uE045>ে;" // REMAP (indicExceptions.txt): ৅>ে = VOWEL SIGN CANDRA E>VOWEL SIGN E -// \uE047>; // UNMAPPED InterIndic-Bengali: VOWEL SIGN EE (ে = VOWEL SIGN E) -"\uE048>ৈ;" // VOWEL SIGN AI -"\uE049>ো;" // REMAP (indicExceptions.txt): ৉>ো = VOWEL SIGN CANDRA O>VOWEL SIGN O -// \uE04B>; // UNMAPPED InterIndic-Bengali: VOWEL SIGN OO (ো = VOWEL SIGN O) -"\uE04C>ৌ;" // VOWEL SIGN AU -"\uE04D>্;" // SIGN VIRAMA -// \uE050>; // UNMAPPED InterIndic-Bengali: OM -// \uE055>; // UNMAPPED InterIndic-Bengali: LENGTH MARK -"\uE056>ৈ;" // REMAP (indicExceptions.txt): ৖>ৈ = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ৗ;" // AU LENGTH MARK -"\uE059>খ;" // REMAP (indicExceptions.txt): ৙>খ = LETTER KHHA>LETTER KHA -"\uE05A>গ;" // REMAP (indicExceptions.txt): ৚>গ = LETTER GHHA>LETTER GA -"\uE05B>জ;" // REMAP (indicExceptions.txt): ৛>জ = LETTER ZA>LETTER JA -"\uE05D>ঢ়;" // LETTER RHA -"\uE05E>ফ;" // REMAP (indicExceptions.txt): ৞>ফ = LETTER FA>LETTER PHA -"\uE05F>য়;" // LETTER YYA -"\uE060>ৠ;" // LETTER VOCALIC RR -"\uE061>ৡ;" // LETTER VOCALIC LL -"\uE062>ৢ;" // VOWEL SIGN VOCALIC L -"\uE063>ৣ;" // VOWEL SIGN VOCALIC LL -"\uE066>০;" // DIGIT ZERO 
-"\uE067>১;" // DIGIT ONE -"\uE068>২;" // DIGIT TWO -"\uE069>৩;" // DIGIT THREE -"\uE06A>৪;" // DIGIT FOUR -"\uE06B>৫;" // DIGIT FIVE -"\uE06C>৬;" // DIGIT SIX -"\uE06D>৭;" // DIGIT SEVEN -"\uE06E>৮;" // DIGIT EIGHT -"\uE06F>৯;" // DIGIT NINE -"\uE080>৺;" // ISSHAR -"\uE081>এ;" // LETTER E -"\uE082>ও;" // LETTER O -"\uE083>ড়;" // LETTER RRA -"\uE084>ে;" // VOWEL SIGN E -"\uE085>ো;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0981;" // SIGN CANDRABINDU +"\ue002>\u0982;" // SIGN ANUSVARA +"\ue003>\u0983;" // SIGN VISARGA +"\ue005>\u0985;" // LETTER A +"\ue006>\u0986;" // LETTER AA +"\ue007>\u0987;" // LETTER I +"\ue008>\u0988;" // LETTER II +"\ue009>\u0989;" // LETTER U +"\ue00a>\u098a;" // LETTER UU +"\ue00b>\u098b;" // LETTER VOCALIC R +"\ue00c>\u098c;" // LETTER VOCALIC L +// \ue00f>; // UNMAPPED InterIndic-Bengali: LETTER EE (\u098f = LETTER E) +"\ue010>\u0990;" // LETTER AI +// \ue013>; // UNMAPPED InterIndic-Bengali: LETTER OO (\u0993 = LETTER O) +"\ue014>\u0994;" // LETTER AU +"\ue015>\u0995;" // LETTER KA +"\ue016>\u0996;" // LETTER KHA +"\ue017>\u0997;" // LETTER GA +"\ue018>\u0998;" // LETTER GHA +"\ue019>\u0999;" // LETTER NGA +"\ue01a>\u099a;" // LETTER CA +"\ue01b>\u099b;" // LETTER CHA +"\ue01c>\u099c;" // LETTER JA +"\ue01d>\u099d;" // LETTER JHA +"\ue01e>\u099e;" // LETTER NYA +"\ue01f>\u099f;" // LETTER TTA +"\ue020>\u09a0;" // LETTER TTHA +"\ue021>\u09a1;" // LETTER DDA +"\ue022>\u09a2;" // LETTER DDHA +"\ue023>\u09a3;" // LETTER NNA +"\ue024>\u09a4;" // LETTER TA +"\ue025>\u09a5;" // LETTER THA +"\ue026>\u09a6;" // LETTER DA +"\ue027>\u09a7;" // LETTER DHA +"\ue028>\u09a8;" // LETTER NA +"\ue029>\u09a8;" // REMAP (indicExceptions.txt): \u09a9>\u09a8 = LETTER NNNA>LETTER NA +"\ue02a>\u09aa;" // LETTER PA +"\ue02b>\u09ab;" // LETTER PHA +"\ue02c>\u09ac;" // LETTER BA +"\ue02d>\u09ad;" // LETTER BHA +"\ue02e>\u09ae;" // LETTER MA +"\ue02f>\u09af;" // LETTER YA +"\ue030>\u09b0;" // LETTER RA +"\ue032>\u09b2;" // LETTER LA +"\ue033>\u09b2;" // REMAP 
(indicExceptions.txt): \u09b3>\u09b2 = LETTER LLA>LETTER LA +"\ue034>\u09b2;" // REMAP (indicExceptions.txt): \u09b4>\u09b2 = LETTER LLLA>LETTER LA +"\ue035>\u09ac;" // REMAP (indicExceptions.txt): \u09b5>\u09ac = LETTER VA>LETTER BA +"\ue036>\u09b6;" // LETTER SHA +"\ue037>\u09b7;" // LETTER SSA +"\ue038>\u09b8;" // LETTER SA +"\ue039>\u09b9;" // LETTER HA +"\ue03c>\u09bc;" // SIGN NUKTA +// \ue03d>; // UNMAPPED InterIndic-Bengali: SIGN AVAGRAHA +"\ue03e>\u09be;" // VOWEL SIGN AA +"\ue03f>\u09bf;" // VOWEL SIGN I +"\ue040>\u09c0;" // VOWEL SIGN II +"\ue041>\u09c1;" // VOWEL SIGN U +"\ue042>\u09c2;" // VOWEL SIGN UU +"\ue043>\u09c3;" // VOWEL SIGN VOCALIC R +"\ue044>\u09c4;" // VOWEL SIGN VOCALIC RR +"\ue045>\u09c7;" // REMAP (indicExceptions.txt): \u09c5>\u09c7 = VOWEL SIGN CANDRA E>VOWEL SIGN E +// \ue047>; // UNMAPPED InterIndic-Bengali: VOWEL SIGN EE (\u09c7 = VOWEL SIGN E) +"\ue048>\u09c8;" // VOWEL SIGN AI +"\ue049>\u09cb;" // REMAP (indicExceptions.txt): \u09c9>\u09cb = VOWEL SIGN CANDRA O>VOWEL SIGN O +// \ue04b>; // UNMAPPED InterIndic-Bengali: VOWEL SIGN OO (\u09cb = VOWEL SIGN O) +"\ue04c>\u09cc;" // VOWEL SIGN AU +"\ue04d>\u09cd;" // SIGN VIRAMA +// \ue050>; // UNMAPPED InterIndic-Bengali: OM +// \ue055>; // UNMAPPED InterIndic-Bengali: LENGTH MARK +"\ue056>\u09c8;" // REMAP (indicExceptions.txt): \u09d6>\u09c8 = AI LENGTH MARK>VOWEL SIGN AI +"\ue057>\u09d7;" // AU LENGTH MARK +"\ue059>\u0996;" // REMAP (indicExceptions.txt): \u09d9>\u0996 = LETTER KHHA>LETTER KHA +"\ue05a>\u0997;" // REMAP (indicExceptions.txt): \u09da>\u0997 = LETTER GHHA>LETTER GA +"\ue05b>\u099c;" // REMAP (indicExceptions.txt): \u09db>\u099c = LETTER ZA>LETTER JA +"\ue05d>\u09dd;" // LETTER RHA +"\ue05e>\u09ab;" // REMAP (indicExceptions.txt): \u09de>\u09ab = LETTER FA>LETTER PHA +"\ue05f>\u09df;" // LETTER YYA +"\ue060>\u09e0;" // LETTER VOCALIC RR +"\ue061>\u09e1;" // LETTER VOCALIC LL +"\ue062>\u09e2;" // VOWEL SIGN VOCALIC L +"\ue063>\u09e3;" // VOWEL SIGN VOCALIC LL 
+"\ue066>\u09e6;" // DIGIT ZERO +"\ue067>\u09e7;" // DIGIT ONE +"\ue068>\u09e8;" // DIGIT TWO +"\ue069>\u09e9;" // DIGIT THREE +"\ue06a>\u09ea;" // DIGIT FOUR +"\ue06b>\u09eb;" // DIGIT FIVE +"\ue06c>\u09ec;" // DIGIT SIX +"\ue06d>\u09ed;" // DIGIT SEVEN +"\ue06e>\u09ee;" // DIGIT EIGHT +"\ue06f>\u09ef;" // DIGIT NINE +"\ue0fa>\u09fa;" // ISSHAR +"\ue00f>\u098f;" // LETTER E +"\ue013>\u0993;" // LETTER O +"\ue031>\u09dc;" // LETTER RRA +"\ue047>\u09c7;" // VOWEL SIGN E +"\ue04b>\u09cb;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Devanagari.txt b/icu4c/data/InterIndic_Devanagari.txt index 3058e06680..43363a1fd3 100644 --- a/icu4c/data/InterIndic_Devanagari.txt +++ b/icu4c/data/InterIndic_Devanagari.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Devanagari.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Devanagari.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Devanagari -InterIndic_Devanagari { +InterIndic-Devanagari { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -22,104 +21,131 @@ InterIndic_Devanagari { // InterIndic-Devanagari -"\uE001>ँ;" // SIGN CANDRABINDU -"\uE002>ं;" // SIGN ANUSVARA -"\uE003>ः;" // SIGN VISARGA -"\uE005>अ;" // LETTER A -"\uE006>आ;" // LETTER AA -"\uE007>इ;" // LETTER I -"\uE008>ई;" // LETTER II -"\uE009>उ;" // LETTER U -"\uE00A>ऊ;" // LETTER UU -"\uE00B>ऋ;" // LETTER VOCALIC R -"\uE00C>ऌ;" 
// LETTER VOCALIC L -// \uE00F>; // UNMAPPED InterIndic-Devanagari: LETTER EE (ए = LETTER E) -"\uE010>ऐ;" // LETTER AI -// \uE013>; // UNMAPPED InterIndic-Devanagari: LETTER OO (ओ = LETTER O) -"\uE014>औ;" // LETTER AU -"\uE015>क;" // LETTER KA -"\uE016>ख;" // LETTER KHA -"\uE017>ग;" // LETTER GA -"\uE018>घ;" // LETTER GHA -"\uE019>ङ;" // LETTER NGA -"\uE01A>च;" // LETTER CA -"\uE01B>छ;" // LETTER CHA -"\uE01C>ज;" // LETTER JA -"\uE01D>झ;" // LETTER JHA -"\uE01E>ञ;" // LETTER NYA -"\uE01F>ट;" // LETTER TTA -"\uE020>ठ;" // LETTER TTHA -"\uE021>ड;" // LETTER DDA -"\uE022>ढ;" // LETTER DDHA -"\uE023>ण;" // LETTER NNA -"\uE024>त;" // LETTER TA -"\uE025>थ;" // LETTER THA -"\uE026>द;" // LETTER DA -"\uE027>ध;" // LETTER DHA -"\uE028>न;" // LETTER NA -"\uE029>ऩ;" // LETTER NNNA -"\uE02A>प;" // LETTER PA -"\uE02B>फ;" // LETTER PHA -"\uE02C>ब;" // LETTER BA -"\uE02D>भ;" // LETTER BHA -"\uE02E>म;" // LETTER MA -"\uE02F>य;" // LETTER YA -"\uE030>र;" // LETTER RA -"\uE032>ल;" // LETTER LA -"\uE033>ळ;" // LETTER LLA -"\uE034>ऴ;" // LETTER LLLA -"\uE035>व;" // LETTER VA -"\uE036>श;" // LETTER SHA -"\uE037>ष;" // LETTER SSA -"\uE038>स;" // LETTER SA -"\uE039>ह;" // LETTER HA -"\uE03C>़;" // SIGN NUKTA -"\uE03D>ऽ;" // SIGN AVAGRAHA -"\uE03E>ा;" // VOWEL SIGN AA -"\uE03F>ि;" // VOWEL SIGN I -"\uE040>ी;" // VOWEL SIGN II -"\uE041>ु;" // VOWEL SIGN U -"\uE042>ू;" // VOWEL SIGN UU -"\uE043>ृ;" // VOWEL SIGN VOCALIC R -"\uE044>ॄ;" // VOWEL SIGN VOCALIC RR -"\uE045>ॅ;" // VOWEL SIGN CANDRA E -// \uE047>; // UNMAPPED InterIndic-Devanagari: VOWEL SIGN EE (े = VOWEL SIGN E) -"\uE048>ै;" // VOWEL SIGN AI -"\uE049>ॉ;" // VOWEL SIGN CANDRA O -// \uE04B>; // UNMAPPED InterIndic-Devanagari: VOWEL SIGN OO (ो = VOWEL SIGN O) -"\uE04C>ौ;" // VOWEL SIGN AU -"\uE04D>्;" // SIGN VIRAMA -"\uE050>ॐ;" // OM -// \uE055>; // UNMAPPED InterIndic-Devanagari: LENGTH MARK -"\uE056>ै;" // REMAP (indicExceptions.txt): ॖ>ै = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ौ;" // REMAP (indicExceptions.txt): ॗ>ौ = AU LENGTH 
MARK>VOWEL SIGN AU -"\uE059>ख़;" // LETTER KHHA -"\uE05A>ग़;" // LETTER GHHA -"\uE05B>ज़;" // LETTER ZA -"\uE05D>ढ़;" // LETTER RHA -"\uE05E>फ़;" // LETTER FA -"\uE05F>य़;" // LETTER YYA -"\uE060>ॠ;" // LETTER VOCALIC RR -"\uE061>ॡ;" // LETTER VOCALIC LL -"\uE062>ॢ;" // VOWEL SIGN VOCALIC L -"\uE063>ॣ;" // VOWEL SIGN VOCALIC LL -"\uE066>०;" // DIGIT ZERO -"\uE067>१;" // DIGIT ONE -"\uE068>२;" // DIGIT TWO -"\uE069>३;" // DIGIT THREE -"\uE06A>४;" // DIGIT FOUR -"\uE06B>५;" // DIGIT FIVE -"\uE06C>६;" // DIGIT SIX -"\uE06D>७;" // DIGIT SEVEN -"\uE06E>८;" // DIGIT EIGHT -"\uE06F>९;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Devanagari: ISSHAR -"\uE081>ए;" // LETTER E -"\uE082>ओ;" // LETTER O -"\uE083>ऱ;" // LETTER RRA -"\uE084>े;" // VOWEL SIGN E -"\uE085>ो;" // VOWEL SIGN O +":: NFD (NFC) ;" +//Rules for Decomposed characters + "\ue028\ue03c > \u0929;" //\ue029 + "\ue030\ue03c > \u0931;" //\ue031 + "\ue033\ue03c > \u0934;" //\ue034 + "\ue015\ue03c > \u0958;" //\ue058 LETTER QA (For Urdu) + "\ue016\ue03c > \u0959;" //\ue059 LETTER KHHA (For Urdu) + "\ue017\ue03c > \u095a;" //\ue05a LETTER GHHA (For Urdu) + "\ue01c\ue03c > \u095b;" //\ue05b LETTER ZA (For Urdu) + "\ue021\ue03c > \u095c;" //\ue05c LETTER DDDHA (pronounced RRA) + "\ue022\ue03c > \u095d;" //\ue05d LETTER RHA (pronounced RRHA) + "\ue02b\ue03c > \u095e;" //\ue05e LETTER FA + "\ue02f\ue03c > \u095f;" //\ue05f LETTER YYA + "\ue001 > \u0901;" // SIGN CANDRABINDU + "\ue002 > \u0902;" // SIGN ANUSVARA + "\ue003 > \u0903;" // SIGN VISARGA + "\ue005 > \u0905;" // LETTER A + "\ue006 > \u0906;" // LETTER AA + "\ue007 > \u0907;" // LETTER I + "\ue008 > \u0908;" // LETTER II + "\ue009 > \u0909;" // LETTER U + "\ue00a > \u090a;" // LETTER UU + "\ue00b > \u090b;" // LETTER VOCALIC R + "\ue00c > \u090c;" // LETTER VOCALIC L + "\ue00d > \u090d;" // LETTER CANDRA E (For representing English sounds) +//"\ue00e > \u090e;" // UNMAPPED LETTER SHORT E(For Southern Scripts) + "\ue00e > \u090f;" + "\ue00f > \u090f;" // 
LETTER E + "\ue010 > \u0910;" // LETTER AI + "\ue011 > \u0911;" // LETTER CANDRA O (For representing English sounds) +//"\ue012 > \u0912;" // UNMAPPED LETTER SHORT O (For Southern Scripts) + "\ue012 > \u0913;" + "\ue013 > \u0913;" // LETTER O + "\ue014 > \u0914;" // LETTER AU + "\ue015 > \u0915;" // LETTER KA + "\ue016 > \u0916;" // LETTER KHA + "\ue017 > \u0917;" // LETTER GA + "\ue018 > \u0918;" // LETTER GHA + "\ue019 > \u0919;" // LETTER NGA + "\ue01a > \u091a;" // LETTER CA + "\ue01b > \u091b;" // LETTER CHA + "\ue01c > \u091c;" // LETTER JA + "\ue01d > \u091d;" // LETTER JHA + "\ue01e > \u091e;" // LETTER NYA + "\ue01f > \u091f;" // LETTER TTA + "\ue020 > \u0920;" // LETTER TTHA + "\ue021 > \u0921;" // LETTER DDA + "\ue022 > \u0922;" // LETTER DDHA + "\ue023 > \u0923;" // LETTER NNA + "\ue024 > \u0924;" // LETTER TA + "\ue025 > \u0925;" // LETTER THA + "\ue026 > \u0926;" // LETTER DA + "\ue027 > \u0927;" // LETTER DHA + "\ue028 > \u0928;" // LETTER NA + "\ue029 > \u0929;" // LETTER NNNA + "\ue02a > \u092a;" // LETTER PA + "\ue02b > \u092b;" // LETTER PHA + "\ue02c > \u092c;" // LETTER BA + "\ue02d > \u092d;" // LETTER BHA + "\ue02e > \u092e;" // LETTER MA + "\ue02f > \u092f;" // LETTER YA + "\ue030 > \u0930;" // LETTER RA + //"\ue031 > \u0931;" // LETTER RRA (Eyelash RA for Southern scripts) + "\ue031 > \u0930;" + "\ue032 > \u0932;" // LETTER LA + "\ue033 > \u0933;" // LETTER LLA + //"\ue034 > \u0934;" // LETTER LLLA (LLLA for Southern scripts) + "\ue034 > \u0933;" + "\ue035 > \u0935;" // LETTER VA + "\ue036 > \u0936;" // LETTER SHA + "\ue037 > \u0937;" // LETTER SSA + "\ue038 > \u0938;" // LETTER SA + "\ue039 > \u0939;" // LETTER HA + "\ue03c > \u093c;" // SIGN NUKTA + "\ue03d > \u093d;" // SIGN AVAGRAHA + "\ue03e > \u093e;" // VOWEL SIGN AA + "\ue03f > \u093f;" // VOWEL SIGN I + "\ue040 > \u0940;" // VOWEL SIGN II + "\ue041 > \u0941;" // VOWEL SIGN U + "\ue042 > \u0942;" // VOWEL SIGN UU + "\ue043 > \u0943;" // VOWEL SIGN VOCALIC R + "\ue044 > \u0944;" // 
VOWEL SIGN VOCALIC RR + "\ue045 > \u0945;" // VOWEL SIGN CANDRA E +//"\ue046 > \u0946;" // UNMAPPED VOWEL SIGN SHORT E + "\ue046 > \u0947;" + "\ue047 > \u0947;" // VOWEL SIGN E + "\ue048 > \u0948;" // VOWEL SIGN AI + "\ue049 > \u0949;" // VOWEL SIGN CANDRA O +//"\ue04a > \u094a;" // UNMAPPED VOWEL SIGN SHORT O + "\ue04a > \u094b;" + "\ue04b > \u094b;" // VOWEL SIGN O + "\ue04c > \u094c;" // VOWEL SIGN AU + "\ue04d > \u094d;" // SIGN VIRAMA + "\ue050 > \u0950;" // OM +// \u0951 // UNMAPPED STRESS SIGN UDATTA +// \u0952 // UNMAPPED STRESS SIGN ANUDATTA +// \u0953 // UNMAPPED GRAVE ACCENT +// \u0954 // UNMAPPED ACUTE ACCENT + "\ue058 > \u0958;" // LETTER QA (For Urdu) + "\ue059 > \u0959;" // LETTER KHHA (For Urdu) + "\ue05a > \u095a;" // LETTER GHHA (For Urdu) + "\ue05b > \u095b;" // LETTER ZA (For Urdu) + "\ue05c > \u095c;" // LETTER DDDHA (pronounced RRA) + "\ue05d > \u095d;" // LETTER RHA (pronounced RRHA) + "\ue05e > \u095e;" // LETTER FA + "\ue05f > \u095f;" // LETTER YYA + "\ue060 > \u0960;" // LETTER VOCALIC RR + "\ue061 > \u0961;" // LETTER VOCALIC LL + "\ue062 > \u0962;" // VOWEL SIGN VOCALIC L + "\ue063 > \u0963;" // VOWEL SIGN VOCALIC LL +// > ;" \u0964 // UNMAPPED Devanagari-InterIndic: DANDA +// > ;" \u0965 // UNMAPPED Devanagari-InterIndic: DOUBLE DANDA + "\ue066 > \u0966;" // DIGIT ZERO + "\ue067 > \u0967;" // DIGIT ONE + "\ue068 > \u0968;" // DIGIT TWO + "\ue069 > \u0969;" // DIGIT THREE + "\ue06a > \u096a;" // DIGIT FOUR + "\ue06b > \u096b;" // DIGIT FIVE + "\ue06c > \u096c;" // DIGIT SIX + "\ue06d > \u096d;" // DIGIT SEVEN + "\ue06e > \u096e;" // DIGIT EIGHT + "\ue06f > \u096f;" // DIGIT NINE +// \u0970 // UNMAPPED Devanagari-InterIndic: ABBREVIATION SIGN + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Gujarati.txt b/icu4c/data/InterIndic_Gujarati.txt index 76fc332089..8de6e71abc 100644 --- a/icu4c/data/InterIndic_Gujarati.txt +++ b/icu4c/data/InterIndic_Gujarati.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- 
//-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Gujarati.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Gujarati.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Gujarati -InterIndic_Gujarati { +InterIndic-Gujarati { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Gujarati { //-------------------------------------------------------------------- // InterIndic-Gujarati - -"\uE001>ઁ;" // SIGN CANDRABINDU -"\uE002>ં;" // SIGN ANUSVARA -"\uE003>ઃ;" // SIGN VISARGA -"\uE005>અ;" // LETTER A -"\uE006>આ;" // LETTER AA -"\uE007>ઇ;" // LETTER I -"\uE008>ઈ;" // LETTER II -"\uE009>ઉ;" // LETTER U -"\uE00A>ઊ;" // LETTER UU -"\uE00B>ઋ;" // LETTER VOCALIC R -"\uE00C>લૃ;" // REMAP (indicExceptions.txt): ઌ>લૃ = LETTER VOCALIC L>LETTER LA.VOWEL SIGN VOCALIC R -// \uE00F>; // UNMAPPED InterIndic-Gujarati: LETTER EE (એ = LETTER E) -"\uE010>ઐ;" // LETTER AI -// \uE013>; // UNMAPPED InterIndic-Gujarati: LETTER OO (ઓ = LETTER O) -"\uE014>ઔ;" // LETTER AU -"\uE015>ક;" // LETTER KA -"\uE016>ખ;" // LETTER KHA -"\uE017>ગ;" // LETTER GA -"\uE018>ઘ;" // LETTER GHA -"\uE019>ઙ;" // LETTER NGA -"\uE01A>ચ;" // LETTER CA -"\uE01B>છ;" // LETTER CHA -"\uE01C>જ;" // LETTER JA -"\uE01D>ઝ;" // LETTER JHA -"\uE01E>ઞ;" // LETTER NYA -"\uE01F>ટ;" // LETTER TTA -"\uE020>ઠ;" // LETTER TTHA -"\uE021>ડ;" // LETTER DDA -"\uE022>ઢ;" // LETTER DDHA -"\uE023>ણ;" // LETTER NNA -"\uE024>ત;" // LETTER TA -"\uE025>થ;" // LETTER 
THA -"\uE026>દ;" // LETTER DA -"\uE027>ધ;" // LETTER DHA -"\uE028>ન;" // LETTER NA -"\uE029>ન;" // REMAP (indicExceptions.txt): ઩>ન = LETTER NNNA>LETTER NA -"\uE02A>પ;" // LETTER PA -"\uE02B>ફ;" // LETTER PHA -"\uE02C>બ;" // LETTER BA -"\uE02D>ભ;" // LETTER BHA -"\uE02E>મ;" // LETTER MA -"\uE02F>ય;" // LETTER YA -"\uE030>ર;" // LETTER RA -"\uE032>લ;" // LETTER LA -"\uE033>ળ;" // LETTER LLA -"\uE034>ળ;" // REMAP (indicExceptions.txt): ઴>ળ = LETTER LLLA>LETTER LLA -"\uE035>વ;" // LETTER VA -"\uE036>શ;" // LETTER SHA -"\uE037>ષ;" // LETTER SSA -"\uE038>સ;" // LETTER SA -"\uE039>હ;" // LETTER HA -"\uE03C>઼;" // SIGN NUKTA -"\uE03D>ઽ;" // SIGN AVAGRAHA -"\uE03E>ા;" // VOWEL SIGN AA -"\uE03F>િ;" // VOWEL SIGN I -"\uE040>ી;" // VOWEL SIGN II -"\uE041>ુ;" // VOWEL SIGN U -"\uE042>ૂ;" // VOWEL SIGN UU -"\uE043>ૃ;" // VOWEL SIGN VOCALIC R -"\uE044>ૄ;" // VOWEL SIGN VOCALIC RR -"\uE045>ૅ;" // VOWEL SIGN CANDRA E -// \uE047>; // UNMAPPED InterIndic-Gujarati: VOWEL SIGN EE (ે = VOWEL SIGN E) -"\uE048>ૈ;" // VOWEL SIGN AI -"\uE049>ૉ;" // VOWEL SIGN CANDRA O -// \uE04B>; // UNMAPPED InterIndic-Gujarati: VOWEL SIGN OO (ો = VOWEL SIGN O) -"\uE04C>ૌ;" // VOWEL SIGN AU -"\uE04D>્;" // SIGN VIRAMA -"\uE050>ૐ;" // OM -// \uE055>; // UNMAPPED InterIndic-Gujarati: LENGTH MARK -"\uE056>ૈ;" // REMAP (indicExceptions.txt): ૖>ૈ = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ૌ;" // REMAP (indicExceptions.txt): ૗>ૌ = AU LENGTH MARK>VOWEL SIGN AU -"\uE059>ખ઼;" // REMAP (indicExceptions.txt): ૙>ખ઼ = LETTER KHHA>LETTER KHA.SIGN NUKTA -"\uE05A>ગ઼;" // REMAP (indicExceptions.txt): ૚>ગ઼ = LETTER GHHA>LETTER GA.SIGN NUKTA -"\uE05B>જ઼;" // REMAP (indicExceptions.txt): ૛>જ઼ = LETTER ZA>LETTER JA.SIGN NUKTA -"\uE05D>ઢ઼;" // REMAP (indicExceptions.txt): ૝>ઢ઼ = LETTER RHA>LETTER DDHA.SIGN NUKTA -"\uE05E>ફ઼;" // REMAP (indicExceptions.txt): ૞>ફ઼ = LETTER FA>LETTER PHA.SIGN NUKTA -"\uE05F>ય઼;" // REMAP (indicExceptions.txt): ૟>ય઼ = LETTER YYA>LETTER YA.SIGN NUKTA -"\uE060>ૠ;" // LETTER VOCALIC RR -"\uE061>લૃ;" // 
REMAP (indicExceptions.txt): ૡ>લૃ = LETTER VOCALIC LL>LETTER LA.VOWEL SIGN VOCALIC R -"\uE062>િ઼;" // REMAP (indicExceptions.txt): ૢ>િ઼ = VOWEL SIGN VOCALIC L>VOWEL SIGN I.SIGN NUKTA -"\uE063>ી઼;" // REMAP (indicExceptions.txt): ૣ>ી઼ = VOWEL SIGN VOCALIC LL>VOWEL SIGN II.SIGN NUKTA -"\uE066>૦;" // DIGIT ZERO -"\uE067>૧;" // DIGIT ONE -"\uE068>૨;" // DIGIT TWO -"\uE069>૩;" // DIGIT THREE -"\uE06A>૪;" // DIGIT FOUR -"\uE06B>૫;" // DIGIT FIVE -"\uE06C>૬;" // DIGIT SIX -"\uE06D>૭;" // DIGIT SEVEN -"\uE06E>૮;" // DIGIT EIGHT -"\uE06F>૯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Gujarati: ISSHAR -"\uE081>એ;" // LETTER E -"\uE082>ઓ;" // LETTER O -// \uE083>; // UNMAPPED InterIndic-Gujarati: LETTER RRA (ઃ = SIGN VISARGA) -"\uE084>ે;" // VOWEL SIGN E -"\uE085>ો;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0a81;" // SIGN CANDRABINDU +"\ue002>\u0a82;" // SIGN ANUSVARA +"\ue003>\u0a83;" // SIGN VISARGA +"\ue005>\u0a85;" // LETTER A +"\ue006>\u0a86;" // LETTER AA +"\ue007>\u0a87;" // LETTER I +"\ue008>\u0a88;" // LETTER II +"\ue009>\u0a89;" // LETTER U +"\ue00a>\u0a8a;" // LETTER UU +"\ue00b>\u0a8b;" // LETTER VOCALIC R +"\ue00c>\u0ab2\u0ac3;" // REMAP (indicExceptions.txt): \u0a8c>\u0ab2\u0ac3 = LETTER VOCALIC L>LETTER LA.VOWEL SIGN VOCALIC R +// \ue00f>; // UNMAPPED InterIndic-Gujarati: LETTER EE (\u0a8f = LETTER E) +"\ue010>\u0a90;" // LETTER AI +// \ue013>; // UNMAPPED InterIndic-Gujarati: LETTER OO (\u0a93 = LETTER O) +"\ue014>\u0a94;" // LETTER AU +"\ue015>\u0a95;" // LETTER KA +"\ue016>\u0a96;" // LETTER KHA +"\ue017>\u0a97;" // LETTER GA +"\ue018>\u0a98;" // LETTER GHA +"\ue019>\u0a99;" // LETTER NGA +"\ue01a>\u0a9a;" // LETTER CA +"\ue01b>\u0a9b;" // LETTER CHA +"\ue01c>\u0a9c;" // LETTER JA +"\ue01d>\u0a9d;" // LETTER JHA +"\ue01e>\u0a9e;" // LETTER NYA +"\ue01f>\u0a9f;" // LETTER TTA +"\ue020>\u0aa0;" // LETTER TTHA +"\ue021>\u0aa1;" // LETTER DDA +"\ue022>\u0aa2;" // LETTER DDHA +"\ue023>\u0aa3;" // LETTER NNA +"\ue024>\u0aa4;" // LETTER TA 
+"\ue025>\u0aa5;" // LETTER THA +"\ue026>\u0aa6;" // LETTER DA +"\ue027>\u0aa7;" // LETTER DHA +"\ue028>\u0aa8;" // LETTER NA +"\ue029>\u0aa8;" // REMAP (indicExceptions.txt): \u0aa9>\u0aa8 = LETTER NNNA>LETTER NA +"\ue02a>\u0aaa;" // LETTER PA +"\ue02b>\u0aab;" // LETTER PHA +"\ue02c>\u0aac;" // LETTER BA +"\ue02d>\u0aad;" // LETTER BHA +"\ue02e>\u0aae;" // LETTER MA +"\ue02f>\u0aaf;" // LETTER YA +"\ue030>\u0ab0;" // LETTER RA +"\ue032>\u0ab2;" // LETTER LA +"\ue033>\u0ab3;" // LETTER LLA +"\ue034>\u0ab3;" // REMAP (indicExceptions.txt): \u0ab4>\u0ab3 = LETTER LLLA>LETTER LLA +"\ue035>\u0ab5;" // LETTER VA +"\ue036>\u0ab6;" // LETTER SHA +"\ue037>\u0ab7;" // LETTER SSA +"\ue038>\u0ab8;" // LETTER SA +"\ue039>\u0ab9;" // LETTER HA +"\ue03c>\u0abc;" // SIGN NUKTA +"\ue03d>\u0abd;" // SIGN AVAGRAHA +"\ue03e>\u0abe;" // VOWEL SIGN AA +"\ue03f>\u0abf;" // VOWEL SIGN I +"\ue040>\u0ac0;" // VOWEL SIGN II +"\ue041>\u0ac1;" // VOWEL SIGN U +"\ue042>\u0ac2;" // VOWEL SIGN UU +"\ue043>\u0ac3;" // VOWEL SIGN VOCALIC R +"\ue044>\u0ac4;" // VOWEL SIGN VOCALIC RR +"\ue045>\u0ac5;" // VOWEL SIGN CANDRA E +// \ue047>; // UNMAPPED InterIndic-Gujarati: VOWEL SIGN EE (\u0ac7 = VOWEL SIGN E) +"\ue048>\u0ac8;" // VOWEL SIGN AI +"\ue049>\u0ac9;" // VOWEL SIGN CANDRA O +// \ue04b>; // UNMAPPED InterIndic-Gujarati: VOWEL SIGN OO (\u0acb = VOWEL SIGN O) +"\ue04c>\u0acc;" // VOWEL SIGN AU +"\ue04d>\u0acd;" // SIGN VIRAMA +"\ue050>\u0ad0;" // OM +// \ue055>; // UNMAPPED InterIndic-Gujarati: LENGTH MARK +"\ue056>\u0ac8;" // REMAP (indicExceptions.txt): \u0ad6>\u0ac8 = AI LENGTH MARK>VOWEL SIGN AI +"\ue057>\u0acc;" // REMAP (indicExceptions.txt): \u0ad7>\u0acc = AU LENGTH MARK>VOWEL SIGN AU +"\ue059>\u0a96\u0abc;" // REMAP (indicExceptions.txt): \u0ad9>\u0a96\u0abc = LETTER KHHA>LETTER KHA.SIGN NUKTA +"\ue05a>\u0a97\u0abc;" // REMAP (indicExceptions.txt): \u0ada>\u0a97\u0abc = LETTER GHHA>LETTER GA.SIGN NUKTA +"\ue05b>\u0a9c\u0abc;" // REMAP (indicExceptions.txt): \u0adb>\u0a9c\u0abc = LETTER 
ZA>LETTER JA.SIGN NUKTA +"\ue05d>\u0aa2\u0abc;" // REMAP (indicExceptions.txt): \u0add>\u0aa2\u0abc = LETTER RHA>LETTER DDHA.SIGN NUKTA +"\ue05e>\u0aab\u0abc;" // REMAP (indicExceptions.txt): \u0ade>\u0aab\u0abc = LETTER FA>LETTER PHA.SIGN NUKTA +"\ue05f>\u0aaf\u0abc;" // REMAP (indicExceptions.txt): \u0adf>\u0aaf\u0abc = LETTER YYA>LETTER YA.SIGN NUKTA +"\ue060>\u0ae0;" // LETTER VOCALIC RR +"\ue061>\u0ab2\u0ac3;" // REMAP (indicExceptions.txt): \u0ae1>\u0ab2\u0ac3 = LETTER VOCALIC LL>LETTER LA.VOWEL SIGN VOCALIC R +"\ue062>\u0abf\u0abc;" // REMAP (indicExceptions.txt): \u0ae2>\u0abf\u0abc = VOWEL SIGN VOCALIC L>VOWEL SIGN I.SIGN NUKTA +"\ue063>\u0ac0\u0abc;" // REMAP (indicExceptions.txt): \u0ae3>\u0ac0\u0abc = VOWEL SIGN VOCALIC LL>VOWEL SIGN II.SIGN NUKTA +"\ue066>\u0ae6;" // DIGIT ZERO +"\ue067>\u0ae7;" // DIGIT ONE +"\ue068>\u0ae8;" // DIGIT TWO +"\ue069>\u0ae9;" // DIGIT THREE +"\ue06a>\u0aea;" // DIGIT FOUR +"\ue06b>\u0aeb;" // DIGIT FIVE +"\ue06c>\u0aec;" // DIGIT SIX +"\ue06d>\u0aed;" // DIGIT SEVEN +"\ue06e>\u0aee;" // DIGIT EIGHT +"\ue06f>\u0aef;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Gujarati: ISSHAR +"\ue00f>\u0a8f;" // LETTER E +"\ue013>\u0a93;" // LETTER O +// \ue083>; // UNMAPPED InterIndic-Gujarati: LETTER RRA (\u0a83 = SIGN VISARGA) +"\ue047>\u0ac7;" // VOWEL SIGN E +"\ue04b>\u0acb;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Gurmukhi.txt b/icu4c/data/InterIndic_Gurmukhi.txt index 874900eb98..53fb072603 100644 --- a/icu4c/data/InterIndic_Gurmukhi.txt +++ b/icu4c/data/InterIndic_Gurmukhi.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Gurmukhi.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Gurmukhi.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Gurmukhi -InterIndic_Gurmukhi { +InterIndic-Gurmukhi { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Gurmukhi { //-------------------------------------------------------------------- // InterIndic-Gurmukhi - -"\uE001>ਂ;" // REMAP (indicExceptions.txt): ਁ>ਂ = SIGN CANDRABINDU>SIGN BINDI -// \uE002>; // UNMAPPED InterIndic-Gurmukhi: SIGN ANUSVARA (ਂ = SIGN BINDI) -// \uE003>; // UNMAPPED InterIndic-Gurmukhi: SIGN VISARGA -"\uE005>ਅ;" // LETTER A -"\uE006>ਆ;" // LETTER AA -"\uE007>ਇ;" // LETTER I -"\uE008>ਈ;" // LETTER II -"\uE009>ਉ;" // LETTER U -"\uE00A>ਊ;" // LETTER UU -"\uE00B>ਰਿ;" // REMAP (indicExceptions.txt): ਋>ਰਿ = LETTER VOCALIC R>LETTER RA.VOWEL SIGN I -"\uE00C>ਇ;" // REMAP (indicExceptions.txt): ਌>ਇ = LETTER VOCALIC L>LETTER I -"\uE00F>ਏ;" // LETTER EE -"\uE010>ਐ;" // LETTER AI -"\uE013>ਓ;" // LETTER OO -"\uE014>ਔ;" // LETTER AU -"\uE015>ਕ;" // LETTER KA -"\uE016>ਖ;" // LETTER KHA -"\uE017>ਗ;" // LETTER GA -"\uE018>ਘ;" // LETTER GHA -"\uE019>ਙ;" // LETTER NGA -"\uE01A>ਚ;" // LETTER CA -"\uE01B>ਛ;" // LETTER CHA -"\uE01C>ਜ;" // LETTER JA -"\uE01D>ਝ;" // LETTER JHA -"\uE01E>ਞ;" // LETTER NYA -"\uE01F>ਟ;" // LETTER TTA -"\uE020>ਠ;" // LETTER TTHA -"\uE021>ਡ;" // LETTER DDA -"\uE022>ਢ;" // LETTER DDHA -"\uE023>ਣ;" // LETTER NNA -"\uE024>ਤ;" // LETTER TA -"\uE025>ਥ;" // LETTER THA -"\uE026>ਦ;" // LETTER DA -"\uE027>ਧ;" // LETTER DHA -"\uE028>ਨ;" // LETTER NA -"\uE029>ਨ;" // REMAP 
(indicExceptions.txt): ਩>ਨ = LETTER NNNA>LETTER NA -"\uE02A>ਪ;" // LETTER PA -"\uE02B>ਫ;" // LETTER PHA -"\uE02C>ਬ;" // LETTER BA -"\uE02D>ਭ;" // LETTER BHA -"\uE02E>ਮ;" // LETTER MA -"\uE02F>ਯ;" // LETTER YA -"\uE030>ਰ;" // LETTER RA -"\uE032>ਲ;" // LETTER LA -"\uE033>ਲ਼;" // LETTER LLA -"\uE034>ਲ਼;" // REMAP (indicExceptions.txt): ਴>ਲ਼ = LETTER LLLA>LETTER LLA -"\uE035>ਵ;" // LETTER VA -"\uE036>ਸ਼;" // LETTER SHA -"\uE037>ਸ਼;" // REMAP (indicExceptions.txt): ਷>ਸ਼ = LETTER SSA>LETTER SHA -"\uE038>ਸ;" // LETTER SA -"\uE039>ਹ;" // LETTER HA -"\uE03C>਼;" // SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Gurmukhi: SIGN AVAGRAHA -"\uE03E>ਾ;" // VOWEL SIGN AA -"\uE03F>ਿ;" // VOWEL SIGN I -"\uE040>ੀ;" // VOWEL SIGN II -"\uE041>ੁ;" // VOWEL SIGN U -"\uE042>ੂ;" // VOWEL SIGN UU -// \uE043>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN VOCALIC R -// \uE044>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN VOCALIC RR -"\uE045>ੈ;" // REMAP (indicExceptions.txt): ੅>ੈ = VOWEL SIGN CANDRA E>VOWEL SIGN AI -"\uE047>ੇ;" // VOWEL SIGN EE -"\uE048>ੈ;" // VOWEL SIGN AI -"\uE049>ੌ;" // REMAP (indicExceptions.txt): ੉>ੌ = VOWEL SIGN CANDRA O>VOWEL SIGN AU -"\uE04B>ੋ;" // VOWEL SIGN OO -"\uE04C>ੌ;" // VOWEL SIGN AU -"\uE04D>੍;" // SIGN VIRAMA -// \uE050>; // UNMAPPED InterIndic-Gurmukhi: OM -// \uE055>; // UNMAPPED InterIndic-Gurmukhi: LENGTH MARK -"\uE056>ੈ;" // REMAP (indicExceptions.txt): ੖>ੈ = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ੌ;" // REMAP (indicExceptions.txt): ੗>ੌ = AU LENGTH MARK>VOWEL SIGN AU -"\uE059>ਖ਼;" // LETTER KHHA -"\uE05A>ਗ਼;" // LETTER GHHA -"\uE05B>ਜ਼;" // LETTER ZA -"\uE05D>ਢ਼;" // REMAP (indicExceptions.txt): ੝>ਢ਼ = LETTER RHA>LETTER DDHA.SIGN NUKTA -"\uE05E>ਫ਼;" // LETTER FA -"\uE05F>ਯ;" // REMAP (indicExceptions.txt): ੟>ਯ = LETTER YYA>LETTER YA -"\uE060>ਰਿ;" // REMAP (indicExceptions.txt): ੠>ਰਿ = LETTER VOCALIC RR>LETTER RA.VOWEL SIGN I -"\uE061>ਈ਼;" // REMAP (indicExceptions.txt): ੡>ਈ਼ = LETTER VOCALIC LL>LETTER II.SIGN NUKTA -"\uE062>ਿ਼;" // REMAP 
(indicExceptions.txt): ੢>ਿ਼ = VOWEL SIGN VOCALIC L>VOWEL SIGN I.SIGN NUKTA -"\uE063>ੀ਼;" // REMAP (indicExceptions.txt): ੣>ੀ਼ = VOWEL SIGN VOCALIC LL>VOWEL SIGN II.SIGN NUKTA -"\uE066>੦;" // DIGIT ZERO -"\uE067>੧;" // DIGIT ONE -"\uE068>੨;" // DIGIT TWO -"\uE069>੩;" // DIGIT THREE -"\uE06A>੪;" // DIGIT FOUR -"\uE06B>੫;" // DIGIT FIVE -"\uE06C>੬;" // DIGIT SIX -"\uE06D>੭;" // DIGIT SEVEN -"\uE06E>੮;" // DIGIT EIGHT -"\uE06F>੯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Gurmukhi: ISSHAR -// \uE081>; // UNMAPPED InterIndic-Gurmukhi: LETTER E -// \uE082>; // UNMAPPED InterIndic-Gurmukhi: LETTER O (ਂ = SIGN BINDI) -"\uE083>ੜ;" // LETTER RRA -// \uE084>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN E -// \uE085>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN O (ਅ = LETTER A) - +":: NFD (NFC) ;" +"\ue001>\u0a02;" // REMAP (indicExceptions.txt): \u0a01>\u0a02 = SIGN CANDRABINDU>SIGN BINDI +// \ue002>; // UNMAPPED InterIndic-Gurmukhi: SIGN ANUSVARA (\u0a02 = SIGN BINDI) +// \ue003>; // UNMAPPED InterIndic-Gurmukhi: SIGN VISARGA +"\ue005>\u0a05;" // LETTER A +"\ue006>\u0a06;" // LETTER AA +"\ue007>\u0a07;" // LETTER I +"\ue008>\u0a08;" // LETTER II +"\ue009>\u0a09;" // LETTER U +"\ue00a>\u0a0a;" // LETTER UU +"\ue00b>\u0a30\u0a3f;" // REMAP (indicExceptions.txt): \u0a0b>\u0a30\u0a3f = LETTER VOCALIC R>LETTER RA.VOWEL SIGN I +"\ue00c>\u0a07;" // REMAP (indicExceptions.txt): \u0a0c>\u0a07 = LETTER VOCALIC L>LETTER I +"\ue00f>\u0a0f;" // LETTER EE +"\ue010>\u0a10;" // LETTER AI +"\ue013>\u0a13;" // LETTER OO +"\ue014>\u0a14;" // LETTER AU +"\ue015>\u0a15;" // LETTER KA +"\ue016>\u0a16;" // LETTER KHA +"\ue017>\u0a17;" // LETTER GA +"\ue018>\u0a18;" // LETTER GHA +"\ue019>\u0a19;" // LETTER NGA +"\ue01a>\u0a1a;" // LETTER CA +"\ue01b>\u0a1b;" // LETTER CHA +"\ue01c>\u0a1c;" // LETTER JA +"\ue01d>\u0a1d;" // LETTER JHA +"\ue01e>\u0a1e;" // LETTER NYA +"\ue01f>\u0a1f;" // LETTER TTA +"\ue020>\u0a20;" // LETTER TTHA +"\ue021>\u0a21;" // LETTER DDA +"\ue022>\u0a22;" // LETTER 
DDHA +"\ue023>\u0a23;" // LETTER NNA +"\ue024>\u0a24;" // LETTER TA +"\ue025>\u0a25;" // LETTER THA +"\ue026>\u0a26;" // LETTER DA +"\ue027>\u0a27;" // LETTER DHA +"\ue028>\u0a28;" // LETTER NA +"\ue029>\u0a28;" // REMAP (indicExceptions.txt): \u0a29>\u0a28 = LETTER NNNA>LETTER NA +"\ue02a>\u0a2a;" // LETTER PA +"\ue02b>\u0a2b;" // LETTER PHA +"\ue02c>\u0a2c;" // LETTER BA +"\ue02d>\u0a2d;" // LETTER BHA +"\ue02e>\u0a2e;" // LETTER MA +"\ue02f>\u0a2f;" // LETTER YA +"\ue030>\u0a30;" // LETTER RA +"\ue032>\u0a32;" // LETTER LA +"\ue033>\u0a33;" // LETTER LLA +"\ue034>\u0a33;" // REMAP (indicExceptions.txt): \u0a34>\u0a33 = LETTER LLLA>LETTER LLA +"\ue035>\u0a35;" // LETTER VA +"\ue036>\u0a36;" // LETTER SHA +"\ue037>\u0a36;" // REMAP (indicExceptions.txt): \u0a37>\u0a36 = LETTER SSA>LETTER SHA +"\ue038>\u0a38;" // LETTER SA +"\ue039>\u0a39;" // LETTER HA +"\ue03c>\u0a3c;" // SIGN NUKTA +// \ue03d>; // UNMAPPED InterIndic-Gurmukhi: SIGN AVAGRAHA +"\ue03e>\u0a3e;" // VOWEL SIGN AA +"\ue03f>\u0a3f;" // VOWEL SIGN I +"\ue040>\u0a40;" // VOWEL SIGN II +"\ue041>\u0a41;" // VOWEL SIGN U +"\ue042>\u0a42;" // VOWEL SIGN UU +// \ue043>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN VOCALIC R +// \ue044>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN VOCALIC RR +"\ue045>\u0a48;" // REMAP (indicExceptions.txt): \u0a45>\u0a48 = VOWEL SIGN CANDRA E>VOWEL SIGN AI +"\ue047>\u0a47;" // VOWEL SIGN EE +"\ue048>\u0a48;" // VOWEL SIGN AI +"\ue049>\u0a4c;" // REMAP (indicExceptions.txt): \u0a49>\u0a4c = VOWEL SIGN CANDRA O>VOWEL SIGN AU +"\ue04b>\u0a4b;" // VOWEL SIGN OO +"\ue04c>\u0a4c;" // VOWEL SIGN AU +"\ue04d>\u0a4d;" // SIGN VIRAMA +// \ue050>; // UNMAPPED InterIndic-Gurmukhi: OM +// \ue055>; // UNMAPPED InterIndic-Gurmukhi: LENGTH MARK +"\ue056>\u0a48;" // REMAP (indicExceptions.txt): \u0a56>\u0a48 = AI LENGTH MARK>VOWEL SIGN AI +"\ue057>\u0a4c;" // REMAP (indicExceptions.txt): \u0a57>\u0a4c = AU LENGTH MARK>VOWEL SIGN AU +"\ue059>\u0a59;" // LETTER KHHA +"\ue05a>\u0a5a;" // LETTER 
GHHA +"\ue05b>\u0a5b;" // LETTER ZA +"\ue05d>\u0a22\u0a3c;" // REMAP (indicExceptions.txt): \u0a5d>\u0a22\u0a3c = LETTER RHA>LETTER DDHA.SIGN NUKTA +"\ue05e>\u0a5e;" // LETTER FA +"\ue05f>\u0a2f;" // REMAP (indicExceptions.txt): \u0a5f>\u0a2f = LETTER YYA>LETTER YA +"\ue060>\u0a30\u0a3f;" // REMAP (indicExceptions.txt): \u0a60>\u0a30\u0a3f = LETTER VOCALIC RR>LETTER RA.VOWEL SIGN I +"\ue061>\u0a08\u0a3c;" // REMAP (indicExceptions.txt): \u0a61>\u0a08\u0a3c = LETTER VOCALIC LL>LETTER II.SIGN NUKTA +"\ue062>\u0a3f\u0a3c;" // REMAP (indicExceptions.txt): \u0a62>\u0a3f\u0a3c = VOWEL SIGN VOCALIC L>VOWEL SIGN I.SIGN NUKTA +"\ue063>\u0a40\u0a3c;" // REMAP (indicExceptions.txt): \u0a63>\u0a40\u0a3c = VOWEL SIGN VOCALIC LL>VOWEL SIGN II.SIGN NUKTA +"\ue066>\u0a66;" // DIGIT ZERO +"\ue067>\u0a67;" // DIGIT ONE +"\ue068>\u0a68;" // DIGIT TWO +"\ue069>\u0a69;" // DIGIT THREE +"\ue06a>\u0a6a;" // DIGIT FOUR +"\ue06b>\u0a6b;" // DIGIT FIVE +"\ue06c>\u0a6c;" // DIGIT SIX +"\ue06d>\u0a6d;" // DIGIT SEVEN +"\ue06e>\u0a6e;" // DIGIT EIGHT +"\ue06f>\u0a6f;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Gurmukhi: ISSHAR +// \ue081>; // UNMAPPED InterIndic-Gurmukhi: LETTER E +// \ue082>; // UNMAPPED InterIndic-Gurmukhi: LETTER O (\u0a02 = SIGN BINDI) +"\ue05c>\u0a5c;" // LETTER RRA +// \ue084>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN E +// \ue085>; // UNMAPPED InterIndic-Gurmukhi: VOWEL SIGN O (\u0a05 = LETTER A) + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Kannada.txt b/icu4c/data/InterIndic_Kannada.txt index 10038a0525..0162ce0a17 100644 --- a/icu4c/data/InterIndic_Kannada.txt +++ b/icu4c/data/InterIndic_Kannada.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Kannada.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Kannada.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Kannada -InterIndic_Kannada { +InterIndic-Kannada { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Kannada { //-------------------------------------------------------------------- // InterIndic-Kannada - -"\uE001>ಂ;" // REMAP (indicExceptions.txt): ಁ>ಂ = SIGN CANDRABINDU>SIGN ANUSVARA -"\uE002>ಂ;" // SIGN ANUSVARA -"\uE003>ಃ;" // SIGN VISARGA -"\uE005>ಅ;" // LETTER A -"\uE006>ಆ;" // LETTER AA -"\uE007>ಇ;" // LETTER I -"\uE008>ಈ;" // LETTER II -"\uE009>ಉ;" // LETTER U -"\uE00A>ಊ;" // LETTER UU -"\uE00B>ಋ;" // LETTER VOCALIC R -"\uE00C>ಌ;" // LETTER VOCALIC L -"\uE00F>ಏ;" // LETTER EE -"\uE010>ಐ;" // LETTER AI -"\uE013>ಓ;" // LETTER OO -"\uE014>ಔ;" // LETTER AU -"\uE015>ಕ;" // LETTER KA -"\uE016>ಖ;" // LETTER KHA -"\uE017>ಗ;" // LETTER GA -"\uE018>ಘ;" // LETTER GHA -"\uE019>ಙ;" // LETTER NGA -"\uE01A>ಚ;" // LETTER CA -"\uE01B>ಛ;" // LETTER CHA -"\uE01C>ಜ;" // LETTER JA -"\uE01D>ಝ;" // LETTER JHA -"\uE01E>ಞ;" // LETTER NYA -"\uE01F>ಟ;" // LETTER TTA -"\uE020>ಠ;" // LETTER TTHA -"\uE021>ಡ;" // LETTER DDA -"\uE022>ಢ;" // LETTER DDHA -"\uE023>ಣ;" // LETTER NNA -"\uE024>ತ;" // LETTER TA -"\uE025>ಥ;" // LETTER THA -"\uE026>ದ;" // LETTER DA -"\uE027>ಧ;" // LETTER DHA -"\uE028>ನ;" // LETTER NA -"\uE029>ನ;" // REMAP (indicExceptions.txt): ಩>ನ = LETTER NNNA>LETTER NA -"\uE02A>ಪ;" // LETTER PA -"\uE02B>ಫ;" // LETTER PHA -"\uE02C>ಬ;" // LETTER BA -"\uE02D>ಭ;" // LETTER BHA -"\uE02E>ಮ;" // LETTER MA 
-"\uE02F>ಯ;" // LETTER YA -"\uE030>ರ;" // LETTER RA -"\uE032>ಲ;" // LETTER LA -"\uE033>ಳ;" // LETTER LLA -"\uE034>ಳ;" // REMAP (indicExceptions.txt): ಴>ಳ = LETTER LLLA>LETTER LLA -"\uE035>ವ;" // LETTER VA -"\uE036>ಶ;" // LETTER SHA -"\uE037>ಷ;" // LETTER SSA -"\uE038>ಸ;" // LETTER SA -"\uE039>ಹ;" // LETTER HA -// \uE03C>; // UNMAPPED InterIndic-Kannada: SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Kannada: SIGN AVAGRAHA -"\uE03E>ಾ;" // VOWEL SIGN AA -"\uE03F>ಿ;" // VOWEL SIGN I -"\uE040>ೀ;" // VOWEL SIGN II -"\uE041>ು;" // VOWEL SIGN U -"\uE042>ೂ;" // VOWEL SIGN UU -"\uE043>ೃ;" // VOWEL SIGN VOCALIC R -"\uE044>ೄ;" // VOWEL SIGN VOCALIC RR -"\uE045>ೆ;" // REMAP (indicExceptions.txt): ೅>ೆ = VOWEL SIGN CANDRA E>VOWEL SIGN E -"\uE047>ೇ;" // VOWEL SIGN EE -"\uE048>ೈ;" // VOWEL SIGN AI -"\uE049>ೊ;" // REMAP (indicExceptions.txt): ೉>ೊ = VOWEL SIGN CANDRA O>VOWEL SIGN O -"\uE04B>ೋ;" // VOWEL SIGN OO -"\uE04C>ೌ;" // VOWEL SIGN AU -"\uE04D>್;" // SIGN VIRAMA -"\uE050>ಓಂ;" // REMAP (indicExceptions.txt): ೐>ಓಂ = OM>LETTER OO.SIGN ANUSVARA -"\uE055>ೕ;" // LENGTH MARK -"\uE056>ೖ;" // AI LENGTH MARK -"\uE057>ೌ;" // REMAP (indicExceptions.txt): ೗>ೌ = AU LENGTH MARK>VOWEL SIGN AU -"\uE059>ಖ;" // REMAP (indicExceptions.txt): ೙>ಖ = LETTER KHHA>LETTER KHA -"\uE05A>ಗ;" // REMAP (indicExceptions.txt): ೚>ಗ = LETTER GHHA>LETTER GA -"\uE05B>ಜ;" // REMAP (indicExceptions.txt): ೛>ಜ = LETTER ZA>LETTER JA -"\uE05D>ಢ;" // REMAP (indicExceptions.txt): ೝ>ಢ = LETTER RHA>LETTER DDHA -"\uE05E>ೞ;" // LETTER FA -"\uE05F>ಯ;" // REMAP (indicExceptions.txt): ೟>ಯ = LETTER YYA>LETTER YA -"\uE060>ೠ;" // LETTER VOCALIC RR -"\uE061>ೡ;" // LETTER VOCALIC LL -"\uE062>ಿ;" // REMAP (indicExceptions.txt): ೢ>ಿ = VOWEL SIGN VOCALIC L>VOWEL SIGN I -"\uE063>ೀ;" // REMAP (indicExceptions.txt): ೣ>ೀ = VOWEL SIGN VOCALIC LL>VOWEL SIGN II -"\uE066>೦;" // DIGIT ZERO -"\uE067>೧;" // DIGIT ONE -"\uE068>೨;" // DIGIT TWO -"\uE069>೩;" // DIGIT THREE -"\uE06A>೪;" // DIGIT FOUR -"\uE06B>೫;" // DIGIT FIVE -"\uE06C>೬;" // DIGIT 
SIX -"\uE06D>೭;" // DIGIT SEVEN -"\uE06E>೮;" // DIGIT EIGHT -"\uE06F>೯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Kannada: ISSHAR -"\uE081>ಎ;" // LETTER E -"\uE082>ಒ;" // LETTER O -"\uE083>ಱ;" // LETTER RRA -"\uE084>ೆ;" // VOWEL SIGN E -"\uE085>ೊ;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0c82;" // REMAP (indicExceptions.txt): \u0c81>\u0c82 = SIGN CANDRABINDU>SIGN ANUSVARA +"\ue002>\u0c82;" // SIGN ANUSVARA +"\ue003>\u0c83;" // SIGN VISARGA +"\ue005>\u0c85;" // LETTER A +"\ue006>\u0c86;" // LETTER AA +"\ue007>\u0c87;" // LETTER I +"\ue008>\u0c88;" // LETTER II +"\ue009>\u0c89;" // LETTER U +"\ue00a>\u0c8a;" // LETTER UU +"\ue00b>\u0c8b;" // LETTER VOCALIC R +"\ue00c>\u0c8c;" // LETTER VOCALIC L +"\ue00f>\u0c8f;" // LETTER EE +"\ue010>\u0c90;" // LETTER AI +"\ue013>\u0c93;" // LETTER OO +"\ue014>\u0c94;" // LETTER AU +"\ue015>\u0c95;" // LETTER KA +"\ue016>\u0c96;" // LETTER KHA +"\ue017>\u0c97;" // LETTER GA +"\ue018>\u0c98;" // LETTER GHA +"\ue019>\u0c99;" // LETTER NGA +"\ue01a>\u0c9a;" // LETTER CA +"\ue01b>\u0c9b;" // LETTER CHA +"\ue01c>\u0c9c;" // LETTER JA +"\ue01d>\u0c9d;" // LETTER JHA +"\ue01e>\u0c9e;" // LETTER NYA +"\ue01f>\u0c9f;" // LETTER TTA +"\ue020>\u0ca0;" // LETTER TTHA +"\ue021>\u0ca1;" // LETTER DDA +"\ue022>\u0ca2;" // LETTER DDHA +"\ue023>\u0ca3;" // LETTER NNA +"\ue024>\u0ca4;" // LETTER TA +"\ue025>\u0ca5;" // LETTER THA +"\ue026>\u0ca6;" // LETTER DA +"\ue027>\u0ca7;" // LETTER DHA +"\ue028>\u0ca8;" // LETTER NA +"\ue029>\u0ca8;" // REMAP (indicExceptions.txt): \u0ca9>\u0ca8 = LETTER NNNA>LETTER NA +"\ue02a>\u0caa;" // LETTER PA +"\ue02b>\u0cab;" // LETTER PHA +"\ue02c>\u0cac;" // LETTER BA +"\ue02d>\u0cad;" // LETTER BHA +"\ue02e>\u0cae;" // LETTER MA +"\ue02f>\u0caf;" // LETTER YA +"\ue030>\u0cb0;" // LETTER RA +"\ue032>\u0cb2;" // LETTER LA +"\ue033>\u0cb3;" // LETTER LLA +"\ue034>\u0cb3;" // REMAP (indicExceptions.txt): \u0cb4>\u0cb3 = LETTER LLLA>LETTER LLA +"\ue035>\u0cb5;" // LETTER VA +"\ue036>\u0cb6;" // LETTER SHA 
+"\ue037>\u0cb7;" // LETTER SSA +"\ue038>\u0cb8;" // LETTER SA +"\ue039>\u0cb9;" // LETTER HA +// \ue03c>; // UNMAPPED InterIndic-Kannada: SIGN NUKTA +// \ue03d>; // UNMAPPED InterIndic-Kannada: SIGN AVAGRAHA +"\ue03e>\u0cbe;" // VOWEL SIGN AA +"\ue03f>\u0cbf;" // VOWEL SIGN I +"\ue040>\u0cc0;" // VOWEL SIGN II +"\ue041>\u0cc1;" // VOWEL SIGN U +"\ue042>\u0cc2;" // VOWEL SIGN UU +"\ue043>\u0cc3;" // VOWEL SIGN VOCALIC R +"\ue044>\u0cc4;" // VOWEL SIGN VOCALIC RR +"\ue045>\u0cc6;" // REMAP (indicExceptions.txt): \u0cc5>\u0cc6 = VOWEL SIGN CANDRA E>VOWEL SIGN E +"\ue047>\u0cc7;" // VOWEL SIGN EE +"\ue048>\u0cc8;" // VOWEL SIGN AI +"\ue049>\u0cca;" // REMAP (indicExceptions.txt): \u0cc9>\u0cca = VOWEL SIGN CANDRA O>VOWEL SIGN O +"\ue04b>\u0ccb;" // VOWEL SIGN OO +"\ue04c>\u0ccc;" // VOWEL SIGN AU +"\ue04d>\u0ccd;" // SIGN VIRAMA +"\ue050>\u0c93\u0c82;" // REMAP (indicExceptions.txt): \u0cd0>\u0c93\u0c82 = OM>LETTER OO.SIGN ANUSVARA +"\ue055>\u0cd5;" // LENGTH MARK +"\ue056>\u0cd6;" // AI LENGTH MARK +"\ue057>\u0ccc;" // REMAP (indicExceptions.txt): \u0cd7>\u0ccc = AU LENGTH MARK>VOWEL SIGN AU +"\ue059>\u0c96;" // REMAP (indicExceptions.txt): \u0cd9>\u0c96 = LETTER KHHA>LETTER KHA +"\ue05a>\u0c97;" // REMAP (indicExceptions.txt): \u0cda>\u0c97 = LETTER GHHA>LETTER GA +"\ue05b>\u0c9c;" // REMAP (indicExceptions.txt): \u0cdb>\u0c9c = LETTER ZA>LETTER JA +"\ue05d>\u0ca2;" // REMAP (indicExceptions.txt): \u0cdd>\u0ca2 = LETTER RHA>LETTER DDHA +"\ue05e>\u0cde;" // LETTER FA +"\ue05f>\u0caf;" // REMAP (indicExceptions.txt): \u0cdf>\u0caf = LETTER YYA>LETTER YA +"\ue060>\u0ce0;" // LETTER VOCALIC RR +"\ue061>\u0ce1;" // LETTER VOCALIC LL +"\ue062>\u0cbf;" // REMAP (indicExceptions.txt): \u0ce2>\u0cbf = VOWEL SIGN VOCALIC L>VOWEL SIGN I +"\ue063>\u0cc0;" // REMAP (indicExceptions.txt): \u0ce3>\u0cc0 = VOWEL SIGN VOCALIC LL>VOWEL SIGN II +"\ue066>\u0ce6;" // DIGIT ZERO +"\ue067>\u0ce7;" // DIGIT ONE +"\ue068>\u0ce8;" // DIGIT TWO +"\ue069>\u0ce9;" // DIGIT THREE 
+"\ue06a>\u0cea;" // DIGIT FOUR +"\ue06b>\u0ceb;" // DIGIT FIVE +"\ue06c>\u0cec;" // DIGIT SIX +"\ue06d>\u0ced;" // DIGIT SEVEN +"\ue06e>\u0cee;" // DIGIT EIGHT +"\ue06f>\u0cef;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Kannada: ISSHAR +"\ue00e>\u0c8e;" // LETTER E +"\ue012>\u0c92;" // LETTER O +"\ue031>\u0cb1;" // LETTER RRA +"\ue046>\u0cc6;" // VOWEL SIGN E +"\ue04a>\u0cca;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Latin.txt b/icu4c/data/InterIndic_Latin.txt new file mode 100644 index 0000000000..5ade977fb8 --- /dev/null +++ b/icu4c/data/InterIndic_Latin.txt @@ -0,0 +1,414 @@ +//-------------------------------------------------------------------- +// Copyright (c) 2001-2004, International Business Machines +// Corporation and others. All Rights Reserved. +//-------------------------------------------------------------------- + +// InterIndic-Latin + +InterIndic-Latin{ + Rule{ + ":: NFD (NFC) ;" + //\u0e00 reserved + //consonants + "$chandrabindu=\ue001;" + "$anusvara=\ue002;" + "$visarga=\ue003;" + //\u0e004 reserved + // w represents the stand-alone form + "$wa=\ue005;" + "$waa=\ue006;" + "$wi=\ue007;" + "$wii=\ue008;" + "$wu=\ue009;" + "$wuu=\ue00a;" + "$wr=\ue00b;" + "$wl=\ue00c;" + + "$wce=\ue00d;" // LETTER CANDRA E + "$wse=\ue00e;" // LETTER SHORT E + + "$we=\ue00f;" // \u090f LETTER E + "$wai=\ue010;" + + "$wco=\ue011;" // LETTER CANDRA O + "$wso=\ue012;" // LETTER SHORT O + + "$wo=\ue013;" // \u0913 LETTER O + "$wau=\ue014;" + + "$ka=\ue015;" + "$kha=\ue016;" + "$ga=\ue017;" + "$gha=\ue018;" + "$nga=\ue019;" + + "$ca=\ue01a;" + "$cha=\ue01b;" + "$ja=\ue01c;" + "$jha=\ue01d;" + "$nya=\ue01e;" + + "$tta=\ue01f;" + "$ttha=\ue020;" + "$dda=\ue021;" + "$ddha=\ue022;" + "$nna=\ue023;" + + "$ta=\ue024;" + "$tha=\ue025;" + "$da=\ue026;" + "$dha=\ue027;" + "$na=\ue028;" + "$ena=\ue029;" //compatibility + + "$pa=\ue02a;" + "$pha=\ue02b;" + "$ba=\ue02c;" + "$bha=\ue02d;" + "$ma=\ue02e;" + + "$ya=\ue02f;" + 
"$ra=\ue030;" + "$rra=\ue031;" + "$la=\ue032;" + "$lla=\ue033;" + "$ela=\ue034;" //compatibility + "$va=\ue035;" + + "$sha=\ue036;" + "$ssa=\ue037;" + "$sa=\ue038;" + "$ha=\ue039;" +//\u093a Reserved +//\u093b Reserved + "$nukta=\ue03c;" + "$avagraha=\ue03d;" // SIGN AVAGRAHA + + // represents the dependent form + "$aa=\ue03e;" + "$i=\ue03f;" + "$ii=\ue040;" + "$u=\ue041;" + "$uu=\ue042;" + "$rh=\ue043;" + "$lh=\ue044;" + "$ce=\ue045;" //VOWEL SIGN CANDRA E + "$se=\ue046;" //VOWEL SIGN SHORT E + "$e=\ue047;" + "$ai=\ue048;" + "$co=\ue049;" // VOWEL SIGN CANDRA O + "$so=\ue04a;" // VOWEL SIGN SHORT O + "$o=\ue04b;" // \u094b + "$au=\ue04c;" + "$virama=\ue04d;" +// \u094e Reserved +// \u094f Reserved +//"\u0950>\ue050;" // OM +// \u0951>; // UNMAPPED STRESS SIGN UDATTA +// \u0952>; // UNMAPPED STRESS SIGN ANUDATTA +// \u0953>; // UNMAPPED GRAVE ACCENT +// \u0954>; // UNMAPPED ACUTE ACCENT + + "$lm = \ue055;"// Telugu Length Mark + "$ailm=\ue056;"// AI Length Mark + "$aulm=\ue057;"// AU Length Mark + + //urdu compatibity forms + "$uka=\ue058;" + "$ukha=\ue059;" + "$ugha=\ue05a;" + "$ujha=\ue05b;" + "$uddha=\ue05c;" + "$udha=\ue05d;" + "$ufa=\ue05e;" + "$uya=\ue05f;" + + "$wrr=\ue060;" + "$wll=\ue061;" + "$rrh=\ue062;" + "$llh=\ue063;" + + "$danda=\ue064;" + "$doubleDanda=\ue065;" + + "$zero=\ue066;" // DIGIT ZERO + "$one=\ue067;" // DIGIT ONE + "$two=\ue068;" // DIGIT TWO + "$three=\ue069;" // DIGIT THREE + "$four=\ue06a;" // DIGIT FOUR + "$five=\ue06b;" // DIGIT FIVE + "$six=\ue06c;" // DIGIT SIX + "$seven=\ue06d;" // DIGIT SEVEN + "$eight=\ue06e;" // DIGIT EIGHT + "$nine=\ue06f;" // DIGIT NINE + + // For all other scripts + "$ecp0=\ue070;" + "$ecp1=\ue071;" + "$ecp2=\ue072;" + "$ecp3=\ue073;" + "$ecp4=\ue074;" + "$ecp5=\ue075;" + "$ecp6=\ue076;" + "$ecp7=\ue077;" + "$ecp8=\ue078;" + "$ecp9=\ue079;" + "$ecpA=\ue07a;" + "$ecpB=\ue07b;" + "$ecpC=\ue07c;" + "$ecpD=\ue07d;" + "$ecpE=\ue07e;" + "$ecpF=\ue07f;" + + +// \u0970>; // UNMAPPED ABBREVIATION SIGN + + 
"$depVowelAbove=[\ue03e-\ue040\ue045-\ue04c];" + "$depVowelBelow=[\ue041-\ue044];" + "$endThing=[$danda$doubleDanda \u005c\u005cu0000-\udfff\ue080-\ufffd];" + + // $x was originally called '&'; $z was '%' + "$x=[$virama$aa$ai$au$ii$i$uu$u$rrh$rh$lh$e$o$se$ce$so$co];" + "$z=[bcdfghjklmnpqrstvwxyz];" + + + //##################################################################### + // convert from Native letters to Latin letters + //##################################################################### + + //transliterations for anusvara + "$anusvara} [$ka$kha$ga$gha$nga] > n\u0307;" + "$anusvara} [$ca$cha$ja$jha$nya] > n\u0304;" + "$anusvara} [$tta$ttha$dda$ddha$nna] > n\u0323;" + "$anusvara} [$ta$tha$da$dha$na] > n ;" + "$anusvara} [$pa$pha$ba$bha$ma] > m ;" + "$anusvara} [$ya$ra$lla$la$va$ssa$sha$sa$ha] > n ;" + "$anusvara>'-'m\u0307;" + + // normal consonants + + "$cha}$x>ch;" + "$cha>cha;" + "$ca$virama}$ha>c'';" + "$ca}$x>c;" + "$ca>ca;" + "$jha}$x>jh;" + "$jha>jha;" + "$ja$virama}$ha>j'';" + "$ja}$x>j;" + "$ja>ja;" + //"$nya}$x>ny;" + //"$nya>nya;" + "$nya }$x>n\u0303 ;" + "$nya > n\u0303a ;" + + "$ttha}$x>t\u0323h;" + "$tta$virama}$ha>t\u0323'';" + "$tta}$x>t\u0323;" + "$ddha}$x>d\u0323h;" + "$dda}$x$ha>d\u0323'';" + "$dda}$x>d\u0323;" + "$dha}$x>dh;" + "$da$virama}$ha>d'';" + "$da$virama}$ddha>d'';" + "$da$virama}$dda>d'';" + "$da$virama}$dha>d'';" + //"$da$virama}$da>dda;" + "$da}$x>d;" + "$tha}$x>th;" + "$ta$virama}$ha>t'';" + "$ta$virama}$ttha>t'';" + "$ta$virama}$tta>t'';" + "$ta$virama}$tha>t'';" + "$tta>t\u0323a;" + "$ttha>t\u0323ha;" + //"$ta$virama}$ta>tta;" + "$ta}$x>t;" + "$tha>tha;" + "$ta>ta;" + "$dda>d\u0323a;" + "$dha>dha;" + "$ddha>d\u0323ha;" + "$da>da;" + "$nna}$x>n\u0323 ;" + "$nna>n\u0323a ;" + "$na$virama}$ga>n'';" + "$na$virama}$ya>n'';" + "$na}$x>n;" + "$na>na;" + + "$kha}$x>kh;" + "$kha>kha;" + "$ka$virama}$ha>k'';" + "$ka}$x>k;" + "$ka>ka;" + "$gha}$x>gh;" + "$gha>gha;" + "$ga$virama}$ha>g'';" + "$ga}$x>g;" + "$ga>ga;" + //"ng<$nga}$x;" + 
//"nga<$nga;" + "$nga}$x>n\u0307;" + "$nga>n\u0307a ;" + + "$pha}$x>ph;" + "$pha>pha;" + "$pa$virama}$ha>p'';" + "$pa}$x>p;" + "$pa>pa;" + "$bha}$x>bh;" + "$bha>bha;" + "$ba$virama}$ha>b'';" + "$ba}$x>b;" + "$ba>ba;" + "$ma$virama}$ma>m'';" + //"$ma$virama}$anusvara>m'';" + "$ma}$x>m;" + "$ma>ma;" + + "$ya}$x>y;" + "$ya>ya;" + "$ra$virama}$ha>r'';" + "$ra}$x>r;" + "$ra>ra;" + "$la$virama}$ha>l'';" + "$la}$x>l;" + "$la>la;" + "$lla$virama}$ha>l\u0323'';" + "$lla}$x>l\u0323;" + "$lla>l\u0323a;" + "$va}$x>v;" + "$va>va;" + "$sha}$x>s\u0301;" + "$ssa}$x>s\u0323;" + "$sa$virama}$ha>s'';" + "$sa$virama}$sha>s'';" + "$sa$virama}$ssa>s'';" + "$sa$virama}$sa>s'';" + "$sa}$x>s;" + "$sha>s\u0301a;" + "$ssa>s\u0323a;" + "$sa>sa;" + "$ha}$x>h;" + "$ha>ha;" + + // Urdu compatibility + "$uya}$x > y\u0307 ;" + "$uya > y\u0307a ;" + "$ela}$x > l\u0331 ;" + "$ela > l\u0331a ;" + "$ena}$x > n\u0331 ;" + "$ena > n\u0331a ;" + + "$uka}$x > q ;" + "$uka > qa ;" + "$ukha}$x > k\u0323 ;" + "$ukha > k\u0323a ;" + "$ugha}$x > g\u0307 ;" + "$ugha > g\u0307a ;" + "$ujha}$x > z ;" + "$ujha > za ;" + "$udha}$x > r\u0323h ;" + "$udha > r\u0323ha;" + "$uddha}$x> r\u0323 ;" + "$uddha > r\u0323a ;" + "$ufa}$x > f\u0323 ;" + "$ufa > f\u0323a ;" + + // dependent vowels (should never occur except following consonants) + + "$aa > a\u0304 ;" + "$ai > ai ;" + "$au > au ;" + "$ii > i\u0304 ;" + "$i > i ;" + "$uu > u\u0304 ;" + "$u > u ;" + "$rrh > r\u0325\u0304 ;" + "$rh > r\u0325 ;" + "$llh > l\u0325\u0304 ;" + "$lh > l\u0325 ;" + "$e > e\u0304 ;" + "$o > o\u0304 ;" + //extra vowels + "$ce > e\u0306 ;" + "$co > o\u0306 ;" + "$se > e ;" + "$so > o ;" + + // independent vowels (when following consonants) + + "a}$waa > ''a\u0304 ;" + "$z}$waa > ''a\u0304 ;" + "a}$wai > ''ai ;" + "$z}$wai > ''ai ;" + "a}$wau > ''au ;" + "$z}$wau > ''au ;" + "a}$wii > ''i\u0304 ;" + "$z}$wii > ''i\u0304 ;" + "a}$wi > ''i ;" + "$z}$wi > ''i ;" + "a}$wuu > ''u\u0304 ;" + "$z}$wuu > ''u\u0304 ;" + "a}$wu > ''u ;" + "$z}$wu > ''u 
;" + "$z}$wrr > ''r\u0325\u0304 ;" + "$z}$wr > ''r\u0325 ;" + "$z}$wll > ''l\u0325\u0304 ;" + "$z}$wl > ''l\u0325 ;" + "$z}$we > ''e\u0304 ;" + "$z}$wo > ''o\u0304 ;" + "a}$wa > ''a ;" + "$z}$wa > ''a ;" + //extra vowels + "$z}$wce > ''e\u0306 ;" + "$z}$wco > ''o\u0306 ;" + "$z}$wse > ''e ;" + "$z}$wso > ''o ;" + + // independent vowels (otherwise) + "$waa > a\u0304 ;" + "$wai > ai ;" + "$wau > au ;" + "$wii > i\u0304 ;" + "$wi > i ;" + "$wuu > u\u0304 ;" + "$wu > u ;" + "$wrr > r\u0325\u0304 ;" + "$wr > r\u0325 ;" + "$wll > l\u0325\u0304 ;" + "$wl > l\u0325 ;" + "$we > e\u0304 ;" + "$wo > o\u0304 ;" + "$wa > a ;" + //extra vowels + "$wce > e\u0306 ;" + "$wco > o\u0306 ;" + "$wse > e ;" + "$wso > o ;" + + //stress marks + "$avagraha > \u0315;" + "$chandrabindu$anusvara>'-'\u0303;" + "$chandrabindu > '-'m\u0310;" + "$visarga>'-'h\u0323;" + + + //numbers + "$zero > 0;" + "$one > 1;" + "$two > 2;" + "$three > 3;" + "$four > 4;" + "$five > 5;" + "$six > 6;" + "$seven > 7;" + "$eight > 8;" + "$nine > 9;" + + // blow away any remaining viramas + "$virama>;" + ":: NFC (NFD) ;" + } +} \ No newline at end of file diff --git a/icu4c/data/InterIndic_Malayalam.txt b/icu4c/data/InterIndic_Malayalam.txt index 1ae4a78ccb..4018b05c97 100644 --- a/icu4c/data/InterIndic_Malayalam.txt +++ b/icu4c/data/InterIndic_Malayalam.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Malayalam.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Malayalam.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Malayalam -InterIndic_Malayalam { +InterIndic-Malayalam { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Malayalam { //-------------------------------------------------------------------- // InterIndic-Malayalam - -"\uE001>ം;" // REMAP (indicExceptions.txt): ഁ>ം = SIGN CANDRABINDU>SIGN ANUSVARA -"\uE002>ം;" // SIGN ANUSVARA -"\uE003>ഃ;" // SIGN VISARGA -"\uE005>അ;" // LETTER A -"\uE006>ആ;" // LETTER AA -"\uE007>ഇ;" // LETTER I -"\uE008>ഈ;" // LETTER II -"\uE009>ഉ;" // LETTER U -"\uE00A>ഊ;" // LETTER UU -"\uE00B>ഋ;" // LETTER VOCALIC R -"\uE00C>ഌ;" // LETTER VOCALIC L -"\uE00F>ഏ;" // LETTER EE -"\uE010>ഐ;" // LETTER AI -"\uE013>ഓ;" // LETTER OO -"\uE014>ഔ;" // LETTER AU -"\uE015>ക;" // LETTER KA -"\uE016>ഖ;" // LETTER KHA -"\uE017>ഗ;" // LETTER GA -"\uE018>ഘ;" // LETTER GHA -"\uE019>ങ;" // LETTER NGA -"\uE01A>ച;" // LETTER CA -"\uE01B>ഛ;" // LETTER CHA -"\uE01C>ജ;" // LETTER JA -"\uE01D>ഝ;" // LETTER JHA -"\uE01E>ഞ;" // LETTER NYA -"\uE01F>ട;" // LETTER TTA -"\uE020>ഠ;" // LETTER TTHA -"\uE021>ഡ;" // LETTER DDA -"\uE022>ഢ;" // LETTER DDHA -"\uE023>ണ;" // LETTER NNA -"\uE024>ത;" // LETTER TA -"\uE025>ഥ;" // LETTER THA -"\uE026>ദ;" // LETTER DA -"\uE027>ധ;" // LETTER DHA -"\uE028>ന;" // LETTER NA -"\uE029>ന;" // REMAP (indicExceptions.txt): ഩ>ന = LETTER NNNA>LETTER NA -"\uE02A>പ;" // LETTER PA -"\uE02B>ഫ;" // LETTER PHA -"\uE02C>ബ;" // LETTER BA -"\uE02D>ഭ;" // LETTER BHA -"\uE02E>മ;" // 
LETTER MA -"\uE02F>യ;" // LETTER YA -"\uE030>ര;" // LETTER RA -"\uE032>ല;" // LETTER LA -"\uE033>ള;" // LETTER LLA -"\uE034>ഴ;" // LETTER LLLA -"\uE035>വ;" // LETTER VA -"\uE036>ശ;" // LETTER SHA -"\uE037>ഷ;" // LETTER SSA -"\uE038>സ;" // LETTER SA -"\uE039>ഹ;" // LETTER HA -// \uE03C>; // UNMAPPED InterIndic-Malayalam: SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Malayalam: SIGN AVAGRAHA -"\uE03E>ാ;" // VOWEL SIGN AA -"\uE03F>ി;" // VOWEL SIGN I -"\uE040>ീ;" // VOWEL SIGN II -"\uE041>ു;" // VOWEL SIGN U -"\uE042>ൂ;" // VOWEL SIGN UU -"\uE043>ൃ;" // VOWEL SIGN VOCALIC R -// \uE044>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC RR -"\uE045>ാ;" // REMAP (indicExceptions.txt): ൅>ാ = VOWEL SIGN CANDRA E>VOWEL SIGN AA -"\uE047>േ;" // VOWEL SIGN EE -"\uE048>ൈ;" // VOWEL SIGN AI -"\uE049>ോ;" // REMAP (indicExceptions.txt): ൉>ോ = VOWEL SIGN CANDRA O>VOWEL SIGN OO -"\uE04B>ോ;" // VOWEL SIGN OO -"\uE04C>ൌ;" // VOWEL SIGN AU -"\uE04D>്;" // SIGN VIRAMA -// \uE050>; // UNMAPPED InterIndic-Malayalam: OM -// \uE055>; // UNMAPPED InterIndic-Malayalam: LENGTH MARK -"\uE056>ൈ;" // REMAP (indicExceptions.txt): ൖ>ൈ = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ൗ;" // AU LENGTH MARK -"\uE059>ഖ;" // REMAP (indicExceptions.txt): ൙>ഖ = LETTER KHHA>LETTER KHA -"\uE05A>ഗ;" // REMAP (indicExceptions.txt): ൚>ഗ = LETTER GHHA>LETTER GA -"\uE05B>ജ;" // REMAP (indicExceptions.txt): ൛>ജ = LETTER ZA>LETTER JA -"\uE05D>ഢ;" // REMAP (indicExceptions.txt): ൝>ഢ = LETTER RHA>LETTER DDHA -"\uE05E>ഫ;" // REMAP (indicExceptions.txt): ൞>ഫ = LETTER FA>LETTER PHA -"\uE05F>യ;" // REMAP (indicExceptions.txt): ൟ>യ = LETTER YYA>LETTER YA -"\uE060>ൠ;" // LETTER VOCALIC RR -"\uE061>ൡ;" // LETTER VOCALIC LL -// \uE062>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC L -// \uE063>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC LL -"\uE066>൦;" // DIGIT ZERO -"\uE067>൧;" // DIGIT ONE -"\uE068>൨;" // DIGIT TWO -"\uE069>൩;" // DIGIT THREE -"\uE06A>൪;" // DIGIT FOUR -"\uE06B>൫;" // DIGIT FIVE 
-"\uE06C>൬;" // DIGIT SIX -"\uE06D>൭;" // DIGIT SEVEN -"\uE06E>൮;" // DIGIT EIGHT -"\uE06F>൯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Malayalam: ISSHAR -"\uE081>എ;" // LETTER E -"\uE082>ഒ;" // LETTER O -"\uE083>റ;" // LETTER RRA -"\uE084>െ;" // VOWEL SIGN E -"\uE085>ൊ;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0d02;" // REMAP (indicExceptions.txt): \u0d01>\u0d02 = SIGN CANDRABINDU>SIGN ANUSVARA +"\ue002>\u0d02;" // SIGN ANUSVARA +"\ue003>\u0d03;" // SIGN VISARGA +"\ue005>\u0d05;" // LETTER A +"\ue006>\u0d06;" // LETTER AA +"\ue007>\u0d07;" // LETTER I +"\ue008>\u0d08;" // LETTER II +"\ue009>\u0d09;" // LETTER U +"\ue00a>\u0d0a;" // LETTER UU +"\ue00b>\u0d0b;" // LETTER VOCALIC R +"\ue00c>\u0d0c;" // LETTER VOCALIC L +"\ue00f>\u0d0f;" // LETTER EE +"\ue010>\u0d10;" // LETTER AI +"\ue013>\u0d13;" // LETTER OO +"\ue014>\u0d14;" // LETTER AU +"\ue015>\u0d15;" // LETTER KA +"\ue016>\u0d16;" // LETTER KHA +"\ue017>\u0d17;" // LETTER GA +"\ue018>\u0d18;" // LETTER GHA +"\ue019>\u0d19;" // LETTER NGA +"\ue01a>\u0d1a;" // LETTER CA +"\ue01b>\u0d1b;" // LETTER CHA +"\ue01c>\u0d1c;" // LETTER JA +"\ue01d>\u0d1d;" // LETTER JHA +"\ue01e>\u0d1e;" // LETTER NYA +"\ue01f>\u0d1f;" // LETTER TTA +"\ue020>\u0d20;" // LETTER TTHA +"\ue021>\u0d21;" // LETTER DDA +"\ue022>\u0d22;" // LETTER DDHA +"\ue023>\u0d23;" // LETTER NNA +"\ue024>\u0d24;" // LETTER TA +"\ue025>\u0d25;" // LETTER THA +"\ue026>\u0d26;" // LETTER DA +"\ue027>\u0d27;" // LETTER DHA +"\ue028>\u0d28;" // LETTER NA +"\ue029>\u0d28;" // REMAP (indicExceptions.txt): \u0d29>\u0d28 = LETTER NNNA>LETTER NA +"\ue02a>\u0d2a;" // LETTER PA +"\ue02b>\u0d2b;" // LETTER PHA +"\ue02c>\u0d2c;" // LETTER BA +"\ue02d>\u0d2d;" // LETTER BHA +"\ue02e>\u0d2e;" // LETTER MA +"\ue02f>\u0d2f;" // LETTER YA +"\ue030>\u0d30;" // LETTER RA +"\ue032>\u0d32;" // LETTER LA +"\ue033>\u0d33;" // LETTER LLA +"\ue034>\u0d34;" // LETTER LLLA +"\ue035>\u0d35;" // LETTER VA +"\ue036>\u0d36;" // LETTER SHA +"\ue037>\u0d37;" // LETTER SSA 
+"\ue038>\u0d38;" // LETTER SA +"\ue039>\u0d39;" // LETTER HA +// \ue03c>; // UNMAPPED InterIndic-Malayalam: SIGN NUKTA +// \ue03d>; // UNMAPPED InterIndic-Malayalam: SIGN AVAGRAHA +"\ue03e>\u0d3e;" // VOWEL SIGN AA +"\ue03f>\u0d3f;" // VOWEL SIGN I +"\ue040>\u0d40;" // VOWEL SIGN II +"\ue041>\u0d41;" // VOWEL SIGN U +"\ue042>\u0d42;" // VOWEL SIGN UU +"\ue043>\u0d43;" // VOWEL SIGN VOCALIC R +// \ue044>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC RR +"\ue045>\u0d3e;" // REMAP (indicExceptions.txt): \u0d45>\u0d3e = VOWEL SIGN CANDRA E>VOWEL SIGN AA +"\ue047>\u0d47;" // VOWEL SIGN EE +"\ue048>\u0d48;" // VOWEL SIGN AI +"\ue049>\u0d4b;" // REMAP (indicExceptions.txt): \u0d49>\u0d4b = VOWEL SIGN CANDRA O>VOWEL SIGN OO +"\ue04b>\u0d4b;" // VOWEL SIGN OO +"\ue04c>\u0d4c;" // VOWEL SIGN AU +"\ue04d>\u0d4d;" // SIGN VIRAMA +// \ue050>; // UNMAPPED InterIndic-Malayalam: OM +// \ue055>; // UNMAPPED InterIndic-Malayalam: LENGTH MARK +"\ue056>\u0d48;" // REMAP (indicExceptions.txt): \u0d56>\u0d48 = AI LENGTH MARK>VOWEL SIGN AI +"\ue057>\u0d57;" // AU LENGTH MARK +"\ue059>\u0d16;" // REMAP (indicExceptions.txt): \u0d59>\u0d16 = LETTER KHHA>LETTER KHA +"\ue05a>\u0d17;" // REMAP (indicExceptions.txt): \u0d5a>\u0d17 = LETTER GHHA>LETTER GA +"\ue05b>\u0d1c;" // REMAP (indicExceptions.txt): \u0d5b>\u0d1c = LETTER ZA>LETTER JA +"\ue05d>\u0d22;" // REMAP (indicExceptions.txt): \u0d5d>\u0d22 = LETTER RHA>LETTER DDHA +"\ue05e>\u0d2b;" // REMAP (indicExceptions.txt): \u0d5e>\u0d2b = LETTER FA>LETTER PHA +"\ue05f>\u0d2f;" // REMAP (indicExceptions.txt): \u0d5f>\u0d2f = LETTER YYA>LETTER YA +"\ue060>\u0d60;" // LETTER VOCALIC RR +"\ue061>\u0d61;" // LETTER VOCALIC LL +// \ue062>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC L +// \ue063>; // UNMAPPED InterIndic-Malayalam: VOWEL SIGN VOCALIC LL +"\ue066>\u0d66;" // DIGIT ZERO +"\ue067>\u0d67;" // DIGIT ONE +"\ue068>\u0d68;" // DIGIT TWO +"\ue069>\u0d69;" // DIGIT THREE +"\ue06a>\u0d6a;" // DIGIT FOUR +"\ue06b>\u0d6b;" // 
DIGIT FIVE +"\ue06c>\u0d6c;" // DIGIT SIX +"\ue06d>\u0d6d;" // DIGIT SEVEN +"\ue06e>\u0d6e;" // DIGIT EIGHT +"\ue06f>\u0d6f;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Malayalam: ISSHAR +"\ue00e>\u0d0e;" // LETTER E +"\ue012>\u0d12;" // LETTER O +"\ue031>\u0d31;" // LETTER RRA +"\ue046>\u0d46;" // VOWEL SIGN E +"\ue04a>\u0d4a;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Oriya.txt b/icu4c/data/InterIndic_Oriya.txt index 1f93fd52f0..88033d6cba 100644 --- a/icu4c/data/InterIndic_Oriya.txt +++ b/icu4c/data/InterIndic_Oriya.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Oriya.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Oriya.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Oriya -InterIndic_Oriya { +InterIndic-Oriya { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Oriya { //-------------------------------------------------------------------- // InterIndic-Oriya - -"\uE001>ଁ;" // SIGN CANDRABINDU -"\uE002>ଂ;" // SIGN ANUSVARA -"\uE003>ଃ;" // SIGN VISARGA -"\uE005>ଅ;" // LETTER A -"\uE006>ଆ;" // LETTER AA -"\uE007>ଇ;" // LETTER I -"\uE008>ଈ;" // LETTER II -"\uE009>ଉ;" // LETTER U -"\uE00A>ଊ;" // LETTER UU -"\uE00B>ଋ;" // LETTER VOCALIC R -"\uE00C>ଌ;" // LETTER VOCALIC L -// \uE00F>; // UNMAPPED InterIndic-Oriya: LETTER EE (ଏ = LETTER E) -"\uE010>ଐ;" // LETTER AI -// \uE013>; // 
UNMAPPED InterIndic-Oriya: LETTER OO (ଓ = LETTER O) -"\uE014>ଔ;" // LETTER AU -"\uE015>କ;" // LETTER KA -"\uE016>ଖ;" // LETTER KHA -"\uE017>ଗ;" // LETTER GA -"\uE018>ଘ;" // LETTER GHA -"\uE019>ଙ;" // LETTER NGA -"\uE01A>ଚ;" // LETTER CA -"\uE01B>ଛ;" // LETTER CHA -"\uE01C>ଜ;" // LETTER JA -"\uE01D>ଝ;" // LETTER JHA -"\uE01E>ଞ;" // LETTER NYA -"\uE01F>ଟ;" // LETTER TTA -"\uE020>ଠ;" // LETTER TTHA -"\uE021>ଡ;" // LETTER DDA -"\uE022>ଢ;" // LETTER DDHA -"\uE023>ଣ;" // LETTER NNA -"\uE024>ତ;" // LETTER TA -"\uE025>ଥ;" // LETTER THA -"\uE026>ଦ;" // LETTER DA -"\uE027>ଧ;" // LETTER DHA -"\uE028>ନ;" // LETTER NA -"\uE029>ନ;" // REMAP (indicExceptions.txt): ଩>ନ = LETTER NNNA>LETTER NA -"\uE02A>ପ;" // LETTER PA -"\uE02B>ଫ;" // LETTER PHA -"\uE02C>ବ;" // LETTER BA -"\uE02D>ଭ;" // LETTER BHA -"\uE02E>ମ;" // LETTER MA -"\uE02F>ଯ;" // LETTER YA -"\uE030>ର;" // LETTER RA -"\uE032>ଲ;" // LETTER LA -"\uE033>ଳ;" // LETTER LLA -"\uE034>ଳ;" // REMAP (indicExceptions.txt): ଴>ଳ = LETTER LLLA>LETTER LLA -"\uE035>ବ;" // REMAP (indicExceptions.txt): ଵ>ବ = LETTER VA>LETTER BA -"\uE036>ଶ;" // LETTER SHA -"\uE037>ଷ;" // LETTER SSA -"\uE038>ସ;" // LETTER SA -"\uE039>ହ;" // LETTER HA -"\uE03C>଼;" // SIGN NUKTA -"\uE03D>ଽ;" // SIGN AVAGRAHA -"\uE03E>ା;" // VOWEL SIGN AA -"\uE03F>ି;" // VOWEL SIGN I -"\uE040>ୀ;" // VOWEL SIGN II -"\uE041>ୁ;" // VOWEL SIGN U -"\uE042>ୂ;" // VOWEL SIGN UU -"\uE043>ୃ;" // VOWEL SIGN VOCALIC R -"\uE044>ୃ଼;" // REMAP (indicExceptions.txt): ୄ>ୃ଼ = VOWEL SIGN VOCALIC RR>VOWEL SIGN VOCALIC R.SIGN NUKTA -"\uE045>େ;" // REMAP (indicExceptions.txt): ୅>େ = VOWEL SIGN CANDRA E>VOWEL SIGN E -// \uE047>; // UNMAPPED InterIndic-Oriya: VOWEL SIGN EE (େ = VOWEL SIGN E) -"\uE048>ୈ;" // VOWEL SIGN AI -"\uE049>ୋ;" // REMAP (indicExceptions.txt): ୉>ୋ = VOWEL SIGN CANDRA O>VOWEL SIGN O -// \uE04B>; // UNMAPPED InterIndic-Oriya: VOWEL SIGN OO (ୋ = VOWEL SIGN O) -"\uE04C>ୌ;" // VOWEL SIGN AU -"\uE04D>୍;" // SIGN VIRAMA -"\uE050>ଓଁ;" // REMAP (indicExceptions.txt): ୐>ଓଁ = OM>LETTER 
O.SIGN CANDRABINDU -// \uE055>; // UNMAPPED InterIndic-Oriya: LENGTH MARK -"\uE056>ୖ;" // AI LENGTH MARK -"\uE057>ୗ;" // AU LENGTH MARK -"\uE059>ଖ଼;" // REMAP (indicExceptions.txt): ୙>ଖ଼ = LETTER KHHA>LETTER KHA.SIGN NUKTA -"\uE05A>ଗ଼;" // REMAP (indicExceptions.txt): ୚>ଗ଼ = LETTER GHHA>LETTER GA.SIGN NUKTA -"\uE05B>ଜ଼;" // REMAP (indicExceptions.txt): ୛>ଜ଼ = LETTER ZA>LETTER JA.SIGN NUKTA -"\uE05D>ଢ଼;" // LETTER RHA -"\uE05E>ଫ଼;" // REMAP (indicExceptions.txt): ୞>ଫ଼ = LETTER FA>LETTER PHA.SIGN NUKTA -"\uE05F>ୟ;" // LETTER YYA -"\uE060>ୠ;" // LETTER VOCALIC RR -"\uE061>ୡ;" // LETTER VOCALIC LL -"\uE062>ୖ଼;" // REMAP (indicExceptions.txt): ୢ>ୖ଼ = VOWEL SIGN VOCALIC L>AI LENGTH MARK.SIGN NUKTA -"\uE063>ୗ଼;" // REMAP (indicExceptions.txt): ୣ>ୗ଼ = VOWEL SIGN VOCALIC LL>AU LENGTH MARK.SIGN NUKTA -"\uE066>୦;" // DIGIT ZERO -"\uE067>୧;" // DIGIT ONE -"\uE068>୨;" // DIGIT TWO -"\uE069>୩;" // DIGIT THREE -"\uE06A>୪;" // DIGIT FOUR -"\uE06B>୫;" // DIGIT FIVE -"\uE06C>୬;" // DIGIT SIX -"\uE06D>୭;" // DIGIT SEVEN -"\uE06E>୮;" // DIGIT EIGHT -"\uE06F>୯;" // DIGIT NINE -"\uE080>୰;" // ISSHAR -"\uE081>ଏ;" // LETTER E -"\uE082>ଓ;" // LETTER O -"\uE083>ଡ଼;" // LETTER RRA -"\uE084>େ;" // VOWEL SIGN E -"\uE085>ୋ;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0b01;" // SIGN CANDRABINDU +"\ue002>\u0b02;" // SIGN ANUSVARA +"\ue003>\u0b03;" // SIGN VISARGA +"\ue005>\u0b05;" // LETTER A +"\ue006>\u0b06;" // LETTER AA +"\ue007>\u0b07;" // LETTER I +"\ue008>\u0b08;" // LETTER II +"\ue009>\u0b09;" // LETTER U +"\ue00a>\u0b0a;" // LETTER UU +"\ue00b>\u0b0b;" // LETTER VOCALIC R +"\ue00c>\u0b0c;" // LETTER VOCALIC L +// \ue00f>; // UNMAPPED InterIndic-Oriya: LETTER EE (\u0b0f = LETTER E) +"\ue010>\u0b10;" // LETTER AI +// \ue013>; // UNMAPPED InterIndic-Oriya: LETTER OO (\u0b13 = LETTER O) +"\ue014>\u0b14;" // LETTER AU +"\ue015>\u0b15;" // LETTER KA +"\ue016>\u0b16;" // LETTER KHA +"\ue017>\u0b17;" // LETTER GA +"\ue018>\u0b18;" // LETTER GHA +"\ue019>\u0b19;" // LETTER NGA 
+"\ue01a>\u0b1a;" // LETTER CA +"\ue01b>\u0b1b;" // LETTER CHA +"\ue01c>\u0b1c;" // LETTER JA +"\ue01d>\u0b1d;" // LETTER JHA +"\ue01e>\u0b1e;" // LETTER NYA +"\ue01f>\u0b1f;" // LETTER TTA +"\ue020>\u0b20;" // LETTER TTHA +"\ue021>\u0b21;" // LETTER DDA +"\ue022>\u0b22;" // LETTER DDHA +"\ue023>\u0b23;" // LETTER NNA +"\ue024>\u0b24;" // LETTER TA +"\ue025>\u0b25;" // LETTER THA +"\ue026>\u0b26;" // LETTER DA +"\ue027>\u0b27;" // LETTER DHA +"\ue028>\u0b28;" // LETTER NA +"\ue029>\u0b28;" // REMAP (indicExceptions.txt): \u0b29>\u0b28 = LETTER NNNA>LETTER NA +"\ue02a>\u0b2a;" // LETTER PA +"\ue02b>\u0b2b;" // LETTER PHA +"\ue02c>\u0b2c;" // LETTER BA +"\ue02d>\u0b2d;" // LETTER BHA +"\ue02e>\u0b2e;" // LETTER MA +"\ue02f>\u0b2f;" // LETTER YA +"\ue030>\u0b30;" // LETTER RA +"\ue032>\u0b32;" // LETTER LA +"\ue033>\u0b33;" // LETTER LLA +"\ue034>\u0b33;" // REMAP (indicExceptions.txt): \u0b34>\u0b33 = LETTER LLLA>LETTER LLA +"\ue035>\u0b2c;" // REMAP (indicExceptions.txt): \u0b35>\u0b2c = LETTER VA>LETTER BA +"\ue036>\u0b36;" // LETTER SHA +"\ue037>\u0b37;" // LETTER SSA +"\ue038>\u0b38;" // LETTER SA +"\ue039>\u0b39;" // LETTER HA +"\ue03c>\u0b3c;" // SIGN NUKTA +"\ue03d>\u0b3d;" // SIGN AVAGRAHA +"\ue03e>\u0b3e;" // VOWEL SIGN AA +"\ue03f>\u0b3f;" // VOWEL SIGN I +"\ue040>\u0b40;" // VOWEL SIGN II +"\ue041>\u0b41;" // VOWEL SIGN U +"\ue042>\u0b42;" // VOWEL SIGN UU +"\ue043>\u0b43;" // VOWEL SIGN VOCALIC R +"\ue044>\u0b43\u0b3c;" // REMAP (indicExceptions.txt): \u0b44>\u0b43\u0b3c = VOWEL SIGN VOCALIC RR>VOWEL SIGN VOCALIC R.SIGN NUKTA +"\ue045>\u0b47;" // REMAP (indicExceptions.txt): \u0b45>\u0b47 = VOWEL SIGN CANDRA E>VOWEL SIGN E +// \ue047>; // UNMAPPED InterIndic-Oriya: VOWEL SIGN EE (\u0b47 = VOWEL SIGN E) +"\ue048>\u0b48;" // VOWEL SIGN AI +"\ue049>\u0b4b;" // REMAP (indicExceptions.txt): \u0b49>\u0b4b = VOWEL SIGN CANDRA O>VOWEL SIGN O +// \ue04b>; // UNMAPPED InterIndic-Oriya: VOWEL SIGN OO (\u0b4b = VOWEL SIGN O) +"\ue04c>\u0b4c;" // VOWEL SIGN AU 
+"\ue04d>\u0b4d;" // SIGN VIRAMA +"\ue050>\u0b13\u0b01;" // REMAP (indicExceptions.txt): \u0b50>\u0b13\u0b01 = OM>LETTER O.SIGN CANDRABINDU +// \ue055>; // UNMAPPED InterIndic-Oriya: LENGTH MARK +"\ue056>\u0b56;" // AI LENGTH MARK +"\ue057>\u0b57;" // AU LENGTH MARK +"\ue059>\u0b16\u0b3c;" // REMAP (indicExceptions.txt): \u0b59>\u0b16\u0b3c = LETTER KHHA>LETTER KHA.SIGN NUKTA +"\ue05a>\u0b17\u0b3c;" // REMAP (indicExceptions.txt): \u0b5a>\u0b17\u0b3c = LETTER GHHA>LETTER GA.SIGN NUKTA +"\ue05b>\u0b1c\u0b3c;" // REMAP (indicExceptions.txt): \u0b5b>\u0b1c\u0b3c = LETTER ZA>LETTER JA.SIGN NUKTA +"\ue05d>\u0b5d;" // LETTER RHA +"\ue05e>\u0b2b\u0b3c;" // REMAP (indicExceptions.txt): \u0b5e>\u0b2b\u0b3c = LETTER FA>LETTER PHA.SIGN NUKTA +"\ue05f>\u0b5f;" // LETTER YYA +"\ue060>\u0b60;" // LETTER VOCALIC RR +"\ue061>\u0b61;" // LETTER VOCALIC LL +"\ue062>\u0b56\u0b3c;" // REMAP (indicExceptions.txt): \u0b62>\u0b56\u0b3c = VOWEL SIGN VOCALIC L>AI LENGTH MARK.SIGN NUKTA +"\ue063>\u0b57\u0b3c;" // REMAP (indicExceptions.txt): \u0b63>\u0b57\u0b3c = VOWEL SIGN VOCALIC LL>AU LENGTH MARK.SIGN NUKTA +"\ue066>\u0b66;" // DIGIT ZERO +"\ue067>\u0b67;" // DIGIT ONE +"\ue068>\u0b68;" // DIGIT TWO +"\ue069>\u0b69;" // DIGIT THREE +"\ue06a>\u0b6a;" // DIGIT FOUR +"\ue06b>\u0b6b;" // DIGIT FIVE +"\ue06c>\u0b6c;" // DIGIT SIX +"\ue06d>\u0b6d;" // DIGIT SEVEN +"\ue06e>\u0b6e;" // DIGIT EIGHT +"\ue06f>\u0b6f;" // DIGIT NINE +"\ue070>\u0b70;" // ISSHAR +"\ue00e>\u0b0f;" // LETTER E +"\ue013>\u0b13;" // LETTER O +"\ue031>\u0b5c;" // LETTER RRA +"\ue047>\u0b47;" // VOWEL SIGN E +"\ue04b>\u0b4b;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Tamil.txt b/icu4c/data/InterIndic_Tamil.txt index 7e833143b0..c23e330347 100644 --- a/icu4c/data/InterIndic_Tamil.txt +++ b/icu4c/data/InterIndic_Tamil.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business 
Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Tamil.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Tamil.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Tamil -InterIndic_Tamil { +InterIndic-Tamil { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Tamil { //-------------------------------------------------------------------- // InterIndic-Tamil - -// \uE001>; // UNMAPPED InterIndic-Tamil: SIGN CANDRABINDU -"\uE002>ஂ;" // SIGN ANUSVARA -"\uE003>ஃ;" // SIGN VISARGA -"\uE005>அ;" // LETTER A -"\uE006>ஆ;" // LETTER AA -"\uE007>இ;" // LETTER I -"\uE008>ஈ;" // LETTER II -"\uE009>உ;" // LETTER U -"\uE00A>ஊ;" // LETTER UU -"\uE00B>ரி;" // REMAP (indicExceptions.txt): ஋>ரி = LETTER VOCALIC R>LETTER RA.VOWEL SIGN I -"\uE00C>இ;" // REMAP (indicExceptions.txt): ஌>இ = LETTER VOCALIC L>LETTER I -"\uE00F>ஏ;" // LETTER EE -"\uE010>ஐ;" // LETTER AI -"\uE013>ஓ;" // LETTER OO -"\uE014>ஔ;" // LETTER AU -"\uE015>க;" // LETTER KA -"\uE016>க;" // REMAP (indicExceptions.txt): ஖>க = LETTER KHA>LETTER KA -"\uE017>க;" // REMAP (indicExceptions.txt): ஗>க = LETTER GA>LETTER KA -"\uE018>க;" // REMAP (indicExceptions.txt): ஘>க = LETTER GHA>LETTER KA -"\uE019>ங;" // LETTER NGA -"\uE01A>ச;" // LETTER CA -"\uE01B>ச;" // REMAP (indicExceptions.txt): ஛>ச = LETTER CHA>LETTER CA -"\uE01C>ஜ;" // LETTER JA -"\uE01D>ச;" // REMAP (indicExceptions.txt): ஝>ச = LETTER JHA>LETTER CA -"\uE01E>ஞ;" // LETTER NYA -"\uE01F>ட;" // LETTER TTA -"\uE020>ட;" // REMAP (indicExceptions.txt): ஠>ட = LETTER TTHA>LETTER TTA -"\uE021>ட;" // REMAP 
(indicExceptions.txt): ஡>ட = LETTER DDA>LETTER TTA -"\uE022>ட;" // REMAP (indicExceptions.txt): ஢>ட = LETTER DDHA>LETTER TTA -"\uE023>ண;" // LETTER NNA -"\uE024>த;" // LETTER TA -"\uE025>த;" // REMAP (indicExceptions.txt): ஥>த = LETTER THA>LETTER TA -"\uE026>த;" // REMAP (indicExceptions.txt): ஦>த = LETTER DA>LETTER TA -"\uE027>த;" // REMAP (indicExceptions.txt): ஧>த = LETTER DHA>LETTER TA -"\uE028>ந;" // LETTER NA -"\uE029>ன;" // LETTER NNNA -"\uE02A>ப;" // LETTER PA -"\uE02B>ப;" // REMAP (indicExceptions.txt): ஫>ப = LETTER PHA>LETTER PA -"\uE02C>ப;" // REMAP (indicExceptions.txt): ஬>ப = LETTER BA>LETTER PA -"\uE02D>ப;" // REMAP (indicExceptions.txt): ஭>ப = LETTER BHA>LETTER PA -"\uE02E>ம;" // LETTER MA -"\uE02F>ய;" // LETTER YA -"\uE030>ர;" // LETTER RA -"\uE032>ல;" // LETTER LA -"\uE033>ள;" // LETTER LLA -"\uE034>ழ;" // LETTER LLLA -"\uE035>வ;" // LETTER VA -"\uE036>ஷ;" // REMAP (indicExceptions.txt): ஶ>ஷ = LETTER SHA>LETTER SSA -"\uE037>ஷ;" // LETTER SSA -"\uE038>ஸ;" // LETTER SA -"\uE039>ஹ;" // LETTER HA -// \uE03C>; // UNMAPPED InterIndic-Tamil: SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Tamil: SIGN AVAGRAHA -"\uE03E>ா;" // VOWEL SIGN AA -"\uE03F>ி;" // VOWEL SIGN I -"\uE040>ீ;" // VOWEL SIGN II -"\uE041>ு;" // VOWEL SIGN U -"\uE042>ூ;" // VOWEL SIGN UU -"\uE043>்ரி;" // REMAP (indicExceptions.txt): ௃>்ரி = VOWEL SIGN VOCALIC R>SIGN VIRAMA.LETTER RA.VOWEL SIGN I -"\uE044>்ரி;" // REMAP (indicExceptions.txt): ௄>்ரி = VOWEL SIGN VOCALIC RR>SIGN VIRAMA.LETTER RA.VOWEL SIGN I -"\uE045>ா;" // REMAP (indicExceptions.txt): ௅>ா = VOWEL SIGN CANDRA E>VOWEL SIGN AA -"\uE047>ே;" // VOWEL SIGN EE -"\uE048>ை;" // VOWEL SIGN AI -"\uE049>ா;" // REMAP (indicExceptions.txt): ௉>ா = VOWEL SIGN CANDRA O>VOWEL SIGN AA -"\uE04B>ோ;" // VOWEL SIGN OO -"\uE04C>ௌ;" // VOWEL SIGN AU -"\uE04D>்;" // SIGN VIRAMA -"\uE050>ஓம்;" // REMAP (indicExceptions.txt): ௐ>ஓம் = OM>LETTER OO.LETTER MA.SIGN VIRAMA -// \uE055>; // UNMAPPED InterIndic-Tamil: LENGTH MARK -"\uE056>ை;" // REMAP 
(indicExceptions.txt): ௖>ை = AI LENGTH MARK>VOWEL SIGN AI -"\uE057>ௗ;" // AU LENGTH MARK -"\uE059>க;" // REMAP (indicExceptions.txt): ௙>க = LETTER KHHA>LETTER KA -"\uE05A>க;" // REMAP (indicExceptions.txt): ௚>க = LETTER GHHA>LETTER KA -"\uE05B>ஜ;" // REMAP (indicExceptions.txt): ௛>ஜ = LETTER ZA>LETTER JA -"\uE05D>ட;" // REMAP (indicExceptions.txt): ௝>ட = LETTER RHA>LETTER TTA -"\uE05E>ப;" // REMAP (indicExceptions.txt): ௞>ப = LETTER FA>LETTER PA -"\uE05F>ய;" // REMAP (indicExceptions.txt): ௟>ய = LETTER YYA>LETTER YA -"\uE060>ரி;" // REMAP (indicExceptions.txt): ௠>ரி = LETTER VOCALIC RR>LETTER RA.VOWEL SIGN I -"\uE061>ஈ;" // REMAP (indicExceptions.txt): ௡>ஈ = LETTER VOCALIC LL>LETTER II -// \uE062>; // UNMAPPED InterIndic-Tamil: VOWEL SIGN VOCALIC L -// \uE063>; // UNMAPPED InterIndic-Tamil: VOWEL SIGN VOCALIC LL -// \uE066>; // UNMAPPED InterIndic-Tamil: DIGIT ZERO -"\uE067>௧;" // DIGIT ONE -"\uE068>௨;" // DIGIT TWO -"\uE069>௩;" // DIGIT THREE -"\uE06A>௪;" // DIGIT FOUR -"\uE06B>௫;" // DIGIT FIVE -"\uE06C>௬;" // DIGIT SIX -"\uE06D>௭;" // DIGIT SEVEN -"\uE06E>௮;" // DIGIT EIGHT -"\uE06F>௯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Tamil: ISSHAR -"\uE081>எ;" // LETTER E -"\uE082>ஒ;" // LETTER O -"\uE083>ற;" // LETTER RRA -"\uE084>ெ;" // VOWEL SIGN E -"\uE085>ொ;" // VOWEL SIGN O - +":: NFD (NFC) ;" +// \ue001>; // UNMAPPED InterIndic-Tamil: SIGN CANDRABINDU +"\ue002>\u0b82;" // SIGN ANUSVARA +"\ue003>\u0b83;" // SIGN VISARGA +"\ue005>\u0b85;" // LETTER A +"\ue006>\u0b86;" // LETTER AA +"\ue007>\u0b87;" // LETTER I +"\ue008>\u0b88;" // LETTER II +"\ue009>\u0b89;" // LETTER U +"\ue00a>\u0b8a;" // LETTER UU +"\ue00b>\u0bb0\u0bbf;" // REMAP (indicExceptions.txt): \u0b8b>\u0bb0\u0bbf = LETTER VOCALIC R>LETTER RA.VOWEL SIGN I +"\ue00c>\u0b87;" // REMAP (indicExceptions.txt): \u0b8c>\u0b87 = LETTER VOCALIC L>LETTER I +"\ue00f>\u0b8f;" // LETTER EE +"\ue010>\u0b90;" // LETTER AI +"\ue013>\u0b93;" // LETTER OO +"\ue014>\u0b94;" // LETTER AU +"\ue015>\u0b95;" // LETTER 
KA +"\ue016>\u0b95;" // REMAP (indicExceptions.txt): \u0b96>\u0b95 = LETTER KHA>LETTER KA +"\ue017>\u0b95;" // REMAP (indicExceptions.txt): \u0b97>\u0b95 = LETTER GA>LETTER KA +"\ue018>\u0b95;" // REMAP (indicExceptions.txt): \u0b98>\u0b95 = LETTER GHA>LETTER KA +"\ue019>\u0b99;" // LETTER NGA +"\ue01a>\u0b9a;" // LETTER CA +"\ue01b>\u0b9a;" // REMAP (indicExceptions.txt): \u0b9b>\u0b9a = LETTER CHA>LETTER CA +"\ue01c>\u0b9c;" // LETTER JA +"\ue01d>\u0b9a;" // REMAP (indicExceptions.txt): \u0b9d>\u0b9a = LETTER JHA>LETTER CA +"\ue01e>\u0b9e;" // LETTER NYA +"\ue01f>\u0b9f;" // LETTER TTA +"\ue020>\u0b9f;" // REMAP (indicExceptions.txt): \u0ba0>\u0b9f = LETTER TTHA>LETTER TTA +"\ue021>\u0b9f;" // REMAP (indicExceptions.txt): \u0ba1>\u0b9f = LETTER DDA>LETTER TTA +"\ue022>\u0b9f;" // REMAP (indicExceptions.txt): \u0ba2>\u0b9f = LETTER DDHA>LETTER TTA +"\ue023>\u0ba3;" // LETTER NNA +"\ue024>\u0ba4;" // LETTER TA +"\ue025>\u0ba4;" // REMAP (indicExceptions.txt): \u0ba5>\u0ba4 = LETTER THA>LETTER TA +"\ue026>\u0ba4;" // REMAP (indicExceptions.txt): \u0ba6>\u0ba4 = LETTER DA>LETTER TA +"\ue027>\u0ba4;" // REMAP (indicExceptions.txt): \u0ba7>\u0ba4 = LETTER DHA>LETTER TA +"\ue028>\u0ba8;" // LETTER NA +"\ue029>\u0ba9;" // LETTER NNNA +"\ue02a>\u0baa;" // LETTER PA +"\ue02b>\u0baa;" // REMAP (indicExceptions.txt): \u0bab>\u0baa = LETTER PHA>LETTER PA +"\ue02c>\u0baa;" // REMAP (indicExceptions.txt): \u0bac>\u0baa = LETTER BA>LETTER PA +"\ue02d>\u0baa;" // REMAP (indicExceptions.txt): \u0bad>\u0baa = LETTER BHA>LETTER PA +"\ue02e>\u0bae;" // LETTER MA +"\ue02f>\u0baf;" // LETTER YA +"\ue030>\u0bb0;" // LETTER RA +"\ue032>\u0bb2;" // LETTER LA +"\ue033>\u0bb3;" // LETTER LLA +"\ue034>\u0bb4;" // LETTER LLLA +"\ue035>\u0bb5;" // LETTER VA +"\ue036>\u0bb7;" // REMAP (indicExceptions.txt): \u0bb6>\u0bb7 = LETTER SHA>LETTER SSA +"\ue037>\u0bb7;" // LETTER SSA +"\ue038>\u0bb8;" // LETTER SA +"\ue039>\u0bb9;" // LETTER HA +// \ue03c>; // UNMAPPED InterIndic-Tamil: SIGN NUKTA +// 
\ue03d>; // UNMAPPED InterIndic-Tamil: SIGN AVAGRAHA +"\ue03e>\u0bbe;" // VOWEL SIGN AA +"\ue03f>\u0bbf;" // VOWEL SIGN I +"\ue040>\u0bc0;" // VOWEL SIGN II +"\ue041>\u0bc1;" // VOWEL SIGN U +"\ue042>\u0bc2;" // VOWEL SIGN UU +"\ue043>\u0bcd\u0bb0\u0bbf;" // REMAP (indicExceptions.txt): \u0bc3>\u0bcd\u0bb0\u0bbf = VOWEL SIGN VOCALIC R>SIGN VIRAMA.LETTER RA.VOWEL SIGN I +"\ue044>\u0bcd\u0bb0\u0bbf;" // REMAP (indicExceptions.txt): \u0bc4>\u0bcd\u0bb0\u0bbf = VOWEL SIGN VOCALIC RR>SIGN VIRAMA.LETTER RA.VOWEL SIGN I +"\ue045>\u0bbe;" // REMAP (indicExceptions.txt): \u0bc5>\u0bbe = VOWEL SIGN CANDRA E>VOWEL SIGN AA +"\ue047>\u0bc7;" // VOWEL SIGN EE +"\ue048>\u0bc8;" // VOWEL SIGN AI +"\ue049>\u0bbe;" // REMAP (indicExceptions.txt): \u0bc9>\u0bbe = VOWEL SIGN CANDRA O>VOWEL SIGN AA +"\ue04b>\u0bcb;" // VOWEL SIGN OO +"\ue04c>\u0bcc;" // VOWEL SIGN AU +"\ue04d>\u0bcd;" // SIGN VIRAMA +"\ue050>\u0b93\u0bae\u0bcd;" // REMAP (indicExceptions.txt): \u0bd0>\u0b93\u0bae\u0bcd = OM>LETTER OO.LETTER MA.SIGN VIRAMA +// \ue055>; // UNMAPPED InterIndic-Tamil: LENGTH MARK +"\ue056>\u0bc8;" // REMAP (indicExceptions.txt): \u0bd6>\u0bc8 = AI LENGTH MARK>VOWEL SIGN AI +"\ue057>\u0bd7;" // AU LENGTH MARK +"\ue059>\u0b95;" // REMAP (indicExceptions.txt): \u0bd9>\u0b95 = LETTER KHHA>LETTER KA +"\ue05a>\u0b95;" // REMAP (indicExceptions.txt): \u0bda>\u0b95 = LETTER GHHA>LETTER KA +"\ue05b>\u0b9c;" // REMAP (indicExceptions.txt): \u0bdb>\u0b9c = LETTER ZA>LETTER JA +"\ue05d>\u0b9f;" // REMAP (indicExceptions.txt): \u0bdd>\u0b9f = LETTER RHA>LETTER TTA +"\ue05e>\u0baa;" // REMAP (indicExceptions.txt): \u0bde>\u0baa = LETTER FA>LETTER PA +"\ue05f>\u0baf;" // REMAP (indicExceptions.txt): \u0bdf>\u0baf = LETTER YYA>LETTER YA +"\ue060>\u0bb0\u0bbf;" // REMAP (indicExceptions.txt): \u0be0>\u0bb0\u0bbf = LETTER VOCALIC RR>LETTER RA.VOWEL SIGN I +"\ue061>\u0b88;" // REMAP (indicExceptions.txt): \u0be1>\u0b88 = LETTER VOCALIC LL>LETTER II +// \ue062>; // UNMAPPED InterIndic-Tamil: VOWEL SIGN 
VOCALIC L +// \ue063>; // UNMAPPED InterIndic-Tamil: VOWEL SIGN VOCALIC LL +// \ue066>; // UNMAPPED InterIndic-Tamil: DIGIT ZERO +"\ue067>\u0be7;" // DIGIT ONE +"\ue068>\u0be8;" // DIGIT TWO +"\ue069>\u0be9;" // DIGIT THREE +"\ue06a>\u0bea;" // DIGIT FOUR +"\ue06b>\u0beb;" // DIGIT FIVE +"\ue06c>\u0bec;" // DIGIT SIX +"\ue06d>\u0bed;" // DIGIT SEVEN +"\ue06e>\u0bee;" // DIGIT EIGHT +"\ue06f>\u0bef;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Tamil: ISSHAR +"\ue00e>\u0b8e;" // LETTER E +"\ue012>\u0b92;" // LETTER O +"\ue031>\u0bb1;" // LETTER RRA +"\ue046>\u0bc6;" // VOWEL SIGN E +"\ue04a>\u0bca;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/InterIndic_Telugu.txt b/icu4c/data/InterIndic_Telugu.txt index d49ab3bbb1..756b21dbc0 100644 --- a/icu4c/data/InterIndic_Telugu.txt +++ b/icu4c/data/InterIndic_Telugu.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_InterIndic_Telugu.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_InterIndic_Telugu.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // InterIndic_Telugu -InterIndic_Telugu { +InterIndic-Telugu { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,105 +20,105 @@ InterIndic_Telugu { //-------------------------------------------------------------------- // InterIndic-Telugu - -"\uE001>ఁ;" // SIGN CANDRABINDU -"\uE002>ం;" // SIGN ANUSVARA -"\uE003>ః;" // SIGN VISARGA -"\uE005>అ;" // LETTER A -"\uE006>ఆ;" // LETTER AA -"\uE007>ఇ;" // LETTER I -"\uE008>ఈ;" // LETTER II -"\uE009>ఉ;" // LETTER U -"\uE00A>ఊ;" // LETTER UU -"\uE00B>ఋ;" // LETTER VOCALIC R -"\uE00C>ఌ;" // LETTER VOCALIC L -"\uE00F>ఏ;" // LETTER EE -"\uE010>ఐ;" // LETTER AI -"\uE013>ఓ;" // LETTER OO -"\uE014>ఔ;" // LETTER AU -"\uE015>క;" // LETTER KA -"\uE016>ఖ;" // LETTER KHA -"\uE017>గ;" // LETTER GA -"\uE018>ఘ;" // LETTER GHA -"\uE019>ఙ;" // LETTER NGA -"\uE01A>చ;" // LETTER CA -"\uE01B>ఛ;" // LETTER CHA -"\uE01C>జ;" // LETTER JA -"\uE01D>ఝ;" // LETTER JHA -"\uE01E>ఞ;" // LETTER NYA -"\uE01F>ట;" // LETTER TTA -"\uE020>ఠ;" // LETTER TTHA -"\uE021>డ;" // LETTER DDA -"\uE022>ఢ;" // LETTER DDHA -"\uE023>ణ;" // LETTER NNA -"\uE024>త;" // LETTER TA -"\uE025>థ;" // LETTER THA -"\uE026>ద;" // LETTER DA -"\uE027>ధ;" // LETTER DHA -"\uE028>న;" // LETTER NA -"\uE029>న;" // REMAP (indicExceptions.txt): ఩>న = LETTER NNNA>LETTER NA -"\uE02A>ప;" // LETTER PA -"\uE02B>ఫ;" // LETTER PHA -"\uE02C>బ;" // LETTER BA -"\uE02D>భ;" // LETTER BHA -"\uE02E>మ;" // LETTER MA -"\uE02F>య;" // LETTER YA -"\uE030>ర;" // LETTER RA -"\uE032>ల;" 
// LETTER LA -"\uE033>ళ;" // LETTER LLA -"\uE034>ళ;" // REMAP (indicExceptions.txt): ఴ>ళ = LETTER LLLA>LETTER LLA -"\uE035>వ;" // LETTER VA -"\uE036>శ;" // LETTER SHA -"\uE037>ష;" // LETTER SSA -"\uE038>స;" // LETTER SA -"\uE039>హ;" // LETTER HA -// \uE03C>; // UNMAPPED InterIndic-Telugu: SIGN NUKTA -// \uE03D>; // UNMAPPED InterIndic-Telugu: SIGN AVAGRAHA -"\uE03E>ా;" // VOWEL SIGN AA -"\uE03F>ి;" // VOWEL SIGN I -"\uE040>ీ;" // VOWEL SIGN II -"\uE041>ు;" // VOWEL SIGN U -"\uE042>ూ;" // VOWEL SIGN UU -"\uE043>ృ;" // VOWEL SIGN VOCALIC R -"\uE044>ౄ;" // VOWEL SIGN VOCALIC RR -"\uE045>ె;" // REMAP (indicExceptions.txt): ౅>ె = VOWEL SIGN CANDRA E>VOWEL SIGN E -"\uE047>ే;" // VOWEL SIGN EE -"\uE048>ై;" // VOWEL SIGN AI -"\uE049>ొ;" // REMAP (indicExceptions.txt): ౉>ొ = VOWEL SIGN CANDRA O>VOWEL SIGN O -"\uE04B>ో;" // VOWEL SIGN OO -"\uE04C>ౌ;" // VOWEL SIGN AU -"\uE04D>్;" // SIGN VIRAMA -"\uE050>ఓం;" // REMAP (indicExceptions.txt): ౐>ఓం = OM>LETTER OO.SIGN ANUSVARA -"\uE055>ౕ;" // LENGTH MARK -"\uE056>ౖ;" // AI LENGTH MARK -"\uE057>ౌ;" // REMAP (indicExceptions.txt): ౗>ౌ = AU LENGTH MARK>VOWEL SIGN AU -"\uE059>ఖ;" // REMAP (indicExceptions.txt): ౙ>ఖ = LETTER KHHA>LETTER KHA -"\uE05A>గ;" // REMAP (indicExceptions.txt): ౚ>గ = LETTER GHHA>LETTER GA -"\uE05B>జ;" // REMAP (indicExceptions.txt): ౛>జ = LETTER ZA>LETTER JA -"\uE05D>ఢ;" // REMAP (indicExceptions.txt): ౝ>ఢ = LETTER RHA>LETTER DDHA -"\uE05E>ఫ;" // REMAP (indicExceptions.txt): ౞>ఫ = LETTER FA>LETTER PHA -"\uE05F>య;" // REMAP (indicExceptions.txt): ౟>య = LETTER YYA>LETTER YA -"\uE060>ౠ;" // LETTER VOCALIC RR -"\uE061>ౡ;" // LETTER VOCALIC LL -"\uE062>ి;" // REMAP (indicExceptions.txt): ౢ>ి = VOWEL SIGN VOCALIC L>VOWEL SIGN I -"\uE063>ీ;" // REMAP (indicExceptions.txt): ౣ>ీ = VOWEL SIGN VOCALIC LL>VOWEL SIGN II -"\uE066>౦;" // DIGIT ZERO -"\uE067>౧;" // DIGIT ONE -"\uE068>౨;" // DIGIT TWO -"\uE069>౩;" // DIGIT THREE -"\uE06A>౪;" // DIGIT FOUR -"\uE06B>౫;" // DIGIT FIVE -"\uE06C>౬;" // DIGIT SIX -"\uE06D>౭;" // 
DIGIT SEVEN -"\uE06E>౮;" // DIGIT EIGHT -"\uE06F>౯;" // DIGIT NINE -// \uE080>; // UNMAPPED InterIndic-Telugu: ISSHAR -"\uE081>ఎ;" // LETTER E -"\uE082>ఒ;" // LETTER O -"\uE083>ఱ;" // LETTER RRA -"\uE084>ె;" // VOWEL SIGN E -"\uE085>ొ;" // VOWEL SIGN O - +":: NFD (NFC) ;" +"\ue001>\u0c01;" // SIGN CANDRABINDU +"\ue002>\u0c02;" // SIGN ANUSVARA +"\ue003>\u0c03;" // SIGN VISARGA +"\ue005>\u0c05;" // LETTER A +"\ue006>\u0c06;" // LETTER AA +"\ue007>\u0c07;" // LETTER I +"\ue008>\u0c08;" // LETTER II +"\ue009>\u0c09;" // LETTER U +"\ue00a>\u0c0a;" // LETTER UU +"\ue00b>\u0c0b;" // LETTER VOCALIC R +"\ue00c>\u0c0c;" // LETTER VOCALIC L +"\ue00f>\u0c0f;" // LETTER EE +"\ue010>\u0c10;" // LETTER AI +"\ue013>\u0c13;" // LETTER OO +"\ue014>\u0c14;" // LETTER AU +"\ue015>\u0c15;" // LETTER KA +"\ue016>\u0c16;" // LETTER KHA +"\ue017>\u0c17;" // LETTER GA +"\ue018>\u0c18;" // LETTER GHA +"\ue019>\u0c19;" // LETTER NGA +"\ue01a>\u0c1a;" // LETTER CA +"\ue01b>\u0c1b;" // LETTER CHA +"\ue01c>\u0c1c;" // LETTER JA +"\ue01d>\u0c1d;" // LETTER JHA +"\ue01e>\u0c1e;" // LETTER NYA +"\ue01f>\u0c1f;" // LETTER TTA +"\ue020>\u0c20;" // LETTER TTHA +"\ue021>\u0c21;" // LETTER DDA +"\ue022>\u0c22;" // LETTER DDHA +"\ue023>\u0c23;" // LETTER NNA +"\ue024>\u0c24;" // LETTER TA +"\ue025>\u0c25;" // LETTER THA +"\ue026>\u0c26;" // LETTER DA +"\ue027>\u0c27;" // LETTER DHA +"\ue028>\u0c28;" // LETTER NA +"\ue029>\u0c28;" // REMAP (indicExceptions.txt): \u0c29>\u0c28 = LETTER NNNA>LETTER NA +"\ue02a>\u0c2a;" // LETTER PA +"\ue02b>\u0c2b;" // LETTER PHA +"\ue02c>\u0c2c;" // LETTER BA +"\ue02d>\u0c2d;" // LETTER BHA +"\ue02e>\u0c2e;" // LETTER MA +"\ue02f>\u0c2f;" // LETTER YA +"\ue030>\u0c30;" // LETTER RA +"\ue032>\u0c32;" // LETTER LA +"\ue033>\u0c33;" // LETTER LLA +"\ue034>\u0c33;" // REMAP (indicExceptions.txt): \u0c34>\u0c33 = LETTER LLLA>LETTER LLA +"\ue035>\u0c35;" // LETTER VA +"\ue036>\u0c36;" // LETTER SHA +"\ue037>\u0c37;" // LETTER SSA +"\ue038>\u0c38;" // LETTER SA 
+"\ue039>\u0c39;" // LETTER HA +// \ue03c>; // UNMAPPED InterIndic-Telugu: SIGN NUKTA +// \ue03d>; // UNMAPPED InterIndic-Telugu: SIGN AVAGRAHA +"\ue03e>\u0c3e;" // VOWEL SIGN AA +"\ue03f>\u0c3f;" // VOWEL SIGN I +"\ue040>\u0c40;" // VOWEL SIGN II +"\ue041>\u0c41;" // VOWEL SIGN U +"\ue042>\u0c42;" // VOWEL SIGN UU +"\ue043>\u0c43;" // VOWEL SIGN VOCALIC R +"\ue044>\u0c44;" // VOWEL SIGN VOCALIC RR +"\ue045>\u0c46;" // VOWEL SIGN CANDRA E>VOWEL SIGN E +"\ue047>\u0c47;" // VOWEL SIGN EE +"\ue048>\u0c48;" // VOWEL SIGN AI +"\ue049>\u0c4a;" // REMAP (indicExceptions.txt): \u0c49>\u0c4a = VOWEL SIGN CANDRA O>VOWEL SIGN O +"\ue04b>\u0c4b;" // VOWEL SIGN OO +"\ue04c>\u0c4c;" // VOWEL SIGN AU +"\ue04d>\u0c4d;" // SIGN VIRAMA +"\ue050>\u0c13\u0c02;" // REMAP (indicExceptions.txt): \u0c50>\u0c13\u0c02 = OM>LETTER OO.SIGN ANUSVARA +"\ue055>\u0c55;" // LENGTH MARK +"\ue056>\u0c56;" // AI LENGTH MARK +"\ue057>\u0c4c;" // REMAP (indicExceptions.txt): \u0c57>\u0c4c = AU LENGTH MARK>VOWEL SIGN AU +"\ue059>\u0c16;" // REMAP (indicExceptions.txt): \u0c59>\u0c16 = LETTER KHHA>LETTER KHA +"\ue05a>\u0c17;" // REMAP (indicExceptions.txt): \u0c5a>\u0c17 = LETTER GHHA>LETTER GA +"\ue05b>\u0c1c;" // REMAP (indicExceptions.txt): \u0c5b>\u0c1c = LETTER ZA>LETTER JA +"\ue05d>\u0c22;" // REMAP (indicExceptions.txt): \u0c5d>\u0c22 = LETTER RHA>LETTER DDHA +"\ue05e>\u0c2b;" // REMAP (indicExceptions.txt): \u0c5e>\u0c2b = LETTER FA>LETTER PHA +"\ue05f>\u0c2f;" // REMAP (indicExceptions.txt): \u0c5f>\u0c2f = LETTER YYA>LETTER YA +"\ue060>\u0c60;" // LETTER VOCALIC RR +"\ue061>\u0c61;" // LETTER VOCALIC LL +"\ue062>\u0c3f;" // REMAP (indicExceptions.txt): \u0c62>\u0c3f = VOWEL SIGN VOCALIC L>VOWEL SIGN I +"\ue063>\u0c40;" // REMAP (indicExceptions.txt): \u0c63>\u0c40 = VOWEL SIGN VOCALIC LL>VOWEL SIGN II +"\ue066>\u0c66;" // DIGIT ZERO +"\ue067>\u0c67;" // DIGIT ONE +"\ue068>\u0c68;" // DIGIT TWO +"\ue069>\u0c69;" // DIGIT THREE +"\ue06a>\u0c6a;" // DIGIT FOUR +"\ue06b>\u0c6b;" // DIGIT FIVE 
+"\ue06c>\u0c6c;" // DIGIT SIX +"\ue06d>\u0c6d;" // DIGIT SEVEN +"\ue06e>\u0c6e;" // DIGIT EIGHT +"\ue06f>\u0c6f;" // DIGIT NINE +// \ue080>; // UNMAPPED InterIndic-Telugu: ISSHAR +"\ue00e>\u0c0e;" // LETTER E +"\ue012>\u0c12;" // LETTER O +"\ue031>\u0c31;" // LETTER RRA +"\ue046>\u0c46;" // VOWEL SIGN E +"\ue04a>\u0c4a;" // VOWEL SIGN O + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Kannada_InterIndic.txt b/icu4c/data/Kannada_InterIndic.txt index 29ac5048f3..61415bade3 100644 --- a/icu4c/data/Kannada_InterIndic.txt +++ b/icu4c/data/Kannada_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Kannada_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Kannada_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // Kannada_InterIndic -Kannada_InterIndic { +Kannada-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,88 +20,88 @@ Kannada_InterIndic { //-------------------------------------------------------------------- // Kannada-InterIndic - -"ಂ>\uE002;" // SIGN ANUSVARA -"ಃ>\uE003;" // SIGN VISARGA -"ಅ>\uE005;" // LETTER A -"ಆ>\uE006;" // LETTER AA -"ಇ>\uE007;" // LETTER I -"ಈ>\uE008;" // LETTER II -"ಉ>\uE009;" // LETTER U -"ಊ>\uE00A;" // LETTER UU -"ಋ>\uE00B;" // LETTER VOCALIC R -"ಌ>\uE00C;" // LETTER VOCALIC L -"ಎ>\uE081;" // LETTER E -"ಏ>\uE00F;" // LETTER EE -"ಐ>\uE010;" // LETTER AI -"ಒ>\uE082;" // LETTER O -"ಓ>\uE013;" // LETTER OO -"ಔ>\uE014;" 
// LETTER AU -"ಕ>\uE015;" // LETTER KA -"ಖ>\uE016;" // LETTER KHA -"ಗ>\uE017;" // LETTER GA -"ಘ>\uE018;" // LETTER GHA -"ಙ>\uE019;" // LETTER NGA -"ಚ>\uE01A;" // LETTER CA -"ಛ>\uE01B;" // LETTER CHA -"ಜ>\uE01C;" // LETTER JA -"ಝ>\uE01D;" // LETTER JHA -"ಞ>\uE01E;" // LETTER NYA -"ಟ>\uE01F;" // LETTER TTA -"ಠ>\uE020;" // LETTER TTHA -"ಡ>\uE021;" // LETTER DDA -"ಢ>\uE022;" // LETTER DDHA -"ಣ>\uE023;" // LETTER NNA -"ತ>\uE024;" // LETTER TA -"ಥ>\uE025;" // LETTER THA -"ದ>\uE026;" // LETTER DA -"ಧ>\uE027;" // LETTER DHA -"ನ>\uE028;" // LETTER NA -"ಪ>\uE02A;" // LETTER PA -"ಫ>\uE02B;" // LETTER PHA -"ಬ>\uE02C;" // LETTER BA -"ಭ>\uE02D;" // LETTER BHA -"ಮ>\uE02E;" // LETTER MA -"ಯ>\uE02F;" // LETTER YA -"ರ>\uE030;" // LETTER RA -"ಱ>\uE083;" // LETTER RRA -"ಲ>\uE032;" // LETTER LA -"ಳ>\uE033;" // LETTER LLA -"ವ>\uE035;" // LETTER VA -"ಶ>\uE036;" // LETTER SHA -"ಷ>\uE037;" // LETTER SSA -"ಸ>\uE038;" // LETTER SA -"ಹ>\uE039;" // LETTER HA -"ಾ>\uE03E;" // VOWEL SIGN AA -"ಿ>\uE03F;" // VOWEL SIGN I -"ೀ>\uE040;" // VOWEL SIGN II -"ು>\uE041;" // VOWEL SIGN U -"ೂ>\uE042;" // VOWEL SIGN UU -"ೃ>\uE043;" // VOWEL SIGN VOCALIC R -"ೄ>\uE044;" // VOWEL SIGN VOCALIC RR -"ೆ>\uE084;" // VOWEL SIGN E -"ೇ>\uE047;" // VOWEL SIGN EE -"ೈ>\uE048;" // VOWEL SIGN AI -"ೊ>\uE085;" // VOWEL SIGN O -"ೋ>\uE04B;" // VOWEL SIGN OO -"ೌ>\uE04C;" // VOWEL SIGN AU -"್>\uE04D;" // SIGN VIRAMA -"ೕ>\uE055;" // LENGTH MARK -"ೖ>\uE056;" // AI LENGTH MARK -"ೞ>\uE05E;" // LETTER FA -"ೠ>\uE060;" // LETTER VOCALIC RR -"ೡ>\uE061;" // LETTER VOCALIC LL -"೦>\uE066;" // DIGIT ZERO -"೧>\uE067;" // DIGIT ONE -"೨>\uE068;" // DIGIT TWO -"೩>\uE069;" // DIGIT THREE -"೪>\uE06A;" // DIGIT FOUR -"೫>\uE06B;" // DIGIT FIVE -"೬>\uE06C;" // DIGIT SIX -"೭>\uE06D;" // DIGIT SEVEN -"೮>\uE06E;" // DIGIT EIGHT -"೯>\uE06F;" // DIGIT NINE - +":: NFD (NFC) ;" +"\u0c82>\ue002;" // SIGN ANUSVARA +"\u0c83>\ue003;" // SIGN VISARGA +"\u0c85>\ue005;" // LETTER A +"\u0c86>\ue006;" // LETTER AA +"\u0c87>\ue007;" // LETTER I +"\u0c88>\ue008;" // 
LETTER II +"\u0c89>\ue009;" // LETTER U +"\u0c8a>\ue00a;" // LETTER UU +"\u0c8b>\ue00b;" // LETTER VOCALIC R +"\u0c8c>\ue00c;" // LETTER VOCALIC L +"\u0c8e>\ue00e;" // LETTER E +"\u0c8f>\ue00f;" // LETTER EE +"\u0c90>\ue010;" // LETTER AI +"\u0c92>\ue012;" // LETTER O +"\u0c93>\ue013;" // LETTER OO +"\u0c94>\ue014;" // LETTER AU +"\u0c95>\ue015;" // LETTER KA +"\u0c96>\ue016;" // LETTER KHA +"\u0c97>\ue017;" // LETTER GA +"\u0c98>\ue018;" // LETTER GHA +"\u0c99>\ue019;" // LETTER NGA +"\u0c9a>\ue01a;" // LETTER CA +"\u0c9b>\ue01b;" // LETTER CHA +"\u0c9c>\ue01c;" // LETTER JA +"\u0c9d>\ue01d;" // LETTER JHA +"\u0c9e>\ue01e;" // LETTER NYA +"\u0c9f>\ue01f;" // LETTER TTA +"\u0ca0>\ue020;" // LETTER TTHA +"\u0ca1>\ue021;" // LETTER DDA +"\u0ca2>\ue022;" // LETTER DDHA +"\u0ca3>\ue023;" // LETTER NNA +"\u0ca4>\ue024;" // LETTER TA +"\u0ca5>\ue025;" // LETTER THA +"\u0ca6>\ue026;" // LETTER DA +"\u0ca7>\ue027;" // LETTER DHA +"\u0ca8>\ue028;" // LETTER NA +"\u0caa>\ue02a;" // LETTER PA +"\u0cab>\ue02b;" // LETTER PHA +"\u0cac>\ue02c;" // LETTER BA +"\u0cad>\ue02d;" // LETTER BHA +"\u0cae>\ue02e;" // LETTER MA +"\u0caf>\ue02f;" // LETTER YA +"\u0cb0>\ue030;" // LETTER RA +"\u0cb1>\ue031;" // LETTER RRA +"\u0cb2>\ue032;" // LETTER LA +"\u0cb3>\ue033;" // LETTER LLA +"\u0cb5>\ue035;" // LETTER VA +"\u0cb6>\ue036;" // LETTER SHA +"\u0cb7>\ue037;" // LETTER SSA +"\u0cb8>\ue038;" // LETTER SA +"\u0cb9>\ue039;" // LETTER HA +"\u0cbe>\ue03e;" // VOWEL SIGN AA +"\u0cbf>\ue03f;" // VOWEL SIGN I +"\u0cc0>\ue040;" // VOWEL SIGN II +"\u0cc1>\ue041;" // VOWEL SIGN U +"\u0cc2>\ue042;" // VOWEL SIGN UU +"\u0cc3>\ue043;" // VOWEL SIGN VOCALIC R +"\u0cc4>\ue044;" // VOWEL SIGN VOCALIC RR +"\u0cc6>\ue046;" // VOWEL SIGN E +"\u0cc7>\ue047;" // VOWEL SIGN EE +"\u0cc8>\ue048;" // VOWEL SIGN AI +"\u0cca>\ue04a;" // VOWEL SIGN O +"\u0ccb>\ue04b;" // VOWEL SIGN OO +"\u0ccc>\ue04c;" // VOWEL SIGN AU +"\u0ccd>\ue04d;" // SIGN VIRAMA +"\u0cd5>\ue055;" // LENGTH MARK +"\u0cd6>\ue056;" // AI LENGTH 
MARK +"\u0cde>\ue05e;" // LETTER FA +"\u0ce0>\ue060;" // LETTER VOCALIC RR +"\u0ce1>\ue061;" // LETTER VOCALIC LL +"\u0ce6>\ue066;" // DIGIT ZERO +"\u0ce7>\ue067;" // DIGIT ONE +"\u0ce8>\ue068;" // DIGIT TWO +"\u0ce9>\ue069;" // DIGIT THREE +"\u0cea>\ue06a;" // DIGIT FOUR +"\u0ceb>\ue06b;" // DIGIT FIVE +"\u0cec>\ue06c;" // DIGIT SIX +"\u0ced>\ue06d;" // DIGIT SEVEN +"\u0cee>\ue06e;" // DIGIT EIGHT +"\u0cef>\ue06f;" // DIGIT NINE + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Latin_InterIndic.txt b/icu4c/data/Latin_InterIndic.txt new file mode 100644 index 0000000000..159a254329 --- /dev/null +++ b/icu4c/data/Latin_InterIndic.txt @@ -0,0 +1,336 @@ +//-------------------------------------------------------------------- +// Copyright (c) 2001-2004, International Business Machines +// Corporation and others. All Rights Reserved. +//-------------------------------------------------------------------- + +// Latin-InterIndic + +Latin-InterIndic{ + Rule{ + ":: NFD (NFC) ;" + //\u0e00 reserved + //consonants + "$chandrabindu=\ue001;" + "$anusvara=\ue002;" + "$visarga=\ue003;" + //\u0e004 reserved + // w represents the stand-alone form + "$wa=\ue005;" + "$waa=\ue006;" + "$wi=\ue007;" + "$wii=\ue008;" + "$wu=\ue009;" + "$wuu=\ue00a;" + "$wr=\ue00b;" + "$wl=\ue00c;" + + "$wce=\ue00d;" // LETTER CANDRA E + "$wse=\ue00e;" // LETTER SHORT E + + "$we=\ue00f;" // \u090f LETTER E + "$wai=\ue010;" + + "$wco=\ue011;" // LETTER CANDRA O + "$wso=\ue012;" // LETTER SHORT O + + "$wo=\ue013;" // \u0913 LETTER O + "$wau=\ue014;" + + "$ka=\ue015;" + "$kha=\ue016;" + "$ga=\ue017;" + "$gha=\ue018;" + "$nga=\ue019;" + + "$ca=\ue01a;" + "$cha=\ue01b;" + "$ja=\ue01c;" + "$jha=\ue01d;" + "$nya=\ue01e;" + + "$tta=\ue01f;" + "$ttha=\ue020;" + "$dda=\ue021;" + "$ddha=\ue022;" + "$nna=\ue023;" + + "$ta=\ue024;" + "$tha=\ue025;" + "$da=\ue026;" + "$dha=\ue027;" + "$na=\ue028;" + "$ena=\ue029;" //compatibility + + "$pa=\ue02a;" + "$pha=\ue02b;" + "$ba=\ue02c;" + "$bha=\ue02d;" + "$ma=\ue02e;" + 
+ "$ya=\ue02f;" + "$ra=\ue030;" + "$rra=\ue031;" + "$la=\ue032;" + "$lla=\ue033;" + "$ela=\ue034;" //compatibility + "$va=\ue035;" + + "$sha=\ue036;" + "$ssa=\ue037;" + "$sa=\ue038;" + "$ha=\ue039;" +//\u093a Reserved +//\u093b Reserved + "$nukta=\ue03c;" + "$avagraha=\ue03d;" // SIGN AVAGRAHA + + // represents the dependent form + "$aa=\ue03e;" + "$i=\ue03f;" + "$ii=\ue040;" + "$u=\ue041;" + "$uu=\ue042;" + "$rh=\ue043;" + "$lh=\ue044;" + "$ce=\ue045;" //VOWEL SIGN CANDRA E + "$se=\ue046;" //VOWEL SIGN SHORT E + "$e=\ue047;" + "$ai=\ue048;" + "$co=\ue049;" // VOWEL SIGN CANDRA O + "$so=\ue04a;" // VOWEL SIGN SHORT O + "$o=\ue04b;" // \u094b + "$au=\ue04c;" + "$virama=\ue04d;" +// \u094e Reserved +// \u094f Reserved +//"\u0950>\ue050;" // OM +// \u0951>; // UNMAPPED STRESS SIGN UDATTA +// \u0952>; // UNMAPPED STRESS SIGN ANUDATTA +// \u0953>; // UNMAPPED GRAVE ACCENT +// \u0954>; // UNMAPPED ACUTE ACCENT + + "$lm = \ue055;"// Telugu Length Mark + "$ailm=\ue056;"// AI Length Mark + "$aulm=\ue057;"// AU Length Mark + + //urdu compatibility forms + "$uka=\ue058;" + "$ukha=\ue059;" + "$ugha=\ue05a;" + "$ujha=\ue05b;" + "$uddha=\ue05c;" + "$udha=\ue05d;" + "$ufa=\ue05e;" + "$uya=\ue05f;" + + "$wrr=\ue060;" + "$wll=\ue061;" + "$rrh=\ue062;" + "$llh=\ue063;" + + "$danda=\ue064;" + "$doubleDanda=\ue065;" + + "$zero=\ue066;" // DIGIT ZERO + "$one=\ue067;" // DIGIT ONE + "$two=\ue068;" // DIGIT TWO + "$three=\ue069;" // DIGIT THREE + "$four=\ue06a;" // DIGIT FOUR + "$five=\ue06b;" // DIGIT FIVE + "$six=\ue06c;" // DIGIT SIX + "$seven=\ue06d;" // DIGIT SEVEN + "$eight=\ue06e;" // DIGIT EIGHT + "$nine=\ue06f;" // DIGIT NINE + + // For all other scripts + "$ecp0=\ue070;" + "$ecp1=\ue071;" + "$ecp2=\ue072;" + "$ecp3=\ue073;" + "$ecp4=\ue074;" + "$ecp5=\ue075;" + "$ecp6=\ue076;" + "$ecp7=\ue077;" + "$ecp8=\ue078;" + "$ecp9=\ue079;" + "$ecpA=\ue07a;" + "$ecpB=\ue07b;" + "$ecpC=\ue07c;" + "$ecpD=\ue07d;" + "$ecpE=\ue07e;" + "$ecpF=\ue07f;" + + +// \u0970>; // UNMAPPED ABBREVIATION
SIGN + + "$depVowelAbove=[\ue03e-\ue040\ue045-\ue04c];" + "$depVowelBelow=[\ue041-\ue044];" + "$endThing=[$danda$doubleDanda \u005c\u005cu0000-\udfff\ue080-\ufffd];" + + // $x was originally called '&'; $z was '%' + "$x=[$virama$aa$ai$au$ii$i$uu$u$rrh$rh$lh$e$o$se$ce$so$co];" + "$z=[bcdfghjklmnpqrstvwxyz];" + + "\u0315 > $avagraha;" + "'-'\u0303>$chandrabindu$anusvara;" + "'-'m\u0310>$chandrabindu;" + "'-'h\u0323>$visarga;" + + "mm>$anusvara;" + "x>$visarga;" + "aa>$waa;" + "a\u0304>$waa;" + "ai>$wai;" + "au>$wau;" + "ii>$wii;" + "i\u0304>$wii;" + "i>$wi;" + "uu>$wuu;" + "u\u0304>$wuu;" + "u>$wu;" + "rrh>$wrr;" + "r\u0325\u0304>$wrr;" + "rh>$wr;" + "r\u0325>$wr;" + "l\u0325\u0304>$wll;" + "lh>$wl;" + "l\u0325>$wl;" + "e\u0304>$we;" + "o\u0304>$wo;" + "a>$wa;" + "e\u0306>$wce;" + "o\u0306>$wco;" + "e>$wse;" + "o>$wso;" + + "n}na > $na|$virama;" + + "n\u0307}[kg] > $anusvara;" + "n\u0307}n\u0303 > $anusvara;" + "n\u0304}[cj] > $anusvara;" + "n\u0304}n\u0307 > $anusvara;" + "n\u0323}[tdn]\u0323 > $anusvara;" + "n}[tdn] > $anusvara;" + "m}[pbm] > $anusvara;" + "n} [yrlvsh] > $anusvara;" + "'-'m\u0307 > $anusvara;" + + "y\u0307>$uya|$virama;" + "l\u0331>$ela|$virama;" + "n\u0331>$ena|$virama;" + "n\u0307>$nga|$virama;" + "n\u0303>$nya|$virama;" + "n\u0323>$nna|$virama;" + "t\u0323h>$ttha|$virama;" + "t\u0323>$tta|$virama;" + "r\u0323h>$udha|$virama;" + "r\u0323>$uddha|$virama;" + "d\u0323h>$ddha|$virama;" + "d\u0323>$dda|$virama;" + "kh>$kha|$virama;" + "k>$ka|$virama;" + "q>$ka|$virama;" + "gh>$gha|$virama;" + "g>$ga|$virama;" + "ch>$cha|$virama;" + "c>$ca|$virama;" + "jh>$jha|$virama;" + "j>$ja|$virama;" + "ny>$nya|$virama;" + "tth>$ttha|$virama;" + "ddh>$ddha|$virama;" + "th>$tha|$virama;" + "t>$ta|$virama;" + "dh>$dha|$virama;" + "d>$da|$virama;" + "n>$na|$virama;" + "ph>$pha|$virama;" + "p>$pa|$virama;" + "bh>$bha|$virama;" + "b>$ba|$virama;" + "m>$ma|$virama;" + "y>$ya|$virama;" + "r>$ra|$virama;" + "l\u0323a>$lla;" + "l>$la|$virama;" + "v>$va|$virama;" +
"f>$va|$virama;" + "w>$va|$virama;" + "sh>$sha|$virama;" + "ss>$ssa|$virama;" + "s\u0323>$ssa|$virama;" + "s\u0301>$sha|$virama;" + "s>$sa|$virama;" + "z>$sa|$virama;" + "h>$ha|$virama;" + + "'.'>$danda;" + "$danda'.'>$doubleDanda;" + "$depVowelAbove{'~'>$anusvara;" + "$depVowelBelow{'~'>$chandrabindu;" + "$virama aa>$aa;" + "$virama a\u0304>$aa;" + "$virama ai>$ai;" + "$virama au>$au;" + "$virama ii>$ii;" + "$virama i\u0304>$ii;" + "$virama i>$i;" + "$virama uu>$uu;" + "$virama u\u0304>$uu;" + "$virama u>$u;" + "$virama rrh>$rrh;" + "$virama r\u0325\u0304>$rrh;" + "$virama rh>$rh;" + "$virama r\u0325>$rh;" + "$virama l\u0325\u0304>$llh;" + "$virama lh>$lh;" + "$virama l\u0325>$lh;" + "$virama e\u0304>$e;" + "$virama o\u0304>$o;" + "$virama a>;" + "$virama e\u0306>$ce;" + "$virama o\u0306>$co;" + "$virama e>$se;" + "$virama o>$so;" + "$virama''aa>$waa;" + "$virama''a\u0304>$waa;" + "$virama''ai>$wai;" + "$virama''au>$wau;" + "$virama''ii>$wii;" + "$virama''i\u0304>$wii;" + "$virama''i>$wi;" + "$virama''uu>$wuu;" + "$virama''u\u0304>$wuu;" + "$virama''u>$wu;" + "$virama''rrh>$wrr;" + "$virama''r\u0325\u0304>$wrr;" + "$virama''rh>$wr;" + "$virama''r\u0325>$wr;" + "$virama''l\u0325\u0304>$wll;" + "$virama''lh>$wl;" + "$virama''l\u0325>$wl;" + "$virama''e\u0304>$we;" + "$virama''o\u0304>$wo;" + "$virama''a>$wa;" + "$virama''e\u0306>$wce;" + "$virama''o\u0306>$wco;" + "$virama''e>$wse;" + "$virama''o>$wso;" + + "$virama } [$z] > $virama;" + "$virama } ' ' > $virama ;" + + "$virama}$endThing>;" + "0>$zero;" + "1>$one;" + "2>$two;" + "3>$three;" + "4>$four;" + "5>$five;" + "6>$six;" + "7>$seven;" + "8>$eight;" + "9>$nine;" + "''>;" + ":: NFC (NFD) ;" + } +} diff --git a/icu4c/data/Malayalam_InterIndic.txt b/icu4c/data/Malayalam_InterIndic.txt index 77eaae3013..ca6e3081b9 100644 --- a/icu4c/data/Malayalam_InterIndic.txt +++ b/icu4c/data/Malayalam_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- 
//-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Malayalam_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Malayalam_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // Malayalam_InterIndic -Malayalam_InterIndic { +Malayalam-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,86 +20,86 @@ Malayalam_InterIndic { //-------------------------------------------------------------------- // Malayalam-InterIndic - -"ം>\uE002;" // SIGN ANUSVARA -"ഃ>\uE003;" // SIGN VISARGA -"അ>\uE005;" // LETTER A -"ആ>\uE006;" // LETTER AA -"ഇ>\uE007;" // LETTER I -"ഈ>\uE008;" // LETTER II -"ഉ>\uE009;" // LETTER U -"ഊ>\uE00A;" // LETTER UU -"ഋ>\uE00B;" // LETTER VOCALIC R -"ഌ>\uE00C;" // LETTER VOCALIC L -"എ>\uE081;" // LETTER E -"ഏ>\uE00F;" // LETTER EE -"ഐ>\uE010;" // LETTER AI -"ഒ>\uE082;" // LETTER O -"ഓ>\uE013;" // LETTER OO -"ഔ>\uE014;" // LETTER AU -"ക>\uE015;" // LETTER KA -"ഖ>\uE016;" // LETTER KHA -"ഗ>\uE017;" // LETTER GA -"ഘ>\uE018;" // LETTER GHA -"ങ>\uE019;" // LETTER NGA -"ച>\uE01A;" // LETTER CA -"ഛ>\uE01B;" // LETTER CHA -"ജ>\uE01C;" // LETTER JA -"ഝ>\uE01D;" // LETTER JHA -"ഞ>\uE01E;" // LETTER NYA -"ട>\uE01F;" // LETTER TTA -"ഠ>\uE020;" // LETTER TTHA -"ഡ>\uE021;" // LETTER DDA -"ഢ>\uE022;" // LETTER DDHA -"ണ>\uE023;" // LETTER NNA -"ത>\uE024;" // LETTER TA -"ഥ>\uE025;" // LETTER THA -"ദ>\uE026;" // LETTER DA -"ധ>\uE027;" // LETTER DHA -"ന>\uE028;" // LETTER NA -"പ>\uE02A;" // LETTER PA -"ഫ>\uE02B;" // LETTER PHA 
-"ബ>\uE02C;" // LETTER BA -"ഭ>\uE02D;" // LETTER BHA -"മ>\uE02E;" // LETTER MA -"യ>\uE02F;" // LETTER YA -"ര>\uE030;" // LETTER RA -"റ>\uE083;" // LETTER RRA -"ല>\uE032;" // LETTER LA -"ള>\uE033;" // LETTER LLA -"ഴ>\uE034;" // LETTER LLLA -"വ>\uE035;" // LETTER VA -"ശ>\uE036;" // LETTER SHA -"ഷ>\uE037;" // LETTER SSA -"സ>\uE038;" // LETTER SA -"ഹ>\uE039;" // LETTER HA -"ാ>\uE03E;" // VOWEL SIGN AA -"ി>\uE03F;" // VOWEL SIGN I -"ീ>\uE040;" // VOWEL SIGN II -"ു>\uE041;" // VOWEL SIGN U -"ൂ>\uE042;" // VOWEL SIGN UU -"ൃ>\uE043;" // VOWEL SIGN VOCALIC R -"െ>\uE084;" // VOWEL SIGN E -"േ>\uE047;" // VOWEL SIGN EE -"ൈ>\uE048;" // VOWEL SIGN AI -"ൊ>\uE085;" // VOWEL SIGN O -"ോ>\uE04B;" // VOWEL SIGN OO -"ൌ>\uE04C;" // VOWEL SIGN AU -"്>\uE04D;" // SIGN VIRAMA -"ൗ>\uE057;" // AU LENGTH MARK -"ൠ>\uE060;" // LETTER VOCALIC RR -"ൡ>\uE061;" // LETTER VOCALIC LL -"൦>\uE066;" // DIGIT ZERO -"൧>\uE067;" // DIGIT ONE -"൨>\uE068;" // DIGIT TWO -"൩>\uE069;" // DIGIT THREE -"൪>\uE06A;" // DIGIT FOUR -"൫>\uE06B;" // DIGIT FIVE -"൬>\uE06C;" // DIGIT SIX -"൭>\uE06D;" // DIGIT SEVEN -"൮>\uE06E;" // DIGIT EIGHT -"൯>\uE06F;" // DIGIT NINE - +":: NFD (NFC) ;" +"\u0d02>\ue002;" // SIGN ANUSVARA +"\u0d03>\ue003;" // SIGN VISARGA +"\u0d05>\ue005;" // LETTER A +"\u0d06>\ue006;" // LETTER AA +"\u0d07>\ue007;" // LETTER I +"\u0d08>\ue008;" // LETTER II +"\u0d09>\ue009;" // LETTER U +"\u0d0a>\ue00a;" // LETTER UU +"\u0d0b>\ue00b;" // LETTER VOCALIC R +"\u0d0c>\ue00c;" // LETTER VOCALIC L +"\u0d0e>\ue00e;" // LETTER E +"\u0d0f>\ue00f;" // LETTER EE +"\u0d10>\ue010;" // LETTER AI +"\u0d12>\ue012;" // LETTER O +"\u0d13>\ue013;" // LETTER OO +"\u0d14>\ue014;" // LETTER AU +"\u0d15>\ue015;" // LETTER KA +"\u0d16>\ue016;" // LETTER KHA +"\u0d17>\ue017;" // LETTER GA +"\u0d18>\ue018;" // LETTER GHA +"\u0d19>\ue019;" // LETTER NGA +"\u0d1a>\ue01a;" // LETTER CA +"\u0d1b>\ue01b;" // LETTER CHA +"\u0d1c>\ue01c;" // LETTER JA +"\u0d1d>\ue01d;" // LETTER JHA +"\u0d1e>\ue01e;" // LETTER NYA +"\u0d1f>\ue01f;" // 
LETTER TTA +"\u0d20>\ue020;" // LETTER TTHA +"\u0d21>\ue021;" // LETTER DDA +"\u0d22>\ue022;" // LETTER DDHA +"\u0d23>\ue023;" // LETTER NNA +"\u0d24>\ue024;" // LETTER TA +"\u0d25>\ue025;" // LETTER THA +"\u0d26>\ue026;" // LETTER DA +"\u0d27>\ue027;" // LETTER DHA +"\u0d28>\ue028;" // LETTER NA +"\u0d2a>\ue02a;" // LETTER PA +"\u0d2b>\ue02b;" // LETTER PHA +"\u0d2c>\ue02c;" // LETTER BA +"\u0d2d>\ue02d;" // LETTER BHA +"\u0d2e>\ue02e;" // LETTER MA +"\u0d2f>\ue02f;" // LETTER YA +"\u0d30>\ue030;" // LETTER RA +"\u0d31>\ue031;" // LETTER RRA +"\u0d32>\ue032;" // LETTER LA +"\u0d33>\ue033;" // LETTER LLA +"\u0d34>\ue034;" // LETTER LLLA +"\u0d35>\ue035;" // LETTER VA +"\u0d36>\ue036;" // LETTER SHA +"\u0d37>\ue037;" // LETTER SSA +"\u0d38>\ue038;" // LETTER SA +"\u0d39>\ue039;" // LETTER HA +"\u0d3e>\ue03e;" // VOWEL SIGN AA +"\u0d3f>\ue03f;" // VOWEL SIGN I +"\u0d40>\ue040;" // VOWEL SIGN II +"\u0d41>\ue041;" // VOWEL SIGN U +"\u0d42>\ue042;" // VOWEL SIGN UU +"\u0d43>\ue043;" // VOWEL SIGN VOCALIC R +"\u0d46>\ue046;" // VOWEL SIGN E +"\u0d47>\ue047;" // VOWEL SIGN EE +"\u0d48>\ue048;" // VOWEL SIGN AI +"\u0d4a>\ue04a;" // VOWEL SIGN O +"\u0d4b>\ue04b;" // VOWEL SIGN OO +"\u0d4c>\ue04c;" // VOWEL SIGN AU +"\u0d4d>\ue04d;" // SIGN VIRAMA +"\u0d57>\ue057;" // AU LENGTH MARK +"\u0d60>\ue060;" // LETTER VOCALIC RR +"\u0d61>\ue061;" // LETTER VOCALIC LL +"\u0d66>\ue066;" // DIGIT ZERO +"\u0d67>\ue067;" // DIGIT ONE +"\u0d68>\ue068;" // DIGIT TWO +"\u0d69>\ue069;" // DIGIT THREE +"\u0d6a>\ue06a;" // DIGIT FOUR +"\u0d6b>\ue06b;" // DIGIT FIVE +"\u0d6c>\ue06c;" // DIGIT SIX +"\u0d6d>\ue06d;" // DIGIT SEVEN +"\u0d6e>\ue06e;" // DIGIT EIGHT +"\u0d6f>\ue06f;" // DIGIT NINE + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Oriya_InterIndic.txt b/icu4c/data/Oriya_InterIndic.txt index 22e772f11e..36a9b0fd07 100644 --- a/icu4c/data/Oriya_InterIndic.txt +++ b/icu4c/data/Oriya_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- 
//-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Oriya_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Oriya_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // Oriya_InterIndic -Oriya_InterIndic { +Oriya-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,87 +20,87 @@ Oriya_InterIndic { //-------------------------------------------------------------------- // Oriya-InterIndic - -"ଁ>\uE001;" // SIGN CANDRABINDU -"ଂ>\uE002;" // SIGN ANUSVARA -"ଃ>\uE003;" // SIGN VISARGA -"ଅ>\uE005;" // LETTER A -"ଆ>\uE006;" // LETTER AA -"ଇ>\uE007;" // LETTER I -"ଈ>\uE008;" // LETTER II -"ଉ>\uE009;" // LETTER U -"ଊ>\uE00A;" // LETTER UU -"ଋ>\uE00B;" // LETTER VOCALIC R -"ଌ>\uE00C;" // LETTER VOCALIC L -"ଏ>\uE081;" // LETTER E -"ଐ>\uE010;" // LETTER AI -"ଓ>\uE082;" // LETTER O -"ଔ>\uE014;" // LETTER AU -"କ>\uE015;" // LETTER KA -"ଖ>\uE016;" // LETTER KHA -"ଗ>\uE017;" // LETTER GA -"ଘ>\uE018;" // LETTER GHA -"ଙ>\uE019;" // LETTER NGA -"ଚ>\uE01A;" // LETTER CA -"ଛ>\uE01B;" // LETTER CHA -"ଜ>\uE01C;" // LETTER JA -"ଝ>\uE01D;" // LETTER JHA -"ଞ>\uE01E;" // LETTER NYA -"ଟ>\uE01F;" // LETTER TTA -"ଠ>\uE020;" // LETTER TTHA -"ଡ>\uE021;" // LETTER DDA -"ଢ>\uE022;" // LETTER DDHA -"ଣ>\uE023;" // LETTER NNA -"ତ>\uE024;" // LETTER TA -"ଥ>\uE025;" // LETTER THA -"ଦ>\uE026;" // LETTER DA -"ଧ>\uE027;" // LETTER DHA -"ନ>\uE028;" // LETTER NA -"ପ>\uE02A;" // LETTER PA -"ଫ>\uE02B;" // LETTER PHA -"ବ>\uE02C;" // LETTER BA -"ଭ>\uE02D;" // LETTER 
BHA -"ମ>\uE02E;" // LETTER MA -"ଯ>\uE02F;" // LETTER YA -"ର>\uE030;" // LETTER RA -"ଲ>\uE032;" // LETTER LA -"ଳ>\uE033;" // LETTER LLA -"ଶ>\uE036;" // LETTER SHA -"ଷ>\uE037;" // LETTER SSA -"ସ>\uE038;" // LETTER SA -"ହ>\uE039;" // LETTER HA -"଼>\uE03C;" // SIGN NUKTA -"ଽ>\uE03D;" // SIGN AVAGRAHA -"ା>\uE03E;" // VOWEL SIGN AA -"ି>\uE03F;" // VOWEL SIGN I -"ୀ>\uE040;" // VOWEL SIGN II -"ୁ>\uE041;" // VOWEL SIGN U -"ୂ>\uE042;" // VOWEL SIGN UU -"ୃ>\uE043;" // VOWEL SIGN VOCALIC R -"େ>\uE084;" // VOWEL SIGN E -"ୈ>\uE048;" // VOWEL SIGN AI -"ୋ>\uE085;" // VOWEL SIGN O -"ୌ>\uE04C;" // VOWEL SIGN AU -"୍>\uE04D;" // SIGN VIRAMA -"ୖ>\uE056;" // AI LENGTH MARK -"ୗ>\uE057;" // AU LENGTH MARK -"ଡ଼>\uE083;" // LETTER RRA -"ଢ଼>\uE05D;" // LETTER RHA -"ୟ>\uE05F;" // LETTER YYA -"ୠ>\uE060;" // LETTER VOCALIC RR -"ୡ>\uE061;" // LETTER VOCALIC LL -"୦>\uE066;" // DIGIT ZERO -"୧>\uE067;" // DIGIT ONE -"୨>\uE068;" // DIGIT TWO -"୩>\uE069;" // DIGIT THREE -"୪>\uE06A;" // DIGIT FOUR -"୫>\uE06B;" // DIGIT FIVE -"୬>\uE06C;" // DIGIT SIX -"୭>\uE06D;" // DIGIT SEVEN -"୮>\uE06E;" // DIGIT EIGHT -"୯>\uE06F;" // DIGIT NINE -"୰>\uE080;" // ISSHAR - +":: NFD (NFC) ;" +"\u0b01>\ue001;" // SIGN CANDRABINDU +"\u0b02>\ue002;" // SIGN ANUSVARA +"\u0b03>\ue003;" // SIGN VISARGA +"\u0b05>\ue005;" // LETTER A +"\u0b06>\ue006;" // LETTER AA +"\u0b07>\ue007;" // LETTER I +"\u0b08>\ue008;" // LETTER II +"\u0b09>\ue009;" // LETTER U +"\u0b0a>\ue00a;" // LETTER UU +"\u0b0b>\ue00b;" // LETTER VOCALIC R +"\u0b0c>\ue00c;" // LETTER VOCALIC L +"\u0b0f>\ue00f;" // LETTER E +"\u0b10>\ue010;" // LETTER AI +"\u0b13>\ue013;" // LETTER O +"\u0b14>\ue014;" // LETTER AU +"\u0b15>\ue015;" // LETTER KA +"\u0b16>\ue016;" // LETTER KHA +"\u0b17>\ue017;" // LETTER GA +"\u0b18>\ue018;" // LETTER GHA +"\u0b19>\ue019;" // LETTER NGA +"\u0b1a>\ue01a;" // LETTER CA +"\u0b1b>\ue01b;" // LETTER CHA +"\u0b1c>\ue01c;" // LETTER JA +"\u0b1d>\ue01d;" // LETTER JHA +"\u0b1e>\ue01e;" // LETTER NYA +"\u0b1f>\ue01f;" // LETTER TTA 
+"\u0b20>\ue020;" // LETTER TTHA +"\u0b21>\ue021;" // LETTER DDA +"\u0b22>\ue022;" // LETTER DDHA +"\u0b23>\ue023;" // LETTER NNA +"\u0b24>\ue024;" // LETTER TA +"\u0b25>\ue025;" // LETTER THA +"\u0b26>\ue026;" // LETTER DA +"\u0b27>\ue027;" // LETTER DHA +"\u0b28>\ue028;" // LETTER NA +"\u0b2a>\ue02a;" // LETTER PA +"\u0b2b>\ue02b;" // LETTER PHA +"\u0b2c>\ue02c;" // LETTER BA +"\u0b2d>\ue02d;" // LETTER BHA +"\u0b2e>\ue02e;" // LETTER MA +"\u0b2f>\ue02f;" // LETTER YA +"\u0b30>\ue030;" // LETTER RA +"\u0b32>\ue032;" // LETTER LA +"\u0b33>\ue033;" // LETTER LLA +"\u0b36>\ue036;" // LETTER SHA +"\u0b37>\ue037;" // LETTER SSA +"\u0b38>\ue038;" // LETTER SA +"\u0b39>\ue039;" // LETTER HA +"\u0b3c>\ue03c;" // SIGN NUKTA +"\u0b3d>\ue03d;" // SIGN AVAGRAHA +"\u0b3e>\ue03e;" // VOWEL SIGN AA +"\u0b3f>\ue03f;" // VOWEL SIGN I +"\u0b40>\ue040;" // VOWEL SIGN II +"\u0b41>\ue041;" // VOWEL SIGN U +"\u0b42>\ue042;" // VOWEL SIGN UU +"\u0b43>\ue043;" // VOWEL SIGN VOCALIC R +"\u0b47>\ue047;" // VOWEL SIGN E +"\u0b48>\ue048;" // VOWEL SIGN AI +"\u0b4b>\ue04b;" // VOWEL SIGN O +"\u0b4c>\ue04c;" // VOWEL SIGN AU +"\u0b4d>\ue04d;" // SIGN VIRAMA +"\u0b56>\ue056;" // AI LENGTH MARK +"\u0b57>\ue057;" // AU LENGTH MARK +"\u0b5c>\ue05c;" // LETTER RRA +"\u0b5d>\ue05d;" // LETTER RHA +"\u0b5f>\ue05f;" // LETTER YYA +"\u0b60>\ue060;" // LETTER VOCALIC RR +"\u0b61>\ue061;" // LETTER VOCALIC LL +"\u0b66>\ue066;" // DIGIT ZERO +"\u0b67>\ue067;" // DIGIT ONE +"\u0b68>\ue068;" // DIGIT TWO +"\u0b69>\ue069;" // DIGIT THREE +"\u0b6a>\ue06a;" // DIGIT FOUR +"\u0b6b>\ue06b;" // DIGIT FIVE +"\u0b6c>\ue06c;" // DIGIT SIX +"\u0b6d>\ue06d;" // DIGIT SEVEN +"\u0b6e>\ue06e;" // DIGIT EIGHT +"\u0b6f>\ue06f;" // DIGIT NINE +"\u0b70>\ue080;" // ISSHAR + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Tamil_InterIndic.txt b/icu4c/data/Tamil_InterIndic.txt index 878e374156..f6e14514f0 100644 --- a/icu4c/data/Tamil_InterIndic.txt +++ b/icu4c/data/Tamil_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding:
utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. //-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Tamil_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Tamil_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // Tamil_InterIndic -Tamil_InterIndic { +Tamil-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,69 +20,69 @@ Tamil_InterIndic { //-------------------------------------------------------------------- // Tamil-InterIndic - -"ஂ>\uE002;" // SIGN ANUSVARA -"ஃ>\uE003;" // SIGN VISARGA -"அ>\uE005;" // LETTER A -"ஆ>\uE006;" // LETTER AA -"இ>\uE007;" // LETTER I -"ஈ>\uE008;" // LETTER II -"உ>\uE009;" // LETTER U -"ஊ>\uE00A;" // LETTER UU -"எ>\uE081;" // LETTER E -"ஏ>\uE00F;" // LETTER EE -"ஐ>\uE010;" // LETTER AI -"ஒ>\uE082;" // LETTER O -"ஓ>\uE013;" // LETTER OO -"ஔ>\uE014;" // LETTER AU -"க>\uE015;" // LETTER KA -"ங>\uE019;" // LETTER NGA -"ச>\uE01A;" // LETTER CA -"ஜ>\uE01C;" // LETTER JA -"ஞ>\uE01E;" // LETTER NYA -"ட>\uE01F;" // LETTER TTA -"ண>\uE023;" // LETTER NNA -"த>\uE024;" // LETTER TA -"ந>\uE028;" // LETTER NA -"ன>\uE029;" // LETTER NNNA -"ப>\uE02A;" // LETTER PA -"ம>\uE02E;" // LETTER MA -"ய>\uE02F;" // LETTER YA -"ர>\uE030;" // LETTER RA -"ற>\uE083;" // LETTER RRA -"ல>\uE032;" // LETTER LA -"ள>\uE033;" // LETTER LLA -"ழ>\uE034;" // LETTER LLLA -"வ>\uE035;" // LETTER VA -"ஷ>\uE037;" // LETTER SSA -"ஸ>\uE038;" // LETTER SA -"ஹ>\uE039;" // LETTER HA -"ா>\uE03E;" // VOWEL SIGN AA -"ி>\uE03F;" // VOWEL SIGN I -"ீ>\uE040;" // VOWEL SIGN II 
-"ு>\uE041;" // VOWEL SIGN U -"ூ>\uE042;" // VOWEL SIGN UU -"ெ>\uE084;" // VOWEL SIGN E -"ே>\uE047;" // VOWEL SIGN EE -"ை>\uE048;" // VOWEL SIGN AI -"ொ>\uE085;" // VOWEL SIGN O -"ோ>\uE04B;" // VOWEL SIGN OO -"ௌ>\uE04C;" // VOWEL SIGN AU -"்>\uE04D;" // SIGN VIRAMA -"ௗ>\uE057;" // AU LENGTH MARK -"௧>\uE067;" // DIGIT ONE -"௨>\uE068;" // DIGIT TWO -"௩>\uE069;" // DIGIT THREE -"௪>\uE06A;" // DIGIT FOUR -"௫>\uE06B;" // DIGIT FIVE -"௬>\uE06C;" // DIGIT SIX -"௭>\uE06D;" // DIGIT SEVEN -"௮>\uE06E;" // DIGIT EIGHT -"௯>\uE06F;" // DIGIT NINE -// ௰>; // UNMAPPED Tamil-InterIndic: NUMBER TEN -// ௱>; // UNMAPPED Tamil-InterIndic: NUMBER ONE HUNDRED -// ௲>; // UNMAPPED Tamil-InterIndic: NUMBER ONE THOUSAND - +":: NFD (NFC) ;" +"\u0b82>\ue002;" // SIGN ANUSVARA +"\u0b83>\ue003;" // SIGN VISARGA +"\u0b85>\ue005;" // LETTER A +"\u0b86>\ue006;" // LETTER AA +"\u0b87>\ue007;" // LETTER I +"\u0b88>\ue008;" // LETTER II +"\u0b89>\ue009;" // LETTER U +"\u0b8a>\ue00a;" // LETTER UU +"\u0b8e>\ue00e;" // LETTER E +"\u0b8f>\ue00f;" // LETTER EE +"\u0b90>\ue010;" // LETTER AI +"\u0b92>\ue012;" // LETTER O +"\u0b93>\ue013;" // LETTER OO +"\u0b94>\ue014;" // LETTER AU +"\u0b95>\ue015;" // LETTER KA +"\u0b99>\ue019;" // LETTER NGA +"\u0b9a>\ue01a;" // LETTER CA +"\u0b9c>\ue01c;" // LETTER JA +"\u0b9e>\ue01e;" // LETTER NYA +"\u0b9f>\ue01f;" // LETTER TTA +"\u0ba3>\ue023;" // LETTER NNA +"\u0ba4>\ue024;" // LETTER TA +"\u0ba8>\ue028;" // LETTER NA +"\u0ba9>\ue029;" // LETTER NNNA +"\u0baa>\ue02a;" // LETTER PA +"\u0bae>\ue02e;" // LETTER MA +"\u0baf>\ue02f;" // LETTER YA +"\u0bb0>\ue030;" // LETTER RA +"\u0bb1>\ue031;" // LETTER RRA +"\u0bb2>\ue032;" // LETTER LA +"\u0bb3>\ue033;" // LETTER LLA +"\u0bb4>\ue034;" // LETTER LLLA +"\u0bb5>\ue035;" // LETTER VA +"\u0bb7>\ue037;" // LETTER SSA +"\u0bb8>\ue038;" // LETTER SA +"\u0bb9>\ue039;" // LETTER HA +"\u0bbe>\ue03e;" // VOWEL SIGN AA +"\u0bbf>\ue03f;" // VOWEL SIGN I +"\u0bc0>\ue040;" // VOWEL SIGN II +"\u0bc1>\ue041;" // VOWEL SIGN U 
+"\u0bc2>\ue042;" // VOWEL SIGN UU +"\u0bc6>\ue046;" // VOWEL SIGN E +"\u0bc7>\ue047;" // VOWEL SIGN EE +"\u0bc8>\ue048;" // VOWEL SIGN AI +"\u0bca>\ue04a;" // VOWEL SIGN O +"\u0bcb>\ue04b;" // VOWEL SIGN OO +"\u0bcc>\ue04c;" // VOWEL SIGN AU +"\u0bcd>\ue04d;" // SIGN VIRAMA +"\u0bd7>\ue057;" // AU LENGTH MARK +"\u0be7>\ue067;" // DIGIT ONE +"\u0be8>\ue068;" // DIGIT TWO +"\u0be9>\ue069;" // DIGIT THREE +"\u0bea>\ue06a;" // DIGIT FOUR +"\u0beb>\ue06b;" // DIGIT FIVE +"\u0bec>\ue06c;" // DIGIT SIX +"\u0bed>\ue06d;" // DIGIT SEVEN +"\u0bee>\ue06e;" // DIGIT EIGHT +"\u0bef>\ue06f;" // DIGIT NINE +// \u0bf0>; // UNMAPPED Tamil-InterIndic: NUMBER TEN +// \u0bf1>; // UNMAPPED Tamil-InterIndic: NUMBER ONE HUNDRED +// \u0bf2>; // UNMAPPED Tamil-InterIndic: NUMBER ONE THOUSAND + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/Telugu_InterIndic.txt b/icu4c/data/Telugu_InterIndic.txt index 16f0afa71e..b786d0c2a8 100644 --- a/icu4c/data/Telugu_InterIndic.txt +++ b/icu4c/data/Telugu_InterIndic.txt @@ -1,17 +1,16 @@ - // -*- Coding: utf-8; -*- //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines // Corporation and others. All Rights Reserved. 
//-------------------------------------------------------------------- // THIS IS A MACHINE-GENERATED FILE // Tool: dumpICUrules.bat -// Source: \icu4j\src\com\ibm\text\resources/Transliterator_Telugu_InterIndic.utf8.txt +// Source: \u005cicu4j\u005csrc\u005ccom\u005cibm\u005ctext\u005cresources/Transliterator_Telugu_InterIndic.utf8.txt // Date: Thu Mar 1 20:03:55 2001 //-------------------------------------------------------------------- // Telugu_InterIndic -Telugu_InterIndic { +Telugu-InterIndic { Rule { //-------------------------------------------------------------------- // Copyright (c) 1999-2001, International Business Machines @@ -21,88 +20,88 @@ Telugu_InterIndic { //-------------------------------------------------------------------- // Telugu-InterIndic - -"ఁ>\uE001;" // SIGN CANDRABINDU -"ం>\uE002;" // SIGN ANUSVARA -"ః>\uE003;" // SIGN VISARGA -"అ>\uE005;" // LETTER A -"ఆ>\uE006;" // LETTER AA -"ఇ>\uE007;" // LETTER I -"ఈ>\uE008;" // LETTER II -"ఉ>\uE009;" // LETTER U -"ఊ>\uE00A;" // LETTER UU -"ఋ>\uE00B;" // LETTER VOCALIC R -"ఌ>\uE00C;" // LETTER VOCALIC L -"ఎ>\uE081;" // LETTER E -"ఏ>\uE00F;" // LETTER EE -"ఐ>\uE010;" // LETTER AI -"ఒ>\uE082;" // LETTER O -"ఓ>\uE013;" // LETTER OO -"ఔ>\uE014;" // LETTER AU -"క>\uE015;" // LETTER KA -"ఖ>\uE016;" // LETTER KHA -"గ>\uE017;" // LETTER GA -"ఘ>\uE018;" // LETTER GHA -"ఙ>\uE019;" // LETTER NGA -"చ>\uE01A;" // LETTER CA -"ఛ>\uE01B;" // LETTER CHA -"జ>\uE01C;" // LETTER JA -"ఝ>\uE01D;" // LETTER JHA -"ఞ>\uE01E;" // LETTER NYA -"ట>\uE01F;" // LETTER TTA -"ఠ>\uE020;" // LETTER TTHA -"డ>\uE021;" // LETTER DDA -"ఢ>\uE022;" // LETTER DDHA -"ణ>\uE023;" // LETTER NNA -"త>\uE024;" // LETTER TA -"థ>\uE025;" // LETTER THA -"ద>\uE026;" // LETTER DA -"ధ>\uE027;" // LETTER DHA -"న>\uE028;" // LETTER NA -"ప>\uE02A;" // LETTER PA -"ఫ>\uE02B;" // LETTER PHA -"బ>\uE02C;" // LETTER BA -"భ>\uE02D;" // LETTER BHA -"మ>\uE02E;" // LETTER MA -"య>\uE02F;" // LETTER YA -"ర>\uE030;" // LETTER RA -"ఱ>\uE083;" // LETTER RRA 
-"ల>\uE032;" // LETTER LA -"ళ>\uE033;" // LETTER LLA -"వ>\uE035;" // LETTER VA -"శ>\uE036;" // LETTER SHA -"ష>\uE037;" // LETTER SSA -"స>\uE038;" // LETTER SA -"హ>\uE039;" // LETTER HA -"ా>\uE03E;" // VOWEL SIGN AA -"ి>\uE03F;" // VOWEL SIGN I -"ీ>\uE040;" // VOWEL SIGN II -"ు>\uE041;" // VOWEL SIGN U -"ూ>\uE042;" // VOWEL SIGN UU -"ృ>\uE043;" // VOWEL SIGN VOCALIC R -"ౄ>\uE044;" // VOWEL SIGN VOCALIC RR -"ె>\uE084;" // VOWEL SIGN E -"ే>\uE047;" // VOWEL SIGN EE -"ై>\uE048;" // VOWEL SIGN AI -"ొ>\uE085;" // VOWEL SIGN O -"ో>\uE04B;" // VOWEL SIGN OO -"ౌ>\uE04C;" // VOWEL SIGN AU -"్>\uE04D;" // SIGN VIRAMA -"ౕ>\uE055;" // LENGTH MARK -"ౖ>\uE056;" // AI LENGTH MARK -"ౠ>\uE060;" // LETTER VOCALIC RR -"ౡ>\uE061;" // LETTER VOCALIC LL -"౦>\uE066;" // DIGIT ZERO -"౧>\uE067;" // DIGIT ONE -"౨>\uE068;" // DIGIT TWO -"౩>\uE069;" // DIGIT THREE -"౪>\uE06A;" // DIGIT FOUR -"౫>\uE06B;" // DIGIT FIVE -"౬>\uE06C;" // DIGIT SIX -"౭>\uE06D;" // DIGIT SEVEN -"౮>\uE06E;" // DIGIT EIGHT -"౯>\uE06F;" // DIGIT NINE - +":: NFD (NFC) ;" +"\u0c01>\ue001;" // SIGN CANDRABINDU +"\u0c02>\ue002;" // SIGN ANUSVARA +"\u0c03>\ue003;" // SIGN VISARGA +"\u0c05>\ue005;" // LETTER A +"\u0c06>\ue006;" // LETTER AA +"\u0c07>\ue007;" // LETTER I +"\u0c08>\ue008;" // LETTER II +"\u0c09>\ue009;" // LETTER U +"\u0c0a>\ue00a;" // LETTER UU +"\u0c0b>\ue00b;" // LETTER VOCALIC R +"\u0c0c>\ue00c;" // LETTER VOCALIC L +"\u0c0e>\ue00e;" // LETTER E +"\u0c0f>\ue00f;" // LETTER EE +"\u0c10>\ue010;" // LETTER AI +"\u0c12>\ue012;" // LETTER O +"\u0c13>\ue013;" // LETTER OO +"\u0c14>\ue014;" // LETTER AU +"\u0c15>\ue015;" // LETTER KA +"\u0c16>\ue016;" // LETTER KHA +"\u0c17>\ue017;" // LETTER GA +"\u0c18>\ue018;" // LETTER GHA +"\u0c19>\ue019;" // LETTER NGA +"\u0c1a>\ue01a;" // LETTER CA +"\u0c1b>\ue01b;" // LETTER CHA +"\u0c1c>\ue01c;" // LETTER JA +"\u0c1d>\ue01d;" // LETTER JHA +"\u0c1e>\ue01e;" // LETTER NYA +"\u0c1f>\ue01f;" // LETTER TTA +"\u0c20>\ue020;" // LETTER TTHA +"\u0c21>\ue021;" // LETTER DDA 
+"\u0c22>\ue022;" // LETTER DDHA +"\u0c23>\ue023;" // LETTER NNA +"\u0c24>\ue024;" // LETTER TA +"\u0c25>\ue025;" // LETTER THA +"\u0c26>\ue026;" // LETTER DA +"\u0c27>\ue027;" // LETTER DHA +"\u0c28>\ue028;" // LETTER NA +"\u0c2a>\ue02a;" // LETTER PA +"\u0c2b>\ue02b;" // LETTER PHA +"\u0c2c>\ue02c;" // LETTER BA +"\u0c2d>\ue02d;" // LETTER BHA +"\u0c2e>\ue02e;" // LETTER MA +"\u0c2f>\ue02f;" // LETTER YA +"\u0c30>\ue030;" // LETTER RA +"\u0c31>\ue031;" // LETTER RRA +"\u0c32>\ue032;" // LETTER LA +"\u0c33>\ue033;" // LETTER LLA +"\u0c35>\ue035;" // LETTER VA +"\u0c36>\ue036;" // LETTER SHA +"\u0c37>\ue037;" // LETTER SSA +"\u0c38>\ue038;" // LETTER SA +"\u0c39>\ue039;" // LETTER HA +"\u0c3e>\ue03e;" // VOWEL SIGN AA +"\u0c3f>\ue03f;" // VOWEL SIGN I +"\u0c40>\ue040;" // VOWEL SIGN II +"\u0c41>\ue041;" // VOWEL SIGN U +"\u0c42>\ue042;" // VOWEL SIGN UU +"\u0c43>\ue043;" // VOWEL SIGN VOCALIC R +"\u0c44>\ue044;" // VOWEL SIGN VOCALIC RR +"\u0c46>\ue046;" // VOWEL SIGN E +"\u0c47>\ue047;" // VOWEL SIGN EE +"\u0c48>\ue048;" // VOWEL SIGN AI +"\u0c4a>\ue04a;" // VOWEL SIGN O +"\u0c4b>\ue04b;" // VOWEL SIGN OO +"\u0c4c>\ue04c;" // VOWEL SIGN AU +"\u0c4d>\ue04d;" // SIGN VIRAMA +"\u0c55>\ue055;" // LENGTH MARK +"\u0c56>\ue056;" // AI LENGTH MARK +"\u0c60>\ue060;" // LETTER VOCALIC RR +"\u0c61>\ue061;" // LETTER VOCALIC LL +"\u0c66>\ue066;" // DIGIT ZERO +"\u0c67>\ue067;" // DIGIT ONE +"\u0c68>\ue068;" // DIGIT TWO +"\u0c69>\ue069;" // DIGIT THREE +"\u0c6a>\ue06a;" // DIGIT FOUR +"\u0c6b>\ue06b;" // DIGIT FIVE +"\u0c6c>\ue06c;" // DIGIT SIX +"\u0c6d>\ue06d;" // DIGIT SEVEN +"\u0c6e>\ue06e;" // DIGIT EIGHT +"\u0c6f>\ue06f;" // DIGIT NINE + ":: NFC (NFD) ;" // eof } } diff --git a/icu4c/data/resfiles.mk b/icu4c/data/resfiles.mk index 8ad913dbd2..2ef5bc6ae4 100644 --- a/icu4c/data/resfiles.mk +++ b/icu4c/data/resfiles.mk @@ -107,22 +107,24 @@ TRANSLIT_SOURCE=fullhalf.txt translit_index.txt kana.txt kbdescl1.txt\ larabic.txt lcyril.txt ldevan.txt\ lgreek.txt lhebrew.txt 
ljamo.txt\ lkana.txt quotes.txt\ -Bengali_InterIndic.txt\ -Devanagari_InterIndic.txt\ -Gujarati_InterIndic.txt\ -Gurmukhi_InterIndic.txt\ -Kannada_InterIndic.txt\ -Malayalam_InterIndic.txt\ -Oriya_InterIndic.txt\ -Tamil_InterIndic.txt\ -Telugu_InterIndic.txt\ -InterIndic_Bengali.txt\ -InterIndic_Devanagari.txt\ -InterIndic_Gujarati.txt\ -InterIndic_Gurmukhi.txt\ -InterIndic_Kannada.txt\ -InterIndic_Malayalam.txt\ -InterIndic_Oriya.txt\ -InterIndic_Tamil.txt\ -InterIndic_Telugu.txt +Bengali-InterIndic.txt\ +Devanagari-InterIndic.txt\ +Gujarati-InterIndic.txt\ +Gurmukhi-InterIndic.txt\ +Kannada-InterIndic.txt\ +Malayalam-InterIndic.txt\ +Oriya-InterIndic.txt\ +Tamil-InterIndic.txt\ +Telugu-InterIndic.txt\ +InterIndic-Bengali.txt\ +InterIndic-Devanagari.txt\ +InterIndic-Gujarati.txt\ +InterIndic-Gurmukhi.txt\ +InterIndic-Kannada.txt\ +InterIndic-Malayalam.txt\ +InterIndic-Oriya.txt\ +InterIndic-Tamil.txt\ +InterIndic-Telugu.txt\ +Latin-InterIndic.txt\ +InterIndic-Latin.txt diff --git a/icu4c/data/translit_index.txt b/icu4c/data/translit_index.txt index 00a14882e8..9bfcd06032 100644 --- a/icu4c/data/translit_index.txt +++ b/icu4c/data/translit_index.txt @@ -70,8 +70,8 @@ translit_index { { "Latin-Cyrillic", "file", "lcyril", "FORWARD" }, { "Cyrillic-Latin", "file", "lcyril", "REVERSE" }, -{ "Latin-Devanagari", "file", "ldevan", "FORWARD" }, -{ "Devanagari-Latin", "file", "ldevan", "REVERSE" }, +//{ "Latin-Devanagari", "file", "ldevan", "FORWARD" }, +//{ "Devanagari-Latin", "file", "ldevan", "REVERSE" }, { "Latin-Greek", "file", "lgreek", "FORWARD" }, { "Greek-Latin", "file", "lgreek", "REVERSE" }, @@ -109,7 +109,7 @@ translit_index { { "Hangul-Latin", "alias", "[\uAC00-\uD7AF]NFD;Jamo-Latin", "" }, // Inter-Indic composed rules - +{ "Latin-InterIndic", "internal", "Latin_InterIndic", "FORWARD" }, { "Devanagari-InterIndic", "internal", "Devanagari_InterIndic", "FORWARD" }, { "Bengali-InterIndic", "internal", "Bengali_InterIndic", "FORWARD" }, { "Gurmukhi-InterIndic", 
"internal", "Gurmukhi_InterIndic", "FORWARD" }, @@ -120,6 +120,7 @@ translit_index { { "Kannada-InterIndic", "internal", "Kannada_InterIndic", "FORWARD" }, { "Malayalam-InterIndic", "internal", "Malayalam_InterIndic", "FORWARD" }, +{ "InterIndic-Latin", "internal", "InterIndic_Latin", "FORWARD" }, { "InterIndic-Devanagari", "internal", "InterIndic_Devanagari", "FORWARD" }, { "InterIndic-Bengali", "internal", "InterIndic_Bengali", "FORWARD" }, { "InterIndic-Gurmukhi", "internal", "InterIndic_Gurmukhi", "FORWARD" }, @@ -130,6 +131,29 @@ translit_index { { "InterIndic-Kannada", "internal", "InterIndic_Kannada", "FORWARD" }, { "InterIndic-Malayalam", "internal", "InterIndic_Malayalam", "FORWARD" }, +//Latin-X transliterators +{ "Latin-Devanagari", "alias", "Latin-InterIndic;InterIndic-Devanagari", "" }, +{ "Latin-Bengali", "alias", "Latin-InterIndic;InterIndic-Bengali", "" }, +{ "Latin-Gurmukhi", "alias", "Latin-InterIndic;InterIndic-Gurmukhi", "" }, +{ "Latin-Gujarati", "alias", "Latin-InterIndic;InterIndic-Gujarati", "" }, +{ "Latin-Oriya", "alias", "Latin-InterIndic;InterIndic-Oriya", "" }, +{ "Latin-Tamil", "alias", "Latin-InterIndic;InterIndic-Tamil", "" }, +{ "Latin-Telugu", "alias", "Latin-InterIndic;InterIndic-Telugu", "" }, +{ "Latin-Kannada", "alias", "Latin-InterIndic;InterIndic-Kannada", "" }, +{ "Latin-Malayalam", "alias", "Latin-InterIndic;InterIndic-Malayalam", "" }, + +//X-Latin transliterators +{ "Devanagari-Latin","alias", "Devanagari-InterIndic;InterIndic-Latin", "" }, +{ "Bengali-Latin", "alias", "Bengali-InterIndic;InterIndic-Latin", "" }, +{ "Gurmukhi-Latin", "alias", "Gurmukhi-InterIndic;InterIndic-Latin", "" }, +{ "Gujarati-Latin", "alias", "Gujarati-InterIndic;InterIndic-Latin", "" }, +{ "Oriya-Latin", "alias", "Oriya-InterIndic;InterIndic-Latin", "" }, +{ "Tamil-Latin", "alias", "Tamil-InterIndic;InterIndic-Latin", "" }, +{ "Telugu-Latin", "alias", "Telugu-InterIndic;InterIndic-Latin", "" }, +{ "Kannada-Latin", "alias", 
"Kannada-InterIndic;InterIndic-Latin", "" }, +{ "Malayalam-Latin", "alias", "Malayalam-InterIndic;InterIndic-Latin", "" }, + + { "Devanagari-Bengali", "alias", "Devanagari-InterIndic;InterIndic-Bengali", "" }, { "Devanagari-Gurmukhi", "alias", "Devanagari-InterIndic;InterIndic-Gurmukhi", "" }, { "Devanagari-Gujarati", "alias", "Devanagari-InterIndic;InterIndic-Gujarati", "" }, diff --git a/icu4c/source/data/locales/resfiles.mk b/icu4c/source/data/locales/resfiles.mk index 8ad913dbd2..2ef5bc6ae4 100644 --- a/icu4c/source/data/locales/resfiles.mk +++ b/icu4c/source/data/locales/resfiles.mk @@ -107,22 +107,24 @@ TRANSLIT_SOURCE=fullhalf.txt translit_index.txt kana.txt kbdescl1.txt\ larabic.txt lcyril.txt ldevan.txt\ lgreek.txt lhebrew.txt ljamo.txt\ lkana.txt quotes.txt\ -Bengali_InterIndic.txt\ -Devanagari_InterIndic.txt\ -Gujarati_InterIndic.txt\ -Gurmukhi_InterIndic.txt\ -Kannada_InterIndic.txt\ -Malayalam_InterIndic.txt\ -Oriya_InterIndic.txt\ -Tamil_InterIndic.txt\ -Telugu_InterIndic.txt\ -InterIndic_Bengali.txt\ -InterIndic_Devanagari.txt\ -InterIndic_Gujarati.txt\ -InterIndic_Gurmukhi.txt\ -InterIndic_Kannada.txt\ -InterIndic_Malayalam.txt\ -InterIndic_Oriya.txt\ -InterIndic_Tamil.txt\ -InterIndic_Telugu.txt +Bengali-InterIndic.txt\ +Devanagari-InterIndic.txt\ +Gujarati-InterIndic.txt\ +Gurmukhi-InterIndic.txt\ +Kannada-InterIndic.txt\ +Malayalam-InterIndic.txt\ +Oriya-InterIndic.txt\ +Tamil-InterIndic.txt\ +Telugu-InterIndic.txt\ +InterIndic-Bengali.txt\ +InterIndic-Devanagari.txt\ +InterIndic-Gujarati.txt\ +InterIndic-Gurmukhi.txt\ +InterIndic-Kannada.txt\ +InterIndic-Malayalam.txt\ +InterIndic-Oriya.txt\ +InterIndic-Tamil.txt\ +InterIndic-Telugu.txt\ +Latin-InterIndic.txt\ +InterIndic-Latin.txt diff --git a/icu4c/source/data/translit/translit_index.txt b/icu4c/source/data/translit/translit_index.txt index 00a14882e8..9bfcd06032 100644 --- a/icu4c/source/data/translit/translit_index.txt +++ b/icu4c/source/data/translit/translit_index.txt @@ -70,8 +70,8 @@ 
translit_index { { "Latin-Cyrillic", "file", "lcyril", "FORWARD" }, { "Cyrillic-Latin", "file", "lcyril", "REVERSE" }, -{ "Latin-Devanagari", "file", "ldevan", "FORWARD" }, -{ "Devanagari-Latin", "file", "ldevan", "REVERSE" }, +//{ "Latin-Devanagari", "file", "ldevan", "FORWARD" }, +//{ "Devanagari-Latin", "file", "ldevan", "REVERSE" }, { "Latin-Greek", "file", "lgreek", "FORWARD" }, { "Greek-Latin", "file", "lgreek", "REVERSE" }, @@ -109,7 +109,7 @@ translit_index { { "Hangul-Latin", "alias", "[\uAC00-\uD7AF]NFD;Jamo-Latin", "" }, // Inter-Indic composed rules - +{ "Latin-InterIndic", "internal", "Latin_InterIndic", "FORWARD" }, { "Devanagari-InterIndic", "internal", "Devanagari_InterIndic", "FORWARD" }, { "Bengali-InterIndic", "internal", "Bengali_InterIndic", "FORWARD" }, { "Gurmukhi-InterIndic", "internal", "Gurmukhi_InterIndic", "FORWARD" }, @@ -120,6 +120,7 @@ translit_index { { "Kannada-InterIndic", "internal", "Kannada_InterIndic", "FORWARD" }, { "Malayalam-InterIndic", "internal", "Malayalam_InterIndic", "FORWARD" }, +{ "InterIndic-Latin", "internal", "InterIndic_Latin", "FORWARD" }, { "InterIndic-Devanagari", "internal", "InterIndic_Devanagari", "FORWARD" }, { "InterIndic-Bengali", "internal", "InterIndic_Bengali", "FORWARD" }, { "InterIndic-Gurmukhi", "internal", "InterIndic_Gurmukhi", "FORWARD" }, @@ -130,6 +131,29 @@ translit_index { { "InterIndic-Kannada", "internal", "InterIndic_Kannada", "FORWARD" }, { "InterIndic-Malayalam", "internal", "InterIndic_Malayalam", "FORWARD" }, +//Latin-X transliterators +{ "Latin-Devanagari", "alias", "Latin-InterIndic;InterIndic-Devanagari", "" }, +{ "Latin-Bengali", "alias", "Latin-InterIndic;InterIndic-Bengali", "" }, +{ "Latin-Gurmukhi", "alias", "Latin-InterIndic;InterIndic-Gurmukhi", "" }, +{ "Latin-Gujarati", "alias", "Latin-InterIndic;InterIndic-Gujarati", "" }, +{ "Latin-Oriya", "alias", "Latin-InterIndic;InterIndic-Oriya", "" }, +{ "Latin-Tamil", "alias", "Latin-InterIndic;InterIndic-Tamil", "" }, +{ 
"Latin-Telugu", "alias", "Latin-InterIndic;InterIndic-Telugu", "" }, +{ "Latin-Kannada", "alias", "Latin-InterIndic;InterIndic-Kannada", "" }, +{ "Latin-Malayalam", "alias", "Latin-InterIndic;InterIndic-Malayalam", "" }, + +//X-Latin transliterators +{ "Devanagari-Latin","alias", "Devanagari-InterIndic;InterIndic-Latin", "" }, +{ "Bengali-Latin", "alias", "Bengali-InterIndic;InterIndic-Latin", "" }, +{ "Gurmukhi-Latin", "alias", "Gurmukhi-InterIndic;InterIndic-Latin", "" }, +{ "Gujarati-Latin", "alias", "Gujarati-InterIndic;InterIndic-Latin", "" }, +{ "Oriya-Latin", "alias", "Oriya-InterIndic;InterIndic-Latin", "" }, +{ "Tamil-Latin", "alias", "Tamil-InterIndic;InterIndic-Latin", "" }, +{ "Telugu-Latin", "alias", "Telugu-InterIndic;InterIndic-Latin", "" }, +{ "Kannada-Latin", "alias", "Kannada-InterIndic;InterIndic-Latin", "" }, +{ "Malayalam-Latin", "alias", "Malayalam-InterIndic;InterIndic-Latin", "" }, + + { "Devanagari-Bengali", "alias", "Devanagari-InterIndic;InterIndic-Bengali", "" }, { "Devanagari-Gurmukhi", "alias", "Devanagari-InterIndic;InterIndic-Gurmukhi", "" }, { "Devanagari-Gujarati", "alias", "Devanagari-InterIndic;InterIndic-Gujarati", "" },