// -*- Coding: utf-8; -*-
//--------------------------------------------------------------------
// Copyright (c) 1999-2001, International Business Machines
// Corporation and others. All Rights Reserved.
//--------------------------------------------------------------------
// THIS IS A MACHINE-GENERATED FILE
// Tool: dumpicurules.bat
// Source: ../../text/resources/Transliterator_Cyrillic_Latin.txt
// Date: Mon Nov 5 12:28:37 2001
//--------------------------------------------------------------------

// Cyrillic_Latin
//
// Resource bundle holding the Cyrillic <-> Latin transliteration rules.
// Each quoted string below is one rule (or variable definition); the
// adjacent strings together form the single "Rule" resource.
//
// Layout of the rule set, top to bottom:
//   1. ":: NFD (NFC) ;"  - normalization pass (NFD forward, NFC reverse).
//   2. Variable definitions for the combining marks / modifier letters.
//   3. Letters whose Latin form is "base letter + mark".  They are listed
//      before the plain letters ("move up so not masked") so that the
//      plain-letter rule for the same Latin base does not match first.
//   4. Plain letters ("Normal order").
//   5. Commented-out placeholders ("XXX") for letters with no mapping yet.
//   6. Reverse-only "Completeness" rules for Latin q, w, x.
//   7. ":: NFC (NFD) ;"  - normalization pass (NFC forward, NFD reverse).

translit_Cyrillic_Latin {
    Rule {
        //--------------------------------------------------------------------
        // Copyright (c) 1999-2001, International Business Machines
        // Corporation and others. All Rights Reserved.
        //--------------------------------------------------------------------
        // $Source: /xsrl/Nsvn/icu/icu/source/data/translit/Attic/t_Cyrl_Latn.txt,v $
        // $Date: 2001/11/05 20:38:59 $
        // $Revision: 1.2 $
        //--------------------------------------------------------------------

        // TODO: add remaining characters
        // Should add variants for Russian-English, Russian-German
        // Those can use this as a base, and then remap cases
        // like a $hat to ya or ja.

        ":: NFD (NFC) ;"

        // Modifier letters used for the soft/hard signs.
        "$modprime = \u02B9;"
        "$modprime2 = \u02BA;"

        // Combining marks attached to Latin base letters.
        "$grave = \u0300;"
        "$acute = \u0301;"
        "$hat = \u0302;"
        "$breve = \u0306 ;"
        "$dot = \u0307 ;"
        "$caron = \u030C ;"
        "$comma = \u0326 ;"
        "$under = \u0331 ;"

        // move up so not masked

        "я <> a $hat ;" // CYRILLIC SMALL LETTER YA
        "Я <> A $hat ;" // CYRILLIC CAPITAL LETTER YA
        "ч <> c $caron ;" // CYRILLIC SMALL LETTER CHE
        "Ч <> C $caron;" // CYRILLIC CAPITAL LETTER CHE
        // ҷ <> XXX ; # CYRILLIC SMALL LETTER CHE WITH DESCENDER
        // Ҷ <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH DESCENDER
        // ӌ <> XXX ; # CYRILLIC SMALL LETTER KHAKASSIAN CHE
        // Ӌ <> XXX ; # CYRILLIC CAPITAL LETTER KHAKASSIAN CHE
        // ҹ <> XXX ; # CYRILLIC SMALL LETTER CHE WITH VERTICAL STROKE
        // Ҹ <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH VERTICAL STROKE
        "э <> e $acute;" // CYRILLIC SMALL LETTER E
        "Э <> E $acute;" // CYRILLIC CAPITAL LETTER E
        "є <> e $hat;" // CYRILLIC SMALL LETTER UKRAINIAN IE
        "Є <> E $hat;" // CYRILLIC CAPITAL LETTER UKRAINIAN IE
        "ш <> s $caron ;" // CYRILLIC SMALL LETTER SHA
        "Ш <> S $caron ;" // CYRILLIC CAPITAL LETTER SHA
        "щ <> s $hat ;" // CYRILLIC SMALL LETTER SHCHA
        "Щ <> S $hat;" // CYRILLIC CAPITAL LETTER SHCHA
        "ѕ <> z $hat ;" // CYRILLIC SMALL LETTER DZE
        "Ѕ <> Z $hat;" // CYRILLIC CAPITAL LETTER DZE
        // ӡ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN DZE
        // Ӡ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN DZE
        "ю <> u $hat ;" // CYRILLIC SMALL LETTER YU
        "Ю <> U $hat ;" // CYRILLIC CAPITAL LETTER YU
        "і <> i $acute;" // CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
        "І <> I $acute;" // CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
        "ј <> j $caron;" // CYRILLIC SMALL LETTER JE
        "Ј <> J $caron;" // CYRILLIC CAPITAL LETTER JE
        "љ <> l $hat ;" // CYRILLIC SMALL LETTER LJE
        "Љ <> L $hat ;" // CYRILLIC CAPITAL LETTER LJE
        "њ <> n $hat ;" // CYRILLIC SMALL LETTER NJE
        "Њ <> N $hat ;" // CYRILLIC CAPITAL LETTER NJE
        "ћ <> c $acute ;" // CYRILLIC SMALL LETTER TSHE
        "Ћ <> C $acute ;" // CYRILLIC CAPITAL LETTER TSHE
        "џ <> d $hat ;" // CYRILLIC SMALL LETTER DZHE
        "Џ <> D $hat ;" // CYRILLIC CAPITAL LETTER DZHE

        // Normal order

        "а <> a ;" // CYRILLIC SMALL LETTER A
        "А <> A ;" // CYRILLIC CAPITAL LETTER A
        "ә <> \u0259 ;" // CYRILLIC SMALL LETTER SCHWA
        "Ә <> \u018F ;" // CYRILLIC CAPITAL LETTER SCHWA
        "ӕ <> \u00E6 ;" // CYRILLIC SMALL LIGATURE A IE
        "Ӕ <> \u00C6 ;" // CYRILLIC CAPITAL LIGATURE A IE
        "б <> b ;" // CYRILLIC SMALL LETTER BE
        "Б <> B ;" // CYRILLIC CAPITAL LETTER BE
        "в <> v ;" // CYRILLIC SMALL LETTER VE
        "В <> V ;" // CYRILLIC CAPITAL LETTER VE
        // The marked variants of GHE come before plain GHE so that
        // "g + mark" is tried before bare "g".
        "ґ <> g $grave ;" // CYRILLIC SMALL LETTER GHE WITH UPTURN
        "Ґ <> G $grave ;" // CYRILLIC CAPITAL LETTER GHE WITH UPTURN
        "ғ <> g $dot ;" // CYRILLIC SMALL LETTER GHE WITH STROKE
        "Ғ <> G $dot;" // CYRILLIC CAPITAL LETTER GHE WITH STROKE
        "ҕ <> g $breve;" // CYRILLIC SMALL LETTER GHE WITH MIDDLE HOOK
        "Ҕ <> G $breve;" // CYRILLIC CAPITAL LETTER GHE WITH MIDDLE HOOK
        "г <> g ;" // CYRILLIC SMALL LETTER GHE
        "Г <> G ;" // CYRILLIC CAPITAL LETTER GHE
        "д <> d;" // CYRILLIC SMALL LETTER DE
        "Д <> D;" // CYRILLIC CAPITAL LETTER DE
        "ђ <> đ ;" // CYRILLIC SMALL LETTER DJE
        "Ђ <> Đ ;" // CYRILLIC CAPITAL LETTER DJE
        "ҙ <> z $comma ;" // CYRILLIC SMALL LETTER ZE WITH DESCENDER
        "Ҙ <> Z $comma ;" // CYRILLIC CAPITAL LETTER ZE WITH DESCENDER
        "е <> e ;" // CYRILLIC SMALL LETTER IE
        "Е <> E;" // CYRILLIC CAPITAL LETTER IE
        "ж <> z $caron;" // CYRILLIC SMALL LETTER ZHE
        "Ж <> Z $caron;" // CYRILLIC CAPITAL LETTER ZHE
        // җ <> XXX ; # CYRILLIC SMALL LETTER ZHE WITH DESCENDER
        // Җ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
        "з <> z ;" // CYRILLIC SMALL LETTER ZE
        "З <> Z;" // CYRILLIC CAPITAL LETTER ZE
        // NOTE(review): й/Й canonically decompose to и/И + U+0306 under NFD,
        // so after the leading ":: NFD" pass the forward side of these two
        // rules may never see the precomposed letter - confirm whether
        // "и $breve" was intended on the left-hand side.
        "й <> j ;" // CYRILLIC SMALL LETTER SHORT I
        "Й <> J ;" // CYRILLIC CAPITAL LETTER SHORT I
        "и <> i ;" // CYRILLIC SMALL LETTER I
        "И <> I ;" // CYRILLIC CAPITAL LETTER I
        "к <> k ;" // CYRILLIC SMALL LETTER KA
        "К <> K;" // CYRILLIC CAPITAL LETTER KA
        // қ <> XXX ; # CYRILLIC SMALL LETTER KA WITH DESCENDER
        // Қ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
        // ӄ <> XXX ; # CYRILLIC SMALL LETTER KA WITH HOOK
        // Ӄ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH HOOK
        // ҡ <> XXX ; # CYRILLIC SMALL LETTER BASHKIR KA
        // Ҡ <> XXX ; # CYRILLIC CAPITAL LETTER BASHKIR KA
        // ҟ <> XXX ; # CYRILLIC SMALL LETTER KA WITH STROKE
        // Ҟ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH STROKE
        // ҝ <> XXX ; # CYRILLIC SMALL LETTER KA WITH VERTICAL STROKE
        // Ҝ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH VERTICAL STROKE
        "л <> l ;" // CYRILLIC SMALL LETTER EL
        "Л <> L;" // CYRILLIC CAPITAL LETTER EL
        "м <> m ;" // CYRILLIC SMALL LETTER EM
        "М <> M ;" // CYRILLIC CAPITAL LETTER EM
        "н <> n ;" // CYRILLIC SMALL LETTER EN
        "Н <> N;" // CYRILLIC CAPITAL LETTER EN
        // ң <> XXX ; # CYRILLIC SMALL LETTER EN WITH DESCENDER
        // Ң <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
        // ӈ <> XXX ; # CYRILLIC SMALL LETTER EN WITH HOOK
        // Ӈ <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH HOOK
        // ҥ <> XXX ; # CYRILLIC SMALL LIGATURE EN GHE
        // Ҥ <> XXX ; # CYRILLIC CAPITAL LIGATURE EN GHE
        "о <> o ;" // CYRILLIC SMALL LETTER O
        "О <> O ;" // CYRILLIC CAPITAL LETTER O
        // ө <> XXX ; # CYRILLIC SMALL LETTER BARRED O
        // Ө <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
        "п <> p ;" // CYRILLIC SMALL LETTER PE
        "П <> P ;" // CYRILLIC CAPITAL LETTER PE
        // ҧ <> XXX ; # CYRILLIC SMALL LETTER PE WITH MIDDLE HOOK
        // Ҧ <> XXX ; # CYRILLIC CAPITAL LETTER PE WITH MIDDLE HOOK
        // ҁ <> XXX ; # CYRILLIC SMALL LETTER KOPPA
        // Ҁ <> XXX ; # CYRILLIC CAPITAL LETTER KOPPA
        "р <> r ;" // CYRILLIC SMALL LETTER ER
        "Р <> R ;" // CYRILLIC CAPITAL LETTER ER
        // ҏ <> XXX ; # CYRILLIC SMALL LETTER ER WITH TICK
        // Ҏ <> XXX ; # CYRILLIC CAPITAL LETTER ER WITH TICK
        "с <> s ;" // CYRILLIC SMALL LETTER ES
        "С <> S ;" // CYRILLIC CAPITAL LETTER ES
        // ҫ <> XXX ; # CYRILLIC SMALL LETTER ES WITH DESCENDER
        // Ҫ <> XXX ; # CYRILLIC CAPITAL LETTER ES WITH DESCENDER
        "т <> t ;" // CYRILLIC SMALL LETTER TE
        "Т <> T ;" // CYRILLIC CAPITAL LETTER TE
        // ҭ <> XXX ; # CYRILLIC SMALL LETTER TE WITH DESCENDER
        // Ҭ <> XXX ; # CYRILLIC CAPITAL LETTER TE WITH DESCENDER
        "у <> u ;" // CYRILLIC SMALL LETTER U
        "У <> U ;" // CYRILLIC CAPITAL LETTER U
        // ү <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U
        // Ү <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U
        // ұ <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
        // Ұ <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
        // ѹ <> XXX ; # CYRILLIC SMALL LETTER UK
        // Ѹ <> XXX ; # CYRILLIC CAPITAL LETTER UK
        "ф <> f ;" // CYRILLIC SMALL LETTER EF
        "Ф <> F ;" // CYRILLIC CAPITAL LETTER EF
        "х <> h ;" // CYRILLIC SMALL LETTER HA
        "Х <> H;" // CYRILLIC CAPITAL LETTER HA
        // ҳ <> XXX ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
        // Ҳ <> XXX ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
        // һ <> XXX ; # CYRILLIC SMALL LETTER SHHA
        // Һ <> XXX ; # CYRILLIC CAPITAL LETTER SHHA
        // ѡ <> XXX ; # CYRILLIC SMALL LETTER OMEGA
        // Ѡ <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA
        // ѿ <> XXX ; # CYRILLIC SMALL LETTER OT
        // Ѿ <> XXX ; # CYRILLIC CAPITAL LETTER OT
        // ѽ <> XXX ; # CYRILLIC SMALL LETTER OMEGA WITH TITLO
        // Ѽ <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA WITH TITLO
        // ѻ <> XXX ; # CYRILLIC SMALL LETTER ROUND OMEGA
        // Ѻ <> XXX ; # CYRILLIC CAPITAL LETTER ROUND OMEGA
        "ц <> c ;" // CYRILLIC SMALL LETTER TSE
        "Ц <> C;" // CYRILLIC CAPITAL LETTER TSE
        // ҵ <> XXX ; # CYRILLIC SMALL LIGATURE TE TSE
        // Ҵ <> XXX ; # CYRILLIC CAPITAL LIGATURE TE TSE
        // ҽ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE
        // Ҽ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE
        // ҿ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER
        // Ҿ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER
        // Capital signs (prime + $under) precede the small ones (bare prime)
        // so the longer Latin sequence is tried first.
        "Ъ <> $modprime2 $under ;" // CYRILLIC CAPITAL LETTER HARD SIGN
        "ъ <> $modprime2 ;" // CYRILLIC SMALL LETTER HARD SIGN
        "Ь <> $modprime $under ;" // CYRILLIC CAPITAL LETTER SOFT SIGN
        "ь <> $modprime ;" // CYRILLIC SMALL LETTER SOFT SIGN
        "ы <> y ;" // CYRILLIC SMALL LETTER YERU
        "Ы <> Y ;" // CYRILLIC CAPITAL LETTER YERU
        // ҍ <> XXX ; # CYRILLIC SMALL LETTER SEMISOFT SIGN
        // Ҍ <> XXX ; # CYRILLIC CAPITAL LETTER SEMISOFT SIGN
        // ѣ <> XXX ; # CYRILLIC SMALL LETTER YAT
        // Ѣ <> XXX ; # CYRILLIC CAPITAL LETTER YAT
        // ѥ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED E
        // Ѥ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED E
        // ѧ <> XXX ; # CYRILLIC SMALL LETTER LITTLE YUS
        // Ѧ <> XXX ; # CYRILLIC CAPITAL LETTER LITTLE YUS
        // ѫ <> XXX ; # CYRILLIC SMALL LETTER BIG YUS
        // Ѫ <> XXX ; # CYRILLIC CAPITAL LETTER BIG YUS
        // ѩ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED LITTLE YUS
        // Ѩ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED LITTLE YUS
        // ѭ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED BIG YUS
        // Ѭ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED BIG YUS
        // ѯ <> XXX ; # CYRILLIC SMALL LETTER KSI
        // Ѯ <> XXX ; # CYRILLIC CAPITAL LETTER KSI
        // ѱ <> XXX ; # CYRILLIC SMALL LETTER PSI
        // Ѱ <> XXX ; # CYRILLIC CAPITAL LETTER PSI
        // ѳ <> XXX ; # CYRILLIC SMALL LETTER FITA
        // Ѳ <> XXX ; # CYRILLIC CAPITAL LETTER FITA
        // ѵ <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
        // Ѵ <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA
        // ҩ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN HA
        // Ҩ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN HA
        // Ӏ <> XXX ; # CYRILLIC LETTER PALOCHKA

        // NOTE(review): the "//##" entries below are precomposed letters; the
        // name printed for each appears to be that of its base letter only
        // (e.g. several distinct letters are all labelled "LETTER U") -
        // confirm against the Unicode character names before relying on them.
        //## ӑ <> XXX ; # CYRILLIC SMALL LETTER A
        //## Ӑ <> XXX ; # CYRILLIC CAPITAL LETTER A
        //## ӓ <> XXX ; # CYRILLIC SMALL LETTER A
        //## Ӓ <> XXX ; # CYRILLIC CAPITAL LETTER A
        //## ӛ <> XXX ; # CYRILLIC SMALL LETTER SCHWA
        //## Ӛ <> XXX ; # CYRILLIC CAPITAL LETTER SCHWA
        //## ѓ <> XXX ; # CYRILLIC SMALL LETTER GHE
        //## Ѓ <> XXX ; # CYRILLIC CAPITAL LETTER GHE
        //## ѐ <> XXX ; # CYRILLIC SMALL LETTER IE
        //## Ѐ <> XXX ; # CYRILLIC CAPITAL LETTER IE
        //## ё <> XXX ; # CYRILLIC SMALL LETTER IE
        //## Ё <> XXX ; # CYRILLIC CAPITAL LETTER IE
        //## ӗ <> XXX ; # CYRILLIC SMALL LETTER IE
        //## Ӗ <> XXX ; # CYRILLIC CAPITAL LETTER IE
        //## ӂ <> XXX ; # CYRILLIC SMALL LETTER ZHE
        //## Ӂ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
        //## ӝ <> XXX ; # CYRILLIC SMALL LETTER ZHE
        //## Ӝ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
        //## ӟ <> XXX ; # CYRILLIC SMALL LETTER ZE
        //## Ӟ <> XXX ; # CYRILLIC CAPITAL LETTER ZE
        //## ѝ <> XXX ; # CYRILLIC SMALL LETTER I
        //## Ѝ <> XXX ; # CYRILLIC CAPITAL LETTER I
        //## ӣ <> XXX ; # CYRILLIC SMALL LETTER I
        //## Ӣ <> XXX ; # CYRILLIC CAPITAL LETTER I
        //## ӥ <> XXX ; # CYRILLIC SMALL LETTER I
        //## Ӥ <> XXX ; # CYRILLIC CAPITAL LETTER I
        //## ї <> XXX ; # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
        //## Ї <> XXX ; # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
        //## ӧ <> XXX ; # CYRILLIC SMALL LETTER O
        //## Ӧ <> XXX ; # CYRILLIC CAPITAL LETTER O
        //## ӫ <> XXX ; # CYRILLIC SMALL LETTER BARRED O
        //## Ӫ <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
        //## ќ <> XXX ; # CYRILLIC SMALL LETTER KA
        //## Ќ <> XXX ; # CYRILLIC CAPITAL LETTER KA
        //## ӯ <> XXX ; # CYRILLIC SMALL LETTER U
        //## Ӯ <> XXX ; # CYRILLIC CAPITAL LETTER U
        //## ў <> XXX ; # CYRILLIC SMALL LETTER U
        //## Ў <> XXX ; # CYRILLIC CAPITAL LETTER U
        //## ӱ <> XXX ; # CYRILLIC SMALL LETTER U
        //## Ӱ <> XXX ; # CYRILLIC CAPITAL LETTER U
        //## ӳ <> XXX ; # CYRILLIC SMALL LETTER U
        //## Ӳ <> XXX ; # CYRILLIC CAPITAL LETTER U
        //## ӵ <> XXX ; # CYRILLIC SMALL LETTER CHE
        //## Ӵ <> XXX ; # CYRILLIC CAPITAL LETTER CHE
        //## ӹ <> XXX ; # CYRILLIC SMALL LETTER YERU
        //## Ӹ <> XXX ; # CYRILLIC CAPITAL LETTER YERU
        //## ӭ <> XXX ; # CYRILLIC SMALL LETTER E
        //## Ӭ <> XXX ; # CYRILLIC CAPITAL LETTER E
        //## ѷ <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
        //## Ѷ <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA

        // Completeness
        //
        // Reverse-only ("<") rules for Latin letters that no rule above
        // produces: q, w and x are rewritten to k, u and ks.  The leading
        // "|" places the cursor before the replacement text, so it is
        // processed again by the rules above.
        // $ignore matches any run of marks and apostrophes; the two context
        // rules use it to pick upper-case "KS" when X stands next to an
        // upper-case letter, and "Ks" otherwise.
        "$ignore = [[:Mark:]''] * ;"
        "| k < q ;"
        "| K < Q ;"
        "| u < w ;"
        "| U < W ;"
        "| KS < X } $ignore [:UppercaseLetter:] ;"
        "| KS < [:UppercaseLetter:] $ignore { X ;"
        "| Ks < X ;"
        "| ks < x ;"

        ":: NFC (NFD) ;"
    }
}