ICU-3301 repair clobbered UTF8 files

X-SVN-Rev: 15483
This commit is contained in:
Alan Liu 2004-05-22 00:23:45 +00:00
parent 544bbc2977
commit 147e6b8116
4 changed files with 524 additions and 540 deletions

View File

@ -1,11 +1,7 @@
???#--------------------------------------------------------------------
#--------------------------------------------------------------------
# Copyright (c) 1999-2004, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# $Source: /xsrl/Nsvn/icu/icu4j/src/com/ibm/icu/impl/data/Attic/Transliterator_Cyrillic_Latin.txt,v $
# $Date: 2004/05/21 01:01:51 $
# $Revision: 1.12 $
#--------------------------------------------------------------------
# TODO: add remaining characters
# Should add variants for Russian-English, Russian-German
# Those can use this as a base, and then remap cases
@ -31,266 +27,266 @@ $under = \u0331 ;
# move up so not masked
?? <> a $hat ; # CYRILLIC SMALL LETTER YA
?? <> A $hat ; # CYRILLIC CAPITAL LETTER YA
я <> a $hat ; # CYRILLIC SMALL LETTER YA
Я <> A $hat ; # CYRILLIC CAPITAL LETTER YA
?? <> c $caron ; # CYRILLIC SMALL LETTER CHE
?? <> C $caron; # CYRILLIC CAPITAL LETTER CHE
# ?? <> XXX ; # CYRILLIC SMALL LETTER CHE WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH DESCENDER
# ?? <> XXX ; # CYRILLIC SMALL LETTER KHAKASSIAN CHE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KHAKASSIAN CHE
# ?? <> XXX ; # CYRILLIC SMALL LETTER CHE WITH VERTICAL STROKE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH VERTICAL STROKE
ч <> c $caron ; # CYRILLIC SMALL LETTER CHE
Ч <> C $caron; # CYRILLIC CAPITAL LETTER CHE
# ҷ <> XXX ; # CYRILLIC SMALL LETTER CHE WITH DESCENDER
# Ҷ <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH DESCENDER
# ӌ <> XXX ; # CYRILLIC SMALL LETTER KHAKASSIAN CHE
# Ӌ <> XXX ; # CYRILLIC CAPITAL LETTER KHAKASSIAN CHE
# ҹ <> XXX ; # CYRILLIC SMALL LETTER CHE WITH VERTICAL STROKE
# Ҹ <> XXX ; # CYRILLIC CAPITAL LETTER CHE WITH VERTICAL STROKE
?? <> e $acute; # CYRILLIC SMALL LETTER E
?? <> E $acute; # CYRILLIC CAPITAL LETTER E
?? <> e $hat; # CYRILLIC SMALL LETTER UKRAINIAN IE
?? <> E $hat; # CYRILLIC CAPITAL LETTER UKRAINIAN IE
э <> e $acute; # CYRILLIC SMALL LETTER E
Э <> E $acute; # CYRILLIC CAPITAL LETTER E
є <> e $hat; # CYRILLIC SMALL LETTER UKRAINIAN IE
Є <> E $hat; # CYRILLIC CAPITAL LETTER UKRAINIAN IE
?? <> s $caron ; # CYRILLIC SMALL LETTER SHA
?? <> S $caron ; # CYRILLIC CAPITAL LETTER SHA
?? <> s $hat ; # CYRILLIC SMALL LETTER SHCHA
?? <> S $hat; # CYRILLIC CAPITAL LETTER SHCHA
ш <> s $caron ; # CYRILLIC SMALL LETTER SHA
Ш <> S $caron ; # CYRILLIC CAPITAL LETTER SHA
щ <> s $hat ; # CYRILLIC SMALL LETTER SHCHA
Щ <> S $hat; # CYRILLIC CAPITAL LETTER SHCHA
?? <> z $hat ; # CYRILLIC SMALL LETTER DZE
?? <> Z $hat; # CYRILLIC CAPITAL LETTER DZE
# ?? <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN DZE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN DZE
ѕ <> z $hat ; # CYRILLIC SMALL LETTER DZE
Ѕ <> Z $hat; # CYRILLIC CAPITAL LETTER DZE
# ӡ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN DZE
# Ӡ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN DZE
?? <> u $hat ; # CYRILLIC SMALL LETTER YU
?? <> U $hat ; # CYRILLIC CAPITAL LETTER YU
ю <> u $hat ; # CYRILLIC SMALL LETTER YU
Ю <> U $hat ; # CYRILLIC CAPITAL LETTER YU
?? <> i $acute; # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
?? <> I $acute; # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
?? <> j $caron; # CYRILLIC SMALL LETTER JE
?? <> J $caron; # CYRILLIC CAPITAL LETTER JE
і <> i $acute; # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
І <> I $acute; # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
ј <> j $caron; # CYRILLIC SMALL LETTER JE
Ј <> J $caron; # CYRILLIC CAPITAL LETTER JE
?? <> l $hat ; # CYRILLIC SMALL LETTER LJE
?? <> L $hat ; # CYRILLIC CAPITAL LETTER LJE
?? <> n $hat ; # CYRILLIC SMALL LETTER NJE
?? <> N $hat ; # CYRILLIC CAPITAL LETTER NJE
љ <> l $hat ; # CYRILLIC SMALL LETTER LJE
Љ <> L $hat ; # CYRILLIC CAPITAL LETTER LJE
њ <> n $hat ; # CYRILLIC SMALL LETTER NJE
Њ <> N $hat ; # CYRILLIC CAPITAL LETTER NJE
?? <> c $acute ; # CYRILLIC SMALL LETTER TSHE
?? <> C $acute ; # CYRILLIC CAPITAL LETTER TSHE
ћ <> c $acute ; # CYRILLIC SMALL LETTER TSHE
Ћ <> C $acute ; # CYRILLIC CAPITAL LETTER TSHE
?? <> d $hat ; # CYRILLIC SMALL LETTER DZHE
?? <> D $hat ; # CYRILLIC CAPITAL LETTER DZHE
џ <> d $hat ; # CYRILLIC SMALL LETTER DZHE
Џ <> D $hat ; # CYRILLIC CAPITAL LETTER DZHE
# Normal order
?? <> a ; # CYRILLIC SMALL LETTER A
?? <> A ; # CYRILLIC CAPITAL LETTER A
?? <> \u0259 ; # CYRILLIC SMALL LETTER SCHWA
?? <> \u018F ; # CYRILLIC CAPITAL LETTER SCHWA
?? <> \u00E6 ; # CYRILLIC SMALL LIGATURE A IE
?? <> \u00C6 ; # CYRILLIC CAPITAL LIGATURE A IE
?? <> b ; # CYRILLIC SMALL LETTER BE
?? <> B ; # CYRILLIC CAPITAL LETTER BE
?? <> v ; # CYRILLIC SMALL LETTER VE
?? <> V ; # CYRILLIC CAPITAL LETTER VE
а <> a ; # CYRILLIC SMALL LETTER A
А <> A ; # CYRILLIC CAPITAL LETTER A
ә <> \u0259 ; # CYRILLIC SMALL LETTER SCHWA
Ә <> \u018F ; # CYRILLIC CAPITAL LETTER SCHWA
ӕ <> \u00E6 ; # CYRILLIC SMALL LIGATURE A IE
Ӕ <> \u00C6 ; # CYRILLIC CAPITAL LIGATURE A IE
б <> b ; # CYRILLIC SMALL LETTER BE
Б <> B ; # CYRILLIC CAPITAL LETTER BE
в <> v ; # CYRILLIC SMALL LETTER VE
В <> V ; # CYRILLIC CAPITAL LETTER VE
?? <> g $grave ; # CYRILLIC SMALL LETTER GHE WITH UPTURN
?? <> G $grave ; # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
?? <> g $dot ; # CYRILLIC SMALL LETTER GHE WITH STROKE
?? <> G $dot; # CYRILLIC CAPITAL LETTER GHE WITH STROKE
?? <> g $breve; # CYRILLIC SMALL LETTER GHE WITH MIDDLE HOOK
?? <> G $breve; # CYRILLIC CAPITAL LETTER GHE WITH MIDDLE HOOK
?? <> g ; # CYRILLIC SMALL LETTER GHE
?? <> G ; # CYRILLIC CAPITAL LETTER GHE
ґ <> g $grave ; # CYRILLIC SMALL LETTER GHE WITH UPTURN
Ґ <> G $grave ; # CYRILLIC CAPITAL LETTER GHE WITH UPTURN
ғ <> g $dot ; # CYRILLIC SMALL LETTER GHE WITH STROKE
Ғ <> G $dot; # CYRILLIC CAPITAL LETTER GHE WITH STROKE
ҕ <> g $breve; # CYRILLIC SMALL LETTER GHE WITH MIDDLE HOOK
Ҕ <> G $breve; # CYRILLIC CAPITAL LETTER GHE WITH MIDDLE HOOK
г <> g ; # CYRILLIC SMALL LETTER GHE
Г <> G ; # CYRILLIC CAPITAL LETTER GHE
?? <> d; # CYRILLIC SMALL LETTER DE
?? <> D; # CYRILLIC CAPITAL LETTER DE
?? <> ?? ; # CYRILLIC SMALL LETTER DJE
?? <> ?? ; # CYRILLIC CAPITAL LETTER DJE
?? <> z $comma ; # CYRILLIC SMALL LETTER ZE WITH DESCENDER
?? <> Z $comma ; # CYRILLIC CAPITAL LETTER ZE WITH DESCENDER
?? <> e ; # CYRILLIC SMALL LETTER IE
?? <> E; # CYRILLIC CAPITAL LETTER IE
д <> d; # CYRILLIC SMALL LETTER DE
Д <> D; # CYRILLIC CAPITAL LETTER DE
ђ <> đ ; # CYRILLIC SMALL LETTER DJE
Ђ <> Đ ; # CYRILLIC CAPITAL LETTER DJE
ҙ <> z $comma ; # CYRILLIC SMALL LETTER ZE WITH DESCENDER
Ҙ <> Z $comma ; # CYRILLIC CAPITAL LETTER ZE WITH DESCENDER
е <> e ; # CYRILLIC SMALL LETTER IE
Е <> E; # CYRILLIC CAPITAL LETTER IE
?? <> z $caron; # CYRILLIC SMALL LETTER ZHE
?? <> Z $caron; # CYRILLIC CAPITAL LETTER ZHE
ж <> z $caron; # CYRILLIC SMALL LETTER ZHE
Ж <> Z $caron; # CYRILLIC CAPITAL LETTER ZHE
# ?? <> XXX ; # CYRILLIC SMALL LETTER ZHE WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
# җ <> XXX ; # CYRILLIC SMALL LETTER ZHE WITH DESCENDER
# Җ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
?? <> z ; # CYRILLIC SMALL LETTER ZE
?? <> Z; # CYRILLIC CAPITAL LETTER ZE
з <> z ; # CYRILLIC SMALL LETTER ZE
З <> Z; # CYRILLIC CAPITAL LETTER ZE
???? <> j ; # CYRILLIC SMALL LETTER I
???? <> J ; # CYRILLIC CAPITAL LETTER I
?? <> i ; # CYRILLIC SMALL LETTER I
?? <> I ; # CYRILLIC CAPITAL LETTER I
й <> j ; # CYRILLIC SMALL LETTER I
Й <> J ; # CYRILLIC CAPITAL LETTER I
и <> i ; # CYRILLIC SMALL LETTER I
И <> I ; # CYRILLIC CAPITAL LETTER I
?? <> k ; # CYRILLIC SMALL LETTER KA
?? <> K; # CYRILLIC CAPITAL LETTER KA
к <> k ; # CYRILLIC SMALL LETTER KA
К <> K; # CYRILLIC CAPITAL LETTER KA
# ?? <> XXX ; # CYRILLIC SMALL LETTER KA WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
# ?? <> XXX ; # CYRILLIC SMALL LETTER KA WITH HOOK
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH HOOK
# ?? <> XXX ; # CYRILLIC SMALL LETTER BASHKIR KA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER BASHKIR KA
# ?? <> XXX ; # CYRILLIC SMALL LETTER KA WITH STROKE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH STROKE
# ?? <> XXX ; # CYRILLIC SMALL LETTER KA WITH VERTICAL STROKE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH VERTICAL STROKE
?? <> l ; # CYRILLIC SMALL LETTER EL
?? <> L; # CYRILLIC CAPITAL LETTER EL
# қ <> XXX ; # CYRILLIC SMALL LETTER KA WITH DESCENDER
# Қ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
# ӄ <> XXX ; # CYRILLIC SMALL LETTER KA WITH HOOK
# Ӄ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH HOOK
# ҡ <> XXX ; # CYRILLIC SMALL LETTER BASHKIR KA
# Ҡ <> XXX ; # CYRILLIC CAPITAL LETTER BASHKIR KA
# ҟ <> XXX ; # CYRILLIC SMALL LETTER KA WITH STROKE
# Ҟ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH STROKE
# ҝ <> XXX ; # CYRILLIC SMALL LETTER KA WITH VERTICAL STROKE
# Ҝ <> XXX ; # CYRILLIC CAPITAL LETTER KA WITH VERTICAL STROKE
л <> l ; # CYRILLIC SMALL LETTER EL
Л <> L; # CYRILLIC CAPITAL LETTER EL
?? <> m ; # CYRILLIC SMALL LETTER EM
?? <> M ; # CYRILLIC CAPITAL LETTER EM
?? <> n ; # CYRILLIC SMALL LETTER EN
?? <> N; # CYRILLIC CAPITAL LETTER EN
# ?? <> XXX ; # CYRILLIC SMALL LETTER EN WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
# ?? <> XXX ; # CYRILLIC SMALL LETTER EN WITH HOOK
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH HOOK
# ?? <> XXX ; # CYRILLIC SMALL LIGATURE EN GHE
# ?? <> XXX ; # CYRILLIC CAPITAL LIGATURE EN GHE
м <> m ; # CYRILLIC SMALL LETTER EM
М <> M ; # CYRILLIC CAPITAL LETTER EM
н <> n ; # CYRILLIC SMALL LETTER EN
Н <> N; # CYRILLIC CAPITAL LETTER EN
# ң <> XXX ; # CYRILLIC SMALL LETTER EN WITH DESCENDER
# Ң <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
# ӈ <> XXX ; # CYRILLIC SMALL LETTER EN WITH HOOK
# Ӈ <> XXX ; # CYRILLIC CAPITAL LETTER EN WITH HOOK
# ҥ <> XXX ; # CYRILLIC SMALL LIGATURE EN GHE
# Ҥ <> XXX ; # CYRILLIC CAPITAL LIGATURE EN GHE
?? <> o ; # CYRILLIC SMALL LETTER O
?? <> O ; # CYRILLIC CAPITAL LETTER O
# ?? <> XXX ; # CYRILLIC SMALL LETTER BARRED O
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
?? <> p ; # CYRILLIC SMALL LETTER PE
?? <> P ; # CYRILLIC CAPITAL LETTER PE
# ?? <> XXX ; # CYRILLIC SMALL LETTER PE WITH MIDDLE HOOK
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER PE WITH MIDDLE HOOK
# ?? <> XXX ; # CYRILLIC SMALL LETTER KOPPA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KOPPA
?? <> r ; # CYRILLIC SMALL LETTER ER
?? <> R ; # CYRILLIC CAPITAL LETTER ER
# ?? <> XXX ; # CYRILLIC SMALL LETTER ER WITH TICK
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ER WITH TICK
?? <> s ; # CYRILLIC SMALL LETTER ES
?? <> S ; # CYRILLIC CAPITAL LETTER ES
# ?? <> XXX ; # CYRILLIC SMALL LETTER ES WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ES WITH DESCENDER
?? <> t ; # CYRILLIC SMALL LETTER TE
?? <> T ; # CYRILLIC CAPITAL LETTER TE
# ?? <> XXX ; # CYRILLIC SMALL LETTER TE WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER TE WITH DESCENDER
о <> o ; # CYRILLIC SMALL LETTER O
О <> O ; # CYRILLIC CAPITAL LETTER O
# ө <> XXX ; # CYRILLIC SMALL LETTER BARRED O
# Ө <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
п <> p ; # CYRILLIC SMALL LETTER PE
П <> P ; # CYRILLIC CAPITAL LETTER PE
# ҧ <> XXX ; # CYRILLIC SMALL LETTER PE WITH MIDDLE HOOK
# Ҧ <> XXX ; # CYRILLIC CAPITAL LETTER PE WITH MIDDLE HOOK
# ҁ <> XXX ; # CYRILLIC SMALL LETTER KOPPA
# Ҁ <> XXX ; # CYRILLIC CAPITAL LETTER KOPPA
р <> r ; # CYRILLIC SMALL LETTER ER
Р <> R ; # CYRILLIC CAPITAL LETTER ER
# ҏ <> XXX ; # CYRILLIC SMALL LETTER ER WITH TICK
# Ҏ <> XXX ; # CYRILLIC CAPITAL LETTER ER WITH TICK
с <> s ; # CYRILLIC SMALL LETTER ES
С <> S ; # CYRILLIC CAPITAL LETTER ES
# ҫ <> XXX ; # CYRILLIC SMALL LETTER ES WITH DESCENDER
# Ҫ <> XXX ; # CYRILLIC CAPITAL LETTER ES WITH DESCENDER
т <> t ; # CYRILLIC SMALL LETTER TE
Т <> T ; # CYRILLIC CAPITAL LETTER TE
# ҭ <> XXX ; # CYRILLIC SMALL LETTER TE WITH DESCENDER
# Ҭ <> XXX ; # CYRILLIC CAPITAL LETTER TE WITH DESCENDER
?? <> u ; # CYRILLIC SMALL LETTER U
?? <> U ; # CYRILLIC CAPITAL LETTER U
# ?? <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U
# ?? <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
# ?? <> XXX ; # CYRILLIC SMALL LETTER UK
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER UK
?? <> f ; # CYRILLIC SMALL LETTER EF
?? <> F ; # CYRILLIC CAPITAL LETTER EF
?? <> h ; # CYRILLIC SMALL LETTER HA
?? <> H; # CYRILLIC CAPITAL LETTER HA
# ?? <> XXX ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
# ?? <> XXX ; # CYRILLIC SMALL LETTER SHHA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER SHHA
# ?? <> XXX ; # CYRILLIC SMALL LETTER OMEGA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA
# ?? <> XXX ; # CYRILLIC SMALL LETTER OT
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER OT
# ?? <> XXX ; # CYRILLIC SMALL LETTER OMEGA WITH TITLO
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA WITH TITLO
# ?? <> XXX ; # CYRILLIC SMALL LETTER ROUND OMEGA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ROUND OMEGA
?? <> c ; # CYRILLIC SMALL LETTER TSE
?? <> C; # CYRILLIC CAPITAL LETTER TSE
# ?? <> XXX ; # CYRILLIC SMALL LIGATURE TE TSE
# ?? <> XXX ; # CYRILLIC CAPITAL LIGATURE TE TSE
у <> u ; # CYRILLIC SMALL LETTER U
У <> U ; # CYRILLIC CAPITAL LETTER U
# ү <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U
# Ү <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U
# ұ <> XXX ; # CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
# Ұ <> XXX ; # CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
# ѹ <> XXX ; # CYRILLIC SMALL LETTER UK
# Ѹ <> XXX ; # CYRILLIC CAPITAL LETTER UK
ф <> f ; # CYRILLIC SMALL LETTER EF
Ф <> F ; # CYRILLIC CAPITAL LETTER EF
х <> h ; # CYRILLIC SMALL LETTER HA
Х <> H; # CYRILLIC CAPITAL LETTER HA
# ҳ <> XXX ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
# Ҳ <> XXX ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
# һ <> XXX ; # CYRILLIC SMALL LETTER SHHA
# Һ <> XXX ; # CYRILLIC CAPITAL LETTER SHHA
# ѡ <> XXX ; # CYRILLIC SMALL LETTER OMEGA
# Ѡ <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA
# ѿ <> XXX ; # CYRILLIC SMALL LETTER OT
# Ѿ <> XXX ; # CYRILLIC CAPITAL LETTER OT
# ѽ <> XXX ; # CYRILLIC SMALL LETTER OMEGA WITH TITLO
# Ѽ <> XXX ; # CYRILLIC CAPITAL LETTER OMEGA WITH TITLO
# ѻ <> XXX ; # CYRILLIC SMALL LETTER ROUND OMEGA
# Ѻ <> XXX ; # CYRILLIC CAPITAL LETTER ROUND OMEGA
ц <> c ; # CYRILLIC SMALL LETTER TSE
Ц <> C; # CYRILLIC CAPITAL LETTER TSE
# ҵ <> XXX ; # CYRILLIC SMALL LIGATURE TE TSE
# Ҵ <> XXX ; # CYRILLIC CAPITAL LIGATURE TE TSE
# ?? <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE
# ?? <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER
# ҽ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE
# Ҽ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE
# ҿ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN CHE WITH DESCENDER
# Ҿ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN CHE WITH DESCENDER
?? <> $modprime2 $under ; # CYRILLIC CAPITAL LETTER HARD SIGN
?? <> $modprime2 ; # CYRILLIC SMALL LETTER HARD SIGN
?? <> $modprime $under ; # CYRILLIC CAPITAL LETTER SOFT SIGN
?? <> $modprime ; # CYRILLIC SMALL LETTER SOFT SIGN
Ъ <> $modprime2 $under ; # CYRILLIC CAPITAL LETTER HARD SIGN
ъ <> $modprime2 ; # CYRILLIC SMALL LETTER HARD SIGN
Ь <> $modprime $under ; # CYRILLIC CAPITAL LETTER SOFT SIGN
ь <> $modprime ; # CYRILLIC SMALL LETTER SOFT SIGN
?? <> y ; # CYRILLIC SMALL LETTER YERU
?? <> Y ; # CYRILLIC CAPITAL LETTER YERU
ы <> y ; # CYRILLIC SMALL LETTER YERU
Ы <> Y ; # CYRILLIC CAPITAL LETTER YERU
# ?? <> XXX ; # CYRILLIC SMALL LETTER SEMISOFT SIGN
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER SEMISOFT SIGN
# ?? <> XXX ; # CYRILLIC SMALL LETTER YAT
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER YAT
# ҍ <> XXX ; # CYRILLIC SMALL LETTER SEMISOFT SIGN
# Ҍ <> XXX ; # CYRILLIC CAPITAL LETTER SEMISOFT SIGN
# ѣ <> XXX ; # CYRILLIC SMALL LETTER YAT
# Ѣ <> XXX ; # CYRILLIC CAPITAL LETTER YAT
# ?? <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED E
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED E
# ?? <> XXX ; # CYRILLIC SMALL LETTER LITTLE YUS
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER LITTLE YUS
# ?? <> XXX ; # CYRILLIC SMALL LETTER BIG YUS
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER BIG YUS
# ?? <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED LITTLE YUS
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED LITTLE YUS
# ?? <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED BIG YUS
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED BIG YUS
# ?? <> XXX ; # CYRILLIC SMALL LETTER KSI
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER KSI
# ?? <> XXX ; # CYRILLIC SMALL LETTER PSI
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER PSI
# ?? <> XXX ; # CYRILLIC SMALL LETTER FITA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER FITA
# ?? <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA
# ?? <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN HA
# ?? <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN HA
# ?? <> XXX ; # CYRILLIC LETTER PALOCHKA
### ???? <> XXX ; # CYRILLIC SMALL LETTER A
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER A
### ???? <> XXX ; # CYRILLIC SMALL LETTER A
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER A
### ???? <> XXX ; # CYRILLIC SMALL LETTER SCHWA
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER SCHWA
### ???? <> XXX ; # CYRILLIC SMALL LETTER GHE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER GHE
### ???? <> XXX ; # CYRILLIC SMALL LETTER IE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ???? <> XXX ; # CYRILLIC SMALL LETTER IE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ???? <> XXX ; # CYRILLIC SMALL LETTER IE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ???? <> XXX ; # CYRILLIC SMALL LETTER ZHE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
### ???? <> XXX ; # CYRILLIC SMALL LETTER ZHE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
### ???? <> XXX ; # CYRILLIC SMALL LETTER ZE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER ZE
### ???? <> XXX ; # CYRILLIC SMALL LETTER I
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER I
### ???? <> XXX ; # CYRILLIC SMALL LETTER I
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER I
### ???? <> XXX ; # CYRILLIC SMALL LETTER I
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER I
### ???? <> XXX ; # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
### ???? <> XXX ; # CYRILLIC SMALL LETTER O
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER O
### ???? <> XXX ; # CYRILLIC SMALL LETTER BARRED O
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
### ???? <> XXX ; # CYRILLIC SMALL LETTER KA
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER KA
### ???? <> XXX ; # CYRILLIC SMALL LETTER U
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER U
### ???? <> XXX ; # CYRILLIC SMALL LETTER U
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER U
### ???? <> XXX ; # CYRILLIC SMALL LETTER U
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER U
### ???? <> XXX ; # CYRILLIC SMALL LETTER U
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER U
### ???? <> XXX ; # CYRILLIC SMALL LETTER CHE
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER CHE
### ???? <> XXX ; # CYRILLIC SMALL LETTER YERU
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER YERU
### ???? <> XXX ; # CYRILLIC SMALL LETTER E
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER E
### ???? <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
### ???? <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA
# ѥ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED E
# Ѥ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED E
# ѧ <> XXX ; # CYRILLIC SMALL LETTER LITTLE YUS
# Ѧ <> XXX ; # CYRILLIC CAPITAL LETTER LITTLE YUS
# ѫ <> XXX ; # CYRILLIC SMALL LETTER BIG YUS
# Ѫ <> XXX ; # CYRILLIC CAPITAL LETTER BIG YUS
# ѩ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED LITTLE YUS
# Ѩ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED LITTLE YUS
# ѭ <> XXX ; # CYRILLIC SMALL LETTER IOTIFIED BIG YUS
# Ѭ <> XXX ; # CYRILLIC CAPITAL LETTER IOTIFIED BIG YUS
# ѯ <> XXX ; # CYRILLIC SMALL LETTER KSI
# Ѯ <> XXX ; # CYRILLIC CAPITAL LETTER KSI
# ѱ <> XXX ; # CYRILLIC SMALL LETTER PSI
# Ѱ <> XXX ; # CYRILLIC CAPITAL LETTER PSI
# ѳ <> XXX ; # CYRILLIC SMALL LETTER FITA
# Ѳ <> XXX ; # CYRILLIC CAPITAL LETTER FITA
# ѵ <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
# Ѵ <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA
# ҩ <> XXX ; # CYRILLIC SMALL LETTER ABKHASIAN HA
# Ҩ <> XXX ; # CYRILLIC CAPITAL LETTER ABKHASIAN HA
# Ӏ <> XXX ; # CYRILLIC LETTER PALOCHKA
### ӑ <> XXX ; # CYRILLIC SMALL LETTER A
### Ӑ <> XXX ; # CYRILLIC CAPITAL LETTER A
### ӓ <> XXX ; # CYRILLIC SMALL LETTER A
### Ӓ <> XXX ; # CYRILLIC CAPITAL LETTER A
### ӛ <> XXX ; # CYRILLIC SMALL LETTER SCHWA
### Ӛ <> XXX ; # CYRILLIC CAPITAL LETTER SCHWA
### ѓ <> XXX ; # CYRILLIC SMALL LETTER GHE
### Ѓ <> XXX ; # CYRILLIC CAPITAL LETTER GHE
### ѐ <> XXX ; # CYRILLIC SMALL LETTER IE
### Ѐ <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ё <> XXX ; # CYRILLIC SMALL LETTER IE
### Ё <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ӗ <> XXX ; # CYRILLIC SMALL LETTER IE
### Ӗ <> XXX ; # CYRILLIC CAPITAL LETTER IE
### ӂ <> XXX ; # CYRILLIC SMALL LETTER ZHE
### Ӂ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
### ӝ <> XXX ; # CYRILLIC SMALL LETTER ZHE
### Ӝ <> XXX ; # CYRILLIC CAPITAL LETTER ZHE
### ӟ <> XXX ; # CYRILLIC SMALL LETTER ZE
### Ӟ <> XXX ; # CYRILLIC CAPITAL LETTER ZE
### ѝ <> XXX ; # CYRILLIC SMALL LETTER I
### Ѝ <> XXX ; # CYRILLIC CAPITAL LETTER I
### ӣ <> XXX ; # CYRILLIC SMALL LETTER I
### Ӣ <> XXX ; # CYRILLIC CAPITAL LETTER I
### ӥ <> XXX ; # CYRILLIC SMALL LETTER I
### Ӥ <> XXX ; # CYRILLIC CAPITAL LETTER I
### ї <> XXX ; # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
### Ї <> XXX ; # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
### ӧ <> XXX ; # CYRILLIC SMALL LETTER O
### Ӧ <> XXX ; # CYRILLIC CAPITAL LETTER O
### ӫ <> XXX ; # CYRILLIC SMALL LETTER BARRED O
### Ӫ <> XXX ; # CYRILLIC CAPITAL LETTER BARRED O
### ќ <> XXX ; # CYRILLIC SMALL LETTER KA
### Ќ <> XXX ; # CYRILLIC CAPITAL LETTER KA
### ӯ <> XXX ; # CYRILLIC SMALL LETTER U
### Ӯ <> XXX ; # CYRILLIC CAPITAL LETTER U
### ў <> XXX ; # CYRILLIC SMALL LETTER U
### Ў <> XXX ; # CYRILLIC CAPITAL LETTER U
### ӱ <> XXX ; # CYRILLIC SMALL LETTER U
### Ӱ <> XXX ; # CYRILLIC CAPITAL LETTER U
### ӳ <> XXX ; # CYRILLIC SMALL LETTER U
### Ӳ <> XXX ; # CYRILLIC CAPITAL LETTER U
### ӵ <> XXX ; # CYRILLIC SMALL LETTER CHE
### Ӵ <> XXX ; # CYRILLIC CAPITAL LETTER CHE
### ӹ <> XXX ; # CYRILLIC SMALL LETTER YERU
### Ӹ <> XXX ; # CYRILLIC CAPITAL LETTER YERU
### ӭ <> XXX ; # CYRILLIC SMALL LETTER E
### Ӭ <> XXX ; # CYRILLIC CAPITAL LETTER E
### ѷ <> XXX ; # CYRILLIC SMALL LETTER IZHITSA
### Ѷ <> XXX ; # CYRILLIC CAPITAL LETTER IZHITSA
# Completeness
$ignore = [[:Mark:]''] * ;

View File

@ -1,11 +1,7 @@
???#--------------------------------------------------------------------
#--------------------------------------------------------------------
# Copyright (c) 1999-2004, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# $Source: /xsrl/Nsvn/icu/icu4j/src/com/ibm/icu/impl/data/Attic/Transliterator_Greek_Latin.txt,v $
# $Date: 2004/05/21 01:01:51 $
# $Revision: 1.23 $
#--------------------------------------------------------------------
# Rules are predicated on running NFD first, and NFC afterwards
# :: [\u0000-\u007F \u0370-\u03FF [:Greek:] [:nonspacing mark:]] ;
@ -16,13 +12,13 @@
# TEST CASES
# ????????????? ??????????????? ????????????? ??????????????? ?????????????????????? ??? ????????????????
# ??? ??? ??? ??? ??? ???
# ??? ??? ??? ??? ???
# ????? ????? ????? ?????
# ????? ????? ????? ?????
# ????? ????? ????? ?????
# ???, ???, ???, ???, ???, ???
# Ὀλίγοι ἔμφονες πολλῶν ἀφρόνων φοβερώτεροι — Πλάτωνος
# ᾂ ᾒ ᾢ ᾃ ᾓ ᾣ
# ᾳ ῃ ῳ ὃ ὄ
# ὠς ὡς ὢς ὣς
# Ὠς Ὡς Ὢς Ὣς
# ὨΣ ὩΣ ὪΣ ὫΣ
# Ạ, ạ, Ẹ, ẹ, Ọ, ọ
# Useful variables
@ -39,8 +35,8 @@ $macron = \u0304 ;
$ddot = \u0308 ;
$ddotmac = [$ddot$macron];
$lcgvowel = [??????????????] ;
$ucgvowel = [??????????????] ;
$lcgvowel = [αεηιουω] ;
$ucgvowel = [ΑΕΗΙΟΥΩ] ;
$gvowel = [$lcgvowel $ucgvowel] ;
$lcgvowelC = [$lcgvowel $accent] ;
@ -48,11 +44,11 @@ $evowel = [aeiouyAEIOUY];
$evowel2 = [iuyIUY];
$vowel = [ $evowel $gvowel] ;
$gammaLike = [??????????????????] ;
$gammaLike = [ΓΚΞΧγκξχϰ] ;
$egammaLike = [GKXCgkxc] ;
$smooth = ?? ;
$rough = ?? ;
$iotasub = ?? ;
$smooth = ̓ ;
$rough = ̔ ;
$iotasub = ͅ ;
$evowel_i = [$evowel-[iI]] ;
$evowel2_i = [uyUY];
@ -64,7 +60,7 @@ $beforeLetter = [[:M:]\']* [:L:] ;
$beforeLower = $accent * $lower ;
$notLetter = [^[:L:][:M:]] ;
$under = ??;
$under = ̱;
# Fix punctuation
# preserve original
@ -72,7 +68,7 @@ $under = ??;
\? <> \? $under ;
\; <> \? ;
?? <> \: ;
· <> \: ;
# CIRCUMFLEX: convert greek circumflex to normal one. Could use tilde or inverted breve
@ -83,8 +79,8 @@ $under = ??;
$accent_minus = [[$accent]-[$iotasub$macron]];
?? } $accent_minus * $iotasub > | ?? $macron ;
?? } $accent_minus * $iotasub > | ?? $macron ;
Α } $accent_minus * $iotasub > | Α $macron ;
α } $accent_minus * $iotasub > | α $macron ;
# now convert to uppercase if after uppercase, ow to lowercase
@ -100,23 +96,23 @@ $iotasub > i ;
# Make A ` x = > H a x
?? ($macron?) $rough } $beforeLower > H | ?? $1;
?? $rough } $beforeLower > H | ??;
?? $rough } $beforeLower > H | ?? ;
?? ($ddot?) $rough } $beforeLower > H | ?? $1;
?? $rough } $beforeLower > H | ?? ;
?? $rough } $beforeLower > H | ?? ;
?? ($ddot?) $rough } $beforeLower > H | ?? $1;
Α ($macron?) $rough } $beforeLower > H | α $1;
Ε $rough } $beforeLower > H | ε;
Η $rough } $beforeLower > H | η ;
Ι ($ddot?) $rough } $beforeLower > H | ι $1;
Ο $rough } $beforeLower > H | ο ;
Υ $rough } $beforeLower > H | υ ;
Ω ($ddot?) $rough } $beforeLower > H | ω $1;
# Make A x ` = > H a x
?? ($glower $macron?) $rough > H | ?? $1 ;
?? ($glower) $rough > H | ?? $1 ;
?? ($glower) $rough > H | ?? $1 ;
?? ($glower $ddot?) $rough > H | ?? $1 ;
?? ($glower) $rough > H | ?? $1 ;
?? ($glower) $rough > H | ?? $1 ;
?? ($glower $ddot?) $rough > H | ?? $1 ;
Α ($glower $macron?) $rough > H | α $1 ;
Ε ($glower) $rough > H | ε $1 ;
Η ($glower) $rough > H | η $1 ;
Ι ($glower $ddot?) $rough > H | ι $1 ;
Ο ($glower) $rough > H | ο $1 ;
Υ ($glower) $rough > H | υ $1 ;
Ω ($glower $ddot?) $rough > H | ω $1 ;
#Otherwise, make x ` into h x and X ` into H X
@ -176,120 +172,120 @@ $smooth > ;
# remove now superfluous macron when returning
?? < A $macron ;
?? < a $macron ;
Α < A $macron ;
α < a $macron ;
?? <> e $macron ;
?? <> E $macron ;
η <> e $macron ;
Η <> E $macron ;
?? <> ph ;
?? } $beforeLower <> Ps ;
?? <> PS ;
φ <> ph ;
Ψ } $beforeLower <> Ps ;
Ψ <> PS ;
?? } $beforeLower <> Ph ;
?? <> PH ;
?? <> ps ;
Φ } $beforeLower <> Ph ;
Φ <> PH ;
ψ <> ps ;
?? <> o $macron ;
?? <> O $macron;
ω <> o $macron ;
Ω <> O $macron;
# NORMAL
?? <> a ;
?? <> A ;
α <> a ;
Α <> A ;
?? <> b ;
?? <> B ;
β <> b ;
Β <> B ;
?? } $gammaLike <> n } $egammaLike ;
?? <> g ;
?? } $gammaLike <> N } $egammaLike ;
?? <> G ;
γ } $gammaLike <> n } $egammaLike ;
γ <> g ;
Γ } $gammaLike <> N } $egammaLike ;
Γ <> G ;
?? <> d ;
?? <> D ;
δ <> d ;
Δ <> D ;
?? <> e ;
?? <> E ;
ε <> e ;
Ε <> E ;
?? <> z ;
?? <> Z ;
ζ <> z ;
Ζ <> Z ;
?? <> th ;
?? } $beforeLower <> Th ;
?? <> TH ;
θ <> th ;
Θ } $beforeLower <> Th ;
Θ <> TH ;
?? <> i ;
?? <> I ;
ι <> i ;
Ι <> I ;
?? <> k ;
?? <> K ;
κ <> k ;
Κ <> K ;
?? <> l ;
?? <> L ;
λ <> l ;
Λ <> L ;
?? <> m ;
?? <> M ;
μ <> m ;
Μ <> M ;
?? } $gammaLike > n\' ;
?? <> n ;
?? } $gammaLike <> N\' ;
?? <> N ;
ν } $gammaLike > n\' ;
ν <> n ;
Ν } $gammaLike <> N\' ;
Ν <> N ;
?? <> x ;
?? <> X ;
ξ <> x ;
Ξ <> X ;
?? <> o ;
?? <> O ;
ο <> o ;
Ο <> O ;
?? <> p ;
?? <> P ;
π <> p ;
Π <> P ;
?? $rough <> rh;
?? $rough } $beforeLower <> Rh ;
?? $rough <> RH ;
?? <> r ;
?? <> R ;
ρ $rough <> rh;
Ρ $rough } $beforeLower <> Rh ;
Ρ $rough <> RH ;
ρ <> r ;
Ρ <> R ;
# insert separator before things that turn into s
[Pp] { } [??????????????] > \' ;
[Pp] { } [ςσΣϷϸϺϻ] > \' ;
# special S variants
?? <> S?? ; # ?? GREEK CAPITAL LETTER SHO Uppercase_Letter Grek - L
?? <> s?? ; #?? GREEK SMALL LETTER SHO Lowercase_Letter Grek - L
?? <> S?? ; # ?? GREEK CAPITAL LETTER SAN Uppercase_Letter Grek - L
?? <> s?? ; # ?? GREEK SMALL LETTER SAN Lowercase_Letter Grek - L
Ϸ <> Š ; # Ϸ GREEK CAPITAL LETTER SHO Uppercase_Letter Grek - L
ϸ <> š ; #ϸ GREEK SMALL LETTER SHO Lowercase_Letter Grek - L
Ϻ <> Ŝ ; # Ϻ GREEK CAPITAL LETTER SAN Uppercase_Letter Grek - L
ϻ <> ŝ ; # ϻ GREEK SMALL LETTER SAN Lowercase_Letter Grek - L
# underbar means exception
# before a letter, initial
?? } $beforeLetter <> s $underbar } $beforeLetter;
?? } $beforeLetter <> s } $beforeLetter;
ς } $beforeLetter <> s $underbar } $beforeLetter;
σ } $beforeLetter <> s } $beforeLetter;
# otherwise, after a letter = final
$afterLetter { ?? <> $afterLetter { s $underbar;
$afterLetter { ?? <> $afterLetter { s ;
$afterLetter { σ <> $afterLetter { s $underbar;
$afterLetter { ς <> $afterLetter { s ;
# otherwise (isolated) = initial
?? <> s $underbar;
?? <> s ;
ς <> s $underbar;
σ <> s ;
# [Pp] { ?? <> \'S ;
?? <> S ;
# [Pp] { Σ <> \'S ;
Σ <> S ;
?? <> t ;
?? <> T ;
τ <> t ;
Τ <> T ;
$vowel {?? } <> u ;
?? <> y ;
$vowel { ?? <> U ;
?? <> Y ;
$vowel {υ } <> u ;
υ <> y ;
$vowel { Υ <> U ;
Υ <> Y ;
?? <> ch ;
?? } $beforeLower <> Ch ;
?? <> CH ;
χ <> ch ;
Χ } $beforeLower <> Ch ;
Χ <> CH ;
# Completeness for ASCII
@ -319,28 +315,28 @@ $rough <> h ;
# Completeness for Greek
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
ϐ > | β ;
ϑ > | θ ;
ϒ > | Υ ;
ϕ > | φ ;
ϖ > | π ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ??; #U+03F9 GREEK CAPITAL LUNATE SIGMA SYMBOL
?? > j ;
?? > | ?? ;
?? > | ?? ;
ϰ > | κ ;
ϱ > | ρ ;
ϲ > | σ ;
Ϲ > | Σ; #U+03F9 GREEK CAPITAL LUNATE SIGMA SYMBOL
ϳ > j ;
ϴ > | Θ ;
ϵ > | ε ;
?? > | ?? ;
µ > | μ ;
?? > i;
ͺ > i;
# delete any trailing ' marks used for roundtripping
< [????] { \' } [Ss] ;
< [????] { \' } $egammaLike ;
< [Ππ] { \' } [Ss] ;
< [Νν] { \' } $egammaLike ;
::NFC (NFD) ;
# ([\u0000-\u007F [:Latin:] [:Greek:] [:nonspacing mark:]]) ;

View File

@ -1,17 +1,13 @@
???#--------------------------------------------------------------------
#--------------------------------------------------------------------
# Copyright (c) 1999-2004, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# $Source: /xsrl/Nsvn/icu/icu4j/src/com/ibm/icu/impl/data/Attic/Transliterator_Greek_Latin_UNGEGN.txt,v $
# $Date: 2004/05/21 01:01:50 $
# $Revision: 1.4 $
#--------------------------------------------------------------------
# For modern Greek, based on UNGEGN rules.
# Rules are predicated on running NFD first, and NFC afterwards
# MINIMAL FILTER GENERATED FOR: Greek-Latin/UNGEGN
# WARNING: need to add accents to both filters ###
# :: [????????;??????????????????????????????????????????????-????-????-????-????-????-????-????-????????-??????-??????????-??????-????-????-????-?????????????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-??????-???????????????-??????-??????-?????????-??????-??????-??????-?????????-??????-??????-??????\u03F7-\u07FB\u03F9] ;
# :: [́̄̆̈;µ·ÀÂÈÊÌÎÒÔÙÛàâèêìîòôùûĈ-ĉĜ-ĝĤ-ĥĴ-ĵŜ-ŝŴ-ŷǛ-ǜǸ-ǹ̀̂̓-̔̀͂-̓ͅͺ;Ά-ΊΌΎ-ΡΣ-ώϐ-ϖϰ-ϵЀЍѐѝḔ-ḕṐ-ṑẀ-ẁẐ-ẑẤ-ậẰ-ằẾ-ệỐ-ộỜ-ờỪ-ừỲ-ỳἀ-ἕἘ-Ἕἠ-ὅὈ-Ὅὐ-ὗὙὛὝὟ-ώᾀ-ᾴᾶ-ᾼι῁-ῄῆ-῍῏-ΐῖ-Ί῝῟-῭ῲ-ῴῶ-ῼΩ\u03F7-\u07FB\u03F9] ;
:: [[[:Greek:][:Mn:][:Me:]] [\:-;?\u00B7\u037E\u0387]] ;
::NFD (NFC) ;
@ -22,11 +18,11 @@ $lower = [[:latin:][:greek:] & [:Ll:]] ;
$upper = [[:latin:][:greek:] & [:Lu:]] ;
$accent = [[:Mn:][:Me:]] ;
$macron = ?? ;
$ddot = ?? ;
$macron = ̄ ;
$ddot = ̈ ;
$lcgvowel = [??????????????] ;
$ucgvowel = [??????????????] ;
$lcgvowel = [αεηιουω] ;
$ucgvowel = [ΑΕΗΙΟΥΩ] ;
$gvowel = [$lcgvowel $ucgvowel] ;
$lcgvowelC = [$lcgvowel $accent] ;
@ -35,17 +31,17 @@ $vowel = [ $evowel $gvowel] ;
$beforeLower = $accent * $lower ;
$gammaLike = [??????????????????] ;
$gammaLike = [ΓΚΞΧγκξχϰ] ;
$egammaLike = [GKXCgkxc] ;
$smooth = ?? ;
$rough = ?? ;
$iotasub = ?? ;
$smooth = ̓ ;
$rough = ̔ ;
$iotasub = ͅ ;
$softener = [????????????????????????????????$gvowel] ;
$softener = [βΒγΓδΔζΖλΛμΜνΝρΡ$gvowel] ;
$under = ??;
$under = ̱;
$caron = ??;
$caron = ̌;
$afterLetter = [:L:] [\'$accent]* ;
$beforeLetter = [\'$accent]* [:L:] ;
@ -57,154 +53,154 @@ $beforeLetter = [\'$accent]* [:L:] ;
\? <> \? $under ;
\; <> \? ;
?? <> \: ;
· <> \: ;
# Fix any ancient characters that creep in
?? > ?? ;
?? > ?? ;
?? > ?? ;
͂ > ́ ;
̂ > ́ ;
̀ > ́ ;
$smooth > ;
$rough > ;
$iotasub > ;
?? > ;
ͺ > ;
# need to have these up here so the rules don't mask
?? <> i $under ;
?? <> I $under ;
η <> i $under ;
Η <> I $under ;
?? } $beforeLower <> Ps ;
?? <> PS ;
?? <> ps ;
Ψ } $beforeLower <> Ps ;
Ψ <> PS ;
ψ <> ps ;
?? <> o $under ;
?? <> O $under;
ω <> o $under ;
Ω <> O $under;
# at begining or end of word, convert mp to b
[^[:L:]$accent] { ???? > b ;
???? } [^[:L:]$accent] > b ;
[^[:L:]$accent] { [????][????] > B ;
[????][????] } [^[:L:]$accent] > B ;
[^[:L:]$accent] { μπ > b ;
μπ } [^[:L:]$accent] > b ;
[^[:L:]$accent] { [Μμ][Ππ] > B ;
[Μμ][Ππ] } [^[:L:]$accent] > B ;
???? < b ;
???? < B } $beforeLower ;
???? < B ;
μπ < b ;
Μπ < B } $beforeLower ;
ΜΠ < B ;
# handle diphthongs ending with upsilon
???? <> ou ;
???? <> OU ;
???? <> Ou ;
???? <> oU ;
ου <> ou ;
ΟΥ <> OU ;
Ου <> Ou ;
οΥ <> oU ;
$fmaker = [aeiAEI] $under ? ;
$shiftForwardVowels = [[:Mn:]-[\u0308]]; # note: a diaeresis keeps the items separate
$fmaker { ?? ( $shiftForwardVowels )* } $softener > $1 v $under ;
?? $1 < ( $shiftForwardVowels )* v $under ;
$fmaker { υ ( $shiftForwardVowels )* } $softener > $1 v $under ;
υ $1 < ( $shiftForwardVowels )* v $under ;
$fmaker { ?? ( $shiftForwardVowels )* } > $1 f $under;
?? $1 < ( $shiftForwardVowels )* f $under ;
$fmaker { υ ( $shiftForwardVowels )* } > $1 f $under;
υ $1 < ( $shiftForwardVowels )* f $under ;
$fmaker { ?? } $softener <> V $under ;
$fmaker { ?? <> U $under ;
$fmaker { Υ } $softener <> V $under ;
$fmaker { Υ <> U $under ;
?? <> y ;
?? <> Y ;
υ <> y ;
Υ <> Y ;
# NORMAL
?? <> a ;
?? <> A ;
α <> a ;
Α <> A ;
?? <> v ;
?? <> V ;
β <> v ;
Β <> V ;
?? } $gammaLike <> n } $egammaLike ;
?? <> g ;
?? } $gammaLike <> N } $egammaLike ;
?? <> G ;
γ } $gammaLike <> n } $egammaLike ;
γ <> g ;
Γ } $gammaLike <> N } $egammaLike ;
Γ <> G ;
?? <> d ;
?? <> D ;
δ <> d ;
Δ <> D ;
?? <> e ;
?? <> E ;
ε <> e ;
Ε <> E ;
?? <> z ;
?? <> Z ;
ζ <> z ;
Ζ <> Z ;
?? <> th ;
?? } $beforeLower <> Th ;
?? <> TH ;
θ <> th ;
Θ } $beforeLower <> Th ;
Θ <> TH ;
?? <> i ;
?? <> I ;
ι <> i ;
Ι <> I ;
?? <> k ;
?? <> K ;
κ <> k ;
Κ <> K ;
?? <> l ;
?? <> L ;
λ <> l ;
Λ <> L ;
?? <> m ;
?? <> M ;
μ <> m ;
Μ <> M ;
?? } $gammaLike > n\' ;
?? <> n ;
?? } $gammaLike <> N\' ;
?? <> N ;
ν } $gammaLike > n\' ;
ν <> n ;
Ν } $gammaLike <> N\' ;
Ν <> N ;
?? <> x ;
?? <> X ;
ξ <> x ;
Ξ <> X ;
?? <> o ;
?? <> O ;
ο <> o ;
Ο <> O ;
?? <> p ;
?? <> P ;
π <> p ;
Π <> P ;
?? <> r ;
?? <> R ;
ρ <> r ;
Ρ <> R ;
# insert separator before things that turn into s
[Pp] { } [??????????????] > \' ;
[Pp] { } [ςσΣϷϸϺϻ] > \' ;
# special S variants
?? <> S?? ; # ?? GREEK CAPITAL LETTER SHO Uppercase_Letter Grek - L
?? <> s?? ; #?? GREEK SMALL LETTER SHO Lowercase_Letter Grek - L
?? <> S?? ; # ?? GREEK CAPITAL LETTER SAN Uppercase_Letter Grek - L
?? <> s?? ; # ?? GREEK SMALL LETTER SAN Lowercase_Letter Grek - L
Ϸ <> Š ; # Ϸ GREEK CAPITAL LETTER SHO Uppercase_Letter Grek - L
ϸ <> š ; #ϸ GREEK SMALL LETTER SHO Lowercase_Letter Grek - L
Ϻ <> Ŝ ; # Ϻ GREEK CAPITAL LETTER SAN Uppercase_Letter Grek - L
ϻ <> ŝ ; # ϻ GREEK SMALL LETTER SAN Lowercase_Letter Grek - L
# Caron means exception
# before a letter, initial
?? } $beforeLetter <> s $under } $beforeLetter;
?? } $beforeLetter <> s } $beforeLetter;
ς } $beforeLetter <> s $under } $beforeLetter;
σ } $beforeLetter <> s } $beforeLetter;
# otherwise, after a letter = final
$afterLetter { ?? <> $afterLetter { s $under;
$afterLetter { ?? <> $afterLetter { s ;
$afterLetter { σ <> $afterLetter { s $under;
$afterLetter { ς <> $afterLetter { s ;
# otherwise (isolated) = initial
?? <> s $under;
?? <> s ;
ς <> s $under;
σ <> s ;
# [Pp] { ?? <> \'S ;
?? <> S ;
# [Pp] { Σ <> \'S ;
Σ <> S ;
?? <> t ;
?? <> T ;
τ <> t ;
Τ <> T ;
?? <> f ;
?? <> F ;
φ <> f ;
Φ <> F ;
?? <> ch ;
?? } $beforeLower <> Ch ;
?? <> CH ;
χ <> ch ;
Χ } $beforeLower <> Ch ;
Χ <> CH ;
# Completeness for ASCII
@ -230,25 +226,25 @@ $afterLetter { ?? <> $afterLetter { s ;
# Completeness for Greek
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
ϐ > | β ;
ϑ > | θ ;
ϒ > | Υ ;
ϕ > | φ ;
ϖ > | π ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
?? > | ??; #U+03F9 GREEK CAPITAL LUNATE SIGMA SYMBOL
?? > j ;
?? > | ?? ;
?? > | ?? ;
?? > | ?? ;
ϰ > | κ ;
ϱ > | ρ ;
ϲ > | σ ;
Ϲ > | Σ; #U+03F9 GREEK CAPITAL LUNATE SIGMA SYMBOL
ϳ > j ;
ϴ > | Θ ;
ϵ > | ε ;
µ > | μ ;
# delete any trailing ' marks used for roundtripping
< [????] { \' } [Ss] ;
< [????] { \' } $egammaLike ;
< [Ππ] { \' } [Ss] ;
< [Νν] { \' } $egammaLike ;
::NFC (NFD) ;

View File

@ -1,11 +1,7 @@
???#--------------------------------------------------------------------
#--------------------------------------------------------------------
# Copyright (c) 1999-2004, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# $Source: /xsrl/Nsvn/icu/icu4j/src/com/ibm/icu/impl/data/Attic/Transliterator_Hebrew_Latin.txt,v $
# $Date: 2004/05/21 01:01:51 $
# $Revision: 1.6 $
#--------------------------------------------------------------------
# Transliteration table for Hebrew
# Based on the UNGEGN table at:
@ -27,74 +23,74 @@
# For more information, see"
# http://oss.software.ibm.com/icu/userguide/Transliteration.html
:: [[:Hebrew:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2\u2135-\u2138??\u05BF] - [\u05BD]] ;
:: [[:Hebrew:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2\u2135-\u2138̄\u05BF] - [\u05BD]] ;
:: nfkd (nfc) ;
$letterAfter = [:M:]* [:L:] ;
# move longer items here to avoid masking
?? <> h?? ;
?? <> z?? } $letterAfter;
?? <> z?? ;
?? <> s?? ;
?? <> t?? ;
ח <> ẖ ;
צ <> ẕ } $letterAfter;
ץ <> ẕ ;
ש <> ş ;
ת <> ţ ;
?? <> ?? ;
?? <> b ;
?? <> g ;
?? <> d ;
?? <> h ;
?? <> w ;
?? <> z ;
?? <> t ;
?? <> y ;
?? <> k } $letterAfter;
?? <> k ;
?? <> l ;
?? <> m } $letterAfter;
?? <> m ;
?? <> n } $letterAfter;
?? <> n ;
?? <> s ;
?? <> ?? ;
?? <> p } $letterAfter;
?? <> p ;
?? <> q ;
?? <> r ;
א <> ʼ ;
ב <> b ;
ג <> g ;
ד <> d ;
ה <> h ;
ו <> w ;
ז <> z ;
ט <> t ;
י <> y ;
כ <> k } $letterAfter;
ך <> k ;
ל <> l ;
מ <> m } $letterAfter;
ם <> m ;
נ <> n } $letterAfter;
ן <> n ;
ס <> s ;
ע <> ʻ ;
פ <> p } $letterAfter;
ף <> p ;
ק <> q ;
ר <> r ;
?? > | ????; # HEBREW LIGATURE YIDDISH DOUBLE VAV
?? > | ????; # HEBREW LIGATURE YIDDISH VAV YOD
?? > | ???? ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
װ > | וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
ױ > | וי; # HEBREW LIGATURE YIDDISH VAV YOD
ײ > | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
?? <> ?? ; # dagesh just goes to overdot for now
?? <> ?? ; # shin dot -> sh
?? <> ?? ; # sin dot -> s
ּ <> ̇ ; # dagesh just goes to overdot for now
ׁ <> ̌ ; # shin dot -> sh
ׂ <> ̂ ; # sin dot -> s
# points
?? <> a?? ;
?? <> a?? ;
?? <> e?? ;
?? <> e?? ;
?? <> e?? ;
?? <> i ;
?? <> o?? ;
?? <> u ;
ֲ <> à ;
ָ <> á ;
ֱ <> è ;
ֵ <> é ;
ְ <> ê ;
ִ <> i ;
ֹ <> ò ;
ֻ <> u ;
?? <> a ;
?? <> e ;
?? <> o ;
ַ <> a ;
ֶ <> e ;
ֳ <> o ;
\u05BF <> ?? ;
\u05BF <> ̄ ;
# fallbacks
?? < c ;
?? < f } $letterAfter;
?? < f ;
?? < j ;
?? < v ;
???? < x ;
ק < c ;
פ < f } $letterAfter;
ף < f ;
ז < j ;
ו < v ;
כס < x ;
:: (lower);
:: nfc (nfd) ;
:: ([[:Latin:] [\u02BB-\u02BC\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341 ?? ]]);
:: ([[:Latin:] [\u02BB-\u02BC\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341 ̄ ]]);