ICU-1231 Retire old files

X-SVN-Rev: 5918
This commit is contained in:
Mark Davis 2001-09-25 21:52:09 +00:00
parent c04ff458c1
commit f0547560a6
7 changed files with 0 additions and 2137 deletions

6
.gitattributes vendored
View File

@ -105,16 +105,10 @@ icu4j/src/com/ibm/text/resources/Transliterator_Kanji_English.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Kanji_OnRomaji.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Kanji_OnRomaji.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Kannada_InterIndic.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Kannada_InterIndic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_KeyboardEscape_Latin1.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_KeyboardEscape_Latin1.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Arabic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Cyrillic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Devanagari.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Latin_Devanagari.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Greek.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Hebrew.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Jamo.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Latin_Jamo.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Latin_Kana.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Malayalam_InterIndic.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Malayalam_InterIndic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Oriya_InterIndic.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Oriya_InterIndic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_StraightQuotes_CurlyQuotes.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Tamil_InterIndic.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Tamil_InterIndic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_Telugu_InterIndic.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_Telugu_InterIndic.utf8.txt -text
icu4j/src/com/ibm/text/resources/Transliterator_UnicodeName_UnicodeChar.utf8.txt -text icu4j/src/com/ibm/text/resources/Transliterator_UnicodeName_UnicodeChar.utf8.txt -text

View File

@ -1,189 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 2001
#--------------------------------------------------------------------
# To Do: finish adding shadda, add sokoon
# [Is this done? Can someone finish this?]
### $alefmadda=آ;
### $alefuhamza=أ;
### $wauuhamza=ؤ;
### $alefhamza=إ;
### $yehuhamza=ئ;
### $alef=ا;
### $beh=ب;
### $tehmarbuta=ة;
### $teh=ت;
### $theh=ث;
### $geem=ج;
### $hah=ح;
### $kha=خ;
### $dal=د;
### $dhal=ذ;
### $reh=ر;
### $zain=ز;
### $seen=س;
### $sheen=ش;
### $sad=ص;
### $dad=ض;
### $tah=ط;
### $zah=ظ;
### $ein=ع;
### $ghein=غ;
### $feh=ف;
### $qaaf=ق;
### $kaf=ك;
### $lam=ل;
### $meem=م;
### $noon=ن;
### $heh=ه;
### $wau=و;
### $yehmaqsura=ى;
### $yeh=ي;
### $peh=ڤ;
### $hamza=ء;
### $fathatein=ً;
### $dammatein=ٌ;
### $kasratein=ٍ;
### $fatha=َ;
### $damma=ُ;
### $kasra=ِ;
### $shadda=ّ;
### $sokoon=ْ;
# Doubles - liu
t'' < {ت} [تثةط];
h'' < {ه} [هح];
s'' < {س} ش;
# A few pathological special cases to make round
# trip work. - liu
d'~'d <> د د;
dh'~'dh <> ذ ذ;
dd'~'dd <> ض ض;
# Shadda: Map x ّ to x x, where x is dh, dd, or
# d (that is, ذ, ض, or د). If x is d, d'd is
# output. Net effect is to map s.th. like ض ّ
# to dd'dd. - liu
ذ {dh} <> dh {ّ};
ض {dd} <> dd {ّ};
د {''d} [^dh] <> d {ّ}; # Avoid d'dd or d'dh
# [This should be removed, but it's good for demos]
Arabic> \
تتمتع' ' \
اللغة' ' \
العرببية' ' \
ببنظم' ' \
كتاببية' ' \
جميلة;
# Main rules
''ai<a{آ;
ai<>آ;
''ae<a{أ;
ae<>أ;
''ao<a{إ;
ao<>إ;
''aa<a{ا;
aa<>ا;
''an<a{ً;
an<>ً;
''a<a{َ;
a<>َ;
b<>ب;
''dh<d{ذ;
dh<>ذ;
''dd<d{ض;
dd<>ض;
''d<d{د;
d<>د;
''e<a{ع;
''e<w{ع;
''e<y{ع;
e<>ع;
f<>ف;
gh<>غ;
''hh<d{ح;
''hh<t{ح;
''hh<k{ح;
''hh<s{ح;
hh<>ح;
''h<d{ه;
''h<t{ه;
''h<k{ه;
''h<s{ه;
h<>ه;
''ii<i{ٍ;
ii<>ٍ;
''i<i{ِ;
i<>ِ;
j<>ج;
kh<>خ;
k<>ك;
l<>ل;
''m<y{م;
''m<t{م;
m<>م;
n<>ن;
''o<a{ء;
o<>ء;
p<>ڤ;
q<>ق;
r<>ر;
sh<>ش;
''ss<s{ص;
ss<>ص;
''s<s{س;
s<>س;
th<>ث;
tm<>ة;
''tt<t{ط;
tt<>ط;
''t<t{ت;
t<>ت;
''uu<u{ٌ;
uu<>ٌ;
''u<u{ُ;
u<>ُ;
we<>ؤ;
w<>و;
ye<>ئ;
ym<>ى;
''y<y{ي;
y<>ي;
''zz<z{ظ;
zz<>ظ;
''z<z{ز;
z<>ز;
# One-way Latin-Arabic compatibility rules
c>ك;
g>ج;
x>كّس;
v>ب;
# Digits
0<>٠; # Arabic digit 0
1<>١; # Arabic digit 1
2<>٢; # Arabic digit 2
3<>٣; # Arabic digit 3
4<>٤; # Arabic digit 4
5<>٥; # Arabic digit 5
6<>٦; # Arabic digit 6
7<>٧; # Arabic digit 7
8<>٨; # Arabic digit 8
9<>٩; # Arabic digit 9
'%'<>٪; # Arabic %
'.'<>٫; # Arabic decimal separator
','<>٬; # Arabic thousands separator
'*'<>٭; # Arabic five-pointed star
''>;
# eof

View File

@ -1,305 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 12:42:05 2001
#--------------------------------------------------------------------
# Latin-Cyrillic
# These rules provide general Latin-Cyrillic
# transliteration. The standard Russian transliterations
# are generally used for the letters from Russian,
# with additional Cyrillic characters given consistent
# mappings.
### $S_hacek=Š;
### $s_hacek=š;
### $YO=Ё;
### $J=Ј;
### $A=А;
### $B=Б;
### $V=В;
### $G=Г;
### $D=Д;
### $YE=Е;
### $ZH=Ж;
### $Z=З;
### $YI=И;
### $Y=Й;
### $K=К;
### $L=Л;
### $M=М;
### $N=Н;
### $O=О;
### $P=П;
### $R=Р;
### $S=С;
### $T=Т;
### $U=У;
### $F=Ф;
### $KH=Х;
### $TS=Ц;
### $CH=Ч;
### $SH=Ш;
### $SHCH=Щ;
### $HARD=Ъ;
### $I=Ы;
### $SOFT=Ь;
### $E=Э;
### $YU=Ю;
### $YA=Я;
# Lowercase
### $a=а;
### $b=б;
### $v=в;
### $g=г;
### $d=д;
### $ye=е;
### $zh=ж;
### $z=з;
### $yi=и;
### $y=й;
### $k=к;
### $l=л;
### $m=м;
### $n=н;
### $o=о;
### $p=п;
### $r=р;
### $s=с;
### $t=т;
### $u=у;
### $f=ф;
### $kh=х;
### $ts=ц;
### $ch=ч;
### $sh=ш;
### $shch=щ;
### $hard=ъ;
### $i=ы;
### $soft=ь;
### $e=э;
### $yu=ю;
### $ya=я;
### $yo=ё;
### $j=ј;
# variables
# some are duplicated so lowercasing works
$csoft=[eiyEIY];
$CSOFT=[eiyEIY];
$BECOMES_H=[Ъъ];
$becomes_h=[Ъъ];
$BECOMES_S=[Сс];
$becomes_s=[Сс];
$BECOMES_C=[Чч];
$becomes_c=[Чч];
$BECOMES_VOWEL=[АЭЫОУаэыоу];
$becomes_vowel=[АЭЫОУаэыоу];
$letter=[[:Lu:][:Ll:]];
$lower=[[:Ll:]];
# Modified to combine display transliterator and typing transliterator.
# The display mapping uses accents for the "soft" vowels.
# It does not, although it could, use characters like š instead of digraphs
# like sh.
# #############################################
# Special titlecase forms, not duplicated
# #############################################
Sh''ch<>Шч; # LIU Distinguish Шч from Щ
Ch <> {Ч} $lower;
Kh <> {Х} $lower;
Shch <> {Щ}$lower;
Sh <> {Ш} $lower;
Ts <> {Ц} $lower;
Zh <> {Ж} $lower;
Yi>И;
Ye>Е;
Yo>Ё;
Yu>Ю;
Ya>Я;
# #############################################
# Rules to Duplicate
# To get the lowercase versions, copy these and lowercase
# #############################################
# variant spellings in English
SHTCH>Щ;
TCH>Ч;
TH>З;
Q>К;
WH>В;
W>В;
X>КС; #+ "X<КС;"
# Separate letters that would otherwise join
SH''<Ш}$BECOMES_C;
T''<Т}$BECOMES_S;
T''<Т}[ЧЩщ]; # LIU add special cases
K''<К}$BECOMES_H;
S''<С}$BECOMES_H;
T''<Т}$BECOMES_H;
Z''<З}$BECOMES_H;
Y''<Й}$BECOMES_VOWEL;
# Main letters
A<>А;
B<>Б;
CH<>Ч;
D<>Д;
E<>Э;
F<>Ф;
G<>Г;
Ì<>И;
I<>Ы;
KH<>Х;
K<>К;
L<>Л;
M<>М;
N<>Н;
O<>О;
P<>П;
R<>Р;
SHCH<>Щ;
SH>Ш; #+ "SH<Ш;"
Š<>Ш;
S<>С;
TS<>Ц;
T<>Т;
U<>У;
V<>В;
#ÌÀÈÒÙ
YE>Е; #+ "YE<Е;"
È<>Е;
YO>Ё; #+ "YO<Ё;"
Ò<>Ё;
YU>Ю; #+ "YU<Ю;"
Ù<>Ю;
YA>Я; #+ "YA<Я;"
À<>Я;
Y<>Й;
ZH<>Ж;
Z<>З;
H<>Ъ;
Ÿ<>Ь;
# Non-russian
J<>Ј;
# variant spellings in English
C}$csoft>С;
C>К;
# #############################################
# Duplicated Rules
# Copy and lowercase the above rules
# #############################################
# variant spellings in english
shtch>щ;
tch>ч;
th>з;
q>к;
wh>в;
w>в;
x>кс; #+ "x<кс;"
# separate letters that would otherwise join
sh''<ш}$becomes_c;
t''<т}$becomes_s;
t''<т}[чщ]; # LIU add special cases
k''<к}$becomes_h;
s''<с}$becomes_h;
t''<т}$becomes_h;
z''<з}$becomes_h;
y''<й}$becomes_vowel;
# main letters
a<>а;
b<>б;
ch<>ч;
d<>д;
e<>э;
f<>ф;
g<>г;
ì<>и;
i<>ы;
kh<>х;
k<>к;
l<>л;
m<>м;
n<>н;
o<>о;
p<>п;
r<>р;
shch<>щ;
sh>ш; #+ "sh<ш;"
š<>ш;
s<>с;
ts<>ц;
t<>т;
u<>у;
v<>в;
#ìàèòù
ye>е; #+ "ye<е;"
è<>е;
yo>ё; #+ "yo<ё;"
ò<>ё;
yu>ю; #+ "yu<ю;"
ù<>ю;
ya>я; #+ "ya<я;"
à<>я;
y<>й;
zh<>ж;
z<>з;
h<>ъ;
ÿ<>ь;
# non-russian
j<>ј;
# variant spellings in english
c}$csoft>с;
c>к;
# #############################################
# End of Duplicated Rules
# #############################################
#generally the last rule
''>;
# eof

View File

@ -1,375 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 12:18:45 2001
#--------------------------------------------------------------------
# Latin-Greek
# ==============================================
# Modern Greek Transliteration Rules
#
# This transliterates modern Greek characters, but using rules
# that are traditional for Ancient Greek, and
# thus more resemble Greek words that have become part
# of English. It differs from the official Greek
# transliteration, which is more phonetic (since
# most modern Greek vowels, for example, have
# degenerated simply to sound like "ee").
#
# There are only a few tricky parts.
# 1. eta and omega don't map directly to Latin vowels,
# so we use a macron on e and o, and some
# other combinations if they are accented.
# 2. The accented, diaeresis i and y are substituted too.
# 3. Some letters use digraphs, like "ph". While typical,
# they need some special handling.
# 4. A gamma before a gamma or a few other letters is
# transliterated as an "n", as in "Anglo"
# 5. An ypsilon after a vowel is a "u", as in
# "Mouseio". Otherwise it is a "y" as in "Physikon"
# 6. The construction of the rules is made simpler by making sure
# that most rules for lowercase letters exactly correspond to the
# rules for uppercase letters, *except* for the case of the letters
# in the rule itself. That way, after modifying the uppercase rules,
# you can just copy, paste, and "set to lowercase" to get
# the rules for lowercase letters!
# ==============================================
# ==============================================
# Variables, used to make the rules more comprehensible
# and for conditionals.
# ==============================================
### $quote='\"';
# Latin Letters
### $E_MACRON=Ē;
### $e_macron=ē;
### $O_MACRON=Ō;
### $o_macron=ō;
### $Y_UMLAUT=Ÿ;
### $y_umlaut=ÿ;
#! // with real accents.
#! + "$E_MACRON_ACUTE=Ḗ;"
#! + "$e_macron_acute=ḗ;"
#! + "$O_MACRON_ACUTE=Ṓ;"
#! + "$o_macron_acute=ṓ;"
#! + "$y_umlaut_acute=ÿ́;"
#! + "$u00ef_acute=ḯ;"
#! + "$u00fc_acute=ǘ;"
#! //
# single letter equivalents
### $E_MACRON_ACUTE=Ê;
### $e_macron_acute=ê;
### $O_MACRON_ACUTE=Ô;
### $o_macron_acute=ô;
### $y_umlaut_acute=ŷ;
### $u00ef_acute=î;
### $u00fc_acute=û;
# Greek Letters
### $ALPHA=Α;
### $BETA=Β;
### $GAMMA=Γ;
### $DELTA=Δ;
### $EPSILON=Ε;
### $ZETA=Ζ;
### $ETA=Η;
### $THETA=Θ;
### $IOTA=Ι;
### $KAPPA=Κ;
### $LAMBDA=Λ;
### $MU=Μ;
### $NU=Ν;
### $XI=Ξ;
### $OMICRON=Ο;
### $PI=Π;
### $RHO=Ρ;
### $SIGMA=Σ;
### $TAU=Τ;
### $YPSILON=Υ;
### $PHI=Φ;
### $CHI=Χ;
### $PSI=Ψ;
### $OMEGA=Ω;
### $ALPHA2=Ά;
### $EPSILON2=Έ;
### $ETA2=Ή;
### $IOTA2=Ί;
### $OMICRON2=Ό;
### $YPSILON2=Ύ;
### $OMEGA2=Ώ;
### $IOTA_DIAERESIS=Ϊ;
### $YPSILON_DIAERESIS=Ϋ;
### $alpha=α;
### $beta=β;
### $gamma=γ;
### $delta=δ;
### $epsilon=ε;
### $zeta=ζ;
### $eta=η;
### $theta=θ;
### $iota=ι;
### $kappa=κ;
### $lambda=λ;
### $mu=μ;
### $nu=ν;
### $xi=ξ;
### $omicron=ο;
### $pi=π;
### $rho=ρ;
### $sigma=σ;
### $tau=τ;
### $ypsilon=υ;
### $phi=φ;
### $chi=χ;
### $psi=ψ;
### $omega=ω;
#forms
### $alpha2=ά;
### $epsilon2=έ;
### $eta2=ή;
### $iota2=ί;
### $omicron2=ό;
### $ypsilon2=ύ;
### $omega2=ώ;
### $iota_diaeresis=ϊ;
### $ypsilon_diaeresis=ϋ;
### $iota_diaeresis2=ΐ;
### $ypsilon_diaeresis2=ΰ;
### $sigma2=ς;
# Variables for conditional mappings
# Use lowercase for all variable names, to allow cut/paste below.
$letter=[~[:Lu:][:Ll:]];
$lower=[[:Ll:]];
$softener=[eiyEIY];
$vowel=[aeiouAEIOU \
ΑΕΗΙΟΥΩ \
ΆΈΉΊΌΎΏ \
ΪΫ \
αεηιουω \
άέήίόύώ \
ϊϋ \
ΐΰ \
];
$n_gamma=[GKXCgkxc];
$gamma_n=[ΓΚΧΞγκχξ];
$pp=[Pp];
# ==============================================
# Rules
# ==============================================
# The following are special titlecase rules, and should
# not be copied when duplicating the rules for lowercase
# ==============================================
Th <> Θ}$lower;
Ph <> Φ}$lower;
Ch <> Χ}$lower;
#masked: + "Ps<Φ}$lower;"
# Because there are no uppercase forms for final sigma,
# we had to move all the sigma rules up here.
# Remember to insert ' to preserve round trip, for double letters
# don't need to do this for the digraphs with h,
# since it is not created when mapping back from greek
# use special form for s
''S <> $pp{Σ; # handle PS
S <> Σ;
# The following are a bit tricky. 's' takes two forms in greek
# final or non final.
# We use ~s to represent the abnormal form: final before letter
# or non-final before non-letter.
# We use 's to separate p and s (otherwise ps is one letter)
# so, we break out the following forms:
''s < $pp{σ}$letter;
s < σ}$letter;
'~'s < σ;
'~'s < ς}$letter;
''s < $pp{ς;
s < ς;
'~'s }$letter>ς;
'~'s > σ;
''s }$letter>σ;
''s > ς;
s }$letter>σ;
s > ς;
# because there are no uppercase forms, had to move these up too.
i'\"''`'>ΐ;
y'\"''`'>ΰ;
î<>ΐ;
û<>$vowel{ΰ;
ŷ<>ΰ;
# ==============================================
# Uppercase Forms.
# To make lowercase forms, just copy and lowercase below
# ==============================================
# Typing variants, in case the keyboard doesn't have accents
'A`'>Ά;
'E`'>Έ;
'EE`'>Ή;
EE>Η;
'I`'>Ί;
'O`'>Ό;
'OO`'>Ώ;
OO>Ω;
I'\"'>Ϊ;
Y'\"'>Ϋ;
# Basic Letters
A<>Α;
Á<>Ά;
B<>Β;
N }$n_gamma<>Γ}$gamma_n;
G<>Γ;
D<>Δ;
''E <> [Ee]{Ε; # handle EE
E<>Ε;
É<>Έ;
Z<>Ζ;
Ê<>Ή;
Ē<>Η;
TH<>Θ;
I<>Ι;
Í<>Ί;
Ï<>Ϊ;
K<>Κ;
L<>Λ;
M<>Μ;
N'' <> Ν}$gamma_n;
N<>Ν;
X<>Ξ;
''O <> [Oo]{ Ο; # handle OO
O<>Ο;
Ó<>Ό;
PH<>Φ; # needs ordering before P
PS<>Ψ; # needs ordering before P
P<>Π;
R<>Ρ;
T<>Τ;
U <> $vowel{Υ;
Ú <> $vowel{Ύ;
Ü <> $vowel{Ϋ;
Y<>Υ;
Ý<>Ύ;
Ÿ<>Ϋ;
CH<>Χ;
Ô<>Ώ;
Ō<>Ω;
# Extra English Letters. Mapped for completeness
# These are one-way (Latin to Greek) rules for Latin letters that have
# no Greek letter of their own: each is rewritten as the Latin spelling
# that the rules above already handle. C becomes S before a $softener
# (e, i, y in either case) and K otherwise.
# NOTE(review): the "|" before the replacement presumably leaves the
# cursor in front of the substituted text so that it is processed again
# by the earlier rules -- confirm against the rule syntax reference.
C}$softener>|S;
C>|K;
F>|PH;
H>|CH;
J>|I;
Q>|K;
V>|U;
W>|U;
# ==============================================
# Lowercase Forms. Just copy above and lowercase
# ==============================================
# typing variants, in case the keyboard doesn't have accents
'a`'>ά;
'e`'>έ;
'ee`'>ή;
ee>η;
'i`'>ί;
'o`'>ό;
'oo`'>ώ;
oo>ω;
i'\"'>ϊ;
y'\"'>ϋ;
# basic letters
a<>α;
á<>ά;
b<>β;
n }$n_gamma<>γ}$gamma_n;
g<>γ;
d<>δ;
''e <> [Ee]{ε; # handle EE
e<>ε;
é<>έ;
z<>ζ;
ê<>ή;
ē<>η;
th<>θ;
i<>ι;
í<>ί;
ï<>ϊ;
k<>κ;
l<>λ;
m<>μ;
n'' <> ν}$gamma_n;
n<>ν;
x<>ξ;
''o <> [Oo]{ ο; # handle OO
o<>ο;
ó<>ό;
ph<>φ; # needs ordering before p
ps<>ψ; # needs ordering before p
p<>π;
r<>ρ;
t<>τ;
u <> $vowel{υ;
ú <> $vowel{ύ;
ü <> $vowel{ϋ;
y<>υ;
ý<>ύ;
ÿ<>ϋ;
ch<>χ;
ô<>ώ;
ō<>ω;
# extra english letters. mapped for completeness
c}$softener>|s;
c>|k;
f>|ph;
h>|ch;
j>|i;
q>|k;
v>|u;
w>|u;
# ====================================
# Normal final rule: remove '
# ====================================
#+ "''>;"
# eof

View File

@ -1,216 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 12:42:06 2001
#--------------------------------------------------------------------
# Latin-Hebrew
# Variable names, derived from the Unicode names.
### $POINT_SHEVA=ְ;
### $POINT_HATAF_SEGOL=ֱ;
### $POINT_HATAF_PATAH=ֲ;
### $POINT_HATAF_QAMATS=ֳ;
### $POINT_HIRIQ=ִ;
### $POINT_TSERE=ֵ;
### $POINT_SEGOL=ֶ;
### $POINT_PATAH=ַ;
### $POINT_QAMATS=ָ;
### $POINT_HOLAM=ֹ;
### $POINT_QUBUTS=ֻ;
### $POINT_DAGESH_OR_MAPIQ=ּ;
### $POINT_METEG=ֽ;
### $PUNCTUATION_MAQAF=־;
### $POINT_RAFE=ֿ;
### $PUNCTUATION_PASEQ=׀;
### $POINT_SHIN_DOT=ׁ;
### $POINT_SIN_DOT=ׂ;
### $PUNCTUATION_SOF_PASUQ=׃;
### $ALEF=א;
### $BET=ב;
### $GIMEL=ג;
### $DALET=ד;
### $HE=ה;
### $VAV=ו;
### $ZAYIN=ז;
### $HET=ח;
### $TET=ט;
### $YOD=י;
### $FINAL_KAF=ך;
### $KAF=כ;
### $LAMED=ל;
### $FINAL_MEM=ם;
### $MEM=מ;
### $FINAL_NUN=ן;
### $NUN=נ;
### $SAMEKH=ס;
### $AYIN=ע;
### $FINAL_PE=ף;
### $PE=פ;
### $FINAL_TSADI=ץ;
### $TSADI=צ;
### $QOF=ק;
### $RESH=ר;
### $SHIN=ש;
### $TAV=ת;
### $YIDDISH_DOUBLE_VAV=װ;
### $YIDDISH_VAV_YOD=ױ;
### $YIDDISH_DOUBLE_YOD=ײ;
### $PUNCTUATION_GERESH=׳;
### $PUNCTUATION_GERSHAYIM=״;
$letter=[a-zA-Z];
$softvowel=[eiyEIY];
$vowellike=[אעיו];
$hebrew=[֐-׿]; # the whole block -liu
# [Why is this a special case? -liu]
k''h <> כ ה ;
# Mark non-final forms in final position as x~ -liu
k < כ } $hebrew ;
m < מ } $hebrew ;
n < נ } $hebrew ;
p < פ } $hebrew ;
ts < צ } $hebrew ;
k'~' <> כ ;
m'~' <> מ ;
n'~' <> נ ;
p'~' <> פ ;
ts'~'<> צ ;
# Mark final forms in non-final position as x^ -liu
k'^' <> ך } $hebrew ;
m'^' <> ם } $hebrew ;
n'^' <> ן } $hebrew ;
p'^' <> ף } $hebrew ;
ts'^'<> ץ } $hebrew ;
k < ך;
m < ם;
n < ן;
p < ף;
ts < ץ;
# Main rules
a<>א;
A>א;
b<>ב;
B>ב;
c}$softvowel>ס;
C}$softvowel>ס;
c}$letter>כ;
C}$letter>כ;
c>ך;
C>ך;
d<>ד;
D>ד;
e<>ע;
E>ע;
f}$letter>פ;
f>ף;
F}$letter>פ;
F>ף;
g<>ג;
G>ג;
h<>ה;
H>ה;
i>י;
I>י;
j>דש;
J>דש;
kh<>ח;
kH>ח;
Kh>ח;
KH>ח;
k}$letter>כ;
K}$letter>כ;
k>ך;
K>ך;
l<>ל;
L>ל;
m}$letter>מ;
m>ם;
M}$letter>מ;
M>ם;
n}$letter>נ;
n>ן;
N}$letter>נ;
N>ן;
o>ו;
O>ו;
p}$letter>פ;
p>ף;
P}$letter>פ;
P>ף;
q<>ק;
Q>ק;
r<>ר;
R>ר;
sh<>ש;
sH>ש;
Sh>ש;
SH>ש;
s''<ס}ה;
s<>ס;
S>ס;
th<>ת;
tH>ת;
Th>ת;
TH>ת;
tS}$letter>צ;
ts}$letter>צ;
Ts}$letter>צ;
TS}$letter>צ;
tS>ץ;
ts>ץ;
Ts>ץ;
TS>ץ;
t''<ט}[ה ס ש];
t<>ט;
T>ט;
v<ו}$vowellike;
u<>ו;
U>ו;
v>ו;
V>ו;
w>ו;
W>ו;
x>כס;
X>כס;
y<>י;
Y>י;
z<>ז;
Z>ז;
# Delete stray apostrophes
''>;
<'';
# eof

View File

@ -1,969 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 12:18:46 2001
#--------------------------------------------------------------------
# Latin-Kana
# Japanese hiragana and katakana to and from latin
# (romaji). Lower case latin corresponds to hiragana;
# upper case latin to katakana. The handling of
# Hiragana and Katakana is largely the same. The bulk
# of the transliterator consists of two identical sets
# of rules, differing only in case.
# Because of minor differences between the two blocks
# (e.g., the existence of small katakana ka and ke, but
# no corresponding hiragana), some rules exist for only
# one script.
# Uses modified Hepburn. Small changes to make
# unambiguous.
#| Kunrei-shiki: Hepburn/MHepburn
#| ------------------------------
#| si: shi
#| si ~ya: sha
#| si ~yu: shu
#| si ~yo: sho
#| zi: ji
#| zi ~ya: ja
#| zi ~yu: ju
#| zi ~yo: jo
#| ti: chi
#| ti ~ya: cha
#| ti ~yu: chu
#| ti ~yo: cho
#| tu: tsu
#| di: ji/dji
#| du: zu/dzu
#| hu: fu
#| For foreign words:
#| -----------------
#| se ~i si
#| si ~e she
#|
#| ze ~i zi
#| zi ~e je
#|
#| te ~i ti
#| ti ~e che
#| te ~u tu
#|
#| de ~i di
#| de ~u du
#| de ~i di
#|
#| he ~u: hu
#| hu ~a fa
#| hu ~i fi
#| hu ~e fe
#| hu ~o fo
# Most small forms are generated, but if necessary
# explicit small forms are given with ~a, ~ya, etc.
#------------------------------------------------------
# Variables
$vowel=[aeiou];
### $QUOTE='';
# Hiragana block
### $a2=ぁ;
### $a=あ;
### $i2=ぃ;
### $i=い;
### $u2=ぅ;
### $u=う;
### $e2=ぇ;
### $e=え;
### $o2=ぉ;
### $o=お;
### $ka=か;
### $ga=が;
### $ki=き;
### $gi=ぎ;
### $ku=く;
### $gu=ぐ;
### $ke=け;
### $ge=げ;
### $ko=こ;
### $go=ご;
### $sa=さ;
### $za=ざ;
### $si=し;
### $zi=じ;
### $su=す;
### $zu=ず;
### $se=せ;
### $ze=ぜ;
### $so=そ;
### $zo=ぞ;
### $ta=た;
### $da=だ;
### $ti=ち;
### $di=ぢ;
### $tu2=っ;
### $tu=つ;
### $du=づ;
### $te=て;
### $de=で;
### $to=と;
### $do=ど;
### $na=な;
### $ni=に;
### $nu=ぬ;
### $ne=ね;
### $no=の;
### $ha=は;
### $ba=ば;
### $pa=ぱ;
### $hi=ひ;
### $bi=び;
### $pi=ぴ;
### $hu=ふ;
### $bu=ぶ;
### $pu=ぷ;
### $he=へ;
### $be=べ;
### $pe=ぺ;
### $ho=ほ;
### $bo=ぼ;
### $po=ぽ;
### $ma=ま;
### $mi=み;
### $mu=む;
### $me=め;
### $mo=も;
### $ya2=ゃ;
### $ya=や;
### $yu2=ゅ;
### $yu=ゆ;
### $yo2=ょ;
### $yo=よ;
### $ra=ら;
### $ri=り;
### $ru=る;
### $re=れ;
### $ro=ろ;
### $wa2=ゎ;
### $wa=わ;
### $wi=ゐ;
### $we=ゑ;
### $wo=を;
### $n=ん;
### $vu=ゔ;
# Alternates, just to make the rules easier
### $yi2=ぃ;
### $yi=い;
### $ye2=ぇ;
### $ye=え;
### $wu=$u;
# End alternates
# Katakana block
### $A2=ァ;
### $A=ア;
### $I2=ィ;
### $I=イ;
### $U2=ゥ;
### $U=ウ;
### $E2=ェ;
### $E=エ;
### $O2=ォ;
### $O=オ;
### $KA=カ;
### $GA=ガ;
### $KI=キ;
### $GI=ギ;
### $KU=ク;
### $GU=グ;
### $KE=ケ;
### $GE=ゲ;
### $KO=コ;
### $GO=ゴ;
### $KA2=ヵ; # Small Katakana KA; no Hiragana equiv.
### $KE2=ヶ; # Small Katakana KE; no Hiragana equiv.
### $SA=サ;
### $ZA=ザ;
### $SI=シ;
### $ZI=ジ;
### $SU=ス;
### $ZU=ズ;
### $SE=セ;
### $ZE=ゼ;
### $SO=ソ;
### $ZO=ゾ;
### $TA=タ;
### $DA=ダ;
### $TI=チ;
### $DI=ヂ;
### $TU2=ッ;
### $TU=ツ;
### $DU=ヅ;
### $TE=テ;
### $DE=デ;
### $TO=ト;
### $DO=ド;
### $NA=ナ;
### $NI=ニ;
### $NU=ヌ;
### $NE=ネ;
### $NO=ノ;
### $HA=ハ;
### $BA=バ;
### $PA=パ;
### $HI=ヒ;
### $BI=ビ;
### $PI=ピ;
### $HU=フ;
### $BU=ブ;
### $PU=プ;
### $HE=ヘ;
### $BE=ベ;
### $PE=ペ;
### $HO=ホ;
### $BO=ボ;
### $PO=ポ;
### $MA=マ;
### $MI=ミ;
### $MU=ム;
### $ME=メ;
### $MO=モ;
### $YA2=ャ;
### $YA=ヤ;
### $YU2=ュ;
### $YU=ユ;
### $YO2=ョ;
### $YO=ヨ;
### $WA2=ヮ;
# Alternates, just to make the rules easier
### $YI2=ィ;
### $YI=イ;
### $YE2=ェ;
### $YE=エ;
### $WU=$U;
# End alternates
### $RA=ラ;
### $RI=リ;
### $RU=ル;
### $RE=レ;
### $RO=ロ;
### $VA=ヷ;
### $VI=ヸ;
### $VU=ヴ;
### $VE=ヹ;
### $VO=ヺ;
### $WA=ワ;
### $WI=ヰ;
### $WE=ヱ;
### $WO=ヲ;
### $N=ン;
### $LONG=ー;
# Variables used for doubled-consonants with tsu
$K_START=[カキクケコかきくけこ];
$G_START=[ガギグゲゴがぎぐげご];
$S_START=[サシスセソさしすせそ];
$Z_START=[ザズゼゾざずぜぞ];
$J_START=[ジじ];
$T_START=[タチツテトたちつてと];
$D_START=[ダヂヅデドだぢづでど];
$N_START=[ナニヌネノなにぬねの];
$H_START=[ハヒヘホはひへほ];
$F_START=[フふ];
$B_START=[バビブベボばびぶべぼ];
$P_START=[パピプペポぱぴぷぺぽ];
$M_START=[マミムメモまみむめも];
$Y_START=[ヤユヨやゆよ];
$R_START=[ラリルレロらりるれろ];
$W_START=[ワヰヱヲわゐゑを];
$V_START=[ヷヸヴヹヺゔ];
# If ン is followed by $N_QUOTER, then it needs an
# apostrophe after its romaji form to disambiguate it.
# E.g., ン ア != ナ, so represent as "n'a", not "na".
# The set covers the vowel kana, the whole N row (including ノ),
# the Y row, and ン itself, matching the hiragana set $n_quoter.
$N_QUOTER = [ア イ ウ エ オ ナ ニ ヌ ネ ノ \
ヤ ユ ヨ ン];
$n_quoter = [あ い う え お な に ぬ ね の \
や ゆ よ ん];
# Lowercase copies for convenience in making hiragana
# rule set copy
### $long = $LONG;
### $quote = $QUOTE;
### $k_start=$K_START;
### $g_start=$G_START;
### $s_start=$S_START;
### $z_start=$Z_START;
### $j_start=$J_START;
### $t_start=$T_START;
### $d_start=$D_START;
### $n_start=$N_START;
### $h_start=$H_START;
### $f_start=$F_START;
### $b_start=$B_START;
### $p_start=$P_START;
### $m_start=$M_START;
### $y_start=$Y_START;
### $r_start=$R_START;
### $w_start=$W_START;
### $v_start=$V_START;
#------------------------------------------------------
# Katakana rules
# The rules immediately following are not shared. That
# is, they exist only for katakana, not for hiragana.
VA<>ヷ;
VI<>ヸ;
VE<>ヹ;
VO<>ヺ;
'~KA'<>ヵ;
'~KE'<>ヶ;
# ~~~ BEGIN shared rules ~~~
# The shared rules are copied from katakana to hiragana
# and then mechanically lowercased.
A<>ア;
BA<>バ;
BYA<ビャ;
BYI<ビィ;
BYU<ビュ;
BYE<ビェ;
BYO<ビョ;
BI<>ビ;
BU<>ブ;
BE<>ベ;
BO<>ボ;
BY>ビ|'~Y';
CHA<チャ;
CHI'~I'<チィ; # Liu
CHU<チュ;
CHE<チェ;
CHO<チョ;
CHI<>チ;
CH>チ|'~Y';
C}I>|S;
C}E>|S;
DA<>ダ;
DI<>ディ;
DU<>デゥ;
DE<>デ;
DO<>ド;
DZU<>ヅ;
DJA<ヂャ;
DJI'~I'<ヂィ; # Liu
DJU<ヂュ;
DJE<ヂェ;
DJO<ヂョ;
DJI<>ヂ;
DJ>ヂ|'~Y';
E<>エ;
FA<ファ;
FI<フィ;
FE<フェ;
FO<フォ;
FU<>フ;
GA<>ガ;
GYA<ギャ;
GYI<ギィ;
GYU<ギュ;
GYE<ギェ;
GYO<ギョ;
GI<>ギ;
GU<>グ;
GE<>ゲ;
GO<>ゴ;
GY>ギ|'~Y';
HA<>ハ;
HI<>ヒ;
HU<>ヘゥ;
HE<>ヘ;
HO<>ホ;
I<>イ;
JA<ジャ;
JI'~I'<ジィ; # Liu
JU<ジュ;
JE<ジェ;
JO<ジョ;
JI<>ジ;
KA<>カ;
KYA<キャ;
KYI<キィ;
KYU<キュ;
KYE<キェ;
KYO<キョ;
KI<>キ;
KU<>ク;
KE<>ケ;
KO<>コ;
KY>キ|'~Y';
MA<>マ;
MYA<ミャ;
MYI<ミィ;
MYU<ミュ;
MYE<ミェ;
MYO<ミョ;
MI<>ミ;
MU<>ム;
ME<>メ;
MO<>モ;
MY>ミ|'~Y';
M}P>ン;
M}B>ン;
M}F>ン;
M}V>ン;
# N row. The plain syllables map in both directions; the NY* digraph
# spellings are produced only when converting kana back to Latin, and
# a bare NY in Latin input falls through to ニ plus a small-Y marker.
NA<>ナ;
NYA<ニャ;
NYI<ニィ;
NYU<ニュ;
NYE<ニェ;
NYO<ニョ;
NI<>ニ;
NU<>ヌ;
NE<>ネ;
NO<>ノ; # target kana restored; the hiragana copy has no<>の
NY>ニ|'~Y';
O<>オ;
PA<>パ;
PYA<ピャ;
PYI<ピィ;
PYU<ピュ;
PYE<ピェ;
PYO<ピョ;
PI<>ピ;
PU<>プ;
PE<>ペ;
PO<>ポ;
PY>ピ|'~Y';
RA<>ラ;
RYA<リャ;
RYI<リィ;
RYU<リュ;
RYE<リェ;
RYO<リョ;
RI<>リ;
RU<>ル;
RE<>レ;
RO<>ロ;
RY>リ|'~Y';
SA<>サ;
SI<>セィ;
SU<>ス;
SE<>セ;
SO<>ソ;
SHA<シャ;
SHI'~I'<シィ; # Liu
SHU<シュ;
SHE<シェ;
SHO<ショ;
SHI<>シ;
SH>シ|'~Y';
TA<>タ;
TI<>ティ;
TU<>テゥ;
TE<>テ;
TO<>ト;
# Double consonants
B}B<>ッ}$B_START;
C}K>ッ;
C}C>ッ;
C}Q>ッ;
D}D<>ッ}$D_START;
F}F<>ッ}$F_START;
G}G<>ッ}$G_START;
H}H<>ッ}$H_START;
J}J<>ッ}$J_START;
K}K<>ッ}$K_START;
L}L>ッ;
M}M<>ッ}$M_START;
N}N<>ッ}$N_START;
P}P<>ッ}$P_START;
Q}Q>ッ;
R}R<>ッ}$R_START;
S}SH>ッ;
S}S<>ッ}$S_START;
T}CH>ッ;
T}T<>ッ}$T_START;
V}V<>ッ}$V_START;
W}W<>ッ}$W_START;
X}X>ッ;
Y}Y<>ッ}$Y_START;
Z}Z<>ッ}$Z_START;
TSU<>ツ;
U<>ウ;
'V~A'<ヴァ; # Liu
'V~I'<ヴィ; # Liu
'V~E'<ヴェ; # Liu
'V~O'<ヴォ; # Liu
VU<>ヴ;
WA<>ワ;
WI<>ヰ;
WU>ウ;
WE<>ヱ;
WO<>ヲ;
YA<>ヤ;
YI>イ;
YU<>ユ;
YE>エ;
YO<>ヨ;
ZA<>ザ;
ZI<>ゼィ;
ZU<>ズ;
ZE<>ゼ;
ZO<>ゾ;
# Prolonged vowel mark. This indicates a doubling of
# the preceding vowel sound in both katakana and
# hiragana.
A<A{ー; # Liu
E<E{ー; # Liu
I<I{ー; # Liu
O<O{ー; # Liu
U<U{ー; # Liu
# Small forms
'~A'<>ァ;
'~I'<>ィ;
'~U'<>ゥ;
'~E'<>ェ;
'~O'<>ォ;
'~TSU'<>ッ;
'~WA'<>ヮ;
'~YA'<>ャ;
'~YI'>ィ;
'~YU'<>ュ;
'~YE'>ェ;
'~YO'<>ョ;
# One-way latin->kana rules. These do not occur in
# well-formed romaji representing actual Japanese text.
# Their purpose is to make all romaji map to kana of
# some sort.
# The following are not really necessary, but produce
# slightly more natural results.
CY>セィ;
DY>ディ;
HY>ヒ;
SY>セィ;
TY>ティ;
ZY>ゼィ;
# Simple substitutions using backup
C>|K;
F>フ|'~';
J>ジ|'~Y';
L>|R;
Q>|K;
V>ヴ|'~';
W>ウ|'~';
X>|KS;
# Isolated consonants listed here so as not to mask
# longer rules above.
B>ブ;
D>デ;
G>グ;
H>ヘ;
K>ク;
M>ン;
N''<ン}$N_QUOTER;
N<>ン;
P>プ;
R>ル;
S>ス;
T>テ;
Y>イ;
Z>ズ;
# ~~~ END shared rules ~~~
#------------------------------------------------------
# Hiragana rules
# Currently, there are no hiragana rules other than the
# shared rules.
# ~~~ BEGIN shared rules ~~~
# The shared rules are copied from katakana to hiragana
# and then mechanically lowercased.
a<>あ;
ba<>ば;
bya<びゃ;
byi<びぃ;
byu<びゅ;
bye<びぇ;
byo<びょ;
bi<>び;
bu<>ぶ;
be<>べ;
bo<>ぼ;
by>び|'~y';
cha<ちゃ;
chi'~i'<ちぃ; # liu
chu<ちゅ;
che<ちぇ;
cho<ちょ;
chi<>ち;
ch>ち|'~y';
c}i>|s;
c}e>|s;
da<>だ;
di<>でぃ;
du<>でぅ;
de<>で;
do<>ど;
dzu<>づ;
dja<ぢゃ;
dji'~i'<ぢぃ; # liu
dju<ぢゅ;
dje<ぢぇ;
djo<ぢょ;
dji<>ぢ;
dj>ぢ|'~y';
e<>え;
fa<ふぁ;
fi<ふぃ;
fe<ふぇ;
fo<ふぉ;
fu<>ふ;
ga<>が;
gya<ぎゃ;
gyi<ぎぃ;
gyu<ぎゅ;
gye<ぎぇ;
gyo<ぎょ;
gi<>ぎ;
gu<>ぐ;
ge<>げ;
go<>ご;
gy>ぎ|'~y';
ha<>は;
hi<>ひ;
hu<>へぅ;
he<>へ;
ho<>ほ;
i<>い;
ja<じゃ;
ji'~i'<じぃ; # liu
ju<じゅ;
je<じぇ;
jo<じょ;
ji<>じ;
ka<>か;
kya<きゃ;
kyi<きぃ;
kyu<きゅ;
kye<きぇ;
kyo<きょ;
ki<>き;
ku<>く;
ke<>け;
ko<>こ;
ky>き|'~y';
ma<>ま;
mya<みゃ;
myi<みぃ;
myu<みゅ;
mye<みぇ;
myo<みょ;
mi<>み;
mu<>む;
me<>め;
mo<>も;
my>み|'~y';
m}p>ん;
m}b>ん;
m}f>ん;
m}v>ん;
na<>な;
nya<にゃ;
nyi<にぃ;
nyu<にゅ;
nye<にぇ;
nyo<にょ;
ni<>に;
nu<>ぬ;
ne<>ね;
no<>の;
ny>に|'~y';
o<>お;
pa<>ぱ;
pya<ぴゃ;
pyi<ぴぃ;
pyu<ぴゅ;
pye<ぴぇ;
pyo<ぴょ;
pi<>ぴ;
pu<>ぷ;
pe<>ぺ;
po<>ぽ;
py>ぴ|'~y';
ra<>ら;
rya<りゃ;
ryi<りぃ;
ryu<りゅ;
rye<りぇ;
ryo<りょ;
ri<>り;
ru<>る;
re<>れ;
ro<>ろ;
ry>り|'~y';
sa<>さ;
si<>せぃ;
su<>す;
se<>せ;
so<>そ;
sha<しゃ;
shi'~i'<しぃ; # liu
shu<しゅ;
she<しぇ;
sho<しょ;
shi<>し;
sh>し|'~y';
ta<>た;
ti<>てぃ;
tu<>てぅ;
te<>て;
to<>と;
# double consonants
b}b<>っ}$B_START;
c}k>っ;
c}c>っ;
c}q>っ;
d}d<>っ}$D_START;
f}f<>っ}$F_START;
g}g<>っ}$G_START;
h}h<>っ}$H_START;
j}j<>っ}$J_START;
k}k<>っ}$K_START;
l}l>っ;
m}m<>っ}$M_START;
n}n<>っ}$N_START;
p}p<>っ}$P_START;
q}q>っ;
r}r<>っ}$R_START;
s}sh>っ;
s}s<>っ}$S_START;
t}ch>っ;
t}t<>っ}$T_START;
v}v<>っ}$V_START;
w}w<>っ}$W_START;
x}x>っ;
y}y<>っ}$Y_START;
z}z<>っ}$Z_START;
tsu<>つ;
u<>う;
'v~a'<ゔぁ; # liu
'v~i'<ゔぃ; # liu
'v~e'<ゔぇ; # liu
'v~o'<ゔぉ; # liu
vu<>ゔ;
wa<>わ;
wi<>ゐ;
wu>う;
we<>ゑ;
wo<>を;
ya<>や;
yi>い;
yu<>ゆ;
ye>え;
yo<>よ;
za<>ざ;
zi<>ぜぃ;
zu<>ず;
ze<>ぜ;
zo<>ぞ;
# prolonged vowel mark. this indicates a doubling of
# the preceding vowel sound in both katakana and
# hiragana.
a<a{ー; # liu
e<e{ー; # liu
i<i{ー; # liu
o<o{ー; # liu
u<u{ー; # liu
# small forms
'~a'<>ぁ;
'~i'<>ぃ;
'~u'<>ぅ;
'~e'<>ぇ;
'~o'<>ぉ;
'~tsu'<>っ;
'~wa'<>ゎ;
'~ya'<>ゃ;
'~yi'>ぃ;
'~yu'<>ゅ;
'~ye'>ぇ;
'~yo'<>ょ;
# one-way latin->kana rules. these do not occur in
# well-formed romaji representing actual japanese text.
# their purpose is to make all romaji map to kana of
# some sort.
# the following are not really necessary, but produce
# slightly more natural results.
cy>せぃ;
dy>でぃ;
hy>ひ;
sy>せぃ;
ty>てぃ;
zy>ぜぃ;
# simple substitutions using backup
c>|k;
f>ふ|'~';
j>じ|'~y';
l>|r;
q>|k;
v>ゔ|'~';
w>う|'~';
x>|ks;
# isolated consonants listed here so as not to mask
# longer rules above.
b>ぶ;
d>で;
g>ぐ;
h>へ;
k>く;
m>ん;
n''<ん}$n_quoter;
n<>ん;
p>ぷ;
r>る;
s>す;
t>て;
y>い;
z>ず;
# ~~~ END shared rules ~~~
#------------------------------------------------------
# Final cleanup
'~'>; # delete stray tildes
''>; # delete stray quotes
'-'>ー;
# eof

View File

@ -1,77 +0,0 @@
#--------------------------------------------------------------------
# Copyright (c) 1999-2001, International Business Machines
# Corporation and others. All Rights Reserved.
#--------------------------------------------------------------------
# Date: Tue Jan 23 12:42:07 2001
#--------------------------------------------------------------------
# StraightQuotes-CurlyQuotes
# Rewritten using character codes [LIU]
$white=[[:Zs:][:Zl:][:Zp:]];
$black=[^$white];
$open=[:Ps:];
### $dquote='\"';
### $lAng=〈;
### $ldAng=《;
### $lBrk='[';
### $lBrc='{';
### $lquote=‘;
### $rquote=’;
### $ldquote=“;
### $rdquote=”;
### $ldguill=«;
### $rdguill=»;
### $lguill=‹;
### $rguill=›;
### $mdash=—;
########################################
# Conversions from input
########################################
# join single quotes: a curly single quote followed by a straight
# apostrophe, or by a second curly single quote of the same kind,
# collapses into the matching curly double quote
‘''>“;
‘‘>“;
’''>”;
’’>”;
#smart single quotes: opening form after white space or an opening
# bracket ($open), closing form after any other character, and
# opening form when there is no preceding context
$white{''>‘;
$open{''>‘;
$black{''>’;
''>‘;
#smart doubles
$white{'\"'>“;
$open{'\"'>“;
$black{'\"'>”;
'\"'>“;
# join single guillemets: two single guillemets, or two ASCII angle
# brackets, become one double guillemet
››>»;
'>>'>»;
‹‹>«;
'<<'>«;
# prevent double spaces
\\ {\\ >;
# join hyphens into dash ### BIDIRECTIONAL ###
'--'<>—;
########################################
# Conversions back to input
########################################
#smart quotes: every curly form maps back to its straight ASCII quote
''<‘;
''<’;
'\"'<“;
'\"'<”;
# eof