f82d62a85c
X-SVN-Rev: 39273
235 lines
11 KiB
Plaintext
235 lines
11 KiB
Plaintext
# © 2016 and later: Unicode, Inc. and others.
|
||
# License & terms of use: http://www.unicode.org/copyright.html#License
|
||
#
|
||
# File: und_FONIPA_und_FONXSAMP.txt
|
||
# Generated from CLDR
|
||
#
|
||
|
||
# Conversion between IPA and X-SAMPA phonetic transcription.
|
||
#
|
||
# See http://www.phon.ucl.ac.uk/home/sampa/x-sampa.htm for a description of
|
||
# X-SAMPA, an ASCII encoding of the International Phonetic Alphabet.
|
||
#
|
||
# The following obsolete or extended IPA symbols have no X-SAMPA equivalents
|
||
# and remain unaffected by this transform:
|
||
#
|
||
# ʞ LATIN SMALL LETTER TURNED K
|
||
# ʩ LATIN SMALL LETTER FENG DIGRAPH
|
||
# ʪ LATIN SMALL LETTER LS DIGRAPH
|
||
# ʫ LATIN SMALL LETTER LZ DIGRAPH
|
||
# ʬ LATIN LETTER BILABIAL PERCUSSIVE
|
||
# ʭ LATIN LETTER BIDENTAL PERCUSSIVE
|
||
#
|
||
# An IPA tie bar is transformed to an X-SAMPA underscore, per the official
|
||
# X-SAMPA guidelines. This can result in certain ambiguities: For example, the
|
||
# labial-velar nasal (http://en.wikipedia.org/wiki/Labial-velar_nasal) can be
|
||
# written as either [ŋ\u0361m] or [m\u0361ŋ] in IPA. However, neither version can be
|
||
# represented unambiguously in X-SAMPA: IPA [ŋ\u0361m] becomes X-SAMPA [N_m], which
|
||
# is also used to represent a hypothetical laminal (_m) velar nasal, IPA [ŋ\u033B];
|
||
# and IPA [m\u0361ŋ] becomes X-SAMPA [m_N], which can also represent a linguolabial
|
||
# (_N) nasal, IPA [m\u033C], which is more appropriately written [n\u033C]. To avoid
|
||
# unintended ambiguities, it may therefore be advisable to write affricates
|
||
# without tie bars.
|
||
#
|
||
# Variable holding the X-SAMPA spelling of the IPA tie bar (U+0361). It is
# referenced as $t by the tie-bar rule and by the digraph compatibility rules.
$t = '_'; # X-SAMPA representation of IPA tie bar.
|
||
# Normalization step: NFD when the transform runs forward (IPA to X-SAMPA),
# NFC when this line is reached in the reverse direction. Working on decomposed
# text is what lets a rule such as "c\u0327 ↔ C" match a precomposed c-cedilla.
::NFD(NFC);
|
||
# 5-character X-SAMPA representations
# The sections of this file run from the longest X-SAMPA sequence to the
# shortest, so that in the reverse direction a long sequence is tried before
# any shorter rule that matches its beginning (here: 'z`' further down).
# "↔" marks a rule used in both directions; the left side is IPA, the right
# side is X-SAMPA.
|
||
ʯ ↔ 'z`_w='; # LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL
|
||
# Alternative 5-character X-SAMPA representations
# Reverse-only rules ("←"): they are consulted only when converting X-SAMPA to
# IPA. Each one writes the voiceless mark '_0' as a ring above (U+030A) rather
# than the ring below (U+0325) that the general '_0' rule produces.
# Inside single quotes a backslash is a literal X-SAMPA character.
|
||
n\u031F\u030A ← 'n_+_0';
|
||
n\u0320\u030A ← 'n_-_0';
|
||
n\u032A\u030A ← 'n_d_0';
|
||
n\u033A\u030A ← 'n_a_0';
|
||
n\u033B\u030A ← 'n_m_0';
|
||
n\u033C\u030A ← 'n_N_0';
|
||
ɻ\u030A ← 'r\`_0';
|
||
# 4-character X-SAMPA representations
# Bidirectional rules ("↔"): IPA on the left, X-SAMPA on the right. Inside
# single quotes a backslash is a literal X-SAMPA character, not an escape.
# These rules precede the shorter sequences they start with (e.g. '|\', 'J\',
# 'G\', '_H') so that the longer sequence is matched first in reverse.
|
||
ǁ ↔ '|\|\'; # LATIN LETTER LATERAL CLICK
|
||
ʄ ↔ 'J\_<'; # LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
|
||
ʛ ↔ 'G\_<'; # LATIN LETTER SMALL CAPITAL G WITH HOOK
|
||
ʮ ↔ 'z_w='; # LATIN SMALL LETTER TURNED H WITH FISHHOOK
|
||
\u1DC4 ↔ '_H_T'; # COMBINING MACRON-ACUTE
|
||
\u1DC5 ↔ '_B_L'; # COMBINING GRAVE-MACRON
|
||
\u1DC8 ↔ '_R_F'; # COMBINING GRAVE-ACUTE-GRAVE
|
||
# Alternative 4-character X-SAMPA representations
# Reverse-only rules ("←"), used only when converting X-SAMPA to IPA: the
# voiceless mark '_0' after these letters becomes a ring above (U+030A)
# instead of the ring below (U+0325) produced by the general '_0' rule.
|
||
ɭ\u030A ← 'l`_0';
|
||
ɰ\u030A ← 'M\_0';
|
||
ɳ\u030A ← 'n`_0';
|
||
ɽ\u030A ← 'r`_0';
|
||
# 3-character X-SAMPA representations
# Bidirectional rules ("↔"): IPA on the left, X-SAMPA on the right. They are
# listed ahead of the 1- and 2-character rules that share their first
# characters (b, d, g, 'r\', '<').
|
||
ɓ ↔ 'b_<'; # LATIN SMALL LETTER B WITH HOOK
|
||
ɗ ↔ 'd_<'; # LATIN SMALL LETTER D WITH HOOK
|
||
ɠ ↔ 'g_<'; # LATIN SMALL LETTER G WITH HOOK
|
||
ɻ ↔ 'r\`'; # LATIN SMALL LETTER TURNED R WITH HOOK
|
||
↗ ↔ '<R>'; # NORTH EAST ARROW
|
||
↘ ↔ '<F>'; # SOUTH EAST ARROW
|
||
# Alternative 3-character X-SAMPA representations
# Reverse-only rules ("←"), used only when converting X-SAMPA to IPA: for
# these letters the voiceless mark '_0' becomes a ring above (U+030A) instead
# of the ring below (U+0325) produced by the general '_0' rule.
|
||
j\u030A ← 'j_0';
|
||
ŋ\u030A ← 'N_0';
|
||
ɥ\u030A ← 'H_0';
|
||
ɱ\u030A ← 'F_0';
|
||
ɲ\u030A ← 'J_0';
|
||
# 2-character X-SAMPA representations
# Bidirectional rules ("↔"): IPA on the left, X-SAMPA on the right. Inside
# single quotes a backslash or backtick is a literal X-SAMPA character.
# Diacritics are written with escaped code points (\uXXXX) because the text is
# processed in decomposed (NFD) form.
|
||
ħ ↔ 'X\'; # LATIN SMALL LETTER H WITH STROKE
|
||
ǀ ↔ '|\'; # LATIN LETTER DENTAL CLICK
|
||
ǂ ↔ '=\'; # LATIN LETTER ALVEOLAR CLICK
|
||
ǃ ↔ '!\'; # LATIN LETTER RETROFLEX CLICK
|
||
ɕ ↔ 's\'; # LATIN SMALL LETTER C WITH CURL
|
||
ɖ ↔ 'd`'; # LATIN SMALL LETTER D WITH TAIL
|
||
ɘ ↔ '@\'; # LATIN SMALL LETTER REVERSED E
|
||
ɚ ↔ '@`'; # LATIN SMALL LETTER SCHWA WITH HOOK
|
||
ɝ ↔ '3`'; # LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
|
||
ɞ ↔ '3\'; # LATIN SMALL LETTER CLOSED REVERSED OPEN E
|
||
ɟ ↔ 'J\'; # LATIN SMALL LETTER DOTLESS J WITH STROKE
|
||
ɢ ↔ 'G\'; # LATIN LETTER SMALL CAPITAL G
|
||
ɦ ↔ 'h\'; # LATIN SMALL LETTER H WITH HOOK
|
||
ɧ ↔ 'x\'; # LATIN SMALL LETTER HENG WITH HOOK
|
||
ɭ ↔ 'l`'; # LATIN SMALL LETTER L WITH RETROFLEX HOOK
|
||
ɮ ↔ 'K\'; # LATIN SMALL LETTER LEZH
|
||
ɰ ↔ 'M\'; # LATIN SMALL LETTER TURNED M WITH LONG LEG
|
||
ɳ ↔ 'n`'; # LATIN SMALL LETTER N WITH RETROFLEX HOOK
|
||
ɴ ↔ 'N\'; # LATIN LETTER SMALL CAPITAL N
|
||
ɸ ↔ 'p\'; # LATIN SMALL LETTER PHI
|
||
ɹ ↔ 'r\'; # LATIN SMALL LETTER TURNED R
|
||
ɺ ↔ 'l\'; # LATIN SMALL LETTER TURNED R WITH LONG LEG
|
||
ɽ ↔ 'r`'; # LATIN SMALL LETTER R WITH TAIL
|
||
ʀ ↔ 'R\'; # LATIN LETTER SMALL CAPITAL R
|
||
ʂ ↔ 's`'; # LATIN SMALL LETTER S WITH HOOK
|
||
ʈ ↔ 't`'; # LATIN SMALL LETTER T WITH RETROFLEX HOOK
|
||
ʐ ↔ 'z`'; # LATIN SMALL LETTER Z WITH RETROFLEX HOOK
|
||
ʑ ↔ 'z\'; # LATIN SMALL LETTER Z WITH CURL
|
||
ʕ ↔ '?\'; # LATIN LETTER PHARYNGEAL VOICED FRICATIVE
|
||
ʘ ↔ 'O\'; # LATIN LETTER BILABIAL CLICK
|
||
ʙ ↔ 'B\'; # LATIN LETTER SMALL CAPITAL B
|
||
ʜ ↔ 'H\'; # LATIN LETTER SMALL CAPITAL H
|
||
ʝ ↔ 'j\'; # LATIN SMALL LETTER J WITH CROSSED-TAIL
|
||
ʟ ↔ 'L\'; # LATIN LETTER SMALL CAPITAL L
|
||
ʡ ↔ '>\'; # LATIN LETTER GLOTTAL STOP WITH STROKE
|
||
ʢ ↔ '<\'; # LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
|
||
ʰ ↔ '_h'; # MODIFIER LETTER SMALL H
|
||
ʷ ↔ '_w'; # MODIFIER LETTER SMALL W
|
||
ʼ ↔ '_>'; # MODIFIER LETTER APOSTROPHE
|
||
ˆ ↔ '_\'; # MODIFIER LETTER CIRCUMFLEX ACCENT
|
||
ˇ ↔ '_/'; # CARON
|
||
ˑ ↔ ':\'; # MODIFIER LETTER HALF TRIANGULAR COLON
|
||
ˠ ↔ '_G'; # MODIFIER LETTER SMALL GAMMA
|
||
ˡ ↔ '_l'; # MODIFIER LETTER SMALL L
|
||
# NOTE(review): '_?\' below is three characters long although it sits in the
# 2-character section; no earlier rule appears to match text starting with
# '_?', so the placement looks harmless — confirm.
ˤ ↔ '_?\'; # MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
|
||
\u0300 ↔ '_L'; # COMBINING GRAVE ACCENT
|
||
\u0301 ↔ '_H'; # COMBINING ACUTE ACCENT
|
||
\u0302 ↔ '_F'; # COMBINING CIRCUMFLEX ACCENT
|
||
\u0304 ↔ '_M'; # COMBINING MACRON
|
||
\u0306 ↔ '_X'; # COMBINING BREVE
|
||
\u0308 ↔ '_"'; # COMBINING DIAERESIS
|
||
\u030B ↔ '_T'; # COMBINING DOUBLE ACUTE ACCENT
|
||
\u030C ↔ '_R'; # COMBINING CARON
|
||
\u030F ↔ '_B'; # COMBINING DOUBLE GRAVE ACCENT
|
||
\u0318 ↔ '_A'; # COMBINING LEFT TACK BELOW
|
||
\u0319 ↔ '_q'; # COMBINING RIGHT TACK BELOW
|
||
\u031A ↔ '_}'; # COMBINING LEFT ANGLE ABOVE
|
||
\u031C ↔ '_c'; # COMBINING LEFT HALF RING BELOW
|
||
\u031D ↔ '_r'; # COMBINING UP TACK BELOW
|
||
\u031E ↔ '_o'; # COMBINING DOWN TACK BELOW
|
||
\u031F ↔ '_+'; # COMBINING PLUS SIGN BELOW
|
||
\u0320 ↔ '_-'; # COMBINING MINUS SIGN BELOW
|
||
\u0324 ↔ '_t'; # COMBINING DIAERESIS BELOW
|
||
\u0325 ↔ '_0'; # COMBINING RING BELOW
|
||
\u032A ↔ '_d'; # COMBINING BRIDGE BELOW
|
||
\u032C ↔ '_v'; # COMBINING CARON BELOW
|
||
\u032F ↔ '_^'; # COMBINING INVERTED BREVE BELOW
|
||
\u0330 ↔ '_k'; # COMBINING TILDE BELOW
|
||
\u0334 ↔ '_e'; # COMBINING TILDE OVERLAY
|
||
\u0339 ↔ '_O'; # COMBINING RIGHT HALF RING BELOW
|
||
\u033A ↔ '_a'; # COMBINING INVERTED BRIDGE BELOW
|
||
\u033B ↔ '_m'; # COMBINING SQUARE BELOW
|
||
\u033C ↔ '_N'; # COMBINING SEAGULL BELOW
|
||
\u033D ↔ '_x'; # COMBINING X ABOVE
|
||
ᵻ ↔ 'I\'; # LATIN SMALL CAPITAL LETTER I WITH STROKE
|
||
ᵿ ↔ 'U\'; # LATIN SMALL CAPITAL LETTER U WITH STROKE
|
||
ⁿ ↔ '_n'; # MODIFIER LETTER LATIN SMALL LETTER N
|
||
# Alternative 2-character X-SAMPA representations
# Reverse-only rules ("←"): these X-SAMPA spellings are accepted when
# converting to IPA. Each IPA symbol here also has a bidirectional
# 1-character rule (P, \', ~, =) in the 1-character section of this file, and
# that shorter spelling is the one those rules emit in the forward direction.
|
||
ʋ ← 'v\'; # LATIN SMALL LETTER V WITH HOOK
|
||
ʲ ← '_j'; # MODIFIER LETTER SMALL J
|
||
\u0303 ← '_~'; # COMBINING TILDE
|
||
\u0329 ← '_='; # COMBINING VERTICAL LINE BELOW
|
||
# 1-character X-SAMPA representations
# Bidirectional rules ("↔"): IPA on the left, a single X-SAMPA character on
# the right. Letters and digits are written bare; punctuation is quoted.
# These come after every multi-character section so that, in reverse, a single
# character is only matched when no longer sequence starting with it applies.
|
||
c\u0327 ↔ C; # LATIN SMALL LETTER C WITH CEDILLA (decomposed)
|
||
æ ↔ '{'; # LATIN SMALL LETTER AE
|
||
ð ↔ D; # LATIN SMALL LETTER ETH
|
||
ø ↔ 2; # LATIN SMALL LETTER O WITH STROKE
|
||
ŋ ↔ N; # LATIN SMALL LETTER ENG
|
||
œ ↔ 9; # LATIN SMALL LIGATURE OE
|
||
ɐ ↔ 6; # LATIN SMALL LETTER TURNED A
|
||
ɑ ↔ A; # LATIN SMALL LETTER ALPHA
|
||
ɒ ↔ Q; # LATIN SMALL LETTER TURNED ALPHA
|
||
ɔ ↔ O; # LATIN SMALL LETTER OPEN O
|
||
ə ↔ '@'; # LATIN SMALL LETTER SCHWA
|
||
ɛ ↔ E; # LATIN SMALL LETTER OPEN E
|
||
ɜ ↔ 3; # LATIN SMALL LETTER REVERSED OPEN E
|
||
ɡ ↔ g; # LATIN SMALL LETTER SCRIPT G
|
||
ɣ ↔ G; # LATIN SMALL LETTER GAMMA
|
||
ɤ ↔ 7; # LATIN SMALL LETTER RAMS HORN
|
||
ɥ ↔ H; # LATIN SMALL LETTER TURNED H
|
||
ɨ ↔ 1; # LATIN SMALL LETTER I WITH STROKE
|
||
ɪ ↔ I; # LATIN LETTER SMALL CAPITAL I
|
||
ɫ ↔ 5; # LATIN SMALL LETTER L WITH MIDDLE TILDE
|
||
ɬ ↔ K; # LATIN SMALL LETTER L WITH BELT
|
||
ɯ ↔ M; # LATIN SMALL LETTER TURNED M
|
||
ɱ ↔ F; # LATIN SMALL LETTER M WITH HOOK
|
||
ɲ ↔ J; # LATIN SMALL LETTER N WITH LEFT HOOK
|
||
ɵ ↔ 8; # LATIN SMALL LETTER BARRED O
|
||
ɶ ↔ '&'; # LATIN LETTER SMALL CAPITAL OE
|
||
ɾ ↔ 4; # LATIN SMALL LETTER R WITH FISHHOOK
|
||
ʁ ↔ R; # LATIN LETTER SMALL CAPITAL INVERTED R
|
||
ʃ ↔ S; # LATIN SMALL LETTER ESH
|
||
ʉ ↔ '}'; # LATIN SMALL LETTER U BAR
|
||
ʊ ↔ U; # LATIN SMALL LETTER UPSILON
|
||
ʋ ↔ P; # LATIN SMALL LETTER V WITH HOOK
|
||
ʌ ↔ V; # LATIN SMALL LETTER TURNED V
|
||
ʍ ↔ W; # LATIN SMALL LETTER TURNED W
|
||
ʎ ↔ L; # LATIN SMALL LETTER TURNED Y
|
||
ʏ ↔ Y; # LATIN LETTER SMALL CAPITAL Y
|
||
ʒ ↔ Z; # LATIN SMALL LETTER EZH
|
||
ʔ ↔ '?'; # LATIN LETTER GLOTTAL STOP
|
||
# Outside quotes, \' is an escaped literal apostrophe: the X-SAMPA side of
# the next rule is the single character '.
ʲ ↔ \'; # MODIFIER LETTER SMALL J
|
||
ˈ ↔ '"'; # MODIFIER LETTER VERTICAL LINE
|
||
ˌ ↔ '%'; # MODIFIER LETTER LOW VERTICAL LINE
|
||
ː ↔ ':'; # MODIFIER LETTER TRIANGULAR COLON
|
||
˞ ↔ '`'; # MODIFIER LETTER RHOTIC HOOK
|
||
\u0303 ↔ '~'; # COMBINING TILDE
|
||
\u0329 ↔ '='; # COMBINING VERTICAL LINE BELOW
|
||
# $t is the tie-bar variable assigned near the top of the file ('_').
\u0361 ↔ $t; # COMBINING DOUBLE INVERTED BREVE
|
||
β ↔ B; # GREEK SMALL LETTER BETA
|
||
θ ↔ T; # GREEK SMALL LETTER THETA
|
||
χ ↔ X; # GREEK SMALL LETTER CHI
|
||
↑ ↔ '^'; # UPWARDS ARROW
|
||
↓ ↔ '!'; # DOWNWARDS ARROW
|
||
# Compatibility rules for variant or obsolete IPA symbols
# Forward-only rules ("→"): they apply when converting IPA to X-SAMPA and are
# never used in the reverse direction, so X-SAMPA input always comes back as
# the symbols defined by the bidirectional rules.
# Outside quotes, \' is an escaped literal apostrophe (used after S and Z
# below); inside quotes a backslash is a literal X-SAMPA character.
# The digraph rules spell out both letters joined by $t, the tie-bar variable
# assigned near the top of the file.
|
||
g → g; # LATIN SMALL LETTER G (redundant, for additional clarity)
|
||
ȵ → J; # LATIN SMALL LETTER N WITH CURL
|
||
ɩ → I; # LATIN SMALL LETTER IOTA
|
||
ɷ → U; # LATIN SMALL LETTER CLOSED OMEGA
|
||
ɼ → 'r_r'; # LATIN SMALL LETTER R WITH LONG LEG
|
||
ɿ → 'z='; # LATIN SMALL LETTER REVERSED R WITH FISHHOOK
|
||
ʅ → 'z`='; # LATIN SMALL LETTER SQUAT REVERSED ESH
|
||
ʆ → S\'; # LATIN SMALL LETTER ESH WITH CURL
|
||
ʇ → '|\' ; # LATIN SMALL LETTER TURNED T
|
||
ʓ → Z\'; # LATIN SMALL LETTER EZH WITH CURL
|
||
ʖ → '|\|\'; # LATIN LETTER INVERTED GLOTTAL STOP
|
||
ʗ → '!\'; # LATIN LETTER STRETCHED C
|
||
ʚ → '3\'; # LATIN SMALL LETTER CLOSED OPEN E
|
||
ʠ → 'G\_<_0'; # LATIN SMALL LETTER Q WITH HOOK
|
||
ʣ → d $t z; # LATIN SMALL LETTER DZ DIGRAPH
|
||
ʤ → d $t Z; # LATIN SMALL LETTER DEZH DIGRAPH
|
||
ʥ → d $t 'z\'; # LATIN SMALL LETTER DZ DIGRAPH WITH CURL
|
||
ʦ → t $t s; # LATIN SMALL LETTER TS DIGRAPH
|
||
ʧ → t $t S; # LATIN SMALL LETTER TESH DIGRAPH
|
||
ʨ → t $t 's\'; # LATIN SMALL LETTER TC DIGRAPH WITH CURL
|
||
˔ → '_r'; # MODIFIER LETTER UP TACK
|
||
˕ → '_o'; # MODIFIER LETTER DOWN TACK
|
||
\u030A → '_0'; # COMBINING RING ABOVE
|
||
φ → 'p\'; # GREEK SMALL LETTER PHI
|
||
ꞎ → 'K`'; # LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT
|
||
# Closing normalization step: recompose to NFC after a forward (IPA to
# X-SAMPA) run. In the reverse direction this line acts as NFD and, being
# last in the file, is the first step applied (presumably; "::" steps run in
# opposite order when a transform is inverted — confirm against ICU docs).
::NFC(NFD);
|
||
|