scuffed-code/icu4c/source/data/translit/am_am_FONIPA.txt

# ***************************************************************************
# Copyright (C) 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# *
# *  Copyright (C) 2004-2016, International Business Machines
# *  Corporation; Unicode, Inc.; and others.  All Rights Reserved.
# *
# ***************************************************************************
# File: am_am_FONIPA.txt
# Generated from CLDR
#

# Transforms Amharic (am) to Amharic in phonemic IPA transcription (am_FONIPA).
#
# Long vowels, long/geminated consonants:
#     In the direction from am_FONIPA to am, we emit Ethiopic gemination
#     and vowel length markers (U+135D, U+135E, U+135F) although
#     they are rarely written in Amharic text. Exceptions include
#     school books and textbooks for non-native speakers.
#     Clients who do not want these markers can easily strip them off
#     in a post-processing step.
#
# Labialization:
#     Amharic speakers will usually say ሟ as [mʷa] instead of [mwa];
#     labializing [m] instead of saying [m] followed by a separate [w].
#     Most Amharic consonants can get labialized. To keep the phonemic
#     transcription simple, we emit /m/ + /w/; otherwise, our phoneme
#     set would almost double, and it would include very unusual phonemes
#     such as /ɲʷ/ or /t\u0361ʃʼʷ/.
#
# References:
#     [1] The Ge’ez Frontier Foundation: “Principles and Specification
#     for Mnemonic Ethiopic Keyboards.” Version of January 17, 2009;
#     retrieved on November 4, 2014.
#     http://keyboards.ethiopic.org/specification/GFF-MnemonicEthiopicKeyboardSpecification.pdf
#     Other than most online sources, this report uses correct IPA notation
#     with the exception of /j/, which it consistently (but wrongly)
#     writes as */y/.
$IPA_VOWEL = [aeəiɨou];
$IPA_CONSONANT = [mnɲɴ p{pʼ}bt{tʼ}dk{kʼ}ɡʔʕ fvs{sʼ}zʃʒxh lr {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}];
# Some consonants have a special syllable when labialized, such as ፗ ↔ /pʷa/.
# Amharic restricts this mostly to /a/ syllables. While the Ethiopic script
# does offer labialized syllables for other vowels, these are typically
# not written in Amharic.
$LABIALIZABLE_BEFORE_A = [p{pʼ}t{tʼ} {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}{d\u0361ʒʼ} s{sʼ}zʃʒ fv r];
← [ ʼ  \u0361  \u035C  \u032F];
::(null);
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence
# in Amharic; instead, it gets pronounced as /ha/.
ሀ → ha;
ሀ ← hə;
ሁ ↔ hu;
ሂ ↔ hi;
ሃ ↔ ha;
ሄ ↔ he;
ህ ↔ hɨ;
ሆ ↔ ho;
ሇ → ho;  # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic.
ህ ← h;
ለ ↔ lə;
ሉ ↔ lu;
ሊ ↔ li;
ላ ↔ la;
ሌ ↔ le;
ል ↔ lɨ;
ሎ ↔ lo;
ⶀ → lo;  # Dizi, Me’en, Mursi, Suri /lɔ/ ([1], Appendix E); not used in Amharic.
ሏ ↔ lwa;
ል ← l;
# Appendix B of [1] transcribes ሐ as Voiceless pharyngeal fricative
# /ħə/.  However, according to an Amharic-speaking person, Amharic
# makes no difference in pronunciation between ሐ...ሓ and ሀ...ሃ; both
# are pronounced as Voiceless glottal fricative /h/.  Also, according
# to the speaker there is no /hə/ sequence in Amharic; instead, it
# gets pronounced as /ha/.
ሐ → ha;
ሑ → hu;
ሒ → hi;
ሓ → ha;
ሔ → he;
ሕ → hɨ;
ሖ → ho;
ሗ → hwa;
መ ↔ mə;
ሙ ↔ mu;
ሚ ↔ mi;
ማ ↔ ma;
ሜ ↔ me;
ም ↔ mɨ;
ሞ ↔ mo;
ⶁ → mo;  # Dizi, Me’en, Mursi, Suri /mɔ/ ([1], Appendix E); not used in Amharic.
ᎀ → mwə;  # Sebatbeit /mwə/ ([1], Appendix H); not used in Amharic.
ᎃ → mwu;  # Sebatbeit /mwu/ ([1], Appendix H); not used in Amharic.
ᎁ → mwi;  # Sebatbeit /mwi/ ([1], Appendix H); not used in Amharic.
ሟ ↔ mwa;
ᎂ → mwe;  # Sebatbeit /mwe/ ([1], Appendix H); not used in Amharic.
ፙ → mja;  # Unclear which language; Appendix L of [1] transcribes ፙ as /mʲa/.
ም ← m;
ሠ → sə;
ሡ → su;
ሢ → si;
ሣ → sa;
ሤ → se;
ሥ → sɨ;
ሦ → so;
ሧ → swa;
ረ ↔ rə;
ሩ ↔ ru;
ሪ ↔ ri;
ራ ↔ ra;
ሬ ↔ re;
ር ↔ rɨ;
ሮ ↔ ro;
ⶂ → ro;  # Dizi, Me’en, Mursi, Suri /rɔ/ ([1], Appendix E); not used in Amharic.
ሯ ↔ rwa;
ፘ → rja;  # Unclear which language; Appendix L of [1] transcribes ፘ as /rʲa/.
ር ← r;
# Amharic speakers pronounce ⶠ like ሸ. Source: [1], Appendix B.
ⶠ → ʃə;
ⶡ → ʃu;
ⶢ → ʃi;
ⶣ → ʃa;
ⶤ → ʃe;
ⶥ → ʃɨ;
ⶦ → ʃo;
ሸ ↔ ʃə;
ሹ ↔ ʃu;
ሺ ↔ ʃi;
ሻ ↔ ʃa;
ሼ ↔ ʃe;
ሽ ↔ ʃɨ;
ሾ ↔ ʃo;
ⶄ → ʃo;  # Dizi, Me’en, Mursi, Suri /ʃɔ/ ([1], Appendix E); not used in Amharic.
ሿ ↔ ʃwa;
ሽ ← ʃ;
ቀ ↔ kʼə;
ቁ ↔ kʼu;
ቂ ↔ kʼi;
ቃ ↔ kʼa;
ቄ ↔ kʼe;
ቅ ↔ kʼɨ;
ቆ ↔ kʼo;
ቇ → kʼo;  # Dizi, Me’en, Mursi, Suri /kʼɔ/ ([1], Appendix E); not used in Amharic.
ቈ ↔ kʼwə;
ቍ ↔ kʼwu;
ቊ ↔ kʼwi;
ቋ ↔ kʼwa;
ቌ ↔ kʼwe;
ቅ ← kʼ;
# In Awngi, Blin, Qimant, and Xamtanga, ቐ is spoken as voiced uvular fricative [ʁ].
# Source: [1], Appendix C. However, */ʁ/ is not an Amharic phoneme.
# When reading foreign words with ቐ, Amharic speakers pronounce
# ቐ like ቀ, i.e. as velar ejective /kʼ/.
ቐ → kʼə;
ቑ → kʼu;
ቒ → kʼi;
ቓ → kʼa;
ቔ → kʼe;
ቕ → kʼɨ;
ቖ → kʼo;
ቘ → kʼwə;
ቝ → kʼwu;
ቚ → kʼwi;
ቛ → kʼwa;
ቜ → kʼwe;
# In Sebatbeit, ⷀ is spoken as palatalized velar ejective /kʼʲ/ ([1], Appendix H).
# In Amharic, the syllable is not used, but it might appear in names.
ⷀ → kʼjə;
ⷁ → kʼju;
ⷂ → kʼji;
ⷃ → kʼja;
ⷄ → kʼje;
ⷅ → kʼjɨ;
ⷆ → kʼjo;
በ ↔ bə;
ቡ ↔ bu;
ቢ ↔ bi;
ባ ↔ ba;
ቤ ↔ be;
ብ ↔ bɨ;
ቦ ↔ bo;
ⶅ → bo;  # Dizi, Me’en, Mursi, Suri /bɔ/ ([1], Appendix E); not used in Amharic.
ᎄ → bwə;  # Sebatbeit /bʷə/ ([1], Appendix H); not used in Amharic.
ᎇ → bwu;  # Sebatbeit /bʷu/ ([1], Appendix H); not used in Amharic.
ᎅ → bwi;  # Sebatbeit /bʷi/ ([1], Appendix H); not used in Amharic.
ቧ → bwa;  # Sebatbeit /bʷa/ ([1], Appendix H); not used in Amharic.
ᎆ → bwe;  # Sebatbeit /bʷe/ ([1], Appendix H); not used in Amharic.
ብ ← b;
ቨ ↔ və;
ቩ ↔ vu;
ቪ ↔ vi;
ቫ ↔ va;
ቬ ↔ ve;
ቭ ↔ vɨ;
ቮ ↔ vo;
ቯ ↔ vwa;
ቭ ← v;
# Unclear which Ethiopic language uses ⶨ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as t\u0361ʃ.
# For Amharic, we pronounce ⶨ therefore like ቸ.
ⶨ → t\u0361ʃə;
ⶩ → t\u0361ʃu;
ⶪ → t\u0361ʃi;
ⶫ → t\u0361ʃa;
ⶬ → t\u0361ʃe;
ⶭ → t\u0361ʃɨ;
ⶮ → t\u0361ʃo;
# In Amharic, ኀ is pronounced like ሀ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence in Amharic.
# Instead, ሀ (and hence also ኀ) gets pronounced as /ha/.
ኀ → ha;
ኁ → hu;
ኂ → hi;
ኃ → ha;
ኄ → he;
ኅ → hɨ;
ኆ → ho;
ኇ → ho;  # Dizi, Me’en, Mursi, Suri /ŋɔ/ ([1], Appendix E); not used in Amharic.
ኈ → hwə;
ኍ → hwu;
ኊ → hwi;
ኋ → hwa;
ኌ → hwe;
ነ ↔ nə;
ኑ ↔ nu;
ኒ ↔ ni;
ና ↔ na;
ኔ ↔ ne;
ን ↔ nɨ;
ኖ ↔ no;
ⶈ → no;  # Dizi, Me’en, Mursi, Suri /nɔ/ ([1], Appendix E); not used in Amharic.
ኗ ↔ nwa;
ን ← n;
ኘ ↔ ɲə;
ኙ ↔ ɲu;
ኚ ↔ ɲi;
ኛ ↔ ɲa;
ኜ ↔ ɲe;
ኝ ↔ ɲɨ;
ኞ ↔ ɲo;
ⶉ → ɲo;  # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic.
ኟ ↔ ɲwa;
ኝ ← ɲ;
# Amharic speakers pronounce ኸ as [h] because Amharic has no [x] sound.
# However, in transliterations of foreign (eg. Spanish) words with [x],
# several Amharic speakers have confirmed that they prefer ኻ over ሃ.
ዀ → hwə;
ዂ → hwi;
ዃ → hwa;
ዄ → hwe;
ዅ → hwɨ;
ኸ → hə;
ኹ → hu;
ኺ → hi;
ኻ → ha;
ኼ → he;
ኽ → hɨ;
ኾ → ho;
ዀ ← xwə;
ዂ ← xwi;
ዃ ← xwa;
ዄ ← xwe;
ዅ ← xwɨ;
ዅ ← xw;
ኸ ← xə;
ኹ ← xu;
ኺ ← xi;
ኻ ← xa;
ኼ ← xe;
ኽ ← xɨ;
ኾ ← xo;
ኽ ← x;
አ ↔ ʔə;
ኡ ↔ ʔu;
ኢ ↔ ʔi;
ኣ ↔ ʔa;
ኤ ↔ ʔe;
እ ↔ ʔɨ;
ኦ ↔ ʔo;
ⶊ → ʔo;  # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic.
እ ← ʔ;
ከ ↔ kə;
ኩ ↔ ku;
ኪ ↔ ki;
ካ ↔ ka;
ኬ ↔ ke;
ክ ↔ kɨ;
ኮ ↔ ko;
ኰ ↔ kwə;
ኵ ↔ kwu;
ኲ ↔ kwi;
ኳ ↔ kwa;
ኴ ↔ kwe;
ክ ← k;
# In Sebatbeit, ⷈ is spoken as palatalized velar plosive /kʲ/ ([1], Appendix H).
# Amharic speakers pronounce it as /k/ without palatalization.
ⷈ → kə;
ⷉ → ku;
ⷊ → ki;
ⷋ → ka;
ⷌ → ke;
ⷍ → kɨ;
ⷎ → ko;
# In Sebatbeit, ⷐ is spoken as palatalized voiceless velar fricative/xʲə/
# according to [1], Appendix H. When the syllable appears in names,
# Amharic speakers pronounce it as /kə/ without palatalization.
ⷐ → kə;
ⷑ → ku;
ⷒ → ki;
ⷓ → ka;
ⷔ → ke;
ⷕ → kɨ;
ⷖ → ko;
ወ ↔ wə;
ዉ ↔ wu;
ዊ ↔ wi;
ዋ ↔ wa;
ዌ ↔ we;
ው ↔ wɨ;
ዎ ↔ wo;
ዏ → wo;  # Dizi, Me’en, Mursi, Suri /wɔ/ ([1], Appendix E); not used in Amharic.
ው ← w;
ዐ ↔ ʕə;
ዑ ↔ ʕu;
ዒ ↔ ʕi;
ዓ ↔ ʕa;
ዔ ↔ ʕe;
ዕ ↔ ʕɨ;
ዖ ↔ ʕo;
ዒ ← ʕ;
ዘ ↔ zə;
ዙ ↔ zu;
ዚ ↔ zi;
ዛ ↔ za;
ዜ ↔ ze;
ዝ ↔ zɨ;
ዞ ↔ zo;
ⶋ → zo;  # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
ዟ ↔ zwa;
ዝ ← z;
ዠ ↔ ʒə;
ዡ ↔ ʒu;
ዢ ↔ ʒi;
ዣ ↔ ʒa;
ዤ ↔ ʒe;
ዥ ↔ ʒɨ;
ዦ ↔ ʒo;
ዧ ↔ ʒwa;
ዢ ← ʒ;
# Unclear which Ethiopic language uses ⶰ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as ʒ.
# For Amharic, we pronounce ⶰ therefore like ዠ.
ⶰ → ʒə;
ⶱ → ʒu;
ⶲ → ʒi;
ⶳ → ʒa;
ⶴ → ʒe;
ⶵ → ʒɨ;
ⶶ → ʒo;
የ ↔ jə;
ዩ ↔ ju;
ዪ ↔ ji;
ያ ↔ ja;
ዬ ↔ je;
ይ ↔ jɨ;
ዮ ↔ jo;
ዯ → jo;  # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
ይ ← j;
ጀ ↔ d\u0361ʒə;
ጁ ↔ d\u0361ʒu;
ጂ ↔ d\u0361ʒi;
ጃ ↔ d\u0361ʒa;
ጄ ↔ d\u0361ʒe;
ጅ ↔ d\u0361ʒɨ;
ጆ ↔ d\u0361ʒo;
ጇ ↔ d\u0361ʒwa;
ጅ ← d\u0361ʒ;
ደ ↔ də;
ዱ ↔ du;
ዲ ↔ di;
ዳ ↔ da;
ዴ ↔ de;
ድ ↔ dɨ;
ዶ ↔ do;
ⶌ → do;  # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
ዷ ↔ dwa;
ድ ← d;
ገ ↔ ɡə;
ጉ ↔ ɡu;
ጊ ↔ ɡi;
ጋ ↔ ɡa;
ጌ ↔ ɡe;
ግ ↔ ɡɨ;
ጎ ↔ ɡo;
ጐ ↔ ɡwə;
ጕ ↔ ɡwu;
ጒ ↔ ɡwi;
ጓ ↔ ɡwa;
ጔ ↔ ɡwe;
ግ ← ɡ;
# In Awngi, Blin, Qimant, and Xamtanga, ጘ is spoken as voiced velar nasal [ŋ].
# Source: [1], Appendix C. While /ŋ/ is not an Amharic phoneme, Amharic speakers
# still can pronounce it according to our source. However, when transliterating
# foreign words with [ŋ], Amharic uses the sequence ንግ /nɡ/. For example,
# the Amharic transliteration of Washington /waʃiŋtən/ is ዋሺንግተን.
ጘ → ŋə;
ጙ → ŋu;
ጚ → ŋi;
ጛ → ŋa;
ጜ → ŋe;
ጝ → ŋɨ;
ጞ → ŋo;
ⶓ → ŋwə;
ⶖ → ŋwu;
ⶔ → ŋwi;
ጟ → ŋwa;
ⶕ → ŋwe;
# Since there is no uvular nasal [ɴ] in Amharic, we use the velar nasal [ŋ].
ጘ ← ɴə;
ጙ ← ɴu;
ጚ ← ɴi;
ጛ ← ɴa;
ጜ ← ɴe;
ጝ ← ɴɨ;
ጞ ← ɴo;
ጝ ← ɴ;
# In Sebatbeit, ⷘ is spoken as palatalized voiced velar stop /ɡj/ ([1], Appendix H).
# Amharic speakers pronounce it as voiced velar stop /ɡ/ without palatalization.
ⷘ → ɡə;
ⷙ → ɡu;
ⷚ → ɡi;
ⷛ → ɡa;
ⷜ → ɡe;
ⷝ → ɡɨ;
ⷞ → ɡo;
ጠ ↔ tʼə;
ጡ ↔ tʼu;
ጢ ↔ tʼi;
ጣ ↔ tʼa;
ጤ ↔ tʼe;
ጥ ↔ tʼɨ;
ጦ ↔ tʼo;
ጧ ↔ tʼwa;
ጢ ← tʼ;
ጨ ↔ t\u0361ʃʼə;
ጩ ↔ t\u0361ʃʼu;
ጪ ↔ t\u0361ʃʼi;
ጫ ↔ t\u0361ʃʼa;
ጬ ↔ t\u0361ʃʼe;
ጭ ↔ t\u0361ʃʼɨ;
ጮ ↔ t\u0361ʃʼo;
ⶐ → t\u0361ʃʼo;  # Dizi, Me’en, Mursi, Suri /t\u0361ʃʼɔ/ ([1], Appendix E); not used in Amharic.
ጯ ↔ t\u0361ʃʼwa;
ጪ ← t\u0361ʃʼ;
# According to Appendix B of [1], the following are used in the Bench language
# (aka Benchnon, Gimira). In Bench, ⶻ is pronounced as /ʈ\u0361ʂʼ/ Retroflex
# ejective affricate; with a phonemic distrinction to the non-retroflex version.
# Amharic does not have retroflex phonemes, so we go with /t\u0361ʃʼ/.
ⶸ → t\u0361ʃʼə;
ⶹ → t\u0361ʃʼu;
ⶺ → t\u0361ʃʼi;
ⶻ → t\u0361ʃʼa;
ⶼ → t\u0361ʃʼe;
ⶽ → t\u0361ʃʼɨ;
ⶾ → t\u0361ʃʼo;
ቸ ↔ t\u0361ʃə;
ቹ ↔ t\u0361ʃu;
ቺ ↔ t\u0361ʃi;
ቻ ↔ t\u0361ʃa;
ቼ ↔ t\u0361ʃe;
ች ↔ t\u0361ʃɨ;
ቾ ↔ t\u0361ʃo;
ቿ ↔ t\u0361ʃwa;
ች ← t\u0361ʃ;
ተ ↔ tə;
ቱ ↔ tu;
ቲ ↔ ti;
ታ ↔ ta;
ቴ ↔ te;
ት ↔ tɨ;
ቶ ↔ to;
ⶆ → to;  # Dizi, Me’en, Mursi, Suri /tɔ/ ([1], Appendix E); not used in Amharic.
ቷ ↔ twa;
ት ← t;
ጰ ↔ pʼə;
ጱ ↔ pʼu;
ጲ ↔ pʼi;
ጳ ↔ pʼa;
ጴ ↔ pʼe;
ጵ ↔ pʼɨ;
ጶ ↔ pʼo;
ⶑ → pʼo;  # Dizi, Me’en, Mursi, Suri /pʼɔ/ ([1], Appendix E); not used in Amharic.
ጷ ↔ pʼwa;
ጵ ← pʼ;
ጸ ↔ sʼə;
ጹ ↔ sʼu;
ጺ ↔ sʼi;
ጻ ↔ sʼa;
ጼ ↔ sʼe;
ጽ ↔ sʼɨ;
ጾ ↔ sʼo;
ጿ ↔ sʼwa;
ጽ ← sʼ;
# In Amharic, ፀ is pronounced like ጸ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
ፀ → sʼə;
ፁ → sʼu;
ፂ → sʼi;
ፃ → sʼa;
ፄ → sʼe;
ፅ → sʼɨ;
ፆ → sʼo;
ፇ → sʼo;  # Dizi, Me’en, Mursi, Suri /sʼɔ/ ([1], Appendix E); not used in Amharic.
# Amharic speakers pronounce ሰ like ሠ. Source: [1], Appendix B.
ሰ ↔ sə;
ሱ ↔ su;
ሲ ↔ si;
ሳ ↔ sa;
ሴ ↔ se;
ስ ↔ sɨ;
ሶ ↔ so;
ⶃ → so;  # Dizi, Me’en, Mursi, Suri /sɔ/ ([1], Appendix E); not used in Amharic.
ሷ ↔ swa;
ስ ← s;
ፈ ↔ fə;
ፉ ↔ fu;
ፊ ↔ fi;
ፋ ↔ fa;
ፌ ↔ fe;
ፍ ↔ fɨ;
ፎ ↔ fo;
ᎈ → fwə;  # Sebatbeit /fwə/ ([1], Appendix H); not used in Amharic.
ᎉ → fwu;  # Sebatbeit /fwu/ ([1], Appendix H); not used in Amharic.
ᎋ → fwi;  # Sebatbeit /fwi/ ([1], Appendix H); not used in Amharic.
ፏ ↔ fwa;
ᎊ → fwe;  # Sebatbeit /fwe/ ([1], Appendix H); not used in Amharic.
ፚ → fja;  # Unclear which language; Appendix L of [1] transcribes ፚ as /fja/.
ፍ ← f;
ፐ ↔ pə;
ፑ ↔ pu;
ፒ ↔ pi;
ፓ ↔ pa;
ፔ ↔ pe;
ፕ ↔ pɨ;
ፖ ↔ po;
ⶒ → po;  # Dizi, Me’en, Mursi, Suri /pɔ/ ([1], Appendix E); not used in Amharic.
ᎌ → pwə;  # Sebatbeit /pwə/ ([1], Appendix H); not used in Amharic.
ᎍ → pwu;  # Sebatbeit /pwu/ ([1], Appendix H); not used in Amharic.
ᎏ → pwi;  # Sebatbeit /pwi/ ([1], Appendix H); not used in Amharic.
ፗ ↔ pwa;
ᎎ → pwe;  # Sebatbeit /pwe/ ([1], Appendix H); not used in Amharic.
ፕ ← p;
ኧ ↔ ə;
ኡ ← u;  # ኡላዓን ባዓታር ← Ulaan Baatar /ulaʕan baʕatar/
አ ← a;  # አምስተርዳም ← Amsterdam /amstərdam/
ኤ ← e;
እ ← ɨ;
ኦ ← o;  # ፖርት ኦፍ ስፔን ← Port of Spain /port of speːn/
ኢ ← i;  # ኢስላማባድ ← Islamabad /islamabad/
# Applications will typically split words before calling our rules.
# To be resilient, we replace punctuation by whitespace in IPA.
፠ → ' ';  # U+1360 ETHIOPIC SECTION MARK
፡ → ' ';  # U+1361 ETHIOPIC WORDSPACE
። → ' ';  # U+1362 ETHIOPIC FULL STOP
፣ → ' ';  # U+1363 ETHIOPIC COMMA
፤ → ' ';  # U+1364 ETHIOPIC SEMICOLON
፥ → ' ';  # U+1365 ETHIOPIC COLON
፦ → ' ';  # U+1366 ETHIOPIC PREFACE COLON
፧ → ' ';  # U+1367 ETHIOPIC QUESTION MARK
፨ → ' ';  # U+1368 ETHIOPIC PARAGRAPH SEPARATOR
# Likewise, Ethiopic numberals cannot be pronounced by these rules,
# so we replace them by whitespace in the output IPA notation.
# Applications will typically pre-process text before calling
# the am → am_FONIPA transform.
፩ → ' ';  # U+1369 ETHIOPIC DIGIT ONE
፪ → ' ';  # U+136A ETHIOPIC DIGIT TWO
፫ → ' ';  # U+136B ETHIOPIC DIGIT THREE
፬ → ' ';  # U+136C ETHIOPIC DIGIT FOUR
፭ → ' ';  # U+136D ETHIOPIC DIGIT FIVE
፮ → ' ';  # U+136E ETHIOPIC DIGIT SIX
፯ → ' ';  # U+136F ETHIOPIC DIGIT SEVEN
፰ → ' ';  # U+1370 ETHIOPIC DIGIT EIGHT
፱ → ' ';  # U+1371 ETHIOPIC DIGIT NINE
፲ → ' ';  # U+1372 ETHIOPIC NUMBER TEN
፳ → ' ';  # U+1373 ETHIOPIC NUMBER TWENTY
፴ → ' ';  # U+1374 ETHIOPIC NUMBER THIRTY
፵ → ' ';  # U+1375 ETHIOPIC NUMBER FORTY
፶ → ' ';  # U+1376 ETHIOPIC NUMBER FIFTY
፷ → ' ';  # U+1377 ETHIOPIC NUMBER SIXTY
፸ → ' ';  # U+1378 ETHIOPIC NUMBER SEVENTY
፹ → ' ';  # U+1379 ETHIOPIC NUMBER EIGHTY
፺ → ' ';  # U+137A ETHIOPIC NUMBER NINETY
፻ → ' ';  # U+137B ETHIOPIC NUMBER HUNDRED
፼ → ' ';  # U+137C ETHIOPIC NUMBER TEN THOUSAND
# Transform IPA length markers to one of these:
# U+135D ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK
# U+135E ETHIOPIC COMBINING VOWEL LENGTH MARK
# U+135F ETHIOPIC COMBINING GEMINATION MARK
::null();
← ː ;  # Strip off any remaining IPA length markers.
::(null);
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135D → $1 ː $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135E → $1 $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL?) \u135F → $1 ː $2;
[\u135D \u135E \u135F] → ;  # Strip off any remaining length markers.
$1 wa \u135D ← ($LABIALIZABLE_BEFORE_A) ː waː;  # ቷ\u135D ← [tːʷaː]
$1 wa \u135E ← ($LABIALIZABLE_BEFORE_A)   waː;  # ቷ\u135E ← [tʷaː]
$1 wa \u135F ← ($LABIALIZABLE_BEFORE_A) ː wa;   # አቷ\u135F ← [tːʷa]
$1 \u135F $2 \u135E ← ([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL) ː;
$1 \u135F $2 ← {([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL?)};
$1 \u135E ← ($IPA_VOWEL ː);
$1 \u135D ← (jː $IPA_VOWEL ː);
$1 \u135E ← ([jw] $IPA_VOWEL ː);
$1 \u135F ← (jː $IPA_VOWEL?);
$1 \u135D ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL ː);
$1 \u135E ← ($IPA_CONSONANT [w]? $IPA_VOWEL ː);
$1 \u135F ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL?);
# Insert syllable markers in a separate pass.
::null;
{($IPA_VOWEL ː?)} [[:L:]] → $1 \.;
::(null);
← [ˈˌ\. \u0303\u032F];
aj ← ai;     # Nairobi /nairobi/ ናይሮቢ, Cairo /kairo/ ካይሮ
aw ← au;     # Bissau /bisːau/ ቢሳው
eji ← ei;    # Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
ewo ← eo;    # Montevideo /montevideo/ ሞንቴቪዴዎ
ija ← ia;    # Monrovia /monrovia/ ሞንሮቪያ
ijə ← iə;    # Reunion /rijunijən/ ሪዩኒየን
iw ← iu;     # Vilnius /vilnius/ ቪልኒውስ, New Delhi /niu deːli/ ኒው ዴሊ
jo ← io;     # Tokyo /tokio/ ቶክዮ
nɡ ← ŋɡ;     # Kongo /koŋɡo/ ኮንጎ, Hungary /həŋɡari/ ሀንጋሪ
nɡ ← ŋ;      # Bangkok /baŋkok/ ባንግኮክ, Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
uwa ← ua;    # Kuala Lumpur /kuala lumpur/ ኩዋላ ሉምፑር, Ruanda /ruanda/ ሩዋንዳ
bwe ← bue;   # Buenos Aires /buenos aires/ ብዌኖስ አይሬስ
sʼ ← t\u0361s;     # Podgorica /podɡorit\u0361sa/ ፖድጎሪጻ, Vaduz /fadut\u0361s/ ፋዱጽ
uwi ← ui;    # Port Luis /port luis/ ፖርት ሉዊስ
uwe ← ue;    # Lithuania /lituenia/ ሊቱዌኒያ, Venezuela /venɨzuela/ ቬንዙዌላ
::(null);
ʔə ← \. ə;
ʔu ← \. u;
ʔi ← \. i;
ʔa ← \. a;
ʔe ← \. e;
ʔɨ ← \. ɨ;
ʔo ← \. o;
$1 w ← {($IPA_VOWEL ː?) \u032F} $IPA_VOWEL;  # /ewowa/ ← /e\u032Fo\u032Fa/
::(null);
n ← [n {n\u033C} {n\u033C\u030A} {m\u033A} {n\u030A} {n\u0325} ⁿ ᵑ];
m ← [ɱ {m\u0325} {m\u032A} ᵐ];
ɲ ← [{ɳ\u030A} {ɳ\u0325} ɳ {ɲ\u030A} {ɲ\u0325} ɲ];
ŋ ← [{ŋ\u030A} {ŋ\u0325} ŋ];
ɴ ← [{ɴ\u030A} {ɴ\u0325} ɴ];
p ← [{t\u033C} {p\u033A}];
pʼ ← [ʘ ɋ];
b ← [{d\u033C} {b\u033A} {ɾ\u033C} ɓ];
t ← [{t\u032A} ʈ];
tʼ ← [ǁ ʖ];
d ← [ɖ ɗ ᶑ];
k ← q;
kʼ ←  [ǃ ʗ];
ɡ ← [g ɢ ɣ ɠ ʛ];
nɡ ← ᵑɡ;
ʔ ← ʡ;
s ← [θ {θ\u0331} {θ\u031E} {θ\u033C} {ɸ\u033A}];
z ← [ð {ð\u0320} {ð\u033C} {β\u033A}];
sʼ ← [{t\u0361s} {t\u035Cs} ʦ];
t\u0361ʃ ← [{t\u035Cʃ} ʧ {t\u0361ɕ} {t\u035Cɕ} ʨ {ʈ\u0361ʂ} c];
t\u0361ʃʼ ← [ǀ ʇ ǂ ʄ];
d\u0361ʒ ← [ʤ ʣ {d\u0361z} {d\u035Cz} {d\u0361ɕ} ʥ {d\u0361ʑ} {d\u035Cʑ} {ɖ\u0361ʐ} {d\u0361ʐ} ɟ];
pf ← [{p\u032A} {p\u0346} ȹ {p\u0361f} {p\u032Af} {p\u032A\u035Cf}];
bv ← [{b\u032A} {b\u0346} ȸ {b\u0361v} {b\u032A\u0361v}];
ʃ ← [ʂ ɕ];
ʒ ← [ʐ ʑ];
r ← [ɾ ɽ ʁ];
rːʒ ← r\u031Dː;
rʒ ← r\u031D;
v ← β;
x ← [ç x χ];
ʕ ← ʕ\u031D;
h ← ɦ;
j ← [ʝ ʲ];
lj ← ʎ [iɨ]? [jʝʲ]?;
t\u0361ʃl ← [{t\u0361ɬ} {tɬ}];
ʃl ← ɬ;
w ← {u\u032F} $IPA_VOWEL;
w ← ʷ;
ʼː ← ːʼ;  # /pʼː/ ← /pːʼ/; /sʼː/ ← /sːʼ/; etc.
::(null);
i ← y;
ɨ ← [ɪ ʉ];
u ← [ʊ ɯ];
ə ← [ɛ æ ɘ];
o ← [ɔ ø];
a ← ɑ;
ʼ ← ʰ;
← [ʱ];
$1ːʲ ← ([pbtd])ʲː;  # [bːʲeː] ← [bʲːeː]
$1ːʷ ← ([pbtd])ʷː;  # [bːʷeː] ← [bʷːeː]
::(NFC);
← [ \u0303  \u0330  \u030B  \u0301  \u0304  \u0300  \u030F  \u030C  \u0302 ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ];
::(NFD);