# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html#License
#
# File: am_am_FONIPA.txt
# Generated from CLDR
#

# Transforms Amharic (am) to Amharic in phonemic IPA transcription (am_FONIPA).
#
# Long vowels, long/geminated consonants:
# In the direction from am_FONIPA to am, we emit Ethiopic gemination
# and vowel length markers (U+135D, U+135E, U+135F) although
# they are rarely written in Amharic text. Exceptions include
# school books and textbooks for non-native speakers.
# Clients who do not want these markers can easily strip them off
# in a post-processing step.
#
# Labialization:
# Amharic speakers will usually say ሟ as [mʷa] instead of [mwa];
# labializing [m] instead of saying [m] followed by a separate [w].
# Most Amharic consonants can get labialized. To keep the phonemic
# transcription simple, we emit /m/ + /w/; otherwise, our phoneme
# set would almost double, and it would include very unusual phonemes
# such as /ɲʷ/ or /t\u0361ʃʼʷ/.
#
# References:
# [1] The Ge’ez Frontier Foundation: “Principles and Specification
# for Mnemonic Ethiopic Keyboards.” Version of January 17, 2009;
# retrieved on November 4, 2014.
# http://keyboards.ethiopic.org/specification/GFF-MnemonicEthiopicKeyboardSpecification.pdf
# Unlike most online sources, this report uses correct IPA notation
# with the exception of /j/, which it consistently (but wrongly)
# writes as */y/.

# Character sets used by the length-marker and syllabification rules.
# Multi-character phonemes (ejectives, affricates) are written as {…} strings.
$IPA_VOWEL = [aeəiɨou];
$IPA_CONSONANT = [mnɲɴ p{pʼ}bt{tʼ}dk{kʼ}ɡʔʕ fvs{sʼ}zʃʒxh lr {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}];
# Some consonants have a special syllable when labialized, such as ፗ ↔ /pʷa/.
# Amharic restricts this mostly to /a/ syllables. While the Ethiopic script
# does offer labialized syllables for other vowels, these are typically
# not written in Amharic.
$LABIALIZABLE_BEFORE_A = [p{pʼ}t{tʼ} {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}{d\u0361ʒʼ} s{sʼ}zʃʒ fv r];
# Reverse direction only: drop any ejective mark, tie bar or non-syllabic
# mark that no later rule consumed.
← [ ʼ \u0361 \u035C \u032F];
::(null);
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence
# in Amharic; instead, it gets pronounced as /ha/.
ሀ → ha;
ሀ ← hə;
ሁ ↔ hu;
ሂ ↔ hi;
ሃ ↔ ha;
ሄ ↔ he;
ህ ↔ hɨ;
ሆ ↔ ho;
ሇ → ho; # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic.
ህ ← h;
ለ ↔ lə;
ሉ ↔ lu;
ሊ ↔ li;
ላ ↔ la;
ሌ ↔ le;
ል ↔ lɨ;
ሎ ↔ lo;
ⶀ → lo; # Dizi, Me’en, Mursi, Suri /lɔ/ ([1], Appendix E); not used in Amharic.
ሏ ↔ lwa;
ል ← l;
# Appendix B of [1] transcribes ሐ as Voiceless pharyngeal fricative
# /ħə/. However, according to an Amharic-speaking person, Amharic
# makes no difference in pronunciation between ሐ...ሓ and ሀ...ሃ; both
# are pronounced as Voiceless glottal fricative /h/. Also, according
# to the speaker there is no /hə/ sequence in Amharic; instead, it
# gets pronounced as /ha/.
ሐ → ha;
ሑ → hu;
ሒ → hi;
ሓ → ha;
ሔ → he;
ሕ → hɨ;
ሖ → ho;
ሗ → hwa;
መ ↔ mə;
ሙ ↔ mu;
ሚ ↔ mi;
ማ ↔ ma;
ሜ ↔ me;
ም ↔ mɨ;
ሞ ↔ mo;
ⶁ → mo; # Dizi, Me’en, Mursi, Suri /mɔ/ ([1], Appendix E); not used in Amharic.
ᎀ → mwə; # Sebatbeit /mwə/ ([1], Appendix H); not used in Amharic.
ᎃ → mwu; # Sebatbeit /mwu/ ([1], Appendix H); not used in Amharic.
ᎁ → mwi; # Sebatbeit /mwi/ ([1], Appendix H); not used in Amharic.
ሟ ↔ mwa;
ᎂ → mwe; # Sebatbeit /mwe/ ([1], Appendix H); not used in Amharic.
ፙ → mja; # Unclear which language; Appendix L of [1] transcribes ፙ as /mʲa/.
ም ← m;
ሠ → sə;
ሡ → su;
ሢ → si;
ሣ → sa;
ሤ → se;
ሥ → sɨ;
ሦ → so;
ሧ → swa;
ረ ↔ rə;
ሩ ↔ ru;
ሪ ↔ ri;
ራ ↔ ra;
ሬ ↔ re;
ር ↔ rɨ;
ሮ ↔ ro;
ⶂ → ro; # Dizi, Me’en, Mursi, Suri /rɔ/ ([1], Appendix E); not used in Amharic.
ሯ ↔ rwa;
ፘ → rja; # Unclear which language; Appendix L of [1] transcribes ፘ as /rʲa/.
ር ← r;
# Amharic speakers pronounce ⶠ like ሸ. Source: [1], Appendix B.
ⶠ → ʃə;
ⶡ → ʃu;
ⶢ → ʃi;
ⶣ → ʃa;
ⶤ → ʃe;
ⶥ → ʃɨ;
ⶦ → ʃo;
ሸ ↔ ʃə;
ሹ ↔ ʃu;
ሺ ↔ ʃi;
ሻ ↔ ʃa;
ሼ ↔ ʃe;
ሽ ↔ ʃɨ;
ሾ ↔ ʃo;
ⶄ → ʃo; # Dizi, Me’en, Mursi, Suri /ʃɔ/ ([1], Appendix E); not used in Amharic.
ሿ ↔ ʃwa;
ሽ ← ʃ;
ቀ ↔ kʼə;
ቁ ↔ kʼu;
ቂ ↔ kʼi;
ቃ ↔ kʼa;
ቄ ↔ kʼe;
ቅ ↔ kʼɨ;
ቆ ↔ kʼo;
ቇ → kʼo; # Dizi, Me’en, Mursi, Suri /kʼɔ/ ([1], Appendix E); not used in Amharic.
ቈ ↔ kʼwə;
ቍ ↔ kʼwu;
ቊ ↔ kʼwi;
ቋ ↔ kʼwa;
ቌ ↔ kʼwe;
ቅ ← kʼ;
# In Awngi, Blin, Qimant, and Xamtanga, ቐ is spoken as voiced uvular fricative [ʁ].
# Source: [1], Appendix C. However, */ʁ/ is not an Amharic phoneme.
# When reading foreign words with ቐ, Amharic speakers pronounce
# ቐ like ቀ, i.e. as velar ejective /kʼ/.
ቐ → kʼə;
ቑ → kʼu;
ቒ → kʼi;
ቓ → kʼa;
ቔ → kʼe;
ቕ → kʼɨ;
ቖ → kʼo;
ቘ → kʼwə;
ቝ → kʼwu;
ቚ → kʼwi;
ቛ → kʼwa;
ቜ → kʼwe;
# In Sebatbeit, ⷀ is spoken as palatalized velar ejective /kʼʲ/ ([1], Appendix H).
# In Amharic, the syllable is not used, but it might appear in names.
ⷀ → kʼjə;
ⷁ → kʼju;
ⷂ → kʼji;
ⷃ → kʼja;
ⷄ → kʼje;
ⷅ → kʼjɨ;
ⷆ → kʼjo;
በ ↔ bə;
ቡ ↔ bu;
ቢ ↔ bi;
ባ ↔ ba;
ቤ ↔ be;
ብ ↔ bɨ;
ቦ ↔ bo;
ⶅ → bo; # Dizi, Me’en, Mursi, Suri /bɔ/ ([1], Appendix E); not used in Amharic.
ᎄ → bwə; # Sebatbeit /bʷə/ ([1], Appendix H); not used in Amharic.
ᎇ → bwu; # Sebatbeit /bʷu/ ([1], Appendix H); not used in Amharic.
ᎅ → bwi; # Sebatbeit /bʷi/ ([1], Appendix H); not used in Amharic.
ቧ → bwa; # Sebatbeit /bʷa/ ([1], Appendix H); not used in Amharic.
ᎆ → bwe; # Sebatbeit /bʷe/ ([1], Appendix H); not used in Amharic.
ብ ← b;
ቨ ↔ və;
ቩ ↔ vu;
ቪ ↔ vi;
ቫ ↔ va;
ቬ ↔ ve;
ቭ ↔ vɨ;
ቮ ↔ vo;
ቯ ↔ vwa;
ቭ ← v;
# Unclear which Ethiopic language uses ⶨ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as t\u0361ʃ.
# For Amharic, we pronounce ⶨ therefore like ቸ.
ⶨ → t\u0361ʃə;
ⶩ → t\u0361ʃu;
ⶪ → t\u0361ʃi;
ⶫ → t\u0361ʃa;
ⶬ → t\u0361ʃe;
ⶭ → t\u0361ʃɨ;
ⶮ → t\u0361ʃo;
# In Amharic, ኀ is pronounced like ሀ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence in Amharic.
# Instead, ሀ (and hence also ኀ) gets pronounced as /ha/.
ኀ → ha;
ኁ → hu;
ኂ → hi;
ኃ → ha;
ኄ → he;
ኅ → hɨ;
ኆ → ho;
ኇ → ho; # Dizi, Me’en, Mursi, Suri /ŋɔ/ ([1], Appendix E); not used in Amharic.
ኈ → hwə;
ኍ → hwu;
ኊ → hwi;
ኋ → hwa;
ኌ → hwe;
ነ ↔ nə;
ኑ ↔ nu;
ኒ ↔ ni;
ና ↔ na;
ኔ ↔ ne;
ን ↔ nɨ;
ኖ ↔ no;
ⶈ → no; # Dizi, Me’en, Mursi, Suri /nɔ/ ([1], Appendix E); not used in Amharic.
ኗ ↔ nwa;
ን ← n;
ኘ ↔ ɲə;
ኙ ↔ ɲu;
ኚ ↔ ɲi;
ኛ ↔ ɲa;
ኜ ↔ ɲe;
ኝ ↔ ɲɨ;
ኞ ↔ ɲo;
ⶉ → ɲo; # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic.
ኟ ↔ ɲwa;
ኝ ← ɲ;
# Amharic speakers pronounce ኸ as [h] because Amharic has no [x] sound.
# However, in transliterations of foreign (e.g. Spanish) words with [x],
# several Amharic speakers have confirmed that they prefer ኻ over ሃ.
# Hence the forward rules emit /h/ while the reverse rules accept /x/.
ዀ → hwə;
ዂ → hwi;
ዃ → hwa;
ዄ → hwe;
ዅ → hwɨ;
ኸ → hə;
ኹ → hu;
ኺ → hi;
ኻ → ha;
ኼ → he;
ኽ → hɨ;
ኾ → ho;
ዀ ← xwə;
ዂ ← xwi;
ዃ ← xwa;
ዄ ← xwe;
ዅ ← xwɨ;
ዅ ← xw;
ኸ ← xə;
ኹ ← xu;
ኺ ← xi;
ኻ ← xa;
ኼ ← xe;
ኽ ← xɨ;
ኾ ← xo;
ኽ ← x;
አ ↔ ʔə;
ኡ ↔ ʔu;
ኢ ↔ ʔi;
ኣ ↔ ʔa;
ኤ ↔ ʔe;
እ ↔ ʔɨ;
ኦ ↔ ʔo;
ⶊ → ʔo; # Dizi, Me’en, Mursi, Suri /ʔɔ/ ([1], Appendix E); not used in Amharic.
እ ← ʔ;
ከ ↔ kə;
ኩ ↔ ku;
ኪ ↔ ki;
ካ ↔ ka;
ኬ ↔ ke;
ክ ↔ kɨ;
ኮ ↔ ko;
ኰ ↔ kwə;
ኵ ↔ kwu;
ኲ ↔ kwi;
ኳ ↔ kwa;
ኴ ↔ kwe;
ክ ← k;
# In Sebatbeit, ⷈ is spoken as palatalized velar plosive /kʲ/ ([1], Appendix H).
# Amharic speakers pronounce it as /k/ without palatalization.
ⷈ → kə;
ⷉ → ku;
ⷊ → ki;
ⷋ → ka;
ⷌ → ke;
ⷍ → kɨ;
ⷎ → ko;
# In Sebatbeit, ⷐ is spoken as palatalized voiceless velar fricative /xʲə/
# according to [1], Appendix H. When the syllable appears in names,
# Amharic speakers pronounce it as /kə/ without palatalization.
ⷐ → kə;
ⷑ → ku;
ⷒ → ki;
ⷓ → ka;
ⷔ → ke;
ⷕ → kɨ;
ⷖ → ko;
ወ ↔ wə;
ዉ ↔ wu;
ዊ ↔ wi;
ዋ ↔ wa;
ዌ ↔ we;
ው ↔ wɨ;
ዎ ↔ wo;
ዏ → wo; # Dizi, Me’en, Mursi, Suri /wɔ/ ([1], Appendix E); not used in Amharic.
ው ← w;
ዐ ↔ ʕə;
ዑ ↔ ʕu;
ዒ ↔ ʕi;
ዓ ↔ ʕa;
ዔ ↔ ʕe;
ዕ ↔ ʕɨ;
ዖ ↔ ʕo;
# A vowelless /ʕ/ takes the sixth-order form ዕ (the ʕɨ syllable), not ዒ (ʕi).
ዕ ← ʕ;
ዘ ↔ zə;
ዙ ↔ zu;
ዚ ↔ zi;
ዛ ↔ za;
ዜ ↔ ze;
ዝ ↔ zɨ;
ዞ ↔ zo;
ⶋ → zo; # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
ዟ ↔ zwa;
ዝ ← z;
ዠ ↔ ʒə;
ዡ ↔ ʒu;
ዢ ↔ ʒi;
ዣ ↔ ʒa;
ዤ ↔ ʒe;
ዥ ↔ ʒɨ;
ዦ ↔ ʒo;
ዧ ↔ ʒwa;
# A vowelless /ʒ/ takes the sixth-order form ዥ (the ʒɨ syllable), not ዢ (ʒi).
ዥ ← ʒ;
# Unclear which Ethiopic language uses ⶰ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as ʒ.
# For Amharic, we pronounce ⶰ therefore like ዠ.
ⶰ → ʒə;
ⶱ → ʒu;
ⶲ → ʒi;
ⶳ → ʒa;
ⶴ → ʒe;
ⶵ → ʒɨ;
ⶶ → ʒo;
የ ↔ jə;
ዩ ↔ ju;
ዪ ↔ ji;
ያ ↔ ja;
ዬ ↔ je;
ይ ↔ jɨ;
ዮ ↔ jo;
ዯ → jo; # Dizi, Me’en, Mursi, Suri /jɔ/ ([1], Appendix E); not used in Amharic.
ይ ← j;
ጀ ↔ d\u0361ʒə;
ጁ ↔ d\u0361ʒu;
ጂ ↔ d\u0361ʒi;
ጃ ↔ d\u0361ʒa;
ጄ ↔ d\u0361ʒe;
ጅ ↔ d\u0361ʒɨ;
ጆ ↔ d\u0361ʒo;
ጇ ↔ d\u0361ʒwa;
ጅ ← d\u0361ʒ;
ደ ↔ də;
ዱ ↔ du;
ዲ ↔ di;
ዳ ↔ da;
ዴ ↔ de;
ድ ↔ dɨ;
ዶ ↔ do;
ⶌ → do; # Dizi, Me’en, Mursi, Suri /dɔ/ ([1], Appendix E); not used in Amharic.
ዷ ↔ dwa;
ድ ← d;
ገ ↔ ɡə;
ጉ ↔ ɡu;
ጊ ↔ ɡi;
ጋ ↔ ɡa;
ጌ ↔ ɡe;
ግ ↔ ɡɨ;
ጎ ↔ ɡo;
ጐ ↔ ɡwə;
ጕ ↔ ɡwu;
ጒ ↔ ɡwi;
ጓ ↔ ɡwa;
ጔ ↔ ɡwe;
ግ ← ɡ;
# In Awngi, Blin, Qimant, and Xamtanga, ጘ is spoken as voiced velar nasal [ŋ].
# Source: [1], Appendix C. While /ŋ/ is not an Amharic phoneme, Amharic speakers
# still can pronounce it according to our source. However, when transliterating
# foreign words with [ŋ], Amharic uses the sequence ንግ /nɡ/. For example,
# the Amharic transliteration of Washington /waʃiŋtən/ is ዋሺንግተን.
ጘ → ŋə;
ጙ → ŋu;
ጚ → ŋi;
ጛ → ŋa;
ጜ → ŋe;
ጝ → ŋɨ;
ጞ → ŋo;
ⶓ → ŋwə;
ⶖ → ŋwu;
ⶔ → ŋwi;
ጟ → ŋwa;
ⶕ → ŋwe;
# Since there is no uvular nasal [ɴ] in Amharic, we use the velar nasal [ŋ].
ጘ ← ɴə;
ጙ ← ɴu;
ጚ ← ɴi;
ጛ ← ɴa;
ጜ ← ɴe;
ጝ ← ɴɨ;
ጞ ← ɴo;
ጝ ← ɴ;
# In Sebatbeit, ⷘ is spoken as palatalized voiced velar stop /ɡj/ ([1], Appendix H).
# Amharic speakers pronounce it as voiced velar stop /ɡ/ without palatalization.
ⷘ → ɡə;
ⷙ → ɡu;
ⷚ → ɡi;
ⷛ → ɡa;
ⷜ → ɡe;
ⷝ → ɡɨ;
ⷞ → ɡo;
ጠ ↔ tʼə;
ጡ ↔ tʼu;
ጢ ↔ tʼi;
ጣ ↔ tʼa;
ጤ ↔ tʼe;
ጥ ↔ tʼɨ;
ጦ ↔ tʼo;
ጧ ↔ tʼwa;
# A vowelless /tʼ/ takes the sixth-order form ጥ (the tʼɨ syllable), not ጢ (tʼi).
ጥ ← tʼ;
ጨ ↔ t\u0361ʃʼə;
ጩ ↔ t\u0361ʃʼu;
ጪ ↔ t\u0361ʃʼi;
ጫ ↔ t\u0361ʃʼa;
ጬ ↔ t\u0361ʃʼe;
ጭ ↔ t\u0361ʃʼɨ;
ጮ ↔ t\u0361ʃʼo;
ⶐ → t\u0361ʃʼo; # Dizi, Me’en, Mursi, Suri /t\u0361ʃʼɔ/ ([1], Appendix E); not used in Amharic.
ጯ ↔ t\u0361ʃʼwa;
# A vowelless /t\u0361ʃʼ/ takes the sixth-order form ጭ, not ጪ (t\u0361ʃʼi).
ጭ ← t\u0361ʃʼ;
# According to Appendix B of [1], the following are used in the Bench language
# (aka Benchnon, Gimira). In Bench, ⶻ is pronounced as /ʈ\u0361ʂʼ/ Retroflex
# ejective affricate; with a phonemic distinction to the non-retroflex version.
# Amharic does not have retroflex phonemes, so we go with /t\u0361ʃʼ/.
ⶸ → t\u0361ʃʼə;
ⶹ → t\u0361ʃʼu;
ⶺ → t\u0361ʃʼi;
ⶻ → t\u0361ʃʼa;
ⶼ → t\u0361ʃʼe;
ⶽ → t\u0361ʃʼɨ;
ⶾ → t\u0361ʃʼo;
ቸ ↔ t\u0361ʃə;
ቹ ↔ t\u0361ʃu;
ቺ ↔ t\u0361ʃi;
ቻ ↔ t\u0361ʃa;
ቼ ↔ t\u0361ʃe;
ች ↔ t\u0361ʃɨ;
ቾ ↔ t\u0361ʃo;
ቿ ↔ t\u0361ʃwa;
ች ← t\u0361ʃ;
ተ ↔ tə;
ቱ ↔ tu;
ቲ ↔ ti;
ታ ↔ ta;
ቴ ↔ te;
ት ↔ tɨ;
ቶ ↔ to;
ⶆ → to; # Dizi, Me’en, Mursi, Suri /tɔ/ ([1], Appendix E); not used in Amharic.
ቷ ↔ twa;
ት ← t;
ጰ ↔ pʼə;
ጱ ↔ pʼu;
ጲ ↔ pʼi;
ጳ ↔ pʼa;
ጴ ↔ pʼe;
ጵ ↔ pʼɨ;
ጶ ↔ pʼo;
ⶑ → pʼo; # Dizi, Me’en, Mursi, Suri /pʼɔ/ ([1], Appendix E); not used in Amharic.
ጷ ↔ pʼwa;
ጵ ← pʼ;
ጸ ↔ sʼə;
ጹ ↔ sʼu;
ጺ ↔ sʼi;
ጻ ↔ sʼa;
ጼ ↔ sʼe;
ጽ ↔ sʼɨ;
ጾ ↔ sʼo;
ጿ ↔ sʼwa;
ጽ ← sʼ;
# In Amharic, ፀ is pronounced like ጸ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
ፀ → sʼə;
ፁ → sʼu;
ፂ → sʼi;
ፃ → sʼa;
ፄ → sʼe;
ፅ → sʼɨ;
ፆ → sʼo;
ፇ → sʼo; # Dizi, Me’en, Mursi, Suri /sʼɔ/ ([1], Appendix E); not used in Amharic.
# Amharic speakers pronounce ሰ like ሠ. Source: [1], Appendix B.
ሰ ↔ sə;
ሱ ↔ su;
ሲ ↔ si;
ሳ ↔ sa;
ሴ ↔ se;
ስ ↔ sɨ;
ሶ ↔ so;
ⶃ → so; # Dizi, Me’en, Mursi, Suri /sɔ/ ([1], Appendix E); not used in Amharic.
ሷ ↔ swa;
ስ ← s;
ፈ ↔ fə;
ፉ ↔ fu;
ፊ ↔ fi;
ፋ ↔ fa;
ፌ ↔ fe;
ፍ ↔ fɨ;
ፎ ↔ fo;
ᎈ → fwə; # Sebatbeit /fwə/ ([1], Appendix H); not used in Amharic.
ᎉ → fwu; # Sebatbeit /fwu/ ([1], Appendix H); not used in Amharic.
ᎋ → fwi; # Sebatbeit /fwi/ ([1], Appendix H); not used in Amharic.
ፏ ↔ fwa;
ᎊ → fwe; # Sebatbeit /fwe/ ([1], Appendix H); not used in Amharic.
ፚ → fja; # Unclear which language; Appendix L of [1] transcribes ፚ as /fja/.
ፍ ← f;
ፐ ↔ pə;
ፑ ↔ pu;
ፒ ↔ pi;
ፓ ↔ pa;
ፔ ↔ pe;
ፕ ↔ pɨ;
ፖ ↔ po;
ⶒ → po; # Dizi, Me’en, Mursi, Suri /pɔ/ ([1], Appendix E); not used in Amharic.
ᎌ → pwə; # Sebatbeit /pwə/ ([1], Appendix H); not used in Amharic.
ᎍ → pwu; # Sebatbeit /pwu/ ([1], Appendix H); not used in Amharic.
ᎏ → pwi; # Sebatbeit /pwi/ ([1], Appendix H); not used in Amharic.
ፗ ↔ pwa;
ᎎ → pwe; # Sebatbeit /pwe/ ([1], Appendix H); not used in Amharic.
ፕ ← p;
ኧ ↔ ə;
# Reverse direction: an IPA vowel with no preceding consonant is written
# with the corresponding glottal-series syllable.
ኡ ← u; # ኡላዓን ባዓታር ← Ulaan Baatar /ulaʕan baʕatar/
አ ← a; # አምስተርዳም ← Amsterdam /amstərdam/
ኤ ← e;
እ ← ɨ;
ኦ ← o; # ፖርት ኦፍ ስፔን ← Port of Spain /port of speːn/
ኢ ← i; # ኢስላማባድ ← Islamabad /islamabad/
# Applications will typically split words before calling our rules.
# To be resilient, we replace punctuation by whitespace in IPA.
፠ → ' '; # U+1360 ETHIOPIC SECTION MARK
፡ → ' '; # U+1361 ETHIOPIC WORDSPACE
። → ' '; # U+1362 ETHIOPIC FULL STOP
፣ → ' '; # U+1363 ETHIOPIC COMMA
፤ → ' '; # U+1364 ETHIOPIC SEMICOLON
፥ → ' '; # U+1365 ETHIOPIC COLON
፦ → ' '; # U+1366 ETHIOPIC PREFACE COLON
፧ → ' '; # U+1367 ETHIOPIC QUESTION MARK
፨ → ' '; # U+1368 ETHIOPIC PARAGRAPH SEPARATOR
# Likewise, Ethiopic numerals cannot be pronounced by these rules,
# so we replace them by whitespace in the output IPA notation.
# Applications will typically pre-process text before calling
# the am → am_FONIPA transform.
፩ → ' '; # U+1369 ETHIOPIC DIGIT ONE
፪ → ' '; # U+136A ETHIOPIC DIGIT TWO
፫ → ' '; # U+136B ETHIOPIC DIGIT THREE
፬ → ' '; # U+136C ETHIOPIC DIGIT FOUR
፭ → ' '; # U+136D ETHIOPIC DIGIT FIVE
፮ → ' '; # U+136E ETHIOPIC DIGIT SIX
፯ → ' '; # U+136F ETHIOPIC DIGIT SEVEN
፰ → ' '; # U+1370 ETHIOPIC DIGIT EIGHT
፱ → ' '; # U+1371 ETHIOPIC DIGIT NINE
፲ → ' '; # U+1372 ETHIOPIC NUMBER TEN
፳ → ' '; # U+1373 ETHIOPIC NUMBER TWENTY
፴ → ' '; # U+1374 ETHIOPIC NUMBER THIRTY
፵ → ' '; # U+1375 ETHIOPIC NUMBER FORTY
፶ → ' '; # U+1376 ETHIOPIC NUMBER FIFTY
፷ → ' '; # U+1377 ETHIOPIC NUMBER SIXTY
፸ → ' '; # U+1378 ETHIOPIC NUMBER SEVENTY
፹ → ' '; # U+1379 ETHIOPIC NUMBER EIGHTY
፺ → ' '; # U+137A ETHIOPIC NUMBER NINETY
፻ → ' '; # U+137B ETHIOPIC NUMBER HUNDRED
፼ → ' '; # U+137C ETHIOPIC NUMBER TEN THOUSAND
# Transform IPA length markers to one of these:
# U+135D ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK
# U+135E ETHIOPIC COMBINING VOWEL LENGTH MARK
# U+135F ETHIOPIC COMBINING GEMINATION MARK
# The '::' lines below split the rules into separate passes; the order of
# both the passes and the rules within a pass is significant.
::null();
← ː ; # Strip off any remaining IPA length markers.
::(null);
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135D → $1 ː $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135E → $1 $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL?) \u135F → $1 ː $2;
[\u135D \u135E \u135F] → ; # Strip off any remaining length markers.
$1 wa \u135D ← ($LABIALIZABLE_BEFORE_A) ː waː; # ቷ\u135D ← [tːʷaː]
$1 wa \u135E ← ($LABIALIZABLE_BEFORE_A) waː; # ቷ\u135E ← [tʷaː]
$1 wa \u135F ← ($LABIALIZABLE_BEFORE_A) ː wa; # አቷ\u135F ← [tːʷa]
$1 \u135F $2 \u135E ← ([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL) ː;
$1 \u135F $2 ← {([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL?)};
$1 \u135E ← ($IPA_VOWEL ː);
$1 \u135D ← (jː $IPA_VOWEL ː);
$1 \u135E ← ([jw] $IPA_VOWEL ː);
$1 \u135F ← (jː $IPA_VOWEL?);
$1 \u135D ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL ː);
$1 \u135E ← ($IPA_CONSONANT [w]? $IPA_VOWEL ː);
$1 \u135F ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL?);
# Insert syllable markers in a separate pass.
::null;
{($IPA_VOWEL ː?)} [[:L:]] → $1 \.;
::(null);
# Reverse direction: drop stress marks, syllable dots and the listed diacritics,
# then rewrite vowel sequences and foreign sounds the way Amharic spells them.
← [ˈˌ\. \u0303\u032F];
aj ← ai; # Nairobi /nairobi/ ናይሮቢ, Cairo /kairo/ ካይሮ
aw ← au; # Bissau /bisːau/ ቢሳው
eji ← ei; # Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
ewo ← eo; # Montevideo /montevideo/ ሞንቴቪዴዎ
ija ← ia; # Monrovia /monrovia/ ሞንሮቪያ
ijə ← iə; # Reunion /rijunijən/ ሪዩኒየን
iw ← iu; # Vilnius /vilnius/ ቪልኒውስ, New Delhi /niu deːli/ ኒው ዴሊ
jo ← io; # Tokyo /tokio/ ቶክዮ
nɡ ← ŋɡ; # Kongo /koŋɡo/ ኮንጎ, Hungary /həŋɡari/ ሀንጋሪ
nɡ ← ŋ; # Bangkok /baŋkok/ ባንግኮክ, Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
uwa ← ua; # Kuala Lumpur /kuala lumpur/ ኩዋላ ሉምፑር, Ruanda /ruanda/ ሩዋንዳ
bwe ← bue; # Buenos Aires /buenos aires/ ብዌኖስ አይሬስ
sʼ ← t\u0361s; # Podgorica /podɡorit\u0361sa/ ፖድጎሪጻ, Vaduz /fadut\u0361s/ ፋዱጽ
uwi ← ui; # Port Luis /port luis/ ፖርት ሉዊስ
uwe ← ue; # Lithuania /lituenia/ ሊቱዌኒያ, Venezuela /venɨzuela/ ቬንዙዌላ
::(null);
# A vowel directly after a syllable dot gets a glottal stop onset.
ʔə ← \. ə;
ʔu ← \. u;
ʔi ← \. i;
ʔa ← \. a;
ʔe ← \. e;
ʔɨ ← \. ɨ;
ʔo ← \. o;
$1 w ← {($IPA_VOWEL ː?) \u032F} $IPA_VOWEL; # /ewowa/ ← /e\u032Fo\u032Fa/
::(null);
# Fold IPA consonants outside the Amharic inventory onto the phoneme chosen
# on the left-hand side of each rule.
n ← [n {n\u033C} {n\u033C\u030A} {m\u033A} {n\u030A} {n\u0325} ⁿ ᵑ];
m ← [ɱ {m\u0325} {m\u032A} ᵐ];
ɲ ← [{ɳ\u030A} {ɳ\u0325} ɳ {ɲ\u030A} {ɲ\u0325} ɲ];
ŋ ← [{ŋ\u030A} {ŋ\u0325} ŋ];
ɴ ← [{ɴ\u030A} {ɴ\u0325} ɴ];
p ← [{t\u033C} {p\u033A}];
pʼ ← [ʘ ɋ];
b ← [{d\u033C} {b\u033A} {ɾ\u033C} ɓ];
t ← [{t\u032A} ʈ];
tʼ ← [ǁ ʖ];
d ← [ɖ ɗ ᶑ];
k ← q;
kʼ ← [ǃ ʗ];
ɡ ← [g ɢ ɣ ɠ ʛ];
nɡ ← ᵑɡ;
ʔ ← ʡ;
s ← [θ {θ\u0331} {θ\u031E} {θ\u033C} {ɸ\u033A}];
z ← [ð {ð\u0320} {ð\u033C} {β\u033A}];
sʼ ← [{t\u0361s} {t\u035Cs} ʦ];
t\u0361ʃ ← [{t\u035Cʃ} ʧ {t\u0361ɕ} {t\u035Cɕ} ʨ {ʈ\u0361ʂ} c];
t\u0361ʃʼ ← [ǀ ʇ ǂ ʄ];
d\u0361ʒ ← [ʤ ʣ {d\u0361z} {d\u035Cz} {d\u0361ɕ} ʥ {d\u0361ʑ} {d\u035Cʑ} {ɖ\u0361ʐ} {d\u0361ʐ} ɟ];
pf ← [{p\u032A} {p\u0346} ȹ {p\u0361f} {p\u032Af} {p\u032A\u035Cf}];
bv ← [{b\u032A} {b\u0346} ȸ {b\u0361v} {b\u032A\u0361v}];
ʃ ← [ʂ ɕ];
ʒ ← [ʐ ʑ];
r ← [ɾ ɽ ʁ];
rːʒ ← r\u031Dː;
rʒ ← r\u031D;
v ← β;
x ← [ç x χ];
ʕ ← ʕ\u031D;
h ← ɦ;
j ← [ʝ ʲ];
lj ← ʎ [iɨ]? [jʝʲ]?;
t\u0361ʃl ← [{t\u0361ɬ} {tɬ}];
ʃl ← ɬ;
w ← {u\u032F} $IPA_VOWEL;
w ← ʷ;
ʼː ← ːʼ; # /pʼː/ ← /pːʼ/; /sʼː/ ← /sːʼ/; etc.
::(null);
# Fold IPA vowels outside the Amharic inventory onto the vowel chosen on the
# left-hand side of each rule.
i ← y;
ɨ ← [ɪ ʉ];
u ← [ʊ ɯ];
ə ← [ɛ æ ɘ];
o ← [ɔ ø];
a ← ɑ;
ʼ ← ʰ;
← [ʱ];
$1ːʲ ← ([pbtd])ʲː; # [bːʲeː] ← [bʲːeː]
$1ːʷ ← ([pbtd])ʷː; # [bːʷeː] ← [bʷːeː]
::(NFC);
# Reverse direction: remove the listed combining diacritics, tone letters
# and intonation arrows.
← [ \u0303 \u0330 \u030B \u0301 \u0304 \u0300 \u030F \u030C \u0302 ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ];
::(NFD);
