# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/build-icu-data.xml
#
# File: am_am_FONIPA.txt
# Generated from CLDR
#

# Transforms Amharic (am) to Amharic in phonemic IPA transcription (am_FONIPA).
#
# Long vowels, long/geminated consonants:
# In the direction from am_FONIPA to am, we emit Ethiopic gemination
# and vowel length markers (U+135D, U+135E, U+135F) although
# they are rarely written in Amharic text. Exceptions include
# school books and textbooks for non-native speakers.
# Clients who do not want these markers can easily strip them off
# in a post-processing step.
#
# Labialization:
# Amharic speakers will usually say ሟ as [mʷa] instead of [mwa];
# labializing [m] instead of saying [m] followed by a separate [w].
# Most Amharic consonants can get labialized. To keep the phonemic
# transcription simple, we emit /m/ + /w/; otherwise, our phoneme
# set would almost double, and it would include very unusual phonemes
# such as /ɲʷ/ or /t\u0361ʃʼʷ/.
#
# References:
# [1] The Ge’ez Frontier Foundation: “Principles and Specification
# for Mnemonic Ethiopic Keyboards.” Version of January 17, 2009;
# retrieved on November 4, 2014.
# http://keyboards.ethiopic.org/specification/GFF-MnemonicEthiopicKeyboardSpecification.pdf
# Unlike most online sources, this report uses correct IPA notation
# with the exception of /j/, which it consistently (but wrongly)
# writes as */y/.

# Vowel phonemes emitted by the syllable rules of this transform.
$IPA_VOWEL = [aeəiɨou];
# Consonant phonemes; multi-character phonemes (ejectives, affricates) are
# written as {…} strings. /j/ and /w/ are not members of this set.
$IPA_CONSONANT = [mnɲɴ p{pʼ}bt{tʼ}dk{kʼ}ɡʔʕ fvs{sʼ}zʃʒxh lr {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}];
# Some consonants have a special syllable when labialized, such as ፗ ↔ /pʷa/.
# Amharic restricts this mostly to /a/ syllables. While the Ethiopic script
# does offer labialized syllables for other vowels, these are typically
# not written in Amharic.
$LABIALIZABLE_BEFORE_A = [p{pʼ}t{tʼ} {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}{d\u0361ʒʼ} s{sʼ}zʃʒ fv r];
# Reverse direction only: delete any ejective mark (ʼ), tie bar (U+0361, U+035C)
# or non-syllabic mark (U+032F) that reaches this rule.
← [ ʼ \u0361 \u035C \u032F];
::(null);
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence
# in Amharic; instead, it gets pronounced as /ha/.
ሀ → ha;
ሀ ← hə;
ሁ ↔ hu;
ሂ ↔ hi;
ሃ ↔ ha;
ሄ ↔ he;
ህ ↔ hɨ;
ሆ ↔ ho;
ሇ → ho; # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic.
# A bare consonant (no following vowel) maps back to the sixth-order syllable.
ህ ← h;
ለ ↔ lə;
ሉ ↔ lu;
ሊ ↔ li;
ላ ↔ la;
ሌ ↔ le;
ል ↔ lɨ;
ሎ ↔ lo;
ⶀ → lo; # Dizi, Me’en, Mursi, Suri /lɔ/ ([1], Appendix E); not used in Amharic.
ሏ ↔ lwa;
ል ← l;
# Appendix B of [1] transcribes ሐ as Voiceless pharyngeal fricative
# /ħə/. However, according to an Amharic-speaking person, Amharic
# makes no difference in pronunciation between ሐ...ሓ and ሀ...ሃ; both
# are pronounced as Voiceless glottal fricative /h/. Also, according
# to the speaker there is no /hə/ sequence in Amharic; instead, it
# gets pronounced as /ha/.
ሐ → ha;
ሑ → hu;
ሒ → hi;
ሓ → ha;
ሔ → he;
ሕ → hɨ;
ሖ → ho;
ሗ → hwa;
መ ↔ mə;
ሙ ↔ mu;
ሚ ↔ mi;
ማ ↔ ma;
ሜ ↔ me;
ም ↔ mɨ;
ሞ ↔ mo;
ⶁ → mo; # Dizi, Me’en, Mursi, Suri /mɔ/ ([1], Appendix E); not used in Amharic.
ᎀ → mwə; # Sebatbeit /mwə/ ([1], Appendix H); not used in Amharic.
ᎃ → mwu; # Sebatbeit /mwu/ ([1], Appendix H); not used in Amharic.
ᎁ → mwi; # Sebatbeit /mwi/ ([1], Appendix H); not used in Amharic.
ሟ ↔ mwa;
ᎂ → mwe; # Sebatbeit /mwe/ ([1], Appendix H); not used in Amharic.
ፙ → mja; # Unclear which language; Appendix L of [1] transcribes ፙ as /mʲa/.
ም ← m;
# The ሠ series is forward-only; it produces the same /s/ phonemes as the ሰ series.
ሠ → sə;
ሡ → su;
ሢ → si;
ሣ → sa;
ሤ → se;
ሥ → sɨ;
ሦ → so;
ሧ → swa;
ረ ↔ rə;
ሩ ↔ ru;
ሪ ↔ ri;
ራ ↔ ra;
ሬ ↔ re;
ር ↔ rɨ;
ሮ ↔ ro;
ⶂ → ro; # Dizi, Me’en, Mursi, Suri /rɔ/ ([1], Appendix E); not used in Amharic.
ሯ ↔ rwa;
ፘ → rja; # Unclear which language; Appendix L of [1] transcribes ፘ as /rʲa/.
# A bare consonant (no following vowel) maps back to the sixth-order syllable.
ር ← r;
# Amharic speakers pronounce ⶠ like ሸ. Source: [1], Appendix B.
ⶠ → ʃə;
ⶡ → ʃu;
ⶢ → ʃi;
ⶣ → ʃa;
ⶤ → ʃe;
ⶥ → ʃɨ;
ⶦ → ʃo;
ሸ ↔ ʃə;
ሹ ↔ ʃu;
ሺ ↔ ʃi;
ሻ ↔ ʃa;
ሼ ↔ ʃe;
ሽ ↔ ʃɨ;
ሾ ↔ ʃo;
ⶄ → ʃo; # Dizi, Me’en, Mursi, Suri /ʃɔ/ ([1], Appendix E); not used in Amharic.
ሿ ↔ ʃwa;
ሽ ← ʃ;
ቀ ↔ kʼə;
ቁ ↔ kʼu;
ቂ ↔ kʼi;
ቃ ↔ kʼa;
ቄ ↔ kʼe;
ቅ ↔ kʼɨ;
ቆ ↔ kʼo;
ቇ → kʼo; # Dizi, Me’en, Mursi, Suri /kʼɔ/ ([1], Appendix E); not used in Amharic.
ቈ ↔ kʼwə;
ቍ ↔ kʼwu;
ቊ ↔ kʼwi;
ቋ ↔ kʼwa;
ቌ ↔ kʼwe;
ቅ ← kʼ;
# In Awngi, Blin, Qimant, and Xamtanga, ቐ is spoken as voiced uvular fricative [ʁ].
# Source: [1], Appendix C. However, */ʁ/ is not an Amharic phoneme.
# When reading foreign words with ቐ, Amharic speakers pronounce
# ቐ like ቀ, i.e. as velar ejective /kʼ/.
ቐ → kʼə;
ቑ → kʼu;
ቒ → kʼi;
ቓ → kʼa;
ቔ → kʼe;
ቕ → kʼɨ;
ቖ → kʼo;
ቘ → kʼwə;
ቝ → kʼwu;
ቚ → kʼwi;
ቛ → kʼwa;
ቜ → kʼwe;
# In Sebatbeit, ⷀ is spoken as palatalized velar ejective /kʼʲ/ ([1], Appendix H).
# In Amharic, the syllable is not used, but it might appear in names.
ⷀ → kʼjə;
ⷁ → kʼju;
ⷂ → kʼji;
ⷃ → kʼja;
ⷄ → kʼje;
ⷅ → kʼjɨ;
ⷆ → kʼjo;
በ ↔ bə;
ቡ ↔ bu;
ቢ ↔ bi;
ባ ↔ ba;
ቤ ↔ be;
ብ ↔ bɨ;
ቦ ↔ bo;
ⶅ → bo; # Dizi, Me’en, Mursi, Suri /bɔ/ ([1], Appendix E); not used in Amharic.
ᎄ → bwə; # Sebatbeit /bʷə/ ([1], Appendix H); not used in Amharic.
ᎇ → bwu; # Sebatbeit /bʷu/ ([1], Appendix H); not used in Amharic.
ᎅ → bwi; # Sebatbeit /bʷi/ ([1], Appendix H); not used in Amharic.
ቧ → bwa; # Sebatbeit /bʷa/ ([1], Appendix H); not used in Amharic.
ᎆ → bwe; # Sebatbeit /bʷe/ ([1], Appendix H); not used in Amharic.
ብ ← b;
ቨ ↔ və;
ቩ ↔ vu;
ቪ ↔ vi;
ቫ ↔ va;
ቬ ↔ ve;
ቭ ↔ vɨ;
ቮ ↔ vo;
ቯ ↔ vwa;
ቭ ← v;
# Unclear which Ethiopic language uses ⶨ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as t\u0361ʃ.
# For Amharic, we pronounce ⶨ therefore like ቸ.
ⶨ → t\u0361ʃə;
ⶩ → t\u0361ʃu;
ⶪ → t\u0361ʃi;
ⶫ → t\u0361ʃa;
ⶬ → t\u0361ʃe;
ⶭ → t\u0361ʃɨ;
ⶮ → t\u0361ʃo;
# In Amharic, ኀ is pronounced like ሀ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
# Appendix B of [1] transcribes ሀ as /hə/. However, according to
# an Amharic-speaking person, there is no /hə/ sequence in Amharic.
# Instead, ሀ (and hence also ኀ) gets pronounced as /ha/.
ኀ → ha;
ኁ → hu;
ኂ → hi;
ኃ → ha;
ኄ → he;
ኅ → hɨ;
ኆ → ho;
ኇ → ho; # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic.
ኈ → hwə;
ኍ → hwu;
ኊ → hwi;
ኋ → hwa;
ኌ → hwe;
ነ ↔ nə;
ኑ ↔ nu;
ኒ ↔ ni;
ና ↔ na;
ኔ ↔ ne;
ን ↔ nɨ;
ኖ ↔ no;
ⶈ → no; # Dizi, Me’en, Mursi, Suri /nɔ/ ([1], Appendix E); not used in Amharic.
ኗ ↔ nwa;
ን ← n;
ኘ ↔ ɲə;
ኙ ↔ ɲu;
ኚ ↔ ɲi;
ኛ ↔ ɲa;
ኜ ↔ ɲe;
ኝ ↔ ɲɨ;
ኞ ↔ ɲo;
ⶉ → ɲo; # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic.
ኟ ↔ ɲwa;
ኝ ← ɲ;
# Amharic speakers pronounce ኸ as [h] because Amharic has no [x] sound.
# However, in transliterations of foreign (e.g. Spanish) words with [x],
# several Amharic speakers have confirmed that they prefer ኻ over ሃ.
# Hence the forward rules emit /h/, while IPA /x/ maps back to the ኸ series.
ዀ → hwə;
ዂ → hwi;
ዃ → hwa;
ዄ → hwe;
ዅ → hwɨ;
ኸ → hə;
ኹ → hu;
ኺ → hi;
ኻ → ha;
ኼ → he;
ኽ → hɨ;
ኾ → ho;
ዀ ← xwə;
ዂ ← xwi;
ዃ ← xwa;
ዄ ← xwe;
ዅ ← xwɨ;
ዅ ← xw;
ኸ ← xə;
ኹ ← xu;
ኺ ← xi;
ኻ ← xa;
ኼ ← xe;
ኽ ← xɨ;
ኾ ← xo;
ኽ ← x;
አ ↔ ʔə;
ኡ ↔ ʔu;
ኢ ↔ ʔi;
ኣ ↔ ʔa;
ኤ ↔ ʔe;
እ ↔ ʔɨ;
ኦ ↔ ʔo;
ⶊ → ʔo; # Dizi, Me’en, Mursi, Suri /ʔɔ/ ([1], Appendix E); not used in Amharic.
# A bare consonant (no following vowel) maps back to the sixth-order syllable,
# i.e. the one that is also paired with consonant + /ɨ/.
እ ← ʔ;
ከ ↔ kə;
ኩ ↔ ku;
ኪ ↔ ki;
ካ ↔ ka;
ኬ ↔ ke;
ክ ↔ kɨ;
ኮ ↔ ko;
ኰ ↔ kwə;
ኵ ↔ kwu;
ኲ ↔ kwi;
ኳ ↔ kwa;
ኴ ↔ kwe;
ክ ← k;
# In Sebatbeit, ⷈ is spoken as palatalized velar plosive /kʲ/ ([1], Appendix H).
# Amharic speakers pronounce it as /k/ without palatalization.
ⷈ → kə;
ⷉ → ku;
ⷊ → ki;
ⷋ → ka;
ⷌ → ke;
ⷍ → kɨ;
ⷎ → ko;
# In Sebatbeit, ⷐ is spoken as palatalized voiceless velar fricative /xʲə/
# according to [1], Appendix H. When the syllable appears in names,
# Amharic speakers pronounce it as /kə/ without palatalization.
ⷐ → kə;
ⷑ → ku;
ⷒ → ki;
ⷓ → ka;
ⷔ → ke;
ⷕ → kɨ;
ⷖ → ko;
ወ ↔ wə;
ዉ ↔ wu;
ዊ ↔ wi;
ዋ ↔ wa;
ዌ ↔ we;
ው ↔ wɨ;
ዎ ↔ wo;
ዏ → wo; # Dizi, Me’en, Mursi, Suri /wɔ/ ([1], Appendix E); not used in Amharic.
ው ← w;
ዐ ↔ ʕə;
ዑ ↔ ʕu;
ዒ ↔ ʕi;
ዓ ↔ ʕa;
ዔ ↔ ʕe;
ዕ ↔ ʕɨ;
ዖ ↔ ʕo;
# Bare /ʕ/ uses the sixth-order ዕ (not ዒ, which would add a spurious /i/).
ዕ ← ʕ;
ዘ ↔ zə;
ዙ ↔ zu;
ዚ ↔ zi;
ዛ ↔ za;
ዜ ↔ ze;
ዝ ↔ zɨ;
ዞ ↔ zo;
ⶋ → zo; # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
ዟ ↔ zwa;
ዝ ← z;
ዠ ↔ ʒə;
ዡ ↔ ʒu;
ዢ ↔ ʒi;
ዣ ↔ ʒa;
ዤ ↔ ʒe;
ዥ ↔ ʒɨ;
ዦ ↔ ʒo;
ዧ ↔ ʒwa;
# Bare /ʒ/ uses the sixth-order ዥ (not ዢ, which would add a spurious /i/).
ዥ ← ʒ;
# Unclear which Ethiopic language uses ⶰ. It only appears in the
# “Language Neutral” list of Appendix L in [1], which transcribes it as ʒ.
# For Amharic, we pronounce ⶰ therefore like ዠ.
ⶰ → ʒə;
ⶱ → ʒu;
ⶲ → ʒi;
ⶳ → ʒa;
ⶴ → ʒe;
ⶵ → ʒɨ;
ⶶ → ʒo;
የ ↔ jə;
ዩ ↔ ju;
ዪ ↔ ji;
ያ ↔ ja;
ዬ ↔ je;
ይ ↔ jɨ;
ዮ ↔ jo;
ዯ → jo; # Dizi, Me’en, Mursi, Suri /jɔ/ ([1], Appendix E); not used in Amharic.
ይ ← j;
ጀ ↔ d\u0361ʒə;
ጁ ↔ d\u0361ʒu;
ጂ ↔ d\u0361ʒi;
ጃ ↔ d\u0361ʒa;
ጄ ↔ d\u0361ʒe;
ጅ ↔ d\u0361ʒɨ;
ጆ ↔ d\u0361ʒo;
ጇ ↔ d\u0361ʒwa;
ጅ ← d\u0361ʒ;
ደ ↔ də;
ዱ ↔ du;
ዲ ↔ di;
ዳ ↔ da;
ዴ ↔ de;
ድ ↔ dɨ;
ዶ ↔ do;
ⶌ → do; # Dizi, Me’en, Mursi, Suri /dɔ/ ([1], Appendix E); not used in Amharic.
ዷ ↔ dwa;
# A bare consonant (no following vowel) maps back to the sixth-order syllable,
# i.e. the one that is also paired with consonant + /ɨ/.
ድ ← d;
ገ ↔ ɡə;
ጉ ↔ ɡu;
ጊ ↔ ɡi;
ጋ ↔ ɡa;
ጌ ↔ ɡe;
ግ ↔ ɡɨ;
ጎ ↔ ɡo;
ጐ ↔ ɡwə;
ጕ ↔ ɡwu;
ጒ ↔ ɡwi;
ጓ ↔ ɡwa;
ጔ ↔ ɡwe;
ግ ← ɡ;
# In Awngi, Blin, Qimant, and Xamtanga, ጘ is spoken as voiced velar nasal [ŋ].
# Source: [1], Appendix C. While /ŋ/ is not an Amharic phoneme, Amharic speakers
# still can pronounce it according to our source. However, when transliterating
# foreign words with [ŋ], Amharic uses the sequence ንግ /nɡ/. For example,
# the Amharic transliteration of Washington /waʃiŋtən/ is ዋሺንግተን.
ጘ → ŋə;
ጙ → ŋu;
ጚ → ŋi;
ጛ → ŋa;
ጜ → ŋe;
ጝ → ŋɨ;
ጞ → ŋo;
ⶓ → ŋwə;
ⶖ → ŋwu;
ⶔ → ŋwi;
ጟ → ŋwa;
ⶕ → ŋwe;
# Since there is no uvular nasal [ɴ] in Amharic, we use the velar nasal [ŋ].
ጘ ← ɴə;
ጙ ← ɴu;
ጚ ← ɴi;
ጛ ← ɴa;
ጜ ← ɴe;
ጝ ← ɴɨ;
ጞ ← ɴo;
ጝ ← ɴ;
# In Sebatbeit, ⷘ is spoken as palatalized voiced velar stop /ɡj/ ([1], Appendix H).
# Amharic speakers pronounce it as voiced velar stop /ɡ/ without palatalization.
ⷘ → ɡə;
ⷙ → ɡu;
ⷚ → ɡi;
ⷛ → ɡa;
ⷜ → ɡe;
ⷝ → ɡɨ;
ⷞ → ɡo;
ጠ ↔ tʼə;
ጡ ↔ tʼu;
ጢ ↔ tʼi;
ጣ ↔ tʼa;
ጤ ↔ tʼe;
ጥ ↔ tʼɨ;
ጦ ↔ tʼo;
ጧ ↔ tʼwa;
# Bare /tʼ/ uses the sixth-order ጥ (not ጢ, which would add a spurious /i/).
ጥ ← tʼ;
ጨ ↔ t\u0361ʃʼə;
ጩ ↔ t\u0361ʃʼu;
ጪ ↔ t\u0361ʃʼi;
ጫ ↔ t\u0361ʃʼa;
ጬ ↔ t\u0361ʃʼe;
ጭ ↔ t\u0361ʃʼɨ;
ጮ ↔ t\u0361ʃʼo;
ⶐ → t\u0361ʃʼo; # Dizi, Me’en, Mursi, Suri /t\u0361ʃʼɔ/ ([1], Appendix E); not used in Amharic.
ጯ ↔ t\u0361ʃʼwa;
# Bare /t\u0361ʃʼ/ uses the sixth-order ጭ (not ጪ, which would add a spurious /i/).
ጭ ← t\u0361ʃʼ;
# According to Appendix B of [1], the following are used in the Bench language
# (aka Benchnon, Gimira). In Bench, ⶻ is pronounced as /ʈ\u0361ʂʼ/ Retroflex
# ejective affricate; with a phonemic distinction to the non-retroflex version.
# Amharic does not have retroflex phonemes, so we go with /t\u0361ʃʼ/.
# Forward-only series rendered as the ejective affricate /t\u0361ʃʼ/.
ⶸ → t\u0361ʃʼə;
ⶹ → t\u0361ʃʼu;
ⶺ → t\u0361ʃʼi;
ⶻ → t\u0361ʃʼa;
ⶼ → t\u0361ʃʼe;
ⶽ → t\u0361ʃʼɨ;
ⶾ → t\u0361ʃʼo;
ቸ ↔ t\u0361ʃə;
ቹ ↔ t\u0361ʃu;
ቺ ↔ t\u0361ʃi;
ቻ ↔ t\u0361ʃa;
ቼ ↔ t\u0361ʃe;
ች ↔ t\u0361ʃɨ;
ቾ ↔ t\u0361ʃo;
ቿ ↔ t\u0361ʃwa;
# A bare consonant (no following vowel) maps back to the sixth-order syllable.
ች ← t\u0361ʃ;
ተ ↔ tə;
ቱ ↔ tu;
ቲ ↔ ti;
ታ ↔ ta;
ቴ ↔ te;
ት ↔ tɨ;
ቶ ↔ to;
ⶆ → to; # Dizi, Me’en, Mursi, Suri /tɔ/ ([1], Appendix E); not used in Amharic.
ቷ ↔ twa;
ት ← t;
ጰ ↔ pʼə;
ጱ ↔ pʼu;
ጲ ↔ pʼi;
ጳ ↔ pʼa;
ጴ ↔ pʼe;
ጵ ↔ pʼɨ;
ጶ ↔ pʼo;
ⶑ → pʼo; # Dizi, Me’en, Mursi, Suri /pʼɔ/ ([1], Appendix E); not used in Amharic.
ጷ ↔ pʼwa;
ጵ ← pʼ;
ጸ ↔ sʼə;
ጹ ↔ sʼu;
ጺ ↔ sʼi;
ጻ ↔ sʼa;
ጼ ↔ sʼe;
ጽ ↔ sʼɨ;
ጾ ↔ sʼo;
ጿ ↔ sʼwa;
ጽ ← sʼ;
# In Amharic, ፀ is pronounced like ጸ.
# Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
ፀ → sʼə;
ፁ → sʼu;
ፂ → sʼi;
ፃ → sʼa;
ፄ → sʼe;
ፅ → sʼɨ;
ፆ → sʼo;
ፇ → sʼo; # Dizi, Me’en, Mursi, Suri /sʼɔ/ ([1], Appendix E); not used in Amharic.
# Amharic speakers pronounce ሰ like ሠ. Source: [1], Appendix B.
ሰ ↔ sə;
ሱ ↔ su;
ሲ ↔ si;
ሳ ↔ sa;
ሴ ↔ se;
ስ ↔ sɨ;
ሶ ↔ so;
ⶃ → so; # Dizi, Me’en, Mursi, Suri /sɔ/ ([1], Appendix E); not used in Amharic.
ሷ ↔ swa;
ስ ← s;
ፈ ↔ fə;
ፉ ↔ fu;
ፊ ↔ fi;
ፋ ↔ fa;
ፌ ↔ fe;
ፍ ↔ fɨ;
ፎ ↔ fo;
ᎈ → fwə; # Sebatbeit /fwə/ ([1], Appendix H); not used in Amharic.
ᎉ → fwu; # Sebatbeit /fwu/ ([1], Appendix H); not used in Amharic.
ᎋ → fwi; # Sebatbeit /fwi/ ([1], Appendix H); not used in Amharic.
ፏ ↔ fwa;
ᎊ → fwe; # Sebatbeit /fwe/ ([1], Appendix H); not used in Amharic.
ፚ → fja; # Unclear which language; Appendix L of [1] transcribes ፚ as /fja/.
ፍ ← f;
ፐ ↔ pə;
ፑ ↔ pu;
ፒ ↔ pi;
ፓ ↔ pa;
ፔ ↔ pe;
ፕ ↔ pɨ;
ፖ ↔ po;
ⶒ → po; # Dizi, Me’en, Mursi, Suri /pɔ/ ([1], Appendix E); not used in Amharic.
ᎌ → pwə; # Sebatbeit /pwə/ ([1], Appendix H); not used in Amharic.
ᎍ → pwu; # Sebatbeit /pwu/ ([1], Appendix H); not used in Amharic.
ᎏ → pwi; # Sebatbeit /pwi/ ([1], Appendix H); not used in Amharic.
ፗ ↔ pwa;
ᎎ → pwe; # Sebatbeit /pwe/ ([1], Appendix H); not used in Amharic.
# A bare consonant (no following vowel) maps back to the sixth-order syllable.
ፕ ← p;
ኧ ↔ ə;
# Reverse direction only: a vowel that is not part of a consonant + vowel
# syllable is written with a glottal-series syllable.
ኡ ← u; # ኡላዓን ባዓታር ← Ulaan Baatar /ulaʕan baʕatar/
አ ← a; # አምስተርዳም ← Amsterdam /amstərdam/
ኤ ← e;
እ ← ɨ;
ኦ ← o; # ፖርት ኦፍ ስፔን ← Port of Spain /port of speːn/
ኢ ← i; # ኢስላማባድ ← Islamabad /islamabad/
# Applications will typically split words before calling our rules.
# To be resilient, we replace punctuation by whitespace in IPA.
፠ → ' '; # U+1360 ETHIOPIC SECTION MARK
፡ → ' '; # U+1361 ETHIOPIC WORDSPACE
። → ' '; # U+1362 ETHIOPIC FULL STOP
፣ → ' '; # U+1363 ETHIOPIC COMMA
፤ → ' '; # U+1364 ETHIOPIC SEMICOLON
፥ → ' '; # U+1365 ETHIOPIC COLON
፦ → ' '; # U+1366 ETHIOPIC PREFACE COLON
፧ → ' '; # U+1367 ETHIOPIC QUESTION MARK
፨ → ' '; # U+1368 ETHIOPIC PARAGRAPH SEPARATOR
# Likewise, Ethiopic numerals cannot be pronounced by these rules,
# so we replace them by whitespace in the output IPA notation.
# Applications will typically pre-process text before calling
# the am → am_FONIPA transform.
# Ethiopic digits and numbers are replaced by a space (forward direction only).
፩ → ' '; # U+1369 ETHIOPIC DIGIT ONE
፪ → ' '; # U+136A ETHIOPIC DIGIT TWO
፫ → ' '; # U+136B ETHIOPIC DIGIT THREE
፬ → ' '; # U+136C ETHIOPIC DIGIT FOUR
፭ → ' '; # U+136D ETHIOPIC DIGIT FIVE
፮ → ' '; # U+136E ETHIOPIC DIGIT SIX
፯ → ' '; # U+136F ETHIOPIC DIGIT SEVEN
፰ → ' '; # U+1370 ETHIOPIC DIGIT EIGHT
፱ → ' '; # U+1371 ETHIOPIC DIGIT NINE
፲ → ' '; # U+1372 ETHIOPIC NUMBER TEN
፳ → ' '; # U+1373 ETHIOPIC NUMBER TWENTY
፴ → ' '; # U+1374 ETHIOPIC NUMBER THIRTY
፵ → ' '; # U+1375 ETHIOPIC NUMBER FORTY
፶ → ' '; # U+1376 ETHIOPIC NUMBER FIFTY
፷ → ' '; # U+1377 ETHIOPIC NUMBER SIXTY
፸ → ' '; # U+1378 ETHIOPIC NUMBER SEVENTY
፹ → ' '; # U+1379 ETHIOPIC NUMBER EIGHTY
፺ → ' '; # U+137A ETHIOPIC NUMBER NINETY
፻ → ' '; # U+137B ETHIOPIC NUMBER HUNDRED
፼ → ' '; # U+137C ETHIOPIC NUMBER TEN THOUSAND
# Transform IPA length markers to one of these:
# U+135D ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK
# U+135E ETHIOPIC COMBINING VOWEL LENGTH MARK
# U+135F ETHIOPIC COMBINING GEMINATION MARK
# NOTE(review): per ICU rule syntax, `::null();` presumably separates passes in
# the forward direction only, `::(null);` in the reverse direction only, and
# `::null;` in both — confirm against the ICU Transforms guide.
::null();
← ː ; # Strip off any remaining IPA length markers.
::(null);
# Forward: an Ethiopic length mark after consonant + vowel becomes IPA ː on the
# consonant (gemination), on the vowel (length), or on both.
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135D → $1 ː $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135E → $1 $2 ː;
($IPA_CONSONANT) ([jw]? $IPA_VOWEL?) \u135F → $1 ː $2;
[\u135D \u135E \u135F] → ; # Strip off any remaining length markers.
# Reverse: IPA ː is moved behind the syllable as an Ethiopic length mark.
$1 wa \u135D ← ($LABIALIZABLE_BEFORE_A) ː waː; # ቷ\u135D ← [tːʷaː]
$1 wa \u135E ← ($LABIALIZABLE_BEFORE_A) waː; # ቷ\u135E ← [tʷaː]
$1 wa \u135F ← ($LABIALIZABLE_BEFORE_A) ː wa; # አቷ\u135F ← [tːʷa]
$1 \u135F $2 \u135E ← ([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL) ː;
$1 \u135F $2 ← {([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL?)};
$1 \u135E ← ($IPA_VOWEL ː);
$1 \u135D ← (jː $IPA_VOWEL ː);
$1 \u135E ← ([jw] $IPA_VOWEL ː);
$1 \u135F ← (jː $IPA_VOWEL?);
$1 \u135D ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL ː);
$1 \u135E ← ($IPA_CONSONANT [w]? $IPA_VOWEL ː);
$1 \u135F ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL?);
# Insert syllable markers in a separate pass.
::null;
{($IPA_VOWEL ː?)} [[:L:]] → $1 \.;
::(null);
# Reverse: drop stress marks, syllable dots, U+0303 and U+032F, then rewrite
# vowel sequences with the glide that the Amharic spelling uses.
← [ˈˌ\. \u0303\u032F];
aj ← ai; # Nairobi /nairobi/ ናይሮቢ, Cairo /kairo/ ካይሮ
aw ← au; # Bissau /bisːau/ ቢሳው
eji ← ei; # Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
ewo ← eo; # Montevideo /montevideo/ ሞንቴቪዴዎ
ija ← ia; # Monrovia /monrovia/ ሞንሮቪያ
ijə ← iə; # Reunion /rijunijən/ ሪዩኒየን
iw ← iu; # Vilnius /vilnius/ ቪልኒውስ, New Delhi /niu deːli/ ኒው ዴሊ
jo ← io; # Tokyo /tokio/ ቶክዮ
nɡ ← ŋɡ; # Kongo /koŋɡo/ ኮንጎ, Hungary /həŋɡari/ ሀንጋሪ
nɡ ← ŋ; # Bangkok /baŋkok/ ባንግኮክ, Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
uwa ← ua; # Kuala Lumpur /kuala lumpur/ ኩዋላ ሉምፑር, Ruanda /ruanda/ ሩዋንዳ
bwe ← bue; # Buenos Aires /buenos aires/ ብዌኖስ አይሬስ
sʼ ← t\u0361s; # Podgorica /podɡorit\u0361sa/ ፖድጎሪጻ, Vaduz /fadut\u0361s/ ፋዱጽ
uwi ← ui; # Port Luis /port luis/ ፖርት ሉዊስ
uwe ← ue; # Lithuania /lituenia/ ሊቱዌኒያ, Venezuela /venɨzuela/ ቬንዙዌላ
::(null);
# Reverse: a vowel directly after a syllable dot gets a glottal stop onset.
ʔə ← \. ə;
ʔu ← \. u;
ʔi ← \. i;
ʔa ← \. a;
ʔe ← \. e;
ʔɨ ← \. ɨ;
ʔo ← \. o;
$1 w ← {($IPA_VOWEL ː?) \u032F} $IPA_VOWEL; # /ewowa/ ← /e\u032Fo\u032Fa/
::(null);
# Reverse: fold IPA symbols outside the phoneme set of this transform onto
# the phoneme (or phoneme sequence) chosen to represent them.
n ← [n {n\u033C} {n\u033C\u030A} {m\u033A} {n\u030A} {n\u0325} ⁿ ᵑ];
m ← [ɱ {m\u0325} {m\u032A} ᵐ];
ɲ ← [{ɳ\u030A} {ɳ\u0325} ɳ {ɲ\u030A} {ɲ\u0325} ɲ];
ŋ ← [{ŋ\u030A} {ŋ\u0325} ŋ];
ɴ ← [{ɴ\u030A} {ɴ\u0325} ɴ];
p ← [{t\u033C} {p\u033A}];
pʼ ← [ʘ ɋ];
b ← [{d\u033C} {b\u033A} {ɾ\u033C} ɓ];
t ← [{t\u032A} ʈ];
tʼ ← [ǁ ʖ];
d ← [ɖ ɗ ᶑ];
k ← q;
kʼ ← [ǃ ʗ];
ɡ ← [g ɢ ɣ ɠ ʛ];
nɡ ← ᵑɡ;
ʔ ← ʡ;
s ← [θ {θ\u0331} {θ\u031E} {θ\u033C} {ɸ\u033A}];
z ← [ð {ð\u0320} {ð\u033C} {β\u033A}];
sʼ ← [{t\u0361s} {t\u035Cs} ʦ];
t\u0361ʃ ← [{t\u035Cʃ} ʧ {t\u0361ɕ} {t\u035Cɕ} ʨ {ʈ\u0361ʂ} c];
t\u0361ʃʼ ← [ǀ ʇ ǂ ʄ];
d\u0361ʒ ← [ʤ ʣ {d\u0361z} {d\u035Cz} {d\u0361ɕ} ʥ {d\u0361ʑ} {d\u035Cʑ} {ɖ\u0361ʐ} {d\u0361ʐ} ɟ];
pf ← [{p\u032A} {p\u0346} ȹ {p\u0361f} {p\u032Af} {p\u032A\u035Cf}];
bv ← [{b\u032A} {b\u0346} ȸ {b\u0361v} {b\u032A\u0361v}];
ʃ ← [ʂ ɕ];
ʒ ← [ʐ ʑ];
r ← [ɾ ɽ ʁ];
rːʒ ← r\u031Dː;
rʒ ← r\u031D;
v ← β;
x ← [ç x χ];
ʕ ← ʕ\u031D;
h ← ɦ;
j ← [ʝ ʲ];
lj ← ʎ [iɨ]? [jʝʲ]?;
t\u0361ʃl ← [{t\u0361ɬ} {tɬ}];
ʃl ← ɬ;
w ← {u\u032F} $IPA_VOWEL;
w ← ʷ;
ʼː ← ːʼ; # /pʼː/ ← /pːʼ/; /sʼː/ ← /sːʼ/; etc.
::(null);
# Reverse: fold other vowel qualities onto the vowels of this transform and
# move a length mark in front of a palatalization/labialization mark.
i ← y;
ɨ ← [ɪ ʉ];
u ← [ʊ ɯ];
ə ← [ɛ æ ɘ];
o ← [ɔ ø];
a ← ɑ;
ʼ ← ʰ;
← [ʱ];
$1ːʲ ← ([pbtd])ʲː; # [bːʲeː] ← [bʲːeː]
$1ːʷ ← ([pbtd])ʷː; # [bːʷeː] ← [bʷːeː]
::(NFC);
# Reverse: delete the listed combining diacritics, tone letters and
# upstep/downstep/global rise/fall symbols.
← [ \u0303 \u0330 \u030B \u0301 \u0304 \u0300 \u030F \u030C \u0302 ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ];
::(NFD);
