]> git.saurik.com Git - apple/icu.git/blob - icuSources/data/translit/am_am_FONIPA.txt
ICU-66108.tar.gz
[apple/icu.git] / icuSources / data / translit / am_am_FONIPA.txt
1 # © 2016 and later: Unicode, Inc. and others.
2 # License & terms of use: http://www.unicode.org/copyright.html#License
3 #
4 # File: am_am_FONIPA.txt
5 # Generated from CLDR
6 #
7
8 # Transforms Amharic (am) to Amharic in phonemic IPA transcription (am_FONIPA).
9 #
10 # Long vowels, long/geminated consonants:
11 # In the direction from am_FONIPA to am, we emit Ethiopic gemination
12 # and vowel length markers (U+135D, U+135E, U+135F) although
13 # they are rarely written in Amharic text. Exceptions include
14 # school books and textbooks for non-native speakers.
15 # Clients who do not want these markers can easily strip them off
16 # in a post-processing step.
17 #
18 # Labialization:
19 # Amharic speakers will usually say ሟ as [mʷa] instead of [mwa];
20 # labializing [m] instead of saying [m] followed by a separate [w].
21 # Most Amharic consonants can get labialized. To keep the phonemic
22 # transcription simple, we emit /m/ + /w/; otherwise, our phoneme
23 # set would almost double, and it would include very unusual phonemes
24 # such as /ɲʷ/ or /t\u0361ʃʼʷ/.
25 #
26 # References:
27 # [1] The Ge’ez Frontier Foundation: “Principles and Specification
28 # for Mnemonic Ethiopic Keyboards.” Version of January 17, 2009;
29 # retrieved on November 4, 2014.
30 # http://keyboards.ethiopic.org/specification/GFF-MnemonicEthiopicKeyboardSpecification.pdf
31 # Other than most online sources, this report uses correct IPA notation
32 # with the exception of /j/, which it consistently (but wrongly)
33 # writes as */y/.
34 $IPA_VOWEL = [aeəiɨou]; # Vowel phonemes matched by the length-marker and syllable rules.
35 $IPA_CONSONANT = [mnɲɴ p{pʼ}bt{tʼ}dk{kʼ}ɡʔʕ fvs{sʼ}zʃʒxh lr {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}]; # Consonant phonemes; {…} groups multi-character phonemes. /j/ and /w/ are not members: the length rules match them separately via [jw].
36 # Some consonants have a special syllable when labialized, such as ፗ ↔ /pʷa/.
37 # Amharic restricts this mostly to /a/ syllables. While the Ethiopic script
38 # does offer labialized syllables for other vowels, these are typically
39 # not written in Amharic.
40 $LABIALIZABLE_BEFORE_A = [p{pʼ}t{tʼ} {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}{d\u0361ʒʼ} s{sʼ}zʃʒ fv r]; # Consonants used with "wa" in the reverse-direction length rules.
41 ← [ ʼ \u0361 \u035C \u032F]; # Reverse direction only: delete any leftover ejective mark (ʼ), tie bars (U+0361, U+035C) and U+032F.
42 ::(null); # Pass separator that applies to the reverse direction only.
43 # Appendix B of [1] transcribes ሀ as /hə/. However, according to
44 # an Amharic-speaking person, there is no /hə/ sequence
45 # in Amharic; instead, it gets pronounced as /ha/.
46 ሀ → ha;
47 ሀ ← hə;
48 ሁ ↔ hu;
49 ሂ ↔ hi;
50 ሃ ↔ ha;
51 ሄ ↔ he;
52 ህ ↔ hɨ;
53 ሆ ↔ ho;
54 ሇ → ho; # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic.
55 ህ ← h;
56 ለ ↔ lə;
57 ሉ ↔ lu;
58 ሊ ↔ li;
59 ላ ↔ la;
60 ሌ ↔ le;
61 ል ↔ lɨ;
62 ሎ ↔ lo;
63 ⶀ → lo; # Dizi, Me’en, Mursi, Suri /lɔ/ ([1], Appendix E); not used in Amharic.
64 ሏ ↔ lwa;
65 ል ← l;
66 # Appendix B of [1] transcribes ሐ as Voiceless pharyngeal fricative
67 # /ħə/. However, according to an Amharic-speaking person, Amharic
68 # makes no difference in pronunciation between ሐ...ሓ and ሀ...ሃ; both
69 # are pronounced as Voiceless glottal fricative /h/. Also, according
70 # to the speaker there is no /hə/ sequence in Amharic; instead, it
71 # gets pronounced as /ha/.
72 ሐ → ha;
73 ሑ → hu;
74 ሒ → hi;
75 ሓ → ha;
76 ሔ → he;
77 ሕ → hɨ;
78 ሖ → ho;
79 ሗ → hwa;
80 መ ↔ mə;
81 ሙ ↔ mu;
82 ሚ ↔ mi;
83 ማ ↔ ma;
84 ሜ ↔ me;
85 ም ↔ mɨ;
86 ሞ ↔ mo;
87 ⶁ → mo; # Dizi, Me’en, Mursi, Suri /mɔ/ ([1], Appendix E); not used in Amharic.
88 ᎀ → mwə; # Sebatbeit /mwə/ ([1], Appendix H); not used in Amharic.
89 ᎃ → mwu; # Sebatbeit /mwu/ ([1], Appendix H); not used in Amharic.
90 ᎁ → mwi; # Sebatbeit /mwi/ ([1], Appendix H); not used in Amharic.
91 ሟ ↔ mwa;
92 ᎂ → mwe; # Sebatbeit /mwe/ ([1], Appendix H); not used in Amharic.
93 ፙ → mja; # Unclear which language; Appendix L of [1] transcribes ፙ as /mʲa/.
94 ም ← m;
95 ሠ → sə;
96 ሡ → su;
97 ሢ → si;
98 ሣ → sa;
99 ሤ → se;
100 ሥ → sɨ;
101 ሦ → so;
102 ሧ → swa;
103 ረ ↔ rə;
104 ሩ ↔ ru;
105 ሪ ↔ ri;
106 ራ ↔ ra;
107 ሬ ↔ re;
108 ር ↔ rɨ;
109 ሮ ↔ ro;
110 ⶂ → ro; # Dizi, Me’en, Mursi, Suri /rɔ/ ([1], Appendix E); not used in Amharic.
111 ሯ ↔ rwa;
112 ፘ → rja; # Unclear which language; Appendix L of [1] transcribes ፘ as /rʲa/.
113 ር ← r;
114 # Amharic speakers pronounce ⶠ like ሸ. Source: [1], Appendix B.
115 ⶠ → ʃə;
116 ⶡ → ʃu;
117 ⶢ → ʃi;
118 ⶣ → ʃa;
119 ⶤ → ʃe;
120 ⶥ → ʃɨ;
121 ⶦ → ʃo;
122 ሸ ↔ ʃə;
123 ሹ ↔ ʃu;
124 ሺ ↔ ʃi;
125 ሻ ↔ ʃa;
126 ሼ ↔ ʃe;
127 ሽ ↔ ʃɨ;
128 ሾ ↔ ʃo;
129 ⶄ → ʃo; # Dizi, Me’en, Mursi, Suri /ʃɔ/ ([1], Appendix E); not used in Amharic.
130 ሿ ↔ ʃwa;
131 ሽ ← ʃ;
132 ቀ ↔ kʼə;
133 ቁ ↔ kʼu;
134 ቂ ↔ kʼi;
135 ቃ ↔ kʼa;
136 ቄ ↔ kʼe;
137 ቅ ↔ kʼɨ;
138 ቆ ↔ kʼo;
139 ቇ → kʼo; # Dizi, Me’en, Mursi, Suri /kʼɔ/ ([1], Appendix E); not used in Amharic.
140 ቈ ↔ kʼwə;
141 ቍ ↔ kʼwu;
142 ቊ ↔ kʼwi;
143 ቋ ↔ kʼwa;
144 ቌ ↔ kʼwe;
145 ቅ ← kʼ;
146 # In Awngi, Blin, Qimant, and Xamtanga, ቐ is spoken as voiced uvular fricative [ʁ].
147 # Source: [1], Appendix C. However, */ʁ/ is not an Amharic phoneme.
148 # When reading foreign words with ቐ, Amharic speakers pronounce
149 # ቐ like ቀ, i.e. as velar ejective /kʼ/.
150 ቐ → kʼə;
151 ቑ → kʼu;
152 ቒ → kʼi;
153 ቓ → kʼa;
154 ቔ → kʼe;
155 ቕ → kʼɨ;
156 ቖ → kʼo;
157 ቘ → kʼwə;
158 ቝ → kʼwu;
159 ቚ → kʼwi;
160 ቛ → kʼwa;
161 ቜ → kʼwe;
162 # In Sebatbeit, ⷀ is spoken as palatalized velar ejective /kʼʲ/ ([1], Appendix H).
163 # In Amharic, the syllable is not used, but it might appear in names.
164 ⷀ → kʼjə;
165 ⷁ → kʼju;
166 ⷂ → kʼji;
167 ⷃ → kʼja;
168 ⷄ → kʼje;
169 ⷅ → kʼjɨ;
170 ⷆ → kʼjo;
171 በ ↔ bə;
172 ቡ ↔ bu;
173 ቢ ↔ bi;
174 ባ ↔ ba;
175 ቤ ↔ be;
176 ብ ↔ bɨ;
177 ቦ ↔ bo;
178 ⶅ → bo; # Dizi, Me’en, Mursi, Suri /bɔ/ ([1], Appendix E); not used in Amharic.
179 ᎄ → bwə; # Sebatbeit /bʷə/ ([1], Appendix H); not used in Amharic.
180 ᎇ → bwu; # Sebatbeit /bʷu/ ([1], Appendix H); not used in Amharic.
181 ᎅ → bwi; # Sebatbeit /bʷi/ ([1], Appendix H); not used in Amharic.
182 ቧ → bwa; # Sebatbeit /bʷa/ ([1], Appendix H); not used in Amharic.
183 ᎆ → bwe; # Sebatbeit /bʷe/ ([1], Appendix H); not used in Amharic.
184 ብ ← b;
185 ቨ ↔ və;
186 ቩ ↔ vu;
187 ቪ ↔ vi;
188 ቫ ↔ va;
189 ቬ ↔ ve;
190 ቭ ↔ vɨ;
191 ቮ ↔ vo;
192 ቯ ↔ vwa;
193 ቭ ← v;
194 # Unclear which Ethiopic language uses ⶨ. It only appears in the
195 # “Language Neutral” list of Appendix L in [1], which transcribes it as t\u0361ʃ.
196 # For Amharic, we pronounce ⶨ therefore like ቸ.
197 ⶨ → t\u0361ʃə;
198 ⶩ → t\u0361ʃu;
199 ⶪ → t\u0361ʃi;
200 ⶫ → t\u0361ʃa;
201 ⶬ → t\u0361ʃe;
202 ⶭ → t\u0361ʃɨ;
203 ⶮ → t\u0361ʃo;
204 # In Amharic, ኀ is pronounced like ሀ.
205 # Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
206 # Appendix B of [1] transcribes ሀ as /hə/. However, according to
207 # an Amharic-speaking person, there is no /hə/ sequence in Amharic.
208 # Instead, ሀ (and hence also ኀ) gets pronounced as /ha/.
209 ኀ → ha;
210 ኁ → hu;
211 ኂ → hi;
212 ኃ → ha;
213 ኄ → he;
214 ኅ → hɨ;
215 ኆ → ho;
216 ኇ → ho; # Dizi, Me’en, Mursi, Suri /ŋɔ/ ([1], Appendix E); not used in Amharic. NOTE(review): /ŋɔ/ does not match this series' consonant (compare ሇ /hɔ/) — confirm against [1].
217 ኈ → hwə;
218 ኍ → hwu;
219 ኊ → hwi;
220 ኋ → hwa;
221 ኌ → hwe;
222 ነ ↔ nə;
223 ኑ ↔ nu;
224 ኒ ↔ ni;
225 ና ↔ na;
226 ኔ ↔ ne;
227 ን ↔ nɨ;
228 ኖ ↔ no;
229 ⶈ → no; # Dizi, Me’en, Mursi, Suri /nɔ/ ([1], Appendix E); not used in Amharic.
230 ኗ ↔ nwa;
231 ን ← n;
232 ኘ ↔ ɲə;
233 ኙ ↔ ɲu;
234 ኚ ↔ ɲi;
235 ኛ ↔ ɲa;
236 ኜ ↔ ɲe;
237 ኝ ↔ ɲɨ;
238 ኞ ↔ ɲo;
239 ⶉ → ɲo; # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic.
240 ኟ ↔ ɲwa;
241 ኝ ← ɲ;
242 # Amharic speakers pronounce ኸ as [h] because Amharic has no [x] sound.
243 # However, in transliterations of foreign (eg. Spanish) words with [x],
244 # several Amharic speakers have confirmed that they prefer ኻ over ሃ.
245 ዀ → hwə;
246 ዂ → hwi;
247 ዃ → hwa;
248 ዄ → hwe;
249 ዅ → hwɨ;
250 ኸ → hə;
251 ኹ → hu;
252 ኺ → hi;
253 ኻ → ha;
254 ኼ → he;
255 ኽ → hɨ;
256 ኾ → ho;
257 ዀ ← xwə;
258 ዂ ← xwi;
259 ዃ ← xwa;
260 ዄ ← xwe;
261 ዅ ← xwɨ;
262 ዅ ← xw;
263 ኸ ← xə;
264 ኹ ← xu;
265 ኺ ← xi;
266 ኻ ← xa;
267 ኼ ← xe;
268 ኽ ← xɨ;
269 ኾ ← xo;
270 ኽ ← x;
271 አ ↔ ʔə;
272 ኡ ↔ ʔu;
273 ኢ ↔ ʔi;
274 ኣ ↔ ʔa;
275 ኤ ↔ ʔe;
276 እ ↔ ʔɨ;
277 ኦ ↔ ʔo;
278 ⶊ → ʔo; # Dizi, Me’en, Mursi, Suri /ʔɔ/ ([1], Appendix E); not used in Amharic.
279 እ ← ʔ;
280 ከ ↔ kə;
281 ኩ ↔ ku;
282 ኪ ↔ ki;
283 ካ ↔ ka;
284 ኬ ↔ ke;
285 ክ ↔ kɨ;
286 ኮ ↔ ko;
287 ኰ ↔ kwə;
288 ኵ ↔ kwu;
289 ኲ ↔ kwi;
290 ኳ ↔ kwa;
291 ኴ ↔ kwe;
292 ክ ← k;
293 # In Sebatbeit, ⷈ is spoken as palatalized velar plosive /kʲ/ ([1], Appendix H).
294 # Amharic speakers pronounce it as /k/ without palatalization.
295 ⷈ → kə;
296 ⷉ → ku;
297 ⷊ → ki;
298 ⷋ → ka;
299 ⷌ → ke;
300 ⷍ → kɨ;
301 ⷎ → ko;
302 # In Sebatbeit, ⷐ is spoken as palatalized voiceless velar fricative/xʲə/
303 # according to [1], Appendix H. When the syllable appears in names,
304 # Amharic speakers pronounce it as /kə/ without palatalization.
305 ⷐ → kə;
306 ⷑ → ku;
307 ⷒ → ki;
308 ⷓ → ka;
309 ⷔ → ke;
310 ⷕ → kɨ;
311 ⷖ → ko;
312 ወ ↔ wə;
313 ዉ ↔ wu;
314 ዊ ↔ wi;
315 ዋ ↔ wa;
316 ዌ ↔ we;
317 ው ↔ wɨ;
318 ዎ ↔ wo;
319 ዏ → wo; # Dizi, Me’en, Mursi, Suri /wɔ/ ([1], Appendix E); not used in Amharic.
320 ው ← w;
321 ዐ ↔ ʕə;
322 ዑ ↔ ʕu;
323 ዒ ↔ ʕi;
324 ዓ ↔ ʕa;
325 ዔ ↔ ʕe;
326 ዕ ↔ ʕɨ;
327 ዖ ↔ ʕo;
328 ዕ ← ʕ; # A bare consonant maps to the sixth-order (vowelless) syllable, matching e.g. ህ ← h and ል ← l.
329 ዘ ↔ zə;
330 ዙ ↔ zu;
331 ዚ ↔ zi;
332 ዛ ↔ za;
333 ዜ ↔ ze;
334 ዝ ↔ zɨ;
335 ዞ ↔ zo;
336 ⶋ → zo; # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic.
337 ዟ ↔ zwa;
338 ዝ ← z;
339 ዠ ↔ ʒə;
340 ዡ ↔ ʒu;
341 ዢ ↔ ʒi;
342 ዣ ↔ ʒa;
343 ዤ ↔ ʒe;
344 ዥ ↔ ʒɨ;
345 ዦ ↔ ʒo;
346 ዧ ↔ ʒwa;
347 ዥ ← ʒ; # A bare consonant maps to the sixth-order (vowelless) syllable, matching e.g. ህ ← h and ል ← l.
348 # Unclear which Ethiopic language uses ⶰ. It only appears in the
349 # “Language Neutral” list of Appendix L in [1], which transcribes it as ʒ.
350 # For Amharic, we pronounce ⶰ therefore like ዠ.
351 ⶰ → ʒə;
352 ⶱ → ʒu;
353 ⶲ → ʒi;
354 ⶳ → ʒa;
355 ⶴ → ʒe;
356 ⶵ → ʒɨ;
357 ⶶ → ʒo;
358 የ ↔ jə;
359 ዩ ↔ ju;
360 ዪ ↔ ji;
361 ያ ↔ ja;
362 ዬ ↔ je;
363 ይ ↔ jɨ;
364 ዮ ↔ jo;
365 ዯ → jo; # Dizi, Me’en, Mursi, Suri /jɔ/ ([1], Appendix E); not used in Amharic.
366 ይ ← j;
367 ጀ ↔ d\u0361ʒə;
368 ጁ ↔ d\u0361ʒu;
369 ጂ ↔ d\u0361ʒi;
370 ጃ ↔ d\u0361ʒa;
371 ጄ ↔ d\u0361ʒe;
372 ጅ ↔ d\u0361ʒɨ;
373 ጆ ↔ d\u0361ʒo;
374 ጇ ↔ d\u0361ʒwa;
375 ጅ ← d\u0361ʒ;
376 ደ ↔ də;
377 ዱ ↔ du;
378 ዲ ↔ di;
379 ዳ ↔ da;
380 ዴ ↔ de;
381 ድ ↔ dɨ;
382 ዶ ↔ do;
383 ⶌ → do; # Dizi, Me’en, Mursi, Suri /dɔ/ ([1], Appendix E); not used in Amharic.
384 ዷ ↔ dwa;
385 ድ ← d;
386 ገ ↔ ɡə;
387 ጉ ↔ ɡu;
388 ጊ ↔ ɡi;
389 ጋ ↔ ɡa;
390 ጌ ↔ ɡe;
391 ግ ↔ ɡɨ;
392 ጎ ↔ ɡo;
393 ጐ ↔ ɡwə;
394 ጕ ↔ ɡwu;
395 ጒ ↔ ɡwi;
396 ጓ ↔ ɡwa;
397 ጔ ↔ ɡwe;
398 ግ ← ɡ;
399 # In Awngi, Blin, Qimant, and Xamtanga, ጘ is spoken as voiced velar nasal [ŋ].
400 # Source: [1], Appendix C. While /ŋ/ is not an Amharic phoneme, Amharic speakers
401 # still can pronounce it according to our source. However, when transliterating
402 # foreign words with [ŋ], Amharic uses the sequence ንግ /nɡ/. For example,
403 # the Amharic transliteration of Washington /waʃiŋtən/ is ዋሺንግተን.
404 ጘ → ŋə;
405 ጙ → ŋu;
406 ጚ → ŋi;
407 ጛ → ŋa;
408 ጜ → ŋe;
409 ጝ → ŋɨ;
410 ጞ → ŋo;
411 ⶓ → ŋwə;
412 ⶖ → ŋwu;
413 ⶔ → ŋwi;
414 ጟ → ŋwa;
415 ⶕ → ŋwe;
416 # Since there is no uvular nasal [ɴ] in Amharic, we use the velar nasal [ŋ].
417 ጘ ← ɴə;
418 ጙ ← ɴu;
419 ጚ ← ɴi;
420 ጛ ← ɴa;
421 ጜ ← ɴe;
422 ጝ ← ɴɨ;
423 ጞ ← ɴo;
424 ጝ ← ɴ;
425 # In Sebatbeit, ⷘ is spoken as palatalized voiced velar stop /ɡj/ ([1], Appendix H).
426 # Amharic speakers pronounce it as voiced velar stop /ɡ/ without palatalization.
427 ⷘ → ɡə;
428 ⷙ → ɡu;
429 ⷚ → ɡi;
430 ⷛ → ɡa;
431 ⷜ → ɡe;
432 ⷝ → ɡɨ;
433 ⷞ → ɡo;
434 ጠ ↔ tʼə;
435 ጡ ↔ tʼu;
436 ጢ ↔ tʼi;
437 ጣ ↔ tʼa;
438 ጤ ↔ tʼe;
439 ጥ ↔ tʼɨ;
440 ጦ ↔ tʼo;
441 ጧ ↔ tʼwa;
442 ጥ ← tʼ; # A bare consonant maps to the sixth-order (vowelless) syllable, matching e.g. ጽ ← sʼ and ጵ ← pʼ.
443 ጨ ↔ t\u0361ʃʼə;
444 ጩ ↔ t\u0361ʃʼu;
445 ጪ ↔ t\u0361ʃʼi;
446 ጫ ↔ t\u0361ʃʼa;
447 ጬ ↔ t\u0361ʃʼe;
448 ጭ ↔ t\u0361ʃʼɨ;
449 ጮ ↔ t\u0361ʃʼo;
450 ⶐ → t\u0361ʃʼo; # Dizi, Me’en, Mursi, Suri /t\u0361ʃʼɔ/ ([1], Appendix E); not used in Amharic.
451 ጯ ↔ t\u0361ʃʼwa;
452 ጭ ← t\u0361ʃʼ; # A bare consonant maps to the sixth-order (vowelless) syllable, matching e.g. ች ← t\u0361ʃ and ጽ ← sʼ.
453 # According to Appendix B of [1], the following are used in the Bench language
454 # (aka Benchnon, Gimira). In Bench, ⶻ is pronounced as /ʈ\u0361ʂʼ/ Retroflex
455 # ejective affricate; with a phonemic distrinction to the non-retroflex version.
456 # Amharic does not have retroflex phonemes, so we go with /t\u0361ʃʼ/.
457 ⶸ → t\u0361ʃʼə;
458 ⶹ → t\u0361ʃʼu;
459 ⶺ → t\u0361ʃʼi;
460 ⶻ → t\u0361ʃʼa;
461 ⶼ → t\u0361ʃʼe;
462 ⶽ → t\u0361ʃʼɨ;
463 ⶾ → t\u0361ʃʼo;
464 ቸ ↔ t\u0361ʃə;
465 ቹ ↔ t\u0361ʃu;
466 ቺ ↔ t\u0361ʃi;
467 ቻ ↔ t\u0361ʃa;
468 ቼ ↔ t\u0361ʃe;
469 ች ↔ t\u0361ʃɨ;
470 ቾ ↔ t\u0361ʃo;
471 ቿ ↔ t\u0361ʃwa;
472 ች ← t\u0361ʃ;
473 ተ ↔ tə;
474 ቱ ↔ tu;
475 ቲ ↔ ti;
476 ታ ↔ ta;
477 ቴ ↔ te;
478 ት ↔ tɨ;
479 ቶ ↔ to;
480 ⶆ → to; # Dizi, Me’en, Mursi, Suri /tɔ/ ([1], Appendix E); not used in Amharic.
481 ቷ ↔ twa;
482 ት ← t;
483 ጰ ↔ pʼə;
484 ጱ ↔ pʼu;
485 ጲ ↔ pʼi;
486 ጳ ↔ pʼa;
487 ጴ ↔ pʼe;
488 ጵ ↔ pʼɨ;
489 ጶ ↔ pʼo;
490 ⶑ → pʼo; # Dizi, Me’en, Mursi, Suri /pʼɔ/ ([1], Appendix E); not used in Amharic.
491 ጷ ↔ pʼwa;
492 ጵ ← pʼ;
493 ጸ ↔ sʼə;
494 ጹ ↔ sʼu;
495 ጺ ↔ sʼi;
496 ጻ ↔ sʼa;
497 ጼ ↔ sʼe;
498 ጽ ↔ sʼɨ;
499 ጾ ↔ sʼo;
500 ጿ ↔ sʼwa;
501 ጽ ← sʼ;
502 # In Amharic, ፀ is pronounced like ጸ.
503 # Source: [1], section on “Phonological Redundancy” for Amharic, page 5.
504 ፀ → sʼə;
505 ፁ → sʼu;
506 ፂ → sʼi;
507 ፃ → sʼa;
508 ፄ → sʼe;
509 ፅ → sʼɨ;
510 ፆ → sʼo;
511 ፇ → sʼo; # Dizi, Me’en, Mursi, Suri /sʼɔ/ ([1], Appendix E); not used in Amharic.
512 # Amharic speakers pronounce ሰ like ሠ. Source: [1], Appendix B.
513 ሰ ↔ sə;
514 ሱ ↔ su;
515 ሲ ↔ si;
516 ሳ ↔ sa;
517 ሴ ↔ se;
518 ስ ↔ sɨ;
519 ሶ ↔ so;
520 ⶃ → so; # Dizi, Me’en, Mursi, Suri /sɔ/ ([1], Appendix E); not used in Amharic.
521 ሷ ↔ swa;
522 ስ ← s;
523 ፈ ↔ fə;
524 ፉ ↔ fu;
525 ፊ ↔ fi;
526 ፋ ↔ fa;
527 ፌ ↔ fe;
528 ፍ ↔ fɨ;
529 ፎ ↔ fo;
530 ᎈ → fwə; # Sebatbeit /fwə/ ([1], Appendix H); not used in Amharic.
531 ᎋ → fwu; # Sebatbeit /fwu/ ([1], Appendix H); not used in Amharic. Same position in its Sebatbeit group as ᎃ → mwu and ᎇ → bwu.
532 ᎉ → fwi; # Sebatbeit /fwi/ ([1], Appendix H); not used in Amharic. Same position in its Sebatbeit group as ᎁ → mwi and ᎅ → bwi.
533 ፏ ↔ fwa;
534 ᎊ → fwe; # Sebatbeit /fwe/ ([1], Appendix H); not used in Amharic.
535 ፚ → fja; # Unclear which language; Appendix L of [1] transcribes ፚ as /fja/.
536 ፍ ← f;
537 ፐ ↔ pə;
538 ፑ ↔ pu;
539 ፒ ↔ pi;
540 ፓ ↔ pa;
541 ፔ ↔ pe;
542 ፕ ↔ pɨ;
543 ፖ ↔ po;
544 ⶒ → po; # Dizi, Me’en, Mursi, Suri /pɔ/ ([1], Appendix E); not used in Amharic.
545 ᎌ → pwə; # Sebatbeit /pwə/ ([1], Appendix H); not used in Amharic.
546 ᎏ → pwu; # Sebatbeit /pwu/ ([1], Appendix H); not used in Amharic. Same position in its Sebatbeit group as ᎃ → mwu and ᎇ → bwu.
547 ᎍ → pwi; # Sebatbeit /pwi/ ([1], Appendix H); not used in Amharic. Same position in its Sebatbeit group as ᎁ → mwi and ᎅ → bwi.
548 ፗ ↔ pwa;
549 ᎎ → pwe; # Sebatbeit /pwe/ ([1], Appendix H); not used in Amharic.
550 ፕ ← p;
551 ኧ ↔ ə;
552 ኡ ← u; # ኡላዓን ባዓታር ← Ulaan Baatar /ulaʕan baʕatar/
553 አ ← a; # አምስተርዳም ← Amsterdam /amstərdam/
554 ኤ ← e;
555 እ ← ɨ;
556 ኦ ← o; # ፖርት ኦፍ ስፔን ← Port of Spain /port of speːn/
557 ኢ ← i; # ኢስላማባድ ← Islamabad /islamabad/
558 # Applications will typically split words before calling our rules.
559 # To be resilient, we replace punctuation by whitespace in IPA.
560 ፠ → ' '; # U+1360 ETHIOPIC SECTION MARK
561 ፡ → ' '; # U+1361 ETHIOPIC WORDSPACE
562 ። → ' '; # U+1362 ETHIOPIC FULL STOP
563 ፣ → ' '; # U+1363 ETHIOPIC COMMA
564 ፤ → ' '; # U+1364 ETHIOPIC SEMICOLON
565 ፥ → ' '; # U+1365 ETHIOPIC COLON
566 ፦ → ' '; # U+1366 ETHIOPIC PREFACE COLON
567 ፧ → ' '; # U+1367 ETHIOPIC QUESTION MARK
568 ፨ → ' '; # U+1368 ETHIOPIC PARAGRAPH SEPARATOR
569 # Likewise, Ethiopic numberals cannot be pronounced by these rules,
570 # so we replace them by whitespace in the output IPA notation.
571 # Applications will typically pre-process text before calling
572 # the am → am_FONIPA transform.
573 ፩ → ' '; # U+1369 ETHIOPIC DIGIT ONE
574 ፪ → ' '; # U+136A ETHIOPIC DIGIT TWO
575 ፫ → ' '; # U+136B ETHIOPIC DIGIT THREE
576 ፬ → ' '; # U+136C ETHIOPIC DIGIT FOUR
577 ፭ → ' '; # U+136D ETHIOPIC DIGIT FIVE
578 ፮ → ' '; # U+136E ETHIOPIC DIGIT SIX
579 ፯ → ' '; # U+136F ETHIOPIC DIGIT SEVEN
580 ፰ → ' '; # U+1370 ETHIOPIC DIGIT EIGHT
581 ፱ → ' '; # U+1371 ETHIOPIC DIGIT NINE
582 ፲ → ' '; # U+1372 ETHIOPIC NUMBER TEN
583 ፳ → ' '; # U+1373 ETHIOPIC NUMBER TWENTY
584 ፴ → ' '; # U+1374 ETHIOPIC NUMBER THIRTY
585 ፵ → ' '; # U+1375 ETHIOPIC NUMBER FORTY
586 ፶ → ' '; # U+1376 ETHIOPIC NUMBER FIFTY
587 ፷ → ' '; # U+1377 ETHIOPIC NUMBER SIXTY
588 ፸ → ' '; # U+1378 ETHIOPIC NUMBER SEVENTY
589 ፹ → ' '; # U+1379 ETHIOPIC NUMBER EIGHTY
590 ፺ → ' '; # U+137A ETHIOPIC NUMBER NINETY
591 ፻ → ' '; # U+137B ETHIOPIC NUMBER HUNDRED
592 ፼ → ' '; # U+137C ETHIOPIC NUMBER TEN THOUSAND
593 # Transform IPA length markers to one of these:
594 # U+135D ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK
595 # U+135E ETHIOPIC COMBINING VOWEL LENGTH MARK
596 # U+135F ETHIOPIC COMBINING GEMINATION MARK
597 ::null();
598 ← ː ; # Strip off any remaining IPA length markers.
599 ::(null);
600 ($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135D → $1 ː $2 ː; # Forward: U+135D lengthens both the consonant and the vowel.
601 ($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135E → $1 $2 ː; # Forward: U+135E lengthens the vowel only.
602 ($IPA_CONSONANT) ([jw]? $IPA_VOWEL?) \u135F → $1 ː $2; # Forward: U+135F lengthens the consonant only; the vowel is optional.
603 [\u135D \u135E \u135F] → ; # Strip off any remaining length markers.
604 $1 wa \u135D ← ($LABIALIZABLE_BEFORE_A) ː waː; # ቷ\u135D ← [tːʷaː]
605 $1 wa \u135E ← ($LABIALIZABLE_BEFORE_A) waː; # ቷ\u135E ← [tʷaː]
606 $1 wa \u135F ← ($LABIALIZABLE_BEFORE_A) ː wa; # አቷ\u135F ← [tːʷa]
607 $1 \u135F $2 \u135E ← ([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL) ː;
608 $1 \u135F $2 ← {([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL?)};
609 $1 \u135E ← ($IPA_VOWEL ː);
610 $1 \u135D ← (jː $IPA_VOWEL ː);
611 $1 \u135E ← ([jw] $IPA_VOWEL ː);
612 $1 \u135F ← (jː $IPA_VOWEL?);
613 $1 \u135D ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL ː);
614 $1 \u135E ← ($IPA_CONSONANT [w]? $IPA_VOWEL ː);
615 $1 \u135F ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL?);
616 # Insert syllable markers in a separate pass.
617 ::null;
618 {($IPA_VOWEL ː?)} [[:L:]] → $1 \.;
619 ::(null);
620 ← [ˈˌ\. \u0303\u032F];
621 aj ← ai; # Nairobi /nairobi/ ናይሮቢ, Cairo /kairo/ ካይሮ
622 aw ← au; # Bissau /bisːau/ ቢሳው
623 eji ← ei; # Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
624 ewo ← eo; # Montevideo /montevideo/ ሞንቴቪዴዎ
625 ija ← ia; # Monrovia /monrovia/ ሞንሮቪያ
626 ijə ← iə; # Reunion /rijunijən/ ሪዩኒየን
627 iw ← iu; # Vilnius /vilnius/ ቪልኒውስ, New Delhi /niu deːli/ ኒው ዴሊ
628 jo ← io; # Tokyo /tokio/ ቶክዮ
629 nɡ ← ŋɡ; # Kongo /koŋɡo/ ኮንጎ, Hungary /həŋɡari/ ሀንጋሪ
630 nɡ ← ŋ; # Bangkok /baŋkok/ ባንግኮክ, Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ
631 uwa ← ua; # Kuala Lumpur /kuala lumpur/ ኩዋላ ሉምፑር, Ruanda /ruanda/ ሩዋንዳ
632 bwe ← bue; # Buenos Aires /buenos aires/ ብዌኖስ አይሬስ
633 sʼ ← t\u0361s; # Podgorica /podɡorit\u0361sa/ ፖድጎሪጻ, Vaduz /fadut\u0361s/ ፋዱጽ
634 uwi ← ui; # Port Luis /port luis/ ፖርት ሉዊስ
635 uwe ← ue; # Lithuania /lituenia/ ሊቱዌኒያ, Venezuela /venɨzuela/ ቬንዙዌላ
636 ::(null);
637 ʔə ← \. ə;
638 ʔu ← \. u;
639 ʔi ← \. i;
640 ʔa ← \. a;
641 ʔe ← \. e;
642 ʔɨ ← \. ɨ;
643 ʔo ← \. o;
644 $1 w ← {($IPA_VOWEL ː?) \u032F} $IPA_VOWEL; # /ewowa/ ← /e\u032Fo\u032Fa/
645 ::(null);
646 n ← [n {n\u033C} {n\u033C\u030A} {m\u033A} {n\u030A} {n\u0325} ⁿ ᵑ];
647 m ← [ɱ {m\u0325} {m\u032A} ᵐ];
648 ɲ ← [{ɳ\u030A} {ɳ\u0325} ɳ {ɲ\u030A} {ɲ\u0325} ɲ];
649 ŋ ← [{ŋ\u030A} {ŋ\u0325} ŋ];
650 ɴ ← [{ɴ\u030A} {ɴ\u0325} ɴ];
651 p ← [{t\u033C} {p\u033A}];
652 pʼ ← [ʘ ɋ];
653 b ← [{d\u033C} {b\u033A} {ɾ\u033C} ɓ];
654 t ← [{t\u032A} ʈ];
655 tʼ ← [ǁ ʖ];
656 d ← [ɖ ɗ ᶑ];
657 k ← q;
658 kʼ ← [ǃ ʗ];
659 ɡ ← [g ɢ ɣ ɠ ʛ];
660 nɡ ← ᵑɡ;
661 ʔ ← ʡ;
662 s ← [θ {θ\u0331} {θ\u031E} {θ\u033C} {ɸ\u033A}];
663 z ← [ð {ð\u0320} {ð\u033C} {β\u033A}];
664 sʼ ← [{t\u0361s} {t\u035Cs} ʦ];
665 t\u0361ʃ ← [{t\u035Cʃ} ʧ {t\u0361ɕ} {t\u035Cɕ} ʨ {ʈ\u0361ʂ} c];
666 t\u0361ʃʼ ← [ǀ ʇ ǂ ʄ];
667 d\u0361ʒ ← [ʤ ʣ {d\u0361z} {d\u035Cz} {d\u0361ɕ} ʥ {d\u0361ʑ} {d\u035Cʑ} {ɖ\u0361ʐ} {d\u0361ʐ} ɟ];
668 pf ← [{p\u032A} {p\u0346} ȹ {p\u0361f} {p\u032Af} {p\u032A\u035Cf}];
669 bv ← [{b\u032A} {b\u0346} ȸ {b\u0361v} {b\u032A\u0361v}];
670 ʃ ← [ʂ ɕ];
671 ʒ ← [ʐ ʑ];
672 r ← [ɾ ɽ ʁ];
673 rːʒ ← r\u031Dː;
674 rʒ ← r\u031D;
675 v ← β;
676 x ← [ç x χ];
677 ʕ ← ʕ\u031D;
678 h ← ɦ;
679 j ← [ʝ ʲ];
680 lj ← ʎ [iɨ]? [jʝʲ]?;
681 t\u0361ʃl ← [{t\u0361ɬ} {tɬ}];
682 ʃl ← ɬ;
683 w ← {u\u032F} $IPA_VOWEL;
684 w ← ʷ;
685 ʼː ← ːʼ; # /pʼː/ ← /pːʼ/; /sʼː/ ← /sːʼ/; etc.
686 ::(null);
687 i ← y;
688 ɨ ← [ɪ ʉ];
689 u ← [ʊ ɯ];
690 ə ← [ɛ æ ɘ];
691 o ← [ɔ ø];
692 a ← ɑ;
693 ʼ ← ʰ;
694 ← [ʱ];
695 $1ːʲ ← ([pbtd])ʲː; # [bːʲeː] ← [bʲːeː]
696 $1ːʷ ← ([pbtd])ʷː; # [bːʷeː] ← [bʷːeː]
697 ::(NFC);
698 ← [ \u0303 \u0330 \u030B \u0301 \u0304 \u0300 \u030F \u030C \u0302 ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ];
699 ::(NFD);
700