]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | # © 2016 and later: Unicode, Inc. and others. |
2 | # License & terms of use: http://www.unicode.org/copyright.html#License | |
3 | # | |
2ca993e8 | 4 | # File: am_am_FONIPA.txt |
f3c0d7a5 | 5 | # Generated from CLDR |
2ca993e8 A |
6 | # |
7 | ||
8 | # Transforms Amharic (am) to Amharic in phonemic IPA transcription (am_FONIPA). | |
9 | # | |
10 | # Long vowels, long/geminated consonants: | |
11 | # In the direction from am_FONIPA to am, we emit Ethiopic gemination | |
12 | # and vowel length markers (U+135D, U+135E, U+135F) although | |
13 | # they are rarely written in Amharic text. Exceptions include | |
14 | # school books and textbooks for non-native speakers. | |
15 | # Clients who do not want these markers can easily strip them off | |
16 | # in a post-processing step. | |
17 | # | |
18 | # Labialization: | |
19 | # Amharic speakers will usually say ሟ as [mʷa] instead of [mwa]; | |
20 | # labializing [m] instead of saying [m] followed by a separate [w]. | |
21 | # Most Amharic consonants can get labialized. To keep the phonemic | |
22 | # transcription simple, we emit /m/ + /w/; otherwise, our phoneme | |
23 | # set would almost double, and it would include very unusual phonemes | |
24 | # such as /ɲʷ/ or /t\u0361ʃʼʷ/. | |
25 | # | |
26 | # References: | |
27 | # [1] The Ge’ez Frontier Foundation: “Principles and Specification | |
28 | # for Mnemonic Ethiopic Keyboards.” Version of January 17, 2009; | |
29 | # retrieved on November 4, 2014. | |
30 | # http://keyboards.ethiopic.org/specification/GFF-MnemonicEthiopicKeyboardSpecification.pdf | |
31 | # Unlike most online sources, this report uses correct IPA notation | |
32 | # with the exception of /j/, which it consistently (but wrongly) | |
33 | # writes as */y/. | |
34 | $IPA_VOWEL = [aeəiɨou]; | |
35 | $IPA_CONSONANT = [mnɲɴ p{pʼ}bt{tʼ}dk{kʼ}ɡʔʕ fvs{sʼ}zʃʒxh lr {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}]; | |
36 | # Some consonants have a special syllable when labialized, such as ፗ ↔ /pʷa/. | |
37 | # Amharic restricts this mostly to /a/ syllables. While the Ethiopic script | |
38 | # does offer labialized syllables for other vowels, these are typically | |
39 | # not written in Amharic. | |
40 | $LABIALIZABLE_BEFORE_A = [p{pʼ}t{tʼ} {t\u0361ʃ}{t\u0361ʃʼ}{d\u0361ʒ}{d\u0361ʒʼ} s{sʼ}zʃʒ fv r]; | |
41 | ← [ ʼ \u0361 \u035C \u032F]; | |
42 | ::(null); | |
43 | # Appendix B of [1] transcribes ሀ as /hə/. However, according to | |
44 | # an Amharic-speaking person, there is no /hə/ sequence | |
45 | # in Amharic; instead, it gets pronounced as /ha/. | |
46 | ሀ → ha; | |
47 | ሀ ← hə; | |
48 | ሁ ↔ hu; | |
49 | ሂ ↔ hi; | |
50 | ሃ ↔ ha; | |
51 | ሄ ↔ he; | |
52 | ህ ↔ hɨ; | |
53 | ሆ ↔ ho; | |
54 | ሇ → ho; # Dizi, Me’en, Mursi, Suri /hɔ/ ([1], Appendix E); not used in Amharic. | |
55 | ህ ← h; | |
56 | ለ ↔ lə; | |
57 | ሉ ↔ lu; | |
58 | ሊ ↔ li; | |
59 | ላ ↔ la; | |
60 | ሌ ↔ le; | |
61 | ል ↔ lɨ; | |
62 | ሎ ↔ lo; | |
63 | ⶀ → lo; # Dizi, Me’en, Mursi, Suri /lɔ/ ([1], Appendix E); not used in Amharic. | |
64 | ሏ ↔ lwa; | |
65 | ል ← l; | |
66 | # Appendix B of [1] transcribes ሐ as Voiceless pharyngeal fricative | |
67 | # /ħə/. However, according to an Amharic-speaking person, Amharic | |
68 | # makes no difference in pronunciation between ሐ...ሓ and ሀ...ሃ; both | |
69 | # are pronounced as Voiceless glottal fricative /h/. Also, according | |
70 | # to the speaker there is no /hə/ sequence in Amharic; instead, it | |
71 | # gets pronounced as /ha/. | |
72 | ሐ → ha; | |
73 | ሑ → hu; | |
74 | ሒ → hi; | |
75 | ሓ → ha; | |
76 | ሔ → he; | |
77 | ሕ → hɨ; | |
78 | ሖ → ho; | |
79 | ሗ → hwa; | |
80 | መ ↔ mə; | |
81 | ሙ ↔ mu; | |
82 | ሚ ↔ mi; | |
83 | ማ ↔ ma; | |
84 | ሜ ↔ me; | |
85 | ም ↔ mɨ; | |
86 | ሞ ↔ mo; | |
87 | ⶁ → mo; # Dizi, Me’en, Mursi, Suri /mɔ/ ([1], Appendix E); not used in Amharic. | |
88 | ᎀ → mwə; # Sebatbeit /mwə/ ([1], Appendix H); not used in Amharic. | |
89 | ᎃ → mwu; # Sebatbeit /mwu/ ([1], Appendix H); not used in Amharic. | |
90 | ᎁ → mwi; # Sebatbeit /mwi/ ([1], Appendix H); not used in Amharic. | |
91 | ሟ ↔ mwa; | |
92 | ᎂ → mwe; # Sebatbeit /mwe/ ([1], Appendix H); not used in Amharic. | |
93 | ፙ → mja; # Unclear which language; Appendix L of [1] transcribes ፙ as /mʲa/. | |
94 | ም ← m; | |
95 | ሠ → sə; | |
96 | ሡ → su; | |
97 | ሢ → si; | |
98 | ሣ → sa; | |
99 | ሤ → se; | |
100 | ሥ → sɨ; | |
101 | ሦ → so; | |
102 | ሧ → swa; | |
103 | ረ ↔ rə; | |
104 | ሩ ↔ ru; | |
105 | ሪ ↔ ri; | |
106 | ራ ↔ ra; | |
107 | ሬ ↔ re; | |
108 | ር ↔ rɨ; | |
109 | ሮ ↔ ro; | |
110 | ⶂ → ro; # Dizi, Me’en, Mursi, Suri /rɔ/ ([1], Appendix E); not used in Amharic. | |
111 | ሯ ↔ rwa; | |
112 | ፘ → rja; # Unclear which language; Appendix L of [1] transcribes ፘ as /rʲa/. | |
113 | ር ← r; | |
114 | # Amharic speakers pronounce ⶠ like ሸ. Source: [1], Appendix B. | |
115 | ⶠ → ʃə; | |
116 | ⶡ → ʃu; | |
117 | ⶢ → ʃi; | |
118 | ⶣ → ʃa; | |
119 | ⶤ → ʃe; | |
120 | ⶥ → ʃɨ; | |
121 | ⶦ → ʃo; | |
122 | ሸ ↔ ʃə; | |
123 | ሹ ↔ ʃu; | |
124 | ሺ ↔ ʃi; | |
125 | ሻ ↔ ʃa; | |
126 | ሼ ↔ ʃe; | |
127 | ሽ ↔ ʃɨ; | |
128 | ሾ ↔ ʃo; | |
129 | ⶄ → ʃo; # Dizi, Me’en, Mursi, Suri /ʃɔ/ ([1], Appendix E); not used in Amharic. | |
130 | ሿ ↔ ʃwa; | |
131 | ሽ ← ʃ; | |
132 | ቀ ↔ kʼə; | |
133 | ቁ ↔ kʼu; | |
134 | ቂ ↔ kʼi; | |
135 | ቃ ↔ kʼa; | |
136 | ቄ ↔ kʼe; | |
137 | ቅ ↔ kʼɨ; | |
138 | ቆ ↔ kʼo; | |
139 | ቇ → kʼo; # Dizi, Me’en, Mursi, Suri /kʼɔ/ ([1], Appendix E); not used in Amharic. | |
140 | ቈ ↔ kʼwə; | |
141 | ቍ ↔ kʼwu; | |
142 | ቊ ↔ kʼwi; | |
143 | ቋ ↔ kʼwa; | |
144 | ቌ ↔ kʼwe; | |
145 | ቅ ← kʼ; | |
146 | # In Awngi, Blin, Qimant, and Xamtanga, ቐ is spoken as voiced uvular fricative [ʁ]. | |
147 | # Source: [1], Appendix C. However, */ʁ/ is not an Amharic phoneme. | |
148 | # When reading foreign words with ቐ, Amharic speakers pronounce | |
149 | # ቐ like ቀ, i.e. as velar ejective /kʼ/. | |
150 | ቐ → kʼə; | |
151 | ቑ → kʼu; | |
152 | ቒ → kʼi; | |
153 | ቓ → kʼa; | |
154 | ቔ → kʼe; | |
155 | ቕ → kʼɨ; | |
156 | ቖ → kʼo; | |
157 | ቘ → kʼwə; | |
158 | ቝ → kʼwu; | |
159 | ቚ → kʼwi; | |
160 | ቛ → kʼwa; | |
161 | ቜ → kʼwe; | |
162 | # In Sebatbeit, ⷀ is spoken as palatalized velar ejective /kʼʲ/ ([1], Appendix H). | |
163 | # In Amharic, the syllable is not used, but it might appear in names. | |
164 | ⷀ → kʼjə; | |
165 | ⷁ → kʼju; | |
166 | ⷂ → kʼji; | |
167 | ⷃ → kʼja; | |
168 | ⷄ → kʼje; | |
169 | ⷅ → kʼjɨ; | |
170 | ⷆ → kʼjo; | |
171 | በ ↔ bə; | |
172 | ቡ ↔ bu; | |
173 | ቢ ↔ bi; | |
174 | ባ ↔ ba; | |
175 | ቤ ↔ be; | |
176 | ብ ↔ bɨ; | |
177 | ቦ ↔ bo; | |
178 | ⶅ → bo; # Dizi, Me’en, Mursi, Suri /bɔ/ ([1], Appendix E); not used in Amharic. | |
179 | ᎄ → bwə; # Sebatbeit /bʷə/ ([1], Appendix H); not used in Amharic. | |
180 | ᎇ → bwu; # Sebatbeit /bʷu/ ([1], Appendix H); not used in Amharic. | |
181 | ᎅ → bwi; # Sebatbeit /bʷi/ ([1], Appendix H); not used in Amharic. | |
182 | ቧ → bwa; # Sebatbeit /bʷa/ ([1], Appendix H); not used in Amharic. | |
183 | ᎆ → bwe; # Sebatbeit /bʷe/ ([1], Appendix H); not used in Amharic. | |
184 | ብ ← b; | |
185 | ቨ ↔ və; | |
186 | ቩ ↔ vu; | |
187 | ቪ ↔ vi; | |
188 | ቫ ↔ va; | |
189 | ቬ ↔ ve; | |
190 | ቭ ↔ vɨ; | |
191 | ቮ ↔ vo; | |
192 | ቯ ↔ vwa; | |
193 | ቭ ← v; | |
194 | # Unclear which Ethiopic language uses ⶨ. It only appears in the | |
195 | # “Language Neutral” list of Appendix L in [1], which transcribes it as t\u0361ʃ. | |
196 | # For Amharic, we pronounce ⶨ therefore like ቸ. | |
197 | ⶨ → t\u0361ʃə; | |
198 | ⶩ → t\u0361ʃu; | |
199 | ⶪ → t\u0361ʃi; | |
200 | ⶫ → t\u0361ʃa; | |
201 | ⶬ → t\u0361ʃe; | |
202 | ⶭ → t\u0361ʃɨ; | |
203 | ⶮ → t\u0361ʃo; | |
204 | # In Amharic, ኀ is pronounced like ሀ. | |
205 | # Source: [1], section on “Phonological Redundancy” for Amharic, page 5. | |
206 | # Appendix B of [1] transcribes ሀ as /hə/. However, according to | |
207 | # an Amharic-speaking person, there is no /hə/ sequence in Amharic. | |
208 | # Instead, ሀ (and hence also ኀ) gets pronounced as /ha/. | |
209 | ኀ → ha; | |
210 | ኁ → hu; | |
211 | ኂ → hi; | |
212 | ኃ → ha; | |
213 | ኄ → he; | |
214 | ኅ → hɨ; | |
215 | ኆ → ho; | |
216 | ኇ → ho; # Dizi, Me’en, Mursi, Suri /ŋɔ/ ([1], Appendix E); not used in Amharic. | |
217 | ኈ → hwə; | |
218 | ኍ → hwu; | |
219 | ኊ → hwi; | |
220 | ኋ → hwa; | |
221 | ኌ → hwe; | |
222 | ነ ↔ nə; | |
223 | ኑ ↔ nu; | |
224 | ኒ ↔ ni; | |
225 | ና ↔ na; | |
226 | ኔ ↔ ne; | |
227 | ን ↔ nɨ; | |
228 | ኖ ↔ no; | |
229 | ⶈ → no; # Dizi, Me’en, Mursi, Suri /nɔ/ ([1], Appendix E); not used in Amharic. | |
230 | ኗ ↔ nwa; | |
231 | ን ← n; | |
232 | ኘ ↔ ɲə; | |
233 | ኙ ↔ ɲu; | |
234 | ኚ ↔ ɲi; | |
235 | ኛ ↔ ɲa; | |
236 | ኜ ↔ ɲe; | |
237 | ኝ ↔ ɲɨ; | |
238 | ኞ ↔ ɲo; | |
239 | ⶉ → ɲo; # Dizi, Me’en, Mursi, Suri /ɲɔ/ ([1], Appendix E); not used in Amharic. | |
240 | ኟ ↔ ɲwa; | |
241 | ኝ ← ɲ; | |
242 | # Amharic speakers pronounce ኸ as [h] because Amharic has no [x] sound. | |
243 | # However, in transliterations of foreign (eg. Spanish) words with [x], | |
244 | # several Amharic speakers have confirmed that they prefer ኻ over ሃ. | |
245 | ዀ → hwə; | |
246 | ዂ → hwi; | |
247 | ዃ → hwa; | |
248 | ዄ → hwe; | |
249 | ዅ → hwɨ; | |
250 | ኸ → hə; | |
251 | ኹ → hu; | |
252 | ኺ → hi; | |
253 | ኻ → ha; | |
254 | ኼ → he; | |
255 | ኽ → hɨ; | |
256 | ኾ → ho; | |
257 | ዀ ← xwə; | |
258 | ዂ ← xwi; | |
259 | ዃ ← xwa; | |
260 | ዄ ← xwe; | |
261 | ዅ ← xwɨ; | |
262 | ዅ ← xw; | |
263 | ኸ ← xə; | |
264 | ኹ ← xu; | |
265 | ኺ ← xi; | |
266 | ኻ ← xa; | |
267 | ኼ ← xe; | |
268 | ኽ ← xɨ; | |
269 | ኾ ← xo; | |
270 | ኽ ← x; | |
271 | አ ↔ ʔə; |
272 | ኡ ↔ ʔu; |
273 | ኢ ↔ ʔi; |
274 | ኣ ↔ ʔa; |
275 | ኤ ↔ ʔe; |
276 | እ ↔ ʔɨ; |
277 | ኦ ↔ ʔo; |
278 | ⶊ → ʔo; # Dizi, Me’en, Mursi, Suri /ʔɔ/ ([1], Appendix E); not used in Amharic. | |
279 | እ ← ʔ; |
280 | ከ ↔ kə; | |
281 | ኩ ↔ ku; | |
282 | ኪ ↔ ki; | |
283 | ካ ↔ ka; | |
284 | ኬ ↔ ke; | |
285 | ክ ↔ kɨ; | |
286 | ኮ ↔ ko; | |
287 | ኰ ↔ kwə; | |
288 | ኵ ↔ kwu; | |
289 | ኲ ↔ kwi; | |
290 | ኳ ↔ kwa; | |
291 | ኴ ↔ kwe; | |
292 | ክ ← k; | |
293 | # In Sebatbeit, ⷈ is spoken as palatalized velar plosive /kʲ/ ([1], Appendix H). | |
294 | # Amharic speakers pronounce it as /k/ without palatalization. | |
295 | ⷈ → kə; | |
296 | ⷉ → ku; | |
297 | ⷊ → ki; | |
298 | ⷋ → ka; | |
299 | ⷌ → ke; | |
300 | ⷍ → kɨ; | |
301 | ⷎ → ko; | |
302 | # In Sebatbeit, ⷐ is spoken as palatalized voiceless velar fricative /xʲə/ | |
303 | # according to [1], Appendix H. When the syllable appears in names, | |
304 | # Amharic speakers pronounce it as /kə/ without palatalization. | |
305 | ⷐ → kə; | |
306 | ⷑ → ku; | |
307 | ⷒ → ki; | |
308 | ⷓ → ka; | |
309 | ⷔ → ke; | |
310 | ⷕ → kɨ; | |
311 | ⷖ → ko; | |
312 | ወ ↔ wə; | |
313 | ዉ ↔ wu; | |
314 | ዊ ↔ wi; | |
315 | ዋ ↔ wa; | |
316 | ዌ ↔ we; | |
317 | ው ↔ wɨ; | |
318 | ዎ ↔ wo; | |
319 | ዏ → wo; # Dizi, Me’en, Mursi, Suri /wɔ/ ([1], Appendix E); not used in Amharic. | |
320 | ው ← w; | |
321 | ዐ ↔ ʕə; |
322 | ዑ ↔ ʕu; |
323 | ዒ ↔ ʕi; |
324 | ዓ ↔ ʕa; |
325 | ዔ ↔ ʕe; |
326 | ዕ ↔ ʕɨ; |
327 | ዖ ↔ ʕo; |
328 | ዕ ← ʕ; # Bare /ʕ/ takes the sixth-order syllable ዕ (not ዒ = /ʕi/), as in the other consonant series. | |
329 | ዘ ↔ zə; | |
330 | ዙ ↔ zu; | |
331 | ዚ ↔ zi; | |
332 | ዛ ↔ za; | |
333 | ዜ ↔ ze; | |
334 | ዝ ↔ zɨ; | |
335 | ዞ ↔ zo; | |
336 | ⶋ → zo; # Dizi, Me’en, Mursi, Suri /zɔ/ ([1], Appendix E); not used in Amharic. | |
337 | ዟ ↔ zwa; | |
338 | ዝ ← z; | |
339 | ዠ ↔ ʒə; |
340 | ዡ ↔ ʒu; |
341 | ዢ ↔ ʒi; |
342 | ዣ ↔ ʒa; |
343 | ዤ ↔ ʒe; |
344 | ዥ ↔ ʒɨ; |
345 | ዦ ↔ ʒo; |
346 | ዧ ↔ ʒwa; |
347 | ዥ ← ʒ; # Bare /ʒ/ takes the sixth-order syllable ዥ (not ዢ = /ʒi/), as in the other consonant series. | |
348 | # Unclear which Ethiopic language uses ⶰ. It only appears in the | |
349 | # “Language Neutral” list of Appendix L in [1], which transcribes it as ʒ. | |
350 | # For Amharic, we pronounce ⶰ therefore like ዠ. | |
351 | ⶰ → ʒə; | |
352 | ⶱ → ʒu; | |
353 | ⶲ → ʒi; | |
354 | ⶳ → ʒa; | |
355 | ⶴ → ʒe; | |
356 | ⶵ → ʒɨ; | |
357 | ⶶ → ʒo; | |
358 | የ ↔ jə; |
359 | ዩ ↔ ju; |
360 | ዪ ↔ ji; |
361 | ያ ↔ ja; |
362 | ዬ ↔ je; |
363 | ይ ↔ jɨ; |
364 | ዮ ↔ jo; |
365 | ዯ → jo; # Dizi, Me’en, Mursi, Suri /jɔ/ ([1], Appendix E); not used in Amharic. | |
366 | ይ ← j; |
367 | ጀ ↔ d\u0361ʒə; | |
368 | ጁ ↔ d\u0361ʒu; | |
369 | ጂ ↔ d\u0361ʒi; | |
370 | ጃ ↔ d\u0361ʒa; | |
371 | ጄ ↔ d\u0361ʒe; | |
372 | ጅ ↔ d\u0361ʒɨ; | |
373 | ጆ ↔ d\u0361ʒo; | |
374 | ጇ ↔ d\u0361ʒwa; | |
375 | ጅ ← d\u0361ʒ; | |
376 | ደ ↔ də; |
377 | ዱ ↔ du; |
378 | ዲ ↔ di; |
379 | ዳ ↔ da; |
380 | ዴ ↔ de; |
381 | ድ ↔ dɨ; |
382 | ዶ ↔ do; |
383 | ⶌ → do; # Dizi, Me’en, Mursi, Suri /dɔ/ ([1], Appendix E); not used in Amharic. | |
384 | ዷ ↔ dwa; |
385 | ድ ← d; |
386 | ገ ↔ ɡə; | |
387 | ጉ ↔ ɡu; | |
388 | ጊ ↔ ɡi; | |
389 | ጋ ↔ ɡa; | |
390 | ጌ ↔ ɡe; | |
391 | ግ ↔ ɡɨ; | |
392 | ጎ ↔ ɡo; | |
393 | ጐ ↔ ɡwə; | |
394 | ጕ ↔ ɡwu; | |
395 | ጒ ↔ ɡwi; | |
396 | ጓ ↔ ɡwa; | |
397 | ጔ ↔ ɡwe; | |
398 | ግ ← ɡ; | |
399 | # In Awngi, Blin, Qimant, and Xamtanga, ጘ is spoken as voiced velar nasal [ŋ]. | |
400 | # Source: [1], Appendix C. While /ŋ/ is not an Amharic phoneme, Amharic speakers | |
401 | # still can pronounce it according to our source. However, when transliterating | |
402 | # foreign words with [ŋ], Amharic uses the sequence ንግ /nɡ/. For example, | |
403 | # the Amharic transliteration of Washington /waʃiŋtən/ is ዋሺንግተን. | |
404 | ጘ → ŋə; | |
405 | ጙ → ŋu; | |
406 | ጚ → ŋi; | |
407 | ጛ → ŋa; | |
408 | ጜ → ŋe; | |
409 | ጝ → ŋɨ; | |
410 | ጞ → ŋo; | |
411 | ⶓ → ŋwə; | |
412 | ⶖ → ŋwu; | |
413 | ⶔ → ŋwi; | |
414 | ጟ → ŋwa; | |
415 | ⶕ → ŋwe; | |
416 | # Since there is no uvular nasal [ɴ] in Amharic, we use the velar nasal [ŋ]. | |
417 | ጘ ← ɴə; | |
418 | ጙ ← ɴu; | |
419 | ጚ ← ɴi; | |
420 | ጛ ← ɴa; | |
421 | ጜ ← ɴe; | |
422 | ጝ ← ɴɨ; | |
423 | ጞ ← ɴo; | |
424 | ጝ ← ɴ; | |
425 | # In Sebatbeit, ⷘ is spoken as palatalized voiced velar stop /ɡj/ ([1], Appendix H). | |
426 | # Amharic speakers pronounce it as voiced velar stop /ɡ/ without palatalization. | |
427 | ⷘ → ɡə; | |
428 | ⷙ → ɡu; | |
429 | ⷚ → ɡi; | |
430 | ⷛ → ɡa; | |
431 | ⷜ → ɡe; | |
432 | ⷝ → ɡɨ; | |
433 | ⷞ → ɡo; | |
434 | ጠ ↔ tʼə; |
435 | ጡ ↔ tʼu; |
436 | ጢ ↔ tʼi; |
437 | ጣ ↔ tʼa; |
438 | ጤ ↔ tʼe; |
439 | ጥ ↔ tʼɨ; |
440 | ጦ ↔ tʼo; |
441 | ጧ ↔ tʼwa; |
442 | ጥ ← tʼ; # Bare /tʼ/ takes the sixth-order syllable ጥ (not ጢ = /tʼi/), as in the other consonant series. | |
443 | ጨ ↔ t\u0361ʃʼə; |
444 | ጩ ↔ t\u0361ʃʼu; |
445 | ጪ ↔ t\u0361ʃʼi; |
446 | ጫ ↔ t\u0361ʃʼa; |
447 | ጬ ↔ t\u0361ʃʼe; |
448 | ጭ ↔ t\u0361ʃʼɨ; |
449 | ጮ ↔ t\u0361ʃʼo; |
450 | ⶐ → t\u0361ʃʼo; # Dizi, Me’en, Mursi, Suri /t\u0361ʃʼɔ/ ([1], Appendix E); not used in Amharic. | |
451 | ጯ ↔ t\u0361ʃʼwa; |
452 | ጭ ← t\u0361ʃʼ; # Bare /t\u0361ʃʼ/ takes the sixth-order syllable ጭ (not ጪ = /t\u0361ʃʼi/), as in the other consonant series. | |
453 | # According to Appendix B of [1], the following are used in the Bench language | |
454 | # (aka Benchnon, Gimira). In Bench, ⶻ is pronounced as /ʈ\u0361ʂʼ/ Retroflex | |
455 | # ejective affricate; with a phonemic distinction to the non-retroflex version. | |
456 | # Amharic does not have retroflex phonemes, so we go with /t\u0361ʃʼ/. | |
457 | ⶸ → t\u0361ʃʼə; | |
458 | ⶹ → t\u0361ʃʼu; | |
459 | ⶺ → t\u0361ʃʼi; | |
460 | ⶻ → t\u0361ʃʼa; | |
461 | ⶼ → t\u0361ʃʼe; | |
462 | ⶽ → t\u0361ʃʼɨ; | |
463 | ⶾ → t\u0361ʃʼo; | |
464 | ቸ ↔ t\u0361ʃə; | |
465 | ቹ ↔ t\u0361ʃu; | |
466 | ቺ ↔ t\u0361ʃi; | |
467 | ቻ ↔ t\u0361ʃa; | |
468 | ቼ ↔ t\u0361ʃe; | |
469 | ች ↔ t\u0361ʃɨ; | |
470 | ቾ ↔ t\u0361ʃo; | |
471 | ቿ ↔ t\u0361ʃwa; | |
472 | ች ← t\u0361ʃ; | |
473 | ተ ↔ tə; | |
474 | ቱ ↔ tu; | |
475 | ቲ ↔ ti; | |
476 | ታ ↔ ta; | |
477 | ቴ ↔ te; | |
478 | ት ↔ tɨ; | |
479 | ቶ ↔ to; | |
480 | ⶆ → to; # Dizi, Me’en, Mursi, Suri /tɔ/ ([1], Appendix E); not used in Amharic. | |
481 | ቷ ↔ twa; | |
482 | ት ← t; | |
483 | ጰ ↔ pʼə; | |
484 | ጱ ↔ pʼu; | |
485 | ጲ ↔ pʼi; | |
486 | ጳ ↔ pʼa; | |
487 | ጴ ↔ pʼe; | |
488 | ጵ ↔ pʼɨ; | |
489 | ጶ ↔ pʼo; | |
490 | ⶑ → pʼo; # Dizi, Me’en, Mursi, Suri /pʼɔ/ ([1], Appendix E); not used in Amharic. | |
491 | ጷ ↔ pʼwa; | |
492 | ጵ ← pʼ; | |
493 | ጸ ↔ sʼə; | |
494 | ጹ ↔ sʼu; | |
495 | ጺ ↔ sʼi; | |
496 | ጻ ↔ sʼa; | |
497 | ጼ ↔ sʼe; | |
498 | ጽ ↔ sʼɨ; | |
499 | ጾ ↔ sʼo; | |
500 | ጿ ↔ sʼwa; | |
501 | ጽ ← sʼ; | |
502 | # In Amharic, ፀ is pronounced like ጸ. | |
503 | # Source: [1], section on “Phonological Redundancy” for Amharic, page 5. | |
504 | ፀ → sʼə; | |
505 | ፁ → sʼu; | |
506 | ፂ → sʼi; | |
507 | ፃ → sʼa; | |
508 | ፄ → sʼe; | |
509 | ፅ → sʼɨ; | |
510 | ፆ → sʼo; | |
511 | ፇ → sʼo; # Dizi, Me’en, Mursi, Suri /sʼɔ/ ([1], Appendix E); not used in Amharic. | |
512 | # Amharic speakers pronounce ሰ like ሠ. Source: [1], Appendix B. | |
513 | ሰ ↔ sə; | |
514 | ሱ ↔ su; | |
515 | ሲ ↔ si; | |
516 | ሳ ↔ sa; | |
517 | ሴ ↔ se; | |
518 | ስ ↔ sɨ; | |
519 | ሶ ↔ so; | |
520 | ⶃ → so; # Dizi, Me’en, Mursi, Suri /sɔ/ ([1], Appendix E); not used in Amharic. | |
521 | ሷ ↔ swa; | |
522 | ስ ← s; | |
523 | ፈ ↔ fə; |
524 | ፉ ↔ fu; |
525 | ፊ ↔ fi; |
526 | ፋ ↔ fa; |
527 | ፌ ↔ fe; |
528 | ፍ ↔ fɨ; |
529 | ፎ ↔ fo; |
530 | ᎈ → fwə; # Sebatbeit /fwə/ ([1], Appendix H); not used in Amharic. | |
531 | ᎋ → fwu; # Sebatbeit /fwu/ ([1], Appendix H); not used in Amharic. U+138B (FWE), parallel to ᎃ → mwu and ᎇ → bwu. | |
532 | ᎉ → fwi; # Sebatbeit /fwi/ ([1], Appendix H); not used in Amharic. U+1389 (FWI), parallel to ᎁ → mwi and ᎅ → bwi. | |
533 | ፏ ↔ fwa; |
534 | ᎊ → fwe; # Sebatbeit /fwe/ ([1], Appendix H); not used in Amharic. | |
535 | ፚ → fja; # Unclear which language; Appendix L of [1] transcribes ፚ as /fja/. | |
536 | ፍ ← f; |
537 | ፐ ↔ pə; |
538 | ፑ ↔ pu; |
539 | ፒ ↔ pi; |
540 | ፓ ↔ pa; |
541 | ፔ ↔ pe; |
542 | ፕ ↔ pɨ; |
543 | ፖ ↔ po; |
544 | ⶒ → po; # Dizi, Me’en, Mursi, Suri /pɔ/ ([1], Appendix E); not used in Amharic. | |
545 | ᎌ → pwə; # Sebatbeit /pwə/ ([1], Appendix H); not used in Amharic. | |
546 | ᎏ → pwu; # Sebatbeit /pwu/ ([1], Appendix H); not used in Amharic. U+138F (PWE), parallel to ᎃ → mwu and ᎇ → bwu. | |
547 | ᎍ → pwi; # Sebatbeit /pwi/ ([1], Appendix H); not used in Amharic. U+138D (PWI), parallel to ᎁ → mwi and ᎅ → bwi. | |
548 | ፗ ↔ pwa; |
549 | ᎎ → pwe; # Sebatbeit /pwe/ ([1], Appendix H); not used in Amharic. | |
550 | ፕ ← p; |
551 | ኧ ↔ ə; | |
552 | ኡ ← u; # ኡላዓን ባዓታር ← Ulaan Baatar /ulaʕan baʕatar/ | |
553 | አ ← a; # አምስተርዳም ← Amsterdam /amstərdam/ | |
554 | ኤ ← e; | |
555 | እ ← ɨ; | |
556 | ኦ ← o; # ፖርት ኦፍ ስፔን ← Port of Spain /port of speːn/ | |
557 | ኢ ← i; # ኢስላማባድ ← Islamabad /islamabad/ | |
558 | # Applications will typically split words before calling our rules. | |
559 | # To be resilient, we replace punctuation by whitespace in IPA. | |
560 | ፠ → ' '; # U+1360 ETHIOPIC SECTION MARK | |
561 | ፡ → ' '; # U+1361 ETHIOPIC WORDSPACE | |
562 | ። → ' '; # U+1362 ETHIOPIC FULL STOP | |
563 | ፣ → ' '; # U+1363 ETHIOPIC COMMA | |
564 | ፤ → ' '; # U+1364 ETHIOPIC SEMICOLON | |
565 | ፥ → ' '; # U+1365 ETHIOPIC COLON | |
566 | ፦ → ' '; # U+1366 ETHIOPIC PREFACE COLON | |
567 | ፧ → ' '; # U+1367 ETHIOPIC QUESTION MARK | |
568 | ፨ → ' '; # U+1368 ETHIOPIC PARAGRAPH SEPARATOR | |
569 | # Likewise, Ethiopic numerals cannot be pronounced by these rules, | |
570 | # so we replace them by whitespace in the output IPA notation. | |
571 | # Applications will typically pre-process text before calling | |
572 | # the am → am_FONIPA transform. | |
573 | ፩ → ' '; # U+1369 ETHIOPIC DIGIT ONE | |
574 | ፪ → ' '; # U+136A ETHIOPIC DIGIT TWO | |
575 | ፫ → ' '; # U+136B ETHIOPIC DIGIT THREE | |
576 | ፬ → ' '; # U+136C ETHIOPIC DIGIT FOUR | |
577 | ፭ → ' '; # U+136D ETHIOPIC DIGIT FIVE | |
578 | ፮ → ' '; # U+136E ETHIOPIC DIGIT SIX | |
579 | ፯ → ' '; # U+136F ETHIOPIC DIGIT SEVEN | |
580 | ፰ → ' '; # U+1370 ETHIOPIC DIGIT EIGHT | |
581 | ፱ → ' '; # U+1371 ETHIOPIC DIGIT NINE | |
582 | ፲ → ' '; # U+1372 ETHIOPIC NUMBER TEN | |
583 | ፳ → ' '; # U+1373 ETHIOPIC NUMBER TWENTY | |
584 | ፴ → ' '; # U+1374 ETHIOPIC NUMBER THIRTY | |
585 | ፵ → ' '; # U+1375 ETHIOPIC NUMBER FORTY | |
586 | ፶ → ' '; # U+1376 ETHIOPIC NUMBER FIFTY | |
587 | ፷ → ' '; # U+1377 ETHIOPIC NUMBER SIXTY | |
588 | ፸ → ' '; # U+1378 ETHIOPIC NUMBER SEVENTY | |
589 | ፹ → ' '; # U+1379 ETHIOPIC NUMBER EIGHTY | |
590 | ፺ → ' '; # U+137A ETHIOPIC NUMBER NINETY | |
591 | ፻ → ' '; # U+137B ETHIOPIC NUMBER HUNDRED | |
592 | ፼ → ' '; # U+137C ETHIOPIC NUMBER TEN THOUSAND | |
593 | # Transform IPA length markers to one of these: | |
594 | # U+135D ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK | |
595 | # U+135E ETHIOPIC COMBINING VOWEL LENGTH MARK | |
596 | # U+135F ETHIOPIC COMBINING GEMINATION MARK | |
597 | ::null(); | |
598 | ← ː ; # Strip off any remaining IPA length markers. | |
599 | ::(null); | |
600 | ($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135D → $1 ː $2 ː; | |
601 | ($IPA_CONSONANT) ([jw]? $IPA_VOWEL) \u135E → $1 $2 ː; | |
602 | ($IPA_CONSONANT) ([jw]? $IPA_VOWEL?) \u135F → $1 ː $2; | |
603 | [\u135D \u135E \u135F] → ; # Strip off any remaining length markers. | |
604 | $1 wa \u135D ← ($LABIALIZABLE_BEFORE_A) ː waː; # ቷ\u135D ← [tːʷaː] | |
605 | $1 wa \u135E ← ($LABIALIZABLE_BEFORE_A) waː; # ቷ\u135E ← [tʷaː] | |
606 | $1 wa \u135F ← ($LABIALIZABLE_BEFORE_A) ː wa; # አቷ\u135F ← [tːʷa] | |
607 | $1 \u135F $2 \u135E ← ([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL) ː; | |
608 | $1 \u135F $2 ← {([b $LABIALIZABLE_BEFORE_A]) ː ([jw] $IPA_VOWEL?)}; | |
609 | $1 \u135E ← ($IPA_VOWEL ː); | |
610 | $1 \u135D ← (jː $IPA_VOWEL ː); | |
611 | $1 \u135E ← ([jw] $IPA_VOWEL ː); | |
612 | $1 \u135F ← (jː $IPA_VOWEL?); | |
613 | $1 \u135D ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL ː); | |
614 | $1 \u135E ← ($IPA_CONSONANT [w]? $IPA_VOWEL ː); | |
615 | $1 \u135F ← ($IPA_CONSONANT ː [w]? $IPA_VOWEL?); | |
616 | # Insert syllable markers in a separate pass. | |
617 | ::null; | |
618 | {($IPA_VOWEL ː?)} [[:L:]] → $1 \.; | |
619 | ::(null); | |
620 | ← [ˈˌ\. \u0303\u032F]; | |
621 | aj ← ai; # Nairobi /nairobi/ ናይሮቢ, Cairo /kairo/ ካይሮ | |
622 | aw ← au; # Bissau /bisːau/ ቢሳው | |
623 | eji ← ei; # Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ | |
624 | ewo ← eo; # Montevideo /montevideo/ ሞንቴቪዴዎ | |
625 | ija ← ia; # Monrovia /monrovia/ ሞንሮቪያ | |
626 | ijə ← iə; # Reunion /rijunijən/ ሪዩኒየን | |
627 | iw ← iu; # Vilnius /vilnius/ ቪልኒውስ, New Delhi /niu deːli/ ኒው ዴሊ | |
628 | jo ← io; # Tokyo /tokio/ ቶክዮ | |
629 | nɡ ← ŋɡ; # Kongo /koŋɡo/ ኮንጎ, Hungary /həŋɡari/ ሀንጋሪ | |
630 | nɡ ← ŋ; # Bangkok /baŋkok/ ባንግኮክ, Beijing /beid\u0361ʒiŋ/ ቤዪጂንግ | |
631 | uwa ← ua; # Kuala Lumpur /kuala lumpur/ ኩዋላ ሉምፑር, Ruanda /ruanda/ ሩዋንዳ | |
632 | bwe ← bue; # Buenos Aires /buenos aires/ ብዌኖስ አይሬስ | |
633 | sʼ ← t\u0361s; # Podgorica /podɡorit\u0361sa/ ፖድጎሪጻ, Vaduz /fadut\u0361s/ ፋዱጽ | |
634 | uwi ← ui; # Port Luis /port luis/ ፖርት ሉዊስ | |
635 | uwe ← ue; # Lithuania /lituenia/ ሊቱዌኒያ, Venezuela /venɨzuela/ ቬንዙዌላ | |
636 | ::(null); | |
637 | ʔə ← \. ə; | |
638 | ʔu ← \. u; | |
639 | ʔi ← \. i; | |
640 | ʔa ← \. a; | |
641 | ʔe ← \. e; | |
642 | ʔɨ ← \. ɨ; | |
643 | ʔo ← \. o; | |
644 | $1 w ← {($IPA_VOWEL ː?) \u032F} $IPA_VOWEL; # /ewowa/ ← /e\u032Fo\u032Fa/ | |
645 | ::(null); | |
646 | n ← [n {n\u033C} {n\u033C\u030A} {m\u033A} {n\u030A} {n\u0325} ⁿ ᵑ]; | |
647 | m ← [ɱ {m\u0325} {m\u032A} ᵐ]; | |
648 | ɲ ← [{ɳ\u030A} {ɳ\u0325} ɳ {ɲ\u030A} {ɲ\u0325} ɲ]; | |
649 | ŋ ← [{ŋ\u030A} {ŋ\u0325} ŋ]; | |
650 | ɴ ← [{ɴ\u030A} {ɴ\u0325} ɴ]; | |
651 | p ← [{t\u033C} {p\u033A}]; | |
652 | pʼ ← [ʘ ɋ]; | |
653 | b ← [{d\u033C} {b\u033A} {ɾ\u033C} ɓ]; | |
654 | t ← [{t\u032A} ʈ]; | |
655 | tʼ ← [ǁ ʖ]; | |
656 | d ← [ɖ ɗ ᶑ]; | |
657 | k ← q; | |
658 | kʼ ← [ǃ ʗ]; | |
659 | ɡ ← [g ɢ ɣ ɠ ʛ]; | |
660 | nɡ ← ᵑɡ; | |
661 | ʔ ← ʡ; | |
662 | s ← [θ {θ\u0331} {θ\u031E} {θ\u033C} {ɸ\u033A}]; | |
663 | z ← [ð {ð\u0320} {ð\u033C} {β\u033A}]; | |
664 | sʼ ← [{t\u0361s} {t\u035Cs} ʦ]; | |
665 | t\u0361ʃ ← [{t\u035Cʃ} ʧ {t\u0361ɕ} {t\u035Cɕ} ʨ {ʈ\u0361ʂ} c]; | |
666 | t\u0361ʃʼ ← [ǀ ʇ ǂ ʄ]; | |
667 | d\u0361ʒ ← [ʤ ʣ {d\u0361z} {d\u035Cz} {d\u0361ɕ} ʥ {d\u0361ʑ} {d\u035Cʑ} {ɖ\u0361ʐ} {d\u0361ʐ} ɟ]; | |
668 | pf ← [{p\u032A} {p\u0346} ȹ {p\u0361f} {p\u032Af} {p\u032A\u035Cf}]; | |
669 | bv ← [{b\u032A} {b\u0346} ȸ {b\u0361v} {b\u032A\u0361v}]; | |
670 | ʃ ← [ʂ ɕ]; | |
671 | ʒ ← [ʐ ʑ]; | |
672 | r ← [ɾ ɽ ʁ]; | |
673 | rːʒ ← r\u031Dː; | |
674 | rʒ ← r\u031D; | |
675 | v ← β; | |
676 | x ← [ç x χ]; | |
677 | ʕ ← ʕ\u031D; | |
678 | h ← ɦ; | |
679 | j ← [ʝ ʲ]; | |
680 | lj ← ʎ [iɨ]? [jʝʲ]?; | |
681 | t\u0361ʃl ← [{t\u0361ɬ} {tɬ}]; | |
682 | ʃl ← ɬ; | |
683 | w ← {u\u032F} $IPA_VOWEL; | |
684 | w ← ʷ; | |
685 | ʼː ← ːʼ; # /pʼː/ ← /pːʼ/; /sʼː/ ← /sːʼ/; etc. | |
686 | ::(null); | |
687 | i ← y; | |
688 | ɨ ← [ɪ ʉ]; | |
689 | u ← [ʊ ɯ]; | |
690 | ə ← [ɛ æ ɘ]; | |
691 | o ← [ɔ ø]; | |
692 | a ← ɑ; | |
693 | ʼ ← ʰ; | |
694 | ← [ʱ]; | |
695 | $1ːʲ ← ([pbtd])ʲː; # [bːʲeː] ← [bʲːeː] | |
696 | $1ːʷ ← ([pbtd])ʷː; # [bːʷeː] ← [bʷːeː] | |
697 | ::(NFC); | |
698 | ← [ \u0303 \u0330 \u030B \u0301 \u0304 \u0300 \u030F \u030C \u0302 ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ]; | |
699 | ::(NFD); | |
700 |