X-Git-Url: https://git.saurik.com/apple/icu.git/blobdiff_plain/b331163bffd790ced0e88b73f44f86d49ccc48a5..340931cb2e044a2141d11567dd0f782524e32994:/icuSources/data/translit/ro_ro_FONIPA.txt diff --git a/icuSources/data/translit/ro_ro_FONIPA.txt b/icuSources/data/translit/ro_ro_FONIPA.txt index 0f1258c1..f9658964 100644 --- a/icuSources/data/translit/ro_ro_FONIPA.txt +++ b/icuSources/data/translit/ro_ro_FONIPA.txt @@ -1,15 +1,23 @@ -# *************************************************************************** -# * -# * Copyright (C) 2004-2015, International Business Machines -# * Corporation; Unicode, Inc.; and others. All Rights Reserved. -# * -# *************************************************************************** +# © 2016 and later: Unicode, Inc. and others. +# License & terms of use: http://www.unicode.org/copyright.html#License +# # File: ro_ro_FONIPA.txt -# Generated from CLDR +# Generated from CLDR +# + +# Romanian orthography to phonemic transcription. +# http://en.wikipedia.org/wiki/Romanian_phonology # +# TODO: Currently this transform does not palatalize consonants. +$VowelEI = [e i î]; +$VowelAOU = [a â ă o u]; +$Vowel = [$VowelEI $VowelAOU]; +$Boundary = [^[:L:][:M:][:N:]]; :: NFC () ; :: Lower () ; +# Special cases. eoai → eo\u032Faj ; # eg. leoaică → /leo\u032Fajkə/, not /le\u032Fo\u032Faikə/ +# Triphthongs. eai → e\u032Faj ; eau → e\u032Faw ; eoa → e\u032Fo\u032Fa ; @@ -18,7 +26,7 @@ ia\-i → jaj ; iau → jaw ; iei → jej ; ieu → jew ; -[\uffff] { eu → jew ; +$Boundary {eu} → jew ; ioa → jo\u032Fa ; ioi → joj ; i\-oi → joj ; @@ -27,10 +35,11 @@ oai → o\u032Faj ; uai → waj ; uau → waw ; uăi → wəj ; +# Diphthongs. ai → aj ; âi → ɨj ; ăi → əj ; -au } r → au ; +au} r → au ; au → aw ; âu → ɨw ; ău → əw ; @@ -45,7 +54,7 @@ i\-a → ja ; ie → je ; ii → ij ; io → jo ; -iu } [aâăeiîou$] → iw ; +iu} [$Vowel $Boundary] → iw ; iu → ju ; oa → o\u032Fa ; oi → oj ; @@ -61,13 +70,13 @@ a → a ; ă → ə ; b → b ; ch → k ; -c } [ei] → t \u0361 ʃ ; +{c} [ei] → t\u0361ʃ ; c → k ; d → d ; e → e ; f → f ; gh → ɡ ; -g } [ei] → d \u0361 ʒ ; +{g} [ei] → d\u0361ʒ ; g → ɡ ; h → h ; i → i ; @@ -76,14 +85,43 @@ j → ʒ ; k → k ; l → l ; m → m ; +ng → ŋ ; n → n ; o → o ; p → p ; +q → k ; r → r ; s → s ; ş → ʃ ; +ș → ʃ ; t → t ; -ţ → t \u0361 s ; +ţ → t\u0361s ; +ț → t\u0361s ; u → u ; v → v ; +x → ks ; +y → i ; z → z ; +[:P:]+ → ' '; +# Romanian does not have any gemination. +# https://en.wikipedia.org/wiki/Gemination#Latin_and_Romance_languages +::null; +pp+ → p; +bb+ → b; +tt+ → t; +dd+ → d; +kk+ → k; +dd+ → d; +ɡɡ+ → ɡ; +ff+ → f; +vv+ → v; +hh+ → h; +ss+ → s; +zz+ → z; +ʃʃ+ → ʃ; +ʒʒ+ → ʒ; +rr+ → r; +ll+ → l; +jj+ → j; +ww+ → w; +