1 # © 2016 and later: Unicode, Inc. and others.
2 # License & terms of use: http://www.unicode.org/copyright.html#License
4 # File: uz_Cyrl_uz_BGN.txt
9 ########################################################################
10 # BGN/PCGN 1979 System
12 # The BGN/PCGN system for Uzbek was designed for use in
13 # romanizing names written in the Uzbek alphabet.
14 # The Uzbek alphabet contains four letters not present
15 # in the Russian alphabet: Ўў, Ққ, Ғғ, and Ҳҳ.
17 # The Uzbek Alphabet as defined by the BGN (Page 107):
19 # АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲ
20 # абвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ
22 # Originally prepared by Michael Everson <everson@evertype.com>
23 ########################################################################
25 # MINIMAL FILTER: Uzbek-Latin
# Global filter for this transform: it restricts the rules below to the
# upper- and lower-case letters of the Uzbek alphabet listed in the header.
27 :: [АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲабвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ] ;
31 ########################################################################
33 ########################################################################
35 # Define All Transformation Variables
37 ########################################################################
# Romanization used for the hard and soft signs (MODIFIER LETTER PRIME, U+02B9).
# It must be defined before the Ъ/ъ/Ь/ь rules that reference $prime.
$prime = ʹ ;
# Character classes used as rule contexts. Ъ/ъ and Ь/ь are grouped with the
# consonants; $lower is the union of every lower-case letter.
41 $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЪЬҚҒҲ] ;
42 $lowerConsonants = [бвгджзйклмнпрстфхцчшъьқғҳ] ;
43 $consonants = [$upperConsonants $lowerConsonants] ;
44 $upperVowels = [АЕЁИОУЭЮЯЎ] ;
45 $lowerVowels = [аеёиоуэюяў] ;
46 $vowels = [$upperVowels $lowerVowels] ;
47 $lower = [$lowerConsonants $lowerVowels] ;
50 # Use this $wordBoundary until bug 2034 is fixed in ICU:
51 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
# Any character that is not a letter, a mark or a number counts as a boundary.
53 $wordBoundary = [^[:L:][:M:][:N:]] ;
56 ########################################################################
58 ########################################################################
60 # Rules moved to front to avoid masking
62 ########################################################################
# Matches an upper-case vowel immediately followed by Ы or ы and replaces the
# whole two-character match with Y (no context braces, so the vowel is part
# of the replaced text).
# NOTE(review): Ы/ы are neither in the global filter set nor in the Uzbek
# alphabet listed in the header, so this rule appears unable to fire -
# confirm whether it is intended.
65 $upperVowels[Ыы] → Y ;
68 ########################################################################
70 # Start of Alphabetic Transformations
72 ########################################################################
# Context-free one-to-one mappings for А, Б and В.
74 А → A ; # CYRILLIC CAPITAL LETTER A
75 а → a ; # CYRILLIC SMALL LETTER A
76 Б → B ; # CYRILLIC CAPITAL LETTER BE
77 б → b ; # CYRILLIC SMALL LETTER BE
# BGN/PCGN 1979 romanizes в as v (not w).
78 В → V ; # CYRILLIC CAPITAL LETTER VE
79 в → v ; # CYRILLIC SMALL LETTER VE
82 ########################################################################
86 # The character sequences гҳ, кҳ, сҳ, and цҳ may be romanized g·h,
87 # k·h, s·h, and ts·h in order to differentiate those romanizations from
88 # the digraphs gh, kh, sh, and the letter sequence tsh, which are used
89 # to render the characters ғ, х, ш, and the character sequence тш.
91 ########################################################################
# The two-letter rules for г + ҳ are listed before the single-letter rules so
# that the sequence is matched as a unit and written with a middle dot.
93 ГҲ → G·H ; # CYRILLIC CAPITAL LETTER GHE + CAPITAL LETTER HA WITH DESCENDER
94 Гҳ → G·h ; # CYRILLIC CAPITAL LETTER GHE + SMALL LETTER HA WITH DESCENDER
95 гҳ → g·h ; # CYRILLIC SMALL LETTER GHE + SMALL LETTER HA WITH DESCENDER
96 Г → G ; # CYRILLIC CAPITAL LETTER GHE
97 г → g ; # CYRILLIC SMALL LETTER GHE
100 ########################################################################
104 ########################################################################
106 Д → D ; # CYRILLIC CAPITAL LETTER DE
107 д → d ; # CYRILLIC SMALL LETTER DE
110 ########################################################################
112 # BGN Page 108 Rule 1:
114 # The character e should be romanized ye initially, after the vowel
115 # characters a, e, ё, и, о, у, э, ю, я, and ў, and after й and ь.
116 # In all other instances, it should be romanized e.
118 ########################################################################
# Rules for Е/е, tried in the order written; the first match wins.
# `X } set` matches X when the NEXT character is in the set;
# `set { X` matches X when the PREVIOUS character is in the set.
# NOTE(review): the vowel/Й/Ь tests below use `}` and therefore look at the
# character that follows Е/е, whereas the BGN rule quoted above describes the
# character that precedes it - confirm the intended behavior before changing.
120 Е}[$upperVowels [ЙЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE
121 Е}[$lowerVowels [йь]] → Ye ; # CYRILLIC CAPITAL LETTER IE
# Capital Е preceded by a $wordBoundary character is written Ye.
122 $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE
# Fallback for every other capital Е.
123 Е → E ; # CYRILLIC CAPITAL LETTER IE
124 е}[$upperVowels $lowerVowels [ЙйЬь]] → ye ; # CYRILLIC SMALL LETTER IE
125 $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE
# Fallback for every other small е.
126 е → e ; # CYRILLIC SMALL LETTER IE
129 ########################################################################
133 ########################################################################
# Capital Ё becomes title-case "Yo" when the next letter is lower-case and
# all-caps "YO" otherwise.
135 Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO
136 Ё → YO ; # CYRILLIC CAPITAL LETTER IO
137 ё → yo ; # CYRILLIC SMALL LETTER IO
138 Ж → J ; # CYRILLIC CAPITAL LETTER ZHE
139 ж → j ; # CYRILLIC SMALL LETTER ZHE
140 З → Z ; # CYRILLIC CAPITAL LETTER ZE
141 з → z ; # CYRILLIC SMALL LETTER ZE
142 И → I ; # CYRILLIC CAPITAL LETTER I
143 и → i ; # CYRILLIC SMALL LETTER I
144 Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
145 й → y ; # CYRILLIC SMALL LETTER SHORT I
148 ########################################################################
150 # BGN Page 108 Rule 2
154 ########################################################################
# к + ҳ is matched as a unit first and written k·h with a middle dot;
# the single-letter rules below handle every other К/к.
156 КҲ → K·H ; # CYRILLIC CAPITAL LETTER KA + CAPITAL LETTER HA WITH DESCENDER
157 Кҳ → K·h ; # CYRILLIC CAPITAL LETTER KA + SMALL LETTER HA WITH DESCENDER
158 кҳ → k·h ; # CYRILLIC SMALL LETTER KA + SMALL LETTER HA WITH DESCENDER
159 К → K ; # CYRILLIC CAPITAL LETTER KA
160 к → k ; # CYRILLIC SMALL LETTER KA
163 ########################################################################
167 ########################################################################
# Context-free one-to-one mappings for Л, М, Н, О, П and Р.
169 Л → L ; # CYRILLIC CAPITAL LETTER EL
170 л → l ; # CYRILLIC SMALL LETTER EL
171 М → M ; # CYRILLIC CAPITAL LETTER EM
172 м → m ; # CYRILLIC SMALL LETTER EM
173 Н → N ; # CYRILLIC CAPITAL LETTER EN
174 н → n ; # CYRILLIC SMALL LETTER EN
175 О → O ; # CYRILLIC CAPITAL LETTER O
176 о → o ; # CYRILLIC SMALL LETTER O
177 П → P ; # CYRILLIC CAPITAL LETTER PE
178 п → p ; # CYRILLIC SMALL LETTER PE
179 Р → R ; # CYRILLIC CAPITAL LETTER ER
180 р → r ; # CYRILLIC SMALL LETTER ER
183 ########################################################################
185 # BGN Page 108 Rule 2
189 ########################################################################
# с + ҳ is matched as a unit first and written s·h with a middle dot;
# the single-letter rules below handle every other С/с.
191 СҲ → S·H ; # CYRILLIC CAPITAL LETTER ES + CAPITAL LETTER HA WITH DESCENDER
192 Сҳ → S·h ; # CYRILLIC CAPITAL LETTER ES + SMALL LETTER HA WITH DESCENDER
193 сҳ → s·h ; # CYRILLIC SMALL LETTER ES + SMALL LETTER HA WITH DESCENDER
194 С → S ; # CYRILLIC CAPITAL LETTER ES
195 с → s ; # CYRILLIC SMALL LETTER ES
198 ########################################################################
202 ########################################################################
204 Т → T ; # CYRILLIC CAPITAL LETTER TE
205 т → t ; # CYRILLIC SMALL LETTER TE
# BGN/PCGN 1979 writes у as plain u; only ў (SHORT U) takes a diacritic (ŭ).
206 У → U ; # CYRILLIC CAPITAL LETTER U
207 у → u ; # CYRILLIC SMALL LETTER U
208 Ф → F ; # CYRILLIC CAPITAL LETTER EF
209 ф → f ; # CYRILLIC SMALL LETTER EF
# Capital Х becomes title-case "Kh" when the next letter is lower-case and
# all-caps "KH" otherwise.
210 Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA
211 Х → KH ; # CYRILLIC CAPITAL LETTER HA
212 х → kh ; # CYRILLIC SMALL LETTER HA
215 ########################################################################
217 # BGN Page 108 Rule 2
221 ########################################################################
# ц + ҳ is matched as a unit first and written ts·h with a middle dot.
223 ЦҲ → TS·H ; # CYRILLIC CAPITAL LETTER TSE + CAPITAL LETTER HA WITH DESCENDER
224 Цҳ → Ts·h ; # CYRILLIC CAPITAL LETTER TSE + SMALL LETTER HA WITH DESCENDER
225 цҳ → ts·h ; # CYRILLIC SMALL LETTER TSE + SMALL LETTER HA WITH DESCENDER
# Capital Ц becomes title-case "Ts" when the next letter is lower-case and
# all-caps "TS" otherwise.
226 Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE
227 Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
228 ц → ts ; # CYRILLIC SMALL LETTER TSE
231 ########################################################################
235 ########################################################################
# For capitals that romanize to two Latin letters (Ч, Ш, Ю, Я, Ғ), the
# `} $lower` rule yields title case (e.g. "Ch") when the next letter is
# lower-case; the rule after it yields all caps (e.g. "CH") otherwise.
237 Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE
238 Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
239 ч → ch ; # CYRILLIC SMALL LETTER CHE
240 Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA
241 Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
242 ш → sh ; # CYRILLIC SMALL LETTER SHA
# Hard and soft signs, in either case, are all written with $prime.
243 Ъ → $prime ; # CYRILLIC CAPITAL LETTER HARD SIGN
244 ъ → $prime ; # CYRILLIC SMALL LETTER HARD SIGN
245 Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN
246 ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN
# Capital Э must keep its case: E, not e.
247 Э → E ; # CYRILLIC CAPITAL LETTER E
248 э → e ; # CYRILLIC SMALL LETTER E
249 Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU
250 Ю → YU ; # CYRILLIC CAPITAL LETTER YU
251 ю → yu ; # CYRILLIC SMALL LETTER YU
252 Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA
253 Я → YA ; # CYRILLIC CAPITAL LETTER YA
254 я → ya ; # CYRILLIC SMALL LETTER YA
255 Ў → Ŭ ; # CYRILLIC CAPITAL LETTER SHORT U
256 ў → ŭ ; # CYRILLIC SMALL LETTER SHORT U
257 Қ → Q ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
258 қ → q ; # CYRILLIC SMALL LETTER KA WITH DESCENDER
259 Ғ} $lower → Gh ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE
260 Ғ → GH ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE
261 ғ → gh ; # CYRILLIC SMALL LETTER GHE WITH STROKE
262 Ҳ → H ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
263 ҳ → h ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
266 ########################################################################