1 # ***************************************************************************
3 # * Copyright (C) 2004-2016, International Business Machines
4 # * Corporation; Unicode, Inc.; and others. All Rights Reserved.
6 # ***************************************************************************
7 # File: uz_Cyrl_uz_BGN.txt
12 ########################################################################
13 # BGN/PCGN 1979 System
15 # The BGN/PCGN system for Uzbek was designed for use in
16 # romanizing names written in the Uzbek alphabet.
17 # The Uzbek alphabet contains four letters not present
18 # in the Russian alphabet: Ўў, Ққ, Ғғ, and Ҳҳ.
20 # The Uzbek Alphabet as defined by the BGN (Page 107):
22 # АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲ
23 # абвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ
25 # Originally prepared by Michael Everson <everson@evertype.com>
26 ########################################################################
28 # MINIMAL FILTER: Uzbek-Latin. The `::` set below lists every upper- and lower-case letter of the Uzbek Cyrillic alphabet given in the header; it restricts which characters this transform acts on.
30 :: [АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲабвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ] ;
34 ########################################################################
36 ########################################################################
38 # Define All Transformation Variables
40 ########################################################################
44 $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЪЬҚҒҲ] ; # capital consonants; the hard and soft signs are counted here too
45 $lowerConsonants = [бвгджзйклмнпрстфхцчшъьқғҳ] ; # small-letter counterpart of $upperConsonants
46 $consonants = [$lowerConsonants $upperConsonants] ; # union of both consonant cases
47 $upperVowels = [АЕЁИОУЭЮЯЎ] ; # capital vowels
48 $lowerVowels = [аеёиоуэюяў] ; # small vowels
49 $vowels = [$lowerVowels $upperVowels] ; # union of both vowel cases
50 $lower = [$lowerVowels $lowerConsonants] ; # any small letter; used as a following-context test to pick title case (e.g. Kh) over all caps (KH)
53 # Stand-in word boundary, to be used until ICU bug 2034 is fixed:
54 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
56 $wordBoundary = [^[:L:][:M:][:N:]] ; # any single character that is not a letter, mark, or number
59 ########################################################################
61 ########################################################################
63 # Rules moved to front to avoid masking
65 ########################################################################
68 $upperVowels[Ыы] → Y ; # one capital vowel followed by Ы or ы is replaced, as a pair, by Y. NOTE(review): Ы/ы are not in the `::` filter set nor in the alphabet listed in the header - confirm this rule is intended and reachable.
71 ########################################################################
73 # Start of Alphabetic Transformations. Rules are tried in the order written, so multi-character and context rules must precede the plain single-letter rule for the same letter.
75 ########################################################################
77 А → A ; # CYRILLIC CAPITAL LETTER A
78 а → a ; # CYRILLIC SMALL LETTER A
79 Б → B ; # CYRILLIC CAPITAL LETTER BE
80 б → b ; # CYRILLIC SMALL LETTER BE
81 В → W ; # CYRILLIC CAPITAL LETTER VE (romanized W, not V, in this table)
82 в → w ; # CYRILLIC SMALL LETTER VE (romanized w, not v, in this table)
85 ########################################################################
89 # The character sequences гҳ, кҳ, сҳ, and цҳ may be romanized g·h,
90 # k·h, s·h, and ts·h in order to differentiate those romanizations from
91 # the digraphs gh, kh, sh, and the letter sequence tsh, which are used
92 # to render the characters ғ, х, ш, and the character sequence тш.
94 ########################################################################
# The two-letter rules come first so that г + ҳ is consumed as a pair before the plain г rules can match.
96 ГҲ → G·H ; # CAPITAL GHE + CAPITAL HA WITH DESCENDER (all caps)
97 Гҳ → G·h ; # CAPITAL GHE + SMALL HA WITH DESCENDER (title case)
98 гҳ → g·h ; # SMALL GHE + SMALL HA WITH DESCENDER
99 Г → G ; # CYRILLIC CAPITAL LETTER GHE
100 г → g ; # CYRILLIC SMALL LETTER GHE
103 ########################################################################
107 ########################################################################
109 Д → D ; # CYRILLIC CAPITAL LETTER DE; context-free mapping
110 д → d ; # CYRILLIC SMALL LETTER DE; context-free mapping
113 ########################################################################
115 # BGN Page 108 Rule 1:
117 # The character e should be romanized ye initially, after the vowel
118 # characters a, e, ё, и, о, у, э, ю, я, and ў, and after й and ь.
119 # In all other instances, it should be romanized e.
# Rule order matters here: the context rules must stay ahead of the bare Е / е fallbacks.
# NOTE(review): in ICU rule syntax `X } ctx` tests the text FOLLOWING X, and `ctx { X`
# tests the text PRECEDING X. The vowel/й/ь sets below are written as following
# context (`Е}[...]`), whereas Rule 1 above describes letters that come BEFORE е.
# Confirm against the BGN text and ICU before-context behaviour before changing.
121 ########################################################################
123 Е}[$upperVowels [ЙЬ]] → YE ; # capital IE followed by a capital vowel, Й or Ь
124 Е}[$lowerVowels [йь]] → Ye ; # capital IE followed by a small vowel, й or ь
125 $wordBoundary{Е → Ye ; # capital IE preceded by a non-letter/mark/number character
126 Е → E ; # CYRILLIC CAPITAL LETTER IE, all remaining cases
127 е}[$upperVowels $lowerVowels [ЙйЬь]] → ye ; # small IE followed by any vowel, й or ь (either case)
128 $wordBoundary{е → ye ; # small IE preceded by a non-letter/mark/number character
129 е → e ; # CYRILLIC SMALL LETTER IE, all remaining cases
132 ########################################################################
136 ########################################################################
138 Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO followed by a small letter: title case
139 Ё → YO ; # CYRILLIC CAPITAL LETTER IO otherwise: all caps
140 ё → yo ; # CYRILLIC SMALL LETTER IO
141 Ж → J ; # CYRILLIC CAPITAL LETTER ZHE
142 ж → j ; # CYRILLIC SMALL LETTER ZHE
143 З → Z ; # CYRILLIC CAPITAL LETTER ZE
144 з → z ; # CYRILLIC SMALL LETTER ZE
145 И → I ; # CYRILLIC CAPITAL LETTER I
146 и → i ; # CYRILLIC SMALL LETTER I
147 Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
148 й → y ; # CYRILLIC SMALL LETTER SHORT I
151 ########################################################################
153 # BGN Page 108 Rule 2: к + ҳ is written k·h so it cannot be confused with the digraph kh produced for х. The pair rules precede the plain к rules so the pair is matched first.
157 ########################################################################
159 КҲ → K·H ; # CAPITAL KA + CAPITAL HA WITH DESCENDER (all caps)
160 Кҳ → K·h ; # CAPITAL KA + SMALL HA WITH DESCENDER (title case)
161 кҳ → k·h ; # SMALL KA + SMALL HA WITH DESCENDER
162 К → K ; # CYRILLIC CAPITAL LETTER KA
163 к → k ; # CYRILLIC SMALL LETTER KA
166 ########################################################################
170 ########################################################################
# Context-free one-to-one mappings for Л, М, Н, О, П, Р in both cases.
172 Л → L ; # CYRILLIC CAPITAL LETTER EL
173 л → l ; # CYRILLIC SMALL LETTER EL
174 М → M ; # CYRILLIC CAPITAL LETTER EM
175 м → m ; # CYRILLIC SMALL LETTER EM
176 Н → N ; # CYRILLIC CAPITAL LETTER EN
177 н → n ; # CYRILLIC SMALL LETTER EN
178 О → O ; # CYRILLIC CAPITAL LETTER O
179 о → o ; # CYRILLIC SMALL LETTER O
180 П → P ; # CYRILLIC CAPITAL LETTER PE
181 п → p ; # CYRILLIC SMALL LETTER PE
182 Р → R ; # CYRILLIC CAPITAL LETTER ER
183 р → r ; # CYRILLIC SMALL LETTER ER
186 ########################################################################
188 # BGN Page 108 Rule 2: с + ҳ is written s·h so it cannot be confused with the digraph sh produced for ш. The pair rules precede the plain с rules so the pair is matched first.
192 ########################################################################
194 СҲ → S·H ; # CAPITAL ES + CAPITAL HA WITH DESCENDER (all caps)
195 Сҳ → S·h ; # CAPITAL ES + SMALL HA WITH DESCENDER (title case)
196 сҳ → s·h ; # SMALL ES + SMALL HA WITH DESCENDER
197 С → S ; # CYRILLIC CAPITAL LETTER ES
198 с → s ; # CYRILLIC SMALL LETTER ES
201 ########################################################################
205 ########################################################################
207 Т → T ; # CYRILLIC CAPITAL LETTER TE
208 т → t ; # CYRILLIC SMALL LETTER TE
209 У → Ū ; # CYRILLIC CAPITAL LETTER U (output carries a macron)
210 у → ū ; # CYRILLIC SMALL LETTER U (output carries a macron)
211 Ф → F ; # CYRILLIC CAPITAL LETTER EF
212 ф → f ; # CYRILLIC SMALL LETTER EF
213 Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA followed by a small letter: title case
214 Х → KH ; # CYRILLIC CAPITAL LETTER HA otherwise: all caps
215 х → kh ; # CYRILLIC SMALL LETTER HA
218 ########################################################################
220 # BGN Page 108 Rule 2: ц + ҳ is written ts·h so it cannot be confused with the sequence tsh. The pair rules precede the plain ц rules so the pair is matched first.
224 ########################################################################
226 ЦҲ → TS·H ; # CAPITAL TSE + CAPITAL HA WITH DESCENDER (all caps)
227 Цҳ → Ts·h ; # CAPITAL TSE + SMALL HA WITH DESCENDER (title case)
228 цҳ → ts·h ; # SMALL TSE + SMALL HA WITH DESCENDER
229 Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE followed by a small letter: title case
230 Ц → TS ; # CYRILLIC CAPITAL LETTER TSE otherwise: all caps
231 ц → ts ; # CYRILLIC SMALL LETTER TSE
234 ########################################################################
238 ########################################################################
240 Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE followed by a small letter: title case
241 Ч → CH ; # CYRILLIC CAPITAL LETTER CHE otherwise: all caps
242 ч → ch ; # CYRILLIC SMALL LETTER CHE
243 Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA followed by a small letter: title case
244 Ш → SH ; # CYRILLIC CAPITAL LETTER SHA otherwise: all caps
245 ш → sh ; # CYRILLIC SMALL LETTER SHA
# Hard and soft signs, in either case, all produce the same $prime output.
# NOTE(review): $prime is not assigned in the variable section visible in this file - confirm it is defined before this point.
246 [Ъъ] → $prime ; # CYRILLIC CAPITAL / SMALL LETTER HARD SIGN
248 [Ьь] → $prime ; # CYRILLIC CAPITAL / SMALL LETTER SOFT SIGN
250 Э → E ; # CYRILLIC CAPITAL LETTER E: capital input yields capital Latin E, like every other capital rule in this table
251 э → e ; # CYRILLIC SMALL LETTER E
252 Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU followed by a small letter: title case
253 Ю → YU ; # CYRILLIC CAPITAL LETTER YU otherwise: all caps
254 ю → yu ; # CYRILLIC SMALL LETTER YU
255 Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA followed by a small letter: title case
256 Я → YA ; # CYRILLIC CAPITAL LETTER YA otherwise: all caps
257 я → ya ; # CYRILLIC SMALL LETTER YA
# The four letters the header lists as Uzbek additions to the Russian alphabet: Ў, Қ, Ғ, Ҳ.
258 Ў → Ŭ ; # CYRILLIC CAPITAL LETTER SHORT U
259 ў → ŭ ; # CYRILLIC SMALL LETTER SHORT U
260 Қ → Q ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
261 қ → q ; # CYRILLIC SMALL LETTER KA WITH DESCENDER
262 Ғ} $lower → Gh ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE followed by a small letter: title case
263 Ғ → GH ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE otherwise: all caps
264 ғ → gh ; # CYRILLIC SMALL LETTER GHE WITH STROKE
265 Ҳ → H ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
266 ҳ → h ; # CYRILLIC SMALL LETTER HA WITH DESCENDER
269 ########################################################################