]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | # © 2016 and later: Unicode, Inc. and others. |
2 | # License & terms of use: http://www.unicode.org/copyright.html#License | |
3 | # | |
2ca993e8 | 4 | # File: uz_Cyrl_uz_BGN.txt |
f3c0d7a5 | 5 | # Generated from CLDR |
729e4ab9 | 6 | # |
2ca993e8 A |
7 | |
8 | # | |
9 | ######################################################################## | |
10 | # BGN/PCGN 1979 System | |
11 | # | |
12 | # The BGN/PCGN system for Uzbek was designed for use in | |
13 | # romanizing names written in the Uzbek alphabet. | |
14 | # The Uzbek alphabet contains four letters not present | |
15 | # in the Russian alphabet: Ўў, Ққ, Ғғ, and Ҳҳ. | |
16 | # | |
17 | # The Uzbek Alphabet as defined by the BGN (Page 107): | |
18 | # | |
19 | # АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲ | |
20 | # абвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ | |
21 | # | |
22 | # Originally prepared by Michael Everson <everson@evertype.com> | |
23 | ######################################################################## | |
24 | # | |
25 | # MINIMAL FILTER: Uzbek-Latin | |
26 | # | |
729e4ab9 A |
27 | :: [АБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЪЬЭЮЯЎҚҒҲабвгдеёжзийклмнопрстуфхцчшъьэюяўқғҳ] ; |
28 | :: NFD (NFC) ; | |
2ca993e8 A |
29 | # |
30 | # | |
31 | ######################################################################## | |
32 | # | |
33 | ######################################################################## | |
34 | # | |
35 | # Define All Transformation Variables | |
36 | # | |
37 | ######################################################################## | |
38 | # | |
51004dcb | 39 | $prime = ʹ ; |
729e4ab9 A |
40 | $doublePrime = ʺ ; |
41 | $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЪЬҚҒҲ] ; | |
42 | $lowerConsonants = [бвгджзйклмнпрстфхцчшъьқғҳ] ; | |
43 | $consonants = [$upperConsonants $lowerConsonants] ; | |
44 | $upperVowels = [АЕЁИОУЭЮЯЎ] ; | |
45 | $lowerVowels = [аеёиоуэюяў] ; | |
46 | $vowels = [$upperVowels $lowerVowels] ; | |
47 | $lower = [$lowerConsonants $lowerVowels] ; | |
2ca993e8 A |
48 | # |
49 | # | |
50 | # Use this $wordBoundary until bug 2034 is fixed in ICU: | |
51 | # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest | |
52 | # | |
51004dcb | 53 | $wordBoundary = [^[:L:][:M:][:N:]] ; |
2ca993e8 A |
54 | # |
55 | # | |
56 | ######################################################################## | |
57 | # | |
58 | ######################################################################## | |
59 | # | |
60 | # Rules moved to front to avoid masking | |
61 | # | |
62 | ######################################################################## | |
63 | # | |
729e4ab9 A |
64 | $lowerVowels ы → y ; |
65 | $upperVowels[Ыы] → Y ; | |
2ca993e8 A |
66 | # |
67 | # | |
68 | ######################################################################## | |
69 | # | |
70 | # Start of Alphabetic Transformations | |
71 | # | |
72 | ######################################################################## | |
73 | # | |
729e4ab9 A |
74 | А → A ; # CYRILLIC CAPITAL LETTER A |
75 | а → a ; # CYRILLIC SMALL LETTER A | |
76 | Б → B ; # CYRILLIC CAPITAL LETTER BE | |
77 | б → b ; # CYRILLIC SMALL LETTER BE | |
78 | В → W ; # CYRILLIC CAPITAL LETTER VE | |
79 | в → w ; # CYRILLIC SMALL LETTER VE | |
2ca993e8 A |
80 | # |
81 | # | |
82 | ######################################################################## | |
83 | # | |
84 | # BGN Page 108 Rule 2 | |
85 | # | |
86 | # The character sequences гҳ, кҳ, сҳ, and цҳ may be romanized g·h, | |
87 | # k·h, s·h, and ts·h in order to differentiate those romanizations from | |
88 | # the digraphs gh, kh, sh, and the letter sequence tsh, which are used | |
89 | # to render the characters ғ, х, ш, and the character sequence тш. | |
90 | # | |
91 | ######################################################################## | |
92 | # | |
729e4ab9 A |
93 | ГҲ → G·H ; # CYRILLIC CAPITAL LETTER GHE |
94 | Гҳ → G·h ; # CYRILLIC CAPITAL LETTER GHE | |
95 | гҳ → g·h ; # CYRILLIC SMALL LETTER GHE | |
96 | Г → G ; # CYRILLIC CAPITAL LETTER GHE | |
97 | г → g ; # CYRILLIC SMALL LETTER GHE | |
2ca993e8 A |
98 | # |
99 | # | |
100 | ######################################################################## | |
101 | # | |
102 | # End Rule 2 | |
103 | # | |
104 | ######################################################################## | |
105 | # | |
729e4ab9 A |
106 | Д → D ; # CYRILLIC CAPITAL LETTER DE |
107 | д → d ; # CYRILLIC SMALL LETTER DE | |
2ca993e8 A |
108 | # |
109 | # | |
110 | ######################################################################## | |
111 | # | |
112 | # BGN Page 108 Rule 1: | |
113 | # | |
114 | # The character e should be romanized ye initially, after the vowel | |
115 | # characters a, e, ё, и, о, у, э, ю, я, and ў, and after й and ь. | |
116 | # In all other instances, it should be romanized e. | |
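117 | # NOTE(review): the rules below write the context as Е}[...] / е}[...], which in ICU rule syntax tests the text FOLLOWING the letter, while Rule 1 speaks of the PRECEDING letter - confirm intent. | |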
118 | ######################################################################## | |
119 | # | |
729e4ab9 A |
120 | Е}[$upperVowels [ЙЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE |
121 | Е}[$lowerVowels [йь]] → Ye ; # CYRILLIC CAPITAL LETTER IE | |
122 | $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE | |
51004dcb | 123 | Е → E ; # CYRILLIC CAPITAL LETTER IE |
729e4ab9 A |
124 | е}[$upperVowels $lowerVowels [ЙйЬь]] → ye ; # CYRILLIC SMALL LETTER IE |
125 | $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE | |
51004dcb | 126 | е → e ; # CYRILLIC SMALL LETTER IE |
2ca993e8 A |
127 | # |
128 | # | |
129 | ######################################################################## | |
130 | # | |
131 | # End of Rule 1 | |
132 | # | |
133 | ######################################################################## | |
134 | # | |
729e4ab9 A |
135 | Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO |
136 | Ё → YO ; # CYRILLIC CAPITAL LETTER IO | |
137 | ё → yo ; # CYRILLIC SMALL LETTER IO | |
138 | Ж → J ; # CYRILLIC CAPITAL LETTER ZHE | |
139 | ж → j ; # CYRILLIC SMALL LETTER ZHE | |
140 | З → Z ; # CYRILLIC CAPITAL LETTER ZE | |
141 | з → z ; # CYRILLIC SMALL LETTER ZE | |
142 | И → I ; # CYRILLIC CAPITAL LETTER I | |
143 | и → i ; # CYRILLIC SMALL LETTER I | |
144 | Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I | |
145 | й → y ; # CYRILLIC SMALL LETTER SHORT I | |
2ca993e8 A |
146 | # |
147 | # | |
148 | ######################################################################## | |
149 | # | |
150 | # BGN Page 108 Rule 2 | |
151 | # | |
152 | # кҳ becomes k·h | |
153 | # | |
154 | ######################################################################## | |
155 | # | |
729e4ab9 A |
156 | КҲ → K·H ; # CYRILLIC CAPITAL LETTER KA |
157 | Кҳ → K·h ; # CYRILLIC CAPITAL LETTER KA | |
158 | кҳ → k·h ; # CYRILLIC SMALL LETTER KA | |
159 | К → K ; # CYRILLIC CAPITAL LETTER KA | |
160 | к → k ; # CYRILLIC SMALL LETTER KA | |
2ca993e8 A |
161 | # |
162 | # | |
163 | ######################################################################## | |
164 | # | |
165 | # End Rule 2 | |
166 | # | |
167 | ######################################################################## | |
168 | # | |
729e4ab9 A |
169 | Л → L ; # CYRILLIC CAPITAL LETTER EL |
170 | л → l ; # CYRILLIC SMALL LETTER EL | |
171 | М → M ; # CYRILLIC CAPITAL LETTER EM | |
172 | м → m ; # CYRILLIC SMALL LETTER EM | |
173 | Н → N ; # CYRILLIC CAPITAL LETTER EN | |
174 | н → n ; # CYRILLIC SMALL LETTER EN | |
175 | О → O ; # CYRILLIC CAPITAL LETTER O | |
176 | о → o ; # CYRILLIC SMALL LETTER O | |
177 | П → P ; # CYRILLIC CAPITAL LETTER PE | |
178 | п → p ; # CYRILLIC SMALL LETTER PE | |
179 | Р → R ; # CYRILLIC CAPITAL LETTER ER | |
180 | р → r ; # CYRILLIC SMALL LETTER ER | |
2ca993e8 A |
181 | # |
182 | # | |
183 | ######################################################################## | |
184 | # | |
185 | # BGN Page 108 Rule 2 | |
186 | # | |
187 | # сҳ becomes s·h | |
188 | # | |
189 | ######################################################################## | |
190 | # | |
729e4ab9 A |
191 | СҲ → S·H ; # CYRILLIC CAPITAL LETTER ES |
192 | Сҳ → S·h ; # CYRILLIC CAPITAL LETTER ES | |
193 | сҳ → s·h ; # CYRILLIC SMALL LETTER ES | |
194 | С → S ; # CYRILLIC CAPITAL LETTER ES | |
195 | с → s ; # CYRILLIC SMALL LETTER ES | |
2ca993e8 A |
196 | # |
197 | # | |
198 | ######################################################################## | |
199 | # | |
200 | # End Rule 2 | |
201 | # | |
202 | ######################################################################## | |
203 | # | |
729e4ab9 A |
204 | Т → T ; # CYRILLIC CAPITAL LETTER TE |
205 | т → t ; # CYRILLIC SMALL LETTER TE | |
206 | У → Ū ; # CYRILLIC CAPITAL LETTER U | |
207 | у → ū ; # CYRILLIC SMALL LETTER U | |
208 | Ф → F ; # CYRILLIC CAPITAL LETTER EF | |
209 | ф → f ; # CYRILLIC SMALL LETTER EF | |
210 | Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA | |
211 | Х → KH ; # CYRILLIC CAPITAL LETTER HA | |
212 | х → kh ; # CYRILLIC SMALL LETTER HA | |
2ca993e8 A |
213 | # |
214 | # | |
215 | ######################################################################## | |
216 | # | |
217 | # BGN Page 108 Rule 2 | |
218 | # | |
219 | # цҳ becomes ts·h | |
220 | # | |
221 | ######################################################################## | |
222 | # | |
729e4ab9 A |
223 | ЦҲ → TS·H ; # CYRILLIC CAPITAL LETTER TSE + CAPITAL HA WITH DESCENDER |
224 | Цҳ → Ts·h ; # CYRILLIC CAPITAL LETTER TSE + SMALL HA WITH DESCENDER | |
225 | цҳ → ts·h ; # CYRILLIC SMALL LETTER TSE + SMALL HA WITH DESCENDER | |
226 | Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE | |
227 | Ц → TS ; # CYRILLIC CAPITAL LETTER TSE | |
228 | ц → ts ; # CYRILLIC SMALL LETTER TSE | |
2ca993e8 A |
229 | # |
230 | # | |
231 | ######################################################################## | |
232 | # | |
233 | # End Rule 2 | |
234 | # | |
235 | ######################################################################## | |
236 | # | |
729e4ab9 A |
237 | Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE |
238 | Ч → CH ; # CYRILLIC CAPITAL LETTER CHE | |
239 | ч → ch ; # CYRILLIC SMALL LETTER CHE | |
240 | Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA | |
241 | Ш → SH ; # CYRILLIC CAPITAL LETTER SHA | |
242 | ш → sh ; # CYRILLIC SMALL LETTER SHA | |
243 | Ъ → $prime ; # CYRILLIC CAPITAL LETTER HARD SIGN | |
244 | ъ → $prime ; # CYRILLIC SMALL LETTER HARD SIGN | |
245 | Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN | |
246 | ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN | |
247 | Э → E ; # CYRILLIC CAPITAL LETTER E (capital maps to capital, like every other letter pair) | |
248 | э → e ; # CYRILLIC SMALL LETTER E | |
249 | Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU | |
250 | Ю → YU ; # CYRILLIC CAPITAL LETTER YU | |
251 | ю → yu ; # CYRILLIC SMALL LETTER YU | |
252 | Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA | |
253 | Я → YA ; # CYRILLIC CAPITAL LETTER YA | |
254 | я → ya ; # CYRILLIC SMALL LETTER YA | |
255 | Ў → Ŭ ; # CYRILLIC CAPITAL LETTER SHORT U | |
256 | ў → ŭ ; # CYRILLIC SMALL LETTER SHORT U | |
257 | Қ → Q ; # CYRILLIC CAPITAL LETTER KA WITH DESCENDER | |
258 | қ → q ; # CYRILLIC SMALL LETTER KA WITH DESCENDER | |
259 | Ғ} $lower → Gh ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE | |
260 | Ғ → GH ; # CYRILLIC CAPITAL LETTER GHE WITH STROKE | |
261 | ғ → gh ; # CYRILLIC SMALL LETTER GHE WITH STROKE | |
262 | Ҳ → H ; # CYRILLIC CAPITAL LETTER HA WITH DESCENDER | |
263 | ҳ → h ; # CYRILLIC SMALL LETTER HA WITH DESCENDER | |
2ca993e8 A |
264 | # |
265 | # | |
266 | ######################################################################## | |
267 |