]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | # © 2016 and later: Unicode, Inc. and others. |
2 | # License & terms of use: http://www.unicode.org/copyright.html#License | |
3 | # | |
2ca993e8 | 4 | # File: tk_Cyrl_tk_BGN.txt |
f3c0d7a5 | 5 | # Generated from CLDR |
729e4ab9 | 6 | # |
2ca993e8 A |
7 | |
8 | # | |
9 | ######################################################################## | |
10 | # BGN/PCGN 1979 System | |
11 | # | |
12 | # The BGN/PCGN system for Turkmen was designed for use in | |
13 | # romanizing names written in the Turkmen alphabet. | |
14 | # The Turkmen alphabet contains five letters not present | |
15 | # in the Russian alphabet: Җҗ, Ңң, Өө, Үү, and Әә. | |
16 | # | |
17 | # The Turkmen Cyrillic Alphabet as defined by the BGN (Page 103): | |
18 | # | |
19 | # АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯ | |
20 | # абвгдеёжҗзийклмнңоөпрстуүфхцчшщъыьэәюя | |
21 | # | |
22 | # Originally prepared by Michael Everson <everson@evertype.com> | |
23 | ######################################################################## | |
24 | # | |
25 | # MINIMAL FILTER: Turkmen-Latin | |
26 | # | |
27 | # :: [АБВГДЕЁЖҖЗИЙКЛМНҢОӨПРСТУҮФХЦЧШЩЪЫЬЭӘЮЯабвгдеёжзҗийклмнңоөпрстуүфхцчшщъыьэәюя] ; | |
729e4ab9 | 28 | :: NFD (NFC) ; |
2ca993e8 A |
29 | # |
30 | # | |
31 | ######################################################################## | |
32 | # | |
33 | ######################################################################## | |
34 | # | |
35 | # Define All Transformation Variables | |
36 | # | |
37 | ######################################################################## | |
38 | # | |
51004dcb | 39 | $prime = ʹ ; |
729e4ab9 A |
40 | $doublePrime = ʺ ; |
41 | $upperConsonants = [БВГДЖҖЗЙКЛМНҢПРСТФХЦЧШЩЪЬ] ; | |
42 | $lowerConsonants = [бвгджҗзйклмнңпрстфхцчшщъь] ; | |
43 | $consonants = [$upperConsonants $lowerConsonants] ; | |
44 | $upperVowels = [АЕЁИОӨУҮЫЭӘЮЯ] ; | |
45 | $lowerVowels = [аеёиоөуүыэәюя] ; | |
46 | $vowels = [$upperVowels $lowerVowels] ; | |
47 | $lower = [$lowerConsonants $lowerVowels] ; | |
2ca993e8 A |
48 | # |
49 | # | |
50 | # Use this $wordBoundary until bug 2034 is fixed in ICU: | |
51 | # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest | |
52 | # | |
51004dcb | 53 | $wordBoundary = [^[:L:][:M:][:N:]] ; |
2ca993e8 A |
54 | # |
55 | # | |
56 | ######################################################################## | |
57 | # | |
58 | ######################################################################## | |
59 | # | |
60 | # Start of Alphabetic Transformations | |
61 | # | |
62 | ######################################################################## | |
63 | # | |
729e4ab9 A |
64 | А → A ; # CYRILLIC CAPITAL LETTER A |
65 | а → a ; # CYRILLIC SMALL LETTER A | |
66 | Б → B ; # CYRILLIC CAPITAL LETTER BE | |
67 | б → b ; # CYRILLIC SMALL LETTER BE | |
68 | В → W ; # CYRILLIC CAPITAL LETTER VE | |
69 | в → w ; # CYRILLIC SMALL LETTER VE | |
70 | Г → G ; # CYRILLIC CAPITAL LETTER GHE | |
71 | г → g ; # CYRILLIC SMALL LETTER GHE | |
72 | Д → D ; # CYRILLIC CAPITAL LETTER DE | |
73 | д → d ; # CYRILLIC SMALL LETTER DE | |
2ca993e8 A |
74 | # |
75 | # | |
76 | ######################################################################## | |
77 | # | |
78 | # BGN Page 104 Rule 1: | |
79 | # | |
80 | # The character e should be romanized ye initially, after the vowel | |
81 | # characters a, e, ё, и, о, ө, у, ү, ы, э, ю, and я, and after й, ъ, and ь. | |
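82 | # In all other instances, it should be romanized e. NOTE(review): the vowel/й/ъ/ь rules below use "}" and so test the character FOLLOWING Е/е, not the preceding one as this rule states; confirm intent against the BGN text. | |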
83 | # | |
84 | ######################################################################## | |
85 | # | |
729e4ab9 A |
86 | Е}[[$upperVowels - [Ә]] [ЙЪЬ]] → YE ; # CYRILLIC CAPITAL LETTER IE |
87 | Е}[[$lowerVowels - [ә]] [йъь]] → Ye ; # CYRILLIC CAPITAL LETTER IE | |
88 | $wordBoundary{Е → Ye ; # CYRILLIC CAPITAL LETTER IE | |
51004dcb | 89 | Е → E ; # CYRILLIC CAPITAL LETTER IE |
729e4ab9 A |
90 | е}[[$upperVowels - [Ә]] [$lowerVowels - [ә]] [ЙйЪъЬь]] → ye ; # CYRILLIC SMALL LETTER IE |
91 | $wordBoundary{е → ye ; # CYRILLIC SMALL LETTER IE | |
51004dcb | 92 | е → e ; # CYRILLIC SMALL LETTER IE |
2ca993e8 A |
93 | # |
94 | # | |
95 | ######################################################################## | |
96 | # | |
97 | # End of Rule 1 | |
98 | # | |
99 | ######################################################################## | |
100 | # | |
729e4ab9 A |
101 | Ё} $lower → Yo ; # CYRILLIC CAPITAL LETTER IO |
102 | Ё → YO ; # CYRILLIC CAPITAL LETTER IO | |
103 | ё → yo ; # CYRILLIC SMALL LETTER IO | |
104 | Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE (title case before a lowercase letter) | |
105 | Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE | |
106 | ж → zh ; # CYRILLIC SMALL LETTER ZHE | |
 | Җ → J ; # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER (listed in the alphabet above; BGN romanizes it J) | |
 | җ → j ; # CYRILLIC SMALL LETTER ZHE WITH DESCENDER | |
2ca993e8 A |
107 | # |
108 | # | |
109 | ######################################################################## | |
110 | # | |
111 | # BGN Page 104 Rule 2 | |
112 | # | |
113 | # The character sequences зх, нг, сх, and цх may be romanized z·h, | |
114 | # n·g, s·h, and ts·h in order to differentiate those romanizations from | |
115 | # the digraphs zh, ng, sh, and the letter sequence tsh, which are used | |
116 | # to render the characters ж, ң, ш, and the character sequence тш. | |
117 | # | |
118 | ######################################################################## | |
119 | # | |
729e4ab9 A |
120 | ЗХ → Z·H ; # CYRILLIC CAPITAL LETTER ZE |
121 | Зх → Z·h ; # CYRILLIC CAPITAL LETTER ZE | |
122 | зх → z·h ; # CYRILLIC SMALL LETTER ZE | |
123 | З → Z ; # CYRILLIC CAPITAL LETTER ZE | |
124 | з → z ; # CYRILLIC SMALL LETTER ZE | |
2ca993e8 A |
125 | # |
126 | # | |
127 | ######################################################################## | |
128 | # | |
129 | # End Rule 2 | |
130 | # | |
131 | ######################################################################## | |
132 | # | |
729e4ab9 A |
133 | И → I ; # CYRILLIC CAPITAL LETTER I (romanized as Latin I, not left as Cyrillic) |
134 | и → i ; # CYRILLIC SMALL LETTER I | |
135 | Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I | |
136 | й → y ; # CYRILLIC SMALL LETTER SHORT I | |
137 | К → K ; # CYRILLIC CAPITAL LETTER KA | |
138 | к → k ; # CYRILLIC SMALL LETTER KA | |
139 | Л → L ; # CYRILLIC CAPITAL LETTER EL | |
140 | л → l ; # CYRILLIC SMALL LETTER EL | |
141 | М → M ; # CYRILLIC CAPITAL LETTER EM | |
142 | м → m ; # CYRILLIC SMALL LETTER EM | |
2ca993e8 A |
143 | # |
144 | # | |
145 | ######################################################################## | |
146 | # | |
147 | # BGN Page 104 Rule 2 | |
148 | # | |
149 | # нг becomes n·g | |
150 | # | |
151 | ######################################################################## | |
152 | # | |
729e4ab9 A |
153 | НГ → N·G ; # CYRILLIC CAPITAL LETTER EN |
154 | Нг → N·g ; # CYRILLIC CAPITAL LETTER EN | |
155 | нг → n·g ; # CYRILLIC SMALL LETTER EN | |
156 | Н → N ; # CYRILLIC CAPITAL LETTER EN | |
157 | н → n ; # CYRILLIC SMALL LETTER EN | |
2ca993e8 A |
158 | # |
159 | # | |
160 | ######################################################################## | |
161 | # | |
162 | # End Rule 2 | |
163 | # | |
164 | ######################################################################## | |
165 | # | |
729e4ab9 A |
166 | Ң} $lower → Ng ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER |
167 | Ң → NG ; # CYRILLIC CAPITAL LETTER EN WITH DESCENDER | |
168 | ң → ng ; # CYRILLIC SMALL LETTER EN WITH DESCENDER | |
169 | О → O ; # CYRILLIC CAPITAL LETTER O | |
170 | о → o ; # CYRILLIC SMALL LETTER O | |
171 | Ө → Ö ; # CYRILLIC CAPITAL LETTER BARRED O | |
172 | ө → ö ; # CYRILLIC SMALL LETTER BARRED O | |
173 | П → P ; # CYRILLIC CAPITAL LETTER PE | |
174 | п → p ; # CYRILLIC SMALL LETTER PE | |
175 | Р → R ; # CYRILLIC CAPITAL LETTER ER | |
176 | р → r ; # CYRILLIC SMALL LETTER ER | |
2ca993e8 A |
177 | # |
178 | # | |
179 | ######################################################################## | |
180 | # | |
181 | # BGN Page 104 Rule 2 | |
182 | # | |
183 | # сх becomes s·h | |
184 | # | |
185 | ######################################################################## | |
186 | # | |
729e4ab9 A |
187 | СХ → S·H ; # CYRILLIC CAPITAL LETTER ES |
188 | Сх → S·h ; # CYRILLIC CAPITAL LETTER ES | |
189 | сх → s·h ; # CYRILLIC SMALL LETTER ES | |
190 | С → S ; # CYRILLIC CAPITAL LETTER ES | |
191 | с → s ; # CYRILLIC SMALL LETTER ES | |
2ca993e8 A |
192 | # |
193 | # | |
194 | ######################################################################## | |
195 | # | |
196 | # End Rule 2 | |
197 | # | |
198 | ######################################################################## | |
199 | # | |
729e4ab9 A |
200 | Т → T ; # CYRILLIC CAPITAL LETTER TE |
201 | т → t ; # CYRILLIC SMALL LETTER TE | |
202 | У → U ; # CYRILLIC CAPITAL LETTER U | |
203 | у → u ; # CYRILLIC SMALL LETTER U | |
204 | Ү → Ü ; # CYRILLIC CAPITAL LETTER STRAIGHT U | |
205 | ү → ü ; # CYRILLIC SMALL LETTER STRAIGHT U | |
206 | Ф → F ; # CYRILLIC CAPITAL LETTER EF | |
207 | ф → f ; # CYRILLIC SMALL LETTER EF | |
208 | Х → H ; # CYRILLIC CAPITAL LETTER HA | |
209 | х → h ; # CYRILLIC SMALL LETTER HA | |
2ca993e8 A |
210 | # |
211 | # | |
212 | ######################################################################## | |
213 | # | |
214 | # BGN Page 104 Rule 2 | |
215 | # | |
216 | # цх becomes ts·h | |
217 | # | |
218 | ######################################################################## | |
219 | # | |
729e4ab9 A |
220 | ЦХ → TS·H ; # CYRILLIC CAPITAL LETTER TSE followed by HA (Rule 2: keep ts·h distinct from tsh) |
221 | Цх → Ts·h ; # CYRILLIC CAPITAL LETTER TSE followed by small HA | |
222 | цх → ts·h ; # CYRILLIC SMALL LETTER TSE followed by small HA | |
223 | Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE | |
224 | Ц → TS ; # CYRILLIC CAPITAL LETTER TSE | |
225 | ц → ts ; # CYRILLIC SMALL LETTER TSE | |
2ca993e8 A |
226 | # |
227 | # | |
228 | ######################################################################## | |
229 | # | |
230 | # End Rule 2 | |
231 | # | |
232 | ######################################################################## | |
233 | # | |
729e4ab9 A |
234 | Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE |
235 | Ч → CH ; # CYRILLIC CAPITAL LETTER CHE | |
236 | ч → ch ; # CYRILLIC SMALL LETTER CHE | |
2ca993e8 A |
237 | # |
238 | # | |
239 | ######################################################################## | |
240 | # | |
241 | # Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6). | |
242 | # | |
243 | # шч becomes sh·ch | |
244 | # | |
245 | ######################################################################## | |
246 | # | |
729e4ab9 A |
247 | ШЧ → SH·CH ; # CYRILLIC CAPITAL LETTER SHA |
248 | Шч → Sh·ch ; # CYRILLIC CAPITAL LETTER SHA | |
249 | шч → sh·ch ; # CYRILLIC SMALL LETTER SHA | |
250 | Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA | |
251 | Ш → SH ; # CYRILLIC CAPITAL LETTER SHA | |
252 | ш → sh ; # CYRILLIC SMALL LETTER SHA | |
253 | Щ} $lower → Shch ; # CYRILLIC CAPITAL LETTER SHCHA | |
254 | Щ → SHCH ; # CYRILLIC CAPITAL LETTER SHCHA | |
255 | щ → shch ; # CYRILLIC SMALL LETTER SHCHA | |
2ca993e8 A |
256 | # |
257 | # | |
258 | ######################################################################## | |
259 | # | |
260 | # End Implied rule | |
261 | # | |
262 | ######################################################################## | |
263 | # | |
729e4ab9 A |
264 | Ъ → $doublePrime ; # CYRILLIC CAPITAL LETTER HARD SIGN |
265 | ъ → $doublePrime ; # CYRILLIC SMALL LETTER HARD SIGN | |
2ca993e8 A |
266 | # |
267 | # | |
268 | ######################################################################## | |
269 | # | |
270 | # BGN Page 104 Note 3 | |
271 | # | |
272 | # The character Ыы may be romanized Ɨɨ instead of Yy, if so desired. | |
273 | # | |
274 | ######################################################################## | |
275 | # | |
729e4ab9 A |
276 | Ы → Y ; # CYRILLIC CAPITAL LETTER YERU |
277 | ы → y ; # CYRILLIC SMALL LETTER YERU | |
2ca993e8 A |
278 | # |
279 | # | |
280 | # Alternative rule to implement the option described here. To apply | |
281 | # uncomment the following by removing the '#' mark at the start of the | |
282 | # line and insert before the two rule lines above. | |
283 | # | |
284 | #Ы → Ɨ ; # CYRILLIC CAPITAL LETTER YERU | |
285 | #ы → ɨ ; # CYRILLIC SMALL LETTER YERU | |
286 | # | |
287 | ######################################################################## | |
288 | # | |
289 | # End BGN Page 104 Note 3 | |
290 | # | |
291 | ######################################################################## | |
292 | # | |
729e4ab9 A |
293 | Ь → $prime ; # CYRILLIC CAPITAL LETTER SOFT SIGN |
294 | ь → $prime ; # CYRILLIC SMALL LETTER SOFT SIGN | |
295 | Э → E ; # CYRILLIC CAPITAL LETTER E | |
296 | э → e ; # CYRILLIC SMALL LETTER E | |
297 | Ә → Ä ; # CYRILLIC CAPITAL LETTER SCHWA | |
298 | ә → ä ; # CYRILLIC SMALL LETTER SCHWA | |
299 | Ю} $lower → Yu ; # CYRILLIC CAPITAL LETTER YU | |
300 | Ю → YU ; # CYRILLIC CAPITAL LETTER YU | |
301 | ю → yu ; # CYRILLIC SMALL LETTER YU | |
302 | Я} $lower → Ya ; # CYRILLIC CAPITAL LETTER YA | |
303 | Я → YA ; # CYRILLIC CAPITAL LETTER YA | |
304 | я → ya ; # CYRILLIC SMALL LETTER YA | |
2ca993e8 A |
305 | # |
306 | # | |
307 | ######################################################################## | |
308 |