]> git.saurik.com Git - apple/icu.git/blob - icuSources/data/translit/mk_mk_Latn_BGN.txt
ICU-66108.tar.gz
[apple/icu.git] / icuSources / data / translit / mk_mk_Latn_BGN.txt
1 # © 2016 and later: Unicode, Inc. and others.
2 # License & terms of use: http://www.unicode.org/copyright.html#License
3 #
4 # File: mk_mk_Latn_BGN.txt
5 # Generated from CLDR
6 #
7
8 #
9 ########################################################################
10 # BGN/PCGN 1981 System
11 #
12 # Macedonian was officially established as a literary language in
13 # Yugoslavia during World War II and is now the official language
14 # of Macedonia. Its alphabet is identical to Serbian, except
15 # that the letters Ђђ and Ћћ are replaced by Ѓѓ and Ќќ, and
16 # the letter Ѕѕ and the apostrophe are added.
17 #
18 # The Macedonian Alphabet as defined by the BGN (Page 69):
19 #
20 # АБВГДЃЕЖЗЅИЈКЛЉМНЊОПРСТЌУФХЦЧЏШ
21 # абвгдѓежзѕијклљмнњопрстќуфхцчџш’
22 #
23 # Originally prepared by Michael Everson <everson@evertype.com>
24 ########################################################################
25 #
26 # MINIMAL FILTER: Macedonian-Latin
27 # The set below lists the same letters (plus ’) as the alphabet quoted in the header.
28 :: [АБВГДЃЕЖЗЅИЈКЛЉМНЊОПРСТЌУФХЦЧЏШабвгдѓежзѕијклљмнњопрстќуфхцчџш’] ;
29 :: NFD (NFC) ;
30 # NOTE(review): NFD decomposes Ѓ ѓ Ќ ќ into Г г К к + U+0301, so the precomposed
31 # Ѓ/Ќ rules further down may never see their input -- TODO confirm against ICU output.
32 ########################################################################
33 #
34 ########################################################################
35 #
36 # Define All Transformation Variables
37 #
38 ########################################################################
39 # Character classes; $lower (which includes ’) is the look-ahead context of the title-case digraph rules.
40 $prime = ’ ;
41 $upperConsonants = [БВГДЃЖЗЅЈКЛЉМНЊПРСТЌФХЦЧЏШ] ;
42 $lowerConsonants = [бвгдѓжзѕјклљмнњпрстќфхцчџш’] ;
43 $consonants = [$upperConsonants $lowerConsonants] ;
44 $upperVowels = [АЕИОУ] ;
45 $lowerVowels = [аеиоу] ;
46 $vowels = [$upperVowels $lowerVowels] ;
47 $lower = [$lowerConsonants $lowerVowels] ;
48 #
49 # $wordBoundary matches any character that is not a letter ([:L:]), mark ([:M:]) or number ([:N:]).
50 # Use this $wordBoundary until bug 2034 is fixed in ICU:
51 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
52 #
53 $wordBoundary = [^[:L:][:M:][:N:]] ;
54 #
55 #
56 ########################################################################
57 #
58 ########################################################################
59 #
60 # Start of Alphabetic Transformations
61 #
62 ########################################################################
63 # Context-free one-to-one letter mappings, А through Д.
64 А → A ; # CYRILLIC CAPITAL LETTER A
65 а → a ; # CYRILLIC SMALL LETTER A
66 Б → B ; # CYRILLIC CAPITAL LETTER BE
67 б → b ; # CYRILLIC SMALL LETTER BE
68 В → V ; # CYRILLIC CAPITAL LETTER VE
69 в → v ; # CYRILLIC SMALL LETTER VE
70 Г → G ; # CYRILLIC CAPITAL LETTER GHE
71 г → g ; # CYRILLIC SMALL LETTER GHE
72 Д → D ; # CYRILLIC CAPITAL LETTER DE
73 д → d ; # CYRILLIC SMALL LETTER DE
74 #
75 #
76 ########################################################################
77 #
78 # BGN Page 70 Rule 1:
79 #
80 # The character ѓ should be romanized g when it occurs before е
81 # and и. In all other instances, it should be romanized đ (Đ).
82 #
83 ########################################################################
84 # The look-ahead rules (before Е е И и) are listed first so they are tried before the unconditional fallbacks.
85 Ѓ}[ЕеИи] → G ; # CYRILLIC CAPITAL LETTER GJE
86 ѓ}[ЕеИи] → g ; # CYRILLIC SMALL LETTER GJE
87 Ѓ → Đ ; # CYRILLIC CAPITAL LETTER GJE
88 ѓ → đ ; # CYRILLIC SMALL LETTER GJE
89 #
90 #
91 ########################################################################
92 #
93 # End Rule 1
94 #
95 ########################################################################
96 #
97 Е → E ; # CYRILLIC CAPITAL LETTER IE
98 е → e ; # CYRILLIC SMALL LETTER IE
99 Ж → Ž ; # CYRILLIC CAPITAL LETTER ZHE
100 ж → ž ; # CYRILLIC SMALL LETTER ZHE
101 З → Z ; # CYRILLIC CAPITAL LETTER ZE
102 з → z ; # CYRILLIC SMALL LETTER ZE
103 Ѕ} $lower → Dz ; # CYRILLIC CAPITAL LETTER DZE (title case before a $lower character)
104 Ѕ → DZ ; # CYRILLIC CAPITAL LETTER DZE
105 ѕ → dz ; # CYRILLIC SMALL LETTER DZE
106 И → I ; # CYRILLIC CAPITAL LETTER I
107 и → i ; # CYRILLIC SMALL LETTER I
108 Ј → J ; # CYRILLIC CAPITAL LETTER JE
109 ј → j ; # CYRILLIC SMALL LETTER JE
110 К → K ; # CYRILLIC CAPITAL LETTER KA
111 к → k ; # CYRILLIC SMALL LETTER KA
112 Л → L ; # CYRILLIC CAPITAL LETTER EL
113 л → l ; # CYRILLIC SMALL LETTER EL
114 Љ} $lower → Lj ; # CYRILLIC CAPITAL LETTER LJE (title case before a $lower character)
115 Љ → LJ ; # CYRILLIC CAPITAL LETTER LJE
116 љ → lj ; # CYRILLIC SMALL LETTER LJE
117 М → M ; # CYRILLIC CAPITAL LETTER EM
118 м → m ; # CYRILLIC SMALL LETTER EM
119 Н → N ; # CYRILLIC CAPITAL LETTER EN
120 н → n ; # CYRILLIC SMALL LETTER EN
121 Њ} $lower → Nj ; # CYRILLIC CAPITAL LETTER NJE (title case before a $lower character)
122 Њ → NJ ; # CYRILLIC CAPITAL LETTER NJE
123 њ → nj ; # CYRILLIC SMALL LETTER NJE
124 О → O ; # CYRILLIC CAPITAL LETTER O
125 о → o ; # CYRILLIC SMALL LETTER O
126 П → P ; # CYRILLIC CAPITAL LETTER PE
127 п → p ; # CYRILLIC SMALL LETTER PE
128 Р → R ; # CYRILLIC CAPITAL LETTER ER
129 р → r ; # CYRILLIC SMALL LETTER ER
130 С → S ; # CYRILLIC CAPITAL LETTER ES
131 с → s ; # CYRILLIC SMALL LETTER ES
132 Т → T ; # CYRILLIC CAPITAL LETTER TE
133 т → t ; # CYRILLIC SMALL LETTER TE
134 #
135 #
136 ########################################################################
137 #
138 # BGN Page 70 Rule 2:
139 #
140 # The character ќ should be romanized k when it occurs before е
141 # and и. In all other instances, it should be romanized c\u0301.
142 #
143 ########################################################################
144 # The look-ahead rules (before Е е И и) are listed first so they are tried before the unconditional fallbacks.
145 Ќ}[ЕеИи] → K ; # CYRILLIC CAPITAL LETTER KJE
146 ќ}[ЕеИи] → k ; # CYRILLIC SMALL LETTER KJE
147 Ќ → C\u0301 ; # CYRILLIC CAPITAL LETTER KJE
148 ќ → c\u0301 ; # CYRILLIC SMALL LETTER KJE
149 #
150 #
151 ########################################################################
152 #
153 # End Rule 2
154 #
155 ########################################################################
156 #
157 У → U ; # CYRILLIC CAPITAL LETTER U
158 у → u ; # CYRILLIC SMALL LETTER U
159 Ф → F ; # CYRILLIC CAPITAL LETTER EF
160 ф → f ; # CYRILLIC SMALL LETTER EF
161 Х → H ; # CYRILLIC CAPITAL LETTER HA
162 х → h ; # CYRILLIC SMALL LETTER HA
163 Ц → C ; # CYRILLIC CAPITAL LETTER TSE
164 ц → c ; # CYRILLIC SMALL LETTER TSE
165 Ч → Č ; # CYRILLIC CAPITAL LETTER CHE
166 ч → č ; # CYRILLIC SMALL LETTER CHE
167 Џ} $lower → Dž ; # CYRILLIC CAPITAL LETTER DZHE (title case before a $lower character)
168 Џ → DŽ ; # CYRILLIC CAPITAL LETTER DZHE
169 џ → dž ; # CYRILLIC SMALL LETTER DZHE
170 Ш → Š ; # CYRILLIC CAPITAL LETTER SHA
171 ш → š ; # CYRILLIC SMALL LETTER SHA
172 #
173 #
174 ########################################################################
175 #
176 # BGN Page 69 Rule 32 maps the symbol onto itself, so it
177 # is omitted here for computational efficiency.
178 #
179 # $prime → $prime ; # RIGHT SINGLE QUOTATION MARK
180 #
181 ########################################################################
182