1 # © 2016 and later: Unicode, Inc. and others.
2 # License & terms of use: http://www.unicode.org/copyright.html#License
4 # File: bg_bg_Latn_BGN.txt
9 ########################################################################
10 # BGN/PCGN 1952 System
12 # This system was adopted by the BGN in 1949 and by the PCGN in 1952.
13 # It reflects the much simplified Bulgarian orthography as officially
14 # revised in February 1945. The Bulgarian alphabet contains all of
15 # the characters present in the Russian alphabet with the exception
16 # of Ёё, Ыы, and Ээ. Two obsolete letters Ѫѫ and Ѣѣ are also given.
18 # The Bulgarian Alphabet as defined by the BGN (Page 15):
20 # АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢ
21 # абвгдежзийклмнопрстуфхцчшщъьюяѫѣ
23 # Originally prepared by Michael Everson <everson@evertype.com>
24 ########################################################################
26 # MINIMAL FILTER: Bulgarian-Latin
# Only the Cyrillic letters listed in this set are processed by the rules
# below; any other character passes through unchanged.
28 :: [АБВГДЕЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЬЮЯѪѢабвгдежзийклмнопрстуфхцчшщъьюяѫѣ] ;
32 ########################################################################
34 ########################################################################
36 # Define All Transformation Variables
38 ########################################################################
# Character classes used as rule context. Letters are listed per case
# first and then combined into the broader sets.
40 $upperConsonants = [БВГДЖЗЙКЛМНПРСТФХЦЧШЩЬ] ;
41 $lowerConsonants = [бвгджзйклмнпрстфхцчшщь] ;
42 $consonants      = [ $upperConsonants $lowerConsonants ] ;
43 $upperVowels     = [АЕИОУЪЮЯѪѢ] ;
44 $lowerVowels     = [аеиоуъюяѫѣ] ;
45 $vowels          = [ $upperVowels $lowerVowels ] ;
# Every lowercase letter; used to pick title case for capital digraphs.
46 $lower           = [ $lowerVowels $lowerConsonants ] ;
# Every Bulgarian letter of either case.
47 $bulgarian       = [ $consonants $vowels ] ;
50 # Stand-in word boundary, to be used until ICU bug 2034 is fixed:
51 # http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
# Matches any single character that is not a letter, mark or number.
53 $wordBoundary    = [^ [:L:] [:M:] [:N:] ] ;
56 ########################################################################
58 ########################################################################
60 # Start of Alphabetic Transformations
62 ########################################################################
# Letter-by-letter mappings for А through С. Where a capital romanizes to a
# digraph, the "} $lower" variant is listed first: rules are tried in order,
# so a capital followed by a lowercase letter yields title case (Zh) and a
# capital in any other position yields all caps (ZH).
64 А → A ; # CYRILLIC CAPITAL LETTER A
65 а → a ; # CYRILLIC SMALL LETTER A
66 Б → B ; # CYRILLIC CAPITAL LETTER BE
67 б → b ; # CYRILLIC SMALL LETTER BE
68 В → V ; # CYRILLIC CAPITAL LETTER VE
69 в → v ; # CYRILLIC SMALL LETTER VE
70 Г → G ; # CYRILLIC CAPITAL LETTER GHE
71 г → g ; # CYRILLIC SMALL LETTER GHE
72 Д → D ; # CYRILLIC CAPITAL LETTER DE
73 д → d ; # CYRILLIC SMALL LETTER DE
74 Е → E ; # CYRILLIC CAPITAL LETTER IE
75 е → e ; # CYRILLIC SMALL LETTER IE
76 Ж} $lower → Zh ; # CYRILLIC CAPITAL LETTER ZHE (title case before a lowercase letter)
77 Ж → ZH ; # CYRILLIC CAPITAL LETTER ZHE
78 ж → zh ; # CYRILLIC SMALL LETTER ZHE
79 З → Z ; # CYRILLIC CAPITAL LETTER ZE
80 з → z ; # CYRILLIC SMALL LETTER ZE
81 И → I ; # CYRILLIC CAPITAL LETTER I
82 и → i ; # CYRILLIC SMALL LETTER I
83 Й → Y ; # CYRILLIC CAPITAL LETTER SHORT I
84 й → y ; # CYRILLIC SMALL LETTER SHORT I
85 К → K ; # CYRILLIC CAPITAL LETTER KA
86 к → k ; # CYRILLIC SMALL LETTER KA
87 Л → L ; # CYRILLIC CAPITAL LETTER EL
88 л → l ; # CYRILLIC SMALL LETTER EL
89 М → M ; # CYRILLIC CAPITAL LETTER EM
90 м → m ; # CYRILLIC SMALL LETTER EM
91 Н → N ; # CYRILLIC CAPITAL LETTER EN
92 н → n ; # CYRILLIC SMALL LETTER EN
93 О → O ; # CYRILLIC CAPITAL LETTER O
94 о → o ; # CYRILLIC SMALL LETTER O
95 П → P ; # CYRILLIC CAPITAL LETTER PE
96 п → p ; # CYRILLIC SMALL LETTER PE
97 Р → R ; # CYRILLIC CAPITAL LETTER ER
98 р → r ; # CYRILLIC SMALL LETTER ER
99 С → S ; # CYRILLIC CAPITAL LETTER ES
100 с → s ; # CYRILLIC SMALL LETTER ES
103 ########################################################################
109 ########################################################################
# The sequence т + с is written with a middle dot (t·s) so that it stays
# distinct from the single letter ц, which this file romanizes as "ts".
# The two-letter rules must precede the plain Т/т rules, which would
# otherwise match the first letter on its own.
111 ТС → T·S ; # CYRILLIC CAPITAL LETTER TE + CAPITAL LETTER ES
112 Тс → T·s ; # CYRILLIC CAPITAL LETTER TE + SMALL LETTER ES
113 тс → t·s ; # CYRILLIC SMALL LETTER TE + SMALL LETTER ES
114 Т → T ; # CYRILLIC CAPITAL LETTER TE
115 т → t ; # CYRILLIC SMALL LETTER TE
118 ########################################################################
122 ########################################################################
# Mappings for У through Ч. For the digraph letters (Х, Ц, Ч) the
# "} $lower" rule comes first: a capital followed by a lowercase letter is
# written in title case (Kh), any other capital in all caps (KH).
123 У → U ; # CYRILLIC CAPITAL LETTER U
124 у → u ; # CYRILLIC SMALL LETTER U
125 Ф → F ; # CYRILLIC CAPITAL LETTER EF
126 ф → f ; # CYRILLIC SMALL LETTER EF
127 Х} $lower → Kh ; # CYRILLIC CAPITAL LETTER HA (title case before a lowercase letter)
128 Х → KH ; # CYRILLIC CAPITAL LETTER HA
129 х → kh ; # CYRILLIC SMALL LETTER HA
130 Ц} $lower → Ts ; # CYRILLIC CAPITAL LETTER TSE (title case before a lowercase letter)
131 Ц → TS ; # CYRILLIC CAPITAL LETTER TSE
132 ц → ts ; # CYRILLIC SMALL LETTER TSE
133 Ч} $lower → Ch ; # CYRILLIC CAPITAL LETTER CHE (title case before a lowercase letter)
134 Ч → CH ; # CYRILLIC CAPITAL LETTER CHE
135 ч → ch ; # CYRILLIC SMALL LETTER CHE
137 ########################################################################
139 # Implied rule from BGN Russian-Latin transliteration (Page 94 Note 3.6).
143 ########################################################################
# The sequence ш + т is written with a middle dot (sh·t) so that it stays
# distinct from the single letter щ, which this file romanizes as "sht".
# The two-letter rules must precede the plain Ш/ш rules.
145 ШТ → SH·T ; # CYRILLIC CAPITAL LETTER SHA + CAPITAL LETTER TE
146 Шт → Sh·t ; # CYRILLIC CAPITAL LETTER SHA + SMALL LETTER TE
147 шт → sh·t ; # CYRILLIC SMALL LETTER SHA + SMALL LETTER TE
148 Ш} $lower → Sh ; # CYRILLIC CAPITAL LETTER SHA (title case before a lowercase letter)
149 Ш → SH ; # CYRILLIC CAPITAL LETTER SHA
150 ш → sh ; # CYRILLIC SMALL LETTER SHA
151 Щ} $lower → Sht ; # CYRILLIC CAPITAL LETTER SHCHA (title case before a lowercase letter)
152 Щ → SHT ; # CYRILLIC CAPITAL LETTER SHCHA
153 щ → sht ; # CYRILLIC SMALL LETTER SHCHA
156 ########################################################################
160 ########################################################################
164 ########################################################################
168 # In modern Bulgarian orthography, the character ъ does not occur in
169 # word-final position. It should be omitted in romanization when found
# at the end of a word in older sources.
172 # The following rule removes all Ъъ at the end of a word. It is assumed
173 # that when the condition is met, the text must be from an older source.
174 # Comment out with a '#' at the start of a line to disable.
#
# This rule has to come before the general Ъ/ъ mappings: rules are tried
# in order and the first match wins, so an unconditional "Ъ → Ŭ" placed
# earlier would always consume the letter and this rule would never run.
#
# The before-context is matched against text that has already been
# romanized, so it must accept Latin letters as well as $bulgarian;
# with $bulgarian alone the rule could not match.
#
# NOTE(review): $wordBoundary is a character set, so a following character
# is required. A Ъ/ъ that is the very last character of the input is
# presumably not removed -- confirm whether that case matters.
177 ########################################################################
179 [$bulgarian [:Latin:]] { [Ъъ] } $wordBoundary → ;
182 ########################################################################
184 # End BGN Page 16 Note 1
186 ########################################################################
# General mappings for every Ъ/ъ that is not removed by the rule above.
161 Ъ → Ŭ ; # CYRILLIC CAPITAL LETTER HARD SIGN
162 ъ → ŭ ; # CYRILLIC SMALL LETTER HARD SIGN
# Soft sign: both cases romanize to the same apostrophe, so a single
# set-keyed rule covers them.
187 [Ьь] → ’ ;       # CYRILLIC CAPITAL / SMALL LETTER SOFT SIGN
# Ю and Я: title case when a lowercase letter follows, all caps otherwise.
189 Ю } $lower → Yu ; # CYRILLIC CAPITAL LETTER YU (title case)
190 Ю → YU ;          # CYRILLIC CAPITAL LETTER YU
191 ю → yu ;          # CYRILLIC SMALL LETTER YU
192 Я } $lower → Ya ; # CYRILLIC CAPITAL LETTER YA (title case)
193 Я → YA ;          # CYRILLIC CAPITAL LETTER YA
194 я → ya ;          # CYRILLIC SMALL LETTER YA
196 ########################################################################
200 # The obsolete character Ѫ, which was replaced by Ъ in 1945, should be
# romanized in the same way as Ъ, i.e. as Ŭ / ŭ.
203 ########################################################################
205 Ѫ → Ŭ ; # CYRILLIC CAPITAL LETTER BIG YUS
206 ѫ → ŭ ; # CYRILLIC SMALL LETTER BIG YUS
209 ########################################################################
211 # End BGN Page 16 Note 2
213 ########################################################################
215 ########################################################################
219 # The obsolete character Ѣ, replaced in 1945 by Я or Е according to local
220 # pronunciation, should be romanized as e or ya, accordingly, if the
221 # pronunciation is known; otherwise as ye.
223 ########################################################################
# Default (pronunciation unknown): romanize as ye. The "} $lower" rule is
# listed first so that a capital before a lowercase letter gives title case.
225 Ѣ} $lower → Ye ; # CYRILLIC CAPITAL LETTER YAT (title case before a lowercase letter)
226 Ѣ → YE ; # CYRILLIC CAPITAL LETTER YAT
227 ѣ → ye ; # CYRILLIC SMALL LETTER YAT
230 # Alternative rule where appropriate for local pronunciation. To apply,
231 # uncomment the following by removing the '#' mark at the start of each
232 # line and insert before the three rule lines above.
234 # Ѣ} $lower → E ; # CYRILLIC CAPITAL LETTER YAT
235 # Ѣ → E ; # CYRILLIC CAPITAL LETTER YAT
236 # ѣ → e ; # CYRILLIC SMALL LETTER YAT
238 ########################################################################
240 # End BGN Page 16 Note 3
242 ########################################################################