]> git.saurik.com Git - apple/icu.git/blame - icuSources/data/translit/fa_fa_Latn_BGN.txt
ICU-57131.0.1.tar.gz
[apple/icu.git] / icuSources / data / translit / fa_fa_Latn_BGN.txt
CommitLineData
729e4ab9
A
1# ***************************************************************************
2# *
2ca993e8 3# * Copyright (C) 2004-2016, International Business Machines
729e4ab9
A
4# * Corporation; Unicode, Inc.; and others. All Rights Reserved.
5# *
6# ***************************************************************************
2ca993e8 7# File: fa_fa_Latn_BGN.txt
729e4ab9
A
8# Generated from CLDR
9#
2ca993e8
A
10
11#
12########################################################################
13# BGN/PCGN 1958 System
14#
15# This system was adopted by the BGN in 1946 and by the PCGN in 1958.
16# It is used for the romanization of geographic names in Iran and
17# for Persian-language names in Afghanistan.
18#
19# Originally prepared by Michael Everson <everson@evertype.com>
20########################################################################
21#
22# MINIMAL FILTER: Persian-Latin
23#
729e4ab9
A
24:: [[:arabic:][:block=ARABIC:][ءآابةتثجحخدذرزسشصضطظعغفقكلمنهویي\u064E\u064F\u0650\u0651\u0652٠١٢٣٤٥٦٧٨٩پچژگی]] ;
25:: NFKD (NFC) ;
2ca993e8
A
26#
27#
28########################################################################
29#
30########################################################################
31#
32# Define All Transformation Variables
33#
34########################################################################
35#
729e4ab9
A
36$alef = ’;
37$ayin = ‘;
51004dcb 38$disambig = \u0331 ;
2ca993e8
A
39#
40#
41# Use this $wordBoundary until bug 2034 is fixed in ICU:
42# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
43#
51004dcb 44$wordBoundary = [^[:L:][:M:][:N:]] ;
2ca993e8
A
45#
46#
47########################################################################
48# non-letters
729e4ab9
A
49[:Nd:]{٫}[:Nd:] ↔ [:Nd:]{','}[:Nd:] ; # ARABIC DECIMAL SEPARATOR
50[:Nd:]{٬}[:Nd:] ↔ [:Nd:]{'.'}[:Nd:] ; # ARABIC THOUSANDS SEPARATOR
51٫ ↔ ',' $disambig ; # ARABIC DECIMAL SEPARATOR
52٬ ↔ '.' $disambig ; # ARABIC THOUSANDS SEPARATOR
2ca993e8 53# ٭ ↔ ; # ARABIC FIVE POINTED STAR // no need to transliterate
729e4ab9
A
54، ↔ ',' ; # ARABIC COMMA
55؛ ↔ ';' ; # ARABIC SEMICOLON
56؟ ↔ '?' ; # ARABIC QUESTION MARK
57٪ ↔ '%' ; # ARABIC PERCENT SIGN
58٠ ↔ 0 $disambig ; # ARABIC-INDIC DIGIT ZERO
59١ ↔ 1 $disambig ; # ARABIC-INDIC DIGIT ONE
60٢ ↔ 2 $disambig ; # ARABIC-INDIC DIGIT TWO
61٣ ↔ 3 $disambig ; # ARABIC-INDIC DIGIT THREE
62٤ ↔ 4 $disambig ; # ARABIC-INDIC DIGIT FOUR
63٥ ↔ 5 $disambig ; # ARABIC-INDIC DIGIT FIVE
64٦ ↔ 6 $disambig ; # ARABIC-INDIC DIGIT SIX
65٧ ↔ 7 $disambig ; # ARABIC-INDIC DIGIT SEVEN
66٨ ↔ 8 $disambig ; # ARABIC-INDIC DIGIT EIGHT
67٩ ↔ 9 $disambig ; # ARABIC-INDIC DIGIT NINE
68۰ ↔ 0 ; # EXTENDED ARABIC-INDIC DIGIT ZERO
69۱ ↔ 1 ; # EXTENDED ARABIC-INDIC DIGIT ONE
70۲ ↔ 2 ; # EXTENDED ARABIC-INDIC DIGIT TWO
71۳ ↔ 3 ; # EXTENDED ARABIC-INDIC DIGIT THREE
72۴ ↔ 4 ; # EXTENDED ARABIC-INDIC DIGIT FOUR
73۵ ↔ 5 ; # EXTENDED ARABIC-INDIC DIGIT FIVE
74۶ ↔ 6 ; # EXTENDED ARABIC-INDIC DIGIT SIX
75۷ ↔ 7 ; # EXTENDED ARABIC-INDIC DIGIT SEVEN
76۸ ↔ 8 ; # EXTENDED ARABIC-INDIC DIGIT EIGHT
77۹ ↔ 9 ; # EXTENDED ARABIC-INDIC DIGIT NINE
2ca993e8
A
78#
79########################################################################
80#
81# Rules moved to front to avoid masking
82#
83########################################################################
84#
85########################################################################
86#
87# BGN Page 89 Rule 4
88#
89# The character sequences كه , زه , سه , and گه may be romanized k·h, z·h,
90# s·h, and g·h in order to differentiate those romanizations from the
91# digraphs kh, zh, sh, and gh.
92#
93########################################################################
94#
729e4ab9
A
95كه → k·h ; # ARABIC LETTER KAF + HEH
96زه → z·h ; # ARABIC LETTER ZAIN + HEH
97سه → s·h ; # ARABIC LETTER SEEN + HEH
98گه → g·h ; # ARABIC LETTER GAF + HEH
2ca993e8
A
99#
100#
101########################################################################
102#
103# End Rule 4
104#
105########################################################################
106#
107########################################################################
108#
109# BGN Page 91 Rule 7
110#
111# Doubled consonant sounds are represented in Arabic script by
112# placing a shaddah ( \u0651 ) over a consonant character. In romanization
113# the letter should be doubled. [The remainder of this rule deals with
114# the definite article and is lexical.]
115#
116########################################################################
117#
729e4ab9
A
118ب\u0651 → bb ; # ARABIC LETTER BEH + SHADDA
119پ\u0651 → pp ; # ARABIC LETTER PEH + SHADDA
120ت\u0651 → tt ; # ARABIC LETTER TEH + SHADDA
121ث\u0651 → s\u0304s\u0304 ; # ARABIC LETTER THEH + SHADDA
122ج\u0651 → jj ; # ARABIC LETTER JEEM + SHADDA
123چ\u0651 → chch ; # ARABIC LETTER TCHEH + SHADDA
124ح\u0651 → ḥḥ ; # ARABIC LETTER HAH + SHADDA
125خ\u0651 → khkh ; # ARABIC LETTER KHAH + SHADDA
126د\u0651 → dd ; # ARABIC LETTER DAL + SHADDA
127ذ\u0651 → z\u0304z\u0304 ; # ARABIC LETTER THAL + SHADDA
128ر\u0651 → rr ; # ARABIC LETTER REH + SHADDA
129ز\u0651 → zz ; # ARABIC LETTER ZAIN + SHADDA
130ژ\u0651 → zhzh ; # ARABIC LETTER JEH + SHADDA
131س\u0651 → ss ; # ARABIC LETTER SEEN + SHADDA
132ش\u0651 → shsh ; # ARABIC LETTER SHEEN + SHADDA
133ص\u0651 → ṣṣ ; # ARABIC LETTER SAD + SHADDA
134ض\u0651 → ẕẕ ; # ARABIC LETTER DAD + SHADDA (doubles the base romanization ẕ used for DAD)
135ط\u0651 → ṭṭ ; # ARABIC LETTER TAH + SHADDA
136ظ\u0651 → ẓẓ ; # ARABIC LETTER ZAH + SHADDA
137ع\u0651 → $ayin $ayin ; # ARABIC LETTER AIN + SHADDA
138غ\u0651 → ghgh ; # ARABIC LETTER GHAIN + SHADDA
139ف\u0651 → ff ; # ARABIC LETTER FEH + SHADDA
140ق\u0651 → qq ; # ARABIC LETTER QAF + SHADDA
141ك\u0651 → kk ; # ARABIC LETTER KAF + SHADDA
142ل\u0651 → ll ; # ARABIC LETTER LAM + SHADDA
143م\u0651 → mm ; # ARABIC LETTER MEEM + SHADDA
144ن\u0651 → nn ; # ARABIC LETTER NOON + SHADDA
145ه\u0651 → hh ; # ARABIC LETTER HEH + SHADDA
146و\u0651 → ww ; # ARABIC LETTER WAW + SHADDA
147ی\u0651 → yy ; # ARABIC LETTER FARSI YEH + SHADDA
2ca993e8
A
148#
149#
150########################################################################
151#
152# End Rule 7
153#
154########################################################################
155#
156########################################################################
157#
158# Start of Transformations
159#
160########################################################################
161#
51004dcb 162$wordBoundary{ء → ; # ARABIC LETTER HAMZA
729e4ab9 163ء → $alef ; # ARABIC LETTER HAMZA
51004dcb 164$wordBoundary{ا → ; # ARABIC LETTER ALEF
729e4ab9
A
165آ → $alef ā ; # ARABIC LETTER ALEF WITH MADDA ABOVE
166ب → b ; # ARABIC LETTER BEH
167پ → p ; # ARABIC LETTER PEH
168ت → t ; # ARABIC LETTER TEH
169ة → h ; # ARABIC LETTER TEH MARBUTA
170ث → s\u0304 ; # ARABIC LETTER THEH
171ج → j ; # ARABIC LETTER JEEM
172چ → ch ; # ARABIC LETTER TCHEH
173ح → ḥ ; # ARABIC LETTER HAH
174خ → kh ; # ARABIC LETTER KHAH
175د → d ; # ARABIC LETTER DAL
176ذ → z\u0304 ; # ARABIC LETTER THAL
177ر → r ; # ARABIC LETTER REH
178ز → z ; # ARABIC LETTER ZAIN
179ژ → zh ; # ARABIC LETTER JEH
180س → s ; # ARABIC LETTER SEEN
181ش → sh ; # ARABIC LETTER SHEEN
182ص → ṣ ; # ARABIC LETTER SAD
183ض → ẕ ; # ARABIC LETTER DAD
184ط → ṭ ; # ARABIC LETTER TAH
185ظ → ẓ ; # ARABIC LETTER ZAH
186ع → $ayin ; # ARABIC LETTER AIN
187غ → gh ; # ARABIC LETTER GHAIN
188ف → f ; # ARABIC LETTER FEH
189ق → q ; # ARABIC LETTER QAF
190ک ↔ k ; # ARABIC LETTER KEHEH
191ك ↔ k $disambig ; # ARABIC LETTER KAF
192گ → g ; # ARABIC LETTER GAF
193ل → l ; # ARABIC LETTER LAM
194م → m ; # ARABIC LETTER MEEM
195ن → n ; # ARABIC LETTER NOON
196ه → h ; # ARABIC LETTER HEH
197و → v ; # ARABIC LETTER WAW
198ی → y ; # ARABIC LETTER FARSI YEH
199\u064Eا → ā ; # ARABIC FATHA + ALEF
200\u064Eی → á ; # ARABIC FATHA + FARSI YEH
201\u064Eو\u0652 → ow ; # ARABIC FATHA + WAW + SUKUN
202\u064E → a ; # ARABIC FATHA
203\u0650ي → ī ; # ARABIC KASRA + YEH
204\u0650 → e ; # ARABIC KASRA
205\u064Fو → ū ; # ARABIC DAMMA + WAW
206\u064F → o ; # ARABIC DAMMA
51004dcb 207\u0652 → ; # ARABIC SUKUN
729e4ab9 208::NFC (NFD) ;
2ca993e8
A
209#
210#
211########################################################################
212