]>
Commit | Line | Data |
---|---|---|
1 | # © 2016 and later: Unicode, Inc. and others. | |
2 | # License & terms of use: http://www.unicode.org/copyright.html#License | |
3 | # | |
4 | # File: InterIndic_Arabic.txt | |
5 | # Generated from CLDR | |
6 | # | |
7 | ||
8 | $nonword = [^\uE000-\uE0FF]; | |
9 | $wordBoundary = [^[:L:][:M:][:N:]]; | |
10 | \uE015\uE03F\uE02F\uE03E } $nonword→كيا; # किया, only when the next character is $nonword (outside U+E000–U+E0FF) | |
11 | \uE026\uE03F\uE02F\uE03E } $nonword→ديا; # दिया, only when the next character is $nonword | |
12 | \uE015\uE03F } $nonword→كي; # कि at word end (next character is $nonword) | |
13 | \uE039\uE048→هي; # ह\u0948 (ha + vowel sign ai), no context condition | |
14 | \uE001 } $nonword→ن; # chandrabindu at end ($nonword follows) to noon | |
15 | \uE001→ن; # chandrabindu not at end to noon (same output as at end) | |
16 | \uE002 } $nonword→ن; # anusvara \u0902 to noon at end ($nonword follows) | |
17 | \uE002→ن; # anusvara \u0902 to noon when not at end (same output as at end) | |
18 | \uE003→ه ا; # visarga ः to ha + alif; the unquoted space is rule syntax, not output | |
19 | \uE004→ا; # short a ऄ to alif | |
20 | \uE005→ا; # अ (a) to alif | |
21 | \uE006→ا \u0653; # आ (aa) to alif + maddah above (U+0653) | |
22 | [[:L:][:M:]] {\uE007}→ي; # इ (i) directly after another letter or mark | |
23 | \uE007→إ; # इ (i) anywhere else, e.g. at beginning of word | |
24 | [[:L:][:M:]] {\uE008}→ي; # ई (ii) directly after another letter or mark | |
25 | \uE008→إ; # ई (ii) anywhere else, e.g. at beginning of word | |
26 | \uE009→و; # उ (u) | |
27 | \uE00A→و; # ऊ (uu) | |
28 | \uE00B→ر; # ऋ (vocalic r) | |
29 | \uE00C→ل; # ऌ (vocalic l) | |
30 | \uE00D→ا ي; # ऍ (candra e) | |
31 | \uE00E→ي; # ऎ (short e) | |
32 | $wordBoundary {\uE00F} → إي; # word-initial ए (e): previous character is not a letter, mark, or number | |
33 | \uE00F } $nonword→ي; # ए (e) use ي when at end | |
34 | \uE00F→ي; # ए (e) use ي when not at end (same output as at end) | |
35 | \uE010 } $nonword→ا ي; # ऐ (ai) use ي when at end | |
36 | \uE010→ا ي; # ऐ (ai) use ي when not at end (same output as at end) | |
37 | \uE011→ا و; # ऑ (candra o) | |
38 | \uE012→ا و; # ऒ (short o) | |
39 | \uE013→ا و; # ओ (o) | |
40 | \uE014→ا و; # औ (au) | |
41 | \uE015→ك; # क (ka) | |
42 | \uE016→كه; # ख (kha) | |
43 | \uE017→ج; # ग (ga) | |
44 | \uE018→جه; # घ (gha) | |
45 | \uE019→نج; # ङ (nga) | |
46 | \uE01A→تش; # च (ca) | |
47 | \uE01B→تشه; # छ (cha) | |
48 | \uE01C→ج; # ज (ja) | |
49 | \uE01D→جه; # झ (jha) | |
50 | \uE01E→ن; # ञ (nya) | |
51 | \uE01F→ط; # ट (tta) | |
52 | \uE020→طه; # ठ (ttha) | |
53 | \uE021→د; # ड (dda) | |
54 | \uE022→ده; # ढ (ddha) | |
55 | \uE023→ن; # ण (nna) | |
56 | \uE024→ت; # त (ta) | |
57 | \uE025→ته; # थ (tha) | |
58 | \uE026→د; # द (da) | |
59 | \uE027→ده; # ध (dha) | |
60 | \uE028→ن; # न (na) | |
61 | \uE029→ن; # ऩ (nnna) | |
62 | \uE02A→ب; # प (pa) | |
63 | \uE02B→به; # फ (pha) | |
64 | \uE02C→ب; # ब (ba) | |
65 | \uE02D→به; # भ (bha) | |
66 | \uE02E→م; # म (ma) | |
67 | \uE02F→ي; # य (ya) | |
68 | \uE030→ر; # र (ra) | |
69 | \uE031→ر; # ऱ (rra) | |
70 | \uE032→ل; # ल (la) | |
71 | \uE033→ر; # ळ (lla) | |
72 | \uE034→ر; # ऴ (llla) | |
73 | \uE035→و; # व (va) | |
74 | \uE036→ش; # श (sha) | |
75 | \uE037→ش; # ष (ssa) | |
76 | \uE038→س; # स (sa) | |
77 | \uE039→ه; # ह (ha) | |
78 | \uE03C→; # \u093C nukta sign: deleted (empty output) | |
79 | \uE03D→; # ऽ avagraha: deleted (empty output) | |
80 | \uE03E→ا; # ा vowel sign aa | |
81 | \uE03F→ي; # ि vowel sign i | |
82 | \uE040→ي; # ी vowel sign ii | |
83 | \uE041→و; # \u0941 vowel sign u | |
84 | \uE042→و; # \u0942 vowel sign uu | |
85 | \uE043→ر; # \u0943 vowel sign vocalic r | |
86 | \uE044→ر; # \u0944 vowel sign vocalic rr | |
87 | \uE045→ن; # \u0945 vowel sign candra e; NOTE(review): maps to noon, unlike independent ऍ earlier in this file; confirm intended | |
88 | \uE046→ي; # \u0946 vowel sign short e | |
89 | \uE047 } $nonword→ي; # \u0947 vowel sign e, use ي when at end | |
90 | \uE047→ي; # \u0947 vowel sign e, use ي when not at end (same output as at end) | |
91 | \uE048 } $nonword→ا ي; # \u0948 vowel sign ai, use ي when at end | |
92 | \uE048→ا ي; # \u0948 vowel sign ai, use ي when not at end (same output as at end) | |
93 | \uE049→و; # ॉ vowel sign candra o | |
94 | \uE04A→ا و; # ॊ vowel sign short o | |
95 | \uE04B→و; # ो vowel sign o | |
96 | \uE04C→ا و; # ौ vowel sign au | |
97 | \uE04D→; # \u094D virama: deleted (empty output) | |
98 | \uE050→ا و; # ॐ om | |
99 | \uE051→; # \u0951 stress sign udatta: deleted | |
100 | \uE052→; # \u0952 stress sign anudatta: deleted | |
101 | \uE053→; # \u0953 grave accent: deleted | |
102 | \uE054→; # \u0954 acute accent: deleted | |
103 | \uE058→ق; # क़ (qa) | |
104 | \uE059→خ; # ख़ (khha) | |
105 | \uE05A→غ; # ग़ (ghha) | |
106 | \uE05B→ز; # ज़ (za) | |
107 | \uE05C→ر; # ड़ (dddha) | |
108 | \uE05D→ره; # ढ़ (rha) | |
109 | \uE05E→ف; # फ़ (fa) | |
110 | \uE05F→ي; # य़ (yya) | |
111 | \uE060→ر; # ॠ (vocalic rr) | |
112 | \uE061→ل; # ॡ (vocalic ll) | |
113 | \uE062→ل; # \u0962 vowel sign vocalic l | |
114 | \uE063→ل; # \u0963 vowel sign vocalic ll | |
115 | \uE064→۔; # । danda to Arabic full stop (U+06D4) | |
116 | \uE065→۔; # ॥ double danda to Arabic full stop (U+06D4) | |
117 | \uE066→٠; # ० digit zero to Arabic-Indic digit zero (U+0660, not a full stop), consistent with १–९ below | |
118 | \uE067→١; # १ digit one | |
119 | \uE068→٢; # २ digit two | |
120 | \uE069→٣; # ३ digit three | |
121 | \uE06A→٤; # ४ digit four | |
122 | \uE06B→٥; # ५ digit five | |
123 | \uE06C→٦; # ६ digit six | |
124 | \uE06D→٧; # ७ digit seven | |
125 | \uE06E→٨; # ८ digit eight | |
126 | \uE06F→٩; # ९ digit nine | |
127 | \uE070→\.; # ॰ abbreviation sign to an escaped literal full stop | |
128 | \uE082→; # ॽ glottal stop: deleted (empty output) | |
129 | # Second pass (begins at ::null): collapse each run of alif characters to its first alif, keeping that alif's marks ($1). | |
130 | # For example, transform पाओला → بااولا → باولا. $alif matches one alif variant plus any marks that follow it. | |
131 | ::null; | |
132 | $alif = [أإآا] [:M:]*; | |
133 | ($alif) $alif+ → $1; | |
134 |