]> git.saurik.com Git - apple/icu.git/blame - icuSources/data/translit/t_InterIndic_Latn.txt
ICU-3.13.tar.gz
[apple/icu.git] / icuSources / data / translit / t_InterIndic_Latn.txt
CommitLineData
b75a7d8f
A
1 // -*- Coding: utf-8; -*-
2//--------------------------------------------------------------------
3// Copyright (c) 1999-2002, International Business Machines
4// Corporation and others. All Rights Reserved.
5//--------------------------------------------------------------------
6// THIS IS A MACHINE-GENERATED FILE
7// Tool: dumpicurules.bat
8// Source: ../../../impl/data/Transliterator_InterIndic_Latin.txt
9// Date: Sat Jul 27 10:31:07 2002
10//--------------------------------------------------------------------
11
12// InterIndic_Latin
13
14t_InterIndic_Latn {
15 Rule {
16//--------------------------------------------------------------------
17//--------------------------------------------------------------------
18//--------------------------------------------------------------------
19
20// InterIndic-Latin
// Each "$name=\ueXXX;" statement binds a variable to a single InterIndic
// private-use code point so the conversion rules can refer to it by name.
// The existing comments pair \ue0XX with \u09XX (e.g. \ue00f with \u090f).
21 //\ue000 reserved
22 //signs
23 "$chandrabindu=\ue001;"
24 "$anusvara=\ue002;"
25 "$visarga=\ue003;"
26 //\ue004 reserved
27 // w<vowel> represents the stand-alone (independent) form
28 "$wa=\ue005;"
29 "$waa=\ue006;"
30 "$wi=\ue007;"
31 "$wii=\ue008;"
32 "$wu=\ue009;"
33 "$wuu=\ue00a;"
34 "$wr=\ue00b;"
35 "$wl=\ue00c;"
36 "$wce=\ue00d;" // LETTER CANDRA E
37 "$wse=\ue00e;" // LETTER SHORT E
38 "$we=\ue00f;" // \u090f LETTER E
39 "$wai=\ue010;"
40 "$wco=\ue011;" // LETTER CANDRA O
41 "$wso=\ue012;" // LETTER SHORT O
42 "$wo=\ue013;" // \u0913 LETTER O
43 "$wau=\ue014;"
// Consonant variables (\ue015-\ue039), followed by the nukta and avagraha signs.
// The rules later in the file emit an inherent "a" for a bare consonant,
// which is why every name here ends in "a".
44 "$ka=\ue015;"
45 "$kha=\ue016;"
46 "$ga=\ue017;"
47 "$gha=\ue018;"
48 "$nga=\ue019;"
49 "$ca=\ue01a;"
50 "$cha=\ue01b;"
51 "$ja=\ue01c;"
52 "$jha=\ue01d;"
53 "$nya=\ue01e;"
54 "$tta=\ue01f;"
55 "$ttha=\ue020;"
56 "$dda=\ue021;"
57 "$ddha=\ue022;"
58 "$nna=\ue023;"
59 "$ta=\ue024;"
60 "$tha=\ue025;"
61 "$da=\ue026;"
62 "$dha=\ue027;"
63 "$na=\ue028;"
64 "$ena=\ue029;" //compatibility
65 "$pa=\ue02a;"
66 "$pha=\ue02b;"
67 "$ba=\ue02c;"
68 "$bha=\ue02d;"
69 "$ma=\ue02e;"
70 "$ya=\ue02f;"
71 "$ra=\ue030;"
72 "$rra=\ue031;"
73 "$la=\ue032;"
74 "$lla=\ue033;"
75 "$ela=\ue034;" //compatibility
76 "$va=\ue035;"
77 "$sha=\ue036;"
78 "$ssa=\ue037;"
79 "$sa=\ue038;"
80 "$ha=\ue039;"
81//\u093a Reserved
82//\u093b Reserved
83 "$nukta=\ue03c;"
84 "$avagraha=\ue03d;" // SIGN AVAGRAHA
85 // <vowel> (no "w" prefix) represents the dependent (vowel sign) form
86 "$aa=\ue03e;"
87 "$i=\ue03f;"
88 "$ii=\ue040;"
89 "$u=\ue041;"
90 "$uu=\ue042;"
91 "$rh=\ue043;"
92 "$lh=\ue044;"
93 "$ce=\ue045;" //VOWEL SIGN CANDRA E
94 "$se=\ue046;" //VOWEL SIGN SHORT E
95 "$e=\ue047;"
96 "$ai=\ue048;"
97 "$co=\ue049;" // VOWEL SIGN CANDRA O
98 "$so=\ue04a;" // VOWEL SIGN SHORT O
99 "$o=\ue04b;" // \u094b
100 "$au=\ue04c;"
101 "$virama=\ue04d;"
102// \u094e Reserved
103// \u094f Reserved
104 "$om=\ue050;" // OM
// The next four statements are conversion rules, not variable definitions:
// an empty right-hand side deletes the matched character from the output.
105 "\ue051>;" // UNMAPPED STRESS SIGN UDATTA
106 "\ue052>;" // UNMAPPED STRESS SIGN ANUDATTA
107 "\ue053>;" // UNMAPPED GRAVE ACCENT
108 "\ue054>;" // UNMAPPED ACUTE ACCENT
109 "$lm = \ue055;"// Telugu Length Mark
110 "$ailm=\ue056;"// AI Length Mark
111 "$aulm=\ue057;"// AU Length Mark
112 //Urdu compatibility forms (single code points; the rules below map them like the matching consonant+nukta sequences)
113 "$uka=\ue058;"
114 "$ukha=\ue059;"
115 "$ugha=\ue05a;"
116 "$ujha=\ue05b;"
117 "$uddha=\ue05c;"
118 "$udha=\ue05d;"
119 "$ufa=\ue05e;"
120 "$uya=\ue05f;"
// Additional vocalic letters: w-prefixed are independent forms, the others dependent signs
121 "$wrr=\ue060;"
122 "$wll=\ue061;"
123 "$rrh=\ue062;"
124 "$llh=\ue063;"
125 "$danda=\ue064;"
126 "$doubleDanda=\ue065;"
127 "$zero=\ue066;" // DIGIT ZERO
128 "$one=\ue067;" // DIGIT ONE
129 "$two=\ue068;" // DIGIT TWO
130 "$three=\ue069;" // DIGIT THREE
131 "$four=\ue06a;" // DIGIT FOUR
132 "$five=\ue06b;" // DIGIT FIVE
133 "$six=\ue06c;" // DIGIT SIX
134 "$seven=\ue06d;" // DIGIT SEVEN
135 "$eight=\ue06e;" // DIGIT EIGHT
136 "$nine=\ue06f;" // DIGIT NINE
137 // For all other scripts: \ue070-\ue07f, each of which is deleted by a "$ecpN >;" rule at the end of this file
138 "$ecp0=\ue070;"
139 "$ecp1=\ue071;"
140 "$ecp2=\ue072;"
141 "$ecp3=\ue073;"
142 "$ecp4=\ue074;"
143 "$ecp5=\ue075;"
144 "$ecp6=\ue076;"
145 "$ecp7=\ue077;"
146 "$ecp8=\ue078;"
147 "$ecp9=\ue079;"
148 "$ecpA=\ue07a;"
149 "$ecpB=\ue07b;"
150 "$ecpC=\ue07c;"
151 "$ecpD=\ue07d;"
152 "$ecpE=\ue07e;"
153 "$ecpF=\ue07f;"
154// \u0970>; # UNMAPPED ABBREVIATION SIGN
// Character sets used as rule context.
// NOTE(review): $depVowelAbove, $depVowelBelow and $z are not referenced by any rule in this listing.
155 "$depVowelAbove=[\ue03e-\ue040\ue045-\ue04c];"
156 "$depVowelBelow=[\ue041-\ue044];"
157 // $x was originally called '&'; $z was '%'
// $x: every dependent vowel sign; used as trailing context to suppress the inherent "a"
158 "$x=[$aa$ai$au$ii$i$uu$u$rrh$rh$lh$llh$e$o$se$ce$so$co];"
159 "$z=[bcdfghjklmnpqrstvwxyz];"
// $vowels: Latin a e i o u r plus combining \u0304, \u0325, \u0306; used as leading context for independent vowels
160 "$vowels=[aeiour\u0304\u0325\u0306];"
// $forceIndependentMatra: any character that is neither a letter ([:L:]) nor in \u0300-\u034c
161 "$forceIndependentMatra = [^[[:L:][\u0300-\u034c]]];"
162 //#####################################################################
163 // convert from Native (InterIndic) letters to Latin letters
164 //#####################################################################
165 //transliterations for anusvara
// In "a } b > c" the text after '}' is trailing context: it must match but is
// not consumed, so the following consonant is still converted by a later rule.
// The anusvara becomes the nasal listed for the group of the next consonant.
166 "$anusvara} [$ka$kha$ga$gha$nga] > n\u0307;"
167 "$anusvara} [$ca$cha$ja$jha$nya] > n\u0304;"
168 "$anusvara} [$tta$ttha$dda$ddha$nna] > n\u0323;"
169 "$anusvara} [$ta$tha$da$dha$na] > n ;"
170 "$anusvara} [$pa$pha$ba$bha$ma] > m ;"
171 "$anusvara} [$ya$ra$lla$la$va$ssa$sha$sa$ha] > n ;"
// Fallback when none of the consonant groups above follows
172 "$anusvara> m\u0307;"
173
174 // Urdu compatibility
// Every consonant here follows the same three-rule pattern, most specific first:
//   C }$x     > c    a dependent vowel sign follows: drop the inherent "a"
//   C $virama > c    virama is consumed: bare consonant
//   C         > ca   otherwise: consonant plus inherent "a"
// The single-code-point compatibility forms ($uka, $ukha, $ugha, $ujha, $uddha,
// $udha, $ufa, $uya, $ena, $ela) get the same output as the matching
// consonant+nukta sequence. Rules that were missing from the pattern have been
// added so that a following vowel sign or virama no longer yields a spurious "a".
175 "$ya$nukta}$x > y\u0307 ;"
176 "$ya$nukta$virama > y\u0307 ;"
177 "$ya$nukta > y\u0307a ;"
178
179 "$la$nukta }$x > l\u0331 ;"
180 "$la$nukta$virama > l\u0331 ;"
181 "$la$nukta > l\u0331a ;"
182
183 "$na$nukta }$x > n\u0331 ;"
184 "$na$nukta$virama > n\u0331 ;"
185 "$na$nukta > n\u0331a ;"
186
187 "$ena }$x > n\u0331 ;"
188 "$ena$virama > n\u0331 ;"
189 "$ena > n\u0331a ;"
 "$uka }$x > q ;"
 "$uka$virama > q ;"
190 "$uka > qa ;"
191 "$ka$nukta }$x > q ;"
192 "$ka$nukta$virama > q ;"
193 "$ka$nukta > qa ;"
194 "$kha$nukta }$x > k\u0331h\u0331 ;"
195 "$kha$nukta$virama > k\u0331h\u0331 ;"
196 "$kha$nukta > k\u0331h\u0331a ;"
 "$ukha }$x > k\u0331h\u0331 ;"
197 "$ukha$virama > k\u0331h\u0331;"
198 "$ukha > k\u0331h\u0331a;"
 "$ugha }$x > g\u0307 ;"
 "$ugha$virama > g\u0307 ;"
199 "$ugha > g\u0307a ;"
200 "$ga$nukta }$x > g\u0307 ;"
201 "$ga$nukta$virama > g\u0307 ;"
202 "$ga$nukta > g\u0307a ;"
203
 "$ujha }$x > z ;"
 "$ujha$virama > z ;"
204 "$ujha > za ;"
205 "$ja$nukta }$x > z ;"
206 "$ja$nukta$virama > z ;"
207 "$ja$nukta > za ;"
208 "$ddha$nukta}$x > r\u0323h ;"
209 "$ddha$nukta$virama > r\u0323h ;"
210 "$ddha$nukta > r\u0323ha;"
211
// $uddha (\ue05c) is the precomposed form of dda+nukta, hence r\u0323 without "h"
212 "$uddha}$x > r\u0323 ;"
213 "$uddha$virama > r\u0323 ;"
214 "$uddha > r\u0323a;"
215
// $udha (\ue05d) is the precomposed form of ddha+nukta, so it must produce the
// same r\u0323h as the "$ddha$nukta" rules above (it previously lost the "h").
 "$udha }$x > r\u0323h ;"
 "$udha$virama > r\u0323h ;"
216 "$udha > r\u0323ha ;"
217 "$dda$nukta}$x > r\u0323 ;"
218 "$dda$nukta$virama > r\u0323 ;"
219 "$dda$nukta > r\u0323a ;"
220 "$pha$nukta }$x > f ;"
221 "$pha$nukta$virama > f ;"
222 "$pha$nukta > fa ;"
223 "$ufa }$x > f ;"
224 "$ufa$virama > f ;"
225 "$ufa > fa ;"
226
227 "$ra$nukta}$x > r\u0331;"
228 "$ra$nukta$virama > r\u0331;"
229 "$ra$nukta > r\u0331a;"
230 "$lla$nukta}$x > l\u0331;"
231 "$lla$nukta$virama > l\u0331;"
232 "$lla$nukta > l\u0331a;"
233
234 "$ela}$x > l\u0331;"
235 "$ela$virama > l\u0331;"
236 "$ela > l\u0331a;"
237
238 "$uya}$x > y\u0307;"
239 "$uya$virama > y\u0307;"
240 "$uya > y\u0307a;"
241
242
243 // normal consonants
// Rule pattern per consonant C (the first matching rule wins, so order matters):
//   C$virama}$ha > c''  C+virama directly before $ha: emit an apostrophe ('' is a
//                       literal single quote) after the letter; presumably this
//                       keeps c+h distinct from the aspirate "ch" - TODO confirm
//   C}$x         > c    a dependent vowel sign follows: no inherent "a"
//   C$virama     > c    virama consumed: bare consonant
//   C            > ca   otherwise: consonant plus inherent "a"
244 "$ka$virama}$ha>k'';"
245 "$ka}$x>k;"
246 "$ka$virama>k;"
247 "$ka>ka;"
248 "$kha}$x>kh;"
249 "$kha$virama>kh;"
250 "$kha>kha;"
251 "$ga$virama}$ha>g'';"
252 "$ga}$x>g;"
253 "$ga$virama>g;"
254 "$ga>ga;"
255
256 "$gha}$x>gh;"
257 "$gha$virama>gh;"
258 "$gha>gha;"
259
260 "$nga}$x>n\u0307;"
261 "$nga$virama>n\u0307;"
262 "$nga>n\u0307a ;"
263 "$ca$virama}$ha>c'';"
264 "$ca}$x>c;"
265 "$ca$virama>c;"
266 "$ca>ca;"
267
268 "$cha}$x>ch;"
269 "$cha$virama>ch;"
270 "$cha>cha;"
271 "$ja$virama}$ha>j'';"
272 "$ja}$x>j;"
273 "$ja$virama>j;"
274 "$ja>ja;"
275
276 "$jha}$x>jh;"
277 "$jha$virama>jh;"
278 "$jha>jha;"
279
280 "$nya }$x>n\u0303 ;"
281 "$nya$virama>n\u0303;"
282 "$nya > n\u0303a ;"
283
284
// Retroflex consonants ($tta, $ttha, $dda, $ddha, $nna), written with a dot
// below (\u0323). Same rule pattern as the other consonants:
//   C$virama}$ha > c''  C+virama directly before $ha: letter plus apostrophe, so
//                       that it does not read like the aspirate (t\u0323h, d\u0323h)
//   C}$x         > c    a dependent vowel sign follows: no inherent "a"
//   C$virama     > c    virama consumed: bare consonant
//   C            > ca   otherwise: consonant plus inherent "a"
285 "$tta$virama}$ha>t\u0323'';"
286 "$tta}$x>t\u0323;"
287 "$tta$virama>t\u0323;"
288 "$tta>t\u0323a;"
289
290 "$ttha}$x>t\u0323h;"
291 "$ttha$virama>t\u0323h;"
292 "$ttha>t\u0323ha;"
// Was "$dda}$x$ha": that fired on dda + vowel sign + ha (placing the apostrophe
// before the vowel) and left dda + virama + ha indistinguishable from $ddha.
// Now matches the "$tta$virama}$ha" form used by every other unaspirated stop.
293 "$dda$virama}$ha>d\u0323'';"
294 "$dda}$x>d\u0323;"
295 "$dda$virama>d\u0323;"
296 "$dda>d\u0323a;"
297
298 "$ddha}$x>d\u0323h;"
299 "$ddha$virama>d\u0323h;"
300 "$ddha>d\u0323ha;"
301
302 "$nna}$x>n\u0323 ;"
303 "$nna$virama>n\u0323;"
304 "$nna>n\u0323a ;"
305
306
// Dental consonants ($ta, $tha, $da, $dha, $na).
// $ta/$da + virama get an apostrophe not only before $ha but also before the
// retroflex and aspirated stops listed below; $na + virama gets one before $ga and $ya.
307 "$ta$virama}$ha>t'';"
308 "$ta$virama}$ttha>t'';"
309 "$ta$virama}$tta>t'';"
310 "$ta$virama}$tha>t'';"
311 "$ta}$x>t;"
312 "$ta$virama>t;"
313 "$ta>ta;"
314 "$tha}$x>th;"
315 "$tha$virama>th;"
316 "$tha>tha;"
317
318 "$da$virama}$ha>d'';"
319 "$da$virama}$ddha>d'';"
320 "$da$virama}$dda>d'';"
321 "$da$virama}$dha>d'';"
322 "$da}$x>d;"
323 "$da$virama>d;"
324 "$da>da;"
325 "$dha}$x>dh;"
326 "$dha$virama>dh;"
327 "$dha>dha;"
328 "$na$virama}$ga>n'';"
329 "$na$virama}$ya>n'';"
330 "$na}$x>n;"
331 "$na$virama>n;"
332 "$na>na;"
333
334
// Labial consonants ($pa, $pha, $ba, $bha, $ma): apostrophe rule, vowel-sign
// rule, virama rule, then the inherent-"a" fallback.
335 "$pa$virama}$ha>p'';"
336 "$pa}$x>p;"
337 "$pa$virama>p;"
338 "$pa>pa;"
339 "$pha}$x>ph;"
340 "$pha$virama>ph;"
341 "$pha>pha;"
342 "$ba$virama}$ha>b'';"
343 "$ba}$x>b;"
344 "$ba$virama>b;"
345 "$ba>ba;"
346
347 "$bha}$x>bh;"
348 "$bha$virama>bh;"
349 "$bha>bha;"
350
351 "$ma$virama}$ma>m'';" // NOTE(review): context is $ma here, whereas the parallel rules use $ha - confirm this is intended
352 "$ma}$x>m;"
353 "$ma$virama>m;"
354 "$ma>ma;"
355
// Semivowels, liquids, sibilants and $ha. Same pattern as the stops: optional
// apostrophe rule(s), then vowel-sign rule, virama rule, inherent-"a" fallback.
356 "$ya}$x>y;"
357 "$ya$virama>y;"
358 "$ya>ya;"
359 "$ra$virama}$ha>r'';"
360 "$ra}$x>r;"
361 "$ra$virama>r;"
362 "$ra>ra;"
363 "$rra$virama}$ha>r\u0331'';"
364 "$rra}$x>r\u0331;"
365 "$rra$virama>r\u0331;"
366 "$rra>r\u0331a;"
367 "$la$virama}$ha>l'';"
368 "$la}$x>l;"
369 "$la$virama>l;"
370 "$la>la;"
371 "$lla$virama}$ha>l\u0323'';"
372 "$lla}$x>l\u0323;"
373 "$lla$virama>l\u0323;"
374 "$lla>l\u0323a;"
375 "$va}$x>v;"
376 "$va$virama>v;"
377 "$va>va;"
// $sa + virama gets an apostrophe before $ha and before any of the three sibilants
378 "$sa$virama}$ha>s'';"
379 "$sa$virama}$sha>s'';"
380 "$sa$virama}$ssa>s'';"
381 "$sa$virama}$sa>s'';"
382 "$sa}$x>s;"
383 "$sa$virama>s;"
384
385 //for gurmukhi: $sa+nukta gives the same s\u0301 as $sha; these rules must stay ahead of the bare "$sa>sa" fallback
386 "$sa$nukta}$x>s\u0301;"
387 "$sa$nukta$virama>s\u0301;"
388 "$sa$nukta>s\u0301a;"
389 "$sa>sa;"
390
391 "$sha}$x>s\u0301;"
392 "$sha$virama>s\u0301;"
393 "$sha>s\u0301a;"
394
395 "$ssa}$x>s\u0323;"
396 "$ssa$virama>s\u0323;"
397 "$ssa>s\u0323a;"
398 "$ha}$x>h;"
399 "$ha$virama>h;"
400 "$ha>ha;"
401
402 // dependent vowels (should never occur except following consonants)
// In "a { b > c" the text before '{' is leading context: it must match but is
// not replaced. When the preceding character is in $forceIndependentMatra
// (not a letter and not in \u0300-\u034c), the vowel sign is written with a
// leading \u0314 before the Latin vowel.
403 "$forceIndependentMatra{$aa > \u0314a\u0304 ;"
404 "$forceIndependentMatra{$ai > \u0314ai ;"
405 "$forceIndependentMatra{$au > \u0314au ;"
406 "$forceIndependentMatra{$ii > \u0314i\u0304 ;"
407 "$forceIndependentMatra{$i > \u0314i ;"
408 "$forceIndependentMatra{$uu > \u0314u\u0304 ;"
409 "$forceIndependentMatra{$u > \u0314u ;"
410 "$forceIndependentMatra{$rrh > \u0314r\u0325\u0304 ;"
411 "$forceIndependentMatra{$rh > \u0314r\u0325 ;"
412 "$forceIndependentMatra{$llh > \u0314l\u0325\u0304 ;"
413 "$forceIndependentMatra{$lh > \u0314l\u0325 ;"
414 "$forceIndependentMatra{$e > \u0314e\u0304 ;"
415 "$forceIndependentMatra{$o > \u0314o\u0304 ;"
416 //extra vowels
417 "$forceIndependentMatra{$ce > \u0314e\u0306 ;"
418 "$forceIndependentMatra{$co > \u0314o\u0306 ;"
419 "$forceIndependentMatra{$se > \u0314e ;"
420 "$forceIndependentMatra{$so > \u0314o ;"
421 "$forceIndependentMatra{$nukta >;" // Nukta cannot appear independently or as first character
422 "$forceIndependentMatra{$virama >;" // Virama cannot appear independently or as first character
// Plain mapping of each vowel sign to its Latin vowel (no leading-context requirement)
423 "$aa > a\u0304 ;"
424 "$ai > ai ;"
425 "$au > au ;"
426 "$ii > i\u0304 ;"
427 "$i > i ;"
428 "$uu > u\u0304 ;"
429 "$u > u ;"
430 "$rrh > r\u0325\u0304 ;"
431 "$rh > r\u0325 ;"
432 "$llh > l\u0325\u0304 ;"
433 "$lh > l\u0325 ;"
434 "$e > e\u0304 ;"
435 "$o > o\u0304 ;"
436 //extra vowels
437 "$ce > e\u0306 ;"
438 "$co > o\u0306 ;"
439 "$se > e ;"
440 "$so > o ;"
441 //independent vowels when followed by a dependent vowel sign. Generally illegal; present only for round-tripping
// Each rule writes the Latin vowel followed by \u0314; the vowel sign in the
// trailing context ($x) is not consumed here.
442 "$waa} $x > a\u0304\u0314 ;"
443 "$wai} $x > ai\u0314 ;"
444 "$wau} $x > au\u0314 ;"
445 "$wii} $x > i\u0304\u0314 ;"
446 "$wi } $x > i\u0314 ;"
447 "$wuu} $x > u\u0304\u0314 ;"
448 "$wu } $x > u\u0314 ;"
449 "$wrr} $x > r\u0325\u0304\u0314 ;"
450 "$wr } $x > r\u0325\u0314 ;"
451 "$wll} $x > l\u0325\u0304\u0314 ;"
452 "$wl } $x > l\u0325\u0314 ;"
453 "$we } $x > e\u0304\u0314 ;"
454 "$wo } $x > o\u0304\u0314 ;"
455 "$wa } $x > a\u0314 ;"
456 //extra vowels
457 "$wce} $x > e\u0306\u0314 ;"
458 "$wco} $x > o\u0306\u0314 ;"
459 "$wse} $x > e\u0314 ;"
460 "$wso} $x > o\u0314 ;"
461 "$om} $x > ''om\u0314 ;"
462
463 // independent vowels when preceded by vowels
// If the already-converted text to the left ends in a $vowels character, the
// independent vowel is written with a leading apostrophe ('' is a literal
// single quote) so that it stays separate from the preceding Latin vowel.
464 "$vowels{$waa > ''a\u0304 ;"
465 "$vowels{$wai > ''ai ;"
466 "$vowels{$wau > ''au ;"
467 "$vowels{$wii > ''i\u0304 ;"
468 "$vowels{$wi > ''i ;"
469 "$vowels{$wuu > ''u\u0304 ;"
470 "$vowels{$wu > ''u ;"
471 "$vowels{$wrr > ''r\u0325\u0304 ;"
472 "$vowels{$wr > ''r\u0325 ;"
473 "$vowels{$wll > ''l\u0325\u0304 ;"
474 "$vowels{$wl > ''l\u0325 ;"
475 "$vowels{$we > ''e\u0304 ;"
476 "$vowels{$wo > ''o\u0304 ;"
477 "$vowels{$wa > ''a ;"
478 //extra vowels
479 "$vowels{$wce > ''e\u0306 ;"
480 "$vowels{$wco > ''o\u0306 ;"
481 "$vowels{$wse > ''e ;"
482 "$vowels{$wso > ''o ;"
483
484 // independent vowels (otherwise): plain mapping, reached only when none of the context-specific rules above matched
485 "$waa > a\u0304 ;"
486 "$wai > ai ;"
487 "$wau > au ;"
488 "$wii > i\u0304 ;"
489 "$wi > i ;"
490 "$wuu > u\u0304 ;"
491 "$wu > u ;"
492 "$wrr > r\u0325\u0304 ;"
493 "$wr > r\u0325 ;"
494 "$wll > l\u0325\u0304 ;"
495 "$wl > l\u0325 ;"
496 "$we > e\u0304 ;"
497 "$wo > o\u0304 ;"
498 "$wa > a ;"
499 //extra vowels
500 "$wce > e\u0306 ;"
501 "$wco > o\u0306 ;"
502 "$wse > e ;"
503 "$wso > o ;"
// $om is always written with a leading apostrophe
504 "$om > ''om ;"
505
506 //signs (avagraha, candrabindu, visarga)
507 "$avagraha > \u0315;"
// The two-character candrabindu+anusvara rule must stay ahead of the single candrabindu rule
508 "$chandrabindu$anusvara>\u0303;"
509 "$chandrabindu > m\u0310;"
510 "$visarga>h\u0323;"
511 //numbers
512 "$zero > 0;"
513 "$one > 1;"
514 "$two > 2;"
515 "$three > 3;"
516 "$four > 4;"
517 "$five > 5;"
518 "$six > 6;"
519 "$seven > 7;"
520 "$eight > 8;"
521 "$nine > 9;"
// Length marks and the $ecp0-$ecpF code points have no Latin output: an empty right-hand side deletes them
522 "$lm >;"
523 "$ailm >;"
524 "$aulm >;"
525 "$ecp0 >;"
526 "$ecp1 >;"
527 "$ecp2 >;"
528 "$ecp3 >;"
529 "$ecp4 >;"
530 "$ecp5 >;"
531 "$ecp6 >;"
532 "$ecp7 >;"
533 "$ecp8 >;"
534 "$ecp9 >;"
535 "$ecpA >;"
536 "$ecpB >;"
537 "$ecpC >;"
538 "$ecpD >;"
539 "$ecpE >;"
540 "$ecpF >;"
// Both danda forms are written as a single full stop, so the danda / double danda distinction is not kept in the Latin output
541 "$danda>'.';"
542 "$doubleDanda>'.';"
543 }
544}