]> git.saurik.com Git - apple/icu.git/blame - icuSources/data/translit/Hebrew_Latin.txt
ICU-6.2.22.tar.gz
[apple/icu.git] / icuSources / data / translit / Hebrew_Latin.txt
CommitLineData
374ca955
A
1#--------------------------------------------------------------------
2# Copyright (c) 1999-2004, International Business Machines
3# Corporation and others. All Rights Reserved.
4#--------------------------------------------------------------------
5
6# Transliteration table for Hebrew
7# Based on the UNGEGN table at:
8# http://www.eki.ee/wgrs/rom1_he.pdf
9#
10# Exceptions:
11# - Accents are added to disambiguate letters
12# - Combinations of dagesh, shin/sin dot that produce different
13# letters are not yet encoded.
14#
15# To test, open:
16# http://oss.software.ibm.com/cgi-bin/icu/tr
17# Click Edit, paste in this file, Save As hebrew-latin/XXX
18# (where XXX is a username)
19# Now go back to the main window, and try it out.
20# Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
21# Paste in Hebrew text in Input, and hit Transliterate.
22#
23# For more information, see:
24# http://oss.software.ibm.com/icu/userguide/Transliteration.html
25
26:: [[:Hebrew:] [:^ccc=0:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2\u2135-\u2138̄\u05BF] - [\u05BD]] ;
27:: nfkd (nfc) ;
28$letterAfter = [:M:]* [:L:] ; # zero or more marks followed by a letter; used as after-context ("} $letterAfter") on the Latin side of several rules below
29
30# Longer items go here, ahead of the shorter rules below, to avoid masking
31
32ח <> ẖ ;
33צ <> ẕ } $letterAfter;
34ץ <> ẕ ;
35ש <> ş ;
36ת <> ţ ;
37
38א <> ʼ ;
39ב <> b ;
40ג <> g ;
41ד <> d ;
42ה <> h ;
43ו <> w ;
44ז <> z ;
45ט <> t ;
46י <> y ;
47כ <> k } $letterAfter;
48ך <> k ;
49ל <> l ;
50מ <> m } $letterAfter;
51ם <> m ;
52נ <> n } $letterAfter;
53ן <> n ;
54ס <> s ;
55ע <> ʻ ;
56פ <> p } $letterAfter;
57ף <> p ;
58ק <> q ;
59ר <> r ;
60
61 װ > | וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
62 ױ > | וי; # HEBREW LIGATURE YIDDISH VAV YOD
63 ײ > | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
64
65
66ּ <> ̇ ; # dagesh just goes to overdot for now
67ׁ <> ̌ ; # shin dot -> sh
68ׂ <> ̂ ; # sin dot -> s
69
70# points
71$above = [^[:ccc=0:][:ccc=230:]]*; # run of characters whose combining class is neither 0 nor 230; captured as $1 between the base vowel and its accent in the "<" rules below
72
73‎ֲ‎ > à ;
74‎ֲ‎ $1< a ($above) ̀;
75
76‎ָ‎ > á ;
77‎ָ‎ $1 < a ($above) ́;
78
79‎ֱ‎ > è ;
80‎ֱ‎ $1 < e ($above) ̀;
81
82‎ֵ‎ > é ;
83‎ֵ‎ $1 < e ($above) ́;
84
85‎ְ‎ > e ̆ ;
86‎ְ‎ $1 < e ($above) ̆;
87
88‎ֹ‎ > ò ;
89‎ֹ‎ $1 < o ($above) ̀;
90
91ִ <> i ;
92ֻ <> u ;
93ַ <> a ;
94ֶ <> e ;
95ֳ <> o ;
96
97\u05BF <> ̄ ;
98
99# fallbacks
100ק < c ;
101פ < f } $letterAfter;
102ף < f ;
103ז < j ;
104ו < v ;
105כס < x ;
106
107:: (lower);
108:: nfc (nfd) ;
109:: ([[:Latin:] [:^ccc=0:] [\u02BB-\u02BC\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341 ̄ ]]);