1 # ***************************************************************************
3 # * Copyright (C) 2004-2016, International Business Machines
4 # * Corporation; Unicode, Inc.; and others. All Rights Reserved.
6 # ***************************************************************************
11 # Transliteration table for Hebrew
12 # Based on the UNGEGN table at:
13 # http://www.eki.ee/wgrs/rom1_he.pdf
16 # - Accents are added to disambiguate letters
17 # - Combinations of dagesh, shin/sin dot that produce different
18 # letters are not yet encoded.
21 # http://www.ibm.com/software/globalization/icu/demo/transform
22 # Click Edit, paste in this file, Save As hebrew-latin/XXX
23 # (where XXX is a username)
24 # Now go back to the main window, and try it out.
25 # Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
26 # Paste in Hebrew text in Input, and hit Transliterate.
28 # For more information, see:
29 # http://icu.sourceforge.net/userguide/Transform.html
# Global filter for the forward (Hebrew to Latin) direction: only characters in
# this set are touched by the rules. The set is the union of Hebrew-script
# characters, characters with a non-zero canonical combining class, and the
# explicitly listed points and symbols, minus U+05BD.
30 :: [[:Hebrew:] [:^ccc=0:] [\u05B0-\u05B9\u05BB-\u05BC\u05C1-\u05C2ℵ-ℸ\u0304\u05BF] - [\u05BD]] ;
# Context pattern: zero or more marks followed by one letter.
32 $letterAfter = [:M:]* [:L:] ;
33 # Longer items are moved here so that shorter rules further down do not mask them.
# Tsadi <-> z + U+0331 (combining macron below). The part after the closing
# brace is trailing context on the Latin side, so when converting back to
# Hebrew this rule only fires if marks-then-letter follow the z + U+0331.
# NOTE(review): presumably a later rule outside this chunk handles the case
# with no following letter (final form) - confirm against the full file.
35 צ ↔ z\u0331 } $letterAfter;
# Forward-only rules: each Yiddish ligature is replaced by its two component
# letters. The cursor marker (|) sits before the replacement, so the rules are
# applied again to the newly produced letters.
61 װ → | וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
62 ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
63 ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
# Two-way mappings between Hebrew points and Latin combining marks.
64 \u05BC ↔ \u0307 ; # dagesh <-> combining dot above (provisional: dagesh just goes to overdot for now)
65 \u05C1 ↔ \u030C ; # shin dot <-> combining caron (marks the sh reading)
66 \u05C2 ↔ \u0302 ; # sin dot <-> combining circumflex (marks the s reading)
# $above matches zero or more characters whose canonical combining class is
# neither 0 nor 230. NOTE(review): despite the name, class 230 (above) marks
# are excluded - presumably this captures the marks that can sit between the
# base vowel and its class-230 accent in canonical order - confirm.
68 $above = [^[:ccc=0:][:ccc=230:]]*;
# Reverse-only (Latin to Hebrew) rules. Each one matches a Latin vowel, the
# intervening marks captured as $1, and a distinguishing accent, and emits the
# Hebrew point followed by the captured marks.
70 \u05B2 $1← a ($above) \u0300; # a + grave  -> hataf patah
72 \u05B8 $1 ← a ($above) \u0301; # a + acute  -> qamats
74 \u05B1 $1 ← e ($above) \u0300; # e + grave  -> hataf segol
76 \u05B5 $1 ← e ($above) \u0301; # e + acute  -> tsere
78 \u05B0 $1 ← e ($above) \u0306; # e + breve  -> sheva
80 \u05B9 $1 ← o ($above) \u0300; # o + grave  -> holam
# Global filter for the reverse (Latin to Hebrew) direction, indicated by the
# parentheses around the set: only Latin-script characters, characters with a
# non-zero canonical combining class, and the listed modifier letters and
# combining marks are touched when transliterating back to Hebrew.
96 :: ([[:Latin:] [:^ccc=0:] [ʻ-ʼ\u0300-\u0302\u0307\u030C\u0327\u0331\u0340-\u0341 \u0304 ]]);