]>
Commit | Line | Data |
---|---|---|
f3c0d7a5 A |
1 | # © 2016 and later: Unicode, Inc. and others. |
2 | # License & terms of use: http://www.unicode.org/copyright.html#License | |
3 | # | |
729e4ab9 | 4 | # File: ja_Latn_ko.txt |
f3c0d7a5 | 5 | # Generated from CLDR |
729e4ab9 | 6 | # |
2ca993e8 A |
7 | |
8 | # Japanese (Rōmaji) to Korean (Hangul) transliteration table for ICU. | |
9 | # Can be run in sequence after e.g. Katakana-Latin. | |
10 | # | |
11 | # Based on 문교부 고시 제85-11호 (1986. 1. 7.) 외래어 표기법 | |
12 | # For background info, see http://ko.wikisource.org/wiki/문교부_고시_제85-11호 | |
13 | # and http://ko.wikipedia.org/wiki/외래어_표기법 (外來語表記法) | |
729e4ab9 A |
14 | ::NFD(NFC); # Decompose the input first (NFC is the inverse-direction counterpart) so length marks are separate combining characters. |
15 | ::[:Latin:] Lower(); # Lowercase Latin letters; every rule below matches lowercase only. | |
16 | $consonant = [ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄋᄌᄍᄎᄏᄐᄑᄒ]; # Syllable-initial jamo, including the null initial ᄋ. | |
17 | $lengthMarker = [\u0302\u0304]; # Combining circumflex and combining macron. | |
2ca993e8 A |
18 | # |
19 | # | |
20 | # Drop hyphens and apostrophes. | |
729e4ab9 | 21 | [\-\'] → ; |
2ca993e8 A |
22 | # |
23 | # | |
24 | # Turn long /e:/ into diphthong /ei/. | |
729e4ab9 | 25 | e $lengthMarker → | e i ; # Cursor is left before "ei" so both vowels go through the vowel rules. |
2ca993e8 A |
26 | # |
27 | # | |
28 | # Ignore vowel length everywhere else. | |
729e4ab9 | 29 | $lengthMarker → ; |
2ca993e8 A |
30 | # |
31 | # | |
32 | # Vowels. | |
33 | # | |
51004dcb | 34 | [^$consonant] { ( [aiueoyw] ) → ᄋ | $1 ; # Supply a required null initial: a vowel or glide not preceded by an initial consonant gets ᄋ, and the cursor stays before it.
729e4ab9 | 35 | a → ᅡ ; |
51004dcb | 36 | i\~e → | ie ; # イェ: drop the tilde, then reprocess as i + e. |
729e4ab9 | 37 | i → ᅵ ; |
51004dcb A |
38 | u\~a → | wa ; # クァ, グァ: rewritten to wa and reprocessed.
39 | u\~i → ᅱ ; # ウィ, クィ, etc. | |
40 | u\~e → ᅰ ; # ウェ | |
41 | u\~o → ᅯ ; # ウォ | |
729e4ab9 A |
42 | u → ᅮ ; # Plain u; the longer u\~ rules above must come first.
43 | e → ᅦ ; | |
44 | o → ᅩ ; | |
2ca993e8 A |
45 | # |
46 | # | |
47 | # Geminates. | |
48 | # | |
729e4ab9 A |
49 | kk → ᆺ | k ; # First half of a doubled consonant becomes final ᆺ; the second half is reprocessed.
50 | ss → ᆺ | s ; | |
51 | tt → ᆺ | t ; | |
52 | tc → ᆺ | c ; # t before c (as in "tch") is handled like a doubled consonant. | |
53 | cc → ᆺ | c ; | |
54 | hh → ᆺ | h ; | |
55 | ff → ᆺ | f ; | |
56 | rr → ᆺ | r ; | |
57 | gg → ᆺ | g ; | |
58 | zz → ᆺ | z ; | |
59 | jj → ᆺ | j ; | |
60 | dd → ᆺ | d ; | |
61 | bb → ᆺ | b ; | |
62 | vv → ᆺ | v ; | |
63 | pp → ᆺ | p ; | |
2ca993e8 A |
64 | # |
65 | # | |
66 | # Consonants. | |
67 | # | |
51004dcb A |
68 | ' ' { k → | g ; # Beginning of a word (after space): rewritten to g and reprocessed.
69 | ^k → | g ; # Beginning of the string. | |
729e4ab9 | 70 | k → ᄏ ; # Everywhere else. |
2ca993e8 A |
71 | # |
72 | # | |
729e4ab9 A |
73 | sh → | sy ; # Rewritten so the y-vowel rules supply the vowel (shi becomes s + yi).
74 | su → 스 ; # Emits the whole syllable with ᅳ rather than ᅮ. | |
75 | s → ᄉ ; | |
2ca993e8 A |
76 | # |
77 | # | |
51004dcb A |
78 | te\~ → | t ; # テュ
79 | to\~ → | t ; # トゥ | |
80 | tsu\~ → | ch ; # ツァ, ツィ, etc. | |
729e4ab9 | 81 | tsu → 쓰 ; # Plain tsu is emitted as a whole syllable. |
51004dcb A |
82 | ts → | ch ; # Any other ts is treated as ch.
83 | ' ' { t → | d ; # Word-initial t (after space) is rewritten to d. | |
84 | ^t → | d ; # Same at the beginning of the string. | |
729e4ab9 A |
85 | t → ᄐ ; # Everywhere else.
86 | ' ' { ch → | j ; # Word-initial ch (after space) is rewritten to j. | |
51004dcb | 87 | ^ch → | j ; # Same at the beginning of the string. |
729e4ab9 | 88 | ch → ᄎ ; # Everywhere else. |
2ca993e8 A |
89 | # |
90 | # | |
729e4ab9 A |
91 | n } [\ \-\'bcdfghjkmnprstvwz] → ᆫ ; # Syllable-final n: before a space, hyphen, apostrophe or consonant (v and hyphen included so "nv" and "n-" do not leave a stray initial ᄂ).
92 | n$ → ᆫ ; # Syllable-final n at the end of the text. | |
93 | n → ᄂ ; # Otherwise n starts a syllable. | |
2ca993e8 A |
94 | # |
95 | # | |
729e4ab9 | 96 | h → ᄒ ; |
51004dcb A |
97 | fu\~ → | p ; # フュ
98 | fu → | hu ; # Plain fu is treated as hu. | |
99 | f → | p ; # Any other f is treated as p. | |
2ca993e8 A |
100 | # |
101 | # | |
729e4ab9 A |
102 | m } [bmp] → ᆫ ; # m before b, m or p becomes final ᆫ, the same jamo as syllable-final n.
103 | m → ᄆ ; # Otherwise m starts a syllable. | |
2ca993e8 A |
104 | # |
105 | # | |
729e4ab9 | 106 | ya → ᅣ ; |
51004dcb | 107 | yi → ᅵ ; # Added for convenience, after shi (sh is rewritten to sy, so shi arrives here as yi). |
729e4ab9 A |
108 | yu → ᅲ ;
109 | ye → ᅨ ; | |
110 | yo → ᅭ ; | |
2ca993e8 A |
111 | # |
112 | # | |
729e4ab9 | 113 | r → ᄅ ; |
2ca993e8 A |
114 | # |
115 | # | |
729e4ab9 A |
116 | wa → ᅪ ;
117 | w → ; # Any other w is dropped. | |
2ca993e8 A |
118 | # |
119 | # | |
729e4ab9 | 120 | g → ᄀ ; |
2ca993e8 A |
121 | # |
122 | # | |
729e4ab9 A |
123 | zu → 즈 ; # Emits the whole syllable with ᅳ rather than ᅮ.
124 | z → | j ; # Any other z is treated as j. | |
125 | j → ᄌ ; | |
2ca993e8 A |
126 | # |
127 | # | |
51004dcb A |
128 | de\~ → | d ; # デュ
129 | dji\~ → | j ; # ヂァ, ヂゥ, etc. | |
130 | dji → | ji ; # ヂ | |
131 | do\~ → | d ; # ドゥ | |
132 | dzu\~ → | j ; # ヅァ, ヅィ, etc. | |
133 | dzu → | zu ; # ヅ | |
134 | dz → | j ; # Any other dz is treated as j. | |
729e4ab9 | 135 | d → ᄃ ; |
2ca993e8 A |
136 | # |
137 | # | |
729e4ab9 | 138 | b → ᄇ ; |
51004dcb A |
139 | vu\~ → | b ; # ヴァ, etc.
140 | v → | b ; # Any other v is treated as b. | |
2ca993e8 A |
141 | # |
142 | # | |
729e4ab9 | 143 | p → ᄑ ; |
2ca993e8 A |
144 | # |
145 | # | |
729e4ab9 | 146 | ::NFC(NFD); # Recompose the emitted jamo into precomposed Hangul syllables (NFD is the inverse-direction counterpart). |
2ca993e8 | 147 |