1 # ***************************************************************************
3 # * Copyright (C) 2004-2016, International Business Machines
4 # * Corporation; Unicode, Inc.; and others. All Rights Reserved.
6 # ***************************************************************************
11 # Italian to Katakana Transliteration Table for ICU
13 # "現代イタリア語入門" (大学書林, 1974. ISBN:978-4475017176)
14 # http://ja.wikipedia.org/wiki/%E3%82%A4%E3%82%BF%E3%83%AA%E3%82%A2%E8%AA%9E
17 ::[:Latin:] fullwidth-halfwidth();  # Pre-pass: run Fullwidth-Halfwidth on Latin-script characters only; the empty "()" applies nothing in the reverse direction.
22 $consonant = [bcdfghjklmnpqrstvwxyz];  # Lowercase Latin letters other than a, e, i, o, u.
26 ($consonant) \' → | $1;  # Drop an apostrophe that follows a consonant; '|' leaves the cursor before the kept consonant so later rules see it again.
159 # 's' is voiced before [bdglmnrv].
170 # Force 's' after a consonant to be unvoiced.
171 ($consonant) s } $vowel → | $1 \~ s;  # Insert a literal '~' before an 's' that follows a consonant and precedes a vowel, then rescan from the consonant. $vowel is defined outside this excerpt; '~' is presumably an "unvoiced" marker handled by later rules (TODO confirm).
179 # 's' at the beginning of a word (i.e. preceded by a non-letter) is usually unvoiced.
180 [:^Letter:] { sa → サ;
181 [:^Letter:] { si → シ;
182 [:^Letter:] { su → ス;
183 [:^Letter:] { se → セ;
184 [:^Letter:] { so → ソ;
187 # Otherwise, voiced 's' is common.
202 # Force 'z' after a consonant to be unvoiced.
203 ($consonant) z → | $1 \~z;  # Insert a literal '~' before a 'z' that follows a consonant, then rescan from the consonant; '~' is presumably an "unvoiced" marker handled by later rules (TODO confirm).
211 # Otherwise, voiced 'z' is common, except for 'zi'.
213 [:^Letter:] { zi → ジ;  # 'zi' preceded by a non-letter becomes ジ.
225 # Standalone vowels and consonants.
254 # The word delimiter in a transliterated foreign phrase is '・'.
258 # Latin hyphen should be transliterated to U+30A0 (KATAKANA-HIRAGANA
259 # DOUBLE HYPHEN), ideally. But since the character isn't supported by
260 # many fonts or software, we use U+FF1D (FULLWIDTH EQUALS SIGN),
261 # which is widely used as "double hyphen".
266 [:nonspacing mark:] → ;  # Delete every character whose general category is Nonspacing_Mark (combining marks such as accents).