]> git.saurik.com Git - apple/icu.git/blame - icuSources/data/translit/xh_xh_FONIPA.txt
ICU-57163.0.1.tar.gz
[apple/icu.git] / icuSources / data / translit / xh_xh_FONIPA.txt
CommitLineData
2ca993e8
A
1# ***************************************************************************
2# *
3# * Copyright (C) 2004-2016, International Business Machines
4# * Corporation; Unicode, Inc.; and others. All Rights Reserved.
5# *
6# ***************************************************************************
7# File: xh_xh_FONIPA.txt
8# Generated from CLDR
9#
10
11# Pronunciation rules for isiXhosa.
12#
13# Author: mjansche@google.com (Martin Jansche)
14#
15# These rules transcribe isiXhosa into the phoneme inventory used within the
16# NCHLT Speech Corpus (https://sites.google.com/site/nchltspeechcorpus/home).
17#
18# The rules were tested using the NCHLT-inlang isiXhosa pronunciation dictionary
19# (http://rma.nwu.ac.za/index.php/resource-catalogue/nchlt-inlang-dictionaries.html).
20# They correctly account for 14,999 out of 15,000 entries in the dictionary.
21#
22# The NCHLT 2013 phone set does not distinguish short and long vowels and does
23# not indicate tone in any way. Transcription of tone is out of scope without a
24# dictionary, since tone is generally not indicated in the orthography. Nasal
25# clicks are not treated as separate phonemes in the NCHLT 2013 phone set and
26# are transcribed as a sequence of nasal plus click instead.
27#
28# One minor notational deviation from the NCHLT 2013 phone set is that we use a
29# tie bar within the complex (slack voiced) clicks, e.g. ɡ\u0361ǀ instead of ɡǀ, to
30# avoid ambiguity and make the phoneme inventory uniquely decodable.
31::Lower; # lowercase the input first; every rule below is written with lowercase letters
32nyh → ɲʰ; # rules are tried top to bottom, so trigraphs are listed before the digraphs they contain (nyh before ny / nh)
33n { tsh → t\u0361ʃʼ; # "n {" is left context: tsh directly after n maps to the ʼ form; must precede the plain tsh rule
34tsh → t\u0361ʃʰ; # tsh in any other position maps to the ʰ form
35tyh → cʰ; # listed before ty / th so the three-letter spelling wins
36bh → bʰ; # digraph rules start here; each must appear before the single-letter rules for its first letter
37ch → ǀʰ;
38dl → ɮ;
39dy → ɟ;
40gc → ɡ\u0361ǀ; # gc / gq / gx: output uses a tie bar (\u0361) between ɡ and the click symbol
41gq → ɡ\u0361ǃ;
42gr → ɣ;
43gx → ɡ\u0361ǁ;
44hl → ɬ;
45kh → kʰ;
46kr → k\u0361x;
47mh } [^l] → mʰ; # <mhl> denotes /mɬ/ instead
48nh → nʰ;
49ny → ɲ;
50ph → pʰ;
51qh → ǃʰ;
52sh → ʃ;
53th → tʰ;
54tl → t\u0361ɬʼ;
55ts → t\u0361sʼ; # reached only when the tsh rules above did not match
56ty → cʼ; # reached only when the tyh rule above did not match
57xh → ǁʰ;
58aa → | a; # "|" places the cursor before the replacement, so the single letter is scanned again by the rule set
59ee → | e; # doubled vowels are reduced to one letter and then transcribed by the single-letter rules
60ii → | i;
61kc → | c; # k is dropped before c; the remaining c is scanned again
62kq → | q; # k is dropped before q; the remaining q is scanned again
63mm → | m; # doubled m is reduced to a single m
64oo → | o;
65rh → | r; # h is dropped after r; the remaining r is scanned again
66uu → | u;
67a → a; # single-letter fallbacks: reached only when no multi-letter rule above matched at this position
68b → ɓ;
69c → ǀ;
70d → d;
71e → ɛ;
72f → f;
73g → ɡ;
74h → h;
75i → i;
76j → d\u0361ʒ;
77k → kʼ;
78l → l;
79m → m;
80n } g → ŋ; # "} g" is right context: n before g maps to ŋ and the g itself is left for later rules; must precede the plain n rule
81n → n;
82o → ɔ;
83p → pʼ;
84q → ǃ;
85r → r;
86s → s;
87t → tʼ;
88u → u;
89v → v;
90w → w;
91x → ǁ;
92y → j;
93z → z;
94