<?xml version="1.0" encoding="UTF-8" ?>
<!DOCTYPE supplementalData SYSTEM "../../common/dtd/ldmlSupplemental.dtd">
<!-- Copyright © 1991-2015 Unicode, Inc.
CLDR data files are interpreted according to the LDML specification (http://unicode.org/reports/tr35/)
For terms of use, see http://www.unicode.org/copyright.html -->
<supplementalData>
	<version number="$Revision: 12347 $" />
	<transforms>
		<transform source="xh" target="xh_FONIPA" direction="forward" alias="xh-fonipa-t-xh">
			<tRule><![CDATA[
# Pronunciation rules for isiXhosa.
#
# Author: mjansche@google.com (Martin Jansche)
#
# These rules transcribe isiXhosa into the phoneme inventory used within the
# NCHLT Speech Corpus (https://sites.google.com/site/nchltspeechcorpus/home).
#
# The rules were tested using the NCHLT-inlang isiXhosa pronunciation dictionary
# (http://rma.nwu.ac.za/index.php/resource-catalogue/nchlt-inlang-dictionaries.html).
# They correctly account for 14,999 out of 15,000 entries in the dictionary.
#
# The NCHLT 2013 phone set does not distinguish short and long vowels and does
# not indicate tone in any way. Transcription of tone is out of scope without a
# dictionary, since tone is generally not indicated in the orthography. Nasal
# clicks are not treated as separate phonemes in the NCHLT 2013 phone set and
# are transcribed as a sequence of nasal plus click instead.
#
# One minor notational deviation from the NCHLT 2013 phone set is that we use a
# tie bar within the complex (slack voiced) clicks, e.g. ɡ͡ǀ instead of ɡǀ, to
# avoid ambiguity and make the phoneme inventory uniquely decodable.
#
# Rule order matters: at each position the first matching rule is applied, so
# longer graphemes (trigraphs, then digraphs) are listed before the shorter
# graphemes they contain.

# Normalize the input to lower case before any rule below is applied.
::Lower;

# Trigraphs. "n {" is a preceding context: <tsh> directly after <n> maps to
# t͡ʃʼ, and <tsh> anywhere else maps to t͡ʃʰ.
nyh → ɲʰ;
n { tsh → t͡ʃʼ;
    tsh → t͡ʃʰ;
tyh → cʰ;

# Digraphs. "} [^l]" is a following context: <mh> is rewritten only when the
# next character is something other than <l>.
bh → bʰ;
ch → ǀʰ;
dl → ɮ;
dy → ɟ;
gc → ɡ͡ǀ;
gq → ɡ͡ǃ;
gr → ɣ;
gx → ɡ͡ǁ;
hl → ɬ;
kh → kʰ;
kr → k͡x;
mh } [^l] → mʰ;  # <mhl> denotes /mɬ/ instead
nh → nʰ;
ny → ɲ;
ph → pʰ;
qh → ǃʰ;
sh → ʃ;
th → tʰ;
tl → t͡ɬʼ;
ts → t͡sʼ;
ty → cʼ;
xh → ǁʰ;

# Reductions. The "|" puts the cursor in front of the replacement, so the
# single letter that is written out is matched again by the rules in this file.
aa → | a;
ee → | e;
ii → | i;
kc → | c;
kq → | q;
mm → | m;
oo → | o;
rh → | r;
uu → | u;

# Single letters. "n } g" rewrites <n> to ŋ only when <g> follows; the <g>
# itself is context and is left for the following rules.
a → a;
b → ɓ;
c → ǀ;
d → d;
e → ɛ;
f → f;
g → ɡ;
h → h;
i → i;
j → d͡ʒ;
k → kʼ;
l → l;
m → m;
n } g → ŋ;
n → n;
o → ɔ;
p → pʼ;
q → ǃ;
r → r;
s → s;
t → tʼ;
u → u;
v → v;
w → w;
x → ǁ;
y → j;
z → z;
			]]></tRule>
		</transform>
	</transforms>
</supplementalData>