tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

xh_xh_FONIPA.txt (2114B)


      1 # © 2016 and later: Unicode, Inc. and others.
      2 # License & terms of use: http://www.unicode.org/copyright.html
      3 # Generated using tools/cldr/cldr-to-icu/
      4 #
      5 # File: xh_xh_FONIPA.txt
      6 # Generated from CLDR
      7 #
      8 
      9 # Pronunciation rules for isiXhosa.
     10 #
     11 # Author: mjansche@google.com (Martin Jansche)
     12 #
     13 # These rules transcribe isiXhosa into the phoneme inventory used within the
     14 # NCHLT Speech Corpus (https://sites.google.com/site/nchltspeechcorpus/home).
     15 #
     16 # The rules were tested using the NCHLT-inlang isiXhosa pronunciation dictionary
     17 # (http://rma.nwu.ac.za/index.php/resource-catalogue/nchlt-inlang-dictionaries.html).
     18 # They correctly account for 14,999 out of 15,000 entries in the dictionary.
     19 #
     20 # The NCHLT 2013 phone set does not distinguish short and long vowels and does
     21 # not indicate tone in any way. Transcription of tone is out of scope without a
     22 # dictionary, since tone is generally not indicated in the orthography. Nasal
     23 # clicks are not treated as separate phonemes in the NCHLT 2013 phone set and
     24 # are transcribed as a sequence of nasal plus click instead.
     25 #
     26 # One minor notational deviation from the NCHLT 2013 phone set is that we use a
     27 # tie bar within the complex (slack voiced) clicks, e.g. ɡ\u0361ǀ instead of ɡǀ, to
     28 # avoid ambiguity and make the phoneme inventory uniquely decodable.
     29 ::Lower;  # lowercase the input first; every rule below matches lowercase letters only
     30 nyh → ɲʰ;  # multi-letter graphemes are listed before the shorter ones they start with (nyh before ny)
     31 n { tsh → t\u0361ʃʼ;  # <tsh> preceded by n is ejective rather than aspirated; must stay above the plain tsh rule
     32 tsh → t\u0361ʃʰ;
     33 tyh → cʰ;
     34 bh → bʰ;
     35 ch → ǀʰ;
     36 dl → ɮ;
     37 dy → ɟ;
     38 gc → ɡ\u0361ǀ;
     39 gq → ɡ\u0361ǃ;
     40 gr → ɣ;
     41 gx → ɡ\u0361ǁ;
     42 hl → ɬ;
     43 kh → kʰ;
     44 kr → k\u0361x;
     45 mh } [^l] → mʰ;  # <mhl> denotes /mɬ/ instead
     46 nh → nʰ;
     47 ny → ɲ;
     48 ph → pʰ;
     49 qh → ǃʰ;
     50 sh → ʃ;
     51 th → tʰ;
     52 tl → t\u0361ɬʼ;
     53 ts → t\u0361sʼ;
     54 ty → cʼ;
     55 xh → ǁʰ;
     56 aa → | a;  # doubled vowel collapses to one; "|" leaves the cursor before the result so the single-letter rules below rewrite it
     57 ee → | e;
     58 ii → | i;
     59 kc → | c;  # k is dropped before c; the remaining c is re-processed by the c rules
     60 kq → | q;  # likewise for q
     61 mm → | m;  # doubled m collapses to one m, then re-processed
     62 oo → | o;
     63 rh → | r;  # h is dropped after r; the remaining r is re-processed
     64 uu → | u;
     65 a → a;  # single letters: reached only when no multi-letter rule above matched at this position
     66 b → ɓ;
     67 c → ǀ;
     68 d → d;
     69 e → ɛ;
     70 f → f;
     71 g → ɡ;
     72 h → h;
     73 i → i;
     74 j → d\u0361ʒ;
     75 k → kʼ;
     76 l → l;
     77 m → m;
     78 n } g → ŋ;  # n directly before g becomes ŋ; "}" makes g context only, so g is still transcribed by its own rules
     79 n → n;
     80 o → ɔ;
     81 p → pʼ;
     82 q → ǃ;
     83 r → r;
     84 s → s;
     85 t → tʼ;
     86 u → u;
     87 v → v;
     88 w → w;
     89 x → ǁ;
     90 y → j;
     91 z → z;