tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

blt_blt_FONIPA.txt (5111B)


      1 # © 2016 and later: Unicode, Inc. and others.
      2 # License & terms of use: http://www.unicode.org/copyright.html
      3 # Generated using tools/cldr/cldr-to-icu/
      4 #
      5 # File: blt_blt_FONIPA.txt
      6 # Generated from CLDR
      7 #
      8 
      9 # Output phonemes
     10 # ---------------
     11 # Nasals:           m mʷ n nʷ ɲ ɲʷ ŋ ŋʷ
     12 # Plosives:         p pʰ pʰʷ pʷ b t tʷ tʰ d dʷ k kʰ kʰʷ kʷ ɡ ɡʷ ʔ
     13 # Fricatives:       f fʷ v s sʷ h hʷ x xʷ
     14 # Other consonants: w j l r
     15 # Affricates:       t\u0361ɕ t\u0361ɕʷ t\u0361ɕʰ t\u0361ɕʰʷ
     16 # Vowels:           i ɨ u ɛ e ə ɔ o a aː
     17 # Diphthongs:       iə\u032F ɨə\u032F uə\u032F ai\u032F
     18 # Tones:            ˨ ˧˥ ˨˩ ˥ ˦ ˧˩
     19 #
     20 #
     21 # Limitations
     22 # -----------
     23 # Currently, these rules only support the tone marks U+AABF and U+AAC1, but not tone letters.
     24 #
     25 #
     26 # References
     27 # ----------
     28 # [1] Jim Brase, SIL International: Proposal to encode the Tai Viet script
     29 #     in the UCS. ISO/IEC JTC1/SC2/WG2 N3220. March 20, 2007.
     30 #     http://std.dkuug.dk/jtc1/sc2/wg2/docs/n3220.pdf
     31 #
     32 # [2] ScriptSource: Tai Viet Vowels.
     33 #     http://scriptsource.org/entry/eusd5ehysa
     34 #
     35 # [3] ScriptSource: Tai Viet Consonants.
     36 #     http://scriptsource.org/entry/lbwpkrqk7b
     37 #
     38 # [4] http://www.seasite.niu.edu/tai/TaiDam/tones.htm
     39 $LO = [ꪀ ꪂ ꪄ ꪆ ꪈ ꪊ ꪌ ꪎ ꪐ ꪒ ꪔ ꪖ ꪘ ꪚ ꪜ ꪞ ꪠ ꪢ ꪤ ꪦ ꪨ ꪪ ꪬ ꪮ];  # consonant letters whose syllables get tone classes 1–3 below
     40 $HI = [ꪁ ꪃ ꪅ ꪇ ꪉ ꪋ ꪍ ꪏ ꪑ ꪓ ꪕ ꪗ ꪙ ꪛ ꪝ ꪟ ꪡ ꪣ ꪥ ꪧ ꪩ ꪫ ꪭ ꪯ];  # consonant letters whose syllables get tone classes 4–6 below
     41 $C = [$LO $HI];  # any consonant letter
     42 $V1 = [ꪵ ꪶ ꪹ ꪻ ꪼ];  # vowels written before consonant
     43 $V2 = [ \uAAB0 \uAAB2 \uAAB3 \uAAB4 \uAAB7 \uAAB8 \uAABE];  # vowels written above or below consonant
     44 $V3 = [ꪱ ꪮ ꪺ ꪽ];  # vowels written after consonant
     45 $DIGRAPHS = [{ꪹ  \uAAB8} {ꪹ  \uAAB7} {ꪹ ꪱ}];  # two-letter vowel spellings, converted as units by the digraph rules
     46 $V12 = [$V1 $V2 $DIGRAPHS];  # vowel spellings that the tone rules expect before a tone mark
     47 $V123 = [$V12 $V3];  # any vowel spelling
     48 $W = [ꪫ];  # labialization marker
     49 $F = [$C]; # syllable-final consonant
     50 $IPA_TONE = [˥ ˦ ˧ ˨ ˩];  # IPA tone letters emitted by the tone rules
     51 $NOT_IPA_TONE = [^$IPA_TONE];  # any character that is not one of those tone letters
     52 $BOUNDARY = [^[:L:][:M:][:N:]];  # any character that is not a letter, mark or number
     53 # Consonant letters at the end of “checked” syllables (converted below to p, pʰ, t, tʰ, k, kʰ, ʔ).
     54 $CHK = [ꪜ ꪝ ꪞ ꪟ ꪔ ꪕ ꪖ ꪗ ꪀ ꪁ ꪂ ꪃ ꪮ ꪯ];
     55 # The Tai Viet script uses visual ordering. Convert to logical order (consonant first, then vowel).
     56 ($V1) ($C $W?) → $2 $1;  # $1 = prevowel, $2 = consonant plus optional labialization marker; swap them
     57 ::null;  # pass separator: the rules below operate on the reordered text
     58 # Special handling for stand-alone ꪽ ‘that’: emitted as a complete syllable with its tone.
     59 $BOUNDARY {ꪽ} $BOUNDARY → nan˧˩;  # fires only when the characters on both sides match $BOUNDARY
     60 # Convert tones for checked syllables (those ending in /p/, /t/, /k/, /ʔ/): no tone mark is matched; the tone letters are appended after the $CHK final.
     61 $LO $W? $V12 {($CHK)} → $1 ˧˥;  # Tone class 2: High-rising tone (vowel precedes the final as context)
     62 $LO $W? {($V3 $CHK)} → $1 ˧˥;  # Tone class 2: High-rising tone (V3 vowel is part of the match)
     63 $HI $W? $V12 {($CHK)} → $1 ˦;  # Tone class 5: High-mid tone (vowel precedes the final as context)
     64 $HI $W? {($V3 $CHK)} → $1 ˦;  # Tone class 5: High-mid tone (V3 vowel is part of the match)
     65 # Convert tones for unchecked syllables with vowels that are written
     66 # after the consonant (V3): the tone mark before the vowel is dropped and the tone letters follow the vowel and optional final.
     67 # TODO: Also support tone letters, not just tone marks.
     68 $LO $W? { \uAABF ($V3 $F?)} → $1 ˧˥;  # Tone class 2: High-rising tone
     69 $LO $W? { \uAAC1 ($V3 $F?)} → $1 ˨˩;  # Tone class 3: Low-falling tone
     70 $HI $W? { \uAABF ($V3 $F?)} → $1 ˦;   # Tone class 5: High-mid tone
     71 $HI $W? { \uAAC1 ($V3 $F?)} → $1 ˧˩;  # Tone class 6: Mid-falling tone
     72 # Convert tones for unchecked syllables with vowels that are either written
     73 # before the consonant (V1) or vowels that are written above or below it (V2): the tone mark after the vowel is dropped and the tone letters follow the optional final.
     74 # TODO: Also support tone letters, not just tone marks.
     75 $LO $W? $V12 { \uAABF ($F?)} → $1 ˧˥;  # Tone class 2: High-rising tone
     76 $LO $W? $V12 { \uAAC1 ($F?)} → $1 ˨˩;  # Tone class 3: Low-falling tone
     77 $HI $W? $V12 { \uAABF ($F?)} → $1 ˦;   # Tone class 5: High-mid tone
     78 $HI $W? $V12 { \uAAC1 ($F?)} → $1 ˧˩;  # Tone class 6: Mid-falling tone
     79 ::null;  # pass separator: explicit tones are all in place before defaults are assigned
     80 {($LO $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˨;  # Tone class 1: Low-mid tone. Applied when the syllable is not already followed by a tone letter.
     81 {($HI $W? $V123 $F?)} $NOT_IPA_TONE → $1 ˥;  # Tone class 4: High tone. Applied when the syllable is not already followed by a tone letter.
     82 ::null;  # pass separator: every matched syllable now carries tone letters
     83 # Harden syllable-final consonants.
     84 $C $W? $V123 {ꪒ} → ꪔ;  # /d/ → /t/: ꪒ after consonant + vowel becomes ꪔ, which the consonant rules below turn into t
     85 ::null;
     86 # Convert labialization marker.
     87 $C {$W} $V123 → ʷ;  # only between a consonant and a vowel; any other ꪫ is left for the consonant rules below
     88 ::null;
     89 [ꪀ ꪁ] → k;  # each rule in this group maps a $LO/$HI letter pair to one IPA consonant
     90 [ꪂ ꪃ] → kʰ;  # Tai Dón; not used in Tai Dam according to [3]
     91 [ꪄ ꪅ] → x;
     92 [ꪆ ꪇ] → ɡ;  # only in loanwords, according to [3]
     93 [ꪈ ꪉ] → ŋ;
     94 [ꪊ ꪋ] → t\u0361ɕ;  # Tai Dón; not used in Tai Dam according to [3]
     95 [ꪌ ꪍ] → t\u0361ɕʰ;  # Tai Dón; not used in Tai Dam according to [3]
     96 [ꪎ ꪏ] → s;
     97 [ꪐ ꪑ] → ɲ;
     98 [ꪒ ꪓ] → d;
     99 [ꪔ ꪕ] → t;
    100 [ꪖ ꪗ] → tʰ;
    101 [ꪘ ꪙ] → n;
    102 [ꪚ ꪛ] → b;
    103 [ꪜ ꪝ] → p;
    104 [ꪞ ꪟ] → pʰ;  # Tai Dón; not used in Tai Dam according to [3]
    105 [ꪠ ꪡ] → f;
    106 [ꪢ ꪣ] → m;
    107 [ꪤ ꪥ] → j;
    108 [ꪦ ꪧ] → r;  # only in loanwords, according to [3]
    109 [ꪨ ꪩ] → l;
    110 {[ꪪ ꪫ]} $IPA_TONE → w;  # at the end of a syllable (before tone letters)
    111 [ꪪ ꪫ] → v;  # not at the end of a syllable
    112 [ꪬ ꪭ] → h;
    113 ʔ {[ꪮ ꪯ]} → ɔ;  # directly after an already-converted ʔ the letter is the vowel ɔ, e.g. ꪮꪮꪀ
    114 [ꪮ ꪯ] → ʔ;  # otherwise the letter is the glottal stop
    115 # Digraphs. Listed before the single vowels so that each pair is converted as a unit.
    116 ꪹ  \uAAB8 → e;
    117 ꪹ  \uAAB7 → ə;
    118 ꪹ ꪱ → aːw;
    119 # Vowels (single letters and marks).
    120 \uAAB0 → a;
    121 ꪱ → aː;
    122 \uAAB2 → i;
    123 \uAAB3 → ɨ;
    124 \uAAB4 → u;
    125 ꪵ → ɛ;
    126 ꪶ → o;
    127 \uAAB7 → ɔ;
    128 ꪮ → ɔ;  # NOTE(review): ꪮ looks already consumed by the earlier [ꪮ ꪯ] rules in this pass — confirm this rule is reachable
    129 ꪺ → uə\u032F;
    130 ꪽ → an;  # vowel sign that includes a final /n/
    131 ꪹ → ɨə\u032F;  # ꪹ on its own, i.e. not part of a digraph above
    132 \uAAB8 → iə\u032F;  # \uAAB8 on its own, i.e. not part of a digraph above
    133 ꪻ → əw;
    134 ꪼ → ai\u032F;
    135 \uAABE → am;  # vowel sign that includes a final /m/
    136 # Word ligature symbols: each expands to a whole syllable including its tone letter.
    137 ꫛ → kon˥;
    138 ꫜ → nɨŋ˦;