und_FONIPA_und_FONXSAMP.txt (11278B)
# © 2016 and later: Unicode, Inc. and others.
# License & terms of use: http://www.unicode.org/copyright.html
# Generated using tools/cldr/cldr-to-icu/
#
# File: und_FONIPA_und_FONXSAMP.txt
# Generated from CLDR
#

# Conversion between IPA and X-SAMPA phonetic transcription.
#
# See http://www.phon.ucl.ac.uk/home/sampa/x-sampa.htm for a description of
# X-SAMPA, an ASCII encoding of the International Phonetic Alphabet.
#
# The following obsolete or extended IPA symbols have no X-SAMPA equivalents
# and remain unaffected by this transform:
#
#     ʞ LATIN SMALL LETTER TURNED K
#     ʩ LATIN SMALL LETTER FENG DIGRAPH
#     ʪ LATIN SMALL LETTER LS DIGRAPH
#     ʫ LATIN SMALL LETTER LZ DIGRAPH
#     ʬ LATIN LETTER BILABIAL PERCUSSIVE
#     ʭ LATIN LETTER BIDENTAL PERCUSSIVE
#
# An IPA tie bar is transformed to an X-SAMPA underscore, per the official
# X-SAMPA guidelines. This can result in certain ambiguities: For example, the
# labial-velar nasal (http://en.wikipedia.org/wiki/Labial-velar_nasal) can be
# written either as [ŋ\u0361m] or as [m\u0361ŋ] in IPA. However, neither version
# can be represented unambiguously in X-SAMPA: IPA [ŋ\u0361m] becomes X-SAMPA
# [N_m], which is also used to represent a hypothetical laminal (_m) velar
# nasal, IPA [ŋ\u033B]; and IPA [m\u0361ŋ] becomes X-SAMPA [m_N], which can also
# represent a linguolabial (_N) nasal, IPA [m\u033C], which is more
# appropriately written [n\u033C]. To avoid unintended ambiguities, it may
# therefore be advisable to write affricates without tie bars.
#
# NOTE: every statement must stay on its own physical line. A '#' comment runs
# to the end of the line, so joining lines would comment out whatever follows.
$t = '_'; # X-SAMPA representation of IPA tie bar.
# Rule notation used below:
#     a ↔ b;   applies in both directions (IPA → X-SAMPA and X-SAMPA → IPA)
#     a ← b;   applies only when converting X-SAMPA back to IPA
#     a → b;   applies only when converting IPA to X-SAMPA
# IPA is always on the left-hand side, X-SAMPA on the right-hand side.
#
# Sections are ordered from the longest X-SAMPA sequence to the shortest.
# Rules are tried in file order, so a longer sequence must be listed before
# any shorter sequence that is a prefix of it (for example 'G\_<' before 'G\').
# Do not reorder rules, and keep each rule on its own line: a '#' comment runs
# to the end of the line and would swallow any rule that follows it.

# Forward direction: decompose the input first (the inverse direction
# applies NFC at this point instead).
::NFD(NFC);

# 5-character X-SAMPA representations
ʯ ↔ 'z`_w='; # LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL

# Alternative 5-character X-SAMPA representations
n\u031F\u030A ← 'n_+_0';
n\u0320\u030A ← 'n_-_0';
n\u032A\u030A ← 'n_d_0';
n\u033A\u030A ← 'n_a_0';
n\u033B\u030A ← 'n_m_0';
n\u033C\u030A ← 'n_N_0';
ɻ\u030A ← 'r\`_0';

# 4-character X-SAMPA representations
ǁ ↔ '|\|\'; # LATIN LETTER LATERAL CLICK
ʄ ↔ 'J\_<'; # LATIN SMALL LETTER DOTLESS J WITH STROKE AND HOOK
ʛ ↔ 'G\_<'; # LATIN LETTER SMALL CAPITAL G WITH HOOK
ʮ ↔ 'z_w='; # LATIN SMALL LETTER TURNED H WITH FISHHOOK
\u1DC4 ↔ '_H_T'; # COMBINING MACRON-ACUTE
\u1DC5 ↔ '_B_L'; # COMBINING GRAVE-MACRON
\u1DC8 ↔ '_R_F'; # COMBINING GRAVE-ACUTE-GRAVE

# Alternative 4-character X-SAMPA representations
ɭ\u030A ← 'l`_0';
ɰ\u030A ← 'M\_0';
ɳ\u030A ← 'n`_0';
ɽ\u030A ← 'r`_0';

# 3-character X-SAMPA representations
ɓ ↔ 'b_<'; # LATIN SMALL LETTER B WITH HOOK
ɗ ↔ 'd_<'; # LATIN SMALL LETTER D WITH HOOK
ɠ ↔ 'g_<'; # LATIN SMALL LETTER G WITH HOOK
ɻ ↔ 'r\`'; # LATIN SMALL LETTER TURNED R WITH HOOK
↗ ↔ '<R>'; # NORTH EAST ARROW
↘ ↔ '<F>'; # SOUTH EAST ARROW

# Alternative 3-character X-SAMPA representations
j\u030A ← 'j_0';
ŋ\u030A ← 'N_0';
ɥ\u030A ← 'H_0';
ɱ\u030A ← 'F_0';
ɲ\u030A ← 'J_0';

# 2-character X-SAMPA representations
ħ ↔ 'X\'; # LATIN SMALL LETTER H WITH STROKE
ǀ ↔ '|\'; # LATIN LETTER DENTAL CLICK
ǂ ↔ '=\'; # LATIN LETTER ALVEOLAR CLICK
ǃ ↔ '!\'; # LATIN LETTER RETROFLEX CLICK
ɕ ↔ 's\'; # LATIN SMALL LETTER C WITH CURL
ɖ ↔ 'd`'; # LATIN SMALL LETTER D WITH TAIL
ɘ ↔ '@\'; # LATIN SMALL LETTER REVERSED E
ɚ ↔ '@`'; # LATIN SMALL LETTER SCHWA WITH HOOK
ɝ ↔ '3`'; # LATIN SMALL LETTER REVERSED OPEN E WITH HOOK
ɞ ↔ '3\'; # LATIN SMALL LETTER CLOSED REVERSED OPEN E
ɟ ↔ 'J\'; # LATIN SMALL LETTER DOTLESS J WITH STROKE
ɢ ↔ 'G\'; # LATIN LETTER SMALL CAPITAL G
ɦ ↔ 'h\'; # LATIN SMALL LETTER H WITH HOOK
ɧ ↔ 'x\'; # LATIN SMALL LETTER HENG WITH HOOK
ɭ ↔ 'l`'; # LATIN SMALL LETTER L WITH RETROFLEX HOOK
ɮ ↔ 'K\'; # LATIN SMALL LETTER LEZH
ɰ ↔ 'M\'; # LATIN SMALL LETTER TURNED M WITH LONG LEG
ɳ ↔ 'n`'; # LATIN SMALL LETTER N WITH RETROFLEX HOOK
ɴ ↔ 'N\'; # LATIN LETTER SMALL CAPITAL N
ɸ ↔ 'p\'; # LATIN SMALL LETTER PHI
ɹ ↔ 'r\'; # LATIN SMALL LETTER TURNED R
ɺ ↔ 'l\'; # LATIN SMALL LETTER TURNED R WITH LONG LEG
ɽ ↔ 'r`'; # LATIN SMALL LETTER R WITH TAIL
ʀ ↔ 'R\'; # LATIN LETTER SMALL CAPITAL R
ʂ ↔ 's`'; # LATIN SMALL LETTER S WITH HOOK
ʈ ↔ 't`'; # LATIN SMALL LETTER T WITH RETROFLEX HOOK
ʐ ↔ 'z`'; # LATIN SMALL LETTER Z WITH RETROFLEX HOOK
ʑ ↔ 'z\'; # LATIN SMALL LETTER Z WITH CURL
ʕ ↔ '?\'; # LATIN LETTER PHARYNGEAL VOICED FRICATIVE
ʘ ↔ 'O\'; # LATIN LETTER BILABIAL CLICK
ʙ ↔ 'B\'; # LATIN LETTER SMALL CAPITAL B
ʜ ↔ 'H\'; # LATIN LETTER SMALL CAPITAL H
ʝ ↔ 'j\'; # LATIN SMALL LETTER J WITH CROSSED-TAIL
ʟ ↔ 'L\'; # LATIN LETTER SMALL CAPITAL L
ʡ ↔ '>\'; # LATIN LETTER GLOTTAL STOP WITH STROKE
ʢ ↔ '<\'; # LATIN LETTER REVERSED GLOTTAL STOP WITH STROKE
ʰ ↔ '_h'; # MODIFIER LETTER SMALL H
ʷ ↔ '_w'; # MODIFIER LETTER SMALL W
ʼ ↔ '_>'; # MODIFIER LETTER APOSTROPHE
ˆ ↔ '_\'; # MODIFIER LETTER CIRCUMFLEX ACCENT
ˇ ↔ '_/'; # CARON
ˑ ↔ ':\'; # MODIFIER LETTER HALF TRIANGULAR COLON
ˠ ↔ '_G'; # MODIFIER LETTER SMALL GAMMA
ˡ ↔ '_l'; # MODIFIER LETTER SMALL L
# The next sequence is 3 characters long; it is kept in this section because
# no earlier rule shares its '_?' prefix, so its position does not matter.
ˤ ↔ '_?\'; # MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
\u0300 ↔ '_L'; # COMBINING GRAVE ACCENT
\u0301 ↔ '_H'; # COMBINING ACUTE ACCENT
\u0302 ↔ '_F'; # COMBINING CIRCUMFLEX ACCENT
\u0304 ↔ '_M'; # COMBINING MACRON
\u0306 ↔ '_X'; # COMBINING BREVE
\u0308 ↔ '_"'; # COMBINING DIAERESIS
\u030B ↔ '_T'; # COMBINING DOUBLE ACUTE ACCENT
\u030C ↔ '_R'; # COMBINING CARON
\u030F ↔ '_B'; # COMBINING DOUBLE GRAVE ACCENT
\u0318 ↔ '_A'; # COMBINING LEFT TACK BELOW
\u0319 ↔ '_q'; # COMBINING RIGHT TACK BELOW
\u031A ↔ '_}'; # COMBINING LEFT ANGLE ABOVE
\u031C ↔ '_c'; # COMBINING LEFT HALF RING BELOW
\u031D ↔ '_r'; # COMBINING UP TACK BELOW
\u031E ↔ '_o'; # COMBINING DOWN TACK BELOW
\u031F ↔ '_+'; # COMBINING PLUS SIGN BELOW
\u0320 ↔ '_-'; # COMBINING MINUS SIGN BELOW
\u0324 ↔ '_t'; # COMBINING DIAERESIS BELOW
\u0325 ↔ '_0'; # COMBINING RING BELOW
\u032A ↔ '_d'; # COMBINING BRIDGE BELOW
\u032C ↔ '_v'; # COMBINING CARON BELOW
\u032F ↔ '_^'; # COMBINING INVERTED BREVE BELOW
\u0330 ↔ '_k'; # COMBINING TILDE BELOW
\u0334 ↔ '_e'; # COMBINING TILDE OVERLAY
\u0339 ↔ '_O'; # COMBINING RIGHT HALF RING BELOW
\u033A ↔ '_a'; # COMBINING INVERTED BRIDGE BELOW
\u033B ↔ '_m'; # COMBINING SQUARE BELOW
\u033C ↔ '_N'; # COMBINING SEAGULL BELOW
\u033D ↔ '_x'; # COMBINING X ABOVE
ᵻ ↔ 'I\'; # LATIN SMALL CAPITAL LETTER I WITH STROKE
ᵿ ↔ 'U\'; # LATIN SMALL LETTER UPSILON WITH STROKE
ⁿ ↔ '_n'; # SUPERSCRIPT LATIN SMALL LETTER N

# Alternative 2-character X-SAMPA representations
# (the preferred 1-character forms of these symbols follow further below)
ʋ ← 'v\'; # LATIN SMALL LETTER V WITH HOOK
ʲ ← '_j'; # MODIFIER LETTER SMALL J
\u0303 ← '_~'; # COMBINING TILDE
\u0329 ← '_='; # COMBINING VERTICAL LINE BELOW

# 1-character X-SAMPA representations
c\u0327 ↔ C; # LATIN SMALL LETTER C WITH CEDILLA (decomposed)
æ ↔ '{'; # LATIN SMALL LETTER AE
ð ↔ D; # LATIN SMALL LETTER ETH
ø ↔ 2; # LATIN SMALL LETTER O WITH STROKE
ŋ ↔ N; # LATIN SMALL LETTER ENG
œ ↔ 9; # LATIN SMALL LIGATURE OE
ɐ ↔ 6; # LATIN SMALL LETTER TURNED A
ɑ ↔ A; # LATIN SMALL LETTER ALPHA
ɒ ↔ Q; # LATIN SMALL LETTER TURNED ALPHA
ɔ ↔ O; # LATIN SMALL LETTER OPEN O
ə ↔ '@'; # LATIN SMALL LETTER SCHWA
ɛ ↔ E; # LATIN SMALL LETTER OPEN E
ɜ ↔ 3; # LATIN SMALL LETTER REVERSED OPEN E
ɡ ↔ g; # LATIN SMALL LETTER SCRIPT G
ɣ ↔ G; # LATIN SMALL LETTER GAMMA
ɤ ↔ 7; # LATIN SMALL LETTER RAMS HORN
ɥ ↔ H; # LATIN SMALL LETTER TURNED H
ɨ ↔ 1; # LATIN SMALL LETTER I WITH STROKE
ɪ ↔ I; # LATIN LETTER SMALL CAPITAL I
ɫ ↔ 5; # LATIN SMALL LETTER L WITH MIDDLE TILDE
ɬ ↔ K; # LATIN SMALL LETTER L WITH BELT
ɯ ↔ M; # LATIN SMALL LETTER TURNED M
ɱ ↔ F; # LATIN SMALL LETTER M WITH HOOK
ɲ ↔ J; # LATIN SMALL LETTER N WITH LEFT HOOK
ɵ ↔ 8; # LATIN SMALL LETTER BARRED O
ɶ ↔ '&'; # LATIN LETTER SMALL CAPITAL OE
ɾ ↔ 4; # LATIN SMALL LETTER R WITH FISHHOOK
ʁ ↔ R; # LATIN LETTER SMALL CAPITAL INVERTED R
ʃ ↔ S; # LATIN SMALL LETTER ESH
ʉ ↔ '}'; # LATIN SMALL LETTER U BAR
ʊ ↔ U; # LATIN SMALL LETTER UPSILON
ʋ ↔ P; # LATIN SMALL LETTER V WITH HOOK
ʌ ↔ V; # LATIN SMALL LETTER TURNED V
ʍ ↔ W; # LATIN SMALL LETTER TURNED W
ʎ ↔ L; # LATIN SMALL LETTER TURNED Y
ʏ ↔ Y; # LATIN LETTER SMALL CAPITAL Y
ʒ ↔ Z; # LATIN SMALL LETTER EZH
ʔ ↔ '?'; # LATIN LETTER GLOTTAL STOP
ʲ ↔ \'; # MODIFIER LETTER SMALL J
ˈ ↔ '"'; # MODIFIER LETTER VERTICAL LINE
ˌ ↔ '%'; # MODIFIER LETTER LOW VERTICAL LINE
ː ↔ ':'; # MODIFIER LETTER TRIANGULAR COLON
˞ ↔ '`'; # MODIFIER LETTER RHOTIC HOOK
\u0303 ↔ '~'; # COMBINING TILDE
\u0329 ↔ '='; # COMBINING VERTICAL LINE BELOW
\u0361 ↔ $t; # COMBINING DOUBLE INVERTED BREVE
β ↔ B; # GREEK SMALL LETTER BETA
θ ↔ T; # GREEK SMALL LETTER THETA
χ ↔ X; # GREEK SMALL LETTER CHI
↑ ↔ '^'; # UPWARDS ARROW
↓ ↔ '!'; # DOWNWARDS ARROW

# Compatibility rules for variant or obsolete IPA symbols
# (IPA → X-SAMPA only; the inverse direction never produces these symbols)
g → g; # LATIN SMALL LETTER G (redundant, for additional clarity)
ȵ → J; # LATIN SMALL LETTER N WITH CURL
ɩ → I; # LATIN SMALL LETTER IOTA
ɷ → U; # LATIN SMALL LETTER CLOSED OMEGA
ɼ → 'r_r'; # LATIN SMALL LETTER R WITH LONG LEG
ɿ → 'z='; # LATIN SMALL LETTER REVERSED R WITH FISHHOOK
ʅ → 'z`='; # LATIN SMALL LETTER SQUAT REVERSED ESH
ʆ → S\'; # LATIN SMALL LETTER ESH WITH CURL
ʇ → '|\' ; # LATIN SMALL LETTER TURNED T
ʓ → Z\'; # LATIN SMALL LETTER EZH WITH CURL
ʖ → '|\|\'; # LATIN LETTER INVERTED GLOTTAL STOP
ʗ → '!\'; # LATIN LETTER STRETCHED C
ʚ → '3\'; # LATIN SMALL LETTER CLOSED OPEN E
ʠ → 'G\_<_0'; # LATIN SMALL LETTER Q WITH HOOK
ʣ → d $t z; # LATIN SMALL LETTER DZ DIGRAPH
ʤ → d $t Z; # LATIN SMALL LETTER DEZH DIGRAPH
ʥ → d $t 'z\'; # LATIN SMALL LETTER DZ DIGRAPH WITH CURL
ʦ → t $t s; # LATIN SMALL LETTER TS DIGRAPH
ʧ → t $t S; # LATIN SMALL LETTER TESH DIGRAPH
ʨ → t $t 's\'; # LATIN SMALL LETTER TC DIGRAPH WITH CURL
˔ → '_r'; # MODIFIER LETTER UP TACK
˕ → '_o'; # MODIFIER LETTER DOWN TACK
\u030A → '_0'; # COMBINING RING ABOVE
φ → 'p\'; # GREEK SMALL LETTER PHI
ꞎ → 'K`'; # LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT

# Forward direction: recompose the output last (the inverse direction
# applies NFD at this point instead).
::NFC(NFD);