IndicSyllabicCategory-Additional.txt (15751B)
1 # Override values for Indic_Syllabic_Category 2 # Not derivable 3 # Initial version based on Unicode 7.0 by Andrew Glass 2014-03-17 4 # Updated for Unicode 10.0 by Andrew Glass 2017-07-25 5 # Updated for Unicode 12.1 by Andrew Glass 2019-05-24 6 # Updated for Unicode 13.0 by Andrew Glass 2020-07-28 7 # Updated for Unicode 14.0 by Andrew Glass 2021-09-25 8 # Updated for Unicode 15.0 by Andrew Glass 2022-09-16 9 # Updated for Unicode 15.1 by Andrew Glass 2023-09-14 10 # Updated for Unicode 16.0 by Andrew Glass 2024-09-11 11 12 # ================================================ 13 # OVERRIDES TO ASSIGNED VALUES 14 # ================================================ 15 16 # Indic_Syllabic_Category=Bindu 17 193A ; Bindu # Mn LIMBU SIGN KEMPHRENG 18 AA29 ; Bindu # Mn CHAM VOWEL SIGN AA 19 10A0D ; Bindu # Mn KHAROSHTHI SIGN DOUBLE RING BELOW 20 113CE ; Bindu # Mn TULU-TIGALARI SIGN VIRAMA 21 22 # ================================================ 23 24 # Indic_Syllabic_Category=Consonant 25 19C1..19C7 ; Consonant # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B # Reassigned to avoid clustering with a base consonant 26 25CC ; Consonant # So DOTTED CIRCLE # Reassigned to allow it to cluster as a generic base 27 28 # ================================================ 29 30 # Indic_Syllabic_Category=Consonant_Dead 31 0F7F ; Consonant_Dead # Mc TIBETAN SIGN RNAM BCAD # Reassigned so that visarga can form an independent cluster, but see #19 32 33 # ================================================ 34 35 # Indic_Syllabic_Category=Consonant_With_Stacker 36 11A3A ; Consonant_With_Stacker # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA 37 38 # ================================================ 39 40 # Indic_Syllabic_Category=Consonant_Subjoined 41 11A3B..11A3E ; Consonant_Subjoined # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA 42 43 # ================================================ 44 45 # 
Indic_Syllabic_Category=Consonant_Final_Modifier 46 1C36 ; Consonant_Final_Modifier # Mn LEPCHA SIGN RAN 47 48 # ================================================ 49 50 # Indic_Syllabic_Category=Gemination_Mark 51 11134 ; Gemination_Mark # Mn CHAKMA MAAYYAA 52 53 # ================================================ 54 55 # Indic_Syllabic_Category=Nukta 56 0F71 ; Nukta # Mn TIBETAN VOWEL SIGN AA # Reassigned to get this before an above vowel, but see #22 57 113CF ; Nukta # Mc TULU-TIGALARI SIGN LOOPED VIRAMA 58 59 # ================================================ 60 61 # Indic_Syllabic_Category=Tone_Mark 62 1A7B..1A7C ; Tone_Mark # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN 63 1A7F ; Tone_Mark # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 64 65 # ================================================ 66 67 # Indic_Syllabic_Category=Vowel_Independent 68 AAB1 ; Vowel_Independent # Lo TAI VIET VOWEL AA 69 AABA ; Vowel_Independent # Lo TAI VIET VOWEL UA 70 AABD ; Vowel_Independent # Lo TAI VIET VOWEL AN 71 72 # ================================================ 73 # ================================================ 74 # VALUES NOT ASSIGNED IN Indic_Syllabic_Category 75 # ================================================ 76 # ================================================ 77 78 # Indic_Syllabic_Category=Consonant 79 0800..0815 ; Consonant # Lo [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF 80 0840..0858 ; Consonant # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 81 0F00..0F01 ; Consonant # Lo [2] TIBETAN SYLLABLE OM..TIBETAN MARK GTER YIG MGO TRUNCATED 82 0F04..0F06 ; Consonant # Po [3] TIBETAN MARK INITIAL YIG MGO MDUN MA..TIBETAN MARK CARET YIG MGO PHUR SHAD MA 83 1800 ; Consonant # Po MONGOLIAN BIRGA # Reassigned so that legacy Birga + MFVS sequences still work 84 1807 ; Consonant # Po MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER 85 180A ; Consonant # Po MONGOLIAN NIRUGU 86 1820..1842 ; Consonant # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 87 1843 ; Consonant # 
Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN 88 1844..1878 ; Consonant # Lo [53] MONGOLIAN LETTER TODO E..MONGOLIAN LETTER CHA WITH TWO DOTS 89 2D30..2D67 ; Consonant # Lo [56] TIFINAGH LETTER YA..TIFINAGH LETTER YO 90 2D6F ; Consonant # Lm TIFINAGH MODIFIER LETTER LABIALIZATION MARK 91 10570..1057A ; Consonant # Lo [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA 92 1057C..1058A ; Consonant # Lo [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE 93 1058C..10592 ; Consonant # Lo [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE 94 10594..10595 ; Consonant # Lo [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 95 10597..105A1 ; Consonant # Lo [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA 96 105A3..105B1 ; Consonant # Lo [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE 97 105B3..105B9 ; Consonant # Lo [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE 98 105BB..105BC ; Consonant # Lo [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 99 10AC0..10AC7 ; Consonant # Lo [8] MANICHAEAN LETTER ALEPH..MANICHAEAN LETTER WAW 100 10AC9..10AE4 ; Consonant # Lo [28] MANICHAEAN LETTER ZAYIN..MANICHAEAN LETTER TAW 101 10D00..10D23 ; Consonant # Lo [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA 102 10D4A..10D4F ; Consonant # Lo [6] GARAY VOWEL SIGN A..GARAY SUKUN 103 10D50..10D65 ; Consonant # Lu [22] GARAY CAPITAL LETTER A..GARAY CAPITAL LETTER OLD NA 104 10D70..10D85 ; Consonant # Ll [22] GARAY SMALL LETTER A..GARAY SMALL LETTER OLD NA 105 10D6F ; Consonant # Lm GARAY REDUPLICATION MARK 106 10E80..10EA9 ; Consonant # Lo [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET 107 10EB0..10EB1 ; Consonant # Lo [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE 108 10F30..10F45 ; Consonant # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 109 10F70..10F81 ; Consonant # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 110 111DA ; Consonant # Lo SHARADA EKAM 111 16B00..16B2F ; Consonant # 
Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 112 16F00..16F4A ; Consonant # Lo [75] MIAO LETTER PA..MIAO LETTER RTE 113 16FE4 ; Consonant # Mn KHITAN SMALL SCRIPT FILLER # Avoids Mn pushing this into VOWEL class 114 18B00..18CD5 ; Consonant # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 115 18CFF ; Consonant # Lo KHITAN SMALL SCRIPT CHARACTER-18CFF 116 1BC00..1BC6A ; Consonant # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M 117 1BC70..1BC7C ; Consonant # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK 118 1BC80..1BC88 ; Consonant # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 119 1BC90..1BC99 ; Consonant # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 120 1E100..1E12C ; Consonant # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 121 1E137..1E13D ; Consonant # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 122 1E14E ; Consonant # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 123 1E14F ; Consonant # So NYIAKENG PUACHUE HMONG CIRCLED CA 124 1E290..1E2AD ; Consonant # Lo [30] TOTO LETTER PA..TOTO LETTER A 125 1E2C0..1E2EB ; Consonant # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 126 1E4D0..1E4EA ; Consonant # Lo [27] NAG MUNDARI LETTER O..NAG MUNDARI LETTER ELL 127 1E4EB ; Consonant # Lm NAG MUNDARI SIGN OJOD 128 1E5D0..1E5ED ; Consonant # Lo [30] OL ONAL LETTER O..OL ONAL LETTER EG 129 1E5F0 ; Consonant # Lo OL ONAL SIGN HODDOND 130 1E900..1E921 ; Consonant # Lu [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA 131 1E922..1E943 ; Consonant # Ll [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA 132 1E94B ; Consonant # Lm ADLAM NASALIZATION MARK 133 134 # ================================================ 135 136 # Indic_Syllabic_Category=Consonant_Placeholder 137 1880..1884 ; Consonant_Placeholder # Lo [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI 
INVERTED UBADAMA 138 139 # ================================================ 140 141 # Indic_Syllabic_Category=Gemination_Mark 142 10D27 ; Gemination_Mark # Mn HANIFI ROHINGYA SIGN TASSI 143 144 # ================================================ 145 146 # Indic_Syllabic_Category=Modifying_Letter 147 FE00..FE0F ; Modifying_Letter # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 # Need to treat them as isolated bases so they don't merge with a cluster in invalid scenarios 148 16F50 ; Modifying_Letter # Lo MIAO LETTER NASALIZATION 149 150 # ================================================ 151 152 # Indic_Syllabic_Category=Nukta 153 0859..085B ; Nukta # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 154 0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU # NOW IN UNICODE 10.0 155 1885..1886 ; Nukta # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 156 18A9 ; Nukta # Mn MONGOLIAN LETTER ALI GALI DAGALGA 157 10AE5..10AE6 ; Nukta # Mn [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW 158 16F4F ; Nukta # Mn MIAO SIGN CONSONANT MODIFIER BAR 159 1BC9D..1BC9E ; Nukta # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 160 1E944..1E94A ; Nukta # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA 161 10F82..10F85 ; Nukta # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 162 163 # ================================================ 164 165 # Indic_Syllabic_Category=Number 166 10D30..10D39 ; Number # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE 167 10F51..10F54 ; Number # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 168 16AC0..16AC9 ; Number # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 169 1E140..1E149 ; Number # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 170 1E2F0..1E2F9 ; Number # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 171 1E4F0..1E4F9 ; Number # Nd [10] NAG MUNDARI DIGIT ZERO..NAG MUNDARI DIGIT NINE 172 1E5F1..1E5FA ; Number # 
Nd [10] OL ONAL DIGIT ZERO..OL ONAL DIGIT NINE 173 1E950..1E959 ; Number # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 174 175 # ================================================ 176 177 # Indic_Syllabic_Category=Tone_Mark 178 07EB..07F3 ; Tone_Mark # Mn [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE 179 07FD ; Tone_Mark # Mn NKO DANTAYALAN 180 0F86..0F87 ; Tone_Mark # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS 181 17CF ; Tone_Mark # Mn KHMER SIGN AHSDA 182 10D24..10D26 ; Tone_Mark # Mn [3] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TANA 183 10F46..10F50 ; Tone_Mark # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 184 16B30..16B36 ; Tone_Mark # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM 185 16F8F..16F92 ; Tone_Mark # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 186 1E130..1E136 ; Tone_Mark # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D 187 1E2AE ; Tone_Mark # Mn TOTO SIGN RISING TONE 188 1E2EC..1E2EF ; Tone_Mark # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 189 190 # ================================================ 191 192 # Indic_Syllabic_Category=Virama 193 2D7F ; Virama # Mn TIFINAGH CONSONANT JOINER 194 195 # ================================================ 196 197 # Indic_Syllabic_Category=Vowel_Dependent 198 0B55 ; Vowel_Dependent # Mn ORIYA SIGN OVERLINE 199 10D69..10D6D ; Vowel_Dependent # Mn [5] GARAY VOWEL SIGN E..GARAY CONSONANT NASALIZATION MARK 200 10EAB..10EAC ; Vowel_Dependent # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 201 16F51..16F87 ; Vowel_Dependent # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 202 1E4EC..1E4EF ; Vowel_Dependent # Mn [4] NAG MUNDARI SIGN MUHOR..NAG MUNDARI SIGN SUTUH 203 1E5EE..1E5EF ; Vowel_Dependent # Mn [2] OL ONAL SIGN MU..OL ONAL SIGN IKIR 204 205 # ================================================ 206 207 # Indic_Syllabic_Category=Cantillation_Mark 208 209 1CF8..1CF9 ; Cantillation_Mark # Mn [2] VEDIC TONE 
RING ABOVE..VEDIC TONE DOUBLE RING ABOVE 210 211 # ================================================ 212 213 # Indic_Syllabic_Category=Symbol_Modifier 214 1B6B..1B73 ; Symbol_Modifier # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 215 216 # ================================================ 217 # ================================================ 218 # PROPERTIES NOT ASSIGNED IN Indic_Syllabic_Category 219 # ================================================ 220 # ================================================ 221 222 # USE, Extended_Syllabic_Category=Hieroglyph 223 13000..1342F ; Hieroglyph # Lo [1072] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH V011D 224 1343C..1343F ; Hieroglyph # Cf [4] EGYPTIAN HIEROGLYPH BEGIN ENCLOSURE..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE 225 13441..13446 ; Hieroglyph # Lo [6] EGYPTIAN HIEROGLYPH FULL BLANK..EGYPTIAN HIEROGLYPH WIDE LOST SIGN 226 13460..143FA ; Hieroglyph # Lo [3995] EGYPTIAN HIEROGLYPH-13460..EGYPTIAN HIEROGLYPH-143FA 227 228 # ================================================ 229 230 # USE, Extended_Syllabic_Category=Hieroglyph_Joiner 231 13430..13436 ; Hieroglyph_Joiner # Cf [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE 232 13439..1343B ; Hieroglyph_Joiner # Cf [3] EGYPTIAN HIEROGLYPH INSERT AT MIDDLE..EGYPTIAN HIEROGLYPH INSERT AT BOTTOM 233 234 # ================================================ 235 236 # USE, Extended_Syllabic_Category=Hieroglyph_Mark_Begin 237 005B ; Hieroglyph_Mark_Begin # Ps LEFT SQUARE BRACKET 238 007B ; Hieroglyph_Mark_Begin # Ps LEFT CURLY BRACKET 239 27E6 ; Hieroglyph_Mark_Begin # Ps MATHEMATICAL LEFT WHITE SQUARE BRACKET 240 27E8 ; Hieroglyph_Mark_Begin # Ps MATHEMATICAL LEFT ANGLE BRACKET 241 2E22 ; Hieroglyph_Mark_Begin # Ps TOP LEFT HALF BRACKET 242 2E24 ; Hieroglyph_Mark_Begin # Ps BOTTOM LEFT HALF BRACKET 243 244 # ================================================ 245 246 # USE, Extended_Syllabic_Category=Hieroglyph_Mark_End 247 005D ; 
Hieroglyph_Mark_End # Pe RIGHT SQUARE BRACKET 248 007D ; Hieroglyph_Mark_End # Pe RIGHT CURLY BRACKET 249 27E7 ; Hieroglyph_Mark_End # Pe MATHEMATICAL RIGHT WHITE SQUARE BRACKET 250 27E9 ; Hieroglyph_Mark_End # Pe MATHEMATICAL RIGHT ANGLE BRACKET 251 2E23 ; Hieroglyph_Mark_End # Pe TOP RIGHT HALF BRACKET 252 2E25 ; Hieroglyph_Mark_End # Pe BOTTOM RIGHT HALF BRACKET 253 254 # ================================================ 255 256 # USE, Extended_Syllabic_Category=Hieroglyph_Segment_Begin 257 13437 ; Hieroglyph_Segment_Begin # Cf EGYPTIAN HIEROGLYPH BEGIN SEGMENT 258 259 # ================================================ 260 261 # USE, Extended_Syllabic_Category=Hieroglyph_Segment_End 262 13438 ; Hieroglyph_Segment_End # Cf EGYPTIAN HIEROGLYPH END SEGMENT 263 264 # ================================================ 265 266 # USE, Extended_Syllabic_Category=Hieroglyph_Mirror 267 13440 ; Hieroglyph_Mirror # Mn EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY 268 269 # ================================================ 270 271 # USE, Extended_Syllabic_Category=Hieroglyph_Modifier 272 13447..13455 ; Hieroglyph_Modifier # Mn [15] EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START..EGYPTIAN HIEROGLYPH MODIFIER DAMAGED 273 274 # ================================================ 275 276 # eof