1# Override values For Indic_Syllabic_Category 2# Not derivable 3# Initial version based on Unicode 7.0 by Andrew Glass 2014-03-17 4# Updated for Unicode 10.0 by Andrew Glass 2017-07-25 5# Updated for Unicode 12.1 by Andrew Glass 2019-05-24 6# Updated for Unicode 13.0 by Andrew Glass 2020-07-28 7# Updated for Unicode 14.0 by Andrew Glass 2021-09-25 8 9# ================================================ 10# OVERRIDES TO ASSIGNED VALUES 11# ================================================ 12 13# Indic_Syllabic_Category=Bindu 14193A ; Bindu # Mn LIMBU SIGN KEMPHRENG 15AA29 ; Bindu # Mn CHAM VOWEL SIGN AA 1610A0D ; Bindu # Mn KHAROSHTHI SIGN DOUBLE RING BELOW 17 18# ================================================ 19 20# Indic_Syllabic_Category=Consonant 210840..0858 ; Consonant # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 220F00..0F01 ; Consonant # Lo [2] TIBETAN SYLLABLE OM..TIBETAN MARK GTER YIG MGO TRUNCATED 230F04..0F06 ; Consonant # Po TIBETAN MARK INITIAL YIG MGO MDUN MA..TIBETAN MARK CARET YIG MGO PHUR SHAD MA 2419C1..19C7 ; Consonant # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B # Reassigned to avoid clustering with a base consonant 2525CC ; Consonant # So DOTTED CIRCLE 26 27# ================================================ 28 29# Indic_Syllabic_Category=Consonant_Dead 300F7F ; Consonant_Dead # Mc TIBETAN SIGN RNAM BCAD # reassigned so that visarga will form an independent cluster 31 32# ================================================ 33 34# Indic_Syllabic_Category=Consonant_Final 350F35 ; Consonant_Final # Mn TIBETAN MARK NGAS BZUNG NYI ZLA 360F37 ; Consonant_Final # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS 370FC6 ; Consonant_Final # Mn TIBETAN SYMBOL PADMA GDAN 38 39# ================================================ 40 41# Indic_Syllabic_Category=Consonant_Final_Modifier 421C36 ; Consonant_Final_Modifier # Mn LEPCHA SIGN RAN 43 44# ================================================ 45 46# Indic_Syllabic_Category=Gemination_Mark 4711134 ; 
Gemination_Mark # Mc CHAKMA MAAYYAA 48 49# ================================================ 50 51# Indic_Syllabic_Category=Nukta 520F71 ; Nukta # Mn TIBETAN VOWEL SIGN AA # Reassigned to get this before an above vowel 5310A38..10A3A ; Nukta # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW 54 55# ================================================ 56 57# Indic_Syllabic_Category=Tone_Mark 581A7B..1A7C ; Tone_Mark # Mn [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN 591A7F ; Tone_Mark # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 60 61# ================================================ 62 63# Indic_Syllabic_Category=Vowel_Independent 64AAB1 ; Vowel_Independent # Lo TAI VIET VOWEL AA 65AABA ; Vowel_Independent # Lo TAI VIET VOWEL UA 66AABD ; Vowel_Independent # Lo TAI VIET VOWEL AN 67 68# ================================================ 69# ================================================ 70# VALUES NOT ASSIGNED IN Indic_Syllabic_Category 71# ================================================ 72# ================================================ 73 74# Indic_Syllabic_Category=Consonant 750800..0815 ; Consonant # Lo [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF 761800 ; Consonant # Po MONGOLIAN BIRGA # Reassigned so that legacy Birga + MFVS sequences still work 771807 ; Consonant # Po MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER 78180A ; Consonant # Po MONGOLIAN NIRUGU 791820..1878 ; Consonant # Lo [89] MONGOLIAN LETTER A..MONGOLIAN LETTER CHA WITH TWO DOTS 801843 ; Consonant # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN 812D30..2D67 ; Consonant # Lo [56] TIFINAGH LETTER YA..TIFINAGH LETTER YO 822D6F ; Consonant # Lm TIFINAGH MODIFIER LETTER LABIALIZATION MARK 8310570..1057A ; Consonant # Lo [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA 841057C..1058A ; Consonant # Lo [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE 851058C..10592 ; Consonant # Lo [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE 8610594..10595 ; Consonant # Lo 
[2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 8710597..105A1 ; Consonant # Lo [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA 88105A3..105B1 ; Consonant # Lo [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE 89105B3..105B9 ; Consonant # Lo [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE 90105BB..105BC ; Consonant # Lo [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 9110AC0..10AC7 ; Consonant # Lo [8] MANICHAEAN LETTER ALEPH..MANICHAEAN LETTER WAW 9210AC9..10AE4 ; Consonant # Lo [28] MANICHAEAN LETTER ZAYIN..MANICHAEAN LETTER TAW 9310D00..10D23 ; Consonant # Lo [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA 9410E80..10EA9 ; Consonant # Lo [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET 9510EB0..10EB1 ; Consonant # Lo [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE 9610F30..10F45 ; Consonant # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 97111DA ; Consonant # Lo SHARADA EKAM 98#HIEROGLYPHS to be moved to new category 9913000..1342E ; Consonant # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 100#For the Begin and End segment to be handled fully correctly, the cluster model needs to be modified. 
10113437..13438 ; Consonant # Cf [2] EGYPTIAN HIEROGLYPH BEGIN SEGMENT..EGYPTIAN HIEROGLYPH END SEGMENT 10216B00..16B2F ; Consonant # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 10316F00..16F4A ; Consonant # Lo [75] MIAO LETTER PA..MIAO LETTER RTE 10416FE4 ; Consonant # Mn KHITAN SMALL SCRIPT FILLER # Avoids Mn pushing this into VOWEL class 10518B00..18CD5 ; Consonant # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 1061BC00..1BC6A ; Consonant # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M 1071BC70..1BC7C ; Consonant # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK 1081BC80..1BC88 ; Consonant # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1091BC90..1BC99 ; Consonant # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1101E100..1E12C ; Consonant # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1111E137..1E13D ; Consonant # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1121E14E ; Consonant # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1131E14F ; Consonant # So NYIAKENG PUACHUE HMONG CIRCLED CA 1141E290..1E2AD ; Consonant # Lo [30] TOTO LETTER PA..TOTO LETTER A 1151E2C0..1E2EB ; Consonant # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1161E900..1E921 ; Consonant # Lu [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA 1171E922..1E943 ; Consonant # Ll [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA 1181E94B ; Consonant # Lm ADLAM NASALIZATION MARK 119 120# ================================================ 121 122# Indic_Syllabic_Category=Consonant_Placeholder 1231880..1884 ; Consonant_Placeholder # Lo [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI INVERTED UBADAMA 124 125# ================================================ 126 127# Indic_Syllabic_Category=Gemination_Mark 12810D27 ; Gemination_Mark # Mn HANIFI ROHINGYA SIGN TASSI 129 130# 
================================================ 131 132# Indic_Syllabic_Category=Modifying_Letter 133FE00..FE0F ; Modifying_Letter # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 # Need to treat them as isolated bases so they don't merge with a cluster in invalid scenarios 13416F50 ; Modifying_Letter # Lo MIAO LETTER NASALIZATION 135 136# ================================================ 137 138# Indic_Syllabic_Category=Nukta 1390859..085B ; Nukta # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 1400F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU # NOW IN UNICODE 10.0 1411885..1886 ; Nukta # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 14218A9 ; Nukta # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1431B6B..1B73 ; Nukta # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 14410AE5..10AE6 ; Nukta # Mn [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW 14516F4F ; Nukta # Mn MIAO SIGN CONSONANT MODIFIER BAR 1461BC9D..1BC9E ; Nukta # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1471E944..1E94A ; Nukta # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA 14810F82..10F85 ; Nukta # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 149 150# ================================================ 151 152# Indic_Syllabic_Category=Number 15310D30..10D39 ; Number # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE 15410F51..10F54 ; Number # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 15516AC0..16AC9 ; Number # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 1561E140..1E149 ; Number # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1571E2F0..1E2F9 ; Number # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1581E950..1E959 ; Number # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 159 160# ================================================ 161 162# Indic_Syllabic_Category=Tone_Mark 16307EB..07F3 ; Tone_Mark # Mn [9] NKO 
COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE 16407FD ; Tone_Mark # Mn NKO DANTAYALAN 1650F86..0F87 ; Tone_Mark # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS 16617CF ; Tone_Mark # Mn KHMER SIGN AHSDA 16710D24..10D26 ; Tone_Mark # Mn [3] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TANA 16810F46..10F50 ; Tone_Mark # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 16916B30..16B36 ; Tone_Mark # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM 17016F8F..16F92 ; Tone_Mark # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 1711E130..1E136 ; Tone_Mark # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D 1721E2AE ; Tone_Mark # Mn TOTO SIGN RISING TONE 1731E2EC..1E2EF ; Tone_Mark # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 174 175# ================================================ 176 177# Indic_Syllabic_Category=Virama 1782D7F ; Virama # Mn TIFINAGH CONSONANT JOINER 17913430..13436 ; Virama # Cf [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE 180 181# ================================================ 182 183# Indic_Syllabic_Category=Vowel_Independent 184AAB1 ; Vowel_Independent # Lo TAI VIET VOWEL AA 185AABA ; Vowel_Independent # Lo TAI VIET VOWEL UA 186AABD ; Vowel_Independent # Lo TAI VIET VOWEL AN 187 188# ================================================ 189 190# Indic_Syllabic_Category=Vowel_Dependent 1910B55 ; Vowel_Dependent # Mn ORIYA SIGN OVERLINE 19210EAB..10EAC ; Vowel_Dependent # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 19316F51..16F87 ; Vowel_Dependent # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI 194 195# ================================================ 196# ================================================ 197# PROPERTIES NOT ASSIGNED IN Indic_Syllabic_Category 198# ================================================ 199# ================================================ 200 201# USE_Syllabic_Category=Hieroglyph 202# 13000..1342E ; Hieroglyph 
# Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 203 204# ================================================ 205 206# USE_Syllabic_Category=Hieroglyph_Joiner 207# 13430..13436 ; Hieroglyph_Joiner # Cf [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE 208 209# ================================================ 210 211# USE_Syllabic_Category=Hieroglyph_Segment_Begin 212# 13437 ; Hieroglyph_Segment_Begin # Cf EGYPTIAN HIEROGLYPH BEGIN SEGMENT 213 214# ================================================ 215 216# USE_Syllabic_Category=Hieroglyph_Segment_End 217# 13438 ; Hieroglyph_Segment_End # Cf EGYPTIAN HIEROGLYPH END SEGMENT 218 219# ================================================ 220 221# eof 222