• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# Override values For Indic_Syllabic_Category
2# Not derivable
3# Initial version based on Unicode 7.0 by Andrew Glass 2014-03-17
4# Updated for Unicode 10.0 by Andrew Glass 2017-07-25
5# Updated for Unicode 12.1 by Andrew Glass 2019-05-24
6# Updated for Unicode 13.0 by Andrew Glass 2020-07-28
7# Updated for Unicode 14.0 by Andrew Glass 2021-09-25
8
9# ================================================
10# OVERRIDES TO ASSIGNED VALUES
11# ================================================
12
13# Indic_Syllabic_Category=Bindu
14193A          ; Bindu  # Mn       LIMBU SIGN KEMPHRENG
15AA29          ; Bindu  # Mn       CHAM VOWEL SIGN AA
1610A0D         ; Bindu  # Mn       KHAROSHTHI SIGN DOUBLE RING BELOW
17
18# ================================================
19
20# Indic_Syllabic_Category=Consonant
210840..0858    ; Consonant # Lo  [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN
220F00..0F01    ; Consonant # Lo   [2] TIBETAN SYLLABLE OM..TIBETAN MARK GTER YIG MGO TRUNCATED
230F04..0F06    ; Consonant # Po       TIBETAN MARK INITIAL YIG MGO MDUN MA..TIBETAN MARK CARET YIG MGO PHUR SHAD MA
2419C1..19C7    ; Consonant # Lo   [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B # Reassigned to avoid clustering with a base consonant
2525CC          ; Consonant # So       DOTTED CIRCLE
26
27# ================================================
28
29# Indic_Syllabic_Category=Consonant_Dead
300F7F          ; Consonant_Dead    # Mc       TIBETAN SIGN RNAM BCAD # reassigned so that visarga will form an independent cluster
31
32# ================================================
33
34# Indic_Syllabic_Category=Consonant_Final
350F35          ; Consonant_Final   # Mn       TIBETAN MARK NGAS BZUNG NYI ZLA
360F37          ; Consonant_Final   # Mn       TIBETAN MARK NGAS BZUNG SGOR RTAGS
370FC6          ; Consonant_Final   # Mn       TIBETAN SYMBOL PADMA GDAN
38
39# ================================================
40
41# Indic_Syllabic_Category=Consonant_Final_Modifier
421C36          ; Consonant_Final_Modifier  # Mn   LEPCHA SIGN RAN
43
44# ================================================
45
46# Indic_Syllabic_Category=Gemination_Mark
4711134         ; Gemination_Mark  # Mc      CHAKMA MAAYYAA
48
49# ================================================
50
51# Indic_Syllabic_Category=Nukta
520F71          ; Nukta            # Mn       TIBETAN VOWEL SIGN AA # Reassigned to get this before an above vowel
5310A38..10A3A  ; Nukta            # Mn   [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW
54
55# ================================================
56
57# Indic_Syllabic_Category=Tone_Mark
581A7B..1A7C    ; Tone_Mark         # Mn   [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN
591A7F          ; Tone_Mark         # Mn       TAI THAM COMBINING CRYPTOGRAMMIC DOT
60
61# ================================================
62
63# Indic_Syllabic_Category=Vowel_Independent
64AAB1          ; Vowel_Independent # Lo       TAI VIET VOWEL AA
65AABA          ; Vowel_Independent # Lo       TAI VIET VOWEL UA
66AABD          ; Vowel_Independent # Lo       TAI VIET VOWEL AN
67
68# ================================================
69# ================================================
70# VALUES NOT ASSIGNED IN Indic_Syllabic_Category
71# ================================================
72# ================================================
73
74# Indic_Syllabic_Category=Consonant
750800..0815    ; Consonant # Lo   [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF
761800          ; Consonant # Po        MONGOLIAN BIRGA # Reassigned so that legacy Birga + MFVS sequences still work
771807          ; Consonant # Po        MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER
78180A          ; Consonant # Po        MONGOLIAN NIRUGU
791820..1878    ; Consonant # Lo   [88] MONGOLIAN LETTER A..MONGOLIAN LETTER CHA WITH TWO DOTS
801843          ; Consonant # Lm        MONGOLIAN LETTER TODO LONG VOWEL SIGN
812D30..2D67    ; Consonant # Lo   [56] TIFINAGH LETTER YA..TIFINAGH LETTER YO
822D6F          ; Consonant # Lm        TIFINAGH MODIFIER LETTER LABIALIZATION MARK
8310570..1057A  ; Consonant # Lo   [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA
841057C..1058A  ; Consonant # Lo   [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE
851058C..10592  ; Consonant # Lo    [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE
8610594..10595  ; Consonant # Lo    [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE
8710597..105A1  ; Consonant # Lo   [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA
88105A3..105B1  ; Consonant # Lo   [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE
89105B3..105B9  ; Consonant # Lo    [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE
90105BB..105BC  ; Consonant # Lo    [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE
9110AC0..10AC7  ; Consonant # Lo    [8] MANICHAEAN LETTER ALEPH..MANICHAEAN LETTER WAW
9210AC9..10AE4  ; Consonant # Lo   [28] MANICHAEAN LETTER ZAYIN..MANICHAEAN LETTER TAW
9310D00..10D23  ; Consonant # Lo   [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA
9410E80..10EA9  ; Consonant # Lo   [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET
9510EB0..10EB1  ; Consonant # Lo    [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE
9610F30..10F45  ; Consonant # Lo   [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN
97111DA         ; Consonant # Lo        SHARADA EKAM
98# Hieroglyphs: to be moved to a new category (see USE_Syllabic_Category=Hieroglyph below)
9913000..1342E  ; Consonant # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032
100# For the BEGIN SEGMENT and END SEGMENT controls to be handled fully correctly, the cluster model needs to be modified.
10113437..13438  ; Consonant # Cf    [2] EGYPTIAN HIEROGLYPH BEGIN SEGMENT..EGYPTIAN HIEROGLYPH END SEGMENT
10216B00..16B2F  ; Consonant # Lo   [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU
10316F00..16F4A  ; Consonant # Lo   [75] MIAO LETTER PA..MIAO LETTER RTE
10416FE4         ; Consonant # Mn        KHITAN SMALL SCRIPT FILLER          # Avoids Mn pushing this into VOWEL class
10518B00..18CD5  ; Consonant # Lo  [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5
1061BC00..1BC6A  ; Consonant # Lo  [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M
1071BC70..1BC7C  ; Consonant # Lo   [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
1081BC80..1BC88  ; Consonant # Lo    [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL
1091BC90..1BC99  ; Consonant # Lo   [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW
1101E100..1E12C  ; Consonant # Lo   [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W
1111E137..1E13D  ; Consonant # Lm    [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER
1121E14E         ; Consonant # Lo        NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ
1131E14F         ; Consonant # So        NYIAKENG PUACHUE HMONG CIRCLED CA
1141E290..1E2AD  ; Consonant # Lo   [30] TOTO LETTER PA..TOTO LETTER A
1151E2C0..1E2EB  ; Consonant # Lo   [44] WANCHO LETTER AA..WANCHO LETTER YIH
1161E900..1E921  ; Consonant # Lu   [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA
1171E922..1E943  ; Consonant # Ll   [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA
1181E94B         ; Consonant # Lm        ADLAM NASALIZATION MARK
119
120# ================================================
121
122# Indic_Syllabic_Category=Consonant_Placeholder
1231880..1884 ; Consonant_Placeholder # Lo   [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI INVERTED UBADAMA
124
125# ================================================
126
127# Indic_Syllabic_Category=Gemination_Mark
12810D27         ; Gemination_Mark   # Mn       HANIFI ROHINGYA SIGN TASSI
129
130# ================================================
131
132# Indic_Syllabic_Category=Modifying_Letter
133FE00..FE0F    ; Modifying_Letter  # Mn  [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 # Need to treat them as isolated bases so they don't merge with a cluster in invalid scenarios
13416F50         ; Modifying_Letter  # Lo       MIAO LETTER NASALIZATION
135
136# ================================================
137
138# Indic_Syllabic_Category=Nukta
1390859..085B    ; Nukta            # Mn   [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK
1400F39          ; Nukta            # Mn       TIBETAN MARK TSA -PHRU # NOW IN UNICODE 10.0
1411885..1886    ; Nukta            # Mn   [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA
14218A9          ; Nukta            # Mn       MONGOLIAN LETTER ALI GALI DAGALGA
1431B6B..1B73    ; Nukta            # Mn   [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG
14410AE5..10AE6  ; Nukta            # Mn   [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW
14516F4F         ; Nukta            # Mn       MIAO SIGN CONSONANT MODIFIER BAR
1461BC9D..1BC9E  ; Nukta            # Mn   [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK
1471E944..1E94A  ; Nukta            # Mn   [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA
14810F82..10F85  ; Nukta            # Mn   [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW
149
150# ================================================
151
152# Indic_Syllabic_Category=Number
15310D30..10D39  ; Number              # Nd  [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE
15410F51..10F54  ; Number              # No   [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED
15516AC0..16AC9  ; Number              # Nd  [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE
1561E140..1E149  ; Number              # Nd  [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE
1571E2F0..1E2F9  ; Number              # Nd  [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE
1581E950..1E959  ; Number              # Nd  [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE
159
160# ================================================
161
162# Indic_Syllabic_Category=Tone_Mark
16307EB..07F3    ; Tone_Mark           # Mn   [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE
16407FD          ; Tone_Mark           # Mn       NKO DANTAYALAN
1650F86..0F87    ; Tone_Mark           # Mn   [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS
16617CF          ; Tone_Mark           # Mn       KHMER SIGN AHSDA
16710D24..10D26  ; Tone_Mark           # Mn   [3] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TANA
16810F46..10F50  ; Tone_Mark           # Mn  [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW
16916B30..16B36  ; Tone_Mark           # Mn   [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM
17016F8F..16F92  ; Tone_Mark           # Mn   [4] MIAO TONE RIGHT..MIAO TONE BELOW
1711E130..1E136  ; Tone_Mark           # Mn   [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D
1721E2AE         ; Tone_Mark           # Mn       TOTO SIGN RISING TONE
1731E2EC..1E2EF  ; Tone_Mark           # Mn   [4] WANCHO TONE TUP..WANCHO TONE KOINI
174
175# ================================================
176
177# Indic_Syllabic_Category=Virama
1782D7F          ; Virama              # Mn       TIFINAGH CONSONANT JOINER
17913430..13436  ; Virama              # Cf   [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE
180
181# ================================================
182
183# Indic_Syllabic_Category=Vowel_Independent
184AAB1          ; Vowel_Independent   # Lo       TAI VIET VOWEL AA
185AABA          ; Vowel_Independent   # Lo       TAI VIET VOWEL UA
186AABD          ; Vowel_Independent   # Lo       TAI VIET VOWEL AN
187
188# ================================================
189
190# Indic_Syllabic_Category=Vowel_Dependent
1910B55          ; Vowel_Dependent     # Mn       ORIYA SIGN OVERLINE
19210EAB..10EAC  ; Vowel_Dependent     # Mn   [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK
19316F51..16F87  ; Vowel_Dependent     # Mc  [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
194
195# ================================================
196# ================================================
197# PROPERTIES NOT ASSIGNED IN Indic_Syllabic_Category
198# ================================================
199# ================================================
200
201# USE_Syllabic_Category=Hieroglyph
202# 13000..1342E ; Hieroglyph          # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032
203
204# ================================================
205
206# USE_Syllabic_Category=Hieroglyph_Joiner
207# 13430..13436 ; Hieroglyph_Joiner   # Cf    [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE
208
209# ================================================
210
211# USE_Syllabic_Category=Hieroglyph_Segment_Begin
212# 13437        ; Hieroglyph_Segment_Begin  # Cf  EGYPTIAN HIEROGLYPH BEGIN SEGMENT
213
214# ================================================
215
216# USE_Syllabic_Category=Hieroglyph_Segment_End
217# 13438        ; Hieroglyph_Segment_End    # Cf  EGYPTIAN HIEROGLYPH END SEGMENT
218
219# ================================================
220
221# eof
222