• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1# Override values For Indic_Syllabic_Category
2# Not derivable
3# Initial version based on Unicode 7.0 by Andrew Glass 2014-03-17
4# Updated  for Unicode 10.0 by Andrew Glass 2017-07-25
5# Updated  for Unicode 12.1 by Andrew Glass 2019-05-24
6# Updated  for Unicode 13.0 by Andrew Glass 2020-07-28
7
8# ================================================
9# OVERRIDES TO ASSIGNED VALUES
10# ================================================
11
12# Indic_Syllabic_Category=Bindu
13193A          ; Bindu  # Mn       LIMBU SIGN KEMPHRENG
14AA29          ; Bindu  # Mn       CHAM VOWEL SIGN AA
1510A0D         ; Bindu  # Mn       KHAROSHTHI SIGN DOUBLE RING BELOW
16
17# ================================================
18
19# Indic_Syllabic_Category=Consonant
200840..0858   ; Consonant # Lo  [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN
210F00..0F01   ; Consonant # Lo   [2] TIBETAN SYLLABLE OM..TIBETAN MARK GTER YIG MGO TRUNCATED A
220F04..0F06   ; Consonant # Po   [3] TIBETAN MARK INITIAL YIG MGO MDUN MA..TIBETAN MARK CARET YIG MGO PHUR SHAD MA
2319C1..19C7   ; Consonant # Lo   [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B # Reassigned to avoid clustering with a base consonant
2425CC         ; Consonant # So       DOTTED CIRCLE
25
26# ================================================
27
28# Indic_Syllabic_Category=Consonant_Dead
290F7F         ; Consonant_Dead    # Mc       TIBETAN SIGN RNAM BCAD # reassigned so that visarga will form an independent cluster
30
31# ================================================
32
33# Indic_Syllabic_Category=Consonant_Final
340F35         ; Consonant_Final   # Mn       TIBETAN MARK NGAS BZUNG NYI ZLA
350F37         ; Consonant_Final   # Mn       TIBETAN MARK NGAS BZUNG SGOR RTAGS
360FC6         ; Consonant_Final   # Mn       TIBETAN SYMBOL PADMA GDAN
37
38# ================================================
39
40# Indic_Syllabic_Category=Consonant_Final_Modifier
411C36     ; Consonant_Final_Modifier  # Mn   LEPCHA SIGN RAN
42
43# ================================================
44
45# Indic_Syllabic_Category=Gemination_Mark
4611134         ; Gemination_Mark  # Mn      CHAKMA MAAYYAA
47
48# ================================================
49
50# Indic_Syllabic_Category=Nukta
510F71          ; Nukta            # Mn       TIBETAN VOWEL SIGN AA # Reassigned to get this before an above vowel
5210A38..10A3A  ; Nukta            # Mn   [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW
53
54# ================================================
55
56# Indic_Syllabic_Category=Tone_Mark
57A982         ; Tone_Mark         # Mn       JAVANESE SIGN LAYAR # Not a repha, because it does not reorder to the front of the cluster
581A7B..1A7C   ; Tone_Mark         # Mn   [2] TAI THAM SIGN MAI SAM..TAI THAM SIGN KHUEN-LUE KARAN
591A7F         ; Tone_Mark         # Mn       TAI THAM COMBINING CRYPTOGRAMMIC DOT
60
61# ================================================
62
63# Indic_Syllabic_Category=Vowel_Independent
64AAB1          ; Vowel_Independent # Lo       TAI VIET VOWEL AA
65AABA          ; Vowel_Independent # Lo       TAI VIET VOWEL UA
66AABD          ; Vowel_Independent # Lo       TAI VIET VOWEL AN
67
68# ================================================
69# ================================================
70# VALUES NOT ASSIGNED IN Indic_Syllabic_Category
71# ================================================
72# ================================================
73
74# Indic_Syllabic_Category=Consonant
750800..0815   ; Consonant # Lo   [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF
761800         ; Consonant # Po        MONGOLIAN BIRGA # Reassigned so that legacy Birga + MFVS sequences still work
771807         ; Consonant # Po        MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER
78180A         ; Consonant # Po        MONGOLIAN NIRUGU
791820..1878   ; Consonant # Lo   [88] MONGOLIAN LETTER A..MONGOLIAN LETTER CHA WITH TWO DOTS
801843         ; Consonant # Lm        MONGOLIAN LETTER TODO LONG VOWEL SIGN
812D30..2D67   ; Consonant # Lo   [56] TIFINAGH LETTER YA..TIFINAGH LETTER YO
822D6F         ; Consonant # Lm        TIFINAGH MODIFIER LETTER LABIALIZATION MARK
8310AC0..10AC7 ; Consonant # Lo    [8] MANICHAEAN LETTER ALEPH..MANICHAEAN LETTER WAW
8410AC9..10AE4 ; Consonant # Lo   [28] MANICHAEAN LETTER ZAYIN..MANICHAEAN LETTER TAW
8510D00..10D23 ; Consonant # Lo   [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA
8610E80..10EA9 ; Consonant # Lo   [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET
8710EB0..10EB1 ; Consonant # Lo    [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE
8810F30..10F45 ; Consonant # Lo   [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN
89111DA        ; Consonant # Lo        SHARADA EKAM
90#HIEROGLYPHS moved to new category
91#13000..1342E ; Consonant # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032
92#For the Begin and End segment to be handled fully correctly, the cluster model needs to be modified.
93#13437..13438 ; Consonant # Lo    [2] EGYPTIAN HIEROGLYPH BEGIN SEGMENT..EGYPTIAN HIEROGLYPH END SEGMENT
9416B00..16B2F ; Consonant # Lo   [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU
9516F00..16F4A ; Consonant # Lo   [75] MIAO LETTER PA..MIAO LETTER RTE
9616FE4        ; Consonant # Mn        KHITAN SMALL SCRIPT FILLER
9718B00..18CD5 ; Consonant # Lo  [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5
981BC00..1BC6A ; Consonant # Lo  [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M
991BC70..1BC7C ; Consonant # Lo   [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
1001BC80..1BC88 ; Consonant # Lo    [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL
1011BC90..1BC99 ; Consonant # Lo   [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW
1021E100..1E12C ; Consonant # Lo   [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W
1031E137..1E13D ; Consonant # Lm    [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER
1041E14E        ; Consonant # Lo        NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ
1051E14F        ; Consonant # So        NYIAKENG PUACHUE HMONG CIRCLED CA
1061E2C0..1E2EB ; Consonant # Lo   [44] WANCHO LETTER AA..WANCHO LETTER YIH
1071E900..1E921 ; Consonant # Lu   [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA
1081E922..1E943 ; Consonant # Ll   [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA
1091E94B        ; Consonant # Lm        ADLAM NASALIZATION MARK
110
111# ================================================
112
113# Indic_Syllabic_Category=Consonant_Placeholder
1141880..1884 ; Consonant_Placeholder # Lo   [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI INVERTED UBADAMA
115
116# ================================================
117
118# Indic_Syllabic_Category=Gemination_Mark
11910D27      ; Gemination_Mark # Mn       HANIFI ROHINGYA SIGN TASSI
120
121# ================================================
122
123# Indic_Syllabic_Category=Modifying_Letter
124FE00..FE0F   ; Modifying_Letter  # Mn  [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 # Need to treat them as isolated bases so they don't merge with a cluster in invalid scenarios
12516F50        ; Modifying_Letter  # Lo       MIAO LETTER NASALIZATION
126
127# ================================================
128
129# Indic_Syllabic_Category=Nukta
1300859..085B    ; Nukta            # Mn   [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK
1310F39          ; Nukta            # Mn       TIBETAN MARK TSA -PHRU # NOW IN UNICODE 10.0
1321885..1886    ; Nukta            # Mn   [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA
13318A9          ; Nukta            # Mn       MONGOLIAN LETTER ALI GALI DAGALGA
1341B6B..1B73    ; Nukta            # Mn   [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG
13510AE5..10AE6  ; Nukta            # Mn   [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW
13616F4F         ; Nukta            # Mn       MIAO SIGN CONSONANT MODIFIER BAR
1371BC9D..1BC9E  ; Nukta            # Mn   [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK
1381E944..1E94A  ; Nukta            # Mn   [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA
139
140# ================================================
141
142# Indic_Syllabic_Category=Number
14310D30..10D39 ; Number              # Nd  [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE
14410F51..10F54 ; Number              # No   [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED
1451E140..1E149 ; Number              # Nd  [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE
1461E2F0..1E2F9 ; Number              # Nd  [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE
1471E950..1E959 ; Number              # Nd  [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE
148
149# ================================================
150
151# Indic_Syllabic_Category=Tone_Mark
15207EB..07F3   ; Tone_Mark           # Mn   [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE
15307FD         ; Tone_Mark           # Mn       NKO DANTAYALAN
1540F86..0F87   ; Tone_Mark           # Mn   [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS
15517CF         ; Tone_Mark           # Mn       KHMER SIGN AHSDA
15610D24..10D26 ; Tone_Mark           # Mn   [3] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TANA
15710F46..10F50 ; Tone_Mark           # Mn  [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW
15816B30..16B36 ; Tone_Mark           # Mn   [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM
15916F8F..16F92 ; Tone_Mark           # Mn   [4] MIAO TONE RIGHT..MIAO TONE BELOW
1601E130..1E136 ; Tone_Mark           # Mn   [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D
1611E2EC..1E2EF ; Tone_Mark           # Mn   [4] WANCHO TONE TUP..WANCHO TONE KOINI
162
163# ================================================
164
165# Indic_Syllabic_Category=Virama
1662D7F         ; Virama              # Mn       TIFINAGH CONSONANT JOINER
16713430..13436 ; Virama              # Cf   [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE
168
169# ================================================
170
171# Indic_Syllabic_Category=Vowel_Independent
172AAB1         ; Vowel_Independent   # Lo       TAI VIET VOWEL AA
173AABA         ; Vowel_Independent   # Lo       TAI VIET VOWEL UA
174AABD         ; Vowel_Independent   # Lo       TAI VIET VOWEL AN
175
176# ================================================
177
178# Indic_Syllabic_Category=Vowel_Dependent
1790B55          ; Vowel_Dependent   # Mn       ORIYA SIGN OVERLINE
18010EAB..10EAC  ; Vowel_Dependent   # Mn   [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK
18116F51..16F87  ; Vowel_Dependent   # Mc  [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
182
183# ================================================
184# ================================================
185# PROPERTIES NOT ASSIGNED IN Indic_Syllabic_Category
186# ================================================
187# ================================================
188
189# USE_Syllabic_Category=Hieroglyph
190# 13000..1342E ; Hieroglyph          # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032
191
192# ================================================
193
194# USE_Syllabic_Category=Hieroglyph_Joiner
195# 13430..13436 ; Hieroglyph_Joiner   # Cf   [7] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH OVERLAY MIDDLE
196
197# ================================================
198
199# USE_Syllabic_Category=Hieroglyph_Segment_Begin
200# 13437        ; Hieroglyph_Segment_Begin  # Cf  EGYPTIAN HIEROGLYPH BEGIN SEGMENT
201
202# ================================================
203
204# USE_Syllabic_Category=Hieroglyph_Segment_End
205# 13438        ; Hieroglyph_Segment_End    # Cf  EGYPTIAN HIEROGLYPH END SEGMENT
206
207# ================================================
208
209# eof
210