• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
# -*- coding: utf-8 -*-
#
# NOTE: This file was auto-generated with MetaTools/buildUCD.py.
# Source: https://unicode.org/Public/UNIDATA/Blocks.txt
# License: http://unicode.org/copyright.html#License
#
# Blocks-14.0.0.txt
# Date: 2021-01-22, 23:29:00 GMT [KW]
# © 2021 Unicode®, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# Unicode Character Database
# For documentation, see http://www.unicode.org/reports/tr44/
#
# Format:
# Start Code..End Code; Block Name
17
18
# Start code points of the Unicode blocks from Blocks-14.0.0.txt, in strictly
# ascending order. The trailing comment on each entry gives that block's
# inclusive end code point and its name; entries are listed in the same order
# as the names in VALUES. Unassigned gaps between blocks appear explicitly as
# "No_Block" entries, so consecutive entries tile 0x0000..0x10FFFF.
#
# This is generated data (see MetaTools/buildUCD.py in the file header):
# regenerate it rather than editing individual entries by hand.
RANGES = [
    0x0000,  # .. 0x007F ; Basic Latin
    0x0080,  # .. 0x00FF ; Latin-1 Supplement
    0x0100,  # .. 0x017F ; Latin Extended-A
    0x0180,  # .. 0x024F ; Latin Extended-B
    0x0250,  # .. 0x02AF ; IPA Extensions
    0x02B0,  # .. 0x02FF ; Spacing Modifier Letters
    0x0300,  # .. 0x036F ; Combining Diacritical Marks
    0x0370,  # .. 0x03FF ; Greek and Coptic
    0x0400,  # .. 0x04FF ; Cyrillic
    0x0500,  # .. 0x052F ; Cyrillic Supplement
    0x0530,  # .. 0x058F ; Armenian
    0x0590,  # .. 0x05FF ; Hebrew
    0x0600,  # .. 0x06FF ; Arabic
    0x0700,  # .. 0x074F ; Syriac
    0x0750,  # .. 0x077F ; Arabic Supplement
    0x0780,  # .. 0x07BF ; Thaana
    0x07C0,  # .. 0x07FF ; NKo
    0x0800,  # .. 0x083F ; Samaritan
    0x0840,  # .. 0x085F ; Mandaic
    0x0860,  # .. 0x086F ; Syriac Supplement
    0x0870,  # .. 0x089F ; Arabic Extended-B
    0x08A0,  # .. 0x08FF ; Arabic Extended-A
    0x0900,  # .. 0x097F ; Devanagari
    0x0980,  # .. 0x09FF ; Bengali
    0x0A00,  # .. 0x0A7F ; Gurmukhi
    0x0A80,  # .. 0x0AFF ; Gujarati
    0x0B00,  # .. 0x0B7F ; Oriya
    0x0B80,  # .. 0x0BFF ; Tamil
    0x0C00,  # .. 0x0C7F ; Telugu
    0x0C80,  # .. 0x0CFF ; Kannada
    0x0D00,  # .. 0x0D7F ; Malayalam
    0x0D80,  # .. 0x0DFF ; Sinhala
    0x0E00,  # .. 0x0E7F ; Thai
    0x0E80,  # .. 0x0EFF ; Lao
    0x0F00,  # .. 0x0FFF ; Tibetan
    0x1000,  # .. 0x109F ; Myanmar
    0x10A0,  # .. 0x10FF ; Georgian
    0x1100,  # .. 0x11FF ; Hangul Jamo
    0x1200,  # .. 0x137F ; Ethiopic
    0x1380,  # .. 0x139F ; Ethiopic Supplement
    0x13A0,  # .. 0x13FF ; Cherokee
    0x1400,  # .. 0x167F ; Unified Canadian Aboriginal Syllabics
    0x1680,  # .. 0x169F ; Ogham
    0x16A0,  # .. 0x16FF ; Runic
    0x1700,  # .. 0x171F ; Tagalog
    0x1720,  # .. 0x173F ; Hanunoo
    0x1740,  # .. 0x175F ; Buhid
    0x1760,  # .. 0x177F ; Tagbanwa
    0x1780,  # .. 0x17FF ; Khmer
    0x1800,  # .. 0x18AF ; Mongolian
    0x18B0,  # .. 0x18FF ; Unified Canadian Aboriginal Syllabics Extended
    0x1900,  # .. 0x194F ; Limbu
    0x1950,  # .. 0x197F ; Tai Le
    0x1980,  # .. 0x19DF ; New Tai Lue
    0x19E0,  # .. 0x19FF ; Khmer Symbols
    0x1A00,  # .. 0x1A1F ; Buginese
    0x1A20,  # .. 0x1AAF ; Tai Tham
    0x1AB0,  # .. 0x1AFF ; Combining Diacritical Marks Extended
    0x1B00,  # .. 0x1B7F ; Balinese
    0x1B80,  # .. 0x1BBF ; Sundanese
    0x1BC0,  # .. 0x1BFF ; Batak
    0x1C00,  # .. 0x1C4F ; Lepcha
    0x1C50,  # .. 0x1C7F ; Ol Chiki
    0x1C80,  # .. 0x1C8F ; Cyrillic Extended-C
    0x1C90,  # .. 0x1CBF ; Georgian Extended
    0x1CC0,  # .. 0x1CCF ; Sundanese Supplement
    0x1CD0,  # .. 0x1CFF ; Vedic Extensions
    0x1D00,  # .. 0x1D7F ; Phonetic Extensions
    0x1D80,  # .. 0x1DBF ; Phonetic Extensions Supplement
    0x1DC0,  # .. 0x1DFF ; Combining Diacritical Marks Supplement
    0x1E00,  # .. 0x1EFF ; Latin Extended Additional
    0x1F00,  # .. 0x1FFF ; Greek Extended
    0x2000,  # .. 0x206F ; General Punctuation
    0x2070,  # .. 0x209F ; Superscripts and Subscripts
    0x20A0,  # .. 0x20CF ; Currency Symbols
    0x20D0,  # .. 0x20FF ; Combining Diacritical Marks for Symbols
    0x2100,  # .. 0x214F ; Letterlike Symbols
    0x2150,  # .. 0x218F ; Number Forms
    0x2190,  # .. 0x21FF ; Arrows
    0x2200,  # .. 0x22FF ; Mathematical Operators
    0x2300,  # .. 0x23FF ; Miscellaneous Technical
    0x2400,  # .. 0x243F ; Control Pictures
    0x2440,  # .. 0x245F ; Optical Character Recognition
    0x2460,  # .. 0x24FF ; Enclosed Alphanumerics
    0x2500,  # .. 0x257F ; Box Drawing
    0x2580,  # .. 0x259F ; Block Elements
    0x25A0,  # .. 0x25FF ; Geometric Shapes
    0x2600,  # .. 0x26FF ; Miscellaneous Symbols
    0x2700,  # .. 0x27BF ; Dingbats
    0x27C0,  # .. 0x27EF ; Miscellaneous Mathematical Symbols-A
    0x27F0,  # .. 0x27FF ; Supplemental Arrows-A
    0x2800,  # .. 0x28FF ; Braille Patterns
    0x2900,  # .. 0x297F ; Supplemental Arrows-B
    0x2980,  # .. 0x29FF ; Miscellaneous Mathematical Symbols-B
    0x2A00,  # .. 0x2AFF ; Supplemental Mathematical Operators
    0x2B00,  # .. 0x2BFF ; Miscellaneous Symbols and Arrows
    0x2C00,  # .. 0x2C5F ; Glagolitic
    0x2C60,  # .. 0x2C7F ; Latin Extended-C
    0x2C80,  # .. 0x2CFF ; Coptic
    0x2D00,  # .. 0x2D2F ; Georgian Supplement
    0x2D30,  # .. 0x2D7F ; Tifinagh
    0x2D80,  # .. 0x2DDF ; Ethiopic Extended
    0x2DE0,  # .. 0x2DFF ; Cyrillic Extended-A
    0x2E00,  # .. 0x2E7F ; Supplemental Punctuation
    0x2E80,  # .. 0x2EFF ; CJK Radicals Supplement
    0x2F00,  # .. 0x2FDF ; Kangxi Radicals
    0x2FE0,  # .. 0x2FEF ; No_Block
    0x2FF0,  # .. 0x2FFF ; Ideographic Description Characters
    0x3000,  # .. 0x303F ; CJK Symbols and Punctuation
    0x3040,  # .. 0x309F ; Hiragana
    0x30A0,  # .. 0x30FF ; Katakana
    0x3100,  # .. 0x312F ; Bopomofo
    0x3130,  # .. 0x318F ; Hangul Compatibility Jamo
    0x3190,  # .. 0x319F ; Kanbun
    0x31A0,  # .. 0x31BF ; Bopomofo Extended
    0x31C0,  # .. 0x31EF ; CJK Strokes
    0x31F0,  # .. 0x31FF ; Katakana Phonetic Extensions
    0x3200,  # .. 0x32FF ; Enclosed CJK Letters and Months
    0x3300,  # .. 0x33FF ; CJK Compatibility
    0x3400,  # .. 0x4DBF ; CJK Unified Ideographs Extension A
    0x4DC0,  # .. 0x4DFF ; Yijing Hexagram Symbols
    0x4E00,  # .. 0x9FFF ; CJK Unified Ideographs
    0xA000,  # .. 0xA48F ; Yi Syllables
    0xA490,  # .. 0xA4CF ; Yi Radicals
    0xA4D0,  # .. 0xA4FF ; Lisu
    0xA500,  # .. 0xA63F ; Vai
    0xA640,  # .. 0xA69F ; Cyrillic Extended-B
    0xA6A0,  # .. 0xA6FF ; Bamum
    0xA700,  # .. 0xA71F ; Modifier Tone Letters
    0xA720,  # .. 0xA7FF ; Latin Extended-D
    0xA800,  # .. 0xA82F ; Syloti Nagri
    0xA830,  # .. 0xA83F ; Common Indic Number Forms
    0xA840,  # .. 0xA87F ; Phags-pa
    0xA880,  # .. 0xA8DF ; Saurashtra
    0xA8E0,  # .. 0xA8FF ; Devanagari Extended
    0xA900,  # .. 0xA92F ; Kayah Li
    0xA930,  # .. 0xA95F ; Rejang
    0xA960,  # .. 0xA97F ; Hangul Jamo Extended-A
    0xA980,  # .. 0xA9DF ; Javanese
    0xA9E0,  # .. 0xA9FF ; Myanmar Extended-B
    0xAA00,  # .. 0xAA5F ; Cham
    0xAA60,  # .. 0xAA7F ; Myanmar Extended-A
    0xAA80,  # .. 0xAADF ; Tai Viet
    0xAAE0,  # .. 0xAAFF ; Meetei Mayek Extensions
    0xAB00,  # .. 0xAB2F ; Ethiopic Extended-A
    0xAB30,  # .. 0xAB6F ; Latin Extended-E
    0xAB70,  # .. 0xABBF ; Cherokee Supplement
    0xABC0,  # .. 0xABFF ; Meetei Mayek
    0xAC00,  # .. 0xD7AF ; Hangul Syllables
    0xD7B0,  # .. 0xD7FF ; Hangul Jamo Extended-B
    0xD800,  # .. 0xDB7F ; High Surrogates
    0xDB80,  # .. 0xDBFF ; High Private Use Surrogates
    0xDC00,  # .. 0xDFFF ; Low Surrogates
    0xE000,  # .. 0xF8FF ; Private Use Area
    0xF900,  # .. 0xFAFF ; CJK Compatibility Ideographs
    0xFB00,  # .. 0xFB4F ; Alphabetic Presentation Forms
    0xFB50,  # .. 0xFDFF ; Arabic Presentation Forms-A
    0xFE00,  # .. 0xFE0F ; Variation Selectors
    0xFE10,  # .. 0xFE1F ; Vertical Forms
    0xFE20,  # .. 0xFE2F ; Combining Half Marks
    0xFE30,  # .. 0xFE4F ; CJK Compatibility Forms
    0xFE50,  # .. 0xFE6F ; Small Form Variants
    0xFE70,  # .. 0xFEFF ; Arabic Presentation Forms-B
    0xFF00,  # .. 0xFFEF ; Halfwidth and Fullwidth Forms
    0xFFF0,  # .. 0xFFFF ; Specials
    0x10000,  # .. 0x1007F ; Linear B Syllabary
    0x10080,  # .. 0x100FF ; Linear B Ideograms
    0x10100,  # .. 0x1013F ; Aegean Numbers
    0x10140,  # .. 0x1018F ; Ancient Greek Numbers
    0x10190,  # .. 0x101CF ; Ancient Symbols
    0x101D0,  # .. 0x101FF ; Phaistos Disc
    0x10200,  # .. 0x1027F ; No_Block
    0x10280,  # .. 0x1029F ; Lycian
    0x102A0,  # .. 0x102DF ; Carian
    0x102E0,  # .. 0x102FF ; Coptic Epact Numbers
    0x10300,  # .. 0x1032F ; Old Italic
    0x10330,  # .. 0x1034F ; Gothic
    0x10350,  # .. 0x1037F ; Old Permic
    0x10380,  # .. 0x1039F ; Ugaritic
    0x103A0,  # .. 0x103DF ; Old Persian
    0x103E0,  # .. 0x103FF ; No_Block
    0x10400,  # .. 0x1044F ; Deseret
    0x10450,  # .. 0x1047F ; Shavian
    0x10480,  # .. 0x104AF ; Osmanya
    0x104B0,  # .. 0x104FF ; Osage
    0x10500,  # .. 0x1052F ; Elbasan
    0x10530,  # .. 0x1056F ; Caucasian Albanian
    0x10570,  # .. 0x105BF ; Vithkuqi
    0x105C0,  # .. 0x105FF ; No_Block
    0x10600,  # .. 0x1077F ; Linear A
    0x10780,  # .. 0x107BF ; Latin Extended-F
    0x107C0,  # .. 0x107FF ; No_Block
    0x10800,  # .. 0x1083F ; Cypriot Syllabary
    0x10840,  # .. 0x1085F ; Imperial Aramaic
    0x10860,  # .. 0x1087F ; Palmyrene
    0x10880,  # .. 0x108AF ; Nabataean
    0x108B0,  # .. 0x108DF ; No_Block
    0x108E0,  # .. 0x108FF ; Hatran
    0x10900,  # .. 0x1091F ; Phoenician
    0x10920,  # .. 0x1093F ; Lydian
    0x10940,  # .. 0x1097F ; No_Block
    0x10980,  # .. 0x1099F ; Meroitic Hieroglyphs
    0x109A0,  # .. 0x109FF ; Meroitic Cursive
    0x10A00,  # .. 0x10A5F ; Kharoshthi
    0x10A60,  # .. 0x10A7F ; Old South Arabian
    0x10A80,  # .. 0x10A9F ; Old North Arabian
    0x10AA0,  # .. 0x10ABF ; No_Block
    0x10AC0,  # .. 0x10AFF ; Manichaean
    0x10B00,  # .. 0x10B3F ; Avestan
    0x10B40,  # .. 0x10B5F ; Inscriptional Parthian
    0x10B60,  # .. 0x10B7F ; Inscriptional Pahlavi
    0x10B80,  # .. 0x10BAF ; Psalter Pahlavi
    0x10BB0,  # .. 0x10BFF ; No_Block
    0x10C00,  # .. 0x10C4F ; Old Turkic
    0x10C50,  # .. 0x10C7F ; No_Block
    0x10C80,  # .. 0x10CFF ; Old Hungarian
    0x10D00,  # .. 0x10D3F ; Hanifi Rohingya
    0x10D40,  # .. 0x10E5F ; No_Block
    0x10E60,  # .. 0x10E7F ; Rumi Numeral Symbols
    0x10E80,  # .. 0x10EBF ; Yezidi
    0x10EC0,  # .. 0x10EFF ; No_Block
    0x10F00,  # .. 0x10F2F ; Old Sogdian
    0x10F30,  # .. 0x10F6F ; Sogdian
    0x10F70,  # .. 0x10FAF ; Old Uyghur
    0x10FB0,  # .. 0x10FDF ; Chorasmian
    0x10FE0,  # .. 0x10FFF ; Elymaic
    0x11000,  # .. 0x1107F ; Brahmi
    0x11080,  # .. 0x110CF ; Kaithi
    0x110D0,  # .. 0x110FF ; Sora Sompeng
    0x11100,  # .. 0x1114F ; Chakma
    0x11150,  # .. 0x1117F ; Mahajani
    0x11180,  # .. 0x111DF ; Sharada
    0x111E0,  # .. 0x111FF ; Sinhala Archaic Numbers
    0x11200,  # .. 0x1124F ; Khojki
    0x11250,  # .. 0x1127F ; No_Block
    0x11280,  # .. 0x112AF ; Multani
    0x112B0,  # .. 0x112FF ; Khudawadi
    0x11300,  # .. 0x1137F ; Grantha
    0x11380,  # .. 0x113FF ; No_Block
    0x11400,  # .. 0x1147F ; Newa
    0x11480,  # .. 0x114DF ; Tirhuta
    0x114E0,  # .. 0x1157F ; No_Block
    0x11580,  # .. 0x115FF ; Siddham
    0x11600,  # .. 0x1165F ; Modi
    0x11660,  # .. 0x1167F ; Mongolian Supplement
    0x11680,  # .. 0x116CF ; Takri
    0x116D0,  # .. 0x116FF ; No_Block
    0x11700,  # .. 0x1174F ; Ahom
    0x11750,  # .. 0x117FF ; No_Block
    0x11800,  # .. 0x1184F ; Dogra
    0x11850,  # .. 0x1189F ; No_Block
    0x118A0,  # .. 0x118FF ; Warang Citi
    0x11900,  # .. 0x1195F ; Dives Akuru
    0x11960,  # .. 0x1199F ; No_Block
    0x119A0,  # .. 0x119FF ; Nandinagari
    0x11A00,  # .. 0x11A4F ; Zanabazar Square
    0x11A50,  # .. 0x11AAF ; Soyombo
    0x11AB0,  # .. 0x11ABF ; Unified Canadian Aboriginal Syllabics Extended-A
    0x11AC0,  # .. 0x11AFF ; Pau Cin Hau
    0x11B00,  # .. 0x11BFF ; No_Block
    0x11C00,  # .. 0x11C6F ; Bhaiksuki
    0x11C70,  # .. 0x11CBF ; Marchen
    0x11CC0,  # .. 0x11CFF ; No_Block
    0x11D00,  # .. 0x11D5F ; Masaram Gondi
    0x11D60,  # .. 0x11DAF ; Gunjala Gondi
    0x11DB0,  # .. 0x11EDF ; No_Block
    0x11EE0,  # .. 0x11EFF ; Makasar
    0x11F00,  # .. 0x11FAF ; No_Block
    0x11FB0,  # .. 0x11FBF ; Lisu Supplement
    0x11FC0,  # .. 0x11FFF ; Tamil Supplement
    0x12000,  # .. 0x123FF ; Cuneiform
    0x12400,  # .. 0x1247F ; Cuneiform Numbers and Punctuation
    0x12480,  # .. 0x1254F ; Early Dynastic Cuneiform
    0x12550,  # .. 0x12F8F ; No_Block
    0x12F90,  # .. 0x12FFF ; Cypro-Minoan
    0x13000,  # .. 0x1342F ; Egyptian Hieroglyphs
    0x13430,  # .. 0x1343F ; Egyptian Hieroglyph Format Controls
    0x13440,  # .. 0x143FF ; No_Block
    0x14400,  # .. 0x1467F ; Anatolian Hieroglyphs
    0x14680,  # .. 0x167FF ; No_Block
    0x16800,  # .. 0x16A3F ; Bamum Supplement
    0x16A40,  # .. 0x16A6F ; Mro
    0x16A70,  # .. 0x16ACF ; Tangsa
    0x16AD0,  # .. 0x16AFF ; Bassa Vah
    0x16B00,  # .. 0x16B8F ; Pahawh Hmong
    0x16B90,  # .. 0x16E3F ; No_Block
    0x16E40,  # .. 0x16E9F ; Medefaidrin
    0x16EA0,  # .. 0x16EFF ; No_Block
    0x16F00,  # .. 0x16F9F ; Miao
    0x16FA0,  # .. 0x16FDF ; No_Block
    0x16FE0,  # .. 0x16FFF ; Ideographic Symbols and Punctuation
    0x17000,  # .. 0x187FF ; Tangut
    0x18800,  # .. 0x18AFF ; Tangut Components
    0x18B00,  # .. 0x18CFF ; Khitan Small Script
    0x18D00,  # .. 0x18D7F ; Tangut Supplement
    0x18D80,  # .. 0x1AFEF ; No_Block
    0x1AFF0,  # .. 0x1AFFF ; Kana Extended-B
    0x1B000,  # .. 0x1B0FF ; Kana Supplement
    0x1B100,  # .. 0x1B12F ; Kana Extended-A
    0x1B130,  # .. 0x1B16F ; Small Kana Extension
    0x1B170,  # .. 0x1B2FF ; Nushu
    0x1B300,  # .. 0x1BBFF ; No_Block
    0x1BC00,  # .. 0x1BC9F ; Duployan
    0x1BCA0,  # .. 0x1BCAF ; Shorthand Format Controls
    0x1BCB0,  # .. 0x1CEFF ; No_Block
    0x1CF00,  # .. 0x1CFCF ; Znamenny Musical Notation
    0x1CFD0,  # .. 0x1CFFF ; No_Block
    0x1D000,  # .. 0x1D0FF ; Byzantine Musical Symbols
    0x1D100,  # .. 0x1D1FF ; Musical Symbols
    0x1D200,  # .. 0x1D24F ; Ancient Greek Musical Notation
    0x1D250,  # .. 0x1D2DF ; No_Block
    0x1D2E0,  # .. 0x1D2FF ; Mayan Numerals
    0x1D300,  # .. 0x1D35F ; Tai Xuan Jing Symbols
    0x1D360,  # .. 0x1D37F ; Counting Rod Numerals
    0x1D380,  # .. 0x1D3FF ; No_Block
    0x1D400,  # .. 0x1D7FF ; Mathematical Alphanumeric Symbols
    0x1D800,  # .. 0x1DAAF ; Sutton SignWriting
    0x1DAB0,  # .. 0x1DEFF ; No_Block
    0x1DF00,  # .. 0x1DFFF ; Latin Extended-G
    0x1E000,  # .. 0x1E02F ; Glagolitic Supplement
    0x1E030,  # .. 0x1E0FF ; No_Block
    0x1E100,  # .. 0x1E14F ; Nyiakeng Puachue Hmong
    0x1E150,  # .. 0x1E28F ; No_Block
    0x1E290,  # .. 0x1E2BF ; Toto
    0x1E2C0,  # .. 0x1E2FF ; Wancho
    0x1E300,  # .. 0x1E7DF ; No_Block
    0x1E7E0,  # .. 0x1E7FF ; Ethiopic Extended-B
    0x1E800,  # .. 0x1E8DF ; Mende Kikakui
    0x1E8E0,  # .. 0x1E8FF ; No_Block
    0x1E900,  # .. 0x1E95F ; Adlam
    0x1E960,  # .. 0x1EC6F ; No_Block
    0x1EC70,  # .. 0x1ECBF ; Indic Siyaq Numbers
    0x1ECC0,  # .. 0x1ECFF ; No_Block
    0x1ED00,  # .. 0x1ED4F ; Ottoman Siyaq Numbers
    0x1ED50,  # .. 0x1EDFF ; No_Block
    0x1EE00,  # .. 0x1EEFF ; Arabic Mathematical Alphabetic Symbols
    0x1EF00,  # .. 0x1EFFF ; No_Block
    0x1F000,  # .. 0x1F02F ; Mahjong Tiles
    0x1F030,  # .. 0x1F09F ; Domino Tiles
    0x1F0A0,  # .. 0x1F0FF ; Playing Cards
    0x1F100,  # .. 0x1F1FF ; Enclosed Alphanumeric Supplement
    0x1F200,  # .. 0x1F2FF ; Enclosed Ideographic Supplement
    0x1F300,  # .. 0x1F5FF ; Miscellaneous Symbols and Pictographs
    0x1F600,  # .. 0x1F64F ; Emoticons
    0x1F650,  # .. 0x1F67F ; Ornamental Dingbats
    0x1F680,  # .. 0x1F6FF ; Transport and Map Symbols
    0x1F700,  # .. 0x1F77F ; Alchemical Symbols
    0x1F780,  # .. 0x1F7FF ; Geometric Shapes Extended
    0x1F800,  # .. 0x1F8FF ; Supplemental Arrows-C
    0x1F900,  # .. 0x1F9FF ; Supplemental Symbols and Pictographs
    0x1FA00,  # .. 0x1FA6F ; Chess Symbols
    0x1FA70,  # .. 0x1FAFF ; Symbols and Pictographs Extended-A
    0x1FB00,  # .. 0x1FBFF ; Symbols for Legacy Computing
    0x1FC00,  # .. 0x1FFFF ; No_Block
    0x20000,  # .. 0x2A6DF ; CJK Unified Ideographs Extension B
    0x2A6E0,  # .. 0x2A6FF ; No_Block
    0x2A700,  # .. 0x2B73F ; CJK Unified Ideographs Extension C
    0x2B740,  # .. 0x2B81F ; CJK Unified Ideographs Extension D
    0x2B820,  # .. 0x2CEAF ; CJK Unified Ideographs Extension E
    0x2CEB0,  # .. 0x2EBEF ; CJK Unified Ideographs Extension F
    0x2EBF0,  # .. 0x2F7FF ; No_Block
    0x2F800,  # .. 0x2FA1F ; CJK Compatibility Ideographs Supplement
    0x2FA20,  # .. 0x2FFFF ; No_Block
    0x30000,  # .. 0x3134F ; CJK Unified Ideographs Extension G
    0x31350,  # .. 0xDFFFF ; No_Block
    0xE0000,  # .. 0xE007F ; Tags
    0xE0080,  # .. 0xE00FF ; No_Block
    0xE0100,  # .. 0xE01EF ; Variation Selectors Supplement
    0xE01F0,  # .. 0xEFFFF ; No_Block
    0xF0000,  # .. 0xFFFFF ; Supplementary Private Use Area-A
    0x100000,  # .. 0x10FFFF ; Supplementary Private Use Area-B
]
392
393VALUES = [
394    'Basic Latin',                                       # 0000..007F
395    'Latin-1 Supplement',                                # 0080..00FF
396    'Latin Extended-A',                                  # 0100..017F
397    'Latin Extended-B',                                  # 0180..024F
398    'IPA Extensions',                                    # 0250..02AF
399    'Spacing Modifier Letters',                          # 02B0..02FF
400    'Combining Diacritical Marks',                       # 0300..036F
401    'Greek and Coptic',                                  # 0370..03FF
402    'Cyrillic',                                          # 0400..04FF
403    'Cyrillic Supplement',                               # 0500..052F
404    'Armenian',                                          # 0530..058F
405    'Hebrew',                                            # 0590..05FF
406    'Arabic',                                            # 0600..06FF
407    'Syriac',                                            # 0700..074F
408    'Arabic Supplement',                                 # 0750..077F
409    'Thaana',                                            # 0780..07BF
410    'NKo',                                               # 07C0..07FF
411    'Samaritan',                                         # 0800..083F
412    'Mandaic',                                           # 0840..085F
413    'Syriac Supplement',                                 # 0860..086F
414    'Arabic Extended-B',                                 # 0870..089F
415    'Arabic Extended-A',                                 # 08A0..08FF
416    'Devanagari',                                        # 0900..097F
417    'Bengali',                                           # 0980..09FF
418    'Gurmukhi',                                          # 0A00..0A7F
419    'Gujarati',                                          # 0A80..0AFF
420    'Oriya',                                             # 0B00..0B7F
421    'Tamil',                                             # 0B80..0BFF
422    'Telugu',                                            # 0C00..0C7F
423    'Kannada',                                           # 0C80..0CFF
424    'Malayalam',                                         # 0D00..0D7F
425    'Sinhala',                                           # 0D80..0DFF
426    'Thai',                                              # 0E00..0E7F
427    'Lao',                                               # 0E80..0EFF
428    'Tibetan',                                           # 0F00..0FFF
429    'Myanmar',                                           # 1000..109F
430    'Georgian',                                          # 10A0..10FF
431    'Hangul Jamo',                                       # 1100..11FF
432    'Ethiopic',                                          # 1200..137F
433    'Ethiopic Supplement',                               # 1380..139F
434    'Cherokee',                                          # 13A0..13FF
435    'Unified Canadian Aboriginal Syllabics',             # 1400..167F
436    'Ogham',                                             # 1680..169F
437    'Runic',                                             # 16A0..16FF
438    'Tagalog',                                           # 1700..171F
439    'Hanunoo',                                           # 1720..173F
440    'Buhid',                                             # 1740..175F
441    'Tagbanwa',                                          # 1760..177F
442    'Khmer',                                             # 1780..17FF
443    'Mongolian',                                         # 1800..18AF
444    'Unified Canadian Aboriginal Syllabics Extended',    # 18B0..18FF
445    'Limbu',                                             # 1900..194F
446    'Tai Le',                                            # 1950..197F
447    'New Tai Lue',                                       # 1980..19DF
448    'Khmer Symbols',                                     # 19E0..19FF
449    'Buginese',                                          # 1A00..1A1F
450    'Tai Tham',                                          # 1A20..1AAF
451    'Combining Diacritical Marks Extended',              # 1AB0..1AFF
452    'Balinese',                                          # 1B00..1B7F
453    'Sundanese',                                         # 1B80..1BBF
454    'Batak',                                             # 1BC0..1BFF
455    'Lepcha',                                            # 1C00..1C4F
456    'Ol Chiki',                                          # 1C50..1C7F
457    'Cyrillic Extended-C',                               # 1C80..1C8F
458    'Georgian Extended',                                 # 1C90..1CBF
459    'Sundanese Supplement',                              # 1CC0..1CCF
460    'Vedic Extensions',                                  # 1CD0..1CFF
461    'Phonetic Extensions',                               # 1D00..1D7F
462    'Phonetic Extensions Supplement',                    # 1D80..1DBF
463    'Combining Diacritical Marks Supplement',            # 1DC0..1DFF
464    'Latin Extended Additional',                         # 1E00..1EFF
465    'Greek Extended',                                    # 1F00..1FFF
466    'General Punctuation',                               # 2000..206F
467    'Superscripts and Subscripts',                       # 2070..209F
468    'Currency Symbols',                                  # 20A0..20CF
469    'Combining Diacritical Marks for Symbols',           # 20D0..20FF
470    'Letterlike Symbols',                                # 2100..214F
471    'Number Forms',                                      # 2150..218F
472    'Arrows',                                            # 2190..21FF
473    'Mathematical Operators',                            # 2200..22FF
474    'Miscellaneous Technical',                           # 2300..23FF
475    'Control Pictures',                                  # 2400..243F
476    'Optical Character Recognition',                     # 2440..245F
477    'Enclosed Alphanumerics',                            # 2460..24FF
478    'Box Drawing',                                       # 2500..257F
479    'Block Elements',                                    # 2580..259F
480    'Geometric Shapes',                                  # 25A0..25FF
481    'Miscellaneous Symbols',                             # 2600..26FF
482    'Dingbats',                                          # 2700..27BF
483    'Miscellaneous Mathematical Symbols-A',              # 27C0..27EF
484    'Supplemental Arrows-A',                             # 27F0..27FF
485    'Braille Patterns',                                  # 2800..28FF
486    'Supplemental Arrows-B',                             # 2900..297F
487    'Miscellaneous Mathematical Symbols-B',              # 2980..29FF
488    'Supplemental Mathematical Operators',               # 2A00..2AFF
489    'Miscellaneous Symbols and Arrows',                  # 2B00..2BFF
490    'Glagolitic',                                        # 2C00..2C5F
491    'Latin Extended-C',                                  # 2C60..2C7F
492    'Coptic',                                            # 2C80..2CFF
493    'Georgian Supplement',                               # 2D00..2D2F
494    'Tifinagh',                                          # 2D30..2D7F
495    'Ethiopic Extended',                                 # 2D80..2DDF
496    'Cyrillic Extended-A',                               # 2DE0..2DFF
497    'Supplemental Punctuation',                          # 2E00..2E7F
498    'CJK Radicals Supplement',                           # 2E80..2EFF
499    'Kangxi Radicals',                                   # 2F00..2FDF
500    'No_Block',                                          # 2FE0..2FEF
501    'Ideographic Description Characters',                # 2FF0..2FFF
502    'CJK Symbols and Punctuation',                       # 3000..303F
503    'Hiragana',                                          # 3040..309F
504    'Katakana',                                          # 30A0..30FF
505    'Bopomofo',                                          # 3100..312F
506    'Hangul Compatibility Jamo',                         # 3130..318F
507    'Kanbun',                                            # 3190..319F
508    'Bopomofo Extended',                                 # 31A0..31BF
509    'CJK Strokes',                                       # 31C0..31EF
510    'Katakana Phonetic Extensions',                      # 31F0..31FF
511    'Enclosed CJK Letters and Months',                   # 3200..32FF
512    'CJK Compatibility',                                 # 3300..33FF
513    'CJK Unified Ideographs Extension A',                # 3400..4DBF
514    'Yijing Hexagram Symbols',                           # 4DC0..4DFF
515    'CJK Unified Ideographs',                            # 4E00..9FFF
516    'Yi Syllables',                                      # A000..A48F
517    'Yi Radicals',                                       # A490..A4CF
518    'Lisu',                                              # A4D0..A4FF
519    'Vai',                                               # A500..A63F
520    'Cyrillic Extended-B',                               # A640..A69F
521    'Bamum',                                             # A6A0..A6FF
522    'Modifier Tone Letters',                             # A700..A71F
523    'Latin Extended-D',                                  # A720..A7FF
524    'Syloti Nagri',                                      # A800..A82F
525    'Common Indic Number Forms',                         # A830..A83F
526    'Phags-pa',                                          # A840..A87F
527    'Saurashtra',                                        # A880..A8DF
528    'Devanagari Extended',                               # A8E0..A8FF
529    'Kayah Li',                                          # A900..A92F
530    'Rejang',                                            # A930..A95F
531    'Hangul Jamo Extended-A',                            # A960..A97F
532    'Javanese',                                          # A980..A9DF
533    'Myanmar Extended-B',                                # A9E0..A9FF
534    'Cham',                                              # AA00..AA5F
535    'Myanmar Extended-A',                                # AA60..AA7F
536    'Tai Viet',                                          # AA80..AADF
537    'Meetei Mayek Extensions',                           # AAE0..AAFF
538    'Ethiopic Extended-A',                               # AB00..AB2F
539    'Latin Extended-E',                                  # AB30..AB6F
540    'Cherokee Supplement',                               # AB70..ABBF
541    'Meetei Mayek',                                      # ABC0..ABFF
542    'Hangul Syllables',                                  # AC00..D7AF
543    'Hangul Jamo Extended-B',                            # D7B0..D7FF
544    'High Surrogates',                                   # D800..DB7F
545    'High Private Use Surrogates',                       # DB80..DBFF
546    'Low Surrogates',                                    # DC00..DFFF
547    'Private Use Area',                                  # E000..F8FF
548    'CJK Compatibility Ideographs',                      # F900..FAFF
549    'Alphabetic Presentation Forms',                     # FB00..FB4F
550    'Arabic Presentation Forms-A',                       # FB50..FDFF
551    'Variation Selectors',                               # FE00..FE0F
552    'Vertical Forms',                                    # FE10..FE1F
553    'Combining Half Marks',                              # FE20..FE2F
554    'CJK Compatibility Forms',                           # FE30..FE4F
555    'Small Form Variants',                               # FE50..FE6F
556    'Arabic Presentation Forms-B',                       # FE70..FEFF
557    'Halfwidth and Fullwidth Forms',                     # FF00..FFEF
558    'Specials',                                          # FFF0..FFFF
559    'Linear B Syllabary',                                # 10000..1007F
560    'Linear B Ideograms',                                # 10080..100FF
561    'Aegean Numbers',                                    # 10100..1013F
562    'Ancient Greek Numbers',                             # 10140..1018F
563    'Ancient Symbols',                                   # 10190..101CF
564    'Phaistos Disc',                                     # 101D0..101FF
565    'No_Block',                                          # 10200..1027F
566    'Lycian',                                            # 10280..1029F
567    'Carian',                                            # 102A0..102DF
568    'Coptic Epact Numbers',                              # 102E0..102FF
569    'Old Italic',                                        # 10300..1032F
570    'Gothic',                                            # 10330..1034F
571    'Old Permic',                                        # 10350..1037F
572    'Ugaritic',                                          # 10380..1039F
573    'Old Persian',                                       # 103A0..103DF
574    'No_Block',                                          # 103E0..103FF
575    'Deseret',                                           # 10400..1044F
576    'Shavian',                                           # 10450..1047F
577    'Osmanya',                                           # 10480..104AF
578    'Osage',                                             # 104B0..104FF
579    'Elbasan',                                           # 10500..1052F
580    'Caucasian Albanian',                                # 10530..1056F
581    'Vithkuqi',                                          # 10570..105BF
582    'No_Block',                                          # 105C0..105FF
583    'Linear A',                                          # 10600..1077F
584    'Latin Extended-F',                                  # 10780..107BF
585    'No_Block',                                          # 107C0..107FF
586    'Cypriot Syllabary',                                 # 10800..1083F
587    'Imperial Aramaic',                                  # 10840..1085F
588    'Palmyrene',                                         # 10860..1087F
589    'Nabataean',                                         # 10880..108AF
590    'No_Block',                                          # 108B0..108DF
591    'Hatran',                                            # 108E0..108FF
592    'Phoenician',                                        # 10900..1091F
593    'Lydian',                                            # 10920..1093F
594    'No_Block',                                          # 10940..1097F
595    'Meroitic Hieroglyphs',                              # 10980..1099F
596    'Meroitic Cursive',                                  # 109A0..109FF
597    'Kharoshthi',                                        # 10A00..10A5F
598    'Old South Arabian',                                 # 10A60..10A7F
599    'Old North Arabian',                                 # 10A80..10A9F
600    'No_Block',                                          # 10AA0..10ABF
601    'Manichaean',                                        # 10AC0..10AFF
602    'Avestan',                                           # 10B00..10B3F
603    'Inscriptional Parthian',                            # 10B40..10B5F
604    'Inscriptional Pahlavi',                             # 10B60..10B7F
605    'Psalter Pahlavi',                                   # 10B80..10BAF
606    'No_Block',                                          # 10BB0..10BFF
607    'Old Turkic',                                        # 10C00..10C4F
608    'No_Block',                                          # 10C50..10C7F
609    'Old Hungarian',                                     # 10C80..10CFF
610    'Hanifi Rohingya',                                   # 10D00..10D3F
611    'No_Block',                                          # 10D40..10E5F
612    'Rumi Numeral Symbols',                              # 10E60..10E7F
613    'Yezidi',                                            # 10E80..10EBF
614    'No_Block',                                          # 10EC0..10EFF
615    'Old Sogdian',                                       # 10F00..10F2F
616    'Sogdian',                                           # 10F30..10F6F
617    'Old Uyghur',                                        # 10F70..10FAF
618    'Chorasmian',                                        # 10FB0..10FDF
619    'Elymaic',                                           # 10FE0..10FFF
620    'Brahmi',                                            # 11000..1107F
621    'Kaithi',                                            # 11080..110CF
622    'Sora Sompeng',                                      # 110D0..110FF
623    'Chakma',                                            # 11100..1114F
624    'Mahajani',                                          # 11150..1117F
625    'Sharada',                                           # 11180..111DF
626    'Sinhala Archaic Numbers',                           # 111E0..111FF
627    'Khojki',                                            # 11200..1124F
628    'No_Block',                                          # 11250..1127F
629    'Multani',                                           # 11280..112AF
630    'Khudawadi',                                         # 112B0..112FF
631    'Grantha',                                           # 11300..1137F
632    'No_Block',                                          # 11380..113FF
633    'Newa',                                              # 11400..1147F
634    'Tirhuta',                                           # 11480..114DF
635    'No_Block',                                          # 114E0..1157F
636    'Siddham',                                           # 11580..115FF
637    'Modi',                                              # 11600..1165F
638    'Mongolian Supplement',                              # 11660..1167F
639    'Takri',                                             # 11680..116CF
640    'No_Block',                                          # 116D0..116FF
641    'Ahom',                                              # 11700..1174F
642    'No_Block',                                          # 11750..117FF
643    'Dogra',                                             # 11800..1184F
644    'No_Block',                                          # 11850..1189F
645    'Warang Citi',                                       # 118A0..118FF
646    'Dives Akuru',                                       # 11900..1195F
647    'No_Block',                                          # 11960..1199F
648    'Nandinagari',                                       # 119A0..119FF
649    'Zanabazar Square',                                  # 11A00..11A4F
650    'Soyombo',                                           # 11A50..11AAF
651    'Unified Canadian Aboriginal Syllabics Extended-A',  # 11AB0..11ABF
652    'Pau Cin Hau',                                       # 11AC0..11AFF
653    'No_Block',                                          # 11B00..11BFF
654    'Bhaiksuki',                                         # 11C00..11C6F
655    'Marchen',                                           # 11C70..11CBF
656    'No_Block',                                          # 11CC0..11CFF
657    'Masaram Gondi',                                     # 11D00..11D5F
658    'Gunjala Gondi',                                     # 11D60..11DAF
659    'No_Block',                                          # 11DB0..11EDF
660    'Makasar',                                           # 11EE0..11EFF
661    'No_Block',                                          # 11F00..11FAF
662    'Lisu Supplement',                                   # 11FB0..11FBF
663    'Tamil Supplement',                                  # 11FC0..11FFF
664    'Cuneiform',                                         # 12000..123FF
665    'Cuneiform Numbers and Punctuation',                 # 12400..1247F
666    'Early Dynastic Cuneiform',                          # 12480..1254F
667    'No_Block',                                          # 12550..12F8F
668    'Cypro-Minoan',                                      # 12F90..12FFF
669    'Egyptian Hieroglyphs',                              # 13000..1342F
670    'Egyptian Hieroglyph Format Controls',               # 13430..1343F
671    'No_Block',                                          # 13440..143FF
672    'Anatolian Hieroglyphs',                             # 14400..1467F
673    'No_Block',                                          # 14680..167FF
674    'Bamum Supplement',                                  # 16800..16A3F
675    'Mro',                                               # 16A40..16A6F
676    'Tangsa',                                            # 16A70..16ACF
677    'Bassa Vah',                                         # 16AD0..16AFF
678    'Pahawh Hmong',                                      # 16B00..16B8F
679    'No_Block',                                          # 16B90..16E3F
680    'Medefaidrin',                                       # 16E40..16E9F
681    'No_Block',                                          # 16EA0..16EFF
682    'Miao',                                              # 16F00..16F9F
683    'No_Block',                                          # 16FA0..16FDF
684    'Ideographic Symbols and Punctuation',               # 16FE0..16FFF
685    'Tangut',                                            # 17000..187FF
686    'Tangut Components',                                 # 18800..18AFF
687    'Khitan Small Script',                               # 18B00..18CFF
688    'Tangut Supplement',                                 # 18D00..18D7F
689    'No_Block',                                          # 18D80..1AFEF
690    'Kana Extended-B',                                   # 1AFF0..1AFFF
691    'Kana Supplement',                                   # 1B000..1B0FF
692    'Kana Extended-A',                                   # 1B100..1B12F
693    'Small Kana Extension',                              # 1B130..1B16F
694    'Nushu',                                             # 1B170..1B2FF
695    'No_Block',                                          # 1B300..1BBFF
696    'Duployan',                                          # 1BC00..1BC9F
697    'Shorthand Format Controls',                         # 1BCA0..1BCAF
698    'No_Block',                                          # 1BCB0..1CEFF
699    'Znamenny Musical Notation',                         # 1CF00..1CFCF
700    'No_Block',                                          # 1CFD0..1CFFF
701    'Byzantine Musical Symbols',                         # 1D000..1D0FF
702    'Musical Symbols',                                   # 1D100..1D1FF
703    'Ancient Greek Musical Notation',                    # 1D200..1D24F
704    'No_Block',                                          # 1D250..1D2DF
705    'Mayan Numerals',                                    # 1D2E0..1D2FF
706    'Tai Xuan Jing Symbols',                             # 1D300..1D35F
707    'Counting Rod Numerals',                             # 1D360..1D37F
708    'No_Block',                                          # 1D380..1D3FF
709    'Mathematical Alphanumeric Symbols',                 # 1D400..1D7FF
710    'Sutton SignWriting',                                # 1D800..1DAAF
711    'No_Block',                                          # 1DAB0..1DEFF
712    'Latin Extended-G',                                  # 1DF00..1DFFF
713    'Glagolitic Supplement',                             # 1E000..1E02F
714    'No_Block',                                          # 1E030..1E0FF
715    'Nyiakeng Puachue Hmong',                            # 1E100..1E14F
716    'No_Block',                                          # 1E150..1E28F
717    'Toto',                                              # 1E290..1E2BF
718    'Wancho',                                            # 1E2C0..1E2FF
719    'No_Block',                                          # 1E300..1E7DF
720    'Ethiopic Extended-B',                               # 1E7E0..1E7FF
721    'Mende Kikakui',                                     # 1E800..1E8DF
722    'No_Block',                                          # 1E8E0..1E8FF
723    'Adlam',                                             # 1E900..1E95F
724    'No_Block',                                          # 1E960..1EC6F
725    'Indic Siyaq Numbers',                               # 1EC70..1ECBF
726    'No_Block',                                          # 1ECC0..1ECFF
727    'Ottoman Siyaq Numbers',                             # 1ED00..1ED4F
728    'No_Block',                                          # 1ED50..1EDFF
729    'Arabic Mathematical Alphabetic Symbols',            # 1EE00..1EEFF
730    'No_Block',                                          # 1EF00..1EFFF
731    'Mahjong Tiles',                                     # 1F000..1F02F
732    'Domino Tiles',                                      # 1F030..1F09F
733    'Playing Cards',                                     # 1F0A0..1F0FF
734    'Enclosed Alphanumeric Supplement',                  # 1F100..1F1FF
735    'Enclosed Ideographic Supplement',                   # 1F200..1F2FF
736    'Miscellaneous Symbols and Pictographs',             # 1F300..1F5FF
737    'Emoticons',                                         # 1F600..1F64F
738    'Ornamental Dingbats',                               # 1F650..1F67F
739    'Transport and Map Symbols',                         # 1F680..1F6FF
740    'Alchemical Symbols',                                # 1F700..1F77F
741    'Geometric Shapes Extended',                         # 1F780..1F7FF
742    'Supplemental Arrows-C',                             # 1F800..1F8FF
743    'Supplemental Symbols and Pictographs',              # 1F900..1F9FF
744    'Chess Symbols',                                     # 1FA00..1FA6F
745    'Symbols and Pictographs Extended-A',                # 1FA70..1FAFF
746    'Symbols for Legacy Computing',                      # 1FB00..1FBFF
747    'No_Block',                                          # 1FC00..1FFFF
748    'CJK Unified Ideographs Extension B',                # 20000..2A6DF
749    'No_Block',                                          # 2A6E0..2A6FF
750    'CJK Unified Ideographs Extension C',                # 2A700..2B73F
751    'CJK Unified Ideographs Extension D',                # 2B740..2B81F
752    'CJK Unified Ideographs Extension E',                # 2B820..2CEAF
753    'CJK Unified Ideographs Extension F',                # 2CEB0..2EBEF
754    'No_Block',                                          # 2EBF0..2F7FF
755    'CJK Compatibility Ideographs Supplement',           # 2F800..2FA1F
756    'No_Block',                                          # 2FA20..2FFFF
757    'CJK Unified Ideographs Extension G',                # 30000..3134F
758    'No_Block',                                          # 31350..DFFFF
759    'Tags',                                              # E0000..E007F
760    'No_Block',                                          # E0080..E00FF
761    'Variation Selectors Supplement',                    # E0100..E01EF
762    'No_Block',                                          # E01F0..EFFFF
763    'Supplementary Private Use Area-A',                  # F0000..FFFFF
764    'Supplementary Private Use Area-B',                  # 100000..10FFFF
765]
766