aboutsummaryrefslogtreecommitdiff
path: root/Lib/fontTools/unicodedata/Blocks.py
diff options
context:
space:
mode:
Diffstat (limited to 'Lib/fontTools/unicodedata/Blocks.py')
-rw-r--r--Lib/fontTools/unicodedata/Blocks.py778
1 files changed, 398 insertions, 380 deletions
diff --git a/Lib/fontTools/unicodedata/Blocks.py b/Lib/fontTools/unicodedata/Blocks.py
index 0755074b..2b30be67 100644
--- a/Lib/fontTools/unicodedata/Blocks.py
+++ b/Lib/fontTools/unicodedata/Blocks.py
@@ -4,9 +4,9 @@
# Source: https://unicode.org/Public/UNIDATA/Blocks.txt
# License: http://unicode.org/copyright.html#License
#
-# Blocks-13.0.0.txt
-# Date: 2019-07-10, 19:06:00 GMT [KW]
-# © 2019 Unicode®, Inc.
+# Blocks-14.0.0.txt
+# Date: 2021-01-22, 23:29:00 GMT [KW]
+# © 2021 Unicode®, Inc.
# For terms of use, see http://www.unicode.org/terms_of_use.html
#
# Unicode Character Database
@@ -37,7 +37,7 @@ RANGES = [
0x0800, # .. 0x083F ; Samaritan
0x0840, # .. 0x085F ; Mandaic
0x0860, # .. 0x086F ; Syriac Supplement
- 0x0870, # .. 0x089F ; No_Block
+ 0x0870, # .. 0x089F ; Arabic Extended-B
0x08A0, # .. 0x08FF ; Arabic Extended-A
0x0900, # .. 0x097F ; Devanagari
0x0980, # .. 0x09FF ; Bengali
@@ -204,9 +204,11 @@ RANGES = [
0x104B0, # .. 0x104FF ; Osage
0x10500, # .. 0x1052F ; Elbasan
0x10530, # .. 0x1056F ; Caucasian Albanian
- 0x10570, # .. 0x105FF ; No_Block
+ 0x10570, # .. 0x105BF ; Vithkuqi
+ 0x105C0, # .. 0x105FF ; No_Block
0x10600, # .. 0x1077F ; Linear A
- 0x10780, # .. 0x107FF ; No_Block
+ 0x10780, # .. 0x107BF ; Latin Extended-F
+ 0x107C0, # .. 0x107FF ; No_Block
0x10800, # .. 0x1083F ; Cypriot Syllabary
0x10840, # .. 0x1085F ; Imperial Aramaic
0x10860, # .. 0x1087F ; Palmyrene
@@ -238,7 +240,7 @@ RANGES = [
0x10EC0, # .. 0x10EFF ; No_Block
0x10F00, # .. 0x10F2F ; Old Sogdian
0x10F30, # .. 0x10F6F ; Sogdian
- 0x10F70, # .. 0x10FAF ; No_Block
+ 0x10F70, # .. 0x10FAF ; Old Uyghur
0x10FB0, # .. 0x10FDF ; Chorasmian
0x10FE0, # .. 0x10FFF ; Elymaic
0x11000, # .. 0x1107F ; Brahmi
@@ -262,8 +264,8 @@ RANGES = [
0x11660, # .. 0x1167F ; Mongolian Supplement
0x11680, # .. 0x116CF ; Takri
0x116D0, # .. 0x116FF ; No_Block
- 0x11700, # .. 0x1173F ; Ahom
- 0x11740, # .. 0x117FF ; No_Block
+ 0x11700, # .. 0x1174F ; Ahom
+ 0x11750, # .. 0x117FF ; No_Block
0x11800, # .. 0x1184F ; Dogra
0x11850, # .. 0x1189F ; No_Block
0x118A0, # .. 0x118FF ; Warang Citi
@@ -272,7 +274,7 @@ RANGES = [
0x119A0, # .. 0x119FF ; Nandinagari
0x11A00, # .. 0x11A4F ; Zanabazar Square
0x11A50, # .. 0x11AAF ; Soyombo
- 0x11AB0, # .. 0x11ABF ; No_Block
+ 0x11AB0, # .. 0x11ABF ; Unified Canadian Aboriginal Syllabics Extended-A
0x11AC0, # .. 0x11AFF ; Pau Cin Hau
0x11B00, # .. 0x11BFF ; No_Block
0x11C00, # .. 0x11C6F ; Bhaiksuki
@@ -288,7 +290,8 @@ RANGES = [
0x12000, # .. 0x123FF ; Cuneiform
0x12400, # .. 0x1247F ; Cuneiform Numbers and Punctuation
0x12480, # .. 0x1254F ; Early Dynastic Cuneiform
- 0x12550, # .. 0x12FFF ; No_Block
+ 0x12550, # .. 0x12F8F ; No_Block
+ 0x12F90, # .. 0x12FFF ; Cypro-Minoan
0x13000, # .. 0x1342F ; Egyptian Hieroglyphs
0x13430, # .. 0x1343F ; Egyptian Hieroglyph Format Controls
0x13440, # .. 0x143FF ; No_Block
@@ -296,7 +299,7 @@ RANGES = [
0x14680, # .. 0x167FF ; No_Block
0x16800, # .. 0x16A3F ; Bamum Supplement
0x16A40, # .. 0x16A6F ; Mro
- 0x16A70, # .. 0x16ACF ; No_Block
+ 0x16A70, # .. 0x16ACF ; Tangsa
0x16AD0, # .. 0x16AFF ; Bassa Vah
0x16B00, # .. 0x16B8F ; Pahawh Hmong
0x16B90, # .. 0x16E3F ; No_Block
@@ -308,8 +311,9 @@ RANGES = [
0x17000, # .. 0x187FF ; Tangut
0x18800, # .. 0x18AFF ; Tangut Components
0x18B00, # .. 0x18CFF ; Khitan Small Script
- 0x18D00, # .. 0x18D8F ; Tangut Supplement
- 0x18D90, # .. 0x1AFFF ; No_Block
+ 0x18D00, # .. 0x18D7F ; Tangut Supplement
+ 0x18D80, # .. 0x1AFEF ; No_Block
+ 0x1AFF0, # .. 0x1AFFF ; Kana Extended-B
0x1B000, # .. 0x1B0FF ; Kana Supplement
0x1B100, # .. 0x1B12F ; Kana Extended-A
0x1B130, # .. 0x1B16F ; Small Kana Extension
@@ -317,7 +321,9 @@ RANGES = [
0x1B300, # .. 0x1BBFF ; No_Block
0x1BC00, # .. 0x1BC9F ; Duployan
0x1BCA0, # .. 0x1BCAF ; Shorthand Format Controls
- 0x1BCB0, # .. 0x1CFFF ; No_Block
+ 0x1BCB0, # .. 0x1CEFF ; No_Block
+ 0x1CF00, # .. 0x1CFCF ; Znamenny Musical Notation
+ 0x1CFD0, # .. 0x1CFFF ; No_Block
0x1D000, # .. 0x1D0FF ; Byzantine Musical Symbols
0x1D100, # .. 0x1D1FF ; Musical Symbols
0x1D200, # .. 0x1D24F ; Ancient Greek Musical Notation
@@ -328,13 +334,16 @@ RANGES = [
0x1D380, # .. 0x1D3FF ; No_Block
0x1D400, # .. 0x1D7FF ; Mathematical Alphanumeric Symbols
0x1D800, # .. 0x1DAAF ; Sutton SignWriting
- 0x1DAB0, # .. 0x1DFFF ; No_Block
+ 0x1DAB0, # .. 0x1DEFF ; No_Block
+ 0x1DF00, # .. 0x1DFFF ; Latin Extended-G
0x1E000, # .. 0x1E02F ; Glagolitic Supplement
0x1E030, # .. 0x1E0FF ; No_Block
0x1E100, # .. 0x1E14F ; Nyiakeng Puachue Hmong
- 0x1E150, # .. 0x1E2BF ; No_Block
+ 0x1E150, # .. 0x1E28F ; No_Block
+ 0x1E290, # .. 0x1E2BF ; Toto
0x1E2C0, # .. 0x1E2FF ; Wancho
- 0x1E300, # .. 0x1E7FF ; No_Block
+ 0x1E300, # .. 0x1E7DF ; No_Block
+ 0x1E7E0, # .. 0x1E7FF ; Ethiopic Extended-B
0x1E800, # .. 0x1E8DF ; Mende Kikakui
0x1E8E0, # .. 0x1E8FF ; No_Block
0x1E900, # .. 0x1E95F ; Adlam
@@ -382,366 +391,375 @@ RANGES = [
]
VALUES = [
- 'Basic Latin', # 0000..007F
- 'Latin-1 Supplement', # 0080..00FF
- 'Latin Extended-A', # 0100..017F
- 'Latin Extended-B', # 0180..024F
- 'IPA Extensions', # 0250..02AF
- 'Spacing Modifier Letters', # 02B0..02FF
- 'Combining Diacritical Marks', # 0300..036F
- 'Greek and Coptic', # 0370..03FF
- 'Cyrillic', # 0400..04FF
- 'Cyrillic Supplement', # 0500..052F
- 'Armenian', # 0530..058F
- 'Hebrew', # 0590..05FF
- 'Arabic', # 0600..06FF
- 'Syriac', # 0700..074F
- 'Arabic Supplement', # 0750..077F
- 'Thaana', # 0780..07BF
- 'NKo', # 07C0..07FF
- 'Samaritan', # 0800..083F
- 'Mandaic', # 0840..085F
- 'Syriac Supplement', # 0860..086F
- 'No_Block', # 0870..089F
- 'Arabic Extended-A', # 08A0..08FF
- 'Devanagari', # 0900..097F
- 'Bengali', # 0980..09FF
- 'Gurmukhi', # 0A00..0A7F
- 'Gujarati', # 0A80..0AFF
- 'Oriya', # 0B00..0B7F
- 'Tamil', # 0B80..0BFF
- 'Telugu', # 0C00..0C7F
- 'Kannada', # 0C80..0CFF
- 'Malayalam', # 0D00..0D7F
- 'Sinhala', # 0D80..0DFF
- 'Thai', # 0E00..0E7F
- 'Lao', # 0E80..0EFF
- 'Tibetan', # 0F00..0FFF
- 'Myanmar', # 1000..109F
- 'Georgian', # 10A0..10FF
- 'Hangul Jamo', # 1100..11FF
- 'Ethiopic', # 1200..137F
- 'Ethiopic Supplement', # 1380..139F
- 'Cherokee', # 13A0..13FF
- 'Unified Canadian Aboriginal Syllabics', # 1400..167F
- 'Ogham', # 1680..169F
- 'Runic', # 16A0..16FF
- 'Tagalog', # 1700..171F
- 'Hanunoo', # 1720..173F
- 'Buhid', # 1740..175F
- 'Tagbanwa', # 1760..177F
- 'Khmer', # 1780..17FF
- 'Mongolian', # 1800..18AF
- 'Unified Canadian Aboriginal Syllabics Extended', # 18B0..18FF
- 'Limbu', # 1900..194F
- 'Tai Le', # 1950..197F
- 'New Tai Lue', # 1980..19DF
- 'Khmer Symbols', # 19E0..19FF
- 'Buginese', # 1A00..1A1F
- 'Tai Tham', # 1A20..1AAF
- 'Combining Diacritical Marks Extended', # 1AB0..1AFF
- 'Balinese', # 1B00..1B7F
- 'Sundanese', # 1B80..1BBF
- 'Batak', # 1BC0..1BFF
- 'Lepcha', # 1C00..1C4F
- 'Ol Chiki', # 1C50..1C7F
- 'Cyrillic Extended-C', # 1C80..1C8F
- 'Georgian Extended', # 1C90..1CBF
- 'Sundanese Supplement', # 1CC0..1CCF
- 'Vedic Extensions', # 1CD0..1CFF
- 'Phonetic Extensions', # 1D00..1D7F
- 'Phonetic Extensions Supplement', # 1D80..1DBF
- 'Combining Diacritical Marks Supplement', # 1DC0..1DFF
- 'Latin Extended Additional', # 1E00..1EFF
- 'Greek Extended', # 1F00..1FFF
- 'General Punctuation', # 2000..206F
- 'Superscripts and Subscripts', # 2070..209F
- 'Currency Symbols', # 20A0..20CF
- 'Combining Diacritical Marks for Symbols', # 20D0..20FF
- 'Letterlike Symbols', # 2100..214F
- 'Number Forms', # 2150..218F
- 'Arrows', # 2190..21FF
- 'Mathematical Operators', # 2200..22FF
- 'Miscellaneous Technical', # 2300..23FF
- 'Control Pictures', # 2400..243F
- 'Optical Character Recognition', # 2440..245F
- 'Enclosed Alphanumerics', # 2460..24FF
- 'Box Drawing', # 2500..257F
- 'Block Elements', # 2580..259F
- 'Geometric Shapes', # 25A0..25FF
- 'Miscellaneous Symbols', # 2600..26FF
- 'Dingbats', # 2700..27BF
- 'Miscellaneous Mathematical Symbols-A', # 27C0..27EF
- 'Supplemental Arrows-A', # 27F0..27FF
- 'Braille Patterns', # 2800..28FF
- 'Supplemental Arrows-B', # 2900..297F
- 'Miscellaneous Mathematical Symbols-B', # 2980..29FF
- 'Supplemental Mathematical Operators', # 2A00..2AFF
- 'Miscellaneous Symbols and Arrows', # 2B00..2BFF
- 'Glagolitic', # 2C00..2C5F
- 'Latin Extended-C', # 2C60..2C7F
- 'Coptic', # 2C80..2CFF
- 'Georgian Supplement', # 2D00..2D2F
- 'Tifinagh', # 2D30..2D7F
- 'Ethiopic Extended', # 2D80..2DDF
- 'Cyrillic Extended-A', # 2DE0..2DFF
- 'Supplemental Punctuation', # 2E00..2E7F
- 'CJK Radicals Supplement', # 2E80..2EFF
- 'Kangxi Radicals', # 2F00..2FDF
- 'No_Block', # 2FE0..2FEF
- 'Ideographic Description Characters', # 2FF0..2FFF
- 'CJK Symbols and Punctuation', # 3000..303F
- 'Hiragana', # 3040..309F
- 'Katakana', # 30A0..30FF
- 'Bopomofo', # 3100..312F
- 'Hangul Compatibility Jamo', # 3130..318F
- 'Kanbun', # 3190..319F
- 'Bopomofo Extended', # 31A0..31BF
- 'CJK Strokes', # 31C0..31EF
- 'Katakana Phonetic Extensions', # 31F0..31FF
- 'Enclosed CJK Letters and Months', # 3200..32FF
- 'CJK Compatibility', # 3300..33FF
- 'CJK Unified Ideographs Extension A', # 3400..4DBF
- 'Yijing Hexagram Symbols', # 4DC0..4DFF
- 'CJK Unified Ideographs', # 4E00..9FFF
- 'Yi Syllables', # A000..A48F
- 'Yi Radicals', # A490..A4CF
- 'Lisu', # A4D0..A4FF
- 'Vai', # A500..A63F
- 'Cyrillic Extended-B', # A640..A69F
- 'Bamum', # A6A0..A6FF
- 'Modifier Tone Letters', # A700..A71F
- 'Latin Extended-D', # A720..A7FF
- 'Syloti Nagri', # A800..A82F
- 'Common Indic Number Forms', # A830..A83F
- 'Phags-pa', # A840..A87F
- 'Saurashtra', # A880..A8DF
- 'Devanagari Extended', # A8E0..A8FF
- 'Kayah Li', # A900..A92F
- 'Rejang', # A930..A95F
- 'Hangul Jamo Extended-A', # A960..A97F
- 'Javanese', # A980..A9DF
- 'Myanmar Extended-B', # A9E0..A9FF
- 'Cham', # AA00..AA5F
- 'Myanmar Extended-A', # AA60..AA7F
- 'Tai Viet', # AA80..AADF
- 'Meetei Mayek Extensions', # AAE0..AAFF
- 'Ethiopic Extended-A', # AB00..AB2F
- 'Latin Extended-E', # AB30..AB6F
- 'Cherokee Supplement', # AB70..ABBF
- 'Meetei Mayek', # ABC0..ABFF
- 'Hangul Syllables', # AC00..D7AF
- 'Hangul Jamo Extended-B', # D7B0..D7FF
- 'High Surrogates', # D800..DB7F
- 'High Private Use Surrogates', # DB80..DBFF
- 'Low Surrogates', # DC00..DFFF
- 'Private Use Area', # E000..F8FF
- 'CJK Compatibility Ideographs', # F900..FAFF
- 'Alphabetic Presentation Forms', # FB00..FB4F
- 'Arabic Presentation Forms-A', # FB50..FDFF
- 'Variation Selectors', # FE00..FE0F
- 'Vertical Forms', # FE10..FE1F
- 'Combining Half Marks', # FE20..FE2F
- 'CJK Compatibility Forms', # FE30..FE4F
- 'Small Form Variants', # FE50..FE6F
- 'Arabic Presentation Forms-B', # FE70..FEFF
- 'Halfwidth and Fullwidth Forms', # FF00..FFEF
- 'Specials', # FFF0..FFFF
- 'Linear B Syllabary', # 10000..1007F
- 'Linear B Ideograms', # 10080..100FF
- 'Aegean Numbers', # 10100..1013F
- 'Ancient Greek Numbers', # 10140..1018F
- 'Ancient Symbols', # 10190..101CF
- 'Phaistos Disc', # 101D0..101FF
- 'No_Block', # 10200..1027F
- 'Lycian', # 10280..1029F
- 'Carian', # 102A0..102DF
- 'Coptic Epact Numbers', # 102E0..102FF
- 'Old Italic', # 10300..1032F
- 'Gothic', # 10330..1034F
- 'Old Permic', # 10350..1037F
- 'Ugaritic', # 10380..1039F
- 'Old Persian', # 103A0..103DF
- 'No_Block', # 103E0..103FF
- 'Deseret', # 10400..1044F
- 'Shavian', # 10450..1047F
- 'Osmanya', # 10480..104AF
- 'Osage', # 104B0..104FF
- 'Elbasan', # 10500..1052F
- 'Caucasian Albanian', # 10530..1056F
- 'No_Block', # 10570..105FF
- 'Linear A', # 10600..1077F
- 'No_Block', # 10780..107FF
- 'Cypriot Syllabary', # 10800..1083F
- 'Imperial Aramaic', # 10840..1085F
- 'Palmyrene', # 10860..1087F
- 'Nabataean', # 10880..108AF
- 'No_Block', # 108B0..108DF
- 'Hatran', # 108E0..108FF
- 'Phoenician', # 10900..1091F
- 'Lydian', # 10920..1093F
- 'No_Block', # 10940..1097F
- 'Meroitic Hieroglyphs', # 10980..1099F
- 'Meroitic Cursive', # 109A0..109FF
- 'Kharoshthi', # 10A00..10A5F
- 'Old South Arabian', # 10A60..10A7F
- 'Old North Arabian', # 10A80..10A9F
- 'No_Block', # 10AA0..10ABF
- 'Manichaean', # 10AC0..10AFF
- 'Avestan', # 10B00..10B3F
- 'Inscriptional Parthian', # 10B40..10B5F
- 'Inscriptional Pahlavi', # 10B60..10B7F
- 'Psalter Pahlavi', # 10B80..10BAF
- 'No_Block', # 10BB0..10BFF
- 'Old Turkic', # 10C00..10C4F
- 'No_Block', # 10C50..10C7F
- 'Old Hungarian', # 10C80..10CFF
- 'Hanifi Rohingya', # 10D00..10D3F
- 'No_Block', # 10D40..10E5F
- 'Rumi Numeral Symbols', # 10E60..10E7F
- 'Yezidi', # 10E80..10EBF
- 'No_Block', # 10EC0..10EFF
- 'Old Sogdian', # 10F00..10F2F
- 'Sogdian', # 10F30..10F6F
- 'No_Block', # 10F70..10FAF
- 'Chorasmian', # 10FB0..10FDF
- 'Elymaic', # 10FE0..10FFF
- 'Brahmi', # 11000..1107F
- 'Kaithi', # 11080..110CF
- 'Sora Sompeng', # 110D0..110FF
- 'Chakma', # 11100..1114F
- 'Mahajani', # 11150..1117F
- 'Sharada', # 11180..111DF
- 'Sinhala Archaic Numbers', # 111E0..111FF
- 'Khojki', # 11200..1124F
- 'No_Block', # 11250..1127F
- 'Multani', # 11280..112AF
- 'Khudawadi', # 112B0..112FF
- 'Grantha', # 11300..1137F
- 'No_Block', # 11380..113FF
- 'Newa', # 11400..1147F
- 'Tirhuta', # 11480..114DF
- 'No_Block', # 114E0..1157F
- 'Siddham', # 11580..115FF
- 'Modi', # 11600..1165F
- 'Mongolian Supplement', # 11660..1167F
- 'Takri', # 11680..116CF
- 'No_Block', # 116D0..116FF
- 'Ahom', # 11700..1173F
- 'No_Block', # 11740..117FF
- 'Dogra', # 11800..1184F
- 'No_Block', # 11850..1189F
- 'Warang Citi', # 118A0..118FF
- 'Dives Akuru', # 11900..1195F
- 'No_Block', # 11960..1199F
- 'Nandinagari', # 119A0..119FF
- 'Zanabazar Square', # 11A00..11A4F
- 'Soyombo', # 11A50..11AAF
- 'No_Block', # 11AB0..11ABF
- 'Pau Cin Hau', # 11AC0..11AFF
- 'No_Block', # 11B00..11BFF
- 'Bhaiksuki', # 11C00..11C6F
- 'Marchen', # 11C70..11CBF
- 'No_Block', # 11CC0..11CFF
- 'Masaram Gondi', # 11D00..11D5F
- 'Gunjala Gondi', # 11D60..11DAF
- 'No_Block', # 11DB0..11EDF
- 'Makasar', # 11EE0..11EFF
- 'No_Block', # 11F00..11FAF
- 'Lisu Supplement', # 11FB0..11FBF
- 'Tamil Supplement', # 11FC0..11FFF
- 'Cuneiform', # 12000..123FF
- 'Cuneiform Numbers and Punctuation', # 12400..1247F
- 'Early Dynastic Cuneiform', # 12480..1254F
- 'No_Block', # 12550..12FFF
- 'Egyptian Hieroglyphs', # 13000..1342F
- 'Egyptian Hieroglyph Format Controls', # 13430..1343F
- 'No_Block', # 13440..143FF
- 'Anatolian Hieroglyphs', # 14400..1467F
- 'No_Block', # 14680..167FF
- 'Bamum Supplement', # 16800..16A3F
- 'Mro', # 16A40..16A6F
- 'No_Block', # 16A70..16ACF
- 'Bassa Vah', # 16AD0..16AFF
- 'Pahawh Hmong', # 16B00..16B8F
- 'No_Block', # 16B90..16E3F
- 'Medefaidrin', # 16E40..16E9F
- 'No_Block', # 16EA0..16EFF
- 'Miao', # 16F00..16F9F
- 'No_Block', # 16FA0..16FDF
- 'Ideographic Symbols and Punctuation', # 16FE0..16FFF
- 'Tangut', # 17000..187FF
- 'Tangut Components', # 18800..18AFF
- 'Khitan Small Script', # 18B00..18CFF
- 'Tangut Supplement', # 18D00..18D8F
- 'No_Block', # 18D90..1AFFF
- 'Kana Supplement', # 1B000..1B0FF
- 'Kana Extended-A', # 1B100..1B12F
- 'Small Kana Extension', # 1B130..1B16F
- 'Nushu', # 1B170..1B2FF
- 'No_Block', # 1B300..1BBFF
- 'Duployan', # 1BC00..1BC9F
- 'Shorthand Format Controls', # 1BCA0..1BCAF
- 'No_Block', # 1BCB0..1CFFF
- 'Byzantine Musical Symbols', # 1D000..1D0FF
- 'Musical Symbols', # 1D100..1D1FF
- 'Ancient Greek Musical Notation', # 1D200..1D24F
- 'No_Block', # 1D250..1D2DF
- 'Mayan Numerals', # 1D2E0..1D2FF
- 'Tai Xuan Jing Symbols', # 1D300..1D35F
- 'Counting Rod Numerals', # 1D360..1D37F
- 'No_Block', # 1D380..1D3FF
- 'Mathematical Alphanumeric Symbols', # 1D400..1D7FF
- 'Sutton SignWriting', # 1D800..1DAAF
- 'No_Block', # 1DAB0..1DFFF
- 'Glagolitic Supplement', # 1E000..1E02F
- 'No_Block', # 1E030..1E0FF
- 'Nyiakeng Puachue Hmong', # 1E100..1E14F
- 'No_Block', # 1E150..1E2BF
- 'Wancho', # 1E2C0..1E2FF
- 'No_Block', # 1E300..1E7FF
- 'Mende Kikakui', # 1E800..1E8DF
- 'No_Block', # 1E8E0..1E8FF
- 'Adlam', # 1E900..1E95F
- 'No_Block', # 1E960..1EC6F
- 'Indic Siyaq Numbers', # 1EC70..1ECBF
- 'No_Block', # 1ECC0..1ECFF
- 'Ottoman Siyaq Numbers', # 1ED00..1ED4F
- 'No_Block', # 1ED50..1EDFF
- 'Arabic Mathematical Alphabetic Symbols', # 1EE00..1EEFF
- 'No_Block', # 1EF00..1EFFF
- 'Mahjong Tiles', # 1F000..1F02F
- 'Domino Tiles', # 1F030..1F09F
- 'Playing Cards', # 1F0A0..1F0FF
- 'Enclosed Alphanumeric Supplement', # 1F100..1F1FF
- 'Enclosed Ideographic Supplement', # 1F200..1F2FF
- 'Miscellaneous Symbols and Pictographs', # 1F300..1F5FF
- 'Emoticons', # 1F600..1F64F
- 'Ornamental Dingbats', # 1F650..1F67F
- 'Transport and Map Symbols', # 1F680..1F6FF
- 'Alchemical Symbols', # 1F700..1F77F
- 'Geometric Shapes Extended', # 1F780..1F7FF
- 'Supplemental Arrows-C', # 1F800..1F8FF
- 'Supplemental Symbols and Pictographs', # 1F900..1F9FF
- 'Chess Symbols', # 1FA00..1FA6F
- 'Symbols and Pictographs Extended-A', # 1FA70..1FAFF
- 'Symbols for Legacy Computing', # 1FB00..1FBFF
- 'No_Block', # 1FC00..1FFFF
- 'CJK Unified Ideographs Extension B', # 20000..2A6DF
- 'No_Block', # 2A6E0..2A6FF
- 'CJK Unified Ideographs Extension C', # 2A700..2B73F
- 'CJK Unified Ideographs Extension D', # 2B740..2B81F
- 'CJK Unified Ideographs Extension E', # 2B820..2CEAF
- 'CJK Unified Ideographs Extension F', # 2CEB0..2EBEF
- 'No_Block', # 2EBF0..2F7FF
- 'CJK Compatibility Ideographs Supplement', # 2F800..2FA1F
- 'No_Block', # 2FA20..2FFFF
- 'CJK Unified Ideographs Extension G', # 30000..3134F
- 'No_Block', # 31350..DFFFF
- 'Tags', # E0000..E007F
- 'No_Block', # E0080..E00FF
- 'Variation Selectors Supplement', # E0100..E01EF
- 'No_Block', # E01F0..EFFFF
- 'Supplementary Private Use Area-A', # F0000..FFFFF
- 'Supplementary Private Use Area-B', # 100000..10FFFF
+ 'Basic Latin', # 0000..007F
+ 'Latin-1 Supplement', # 0080..00FF
+ 'Latin Extended-A', # 0100..017F
+ 'Latin Extended-B', # 0180..024F
+ 'IPA Extensions', # 0250..02AF
+ 'Spacing Modifier Letters', # 02B0..02FF
+ 'Combining Diacritical Marks', # 0300..036F
+ 'Greek and Coptic', # 0370..03FF
+ 'Cyrillic', # 0400..04FF
+ 'Cyrillic Supplement', # 0500..052F
+ 'Armenian', # 0530..058F
+ 'Hebrew', # 0590..05FF
+ 'Arabic', # 0600..06FF
+ 'Syriac', # 0700..074F
+ 'Arabic Supplement', # 0750..077F
+ 'Thaana', # 0780..07BF
+ 'NKo', # 07C0..07FF
+ 'Samaritan', # 0800..083F
+ 'Mandaic', # 0840..085F
+ 'Syriac Supplement', # 0860..086F
+ 'Arabic Extended-B', # 0870..089F
+ 'Arabic Extended-A', # 08A0..08FF
+ 'Devanagari', # 0900..097F
+ 'Bengali', # 0980..09FF
+ 'Gurmukhi', # 0A00..0A7F
+ 'Gujarati', # 0A80..0AFF
+ 'Oriya', # 0B00..0B7F
+ 'Tamil', # 0B80..0BFF
+ 'Telugu', # 0C00..0C7F
+ 'Kannada', # 0C80..0CFF
+ 'Malayalam', # 0D00..0D7F
+ 'Sinhala', # 0D80..0DFF
+ 'Thai', # 0E00..0E7F
+ 'Lao', # 0E80..0EFF
+ 'Tibetan', # 0F00..0FFF
+ 'Myanmar', # 1000..109F
+ 'Georgian', # 10A0..10FF
+ 'Hangul Jamo', # 1100..11FF
+ 'Ethiopic', # 1200..137F
+ 'Ethiopic Supplement', # 1380..139F
+ 'Cherokee', # 13A0..13FF
+ 'Unified Canadian Aboriginal Syllabics', # 1400..167F
+ 'Ogham', # 1680..169F
+ 'Runic', # 16A0..16FF
+ 'Tagalog', # 1700..171F
+ 'Hanunoo', # 1720..173F
+ 'Buhid', # 1740..175F
+ 'Tagbanwa', # 1760..177F
+ 'Khmer', # 1780..17FF
+ 'Mongolian', # 1800..18AF
+ 'Unified Canadian Aboriginal Syllabics Extended', # 18B0..18FF
+ 'Limbu', # 1900..194F
+ 'Tai Le', # 1950..197F
+ 'New Tai Lue', # 1980..19DF
+ 'Khmer Symbols', # 19E0..19FF
+ 'Buginese', # 1A00..1A1F
+ 'Tai Tham', # 1A20..1AAF
+ 'Combining Diacritical Marks Extended', # 1AB0..1AFF
+ 'Balinese', # 1B00..1B7F
+ 'Sundanese', # 1B80..1BBF
+ 'Batak', # 1BC0..1BFF
+ 'Lepcha', # 1C00..1C4F
+ 'Ol Chiki', # 1C50..1C7F
+ 'Cyrillic Extended-C', # 1C80..1C8F
+ 'Georgian Extended', # 1C90..1CBF
+ 'Sundanese Supplement', # 1CC0..1CCF
+ 'Vedic Extensions', # 1CD0..1CFF
+ 'Phonetic Extensions', # 1D00..1D7F
+ 'Phonetic Extensions Supplement', # 1D80..1DBF
+ 'Combining Diacritical Marks Supplement', # 1DC0..1DFF
+ 'Latin Extended Additional', # 1E00..1EFF
+ 'Greek Extended', # 1F00..1FFF
+ 'General Punctuation', # 2000..206F
+ 'Superscripts and Subscripts', # 2070..209F
+ 'Currency Symbols', # 20A0..20CF
+ 'Combining Diacritical Marks for Symbols', # 20D0..20FF
+ 'Letterlike Symbols', # 2100..214F
+ 'Number Forms', # 2150..218F
+ 'Arrows', # 2190..21FF
+ 'Mathematical Operators', # 2200..22FF
+ 'Miscellaneous Technical', # 2300..23FF
+ 'Control Pictures', # 2400..243F
+ 'Optical Character Recognition', # 2440..245F
+ 'Enclosed Alphanumerics', # 2460..24FF
+ 'Box Drawing', # 2500..257F
+ 'Block Elements', # 2580..259F
+ 'Geometric Shapes', # 25A0..25FF
+ 'Miscellaneous Symbols', # 2600..26FF
+ 'Dingbats', # 2700..27BF
+ 'Miscellaneous Mathematical Symbols-A', # 27C0..27EF
+ 'Supplemental Arrows-A', # 27F0..27FF
+ 'Braille Patterns', # 2800..28FF
+ 'Supplemental Arrows-B', # 2900..297F
+ 'Miscellaneous Mathematical Symbols-B', # 2980..29FF
+ 'Supplemental Mathematical Operators', # 2A00..2AFF
+ 'Miscellaneous Symbols and Arrows', # 2B00..2BFF
+ 'Glagolitic', # 2C00..2C5F
+ 'Latin Extended-C', # 2C60..2C7F
+ 'Coptic', # 2C80..2CFF
+ 'Georgian Supplement', # 2D00..2D2F
+ 'Tifinagh', # 2D30..2D7F
+ 'Ethiopic Extended', # 2D80..2DDF
+ 'Cyrillic Extended-A', # 2DE0..2DFF
+ 'Supplemental Punctuation', # 2E00..2E7F
+ 'CJK Radicals Supplement', # 2E80..2EFF
+ 'Kangxi Radicals', # 2F00..2FDF
+ 'No_Block', # 2FE0..2FEF
+ 'Ideographic Description Characters', # 2FF0..2FFF
+ 'CJK Symbols and Punctuation', # 3000..303F
+ 'Hiragana', # 3040..309F
+ 'Katakana', # 30A0..30FF
+ 'Bopomofo', # 3100..312F
+ 'Hangul Compatibility Jamo', # 3130..318F
+ 'Kanbun', # 3190..319F
+ 'Bopomofo Extended', # 31A0..31BF
+ 'CJK Strokes', # 31C0..31EF
+ 'Katakana Phonetic Extensions', # 31F0..31FF
+ 'Enclosed CJK Letters and Months', # 3200..32FF
+ 'CJK Compatibility', # 3300..33FF
+ 'CJK Unified Ideographs Extension A', # 3400..4DBF
+ 'Yijing Hexagram Symbols', # 4DC0..4DFF
+ 'CJK Unified Ideographs', # 4E00..9FFF
+ 'Yi Syllables', # A000..A48F
+ 'Yi Radicals', # A490..A4CF
+ 'Lisu', # A4D0..A4FF
+ 'Vai', # A500..A63F
+ 'Cyrillic Extended-B', # A640..A69F
+ 'Bamum', # A6A0..A6FF
+ 'Modifier Tone Letters', # A700..A71F
+ 'Latin Extended-D', # A720..A7FF
+ 'Syloti Nagri', # A800..A82F
+ 'Common Indic Number Forms', # A830..A83F
+ 'Phags-pa', # A840..A87F
+ 'Saurashtra', # A880..A8DF
+ 'Devanagari Extended', # A8E0..A8FF
+ 'Kayah Li', # A900..A92F
+ 'Rejang', # A930..A95F
+ 'Hangul Jamo Extended-A', # A960..A97F
+ 'Javanese', # A980..A9DF
+ 'Myanmar Extended-B', # A9E0..A9FF
+ 'Cham', # AA00..AA5F
+ 'Myanmar Extended-A', # AA60..AA7F
+ 'Tai Viet', # AA80..AADF
+ 'Meetei Mayek Extensions', # AAE0..AAFF
+ 'Ethiopic Extended-A', # AB00..AB2F
+ 'Latin Extended-E', # AB30..AB6F
+ 'Cherokee Supplement', # AB70..ABBF
+ 'Meetei Mayek', # ABC0..ABFF
+ 'Hangul Syllables', # AC00..D7AF
+ 'Hangul Jamo Extended-B', # D7B0..D7FF
+ 'High Surrogates', # D800..DB7F
+ 'High Private Use Surrogates', # DB80..DBFF
+ 'Low Surrogates', # DC00..DFFF
+ 'Private Use Area', # E000..F8FF
+ 'CJK Compatibility Ideographs', # F900..FAFF
+ 'Alphabetic Presentation Forms', # FB00..FB4F
+ 'Arabic Presentation Forms-A', # FB50..FDFF
+ 'Variation Selectors', # FE00..FE0F
+ 'Vertical Forms', # FE10..FE1F
+ 'Combining Half Marks', # FE20..FE2F
+ 'CJK Compatibility Forms', # FE30..FE4F
+ 'Small Form Variants', # FE50..FE6F
+ 'Arabic Presentation Forms-B', # FE70..FEFF
+ 'Halfwidth and Fullwidth Forms', # FF00..FFEF
+ 'Specials', # FFF0..FFFF
+ 'Linear B Syllabary', # 10000..1007F
+ 'Linear B Ideograms', # 10080..100FF
+ 'Aegean Numbers', # 10100..1013F
+ 'Ancient Greek Numbers', # 10140..1018F
+ 'Ancient Symbols', # 10190..101CF
+ 'Phaistos Disc', # 101D0..101FF
+ 'No_Block', # 10200..1027F
+ 'Lycian', # 10280..1029F
+ 'Carian', # 102A0..102DF
+ 'Coptic Epact Numbers', # 102E0..102FF
+ 'Old Italic', # 10300..1032F
+ 'Gothic', # 10330..1034F
+ 'Old Permic', # 10350..1037F
+ 'Ugaritic', # 10380..1039F
+ 'Old Persian', # 103A0..103DF
+ 'No_Block', # 103E0..103FF
+ 'Deseret', # 10400..1044F
+ 'Shavian', # 10450..1047F
+ 'Osmanya', # 10480..104AF
+ 'Osage', # 104B0..104FF
+ 'Elbasan', # 10500..1052F
+ 'Caucasian Albanian', # 10530..1056F
+ 'Vithkuqi', # 10570..105BF
+ 'No_Block', # 105C0..105FF
+ 'Linear A', # 10600..1077F
+ 'Latin Extended-F', # 10780..107BF
+ 'No_Block', # 107C0..107FF
+ 'Cypriot Syllabary', # 10800..1083F
+ 'Imperial Aramaic', # 10840..1085F
+ 'Palmyrene', # 10860..1087F
+ 'Nabataean', # 10880..108AF
+ 'No_Block', # 108B0..108DF
+ 'Hatran', # 108E0..108FF
+ 'Phoenician', # 10900..1091F
+ 'Lydian', # 10920..1093F
+ 'No_Block', # 10940..1097F
+ 'Meroitic Hieroglyphs', # 10980..1099F
+ 'Meroitic Cursive', # 109A0..109FF
+ 'Kharoshthi', # 10A00..10A5F
+ 'Old South Arabian', # 10A60..10A7F
+ 'Old North Arabian', # 10A80..10A9F
+ 'No_Block', # 10AA0..10ABF
+ 'Manichaean', # 10AC0..10AFF
+ 'Avestan', # 10B00..10B3F
+ 'Inscriptional Parthian', # 10B40..10B5F
+ 'Inscriptional Pahlavi', # 10B60..10B7F
+ 'Psalter Pahlavi', # 10B80..10BAF
+ 'No_Block', # 10BB0..10BFF
+ 'Old Turkic', # 10C00..10C4F
+ 'No_Block', # 10C50..10C7F
+ 'Old Hungarian', # 10C80..10CFF
+ 'Hanifi Rohingya', # 10D00..10D3F
+ 'No_Block', # 10D40..10E5F
+ 'Rumi Numeral Symbols', # 10E60..10E7F
+ 'Yezidi', # 10E80..10EBF
+ 'No_Block', # 10EC0..10EFF
+ 'Old Sogdian', # 10F00..10F2F
+ 'Sogdian', # 10F30..10F6F
+ 'Old Uyghur', # 10F70..10FAF
+ 'Chorasmian', # 10FB0..10FDF
+ 'Elymaic', # 10FE0..10FFF
+ 'Brahmi', # 11000..1107F
+ 'Kaithi', # 11080..110CF
+ 'Sora Sompeng', # 110D0..110FF
+ 'Chakma', # 11100..1114F
+ 'Mahajani', # 11150..1117F
+ 'Sharada', # 11180..111DF
+ 'Sinhala Archaic Numbers', # 111E0..111FF
+ 'Khojki', # 11200..1124F
+ 'No_Block', # 11250..1127F
+ 'Multani', # 11280..112AF
+ 'Khudawadi', # 112B0..112FF
+ 'Grantha', # 11300..1137F
+ 'No_Block', # 11380..113FF
+ 'Newa', # 11400..1147F
+ 'Tirhuta', # 11480..114DF
+ 'No_Block', # 114E0..1157F
+ 'Siddham', # 11580..115FF
+ 'Modi', # 11600..1165F
+ 'Mongolian Supplement', # 11660..1167F
+ 'Takri', # 11680..116CF
+ 'No_Block', # 116D0..116FF
+ 'Ahom', # 11700..1174F
+ 'No_Block', # 11750..117FF
+ 'Dogra', # 11800..1184F
+ 'No_Block', # 11850..1189F
+ 'Warang Citi', # 118A0..118FF
+ 'Dives Akuru', # 11900..1195F
+ 'No_Block', # 11960..1199F
+ 'Nandinagari', # 119A0..119FF
+ 'Zanabazar Square', # 11A00..11A4F
+ 'Soyombo', # 11A50..11AAF
+ 'Unified Canadian Aboriginal Syllabics Extended-A', # 11AB0..11ABF
+ 'Pau Cin Hau', # 11AC0..11AFF
+ 'No_Block', # 11B00..11BFF
+ 'Bhaiksuki', # 11C00..11C6F
+ 'Marchen', # 11C70..11CBF
+ 'No_Block', # 11CC0..11CFF
+ 'Masaram Gondi', # 11D00..11D5F
+ 'Gunjala Gondi', # 11D60..11DAF
+ 'No_Block', # 11DB0..11EDF
+ 'Makasar', # 11EE0..11EFF
+ 'No_Block', # 11F00..11FAF
+ 'Lisu Supplement', # 11FB0..11FBF
+ 'Tamil Supplement', # 11FC0..11FFF
+ 'Cuneiform', # 12000..123FF
+ 'Cuneiform Numbers and Punctuation', # 12400..1247F
+ 'Early Dynastic Cuneiform', # 12480..1254F
+ 'No_Block', # 12550..12F8F
+ 'Cypro-Minoan', # 12F90..12FFF
+ 'Egyptian Hieroglyphs', # 13000..1342F
+ 'Egyptian Hieroglyph Format Controls', # 13430..1343F
+ 'No_Block', # 13440..143FF
+ 'Anatolian Hieroglyphs', # 14400..1467F
+ 'No_Block', # 14680..167FF
+ 'Bamum Supplement', # 16800..16A3F
+ 'Mro', # 16A40..16A6F
+ 'Tangsa', # 16A70..16ACF
+ 'Bassa Vah', # 16AD0..16AFF
+ 'Pahawh Hmong', # 16B00..16B8F
+ 'No_Block', # 16B90..16E3F
+ 'Medefaidrin', # 16E40..16E9F
+ 'No_Block', # 16EA0..16EFF
+ 'Miao', # 16F00..16F9F
+ 'No_Block', # 16FA0..16FDF
+ 'Ideographic Symbols and Punctuation', # 16FE0..16FFF
+ 'Tangut', # 17000..187FF
+ 'Tangut Components', # 18800..18AFF
+ 'Khitan Small Script', # 18B00..18CFF
+ 'Tangut Supplement', # 18D00..18D7F
+ 'No_Block', # 18D80..1AFEF
+ 'Kana Extended-B', # 1AFF0..1AFFF
+ 'Kana Supplement', # 1B000..1B0FF
+ 'Kana Extended-A', # 1B100..1B12F
+ 'Small Kana Extension', # 1B130..1B16F
+ 'Nushu', # 1B170..1B2FF
+ 'No_Block', # 1B300..1BBFF
+ 'Duployan', # 1BC00..1BC9F
+ 'Shorthand Format Controls', # 1BCA0..1BCAF
+ 'No_Block', # 1BCB0..1CEFF
+ 'Znamenny Musical Notation', # 1CF00..1CFCF
+ 'No_Block', # 1CFD0..1CFFF
+ 'Byzantine Musical Symbols', # 1D000..1D0FF
+ 'Musical Symbols', # 1D100..1D1FF
+ 'Ancient Greek Musical Notation', # 1D200..1D24F
+ 'No_Block', # 1D250..1D2DF
+ 'Mayan Numerals', # 1D2E0..1D2FF
+ 'Tai Xuan Jing Symbols', # 1D300..1D35F
+ 'Counting Rod Numerals', # 1D360..1D37F
+ 'No_Block', # 1D380..1D3FF
+ 'Mathematical Alphanumeric Symbols', # 1D400..1D7FF
+ 'Sutton SignWriting', # 1D800..1DAAF
+ 'No_Block', # 1DAB0..1DEFF
+ 'Latin Extended-G', # 1DF00..1DFFF
+ 'Glagolitic Supplement', # 1E000..1E02F
+ 'No_Block', # 1E030..1E0FF
+ 'Nyiakeng Puachue Hmong', # 1E100..1E14F
+ 'No_Block', # 1E150..1E28F
+ 'Toto', # 1E290..1E2BF
+ 'Wancho', # 1E2C0..1E2FF
+ 'No_Block', # 1E300..1E7DF
+ 'Ethiopic Extended-B', # 1E7E0..1E7FF
+ 'Mende Kikakui', # 1E800..1E8DF
+ 'No_Block', # 1E8E0..1E8FF
+ 'Adlam', # 1E900..1E95F
+ 'No_Block', # 1E960..1EC6F
+ 'Indic Siyaq Numbers', # 1EC70..1ECBF
+ 'No_Block', # 1ECC0..1ECFF
+ 'Ottoman Siyaq Numbers', # 1ED00..1ED4F
+ 'No_Block', # 1ED50..1EDFF
+ 'Arabic Mathematical Alphabetic Symbols', # 1EE00..1EEFF
+ 'No_Block', # 1EF00..1EFFF
+ 'Mahjong Tiles', # 1F000..1F02F
+ 'Domino Tiles', # 1F030..1F09F
+ 'Playing Cards', # 1F0A0..1F0FF
+ 'Enclosed Alphanumeric Supplement', # 1F100..1F1FF
+ 'Enclosed Ideographic Supplement', # 1F200..1F2FF
+ 'Miscellaneous Symbols and Pictographs', # 1F300..1F5FF
+ 'Emoticons', # 1F600..1F64F
+ 'Ornamental Dingbats', # 1F650..1F67F
+ 'Transport and Map Symbols', # 1F680..1F6FF
+ 'Alchemical Symbols', # 1F700..1F77F
+ 'Geometric Shapes Extended', # 1F780..1F7FF
+ 'Supplemental Arrows-C', # 1F800..1F8FF
+ 'Supplemental Symbols and Pictographs', # 1F900..1F9FF
+ 'Chess Symbols', # 1FA00..1FA6F
+ 'Symbols and Pictographs Extended-A', # 1FA70..1FAFF
+ 'Symbols for Legacy Computing', # 1FB00..1FBFF
+ 'No_Block', # 1FC00..1FFFF
+ 'CJK Unified Ideographs Extension B', # 20000..2A6DF
+ 'No_Block', # 2A6E0..2A6FF
+ 'CJK Unified Ideographs Extension C', # 2A700..2B73F
+ 'CJK Unified Ideographs Extension D', # 2B740..2B81F
+ 'CJK Unified Ideographs Extension E', # 2B820..2CEAF
+ 'CJK Unified Ideographs Extension F', # 2CEB0..2EBEF
+ 'No_Block', # 2EBF0..2F7FF
+ 'CJK Compatibility Ideographs Supplement', # 2F800..2FA1F
+ 'No_Block', # 2FA20..2FFFF
+ 'CJK Unified Ideographs Extension G', # 30000..3134F
+ 'No_Block', # 31350..DFFFF
+ 'Tags', # E0000..E007F
+ 'No_Block', # E0080..E00FF
+ 'Variation Selectors Supplement', # E0100..E01EF
+ 'No_Block', # E01F0..EFFFF
+ 'Supplementary Private Use Area-A', # F0000..FFFFF
+ 'Supplementary Private Use Area-B', # 100000..10FFFF
]