summaryrefslogtreecommitdiff
path: root/doc/UNICODE_PROPERTIES
diff options
context:
space:
mode:
Diffstat (limited to 'doc/UNICODE_PROPERTIES')
-rw-r--r--doc/UNICODE_PROPERTIES1345
1 files changed, 681 insertions, 664 deletions
diff --git a/doc/UNICODE_PROPERTIES b/doc/UNICODE_PROPERTIES
index 1f961eb..1148b4d 100644
--- a/doc/UNICODE_PROPERTIES
+++ b/doc/UNICODE_PROPERTIES
@@ -1,4 +1,4 @@
-Unicode Properties (from Unicode Version: 11.0.0)
+Unicode Properties (from Unicode Version: 12.0.0)
15: ASCII_Hex_Digit
16: Adlam
@@ -56,203 +56,207 @@ Unicode Properties (from Unicode Version: 11.0.0)
68: Duployan
69: Egyptian_Hieroglyphs
70: Elbasan
- 71: Emoji
- 72: Emoji_Component
- 73: Emoji_Modifier
- 74: Emoji_Modifier_Base
- 75: Emoji_Presentation
- 76: Ethiopic
- 77: Extended_Pictographic
- 78: Extender
- 79: Georgian
- 80: Glagolitic
- 81: Gothic
- 82: Grantha
- 83: Grapheme_Base
- 84: Grapheme_Extend
- 85: Grapheme_Link
- 86: Greek
- 87: Gujarati
- 88: Gunjala_Gondi
- 89: Gurmukhi
- 90: Han
- 91: Hangul
- 92: Hanifi_Rohingya
- 93: Hanunoo
- 94: Hatran
- 95: Hebrew
- 96: Hex_Digit
- 97: Hiragana
- 98: Hyphen
- 99: IDS_Binary_Operator
-100: IDS_Trinary_Operator
-101: ID_Continue
-102: ID_Start
-103: Ideographic
-104: Imperial_Aramaic
-105: Inherited
-106: Inscriptional_Pahlavi
-107: Inscriptional_Parthian
-108: Javanese
-109: Join_Control
-110: Kaithi
-111: Kannada
-112: Katakana
-113: Kayah_Li
-114: Kharoshthi
-115: Khmer
-116: Khojki
-117: Khudawadi
-118: L
-119: LC
-120: Lao
-121: Latin
-122: Lepcha
-123: Limbu
-124: Linear_A
-125: Linear_B
-126: Lisu
-127: Ll
-128: Lm
-129: Lo
-130: Logical_Order_Exception
-131: Lowercase
-132: Lt
-133: Lu
-134: Lycian
-135: Lydian
-136: M
-137: Mahajani
-138: Makasar
-139: Malayalam
-140: Mandaic
-141: Manichaean
-142: Marchen
-143: Masaram_Gondi
-144: Math
-145: Mc
-146: Me
-147: Medefaidrin
-148: Meetei_Mayek
-149: Mende_Kikakui
-150: Meroitic_Cursive
-151: Meroitic_Hieroglyphs
-152: Miao
-153: Mn
-154: Modi
-155: Mongolian
-156: Mro
-157: Multani
-158: Myanmar
-159: N
-160: Nabataean
-161: Nd
-162: New_Tai_Lue
-163: Newa
-164: Nko
-165: Nl
-166: No
-167: Noncharacter_Code_Point
-168: Nushu
-169: Ogham
-170: Ol_Chiki
-171: Old_Hungarian
-172: Old_Italic
-173: Old_North_Arabian
-174: Old_Permic
-175: Old_Persian
-176: Old_Sogdian
-177: Old_South_Arabian
-178: Old_Turkic
-179: Oriya
-180: Osage
-181: Osmanya
-182: Other_Alphabetic
-183: Other_Default_Ignorable_Code_Point
-184: Other_Grapheme_Extend
-185: Other_ID_Continue
-186: Other_ID_Start
-187: Other_Lowercase
-188: Other_Math
-189: Other_Uppercase
-190: P
-191: Pahawh_Hmong
-192: Palmyrene
-193: Pattern_Syntax
-194: Pattern_White_Space
-195: Pau_Cin_Hau
-196: Pc
-197: Pd
-198: Pe
-199: Pf
-200: Phags_Pa
-201: Phoenician
-202: Pi
-203: Po
-204: Prepended_Concatenation_Mark
-205: Ps
-206: Psalter_Pahlavi
-207: Quotation_Mark
-208: Radical
-209: Regional_Indicator
-210: Rejang
-211: Runic
-212: S
-213: Samaritan
-214: Saurashtra
-215: Sc
-216: Sentence_Terminal
-217: Sharada
-218: Shavian
-219: Siddham
-220: SignWriting
-221: Sinhala
-222: Sk
-223: Sm
-224: So
-225: Soft_Dotted
-226: Sogdian
-227: Sora_Sompeng
-228: Soyombo
-229: Sundanese
-230: Syloti_Nagri
-231: Syriac
-232: Tagalog
-233: Tagbanwa
-234: Tai_Le
-235: Tai_Tham
-236: Tai_Viet
-237: Takri
-238: Tamil
-239: Tangut
-240: Telugu
-241: Terminal_Punctuation
-242: Thaana
-243: Thai
-244: Tibetan
-245: Tifinagh
-246: Tirhuta
-247: Ugaritic
-248: Unified_Ideograph
-249: Unknown
-250: Uppercase
-251: Vai
-252: Variation_Selector
-253: Warang_Citi
-254: White_Space
-255: XID_Continue
-256: XID_Start
-257: Yi
-258: Z
-259: Zanabazar_Square
-260: Zl
-261: Zp
-262: Zs
+ 71: Elymaic
+ 72: Emoji
+ 73: Emoji_Component
+ 74: Emoji_Modifier
+ 75: Emoji_Modifier_Base
+ 76: Emoji_Presentation
+ 77: Ethiopic
+ 78: Extended_Pictographic
+ 79: Extender
+ 80: Georgian
+ 81: Glagolitic
+ 82: Gothic
+ 83: Grantha
+ 84: Grapheme_Base
+ 85: Grapheme_Extend
+ 86: Grapheme_Link
+ 87: Greek
+ 88: Gujarati
+ 89: Gunjala_Gondi
+ 90: Gurmukhi
+ 91: Han
+ 92: Hangul
+ 93: Hanifi_Rohingya
+ 94: Hanunoo
+ 95: Hatran
+ 96: Hebrew
+ 97: Hex_Digit
+ 98: Hiragana
+ 99: Hyphen
+100: IDS_Binary_Operator
+101: IDS_Trinary_Operator
+102: ID_Continue
+103: ID_Start
+104: Ideographic
+105: Imperial_Aramaic
+106: Inherited
+107: Inscriptional_Pahlavi
+108: Inscriptional_Parthian
+109: Javanese
+110: Join_Control
+111: Kaithi
+112: Kannada
+113: Katakana
+114: Kayah_Li
+115: Kharoshthi
+116: Khmer
+117: Khojki
+118: Khudawadi
+119: L
+120: LC
+121: Lao
+122: Latin
+123: Lepcha
+124: Limbu
+125: Linear_A
+126: Linear_B
+127: Lisu
+128: Ll
+129: Lm
+130: Lo
+131: Logical_Order_Exception
+132: Lowercase
+133: Lt
+134: Lu
+135: Lycian
+136: Lydian
+137: M
+138: Mahajani
+139: Makasar
+140: Malayalam
+141: Mandaic
+142: Manichaean
+143: Marchen
+144: Masaram_Gondi
+145: Math
+146: Mc
+147: Me
+148: Medefaidrin
+149: Meetei_Mayek
+150: Mende_Kikakui
+151: Meroitic_Cursive
+152: Meroitic_Hieroglyphs
+153: Miao
+154: Mn
+155: Modi
+156: Mongolian
+157: Mro
+158: Multani
+159: Myanmar
+160: N
+161: Nabataean
+162: Nandinagari
+163: Nd
+164: New_Tai_Lue
+165: Newa
+166: Nko
+167: Nl
+168: No
+169: Noncharacter_Code_Point
+170: Nushu
+171: Nyiakeng_Puachue_Hmong
+172: Ogham
+173: Ol_Chiki
+174: Old_Hungarian
+175: Old_Italic
+176: Old_North_Arabian
+177: Old_Permic
+178: Old_Persian
+179: Old_Sogdian
+180: Old_South_Arabian
+181: Old_Turkic
+182: Oriya
+183: Osage
+184: Osmanya
+185: Other_Alphabetic
+186: Other_Default_Ignorable_Code_Point
+187: Other_Grapheme_Extend
+188: Other_ID_Continue
+189: Other_ID_Start
+190: Other_Lowercase
+191: Other_Math
+192: Other_Uppercase
+193: P
+194: Pahawh_Hmong
+195: Palmyrene
+196: Pattern_Syntax
+197: Pattern_White_Space
+198: Pau_Cin_Hau
+199: Pc
+200: Pd
+201: Pe
+202: Pf
+203: Phags_Pa
+204: Phoenician
+205: Pi
+206: Po
+207: Prepended_Concatenation_Mark
+208: Ps
+209: Psalter_Pahlavi
+210: Quotation_Mark
+211: Radical
+212: Regional_Indicator
+213: Rejang
+214: Runic
+215: S
+216: Samaritan
+217: Saurashtra
+218: Sc
+219: Sentence_Terminal
+220: Sharada
+221: Shavian
+222: Siddham
+223: SignWriting
+224: Sinhala
+225: Sk
+226: Sm
+227: So
+228: Soft_Dotted
+229: Sogdian
+230: Sora_Sompeng
+231: Soyombo
+232: Sundanese
+233: Syloti_Nagri
+234: Syriac
+235: Tagalog
+236: Tagbanwa
+237: Tai_Le
+238: Tai_Tham
+239: Tai_Viet
+240: Takri
+241: Tamil
+242: Tangut
+243: Telugu
+244: Terminal_Punctuation
+245: Thaana
+246: Thai
+247: Tibetan
+248: Tifinagh
+249: Tirhuta
+250: Ugaritic
+251: Unified_Ideograph
+252: Unknown
+253: Uppercase
+254: Vai
+255: Variation_Selector
+256: Wancho
+257: Warang_Citi
+258: White_Space
+259: XID_Continue
+260: XID_Start
+261: Yi
+262: Z
+263: Zanabazar_Square
+264: Zl
+265: Zp
+266: Zs
16: Adlm
42: Aghb
15: AHex
21: Arab
-104: Armi
+105: Armi
22: Armn
24: Avst
25: Bali
@@ -270,24 +274,24 @@ Unicode Properties (from Unicode Version: 11.0.0)
45: Cakm
38: Cans
39: Cari
-119: Cased_Letter
+120: Cased_Letter
52: Cher
40: CI
-198: Close_Punctuation
-136: Combining_Mark
-196: Connector_Punctuation
+201: Close_Punctuation
+137: Combining_Mark
+199: Connector_Punctuation
43: Control
56: Copt
59: Cprt
-215: Currency_Symbol
+218: Currency_Symbol
47: CWCF
48: CWCM
49: CWL
50: CWT
51: CWU
60: Cyrl
-197: Dash_Punctuation
-161: Decimal_Number
+200: Dash_Punctuation
+163: Decimal_Number
63: Dep
65: Deva
62: DI
@@ -297,475 +301,488 @@ Unicode Properties (from Unicode Version: 11.0.0)
68: Dupl
69: Egyp
70: Elba
-146: Enclosing_Mark
- 76: Ethi
- 78: Ext
-199: Final_Punctuation
+ 71: Elym
+147: Enclosing_Mark
+ 77: Ethi
+ 79: Ext
+202: Final_Punctuation
44: Format
- 79: Geor
- 80: Glag
- 88: Gong
-143: Gonm
- 81: Goth
- 82: Gran
- 83: Gr_Base
- 86: Grek
- 84: Gr_Ext
- 85: Gr_Link
- 87: Gujr
- 89: Guru
- 91: Hang
- 90: Hani
- 93: Hano
- 94: Hatr
- 95: Hebr
- 96: Hex
- 97: Hira
+ 80: Geor
+ 81: Glag
+ 89: Gong
+144: Gonm
+ 82: Goth
+ 83: Gran
+ 84: Gr_Base
+ 87: Grek
+ 85: Gr_Ext
+ 86: Gr_Link
+ 88: Gujr
+ 90: Guru
+ 92: Hang
+ 91: Hani
+ 94: Hano
+ 95: Hatr
+ 96: Hebr
+ 97: Hex
+ 98: Hira
19: Hluw
-191: Hmng
-171: Hung
-101: IDC
-103: Ideo
-102: IDS
- 99: IDSB
-100: IDST
-202: Initial_Punctuation
-172: Ital
-108: Java
-109: Join_C
-113: Kali
-112: Kana
-114: Khar
-115: Khmr
-116: Khoj
-111: Knda
-110: Kthi
-235: Lana
-120: Laoo
-121: Latn
-122: Lepc
-118: Letter
-165: Letter_Number
-123: Limb
-124: Lina
-125: Linb
-260: Line_Separator
-130: LOE
-127: Lowercase_Letter
-134: Lyci
-135: Lydi
-137: Mahj
-138: Maka
-140: Mand
-141: Mani
-142: Marc
-136: Mark
-223: Math_Symbol
-147: Medf
-149: Mend
-150: Merc
-151: Mero
-139: Mlym
-128: Modifier_Letter
-222: Modifier_Symbol
-155: Mong
-156: Mroo
-148: Mtei
-157: Mult
-158: Mymr
-173: Narb
-160: Nbat
-167: NChar
-164: Nkoo
-153: Nonspacing_Mark
-168: Nshu
-159: Number
-182: OAlpha
-183: ODI
-169: Ogam
-184: OGr_Ext
-185: OIDC
-186: OIDS
-170: Olck
-187: OLower
-188: OMath
-205: Open_Punctuation
-178: Orkh
-179: Orya
-180: Osge
-181: Osma
+194: Hmng
+171: Hmnp
+174: Hung
+102: IDC
+104: Ideo
+103: IDS
+100: IDSB
+101: IDST
+205: Initial_Punctuation
+175: Ital
+109: Java
+110: Join_C
+114: Kali
+113: Kana
+115: Khar
+116: Khmr
+117: Khoj
+112: Knda
+111: Kthi
+238: Lana
+121: Laoo
+122: Latn
+123: Lepc
+119: Letter
+167: Letter_Number
+124: Limb
+125: Lina
+126: Linb
+264: Line_Separator
+131: LOE
+128: Lowercase_Letter
+135: Lyci
+136: Lydi
+138: Mahj
+139: Maka
+141: Mand
+142: Mani
+143: Marc
+137: Mark
+226: Math_Symbol
+148: Medf
+150: Mend
+151: Merc
+152: Mero
+140: Mlym
+129: Modifier_Letter
+225: Modifier_Symbol
+156: Mong
+157: Mroo
+149: Mtei
+158: Mult
+159: Mymr
+162: Nand
+176: Narb
+161: Nbat
+169: NChar
+166: Nkoo
+154: Nonspacing_Mark
+170: Nshu
+160: Number
+185: OAlpha
+186: ODI
+172: Ogam
+187: OGr_Ext
+188: OIDC
+189: OIDS
+173: Olck
+190: OLower
+191: OMath
+208: Open_Punctuation
+181: Orkh
+182: Orya
+183: Osge
+184: Osma
37: Other
-129: Other_Letter
-166: Other_Number
-203: Other_Punctuation
-224: Other_Symbol
-189: OUpper
-192: Palm
-261: Paragraph_Separator
-193: Pat_Syn
-194: Pat_WS
-195: Pauc
-204: PCM
-174: Perm
-200: Phag
-106: Phli
-206: Phlp
-201: Phnx
-152: Plrd
+130: Other_Letter
+168: Other_Number
+206: Other_Punctuation
+227: Other_Symbol
+192: OUpper
+195: Palm
+265: Paragraph_Separator
+196: Pat_Syn
+197: Pat_WS
+198: Pauc
+207: PCM
+177: Perm
+203: Phag
+107: Phli
+209: Phlp
+204: Phnx
+153: Plrd
54: Private_Use
-107: Prti
-190: Punctuation
+108: Prti
+193: Punctuation
56: Qaac
-105: Qaai
-207: QMark
-209: RI
-210: Rjng
- 92: Rohg
-211: Runr
-213: Samr
-177: Sarb
-214: Saur
-225: SD
-258: Separator
-220: Sgnw
-218: Shaw
-217: Shrd
-219: Sidd
-117: Sind
-221: Sinh
-226: Sogd
-176: Sogo
-227: Sora
-228: Soyo
-262: Space_Separator
-145: Spacing_Mark
-216: STerm
-229: Sund
+106: Qaai
+210: QMark
+212: RI
+213: Rjng
+ 93: Rohg
+214: Runr
+216: Samr
+180: Sarb
+217: Saur
+228: SD
+262: Separator
+223: Sgnw
+221: Shaw
+220: Shrd
+222: Sidd
+118: Sind
+224: Sinh
+229: Sogd
+179: Sogo
+230: Sora
+231: Soyo
+266: Space_Separator
+146: Spacing_Mark
+219: STerm
+232: Sund
57: Surrogate
-230: Sylo
-212: Symbol
-231: Syrc
-233: Tagb
-237: Takr
-234: Tale
-162: Talu
-238: Taml
-239: Tang
-236: Tavt
-240: Telu
-241: Term
-245: Tfng
-232: Tglg
-242: Thaa
-244: Tibt
-246: Tirh
-132: Titlecase_Letter
-247: Ugar
-248: UIdeo
+233: Sylo
+215: Symbol
+234: Syrc
+236: Tagb
+240: Takr
+237: Tale
+164: Talu
+241: Taml
+242: Tang
+239: Tavt
+243: Telu
+244: Term
+248: Tfng
+235: Tglg
+245: Thaa
+247: Tibt
+249: Tirh
+133: Titlecase_Letter
+250: Ugar
+251: UIdeo
53: Unassigned
-133: Uppercase_Letter
-251: Vaii
-252: VS
-253: Wara
-254: WSpace
-255: XIDC
-256: XIDS
-175: Xpeo
+134: Uppercase_Letter
+254: Vaii
+255: VS
+257: Wara
+256: Wcho
+258: WSpace
+259: XIDC
+260: XIDS
+178: Xpeo
58: Xsux
-257: Yiii
-259: Zanb
-105: Zinh
+261: Yiii
+263: Zanb
+106: Zinh
55: Zyyy
-249: Zzzz
-263: In_Basic_Latin
-264: In_Latin_1_Supplement
-265: In_Latin_Extended_A
-266: In_Latin_Extended_B
-267: In_IPA_Extensions
-268: In_Spacing_Modifier_Letters
-269: In_Combining_Diacritical_Marks
-270: In_Greek_and_Coptic
-271: In_Cyrillic
-272: In_Cyrillic_Supplement
-273: In_Armenian
-274: In_Hebrew
-275: In_Arabic
-276: In_Syriac
-277: In_Arabic_Supplement
-278: In_Thaana
-279: In_NKo
-280: In_Samaritan
-281: In_Mandaic
-282: In_Syriac_Supplement
-283: In_Arabic_Extended_A
-284: In_Devanagari
-285: In_Bengali
-286: In_Gurmukhi
-287: In_Gujarati
-288: In_Oriya
-289: In_Tamil
-290: In_Telugu
-291: In_Kannada
-292: In_Malayalam
-293: In_Sinhala
-294: In_Thai
-295: In_Lao
-296: In_Tibetan
-297: In_Myanmar
-298: In_Georgian
-299: In_Hangul_Jamo
-300: In_Ethiopic
-301: In_Ethiopic_Supplement
-302: In_Cherokee
-303: In_Unified_Canadian_Aboriginal_Syllabics
-304: In_Ogham
-305: In_Runic
-306: In_Tagalog
-307: In_Hanunoo
-308: In_Buhid
-309: In_Tagbanwa
-310: In_Khmer
-311: In_Mongolian
-312: In_Unified_Canadian_Aboriginal_Syllabics_Extended
-313: In_Limbu
-314: In_Tai_Le
-315: In_New_Tai_Lue
-316: In_Khmer_Symbols
-317: In_Buginese
-318: In_Tai_Tham
-319: In_Combining_Diacritical_Marks_Extended
-320: In_Balinese
-321: In_Sundanese
-322: In_Batak
-323: In_Lepcha
-324: In_Ol_Chiki
-325: In_Cyrillic_Extended_C
-326: In_Georgian_Extended
-327: In_Sundanese_Supplement
-328: In_Vedic_Extensions
-329: In_Phonetic_Extensions
-330: In_Phonetic_Extensions_Supplement
-331: In_Combining_Diacritical_Marks_Supplement
-332: In_Latin_Extended_Additional
-333: In_Greek_Extended
-334: In_General_Punctuation
-335: In_Superscripts_and_Subscripts
-336: In_Currency_Symbols
-337: In_Combining_Diacritical_Marks_for_Symbols
-338: In_Letterlike_Symbols
-339: In_Number_Forms
-340: In_Arrows
-341: In_Mathematical_Operators
-342: In_Miscellaneous_Technical
-343: In_Control_Pictures
-344: In_Optical_Character_Recognition
-345: In_Enclosed_Alphanumerics
-346: In_Box_Drawing
-347: In_Block_Elements
-348: In_Geometric_Shapes
-349: In_Miscellaneous_Symbols
-350: In_Dingbats
-351: In_Miscellaneous_Mathematical_Symbols_A
-352: In_Supplemental_Arrows_A
-353: In_Braille_Patterns
-354: In_Supplemental_Arrows_B
-355: In_Miscellaneous_Mathematical_Symbols_B
-356: In_Supplemental_Mathematical_Operators
-357: In_Miscellaneous_Symbols_and_Arrows
-358: In_Glagolitic
-359: In_Latin_Extended_C
-360: In_Coptic
-361: In_Georgian_Supplement
-362: In_Tifinagh
-363: In_Ethiopic_Extended
-364: In_Cyrillic_Extended_A
-365: In_Supplemental_Punctuation
-366: In_CJK_Radicals_Supplement
-367: In_Kangxi_Radicals
-368: In_Ideographic_Description_Characters
-369: In_CJK_Symbols_and_Punctuation
-370: In_Hiragana
-371: In_Katakana
-372: In_Bopomofo
-373: In_Hangul_Compatibility_Jamo
-374: In_Kanbun
-375: In_Bopomofo_Extended
-376: In_CJK_Strokes
-377: In_Katakana_Phonetic_Extensions
-378: In_Enclosed_CJK_Letters_and_Months
-379: In_CJK_Compatibility
-380: In_CJK_Unified_Ideographs_Extension_A
-381: In_Yijing_Hexagram_Symbols
-382: In_CJK_Unified_Ideographs
-383: In_Yi_Syllables
-384: In_Yi_Radicals
-385: In_Lisu
-386: In_Vai
-387: In_Cyrillic_Extended_B
-388: In_Bamum
-389: In_Modifier_Tone_Letters
-390: In_Latin_Extended_D
-391: In_Syloti_Nagri
-392: In_Common_Indic_Number_Forms
-393: In_Phags_pa
-394: In_Saurashtra
-395: In_Devanagari_Extended
-396: In_Kayah_Li
-397: In_Rejang
-398: In_Hangul_Jamo_Extended_A
-399: In_Javanese
-400: In_Myanmar_Extended_B
-401: In_Cham
-402: In_Myanmar_Extended_A
-403: In_Tai_Viet
-404: In_Meetei_Mayek_Extensions
-405: In_Ethiopic_Extended_A
-406: In_Latin_Extended_E
-407: In_Cherokee_Supplement
-408: In_Meetei_Mayek
-409: In_Hangul_Syllables
-410: In_Hangul_Jamo_Extended_B
-411: In_High_Surrogates
-412: In_High_Private_Use_Surrogates
-413: In_Low_Surrogates
-414: In_Private_Use_Area
-415: In_CJK_Compatibility_Ideographs
-416: In_Alphabetic_Presentation_Forms
-417: In_Arabic_Presentation_Forms_A
-418: In_Variation_Selectors
-419: In_Vertical_Forms
-420: In_Combining_Half_Marks
-421: In_CJK_Compatibility_Forms
-422: In_Small_Form_Variants
-423: In_Arabic_Presentation_Forms_B
-424: In_Halfwidth_and_Fullwidth_Forms
-425: In_Specials
-426: In_Linear_B_Syllabary
-427: In_Linear_B_Ideograms
-428: In_Aegean_Numbers
-429: In_Ancient_Greek_Numbers
-430: In_Ancient_Symbols
-431: In_Phaistos_Disc
-432: In_Lycian
-433: In_Carian
-434: In_Coptic_Epact_Numbers
-435: In_Old_Italic
-436: In_Gothic
-437: In_Old_Permic
-438: In_Ugaritic
-439: In_Old_Persian
-440: In_Deseret
-441: In_Shavian
-442: In_Osmanya
-443: In_Osage
-444: In_Elbasan
-445: In_Caucasian_Albanian
-446: In_Linear_A
-447: In_Cypriot_Syllabary
-448: In_Imperial_Aramaic
-449: In_Palmyrene
-450: In_Nabataean
-451: In_Hatran
-452: In_Phoenician
-453: In_Lydian
-454: In_Meroitic_Hieroglyphs
-455: In_Meroitic_Cursive
-456: In_Kharoshthi
-457: In_Old_South_Arabian
-458: In_Old_North_Arabian
-459: In_Manichaean
-460: In_Avestan
-461: In_Inscriptional_Parthian
-462: In_Inscriptional_Pahlavi
-463: In_Psalter_Pahlavi
-464: In_Old_Turkic
-465: In_Old_Hungarian
-466: In_Hanifi_Rohingya
-467: In_Rumi_Numeral_Symbols
-468: In_Old_Sogdian
-469: In_Sogdian
-470: In_Brahmi
-471: In_Kaithi
-472: In_Sora_Sompeng
-473: In_Chakma
-474: In_Mahajani
-475: In_Sharada
-476: In_Sinhala_Archaic_Numbers
-477: In_Khojki
-478: In_Multani
-479: In_Khudawadi
-480: In_Grantha
-481: In_Newa
-482: In_Tirhuta
-483: In_Siddham
-484: In_Modi
-485: In_Mongolian_Supplement
-486: In_Takri
-487: In_Ahom
-488: In_Dogra
-489: In_Warang_Citi
-490: In_Zanabazar_Square
-491: In_Soyombo
-492: In_Pau_Cin_Hau
-493: In_Bhaiksuki
-494: In_Marchen
-495: In_Masaram_Gondi
-496: In_Gunjala_Gondi
-497: In_Makasar
-498: In_Cuneiform
-499: In_Cuneiform_Numbers_and_Punctuation
-500: In_Early_Dynastic_Cuneiform
-501: In_Egyptian_Hieroglyphs
-502: In_Anatolian_Hieroglyphs
-503: In_Bamum_Supplement
-504: In_Mro
-505: In_Bassa_Vah
-506: In_Pahawh_Hmong
-507: In_Medefaidrin
-508: In_Miao
-509: In_Ideographic_Symbols_and_Punctuation
-510: In_Tangut
-511: In_Tangut_Components
-512: In_Kana_Supplement
-513: In_Kana_Extended_A
-514: In_Nushu
-515: In_Duployan
-516: In_Shorthand_Format_Controls
-517: In_Byzantine_Musical_Symbols
-518: In_Musical_Symbols
-519: In_Ancient_Greek_Musical_Notation
-520: In_Mayan_Numerals
-521: In_Tai_Xuan_Jing_Symbols
-522: In_Counting_Rod_Numerals
-523: In_Mathematical_Alphanumeric_Symbols
-524: In_Sutton_SignWriting
-525: In_Glagolitic_Supplement
-526: In_Mende_Kikakui
-527: In_Adlam
-528: In_Indic_Siyaq_Numbers
-529: In_Arabic_Mathematical_Alphabetic_Symbols
-530: In_Mahjong_Tiles
-531: In_Domino_Tiles
-532: In_Playing_Cards
-533: In_Enclosed_Alphanumeric_Supplement
-534: In_Enclosed_Ideographic_Supplement
-535: In_Miscellaneous_Symbols_and_Pictographs
-536: In_Emoticons
-537: In_Ornamental_Dingbats
-538: In_Transport_and_Map_Symbols
-539: In_Alchemical_Symbols
-540: In_Geometric_Shapes_Extended
-541: In_Supplemental_Arrows_C
-542: In_Supplemental_Symbols_and_Pictographs
-543: In_Chess_Symbols
-544: In_CJK_Unified_Ideographs_Extension_B
-545: In_CJK_Unified_Ideographs_Extension_C
-546: In_CJK_Unified_Ideographs_Extension_D
-547: In_CJK_Unified_Ideographs_Extension_E
-548: In_CJK_Unified_Ideographs_Extension_F
-549: In_CJK_Compatibility_Ideographs_Supplement
-550: In_Tags
-551: In_Variation_Selectors_Supplement
-552: In_Supplementary_Private_Use_Area_A
-553: In_Supplementary_Private_Use_Area_B
-554: In_No_Block
+252: Zzzz
+267: In_Basic_Latin
+268: In_Latin_1_Supplement
+269: In_Latin_Extended_A
+270: In_Latin_Extended_B
+271: In_IPA_Extensions
+272: In_Spacing_Modifier_Letters
+273: In_Combining_Diacritical_Marks
+274: In_Greek_and_Coptic
+275: In_Cyrillic
+276: In_Cyrillic_Supplement
+277: In_Armenian
+278: In_Hebrew
+279: In_Arabic
+280: In_Syriac
+281: In_Arabic_Supplement
+282: In_Thaana
+283: In_NKo
+284: In_Samaritan
+285: In_Mandaic
+286: In_Syriac_Supplement
+287: In_Arabic_Extended_A
+288: In_Devanagari
+289: In_Bengali
+290: In_Gurmukhi
+291: In_Gujarati
+292: In_Oriya
+293: In_Tamil
+294: In_Telugu
+295: In_Kannada
+296: In_Malayalam
+297: In_Sinhala
+298: In_Thai
+299: In_Lao
+300: In_Tibetan
+301: In_Myanmar
+302: In_Georgian
+303: In_Hangul_Jamo
+304: In_Ethiopic
+305: In_Ethiopic_Supplement
+306: In_Cherokee
+307: In_Unified_Canadian_Aboriginal_Syllabics
+308: In_Ogham
+309: In_Runic
+310: In_Tagalog
+311: In_Hanunoo
+312: In_Buhid
+313: In_Tagbanwa
+314: In_Khmer
+315: In_Mongolian
+316: In_Unified_Canadian_Aboriginal_Syllabics_Extended
+317: In_Limbu
+318: In_Tai_Le
+319: In_New_Tai_Lue
+320: In_Khmer_Symbols
+321: In_Buginese
+322: In_Tai_Tham
+323: In_Combining_Diacritical_Marks_Extended
+324: In_Balinese
+325: In_Sundanese
+326: In_Batak
+327: In_Lepcha
+328: In_Ol_Chiki
+329: In_Cyrillic_Extended_C
+330: In_Georgian_Extended
+331: In_Sundanese_Supplement
+332: In_Vedic_Extensions
+333: In_Phonetic_Extensions
+334: In_Phonetic_Extensions_Supplement
+335: In_Combining_Diacritical_Marks_Supplement
+336: In_Latin_Extended_Additional
+337: In_Greek_Extended
+338: In_General_Punctuation
+339: In_Superscripts_and_Subscripts
+340: In_Currency_Symbols
+341: In_Combining_Diacritical_Marks_for_Symbols
+342: In_Letterlike_Symbols
+343: In_Number_Forms
+344: In_Arrows
+345: In_Mathematical_Operators
+346: In_Miscellaneous_Technical
+347: In_Control_Pictures
+348: In_Optical_Character_Recognition
+349: In_Enclosed_Alphanumerics
+350: In_Box_Drawing
+351: In_Block_Elements
+352: In_Geometric_Shapes
+353: In_Miscellaneous_Symbols
+354: In_Dingbats
+355: In_Miscellaneous_Mathematical_Symbols_A
+356: In_Supplemental_Arrows_A
+357: In_Braille_Patterns
+358: In_Supplemental_Arrows_B
+359: In_Miscellaneous_Mathematical_Symbols_B
+360: In_Supplemental_Mathematical_Operators
+361: In_Miscellaneous_Symbols_and_Arrows
+362: In_Glagolitic
+363: In_Latin_Extended_C
+364: In_Coptic
+365: In_Georgian_Supplement
+366: In_Tifinagh
+367: In_Ethiopic_Extended
+368: In_Cyrillic_Extended_A
+369: In_Supplemental_Punctuation
+370: In_CJK_Radicals_Supplement
+371: In_Kangxi_Radicals
+372: In_Ideographic_Description_Characters
+373: In_CJK_Symbols_and_Punctuation
+374: In_Hiragana
+375: In_Katakana
+376: In_Bopomofo
+377: In_Hangul_Compatibility_Jamo
+378: In_Kanbun
+379: In_Bopomofo_Extended
+380: In_CJK_Strokes
+381: In_Katakana_Phonetic_Extensions
+382: In_Enclosed_CJK_Letters_and_Months
+383: In_CJK_Compatibility
+384: In_CJK_Unified_Ideographs_Extension_A
+385: In_Yijing_Hexagram_Symbols
+386: In_CJK_Unified_Ideographs
+387: In_Yi_Syllables
+388: In_Yi_Radicals
+389: In_Lisu
+390: In_Vai
+391: In_Cyrillic_Extended_B
+392: In_Bamum
+393: In_Modifier_Tone_Letters
+394: In_Latin_Extended_D
+395: In_Syloti_Nagri
+396: In_Common_Indic_Number_Forms
+397: In_Phags_pa
+398: In_Saurashtra
+399: In_Devanagari_Extended
+400: In_Kayah_Li
+401: In_Rejang
+402: In_Hangul_Jamo_Extended_A
+403: In_Javanese
+404: In_Myanmar_Extended_B
+405: In_Cham
+406: In_Myanmar_Extended_A
+407: In_Tai_Viet
+408: In_Meetei_Mayek_Extensions
+409: In_Ethiopic_Extended_A
+410: In_Latin_Extended_E
+411: In_Cherokee_Supplement
+412: In_Meetei_Mayek
+413: In_Hangul_Syllables
+414: In_Hangul_Jamo_Extended_B
+415: In_High_Surrogates
+416: In_High_Private_Use_Surrogates
+417: In_Low_Surrogates
+418: In_Private_Use_Area
+419: In_CJK_Compatibility_Ideographs
+420: In_Alphabetic_Presentation_Forms
+421: In_Arabic_Presentation_Forms_A
+422: In_Variation_Selectors
+423: In_Vertical_Forms
+424: In_Combining_Half_Marks
+425: In_CJK_Compatibility_Forms
+426: In_Small_Form_Variants
+427: In_Arabic_Presentation_Forms_B
+428: In_Halfwidth_and_Fullwidth_Forms
+429: In_Specials
+430: In_Linear_B_Syllabary
+431: In_Linear_B_Ideograms
+432: In_Aegean_Numbers
+433: In_Ancient_Greek_Numbers
+434: In_Ancient_Symbols
+435: In_Phaistos_Disc
+436: In_Lycian
+437: In_Carian
+438: In_Coptic_Epact_Numbers
+439: In_Old_Italic
+440: In_Gothic
+441: In_Old_Permic
+442: In_Ugaritic
+443: In_Old_Persian
+444: In_Deseret
+445: In_Shavian
+446: In_Osmanya
+447: In_Osage
+448: In_Elbasan
+449: In_Caucasian_Albanian
+450: In_Linear_A
+451: In_Cypriot_Syllabary
+452: In_Imperial_Aramaic
+453: In_Palmyrene
+454: In_Nabataean
+455: In_Hatran
+456: In_Phoenician
+457: In_Lydian
+458: In_Meroitic_Hieroglyphs
+459: In_Meroitic_Cursive
+460: In_Kharoshthi
+461: In_Old_South_Arabian
+462: In_Old_North_Arabian
+463: In_Manichaean
+464: In_Avestan
+465: In_Inscriptional_Parthian
+466: In_Inscriptional_Pahlavi
+467: In_Psalter_Pahlavi
+468: In_Old_Turkic
+469: In_Old_Hungarian
+470: In_Hanifi_Rohingya
+471: In_Rumi_Numeral_Symbols
+472: In_Old_Sogdian
+473: In_Sogdian
+474: In_Elymaic
+475: In_Brahmi
+476: In_Kaithi
+477: In_Sora_Sompeng
+478: In_Chakma
+479: In_Mahajani
+480: In_Sharada
+481: In_Sinhala_Archaic_Numbers
+482: In_Khojki
+483: In_Multani
+484: In_Khudawadi
+485: In_Grantha
+486: In_Newa
+487: In_Tirhuta
+488: In_Siddham
+489: In_Modi
+490: In_Mongolian_Supplement
+491: In_Takri
+492: In_Ahom
+493: In_Dogra
+494: In_Warang_Citi
+495: In_Nandinagari
+496: In_Zanabazar_Square
+497: In_Soyombo
+498: In_Pau_Cin_Hau
+499: In_Bhaiksuki
+500: In_Marchen
+501: In_Masaram_Gondi
+502: In_Gunjala_Gondi
+503: In_Makasar
+504: In_Tamil_Supplement
+505: In_Cuneiform
+506: In_Cuneiform_Numbers_and_Punctuation
+507: In_Early_Dynastic_Cuneiform
+508: In_Egyptian_Hieroglyphs
+509: In_Egyptian_Hieroglyph_Format_Controls
+510: In_Anatolian_Hieroglyphs
+511: In_Bamum_Supplement
+512: In_Mro
+513: In_Bassa_Vah
+514: In_Pahawh_Hmong
+515: In_Medefaidrin
+516: In_Miao
+517: In_Ideographic_Symbols_and_Punctuation
+518: In_Tangut
+519: In_Tangut_Components
+520: In_Kana_Supplement
+521: In_Kana_Extended_A
+522: In_Small_Kana_Extension
+523: In_Nushu
+524: In_Duployan
+525: In_Shorthand_Format_Controls
+526: In_Byzantine_Musical_Symbols
+527: In_Musical_Symbols
+528: In_Ancient_Greek_Musical_Notation
+529: In_Mayan_Numerals
+530: In_Tai_Xuan_Jing_Symbols
+531: In_Counting_Rod_Numerals
+532: In_Mathematical_Alphanumeric_Symbols
+533: In_Sutton_SignWriting
+534: In_Glagolitic_Supplement
+535: In_Nyiakeng_Puachue_Hmong
+536: In_Wancho
+537: In_Mende_Kikakui
+538: In_Adlam
+539: In_Indic_Siyaq_Numbers
+540: In_Ottoman_Siyaq_Numbers
+541: In_Arabic_Mathematical_Alphabetic_Symbols
+542: In_Mahjong_Tiles
+543: In_Domino_Tiles
+544: In_Playing_Cards
+545: In_Enclosed_Alphanumeric_Supplement
+546: In_Enclosed_Ideographic_Supplement
+547: In_Miscellaneous_Symbols_and_Pictographs
+548: In_Emoticons
+549: In_Ornamental_Dingbats
+550: In_Transport_and_Map_Symbols
+551: In_Alchemical_Symbols
+552: In_Geometric_Shapes_Extended
+553: In_Supplemental_Arrows_C
+554: In_Supplemental_Symbols_and_Pictographs
+555: In_Chess_Symbols
+556: In_Symbols_and_Pictographs_Extended_A
+557: In_CJK_Unified_Ideographs_Extension_B
+558: In_CJK_Unified_Ideographs_Extension_C
+559: In_CJK_Unified_Ideographs_Extension_D
+560: In_CJK_Unified_Ideographs_Extension_E
+561: In_CJK_Unified_Ideographs_Extension_F
+562: In_CJK_Compatibility_Ideographs_Supplement
+563: In_Tags
+564: In_Variation_Selectors_Supplement
+565: In_Supplementary_Private_Use_Area_A
+566: In_Supplementary_Private_Use_Area_B
+567: In_No_Block