From 2f1eff3d4e0c24e2ac28c8bcaa8eb740b8e22c48 Mon Sep 17 00:00:00 2001 From: Unicode Consortium Date: Wed, 15 Sep 2021 08:26:00 -0600 Subject: Support Unicode 14.0 --- charclass_invlists.h | 21582 ++++++++++++++++------ lib/Unicode/UCD.t | 4 +- lib/unicore/ArabicShaping.txt | 80 +- lib/unicore/BidiBrackets.txt | 20 +- lib/unicore/BidiMirroring.txt | 26 +- lib/unicore/Blocks.txt | 22 +- lib/unicore/CJKRadicals.txt | 6 +- lib/unicore/CaseFolding.txt | 46 +- lib/unicore/CompositionExclusions.txt | 12 +- lib/unicore/DAge.txt | 95 +- lib/unicore/DCoreProperties.txt | 700 +- lib/unicore/DNormalizationProps.txt | 144 +- lib/unicore/EastAsianWidth.txt | 149 +- lib/unicore/EmojiSources.txt | 6 +- lib/unicore/EquivalentUnifiedIdeograph.txt | 6 +- lib/unicore/HangulSyllableType.txt | 6 +- lib/unicore/IdStatus.txt | 31 +- lib/unicore/IdType.txt | 125 +- lib/unicore/Index.txt | 6 + lib/unicore/IndicPositionalCategory.txt | 18 +- lib/unicore/IndicSyllabicCategory.txt | 30 +- lib/unicore/Jamo.txt | 8 +- lib/unicore/LineBreak.txt | 169 +- lib/unicore/NameAliases.txt | 8 +- lib/unicore/NamedSequences.txt | 43 +- lib/unicore/NamedSqProv.txt | 41 +- lib/unicore/NamesList.txt | 1807 +- lib/unicore/NormalizationCorrections.txt | 6 +- lib/unicore/PropList.txt | 100 +- lib/unicore/PropValueAliases.txt | 26 +- lib/unicore/PropertyAliases.txt | 6 +- lib/unicore/ReadMe.txt | 10 +- lib/unicore/ScriptExtensions.txt | 80 +- lib/unicore/Scripts.txt | 213 +- lib/unicore/SpecialCasing.txt | 6 +- lib/unicore/StandardizedVariants.txt | 70 +- lib/unicore/UnicodeData.txt | 837 +- lib/unicore/VerticalOrientation.txt | 187 +- lib/unicore/auxiliary/GCBTest.txt | 6 +- lib/unicore/auxiliary/GraphemeBreakProperty.txt | 33 +- lib/unicore/auxiliary/LBTest.txt | 60 +- lib/unicore/auxiliary/SBTest.txt | 6 +- lib/unicore/auxiliary/SentenceBreakProperty.txt | 130 +- lib/unicore/auxiliary/WBTest.txt | 6 +- lib/unicore/auxiliary/WordBreakProperty.txt | 96 +- lib/unicore/emoji/emoji.txt | 96 +- 
lib/unicore/extracted/DBidiClass.txt | 178 +- lib/unicore/extracted/DBinaryProperties.txt | 18 +- lib/unicore/extracted/DCombiningClass.txt | 165 +- lib/unicore/extracted/DDecompositionType.txt | 14 +- lib/unicore/extracted/DEastAsianWidth.txt | 153 +- lib/unicore/extracted/DGeneralCategory.txt | 306 +- lib/unicore/extracted/DJoinGroup.txt | 37 +- lib/unicore/extracted/DJoinType.txt | 46 +- lib/unicore/extracted/DLineBreak.txt | 195 +- lib/unicore/extracted/DNumType.txt | 9 +- lib/unicore/extracted/DNumValues.txt | 36 +- lib/unicore/mktables | 2 +- lib/unicore/uni_keywords.pl | 2586 +-- lib/unicore/version | 2 +- pod/perldelta.pod | 4 + regcharclass.h | 104 +- regen/mk_invlists.pl | 19 +- uni_keywords.h | 15119 +++++++-------- unicode_constants.h | 4 +- 65 files changed, 30605 insertions(+), 15556 deletions(-) diff --git a/charclass_invlists.h b/charclass_invlists.h index 4daa404be0..7fb2069eb7 100644 --- a/charclass_invlists.h +++ b/charclass_invlists.h @@ -54,7 +54,7 @@ static const UV * const InBitmap_invlist = Latin1_invlist; # if 'A' == 65 /* ASCII/Latin1 */ static const UV Case_Folding_invlist[] = { /* for ASCII/Latin1 */ - 1398, /* Number of elements */ + 1414, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -1072,7 +1072,7 @@ static const UV Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -1416,6 +1416,8 @@ static const UV Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -1425,6 +1427,12 @@ static const UV Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -1448,6 +1456,14 @@ static const UV Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 
0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -3444,6 +3460,8 @@ static const I32 Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -3453,6 +3471,12 @@ static const I32 Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0x13A0, @@ -3476,6 +3500,14 @@ static const I32 Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -3498,7 +3530,7 @@ static const I32 Case_Folding_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV Case_Folding_invlist[] = { /* for EBCDIC 1047 */ - 1417, /* Number of elements */ + 1433, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -4535,7 +4567,7 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -4879,6 +4911,8 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -4888,6 +4922,12 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -4911,6 +4951,14 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -6929,6 +6977,8 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -6938,6 +6988,12 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 
0x13A0, @@ -6961,6 +7017,14 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -6983,7 +7047,7 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV Case_Folding_invlist[] = { /* for EBCDIC 037 */ - 1413, /* Number of elements */ + 1429, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -8016,7 +8080,7 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -8360,6 +8424,8 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -8369,6 +8435,12 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -8392,6 +8464,14 @@ static const UV Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -10406,6 +10486,8 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -10415,6 +10497,12 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0x13A0, @@ -10438,6 +10526,14 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -10457,7 +10553,7 @@ static const I32 Case_Folding_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV Lowercase_Mapping_invlist[] = { /* for 
ASCII/Latin1 */ - 1262, /* Number of elements */ + 1278, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -11354,7 +11450,7 @@ static const UV Lowercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -11698,6 +11794,8 @@ static const UV Lowercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -11707,6 +11805,12 @@ static const UV Lowercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -11715,6 +11819,14 @@ static const UV Lowercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -13000,6 +13112,8 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -13009,6 +13123,12 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0xFF41, @@ -13017,6 +13137,14 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -13039,7 +13167,7 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ - 1280, /* Number of elements */ + 1296, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -13954,7 +14082,7 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 
0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -14298,6 +14426,8 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -14307,6 +14437,12 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -14315,6 +14451,14 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -15621,6 +15765,8 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -15630,6 +15776,12 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0xFF41, @@ -15638,6 +15790,14 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -15660,7 +15820,7 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 037 */ - 1276, /* Number of elements */ + 1292, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -16571,7 +16731,7 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -16915,6 +17075,8 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -16924,6 +17086,12 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 
0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -16932,6 +17100,14 @@ static const UV Lowercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -18234,6 +18410,8 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -18243,6 +18421,12 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0xFF41, @@ -18251,6 +18435,14 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -18268,7 +18460,7 @@ static const I32 Lowercase_Mapping_invmap[] = { /* for EBCDIC 037 */ #if (defined(PERL_IN_REGCOMP_C) && ! defined(PERL_IN_XSUB_RE)) static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ - 359, /* Number of elements */ + 373, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -18353,7 +18545,9 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0x7FE, 0x859, 0x85C, - 0x8D3, + 0x899, + 0x89C, + 0x8CF, 0x8D4, 0x8E3, 0x8E4, @@ -18391,6 +18585,8 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0xB4E, 0xBCD, 0xBCE, + 0xC3C, + 0xC3D, 0xC4D, 0xC4E, 0xC55, @@ -18440,7 +18636,7 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0x108D, 0x108E, 0x1714, - 0x1715, + 0x1716, 0x1734, 0x1735, 0x17D2, @@ -18463,6 +18659,10 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0x1ABE, 0x1ABF, 0x1AC1, + 0x1AC3, + 0x1AC5, + 0x1ACA, + 0x1ACB, 0x1B34, 0x1B35, 0x1B44, @@ -18492,7 +18692,7 @@ static const 
UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0x1DCD, 0x1DD1, 0x1DF6, - 0x1DFA, + 0x1DFB, 0x1DFC, 0x1DFE, 0x1DFF, @@ -18555,8 +18755,14 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ 0x10F4C, 0x10F4D, 0x10F51, + 0x10F83, + 0x10F84, + 0x10F85, + 0x10F86, 0x11046, 0x11047, + 0x11070, + 0x11071, 0x1107F, 0x11080, 0x110B9, @@ -18636,7 +18842,7 @@ static const UV _Perl_CCC_non0_non230_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ - 1805, /* Number of elements */ + 1826, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -18708,7 +18914,11 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -18819,6 +19029,8 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC45, @@ -18954,7 +19166,9 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x1360, 0x1712, 0x1715, + 0x1716, 0x1732, + 0x1734, 0x1735, 0x1752, 0x1754, @@ -18973,6 +19187,7 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x180B, 0x180E, 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -19007,7 +19222,7 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B05, @@ -19058,8 +19273,6 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -20103,12 +20316,18 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11001, 0x11002, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x11083, @@ -20119,6 +20338,8 @@ static 
const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -20337,6 +20558,10 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D166, 0x1D167, @@ -20376,6 +20601,8 @@ static const UV _Perl_GCB_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -20547,6 +20774,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Prepend, + GCB_Other, + GCB_Extend, + GCB_Other, GCB_Extend, GCB_Prepend, GCB_Extend, @@ -20659,6 +20890,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_Extend, @@ -20792,8 +21025,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, GCB_Other, @@ -20811,6 +21046,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Other, GCB_Extend, GCB_Control, + GCB_Extend, GCB_Other, GCB_Extend, GCB_Other, @@ -20898,8 +21134,6 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Other, GCB_Extend, GCB_Other, - GCB_Extend, - GCB_Other, GCB_Control, GCB_Extend, GCB_ZWJ, @@ -21942,6 +22176,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_SpacingMark, GCB_Extend, GCB_SpacingMark, @@ -21949,6 +22185,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_SpacingMark, @@ -21958,6 +22198,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ 
GCB_Other, GCB_Prepend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_Prepend, GCB_Other, GCB_Extend, @@ -22067,7 +22309,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Extend, GCB_Other, GCB_Extend, - GCB_SpacingMark, + GCB_Other, GCB_Extend, GCB_SpacingMark, GCB_Extend, @@ -22177,6 +22419,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Control, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Extend, GCB_Other, @@ -22221,6 +22467,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_ExtPict_XX, GCB_Other, GCB_ExtPict_XX, @@ -22298,7 +22546,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ - 1806, /* Number of elements */ + 1827, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -22371,7 +22619,11 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -22482,6 +22734,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC45, @@ -22617,7 +22871,9 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x1360, 0x1712, 0x1715, + 0x1716, 0x1732, + 0x1734, 0x1735, 0x1752, 0x1754, @@ -22636,6 +22892,7 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x180B, 0x180E, 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -22670,7 +22927,7 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B05, @@ -22721,8 +22978,6 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x1CF8, 
0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -23766,12 +24021,18 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11001, 0x11002, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x11083, @@ -23782,6 +24043,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -24000,6 +24263,10 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D166, 0x1D167, @@ -24039,6 +24306,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -24214,6 +24483,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Prepend, + GCB_Other, + GCB_Extend, + GCB_Other, GCB_Extend, GCB_Prepend, GCB_Extend, @@ -24326,6 +24599,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_Extend, @@ -24459,8 +24734,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, GCB_Other, @@ -24478,6 +24755,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Extend, GCB_Control, + GCB_Extend, GCB_Other, GCB_Extend, GCB_Other, @@ -24565,8 +24843,6 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Extend, GCB_Other, - GCB_Extend, - GCB_Other, GCB_Control, GCB_Extend, GCB_ZWJ, @@ -25609,6 +25885,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_SpacingMark, 
GCB_Extend, GCB_SpacingMark, @@ -25616,6 +25894,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_SpacingMark, @@ -25625,6 +25907,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Prepend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_Prepend, GCB_Other, GCB_Extend, @@ -25734,7 +26018,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Extend, GCB_Other, GCB_Extend, - GCB_SpacingMark, + GCB_Other, GCB_Extend, GCB_SpacingMark, GCB_Extend, @@ -25844,6 +26128,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Control, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Extend, GCB_Other, @@ -25888,6 +26176,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_ExtPict_XX, GCB_Other, GCB_ExtPict_XX, @@ -25965,7 +26255,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ - 1806, /* Number of elements */ + 1827, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -26038,7 +26328,11 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -26149,6 +26443,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC45, @@ -26284,7 +26580,9 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x1360, 0x1712, 0x1715, + 0x1716, 0x1732, + 0x1734, 0x1735, 0x1752, 0x1754, @@ -26303,6 +26601,7 @@ static const UV 
_Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x180B, 0x180E, 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -26337,7 +26636,7 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B05, @@ -26388,8 +26687,6 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -27433,12 +27730,18 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11001, 0x11002, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x11083, @@ -27449,6 +27752,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -27667,6 +27972,10 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D166, 0x1D167, @@ -27706,6 +28015,8 @@ static const UV _Perl_GCB_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -27881,6 +28192,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Prepend, + GCB_Other, + GCB_Extend, + GCB_Other, GCB_Extend, GCB_Prepend, GCB_Extend, @@ -27993,6 +28308,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_Extend, @@ -28126,8 +28443,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, + GCB_SpacingMark, GCB_Other, GCB_Extend, GCB_Other, @@ -28145,6 +28464,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Extend, GCB_Control, + GCB_Extend, GCB_Other, GCB_Extend, GCB_Other, @@ -28232,8 
+28552,6 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Extend, GCB_Other, - GCB_Extend, - GCB_Other, GCB_Control, GCB_Extend, GCB_ZWJ, @@ -29276,6 +29594,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_SpacingMark, GCB_Extend, GCB_SpacingMark, @@ -29283,6 +29603,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Extend, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Other, GCB_SpacingMark, @@ -29292,6 +29616,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Prepend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_Prepend, GCB_Other, GCB_Extend, @@ -29401,7 +29727,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Extend, GCB_Other, GCB_Extend, - GCB_SpacingMark, + GCB_Other, GCB_Extend, GCB_SpacingMark, GCB_Extend, @@ -29511,6 +29837,10 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Control, GCB_Other, GCB_Extend, + GCB_Other, + GCB_Extend, + GCB_Other, + GCB_Extend, GCB_SpacingMark, GCB_Extend, GCB_Other, @@ -29555,6 +29885,8 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ GCB_Other, GCB_Extend, GCB_Other, + GCB_Extend, + GCB_Other, GCB_ExtPict_XX, GCB_Other, GCB_ExtPict_XX, @@ -29629,7 +29961,7 @@ static const GCB_enum _Perl_GCB_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_IVCF_invlist[] = { /* for ASCII/Latin1 */ - 1318, /* Number of elements */ + 1334, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -30593,7 +30925,7 @@ static const UV _Perl_IVCF_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -30924,12 +31256,20 @@ static const UV _Perl_IVCF_invlist[] = { /* 
for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -30943,6 +31283,14 @@ static const UV _Perl_IVCF_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -32501,12 +32849,20 @@ static const I32 _Perl_IVCF_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -32520,6 +32876,14 @@ static const I32 _Perl_IVCF_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -32542,7 +32906,7 @@ static const I32 _Perl_IVCF_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 1047 */ - 1333, /* Number of elements */ + 1349, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -33521,7 +33885,7 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -33852,12 +34216,20 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -33871,6 +34243,14 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -35447,12 +35827,20 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 
0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -35466,6 +35854,14 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -35488,7 +35884,7 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 037 */ - 1331, /* Number of elements */ + 1347, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -36465,7 +36861,7 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -36796,12 +37192,20 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -36815,6 +37219,14 @@ static const UV _Perl_IVCF_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -38389,12 +38801,20 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -38408,6 +38828,14 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 037 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -38427,7 +38855,7 @@ static const I32 _Perl_IVCF_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ - 2467, /* Number of elements */ + 2501, /* Number of elements */ 148565664, /* Version 
and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -38529,7 +38957,6 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -38576,7 +39003,9 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -38681,6 +39110,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0xBFA, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -38850,7 +39281,7 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x16EB, 0x16EE, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1737, @@ -38907,7 +39338,7 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -38919,6 +39350,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1B61, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -38947,8 +39380,6 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FFD, 0x1FFE, @@ -39010,6 +39441,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2103, @@ -39191,6 +39624,17 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -40378,6 +40822,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x10EAE, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, @@ -40385,12 +40831,16 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x11049, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BE, 0x110C2, + 0x110C3, 0x110F0, 0x110FA, 0x11100, @@ -40606,6 +41056,8 @@ static 
const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16AC0, + 0x16ACA, 0x16AF0, 0x16AF5, 0x16AF6, @@ -40636,7 +41088,7 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -40647,6 +41099,10 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -40687,6 +41143,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1E137, 0x1E140, 0x1E14A, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FA, @@ -40814,7 +41272,7 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1F6CC, 0x1F6CD, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -40825,6 +41283,8 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -40852,15 +41312,12 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1F93F, 0x1F977, 0x1F978, - 0x1F979, - 0x1F97A, 0x1F9B5, 0x1F9B7, 0x1F9B8, 0x1F9BA, 0x1F9BB, 0x1F9BC, - 0x1F9CC, 0x1F9CD, 0x1F9D0, 0x1F9D1, @@ -40872,17 +41329,22 @@ static const UV _Perl_LB_invlist[] = { /* for ASCII/Latin1 */ 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FBF0, 0x1FBFA, @@ -41051,7 +41513,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Combining_Mark, LB_Exclamation, LB_Combining_Mark, - LB_Alphabetic, LB_Exclamation, LB_Alphabetic, LB_Combining_Mark, @@ -41110,6 +41571,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Break_After, LB_Numeric, LB_Alphabetic, @@ -41214,6 +41677,8 @@ 
static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Break_Before, @@ -41402,7 +41867,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Combining_Mark, LB_Glue, - LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -41442,6 +41907,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Break_After, + LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, @@ -41471,8 +41938,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, - LB_Combining_Mark, - LB_Alphabetic, LB_Break_Before, LB_Alphabetic, LB_Break_After, @@ -41533,6 +41998,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Prefix_Numeric, LB_Postfix_Numeric, LB_Prefix_Numeric, + LB_Postfix_Numeric, + LB_Prefix_Numeric, LB_Combining_Mark, LB_Alphabetic, LB_Postfix_Numeric, @@ -41714,6 +42181,17 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Exclamation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Break_After, + LB_Alphabetic, LB_Ideographic, LB_Alphabetic, LB_Ideographic, @@ -42904,15 +43382,21 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Break_After, LB_Alphabetic, LB_Numeric, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Break_After, + LB_Combining_Mark, LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -43129,6 
+43613,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Numeric, + LB_Alphabetic, LB_Combining_Mark, LB_Break_After, LB_Alphabetic, @@ -43180,6 +43666,10 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -43211,6 +43701,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Numeric, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Prefix_Numeric, @@ -43348,6 +43840,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, + LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, @@ -43375,15 +43869,12 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, - LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, @@ -43403,9 +43894,14 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, + LB_E_Base, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, + LB_Unassigned_Extended_Pictographic_Ideographic, + LB_E_Base, + LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -43435,7 +43931,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 
124 && '`' == 121 && '\n' == 21 static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ - 2479, /* Number of elements */ + 2513, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -43549,7 +44045,6 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -43596,7 +44091,9 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -43701,6 +44198,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0xBFA, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -43870,7 +44369,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x16EB, 0x16EE, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1737, @@ -43927,7 +44426,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -43939,6 +44438,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1B61, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -43967,8 +44468,6 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FFD, 0x1FFE, @@ -44030,6 +44529,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2103, @@ -44211,6 +44712,17 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -45398,6 +45910,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x10EAE, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, @@ -45405,12 +45919,16 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x11049, 
0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BE, 0x110C2, + 0x110C3, 0x110F0, 0x110FA, 0x11100, @@ -45626,6 +46144,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16AC0, + 0x16ACA, 0x16AF0, 0x16AF5, 0x16AF6, @@ -45656,7 +46176,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -45667,6 +46187,10 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -45707,6 +46231,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1E137, 0x1E140, 0x1E14A, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FA, @@ -45834,7 +46360,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1F6CC, 0x1F6CD, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -45845,6 +46371,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -45872,15 +46400,12 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1F93F, 0x1F977, 0x1F978, - 0x1F979, - 0x1F97A, 0x1F9B5, 0x1F9B7, 0x1F9B8, 0x1F9BA, 0x1F9BB, 0x1F9BC, - 0x1F9CC, 0x1F9CD, 0x1F9D0, 0x1F9D1, @@ -45892,17 +46417,22 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 1047 */ 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FBF0, 0x1FBFA, @@ -46086,7 +46616,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Combining_Mark, LB_Exclamation, LB_Combining_Mark, - LB_Alphabetic, LB_Exclamation, LB_Alphabetic, LB_Combining_Mark, @@ -46145,6 +46674,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 
1047 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Break_After, LB_Numeric, LB_Alphabetic, @@ -46249,6 +46780,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Break_Before, @@ -46437,7 +46970,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Combining_Mark, LB_Glue, - LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -46477,6 +47010,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Break_After, + LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, @@ -46506,8 +47041,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, - LB_Combining_Mark, - LB_Alphabetic, LB_Break_Before, LB_Alphabetic, LB_Break_After, @@ -46568,6 +47101,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Prefix_Numeric, LB_Postfix_Numeric, LB_Prefix_Numeric, + LB_Postfix_Numeric, + LB_Prefix_Numeric, LB_Combining_Mark, LB_Alphabetic, LB_Postfix_Numeric, @@ -46749,6 +47284,17 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Exclamation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Break_After, + LB_Alphabetic, LB_Ideographic, LB_Alphabetic, LB_Ideographic, @@ -47939,15 +48485,21 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Break_After, LB_Alphabetic, LB_Numeric, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Alphabetic, 
LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Break_After, + LB_Combining_Mark, LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -48164,6 +48716,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Numeric, + LB_Alphabetic, LB_Combining_Mark, LB_Break_After, LB_Alphabetic, @@ -48215,6 +48769,10 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -48246,6 +48804,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Numeric, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Prefix_Numeric, @@ -48383,6 +48943,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, + LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, @@ -48410,15 +48972,12 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, - LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, @@ -48438,9 +48997,14 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, + LB_E_Base, + LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_E_Base, + LB_Unassigned_Extended_Pictographic_Ideographic, 
LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -48470,7 +49034,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ - 2479, /* Number of elements */ + 2513, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -48584,7 +49148,6 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -48631,7 +49194,9 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -48736,6 +49301,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0xBFA, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -48905,7 +49472,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x16EB, 0x16EE, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1737, @@ -48962,7 +49529,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -48974,6 +49541,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1B61, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -49002,8 +49571,6 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FFD, 0x1FFE, @@ -49065,6 +49632,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2103, @@ -49246,6 +49815,17 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -50433,6 +51013,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x10EAE, 0x10F46, 0x10F51, + 
0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, @@ -50440,12 +51022,16 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x11049, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BE, 0x110C2, + 0x110C3, 0x110F0, 0x110FA, 0x11100, @@ -50661,6 +51247,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16AC0, + 0x16ACA, 0x16AF0, 0x16AF5, 0x16AF6, @@ -50691,7 +51279,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -50702,6 +51290,10 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -50742,6 +51334,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1E137, 0x1E140, 0x1E14A, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FA, @@ -50869,7 +51463,7 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1F6CC, 0x1F6CD, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -50880,6 +51474,8 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -50907,15 +51503,12 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1F93F, 0x1F977, 0x1F978, - 0x1F979, - 0x1F97A, 0x1F9B5, 0x1F9B7, 0x1F9B8, 0x1F9BA, 0x1F9BB, 0x1F9BC, - 0x1F9CC, 0x1F9CD, 0x1F9D0, 0x1F9D1, @@ -50927,17 +51520,22 @@ static const UV _Perl_LB_invlist[] = { /* for EBCDIC 037 */ 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FBF0, 0x1FBFA, @@ -51121,7 +51719,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Combining_Mark, LB_Exclamation, LB_Combining_Mark, - LB_Alphabetic, 
LB_Exclamation, LB_Alphabetic, LB_Combining_Mark, @@ -51180,6 +51777,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Break_After, LB_Numeric, LB_Alphabetic, @@ -51284,6 +51883,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Break_Before, @@ -51472,7 +52073,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Combining_Mark, LB_Glue, - LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -51512,6 +52113,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Break_After, + LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, @@ -51541,8 +52144,6 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, - LB_Combining_Mark, - LB_Alphabetic, LB_Break_Before, LB_Alphabetic, LB_Break_After, @@ -51603,6 +52204,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Prefix_Numeric, LB_Postfix_Numeric, LB_Prefix_Numeric, + LB_Postfix_Numeric, + LB_Prefix_Numeric, LB_Combining_Mark, LB_Alphabetic, LB_Postfix_Numeric, @@ -51784,6 +52387,17 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Exclamation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Open_Punctuation, + LB_Close_Punctuation, + LB_Break_After, + LB_Alphabetic, LB_Ideographic, LB_Alphabetic, LB_Ideographic, @@ -52974,15 +53588,21 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + 
LB_Combining_Mark, LB_Break_After, LB_Alphabetic, LB_Numeric, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, LB_Break_After, + LB_Combining_Mark, LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -53199,6 +53819,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Break_After, LB_Alphabetic, + LB_Numeric, + LB_Alphabetic, LB_Combining_Mark, LB_Break_After, LB_Alphabetic, @@ -53250,6 +53872,10 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Alphabetic, LB_Combining_Mark, LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, + LB_Alphabetic, LB_Numeric, LB_Alphabetic, LB_Combining_Mark, @@ -53281,6 +53907,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Numeric, LB_Alphabetic, LB_Combining_Mark, + LB_Alphabetic, + LB_Combining_Mark, LB_Numeric, LB_Alphabetic, LB_Prefix_Numeric, @@ -53418,6 +54046,8 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, + LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, @@ -53445,15 +54075,12 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, - LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, LB_Ideographic, - LB_Unassigned_Extended_Pictographic_Ideographic, LB_E_Base, LB_Ideographic, LB_E_Base, @@ -53473,9 +54100,14 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, LB_Ideographic, + LB_E_Base, + LB_Unassigned_Extended_Pictographic_Ideographic, + LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, 
LB_Ideographic, LB_Unassigned_Extended_Pictographic_Ideographic, + LB_E_Base, + LB_Unassigned_Extended_Pictographic_Ideographic, LB_Alphabetic, LB_Numeric, LB_Alphabetic, @@ -53502,7 +54134,7 @@ static const LB_enum _Perl_LB_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ - 3146, /* Number of elements */ + 3227, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -54148,7 +54780,6 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -54216,11 +54847,15 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -54414,6 +55049,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -54425,6 +55061,8 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -54453,7 +55091,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -54662,11 +55300,9 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1737, @@ -54745,12 +55381,12 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1AA8, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B5C, @@ -54758,6 +55394,8 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -54796,8 +55434,6 @@ static const UV _Perl_SB_invlist[] = { /* for 
ASCII/Latin1 */ 0x1CFB, 0x1D00, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1E01, 0x1E02, @@ -55206,9 +55842,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, 0x2C30, - 0x2C5F, 0x2C60, 0x2C61, 0x2C62, @@ -55377,6 +56011,9 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 0x2E55, + 0x2E5D, 0x3000, 0x3001, 0x3002, @@ -55416,8 +56053,6 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -55655,6 +56290,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -55662,6 +56298,18 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D0, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, + 0xA7F2, 0xA7F5, 0xA7F6, 0xA7F7, @@ -55942,12 +56590,36 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -56037,6 +56709,10 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -56048,6 +56724,10 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x11049, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, @@ -56055,6 +56735,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x110BD, 0x110BE, 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -56203,6 +56884,8 @@ static const UV 
_Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x1183B, @@ -56264,7 +56947,7 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x11A9B, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -56326,6 +57009,8 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -56340,6 +57025,9 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -56385,8 +57073,14 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -56405,6 +57099,10 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -56522,6 +57220,10 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -56541,10 +57243,21 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -56633,9 +57346,9 @@ static const UV _Perl_SB_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -57323,7 +58036,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Extend, SB_Other, SB_Format, - SB_Other, SB_STerm, SB_OLetter, SB_Extend, @@ -57396,6 +58108,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, 
SB_Other, + SB_Format, + SB_Other, + SB_Extend, + SB_OLetter, SB_Extend, SB_Format, SB_Extend, @@ -57590,6 +58306,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Other, + SB_Extend, SB_OLetter, SB_Extend, SB_Other, @@ -57602,6 +58319,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_OLetter, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Numeric, @@ -57838,8 +58557,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_OLetter, SB_Other, SB_OLetter, - SB_Other, - SB_OLetter, SB_Extend, SB_Other, SB_OLetter, @@ -57873,7 +58590,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Extend, SB_Format, - SB_Other, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, @@ -57934,6 +58651,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Extend, SB_Other, + SB_STerm, + SB_Other, SB_Extend, SB_OLetter, SB_Extend, @@ -57972,8 +58691,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Lower, SB_Extend, - SB_Other, - SB_Extend, SB_Upper, SB_Lower, SB_Upper, @@ -58382,9 +59099,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Close, SB_Other, SB_Upper, - SB_Other, SB_Lower, - SB_Other, SB_Upper, SB_Lower, SB_Upper, @@ -58553,6 +59268,9 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Close, SB_Other, + SB_STerm, + SB_Close, + SB_Other, SB_Sp, SB_SContinue, SB_STerm, @@ -58595,8 +59313,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Other, - SB_OLetter, - SB_Other, SB_STerm, SB_OLetter, SB_Other, @@ -58830,14 +59546,27 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Lower, SB_Upper, SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, SB_Other, SB_Upper, SB_Lower, + SB_Other, + SB_Lower, + SB_Other, 
+ SB_Lower, SB_Upper, SB_Lower, SB_Upper, SB_Lower, SB_Other, + SB_OLetter, SB_Upper, SB_Lower, SB_OLetter, @@ -59118,13 +59847,37 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_Lower, + SB_OLetter, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_OLetter, SB_Other, SB_OLetter, SB_Other, @@ -59214,6 +59967,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_STerm, SB_Other, SB_OLetter, + SB_Extend, + SB_STerm, + SB_Other, + SB_OLetter, SB_Other, SB_OLetter, SB_Other, @@ -59223,6 +59980,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_STerm, SB_Other, SB_Numeric, + SB_Extend, + SB_OLetter, + SB_Extend, + SB_OLetter, SB_Other, SB_Extend, SB_OLetter, @@ -59230,6 +59991,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Format, SB_STerm, + SB_Extend, SB_Other, SB_Format, SB_Other, @@ -59380,6 +60142,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_STerm, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Upper, @@ -59504,6 +60268,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, SB_Format, SB_Other, SB_OLetter, @@ -59515,6 +60281,9 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Numeric, SB_Other, SB_STerm, + SB_OLetter, + SB_Other, + SB_Numeric, SB_Other, SB_OLetter, SB_Other, @@ -59577,6 +60346,12 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + 
SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_STerm, SB_Format, @@ -59584,6 +60359,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Extend, SB_Other, SB_Extend, + SB_Other, + SB_Extend, + SB_Other, + SB_Extend, SB_Format, SB_Extend, SB_Other, @@ -59698,6 +60477,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_Extend, SB_Other, + SB_Lower, + SB_OLetter, + SB_Lower, + SB_Other, SB_Extend, SB_Other, SB_Extend, @@ -59719,10 +60502,21 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ SB_Other, SB_OLetter, SB_Extend, + SB_Other, + SB_OLetter, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_Other, SB_Upper, @@ -59842,7 +60636,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ - 3170, /* Number of elements */ + 3251, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -60512,7 +61306,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -60580,11 +61373,15 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -60778,6 +61575,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -60789,6 +61587,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -60817,7 +61617,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 
0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -61026,11 +61826,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1737, @@ -61109,12 +61907,12 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1AA8, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B5C, @@ -61122,6 +61920,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -61160,8 +61960,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1CFB, 0x1D00, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1E01, 0x1E02, @@ -61570,9 +62368,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, 0x2C30, - 0x2C5F, 0x2C60, 0x2C61, 0x2C62, @@ -61741,6 +62537,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 0x2E55, + 0x2E5D, 0x3000, 0x3001, 0x3002, @@ -61780,8 +62579,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -62019,6 +62816,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -62026,6 +62824,18 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D0, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, + 0xA7F2, 0xA7F5, 0xA7F6, 0xA7F7, @@ -62306,12 +63116,36 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10781, + 0x10783, + 
0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -62401,6 +63235,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -62412,6 +63250,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x11049, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, @@ -62419,6 +63261,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x110BD, 0x110BE, 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -62567,6 +63410,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x1183B, @@ -62628,7 +63473,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x11A9B, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -62690,6 +63535,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -62704,6 +63551,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -62749,8 +63599,14 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -62769,6 +63625,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -62886,6 +63746,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -62905,10 +63769,21 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 
0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -62997,9 +63872,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -63714,7 +64589,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Extend, SB_Other, SB_Format, - SB_Other, SB_STerm, SB_OLetter, SB_Extend, @@ -63787,6 +64661,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, + SB_Format, + SB_Other, + SB_Extend, + SB_OLetter, SB_Extend, SB_Format, SB_Extend, @@ -63981,6 +64859,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, + SB_Extend, SB_OLetter, SB_Extend, SB_Other, @@ -63993,6 +64872,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_OLetter, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Numeric, @@ -64229,8 +65110,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_OLetter, SB_Other, SB_OLetter, - SB_Other, - SB_OLetter, SB_Extend, SB_Other, SB_OLetter, @@ -64264,7 +65143,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Extend, SB_Format, - SB_Other, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, @@ -64325,6 +65204,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Extend, SB_Other, + SB_STerm, + SB_Other, SB_Extend, SB_OLetter, SB_Extend, @@ -64363,8 +65244,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Lower, SB_Extend, - SB_Other, - SB_Extend, SB_Upper, SB_Lower, SB_Upper, @@ -64773,9 +65652,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Close, SB_Other, SB_Upper, - SB_Other, SB_Lower, - SB_Other, SB_Upper, SB_Lower, SB_Upper, @@ -64944,6 +65821,9 @@ 
static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Close, SB_Other, + SB_STerm, + SB_Close, + SB_Other, SB_Sp, SB_SContinue, SB_STerm, @@ -64986,8 +65866,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, - SB_OLetter, - SB_Other, SB_STerm, SB_OLetter, SB_Other, @@ -65221,14 +66099,27 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Lower, SB_Upper, SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, SB_Other, SB_Upper, SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, SB_Upper, SB_Lower, SB_Upper, SB_Lower, SB_Other, + SB_OLetter, SB_Upper, SB_Lower, SB_OLetter, @@ -65509,11 +66400,35 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, + SB_Upper, + SB_Other, + SB_Upper, + SB_Other, + SB_Upper, + SB_Other, + SB_Upper, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_OLetter, + SB_Other, SB_OLetter, SB_Other, SB_OLetter, SB_Other, + SB_Lower, SB_OLetter, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, SB_Other, SB_OLetter, SB_Other, @@ -65605,6 +66520,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_STerm, SB_Other, SB_OLetter, + SB_Extend, + SB_STerm, + SB_Other, + SB_OLetter, SB_Other, SB_OLetter, SB_Other, @@ -65614,6 +66533,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_STerm, SB_Other, SB_Numeric, + SB_Extend, + SB_OLetter, + SB_Extend, + SB_OLetter, SB_Other, SB_Extend, SB_OLetter, @@ -65621,6 +66544,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Format, SB_STerm, + SB_Extend, SB_Other, SB_Format, SB_Other, @@ -65771,6 +66695,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_STerm, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Upper, @@ 
-65895,6 +66821,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, SB_Format, SB_Other, SB_OLetter, @@ -65906,6 +66834,9 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Numeric, SB_Other, SB_STerm, + SB_OLetter, + SB_Other, + SB_Numeric, SB_Other, SB_OLetter, SB_Other, @@ -65968,6 +66899,12 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_STerm, SB_Format, @@ -65975,6 +66912,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Extend, SB_Other, SB_Extend, + SB_Other, + SB_Extend, + SB_Other, + SB_Extend, SB_Format, SB_Extend, SB_Other, @@ -66089,6 +67030,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_Extend, SB_Other, + SB_Lower, + SB_OLetter, + SB_Lower, + SB_Other, SB_Extend, SB_Other, SB_Extend, @@ -66110,10 +67055,21 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ SB_Other, SB_OLetter, SB_Extend, + SB_Other, + SB_OLetter, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_Other, SB_Upper, @@ -66233,7 +67189,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ - 3166, /* Number of elements */ + 3247, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -66899,7 +67855,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x620, 0x64B, 0x660, @@ -66967,11 +67922,15 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, + 0x870, + 
0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -67165,6 +68124,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -67176,6 +68136,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -67204,7 +68166,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -67413,11 +68375,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1737, @@ -67496,12 +68456,12 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1AA8, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B5C, @@ -67509,6 +68469,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1B83, 0x1BA1, @@ -67547,8 +68509,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1CFB, 0x1D00, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1E01, 0x1E02, @@ -67957,9 +68917,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, 0x2C30, - 0x2C5F, 0x2C60, 0x2C61, 0x2C62, @@ -68128,6 +69086,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 0x2E55, + 0x2E5D, 0x3000, 0x3001, 0x3002, @@ -68167,8 +69128,6 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -68406,6 +69365,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -68413,6 +69373,18 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D0, + 
0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, + 0xA7F2, 0xA7F5, 0xA7F6, 0xA7F7, @@ -68693,12 +69665,36 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -68788,6 +69784,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -68799,6 +69799,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x11049, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, @@ -68806,6 +69810,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x110BD, 0x110BE, 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -68954,6 +69959,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x1183B, @@ -69015,7 +70022,7 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x11A9B, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -69077,6 +70084,8 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -69091,6 +70100,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -69136,8 +70148,14 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ 
-69156,6 +70174,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -69273,6 +70295,10 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -69292,10 +70318,21 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -69384,9 +70421,9 @@ static const UV _Perl_SB_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -70097,7 +71134,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Extend, SB_Other, SB_Format, - SB_Other, SB_STerm, SB_OLetter, SB_Extend, @@ -70170,6 +71206,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, + SB_Format, + SB_Other, + SB_Extend, + SB_OLetter, SB_Extend, SB_Format, SB_Extend, @@ -70364,6 +71404,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, + SB_Extend, SB_OLetter, SB_Extend, SB_Other, @@ -70376,6 +71417,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_OLetter, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Numeric, @@ -70612,8 +71655,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_OLetter, SB_Other, SB_OLetter, - SB_Other, - SB_OLetter, SB_Extend, SB_Other, SB_OLetter, @@ -70647,7 +71688,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_Extend, SB_Format, - SB_Other, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, @@ -70708,6 +71749,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* 
for EBCDIC 037 */ SB_Other, SB_Extend, SB_Other, + SB_STerm, + SB_Other, SB_Extend, SB_OLetter, SB_Extend, @@ -70746,8 +71789,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_Lower, SB_Extend, - SB_Other, - SB_Extend, SB_Upper, SB_Lower, SB_Upper, @@ -71156,9 +72197,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Close, SB_Other, SB_Upper, - SB_Other, SB_Lower, - SB_Other, SB_Upper, SB_Lower, SB_Upper, @@ -71327,6 +72366,9 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_Close, SB_Other, + SB_STerm, + SB_Close, + SB_Other, SB_Sp, SB_SContinue, SB_STerm, @@ -71369,8 +72411,6 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, - SB_OLetter, - SB_Other, SB_STerm, SB_OLetter, SB_Other, @@ -71604,14 +72644,27 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Lower, SB_Upper, SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, + SB_Upper, + SB_Lower, SB_Other, SB_Upper, SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, SB_Upper, SB_Lower, SB_Upper, SB_Lower, SB_Other, + SB_OLetter, SB_Upper, SB_Lower, SB_OLetter, @@ -71892,13 +72945,37 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, SB_Other, - SB_OLetter, + SB_Upper, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_Lower, + SB_OLetter, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_Lower, + SB_Other, + SB_OLetter, SB_Other, SB_OLetter, SB_Other, @@ -71988,6 +73065,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_STerm, SB_Other, SB_OLetter, + SB_Extend, + SB_STerm, + SB_Other, + SB_OLetter, SB_Other, SB_OLetter, 
SB_Other, @@ -71997,6 +73078,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_STerm, SB_Other, SB_Numeric, + SB_Extend, + SB_OLetter, + SB_Extend, + SB_OLetter, SB_Other, SB_Extend, SB_OLetter, @@ -72004,6 +73089,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_Format, SB_STerm, + SB_Extend, SB_Other, SB_Format, SB_Other, @@ -72154,6 +73240,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_STerm, SB_Other, SB_OLetter, + SB_Other, + SB_OLetter, SB_Extend, SB_Other, SB_Upper, @@ -72278,6 +73366,8 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, SB_Format, SB_Other, SB_OLetter, @@ -72289,6 +73379,9 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Numeric, SB_Other, SB_STerm, + SB_OLetter, + SB_Other, + SB_Numeric, SB_Other, SB_OLetter, SB_Other, @@ -72351,6 +73444,12 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_STerm, SB_Format, @@ -72358,6 +73457,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Extend, SB_Other, SB_Extend, + SB_Other, + SB_Extend, + SB_Other, + SB_Extend, SB_Format, SB_Extend, SB_Other, @@ -72472,6 +73575,10 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_Extend, SB_Other, + SB_Lower, + SB_OLetter, + SB_Lower, + SB_Other, SB_Extend, SB_Other, SB_Extend, @@ -72493,10 +73600,21 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ SB_Other, SB_OLetter, SB_Extend, + SB_Other, + SB_OLetter, + SB_Extend, SB_Numeric, SB_Other, SB_OLetter, SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, + SB_OLetter, + SB_Other, SB_Extend, SB_Other, SB_Upper, @@ -72613,7 +73731,7 @@ static const SB_enum _Perl_SB_invmap[] = { /* for EBCDIC 037 */ # if 
'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ - 1673, /* Number of elements */ + 1731, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -72690,7 +73808,6 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x61F, 0x620, 0x640, @@ -72726,11 +73843,11 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8E2, 0x8E3, 0x900, @@ -72902,7 +74019,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -72912,6 +74029,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -72935,7 +74054,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -73083,9 +74202,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, + 0x1716, + 0x171F, 0x1720, 0x1735, 0x1737, @@ -73108,8 +74226,6 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1804, 0x1805, 0x1806, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -73152,11 +74268,11 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BC0, 0x1BF4, @@ -73268,7 +74384,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F0, 0x20F1, @@ -73296,9 +74412,6 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x2B96, 0x2B97, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, 0x2C60, 0x2C80, 0x2CF4, @@ -73336,7 +74449,7 @@ static const UV 
_Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -73408,7 +74521,6 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, 0xA000, 0xA48D, 0xA490, @@ -73426,10 +74538,14 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA82D, 0xA830, @@ -73524,14 +74640,15 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0xFB45, 0xFB46, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDF2, 0xFDF3, @@ -73597,6 +74714,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x10080, 0x100FB, 0x10100, + 0x10102, 0x10103, 0x10107, 0x10134, @@ -73646,12 +74764,33 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x10564, 0x1056F, 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -73711,6 +74850,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x10AC0, 0x10AE7, 0x10AEB, + 0x10AF2, + 0x10AF3, 0x10AF7, 0x10B00, 0x10B36, @@ -73750,6 +74891,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -73757,10 +74900,10 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x11080, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -73848,7 +74991,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 
0x116CA, 0x11700, @@ -73856,7 +74999,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -73888,6 +75031,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x11A48, 0x11A50, 0x11AA3, + 0x11AB0, 0x11AC0, 0x11AF9, 0x11C00, @@ -73949,6 +75093,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -73963,6 +75109,9 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -73999,9 +75148,16 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, - 0x1B11F, + 0x1B120, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -74018,6 +75174,12 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -74031,7 +75193,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -74088,6 +75250,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -74106,10 +75270,20 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -74220,7 +75394,7 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -74230,6 +75404,8 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 
*/ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -74243,27 +75419,27 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -74271,9 +75447,9 @@ static const UV _Perl_SCX_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -74332,138 +75508,143 @@ typedef enum { SCX_Coptic = 26, SCX_Cuneiform = 27, SCX_Cypriot = 28, - SCX_Cyrillic = 29, - SCX_Deseret = 30, - SCX_Devanagari = 31, - SCX_Dives_Akuru = 32, - SCX_Dogra = 33, - SCX_Duployan = 34, - SCX_Egyptian_Hieroglyphs = 35, - SCX_Elbasan = 36, - SCX_Elymaic = 37, - SCX_Ethiopic = 38, - SCX_Georgian = 39, - SCX_Glagolitic = 40, - SCX_Gothic = 41, - SCX_Grantha = 42, - SCX_Greek = 43, - SCX_Gujarati = 44, - SCX_Gunjala_Gondi = 45, - SCX_Gurmukhi = 46, - SCX_Han = 47, - SCX_Hanb = 48, - SCX_Hangul = 49, - SCX_Hanifi_Rohingya = 50, - SCX_Hanunoo = 51, - SCX_Hatran = 52, - SCX_Hebrew = 53, - SCX_Hiragana = 54, - SCX_Imperial_Aramaic = 55, - SCX_Inherited = 56, - SCX_Inscriptional_Pahlavi = 57, - SCX_Inscriptional_Parthian = 58, - SCX_INVALID = 59, - SCX_Javanese = 60, - SCX_Jpan = 61, - SCX_Kaithi = 62, - SCX_Kannada = 63, - SCX_Katakana = 64, - SCX_Kayah_Li = 65, - SCX_Kharoshthi = 66, - SCX_Khitan_Small_Script = 67, - SCX_Khmer = 68, - SCX_Khojki = 69, - SCX_Khudawadi = 70, - SCX_Kore = 71, - SCX_Lao = 72, - SCX_Latin = 73, - SCX_Lepcha = 74, - SCX_Limbu = 75, - SCX_Linear_A = 76, - SCX_Linear_B = 77, - SCX_Lisu = 78, - SCX_Lycian = 79, - SCX_Lydian = 80, - SCX_Mahajani = 81, - SCX_Makasar = 82, - SCX_Malayalam = 83, - 
SCX_Mandaic = 84, - SCX_Manichaean = 85, - SCX_Marchen = 86, - SCX_Masaram_Gondi = 87, - SCX_Medefaidrin = 88, - SCX_Meetei_Mayek = 89, - SCX_Mende_Kikakui = 90, - SCX_Meroitic_Cursive = 91, - SCX_Meroitic_Hieroglyphs = 92, - SCX_Miao = 93, - SCX_Modi = 94, - SCX_Mongolian = 95, - SCX_Mro = 96, - SCX_Multani = 97, - SCX_Myanmar = 98, - SCX_Nabataean = 99, - SCX_Nandinagari = 100, - SCX_New_Tai_Lue = 101, - SCX_Newa = 102, - SCX_Nko = 103, - SCX_Nushu = 104, - SCX_Nyiakeng_Puachue_Hmong = 105, - SCX_Ogham = 106, - SCX_Ol_Chiki = 107, - SCX_Old_Hungarian = 108, - SCX_Old_Italic = 109, - SCX_Old_North_Arabian = 110, - SCX_Old_Permic = 111, - SCX_Old_Persian = 112, - SCX_Old_Sogdian = 113, - SCX_Old_South_Arabian = 114, - SCX_Old_Turkic = 115, - SCX_Oriya = 116, - SCX_Osage = 117, - SCX_Osmanya = 118, - SCX_Pahawh_Hmong = 119, - SCX_Palmyrene = 120, - SCX_Pau_Cin_Hau = 121, - SCX_Phags_Pa = 122, - SCX_Phoenician = 123, - SCX_Psalter_Pahlavi = 124, - SCX_Rejang = 125, - SCX_Runic = 126, - SCX_Samaritan = 127, - SCX_Saurashtra = 128, - SCX_Sharada = 129, - SCX_Shavian = 130, - SCX_Siddham = 131, - SCX_SignWriting = 132, - SCX_Sinhala = 133, - SCX_Sogdian = 134, - SCX_Sora_Sompeng = 135, - SCX_Soyombo = 136, - SCX_Sundanese = 137, - SCX_Syloti_Nagri = 138, - SCX_Syriac = 139, - SCX_Tagalog = 140, - SCX_Tagbanwa = 141, - SCX_Tai_Le = 142, - SCX_Tai_Tham = 143, - SCX_Tai_Viet = 144, - SCX_Takri = 145, - SCX_Tamil = 146, - SCX_Tangut = 147, - SCX_Telugu = 148, - SCX_Thaana = 149, - SCX_Thai = 150, - SCX_Tibetan = 151, - SCX_Tifinagh = 152, - SCX_Tirhuta = 153, - SCX_Ugaritic = 154, - SCX_Vai = 155, - SCX_Wancho = 156, - SCX_Warang_Citi = 157, - SCX_Yezidi = 158, - SCX_Yi = 159, - SCX_Zanabazar_Square = 160, + SCX_Cypro_Minoan = 29, + SCX_Cyrillic = 30, + SCX_Deseret = 31, + SCX_Devanagari = 32, + SCX_Dives_Akuru = 33, + SCX_Dogra = 34, + SCX_Duployan = 35, + SCX_Egyptian_Hieroglyphs = 36, + SCX_Elbasan = 37, + SCX_Elymaic = 38, + SCX_Ethiopic = 39, + SCX_Georgian = 40, + 
SCX_Glagolitic = 41, + SCX_Gothic = 42, + SCX_Grantha = 43, + SCX_Greek = 44, + SCX_Gujarati = 45, + SCX_Gunjala_Gondi = 46, + SCX_Gurmukhi = 47, + SCX_Han = 48, + SCX_Hanb = 49, + SCX_Hangul = 50, + SCX_Hanifi_Rohingya = 51, + SCX_Hanunoo = 52, + SCX_Hatran = 53, + SCX_Hebrew = 54, + SCX_Hiragana = 55, + SCX_Imperial_Aramaic = 56, + SCX_Inherited = 57, + SCX_Inscriptional_Pahlavi = 58, + SCX_Inscriptional_Parthian = 59, + SCX_INVALID = 60, + SCX_Javanese = 61, + SCX_Jpan = 62, + SCX_Kaithi = 63, + SCX_Kannada = 64, + SCX_Katakana = 65, + SCX_Kayah_Li = 66, + SCX_Kharoshthi = 67, + SCX_Khitan_Small_Script = 68, + SCX_Khmer = 69, + SCX_Khojki = 70, + SCX_Khudawadi = 71, + SCX_Kore = 72, + SCX_Lao = 73, + SCX_Latin = 74, + SCX_Lepcha = 75, + SCX_Limbu = 76, + SCX_Linear_A = 77, + SCX_Linear_B = 78, + SCX_Lisu = 79, + SCX_Lycian = 80, + SCX_Lydian = 81, + SCX_Mahajani = 82, + SCX_Makasar = 83, + SCX_Malayalam = 84, + SCX_Mandaic = 85, + SCX_Manichaean = 86, + SCX_Marchen = 87, + SCX_Masaram_Gondi = 88, + SCX_Medefaidrin = 89, + SCX_Meetei_Mayek = 90, + SCX_Mende_Kikakui = 91, + SCX_Meroitic_Cursive = 92, + SCX_Meroitic_Hieroglyphs = 93, + SCX_Miao = 94, + SCX_Modi = 95, + SCX_Mongolian = 96, + SCX_Mro = 97, + SCX_Multani = 98, + SCX_Myanmar = 99, + SCX_Nabataean = 100, + SCX_Nandinagari = 101, + SCX_New_Tai_Lue = 102, + SCX_Newa = 103, + SCX_Nko = 104, + SCX_Nushu = 105, + SCX_Nyiakeng_Puachue_Hmong = 106, + SCX_Ogham = 107, + SCX_Ol_Chiki = 108, + SCX_Old_Hungarian = 109, + SCX_Old_Italic = 110, + SCX_Old_North_Arabian = 111, + SCX_Old_Permic = 112, + SCX_Old_Persian = 113, + SCX_Old_Sogdian = 114, + SCX_Old_South_Arabian = 115, + SCX_Old_Turkic = 116, + SCX_Old_Uyghur = 117, + SCX_Oriya = 118, + SCX_Osage = 119, + SCX_Osmanya = 120, + SCX_Pahawh_Hmong = 121, + SCX_Palmyrene = 122, + SCX_Pau_Cin_Hau = 123, + SCX_Phags_Pa = 124, + SCX_Phoenician = 125, + SCX_Psalter_Pahlavi = 126, + SCX_Rejang = 127, + SCX_Runic = 128, + SCX_Samaritan = 129, + SCX_Saurashtra = 130, + 
SCX_Sharada = 131, + SCX_Shavian = 132, + SCX_Siddham = 133, + SCX_SignWriting = 134, + SCX_Sinhala = 135, + SCX_Sogdian = 136, + SCX_Sora_Sompeng = 137, + SCX_Soyombo = 138, + SCX_Sundanese = 139, + SCX_Syloti_Nagri = 140, + SCX_Syriac = 141, + SCX_Tagalog = 142, + SCX_Tagbanwa = 143, + SCX_Tai_Le = 144, + SCX_Tai_Tham = 145, + SCX_Tai_Viet = 146, + SCX_Takri = 147, + SCX_Tamil = 148, + SCX_Tangsa = 149, + SCX_Tangut = 150, + SCX_Telugu = 151, + SCX_Thaana = 152, + SCX_Thai = 153, + SCX_Tibetan = 154, + SCX_Tifinagh = 155, + SCX_Tirhuta = 156, + SCX_Toto = 157, + SCX_Ugaritic = 158, + SCX_Vai = 159, + SCX_Vithkuqi = 160, + SCX_Wancho = 161, + SCX_Warang_Citi = 162, + SCX_Yezidi = 163, + SCX_Yi = 164, + SCX_Zanabazar_Square = 165, SCX_use_AUX_TABLE_1 = -1, SCX_use_AUX_TABLE_2 = -2, SCX_use_AUX_TABLE_3 = -3, @@ -74518,7 +75699,11 @@ typedef enum { SCX_use_AUX_TABLE_52 = -52, SCX_use_AUX_TABLE_53 = -53, SCX_use_AUX_TABLE_54 = -54, - SCX_use_AUX_TABLE_55 = -55 + SCX_use_AUX_TABLE_55 = -55, + SCX_use_AUX_TABLE_56 = -56, + SCX_use_AUX_TABLE_57 = -57, + SCX_use_AUX_TABLE_58 = -58, + SCX_use_AUX_TABLE_59 = -59 } SCX_enum; # endif /* ASCII/Latin1 */ @@ -74552,6 +75737,7 @@ static const SCX_enum SCX_AUX_TABLE_4[] = { static const SCX_enum SCX_AUX_TABLE_5[] = { SCX_Arabic, SCX_Hanifi_Rohingya, + SCX_Nko, SCX_Syriac, SCX_Thaana, SCX_Yezidi @@ -74564,33 +75750,44 @@ static const SCX_enum SCX_AUX_TABLE_6[] = { }; static const SCX_enum SCX_AUX_TABLE_7[] = { + SCX_Adlam, + SCX_Arabic, + SCX_Hanifi_Rohingya, + SCX_Nko, + SCX_Syriac, + SCX_Thaana, + SCX_Yezidi +}; + +static const SCX_enum SCX_AUX_TABLE_8[] = { SCX_Adlam, SCX_Arabic, SCX_Hanifi_Rohingya, SCX_Mandaic, SCX_Manichaean, + SCX_Old_Uyghur, SCX_Psalter_Pahlavi, SCX_Sogdian, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_8[] = { +static const SCX_enum SCX_AUX_TABLE_9[] = { SCX_Arabic, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_9[] = { +static const SCX_enum SCX_AUX_TABLE_10[] = { SCX_Arabic, SCX_Thaana, 
SCX_Yezidi }; -static const SCX_enum SCX_AUX_TABLE_10[] = { +static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Arabic, SCX_Hanifi_Rohingya }; -static const SCX_enum SCX_AUX_TABLE_11[] = { +static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -74606,7 +75803,7 @@ static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_12[] = { +static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -74621,7 +75818,7 @@ static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_13[] = { +static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -74644,7 +75841,7 @@ static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_14[] = { +static const SCX_enum SCX_AUX_TABLE_15[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -74668,90 +75865,90 @@ static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_15[] = { +static const SCX_enum SCX_AUX_TABLE_16[] = { SCX_Devanagari, SCX_Dogra, SCX_Kaithi, SCX_Mahajani }; -static const SCX_enum SCX_AUX_TABLE_16[] = { +static const SCX_enum SCX_AUX_TABLE_17[] = { SCX_Bengali, SCX_Chakma, SCX_Syloti_Nagri }; -static const SCX_enum SCX_AUX_TABLE_17[] = { +static const SCX_enum SCX_AUX_TABLE_18[] = { SCX_Gurmukhi, SCX_Multani }; -static const SCX_enum SCX_AUX_TABLE_18[] = { +static const SCX_enum SCX_AUX_TABLE_19[] = { SCX_Gujarati, SCX_Khojki }; -static const SCX_enum SCX_AUX_TABLE_19[] = { +static const SCX_enum SCX_AUX_TABLE_20[] = { SCX_Grantha, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_20[] = { +static const SCX_enum SCX_AUX_TABLE_21[] = { SCX_Kannada, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_21[] = { +static const SCX_enum SCX_AUX_TABLE_22[] = { SCX_Chakma, SCX_Myanmar, SCX_Tai_Le }; -static const SCX_enum SCX_AUX_TABLE_22[] = { +static const SCX_enum SCX_AUX_TABLE_23[] = 
{ SCX_Georgian, SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_23[] = { +static const SCX_enum SCX_AUX_TABLE_24[] = { SCX_Hangul, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_24[] = { +static const SCX_enum SCX_AUX_TABLE_25[] = { SCX_Buhid, SCX_Hanunoo, SCX_Tagalog, SCX_Tagbanwa }; -static const SCX_enum SCX_AUX_TABLE_25[] = { +static const SCX_enum SCX_AUX_TABLE_26[] = { SCX_Mongolian, SCX_Phags_Pa }; -static const SCX_enum SCX_AUX_TABLE_26[] = { +static const SCX_enum SCX_AUX_TABLE_27[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_27[] = { +static const SCX_enum SCX_AUX_TABLE_28[] = { SCX_Devanagari, SCX_Grantha }; -static const SCX_enum SCX_AUX_TABLE_28[] = { +static const SCX_enum SCX_AUX_TABLE_29[] = { SCX_Bengali, SCX_Devanagari }; -static const SCX_enum SCX_AUX_TABLE_29[] = { +static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Devanagari, SCX_Sharada }; -static const SCX_enum SCX_AUX_TABLE_30[] = { +static const SCX_enum SCX_AUX_TABLE_31[] = { SCX_Devanagari, SCX_Kannada, SCX_Malayalam, @@ -74760,12 +75957,12 @@ static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Telugu }; -static const SCX_enum SCX_AUX_TABLE_31[] = { +static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Devanagari, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_32[] = { +static const SCX_enum SCX_AUX_TABLE_33[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -74776,36 +75973,36 @@ static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_33[] = { +static const SCX_enum SCX_AUX_TABLE_34[] = { SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_34[] = { +static const SCX_enum SCX_AUX_TABLE_35[] = { SCX_Cyrillic, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_35[] = { +static const SCX_enum SCX_AUX_TABLE_36[] = { SCX_Latin, SCX_Mongolian }; -static const SCX_enum SCX_AUX_TABLE_36[] = { +static const SCX_enum SCX_AUX_TABLE_37[] = { SCX_Devanagari, SCX_Grantha, 
SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_37[] = { +static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Han, SCX_Hanb, SCX_Jpan, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_38[] = { +static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -74817,7 +76014,7 @@ static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Yi }; -static const SCX_enum SCX_AUX_TABLE_39[] = { +static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -74828,7 +76025,7 @@ static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_40[] = { +static const SCX_enum SCX_AUX_TABLE_41[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -74836,13 +76033,13 @@ static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_41[] = { +static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Hiragana, SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_42[] = { +static const SCX_enum SCX_AUX_TABLE_43[] = { SCX_Han, SCX_Hanb, SCX_Hiragana, @@ -74851,17 +76048,17 @@ static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_43[] = { +static const SCX_enum SCX_AUX_TABLE_44[] = { SCX_Hiragana, SCX_Jpan }; -static const SCX_enum SCX_AUX_TABLE_44[] = { +static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_45[] = { +static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Han, SCX_Hanb, SCX_Jpan, @@ -74869,7 +76066,7 @@ static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_46[] = { +static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -74886,7 +76083,7 @@ static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_47[] = { +static const SCX_enum SCX_AUX_TABLE_48[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -74902,7 +76099,7 @@ static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Tirhuta }; -static const SCX_enum 
SCX_AUX_TABLE_48[] = { +static const SCX_enum SCX_AUX_TABLE_49[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -74916,43 +76113,59 @@ static const SCX_enum SCX_AUX_TABLE_48[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_49[] = { +static const SCX_enum SCX_AUX_TABLE_50[] = { SCX_Devanagari, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_50[] = { +static const SCX_enum SCX_AUX_TABLE_51[] = { SCX_Kayah_Li, SCX_Latin, SCX_Myanmar }; -static const SCX_enum SCX_AUX_TABLE_51[] = { +static const SCX_enum SCX_AUX_TABLE_52[] = { SCX_Buginese, SCX_Javanese }; -static const SCX_enum SCX_AUX_TABLE_52[] = { +static const SCX_enum SCX_AUX_TABLE_53[] = { + SCX_Arabic, + SCX_Nko +}; + +static const SCX_enum SCX_AUX_TABLE_54[] = { SCX_Arabic, SCX_Thaana }; -static const SCX_enum SCX_AUX_TABLE_53[] = { +static const SCX_enum SCX_AUX_TABLE_55[] = { SCX_Cypriot, + SCX_Cypro_Minoan, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_54[] = { +static const SCX_enum SCX_AUX_TABLE_56[] = { + SCX_Cypriot, + SCX_Linear_B +}; + +static const SCX_enum SCX_AUX_TABLE_57[] = { SCX_Cypriot, SCX_Linear_A, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_55[] = { +static const SCX_enum SCX_AUX_TABLE_58[] = { SCX_Arabic, SCX_Coptic }; +static const SCX_enum SCX_AUX_TABLE_59[] = { + SCX_Manichaean, + SCX_Old_Uyghur +}; + static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { NULL, /* Placeholder */ SCX_AUX_TABLE_1, @@ -75009,7 +76222,11 @@ static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { SCX_AUX_TABLE_52, SCX_AUX_TABLE_53, SCX_AUX_TABLE_54, - SCX_AUX_TABLE_55 + SCX_AUX_TABLE_55, + SCX_AUX_TABLE_56, + SCX_AUX_TABLE_57, + SCX_AUX_TABLE_58, + SCX_AUX_TABLE_59 }; /* Parallel table to the above, giving the number of elements in each table @@ -75021,57 +76238,61 @@ static const U8 SCX_AUX_TABLE_lengths[] = { 2 /* SCX_AUX_TABLE_2 */, 2 /* SCX_AUX_TABLE_3 */, 2 /* SCX_AUX_TABLE_4 */, - 5 /* SCX_AUX_TABLE_5 */, + 6 /* SCX_AUX_TABLE_5 */, 3 /* SCX_AUX_TABLE_6 */, - 8 /* 
SCX_AUX_TABLE_7 */, - 2 /* SCX_AUX_TABLE_8 */, - 3 /* SCX_AUX_TABLE_9 */, - 2 /* SCX_AUX_TABLE_10 */, - 13 /* SCX_AUX_TABLE_11 */, - 12 /* SCX_AUX_TABLE_12 */, - 20 /* SCX_AUX_TABLE_13 */, - 21 /* SCX_AUX_TABLE_14 */, - 4 /* SCX_AUX_TABLE_15 */, - 3 /* SCX_AUX_TABLE_16 */, - 2 /* SCX_AUX_TABLE_17 */, + 7 /* SCX_AUX_TABLE_7 */, + 9 /* SCX_AUX_TABLE_8 */, + 2 /* SCX_AUX_TABLE_9 */, + 3 /* SCX_AUX_TABLE_10 */, + 2 /* SCX_AUX_TABLE_11 */, + 13 /* SCX_AUX_TABLE_12 */, + 12 /* SCX_AUX_TABLE_13 */, + 20 /* SCX_AUX_TABLE_14 */, + 21 /* SCX_AUX_TABLE_15 */, + 4 /* SCX_AUX_TABLE_16 */, + 3 /* SCX_AUX_TABLE_17 */, 2 /* SCX_AUX_TABLE_18 */, 2 /* SCX_AUX_TABLE_19 */, 2 /* SCX_AUX_TABLE_20 */, - 3 /* SCX_AUX_TABLE_21 */, - 2 /* SCX_AUX_TABLE_22 */, + 2 /* SCX_AUX_TABLE_21 */, + 3 /* SCX_AUX_TABLE_22 */, 2 /* SCX_AUX_TABLE_23 */, - 4 /* SCX_AUX_TABLE_24 */, - 2 /* SCX_AUX_TABLE_25 */, - 4 /* SCX_AUX_TABLE_26 */, - 2 /* SCX_AUX_TABLE_27 */, + 2 /* SCX_AUX_TABLE_24 */, + 4 /* SCX_AUX_TABLE_25 */, + 2 /* SCX_AUX_TABLE_26 */, + 4 /* SCX_AUX_TABLE_27 */, 2 /* SCX_AUX_TABLE_28 */, 2 /* SCX_AUX_TABLE_29 */, - 6 /* SCX_AUX_TABLE_30 */, - 2 /* SCX_AUX_TABLE_31 */, - 8 /* SCX_AUX_TABLE_32 */, - 3 /* SCX_AUX_TABLE_33 */, - 2 /* SCX_AUX_TABLE_34 */, + 2 /* SCX_AUX_TABLE_30 */, + 6 /* SCX_AUX_TABLE_31 */, + 2 /* SCX_AUX_TABLE_32 */, + 8 /* SCX_AUX_TABLE_33 */, + 3 /* SCX_AUX_TABLE_34 */, 2 /* SCX_AUX_TABLE_35 */, - 3 /* SCX_AUX_TABLE_36 */, - 4 /* SCX_AUX_TABLE_37 */, - 9 /* SCX_AUX_TABLE_38 */, - 8 /* SCX_AUX_TABLE_39 */, - 5 /* SCX_AUX_TABLE_40 */, - 3 /* SCX_AUX_TABLE_41 */, - 6 /* SCX_AUX_TABLE_42 */, - 2 /* SCX_AUX_TABLE_43 */, + 2 /* SCX_AUX_TABLE_36 */, + 3 /* SCX_AUX_TABLE_37 */, + 4 /* SCX_AUX_TABLE_38 */, + 9 /* SCX_AUX_TABLE_39 */, + 8 /* SCX_AUX_TABLE_40 */, + 5 /* SCX_AUX_TABLE_41 */, + 3 /* SCX_AUX_TABLE_42 */, + 6 /* SCX_AUX_TABLE_43 */, 2 /* SCX_AUX_TABLE_44 */, - 5 /* SCX_AUX_TABLE_45 */, - 14 /* SCX_AUX_TABLE_46 */, - 13 /* SCX_AUX_TABLE_47 */, - 11 /* SCX_AUX_TABLE_48 */, - 
2 /* SCX_AUX_TABLE_49 */, - 3 /* SCX_AUX_TABLE_50 */, - 2 /* SCX_AUX_TABLE_51 */, + 2 /* SCX_AUX_TABLE_45 */, + 5 /* SCX_AUX_TABLE_46 */, + 14 /* SCX_AUX_TABLE_47 */, + 13 /* SCX_AUX_TABLE_48 */, + 11 /* SCX_AUX_TABLE_49 */, + 2 /* SCX_AUX_TABLE_50 */, + 3 /* SCX_AUX_TABLE_51 */, 2 /* SCX_AUX_TABLE_52 */, 2 /* SCX_AUX_TABLE_53 */, - 3 /* SCX_AUX_TABLE_54 */, - 2 /* SCX_AUX_TABLE_55 */ + 2 /* SCX_AUX_TABLE_54 */, + 3 /* SCX_AUX_TABLE_55 */, + 2 /* SCX_AUX_TABLE_56 */, + 3 /* SCX_AUX_TABLE_57 */, + 2 /* SCX_AUX_TABLE_58 */, + 2 /* SCX_AUX_TABLE_59 */ }; /* This table, indexed by the script enum, gives the zero code point for that @@ -75108,6 +76329,7 @@ static const UV script_zeros[] = { '0', /* Coptic */ '0', /* Cuneiform */ '0', /* Cypriot */ + '0', /* Cypro_Minoan */ '0', /* Cyrillic */ '0', /* Deseret */ 0x966, /* Devanagari */ @@ -75195,6 +76417,7 @@ static const UV script_zeros[] = { '0', /* Old_Sogdian */ '0', /* Old_South_Arabian */ '0', /* Old_Turkic */ + '0', /* Old_Uyghur */ 0xb66, /* Oriya */ '0', /* Osage */ 0x104a0, /* Osmanya */ @@ -75226,6 +76449,7 @@ static const UV script_zeros[] = { '0', /* Tai_Viet */ 0x116c0, /* Takri */ 0xbe6, /* Tamil */ + 0x16ac0, /* Tangsa */ '0', /* Tangut */ 0xc66, /* Telugu */ 0x660, /* Thaana */ @@ -75233,8 +76457,10 @@ static const UV script_zeros[] = { 0xf20, /* Tibetan */ '0', /* Tifinagh */ 0x114d0, /* Tirhuta */ + '0', /* Toto */ '0', /* Ugaritic */ 0xa620, /* Vai */ + '0', /* Vithkuqi */ 0x1e2f0, /* Wancho */ 0x118e0, /* Warang_Citi */ 0x660 /* Yezidi */ @@ -75313,9 +76539,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Arabic, SCX_use_AUX_TABLE_5, SCX_use_AUX_TABLE_6, - SCX_Unknown, - SCX_Arabic, - SCX_use_AUX_TABLE_5, SCX_Arabic, SCX_use_AUX_TABLE_7, SCX_Arabic, @@ -75323,10 +76546,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Arabic, SCX_use_AUX_TABLE_9, SCX_Arabic, - SCX_use_AUX_TABLE_8, - SCX_Arabic, SCX_use_AUX_TABLE_10, SCX_Arabic, + 
SCX_use_AUX_TABLE_9, + SCX_Arabic, + SCX_use_AUX_TABLE_11, + SCX_Arabic, SCX_Common, SCX_Arabic, SCX_Syriac, @@ -75358,13 +76583,13 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Common, SCX_Arabic, SCX_Devanagari, - SCX_use_AUX_TABLE_11, SCX_use_AUX_TABLE_12, + SCX_use_AUX_TABLE_13, SCX_Inherited, SCX_Devanagari, - SCX_use_AUX_TABLE_13, SCX_use_AUX_TABLE_14, SCX_use_AUX_TABLE_15, + SCX_use_AUX_TABLE_16, SCX_Devanagari, SCX_Bengali, SCX_Unknown, @@ -75392,7 +76617,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Bengali, SCX_Unknown, - SCX_use_AUX_TABLE_16, + SCX_use_AUX_TABLE_17, SCX_Bengali, SCX_Unknown, SCX_Gurmukhi, @@ -75425,7 +76650,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Gurmukhi, SCX_Unknown, - SCX_use_AUX_TABLE_17, + SCX_use_AUX_TABLE_18, SCX_Gurmukhi, SCX_Unknown, SCX_Gujarati, @@ -75452,7 +76677,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Gujarati, SCX_Unknown, - SCX_use_AUX_TABLE_18, + SCX_use_AUX_TABLE_19, SCX_Gujarati, SCX_Unknown, SCX_Gujarati, @@ -75515,7 +76740,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Tamil, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Telugu, @@ -75541,6 +76766,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Telugu, SCX_Unknown, SCX_Telugu, + SCX_Unknown, + SCX_Telugu, SCX_Kannada, SCX_Unknown, SCX_Kannada, @@ -75563,7 +76790,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Kannada, SCX_Unknown, - SCX_use_AUX_TABLE_20, + SCX_use_AUX_TABLE_21, SCX_Unknown, SCX_Kannada, SCX_Unknown, @@ -75647,7 +76874,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Tibetan, SCX_Unknown, SCX_Myanmar, - SCX_use_AUX_TABLE_21, + SCX_use_AUX_TABLE_22, SCX_Myanmar, SCX_Georgian, SCX_Unknown, @@ -75656,9 
+76883,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Georgian, SCX_Unknown, SCX_Georgian, - SCX_use_AUX_TABLE_22, - SCX_Georgian, SCX_use_AUX_TABLE_23, + SCX_Georgian, + SCX_use_AUX_TABLE_24, SCX_Ethiopic, SCX_Unknown, SCX_Ethiopic, @@ -75709,9 +76936,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Tagalog, SCX_Unknown, SCX_Tagalog, - SCX_Unknown, SCX_Hanunoo, - SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_25, SCX_Unknown, SCX_Buhid, SCX_Unknown, @@ -75728,11 +76954,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Khmer, SCX_Unknown, SCX_Mongolian, - SCX_use_AUX_TABLE_25, - SCX_Mongolian, - SCX_use_AUX_TABLE_25, + SCX_use_AUX_TABLE_26, SCX_Mongolian, - SCX_Unknown, + SCX_use_AUX_TABLE_26, SCX_Mongolian, SCX_Unknown, SCX_Mongolian, @@ -75798,33 +77022,33 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Georgian, SCX_Sundanese, SCX_Unknown, - SCX_use_AUX_TABLE_26, - SCX_Devanagari, - SCX_use_AUX_TABLE_26, SCX_use_AUX_TABLE_27, SCX_Devanagari, + SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_28, + SCX_Devanagari, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, SCX_use_AUX_TABLE_30, + SCX_use_AUX_TABLE_31, SCX_Devanagari, - SCX_use_AUX_TABLE_29, + SCX_use_AUX_TABLE_30, SCX_Devanagari, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, SCX_Devanagari, - SCX_use_AUX_TABLE_31, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_32, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_32, - SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_33, SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_29, SCX_Bengali, - SCX_use_AUX_TABLE_27, + SCX_use_AUX_TABLE_28, SCX_Nandinagari, SCX_Unknown, SCX_Latin, @@ -75839,9 +77063,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Latin, SCX_Greek, SCX_Inherited, - 
SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_35, SCX_Inherited, - SCX_Unknown, + SCX_Syriac, SCX_Inherited, SCX_Latin, SCX_Greek, @@ -75879,7 +77103,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Common, SCX_Inherited, SCX_Common, - SCX_use_AUX_TABLE_35, + SCX_use_AUX_TABLE_36, SCX_Common, SCX_Unknown, SCX_Common, @@ -75894,7 +77118,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Common, SCX_Unknown, SCX_Inherited, - SCX_use_AUX_TABLE_36, + SCX_use_AUX_TABLE_37, SCX_Unknown, SCX_Common, SCX_Greek, @@ -75920,9 +77144,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Common, SCX_Glagolitic, - SCX_Unknown, - SCX_Glagolitic, - SCX_Unknown, SCX_Latin, SCX_Coptic, SCX_Unknown, @@ -75961,78 +77182,77 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_use_AUX_TABLE_3, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_38, - SCX_Common, - SCX_use_AUX_TABLE_39, SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, SCX_Common, - SCX_use_AUX_TABLE_37, SCX_use_AUX_TABLE_40, - SCX_use_AUX_TABLE_23, SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_40, SCX_use_AUX_TABLE_42, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_Common, + SCX_use_AUX_TABLE_40, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_43, - SCX_use_AUX_TABLE_41, SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_41, + SCX_Unknown, + 
SCX_use_AUX_TABLE_42, SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, SCX_Unknown, SCX_use_AUX_TABLE_1, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_1, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_use_AUX_TABLE_38, SCX_Yi, SCX_Unknown, SCX_Yi, @@ -76045,7 +77265,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Cyrillic, SCX_Bamum, SCX_Unknown, - SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_46, SCX_Common, SCX_Latin, SCX_Common, @@ -76054,11 +77274,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Latin, SCX_Unknown, SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, SCX_Syloti_Nagri, SCX_Unknown, - SCX_use_AUX_TABLE_46, SCX_use_AUX_TABLE_47, SCX_use_AUX_TABLE_48, + SCX_use_AUX_TABLE_49, SCX_Unknown, SCX_Phags_Pa, SCX_Unknown, @@ -76067,21 +77291,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Saurashtra, SCX_Unknown, SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - 
SCX_use_AUX_TABLE_49, + SCX_use_AUX_TABLE_50, SCX_Devanagari, SCX_Kayah_Li, - SCX_use_AUX_TABLE_50, + SCX_use_AUX_TABLE_51, SCX_Kayah_Li, SCX_Rejang, SCX_Unknown, SCX_Rejang, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Javanese, SCX_Unknown, - SCX_use_AUX_TABLE_51, + SCX_use_AUX_TABLE_52, SCX_Javanese, SCX_Unknown, SCX_Javanese, @@ -76122,15 +77346,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Meetei_Mayek, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Latin, SCX_Unknown, @@ -76150,24 +77374,25 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_Common, + SCX_use_AUX_TABLE_53, + SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_use_AUX_TABLE_52, + SCX_use_AUX_TABLE_54, + SCX_Arabic, + SCX_use_AUX_TABLE_54, SCX_Arabic, - SCX_use_AUX_TABLE_52, - SCX_Unknown, SCX_Inherited, SCX_Common, SCX_Unknown, SCX_Inherited, SCX_Cyrillic, SCX_Common, - SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, SCX_Unknown, SCX_Common, @@ -76185,20 +77410,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Common, SCX_Latin, SCX_Common, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - 
SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -76220,11 +77445,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Linear_B, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_56, SCX_Unknown, - SCX_use_AUX_TABLE_54, + SCX_use_AUX_TABLE_57, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_56, SCX_Greek, SCX_Unknown, SCX_Common, @@ -76238,7 +77464,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Carian, SCX_Unknown, - SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_58, SCX_Unknown, SCX_Old_Italic, SCX_Unknown, @@ -76269,6 +77495,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Caucasian_Albanian, SCX_Unknown, SCX_Caucasian_Albanian, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, SCX_Unknown, SCX_Linear_A, SCX_Unknown, @@ -76276,6 +77517,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Linear_A, SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Cypriot, SCX_Unknown, SCX_Cypriot, @@ -76335,6 +77582,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Manichaean, SCX_Unknown, SCX_Manichaean, + SCX_use_AUX_TABLE_59, + SCX_Manichaean, SCX_Unknown, SCX_Avestan, SCX_Unknown, @@ -76374,6 +77623,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Sogdian, SCX_Unknown, + SCX_Old_Uyghur, + SCX_Unknown, SCX_Chorasmian, SCX_Unknown, SCX_Elymaic, @@ -76420,9 +77671,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Khudawadi, SCX_Unknown, SCX_Grantha, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, - SCX_use_AUX_TABLE_19, + 
SCX_use_AUX_TABLE_20, SCX_Unknown, SCX_Grantha, SCX_Unknown, @@ -76436,7 +77687,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Grantha, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, SCX_Unknown, SCX_Grantha, @@ -76512,6 +77763,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Soyombo, SCX_Unknown, + SCX_Canadian_Aboriginal, SCX_Pau_Cin_Hau, SCX_Unknown, SCX_Bhaiksuki, @@ -76559,9 +77811,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Lisu, SCX_Unknown, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Tamil, @@ -76573,6 +77825,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Cuneiform, SCX_Unknown, + SCX_Cypro_Minoan, + SCX_Unknown, SCX_Egyptian_Hieroglyphs, SCX_Unknown, SCX_Egyptian_Hieroglyphs, @@ -76586,6 +77840,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Mro, SCX_Unknown, SCX_Mro, + SCX_Tangsa, + SCX_Unknown, + SCX_Tangsa, SCX_Unknown, SCX_Bassa_Vah, SCX_Unknown, @@ -76611,10 +77868,10 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Tangut, SCX_Nushu, - SCX_Common, + SCX_use_AUX_TABLE_38, SCX_Khitan_Small_Script, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Tangut, SCX_Unknown, @@ -76623,13 +77880,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Tangut, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, SCX_Unknown, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_45, SCX_Unknown, SCX_use_AUX_TABLE_44, SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_Unknown, SCX_Nushu, SCX_Unknown, SCX_Duployan, 
@@ -76642,6 +77906,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Duployan, SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Common, + SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, @@ -76662,7 +77932,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, SCX_Unknown, SCX_Common, @@ -76712,6 +77982,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_SignWriting, SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Glagolitic, SCX_Unknown, SCX_Glagolitic, @@ -76730,10 +78002,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Nyiakeng_Puachue_Hmong, SCX_Unknown, + SCX_Toto, + SCX_Unknown, SCX_Wancho, SCX_Unknown, SCX_Wancho, SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, SCX_Mende_Kikakui, SCX_Unknown, SCX_Mende_Kikakui, @@ -76831,14 +78113,14 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_44, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -76894,19 +78176,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_Unknown, + 
SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -76928,7 +78212,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ - 1699, /* Number of elements */ + 1757, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -77031,7 +78315,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x61F, 0x620, 0x640, @@ -77067,11 +78350,11 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8E2, 0x8E3, 0x900, @@ -77243,7 +78526,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -77253,6 +78536,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -77276,7 +78561,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -77424,9 +78709,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, + 0x1716, + 0x171F, 0x1720, 0x1735, 0x1737, @@ -77449,8 +78733,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1804, 0x1805, 0x1806, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -77493,11 +78775,11 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BC0, 0x1BF4, @@ -77609,7 +78891,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F0, 0x20F1, @@ -77637,9 +78919,6 @@ static const UV 
_Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x2B96, 0x2B97, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, 0x2C60, 0x2C80, 0x2CF4, @@ -77677,7 +78956,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -77749,7 +79028,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, 0xA000, 0xA48D, 0xA490, @@ -77767,10 +79045,14 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA82D, 0xA830, @@ -77865,14 +79147,15 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0xFB45, 0xFB46, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDF2, 0xFDF3, @@ -77938,6 +79221,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x10080, 0x100FB, 0x10100, + 0x10102, 0x10103, 0x10107, 0x10134, @@ -77987,12 +79271,33 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x10564, 0x1056F, 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -78052,6 +79357,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x10AC0, 0x10AE7, 0x10AEB, + 0x10AF2, + 0x10AF3, 0x10AF7, 0x10B00, 0x10B36, @@ -78091,6 +79398,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -78098,10 +79407,10 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x11080, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 
0x110D0, @@ -78189,7 +79498,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -78197,7 +79506,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -78229,6 +79538,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x11A48, 0x11A50, 0x11AA3, + 0x11AB0, 0x11AC0, 0x11AF9, 0x11C00, @@ -78290,6 +79600,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -78304,6 +79616,9 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -78340,9 +79655,16 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, - 0x1B11F, + 0x1B120, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -78359,6 +79681,12 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -78372,7 +79700,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -78429,6 +79757,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -78447,10 +79777,20 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -78561,7 +79901,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 
0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -78571,6 +79911,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -78584,27 +79926,27 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -78612,9 +79954,9 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -78676,138 +80018,143 @@ typedef enum { SCX_Coptic = 26, SCX_Cuneiform = 27, SCX_Cypriot = 28, - SCX_Cyrillic = 29, - SCX_Deseret = 30, - SCX_Devanagari = 31, - SCX_Dives_Akuru = 32, - SCX_Dogra = 33, - SCX_Duployan = 34, - SCX_Egyptian_Hieroglyphs = 35, - SCX_Elbasan = 36, - SCX_Elymaic = 37, - SCX_Ethiopic = 38, - SCX_Georgian = 39, - SCX_Glagolitic = 40, - SCX_Gothic = 41, - SCX_Grantha = 42, - SCX_Greek = 43, - SCX_Gujarati = 44, - SCX_Gunjala_Gondi = 45, - SCX_Gurmukhi = 46, - SCX_Han = 47, - SCX_Hanb = 48, - SCX_Hangul = 49, - SCX_Hanifi_Rohingya = 50, - SCX_Hanunoo = 51, - SCX_Hatran = 52, - SCX_Hebrew = 53, - SCX_Hiragana = 54, - SCX_Imperial_Aramaic = 55, - SCX_Inherited = 56, - SCX_Inscriptional_Pahlavi = 57, - SCX_Inscriptional_Parthian = 58, - SCX_INVALID = 59, - SCX_Javanese = 60, - SCX_Jpan = 61, - SCX_Kaithi = 62, - SCX_Kannada = 63, - SCX_Katakana = 64, - SCX_Kayah_Li = 65, - SCX_Kharoshthi = 66, - SCX_Khitan_Small_Script = 67, - SCX_Khmer = 68, - SCX_Khojki = 69, - SCX_Khudawadi = 70, - SCX_Kore = 71, - SCX_Lao = 72, - SCX_Latin = 73, - SCX_Lepcha = 74, - SCX_Limbu = 75, - SCX_Linear_A = 76, - 
SCX_Linear_B = 77, - SCX_Lisu = 78, - SCX_Lycian = 79, - SCX_Lydian = 80, - SCX_Mahajani = 81, - SCX_Makasar = 82, - SCX_Malayalam = 83, - SCX_Mandaic = 84, - SCX_Manichaean = 85, - SCX_Marchen = 86, - SCX_Masaram_Gondi = 87, - SCX_Medefaidrin = 88, - SCX_Meetei_Mayek = 89, - SCX_Mende_Kikakui = 90, - SCX_Meroitic_Cursive = 91, - SCX_Meroitic_Hieroglyphs = 92, - SCX_Miao = 93, - SCX_Modi = 94, - SCX_Mongolian = 95, - SCX_Mro = 96, - SCX_Multani = 97, - SCX_Myanmar = 98, - SCX_Nabataean = 99, - SCX_Nandinagari = 100, - SCX_New_Tai_Lue = 101, - SCX_Newa = 102, - SCX_Nko = 103, - SCX_Nushu = 104, - SCX_Nyiakeng_Puachue_Hmong = 105, - SCX_Ogham = 106, - SCX_Ol_Chiki = 107, - SCX_Old_Hungarian = 108, - SCX_Old_Italic = 109, - SCX_Old_North_Arabian = 110, - SCX_Old_Permic = 111, - SCX_Old_Persian = 112, - SCX_Old_Sogdian = 113, - SCX_Old_South_Arabian = 114, - SCX_Old_Turkic = 115, - SCX_Oriya = 116, - SCX_Osage = 117, - SCX_Osmanya = 118, - SCX_Pahawh_Hmong = 119, - SCX_Palmyrene = 120, - SCX_Pau_Cin_Hau = 121, - SCX_Phags_Pa = 122, - SCX_Phoenician = 123, - SCX_Psalter_Pahlavi = 124, - SCX_Rejang = 125, - SCX_Runic = 126, - SCX_Samaritan = 127, - SCX_Saurashtra = 128, - SCX_Sharada = 129, - SCX_Shavian = 130, - SCX_Siddham = 131, - SCX_SignWriting = 132, - SCX_Sinhala = 133, - SCX_Sogdian = 134, - SCX_Sora_Sompeng = 135, - SCX_Soyombo = 136, - SCX_Sundanese = 137, - SCX_Syloti_Nagri = 138, - SCX_Syriac = 139, - SCX_Tagalog = 140, - SCX_Tagbanwa = 141, - SCX_Tai_Le = 142, - SCX_Tai_Tham = 143, - SCX_Tai_Viet = 144, - SCX_Takri = 145, - SCX_Tamil = 146, - SCX_Tangut = 147, - SCX_Telugu = 148, - SCX_Thaana = 149, - SCX_Thai = 150, - SCX_Tibetan = 151, - SCX_Tifinagh = 152, - SCX_Tirhuta = 153, - SCX_Ugaritic = 154, - SCX_Vai = 155, - SCX_Wancho = 156, - SCX_Warang_Citi = 157, - SCX_Yezidi = 158, - SCX_Yi = 159, - SCX_Zanabazar_Square = 160, + SCX_Cypro_Minoan = 29, + SCX_Cyrillic = 30, + SCX_Deseret = 31, + SCX_Devanagari = 32, + SCX_Dives_Akuru = 33, + SCX_Dogra = 34, + 
SCX_Duployan = 35, + SCX_Egyptian_Hieroglyphs = 36, + SCX_Elbasan = 37, + SCX_Elymaic = 38, + SCX_Ethiopic = 39, + SCX_Georgian = 40, + SCX_Glagolitic = 41, + SCX_Gothic = 42, + SCX_Grantha = 43, + SCX_Greek = 44, + SCX_Gujarati = 45, + SCX_Gunjala_Gondi = 46, + SCX_Gurmukhi = 47, + SCX_Han = 48, + SCX_Hanb = 49, + SCX_Hangul = 50, + SCX_Hanifi_Rohingya = 51, + SCX_Hanunoo = 52, + SCX_Hatran = 53, + SCX_Hebrew = 54, + SCX_Hiragana = 55, + SCX_Imperial_Aramaic = 56, + SCX_Inherited = 57, + SCX_Inscriptional_Pahlavi = 58, + SCX_Inscriptional_Parthian = 59, + SCX_INVALID = 60, + SCX_Javanese = 61, + SCX_Jpan = 62, + SCX_Kaithi = 63, + SCX_Kannada = 64, + SCX_Katakana = 65, + SCX_Kayah_Li = 66, + SCX_Kharoshthi = 67, + SCX_Khitan_Small_Script = 68, + SCX_Khmer = 69, + SCX_Khojki = 70, + SCX_Khudawadi = 71, + SCX_Kore = 72, + SCX_Lao = 73, + SCX_Latin = 74, + SCX_Lepcha = 75, + SCX_Limbu = 76, + SCX_Linear_A = 77, + SCX_Linear_B = 78, + SCX_Lisu = 79, + SCX_Lycian = 80, + SCX_Lydian = 81, + SCX_Mahajani = 82, + SCX_Makasar = 83, + SCX_Malayalam = 84, + SCX_Mandaic = 85, + SCX_Manichaean = 86, + SCX_Marchen = 87, + SCX_Masaram_Gondi = 88, + SCX_Medefaidrin = 89, + SCX_Meetei_Mayek = 90, + SCX_Mende_Kikakui = 91, + SCX_Meroitic_Cursive = 92, + SCX_Meroitic_Hieroglyphs = 93, + SCX_Miao = 94, + SCX_Modi = 95, + SCX_Mongolian = 96, + SCX_Mro = 97, + SCX_Multani = 98, + SCX_Myanmar = 99, + SCX_Nabataean = 100, + SCX_Nandinagari = 101, + SCX_New_Tai_Lue = 102, + SCX_Newa = 103, + SCX_Nko = 104, + SCX_Nushu = 105, + SCX_Nyiakeng_Puachue_Hmong = 106, + SCX_Ogham = 107, + SCX_Ol_Chiki = 108, + SCX_Old_Hungarian = 109, + SCX_Old_Italic = 110, + SCX_Old_North_Arabian = 111, + SCX_Old_Permic = 112, + SCX_Old_Persian = 113, + SCX_Old_Sogdian = 114, + SCX_Old_South_Arabian = 115, + SCX_Old_Turkic = 116, + SCX_Old_Uyghur = 117, + SCX_Oriya = 118, + SCX_Osage = 119, + SCX_Osmanya = 120, + SCX_Pahawh_Hmong = 121, + SCX_Palmyrene = 122, + SCX_Pau_Cin_Hau = 123, + SCX_Phags_Pa = 124, + 
SCX_Phoenician = 125, + SCX_Psalter_Pahlavi = 126, + SCX_Rejang = 127, + SCX_Runic = 128, + SCX_Samaritan = 129, + SCX_Saurashtra = 130, + SCX_Sharada = 131, + SCX_Shavian = 132, + SCX_Siddham = 133, + SCX_SignWriting = 134, + SCX_Sinhala = 135, + SCX_Sogdian = 136, + SCX_Sora_Sompeng = 137, + SCX_Soyombo = 138, + SCX_Sundanese = 139, + SCX_Syloti_Nagri = 140, + SCX_Syriac = 141, + SCX_Tagalog = 142, + SCX_Tagbanwa = 143, + SCX_Tai_Le = 144, + SCX_Tai_Tham = 145, + SCX_Tai_Viet = 146, + SCX_Takri = 147, + SCX_Tamil = 148, + SCX_Tangsa = 149, + SCX_Tangut = 150, + SCX_Telugu = 151, + SCX_Thaana = 152, + SCX_Thai = 153, + SCX_Tibetan = 154, + SCX_Tifinagh = 155, + SCX_Tirhuta = 156, + SCX_Toto = 157, + SCX_Ugaritic = 158, + SCX_Vai = 159, + SCX_Vithkuqi = 160, + SCX_Wancho = 161, + SCX_Warang_Citi = 162, + SCX_Yezidi = 163, + SCX_Yi = 164, + SCX_Zanabazar_Square = 165, SCX_use_AUX_TABLE_1 = -1, SCX_use_AUX_TABLE_2 = -2, SCX_use_AUX_TABLE_3 = -3, @@ -78862,7 +80209,11 @@ typedef enum { SCX_use_AUX_TABLE_52 = -52, SCX_use_AUX_TABLE_53 = -53, SCX_use_AUX_TABLE_54 = -54, - SCX_use_AUX_TABLE_55 = -55 + SCX_use_AUX_TABLE_55 = -55, + SCX_use_AUX_TABLE_56 = -56, + SCX_use_AUX_TABLE_57 = -57, + SCX_use_AUX_TABLE_58 = -58, + SCX_use_AUX_TABLE_59 = -59 } SCX_enum; # endif /* EBCDIC 1047 */ @@ -78899,6 +80250,7 @@ static const SCX_enum SCX_AUX_TABLE_4[] = { static const SCX_enum SCX_AUX_TABLE_5[] = { SCX_Arabic, SCX_Hanifi_Rohingya, + SCX_Nko, SCX_Syriac, SCX_Thaana, SCX_Yezidi @@ -78911,33 +80263,44 @@ static const SCX_enum SCX_AUX_TABLE_6[] = { }; static const SCX_enum SCX_AUX_TABLE_7[] = { + SCX_Adlam, + SCX_Arabic, + SCX_Hanifi_Rohingya, + SCX_Nko, + SCX_Syriac, + SCX_Thaana, + SCX_Yezidi +}; + +static const SCX_enum SCX_AUX_TABLE_8[] = { SCX_Adlam, SCX_Arabic, SCX_Hanifi_Rohingya, SCX_Mandaic, SCX_Manichaean, + SCX_Old_Uyghur, SCX_Psalter_Pahlavi, SCX_Sogdian, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_8[] = { +static const SCX_enum SCX_AUX_TABLE_9[] = { SCX_Arabic, 
SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_9[] = { +static const SCX_enum SCX_AUX_TABLE_10[] = { SCX_Arabic, SCX_Thaana, SCX_Yezidi }; -static const SCX_enum SCX_AUX_TABLE_10[] = { +static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Arabic, SCX_Hanifi_Rohingya }; -static const SCX_enum SCX_AUX_TABLE_11[] = { +static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -78953,7 +80316,7 @@ static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_12[] = { +static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -78968,7 +80331,7 @@ static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_13[] = { +static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -78991,7 +80354,7 @@ static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_14[] = { +static const SCX_enum SCX_AUX_TABLE_15[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -79015,90 +80378,90 @@ static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_15[] = { +static const SCX_enum SCX_AUX_TABLE_16[] = { SCX_Devanagari, SCX_Dogra, SCX_Kaithi, SCX_Mahajani }; -static const SCX_enum SCX_AUX_TABLE_16[] = { +static const SCX_enum SCX_AUX_TABLE_17[] = { SCX_Bengali, SCX_Chakma, SCX_Syloti_Nagri }; -static const SCX_enum SCX_AUX_TABLE_17[] = { +static const SCX_enum SCX_AUX_TABLE_18[] = { SCX_Gurmukhi, SCX_Multani }; -static const SCX_enum SCX_AUX_TABLE_18[] = { +static const SCX_enum SCX_AUX_TABLE_19[] = { SCX_Gujarati, SCX_Khojki }; -static const SCX_enum SCX_AUX_TABLE_19[] = { +static const SCX_enum SCX_AUX_TABLE_20[] = { SCX_Grantha, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_20[] = { +static const SCX_enum SCX_AUX_TABLE_21[] = { SCX_Kannada, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_21[] = { +static const SCX_enum SCX_AUX_TABLE_22[] = { 
SCX_Chakma, SCX_Myanmar, SCX_Tai_Le }; -static const SCX_enum SCX_AUX_TABLE_22[] = { +static const SCX_enum SCX_AUX_TABLE_23[] = { SCX_Georgian, SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_23[] = { +static const SCX_enum SCX_AUX_TABLE_24[] = { SCX_Hangul, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_24[] = { +static const SCX_enum SCX_AUX_TABLE_25[] = { SCX_Buhid, SCX_Hanunoo, SCX_Tagalog, SCX_Tagbanwa }; -static const SCX_enum SCX_AUX_TABLE_25[] = { +static const SCX_enum SCX_AUX_TABLE_26[] = { SCX_Mongolian, SCX_Phags_Pa }; -static const SCX_enum SCX_AUX_TABLE_26[] = { +static const SCX_enum SCX_AUX_TABLE_27[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_27[] = { +static const SCX_enum SCX_AUX_TABLE_28[] = { SCX_Devanagari, SCX_Grantha }; -static const SCX_enum SCX_AUX_TABLE_28[] = { +static const SCX_enum SCX_AUX_TABLE_29[] = { SCX_Bengali, SCX_Devanagari }; -static const SCX_enum SCX_AUX_TABLE_29[] = { +static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Devanagari, SCX_Sharada }; -static const SCX_enum SCX_AUX_TABLE_30[] = { +static const SCX_enum SCX_AUX_TABLE_31[] = { SCX_Devanagari, SCX_Kannada, SCX_Malayalam, @@ -79107,12 +80470,12 @@ static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Telugu }; -static const SCX_enum SCX_AUX_TABLE_31[] = { +static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Devanagari, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_32[] = { +static const SCX_enum SCX_AUX_TABLE_33[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -79123,36 +80486,36 @@ static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_33[] = { +static const SCX_enum SCX_AUX_TABLE_34[] = { SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_34[] = { +static const SCX_enum SCX_AUX_TABLE_35[] = { SCX_Cyrillic, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_35[] = { +static const SCX_enum SCX_AUX_TABLE_36[] = { SCX_Latin, 
SCX_Mongolian }; -static const SCX_enum SCX_AUX_TABLE_36[] = { +static const SCX_enum SCX_AUX_TABLE_37[] = { SCX_Devanagari, SCX_Grantha, SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_37[] = { +static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Han, SCX_Hanb, SCX_Jpan, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_38[] = { +static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -79164,7 +80527,7 @@ static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Yi }; -static const SCX_enum SCX_AUX_TABLE_39[] = { +static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -79175,7 +80538,7 @@ static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_40[] = { +static const SCX_enum SCX_AUX_TABLE_41[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -79183,13 +80546,13 @@ static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_41[] = { +static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Hiragana, SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_42[] = { +static const SCX_enum SCX_AUX_TABLE_43[] = { SCX_Han, SCX_Hanb, SCX_Hiragana, @@ -79198,17 +80561,17 @@ static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_43[] = { +static const SCX_enum SCX_AUX_TABLE_44[] = { SCX_Hiragana, SCX_Jpan }; -static const SCX_enum SCX_AUX_TABLE_44[] = { +static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_45[] = { +static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Han, SCX_Hanb, SCX_Jpan, @@ -79216,7 +80579,7 @@ static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_46[] = { +static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -79233,7 +80596,7 @@ static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_47[] = { +static const SCX_enum SCX_AUX_TABLE_48[] = { 
SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -79249,7 +80612,7 @@ static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_48[] = { +static const SCX_enum SCX_AUX_TABLE_49[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -79263,43 +80626,59 @@ static const SCX_enum SCX_AUX_TABLE_48[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_49[] = { +static const SCX_enum SCX_AUX_TABLE_50[] = { SCX_Devanagari, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_50[] = { +static const SCX_enum SCX_AUX_TABLE_51[] = { SCX_Kayah_Li, SCX_Latin, SCX_Myanmar }; -static const SCX_enum SCX_AUX_TABLE_51[] = { +static const SCX_enum SCX_AUX_TABLE_52[] = { SCX_Buginese, SCX_Javanese }; -static const SCX_enum SCX_AUX_TABLE_52[] = { +static const SCX_enum SCX_AUX_TABLE_53[] = { + SCX_Arabic, + SCX_Nko +}; + +static const SCX_enum SCX_AUX_TABLE_54[] = { SCX_Arabic, SCX_Thaana }; -static const SCX_enum SCX_AUX_TABLE_53[] = { +static const SCX_enum SCX_AUX_TABLE_55[] = { SCX_Cypriot, + SCX_Cypro_Minoan, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_54[] = { +static const SCX_enum SCX_AUX_TABLE_56[] = { + SCX_Cypriot, + SCX_Linear_B +}; + +static const SCX_enum SCX_AUX_TABLE_57[] = { SCX_Cypriot, SCX_Linear_A, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_55[] = { +static const SCX_enum SCX_AUX_TABLE_58[] = { SCX_Arabic, SCX_Coptic }; +static const SCX_enum SCX_AUX_TABLE_59[] = { + SCX_Manichaean, + SCX_Old_Uyghur +}; + static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { NULL, /* Placeholder */ SCX_AUX_TABLE_1, @@ -79356,7 +80735,11 @@ static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { SCX_AUX_TABLE_52, SCX_AUX_TABLE_53, SCX_AUX_TABLE_54, - SCX_AUX_TABLE_55 + SCX_AUX_TABLE_55, + SCX_AUX_TABLE_56, + SCX_AUX_TABLE_57, + SCX_AUX_TABLE_58, + SCX_AUX_TABLE_59 }; /* Parallel table to the above, giving the number of elements in each table @@ -79368,57 +80751,61 @@ static const U8 SCX_AUX_TABLE_lengths[] = { 2 /* SCX_AUX_TABLE_2 */, 2 
/* SCX_AUX_TABLE_3 */, 2 /* SCX_AUX_TABLE_4 */, - 5 /* SCX_AUX_TABLE_5 */, + 6 /* SCX_AUX_TABLE_5 */, 3 /* SCX_AUX_TABLE_6 */, - 8 /* SCX_AUX_TABLE_7 */, - 2 /* SCX_AUX_TABLE_8 */, - 3 /* SCX_AUX_TABLE_9 */, - 2 /* SCX_AUX_TABLE_10 */, - 13 /* SCX_AUX_TABLE_11 */, - 12 /* SCX_AUX_TABLE_12 */, - 20 /* SCX_AUX_TABLE_13 */, - 21 /* SCX_AUX_TABLE_14 */, - 4 /* SCX_AUX_TABLE_15 */, - 3 /* SCX_AUX_TABLE_16 */, - 2 /* SCX_AUX_TABLE_17 */, + 7 /* SCX_AUX_TABLE_7 */, + 9 /* SCX_AUX_TABLE_8 */, + 2 /* SCX_AUX_TABLE_9 */, + 3 /* SCX_AUX_TABLE_10 */, + 2 /* SCX_AUX_TABLE_11 */, + 13 /* SCX_AUX_TABLE_12 */, + 12 /* SCX_AUX_TABLE_13 */, + 20 /* SCX_AUX_TABLE_14 */, + 21 /* SCX_AUX_TABLE_15 */, + 4 /* SCX_AUX_TABLE_16 */, + 3 /* SCX_AUX_TABLE_17 */, 2 /* SCX_AUX_TABLE_18 */, 2 /* SCX_AUX_TABLE_19 */, 2 /* SCX_AUX_TABLE_20 */, - 3 /* SCX_AUX_TABLE_21 */, - 2 /* SCX_AUX_TABLE_22 */, + 2 /* SCX_AUX_TABLE_21 */, + 3 /* SCX_AUX_TABLE_22 */, 2 /* SCX_AUX_TABLE_23 */, - 4 /* SCX_AUX_TABLE_24 */, - 2 /* SCX_AUX_TABLE_25 */, - 4 /* SCX_AUX_TABLE_26 */, - 2 /* SCX_AUX_TABLE_27 */, + 2 /* SCX_AUX_TABLE_24 */, + 4 /* SCX_AUX_TABLE_25 */, + 2 /* SCX_AUX_TABLE_26 */, + 4 /* SCX_AUX_TABLE_27 */, 2 /* SCX_AUX_TABLE_28 */, 2 /* SCX_AUX_TABLE_29 */, - 6 /* SCX_AUX_TABLE_30 */, - 2 /* SCX_AUX_TABLE_31 */, - 8 /* SCX_AUX_TABLE_32 */, - 3 /* SCX_AUX_TABLE_33 */, - 2 /* SCX_AUX_TABLE_34 */, + 2 /* SCX_AUX_TABLE_30 */, + 6 /* SCX_AUX_TABLE_31 */, + 2 /* SCX_AUX_TABLE_32 */, + 8 /* SCX_AUX_TABLE_33 */, + 3 /* SCX_AUX_TABLE_34 */, 2 /* SCX_AUX_TABLE_35 */, - 3 /* SCX_AUX_TABLE_36 */, - 4 /* SCX_AUX_TABLE_37 */, - 9 /* SCX_AUX_TABLE_38 */, - 8 /* SCX_AUX_TABLE_39 */, - 5 /* SCX_AUX_TABLE_40 */, - 3 /* SCX_AUX_TABLE_41 */, - 6 /* SCX_AUX_TABLE_42 */, - 2 /* SCX_AUX_TABLE_43 */, + 2 /* SCX_AUX_TABLE_36 */, + 3 /* SCX_AUX_TABLE_37 */, + 4 /* SCX_AUX_TABLE_38 */, + 9 /* SCX_AUX_TABLE_39 */, + 8 /* SCX_AUX_TABLE_40 */, + 5 /* SCX_AUX_TABLE_41 */, + 3 /* SCX_AUX_TABLE_42 */, + 6 /* SCX_AUX_TABLE_43 */, 2 /* 
SCX_AUX_TABLE_44 */, - 5 /* SCX_AUX_TABLE_45 */, - 14 /* SCX_AUX_TABLE_46 */, - 13 /* SCX_AUX_TABLE_47 */, - 11 /* SCX_AUX_TABLE_48 */, - 2 /* SCX_AUX_TABLE_49 */, - 3 /* SCX_AUX_TABLE_50 */, - 2 /* SCX_AUX_TABLE_51 */, + 2 /* SCX_AUX_TABLE_45 */, + 5 /* SCX_AUX_TABLE_46 */, + 14 /* SCX_AUX_TABLE_47 */, + 13 /* SCX_AUX_TABLE_48 */, + 11 /* SCX_AUX_TABLE_49 */, + 2 /* SCX_AUX_TABLE_50 */, + 3 /* SCX_AUX_TABLE_51 */, 2 /* SCX_AUX_TABLE_52 */, 2 /* SCX_AUX_TABLE_53 */, - 3 /* SCX_AUX_TABLE_54 */, - 2 /* SCX_AUX_TABLE_55 */ + 2 /* SCX_AUX_TABLE_54 */, + 3 /* SCX_AUX_TABLE_55 */, + 2 /* SCX_AUX_TABLE_56 */, + 3 /* SCX_AUX_TABLE_57 */, + 2 /* SCX_AUX_TABLE_58 */, + 2 /* SCX_AUX_TABLE_59 */ }; /* This table, indexed by the script enum, gives the zero code point for that @@ -79455,6 +80842,7 @@ static const UV script_zeros[] = { '0', /* Coptic */ '0', /* Cuneiform */ '0', /* Cypriot */ + '0', /* Cypro_Minoan */ '0', /* Cyrillic */ '0', /* Deseret */ 0x966, /* Devanagari */ @@ -79542,6 +80930,7 @@ static const UV script_zeros[] = { '0', /* Old_Sogdian */ '0', /* Old_South_Arabian */ '0', /* Old_Turkic */ + '0', /* Old_Uyghur */ 0xb66, /* Oriya */ '0', /* Osage */ 0x104a0, /* Osmanya */ @@ -79573,6 +80962,7 @@ static const UV script_zeros[] = { '0', /* Tai_Viet */ 0x116c0, /* Takri */ 0xbe6, /* Tamil */ + 0x16ac0, /* Tangsa */ '0', /* Tangut */ 0xc66, /* Telugu */ 0x660, /* Thaana */ @@ -79580,8 +80970,10 @@ static const UV script_zeros[] = { 0xf20, /* Tibetan */ '0', /* Tifinagh */ 0x114d0, /* Tirhuta */ + '0', /* Toto */ '0', /* Ugaritic */ 0xa620, /* Vai */ + '0', /* Vithkuqi */ 0x1e2f0, /* Wancho */ 0x118e0, /* Warang_Citi */ 0x660 /* Yezidi */ @@ -79686,9 +81078,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Arabic, SCX_use_AUX_TABLE_5, SCX_use_AUX_TABLE_6, - SCX_Unknown, - SCX_Arabic, - SCX_use_AUX_TABLE_5, SCX_Arabic, SCX_use_AUX_TABLE_7, SCX_Arabic, @@ -79696,10 +81085,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 
*/ SCX_Arabic, SCX_use_AUX_TABLE_9, SCX_Arabic, - SCX_use_AUX_TABLE_8, - SCX_Arabic, SCX_use_AUX_TABLE_10, SCX_Arabic, + SCX_use_AUX_TABLE_9, + SCX_Arabic, + SCX_use_AUX_TABLE_11, + SCX_Arabic, SCX_Common, SCX_Arabic, SCX_Syriac, @@ -79731,13 +81122,13 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Common, SCX_Arabic, SCX_Devanagari, - SCX_use_AUX_TABLE_11, SCX_use_AUX_TABLE_12, + SCX_use_AUX_TABLE_13, SCX_Inherited, SCX_Devanagari, - SCX_use_AUX_TABLE_13, SCX_use_AUX_TABLE_14, SCX_use_AUX_TABLE_15, + SCX_use_AUX_TABLE_16, SCX_Devanagari, SCX_Bengali, SCX_Unknown, @@ -79765,7 +81156,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Bengali, SCX_Unknown, - SCX_use_AUX_TABLE_16, + SCX_use_AUX_TABLE_17, SCX_Bengali, SCX_Unknown, SCX_Gurmukhi, @@ -79798,7 +81189,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Gurmukhi, SCX_Unknown, - SCX_use_AUX_TABLE_17, + SCX_use_AUX_TABLE_18, SCX_Gurmukhi, SCX_Unknown, SCX_Gujarati, @@ -79825,7 +81216,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Gujarati, SCX_Unknown, - SCX_use_AUX_TABLE_18, + SCX_use_AUX_TABLE_19, SCX_Gujarati, SCX_Unknown, SCX_Gujarati, @@ -79888,7 +81279,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Tamil, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Telugu, @@ -79914,6 +81305,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Telugu, SCX_Unknown, SCX_Telugu, + SCX_Unknown, + SCX_Telugu, SCX_Kannada, SCX_Unknown, SCX_Kannada, @@ -79936,7 +81329,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Kannada, SCX_Unknown, - SCX_use_AUX_TABLE_20, + SCX_use_AUX_TABLE_21, SCX_Unknown, SCX_Kannada, SCX_Unknown, @@ -80020,7 +81413,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Tibetan, SCX_Unknown, 
SCX_Myanmar, - SCX_use_AUX_TABLE_21, + SCX_use_AUX_TABLE_22, SCX_Myanmar, SCX_Georgian, SCX_Unknown, @@ -80029,9 +81422,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Georgian, SCX_Unknown, SCX_Georgian, - SCX_use_AUX_TABLE_22, - SCX_Georgian, SCX_use_AUX_TABLE_23, + SCX_Georgian, + SCX_use_AUX_TABLE_24, SCX_Ethiopic, SCX_Unknown, SCX_Ethiopic, @@ -80082,9 +81475,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Tagalog, SCX_Unknown, SCX_Tagalog, - SCX_Unknown, SCX_Hanunoo, - SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_25, SCX_Unknown, SCX_Buhid, SCX_Unknown, @@ -80101,11 +81493,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Khmer, SCX_Unknown, SCX_Mongolian, - SCX_use_AUX_TABLE_25, - SCX_Mongolian, - SCX_use_AUX_TABLE_25, + SCX_use_AUX_TABLE_26, SCX_Mongolian, - SCX_Unknown, + SCX_use_AUX_TABLE_26, SCX_Mongolian, SCX_Unknown, SCX_Mongolian, @@ -80171,33 +81561,33 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Georgian, SCX_Sundanese, SCX_Unknown, - SCX_use_AUX_TABLE_26, - SCX_Devanagari, - SCX_use_AUX_TABLE_26, SCX_use_AUX_TABLE_27, SCX_Devanagari, + SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_28, + SCX_Devanagari, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, SCX_use_AUX_TABLE_30, + SCX_use_AUX_TABLE_31, SCX_Devanagari, - SCX_use_AUX_TABLE_29, + SCX_use_AUX_TABLE_30, SCX_Devanagari, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, SCX_Devanagari, - SCX_use_AUX_TABLE_31, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_32, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_32, - SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_33, SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_29, SCX_Bengali, - SCX_use_AUX_TABLE_27, + SCX_use_AUX_TABLE_28, SCX_Nandinagari, SCX_Unknown, SCX_Latin, @@ -80212,9 +81602,9 @@ static const 
SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Latin, SCX_Greek, SCX_Inherited, - SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_35, SCX_Inherited, - SCX_Unknown, + SCX_Syriac, SCX_Inherited, SCX_Latin, SCX_Greek, @@ -80252,7 +81642,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Common, SCX_Inherited, SCX_Common, - SCX_use_AUX_TABLE_35, + SCX_use_AUX_TABLE_36, SCX_Common, SCX_Unknown, SCX_Common, @@ -80267,7 +81657,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Common, SCX_Unknown, SCX_Inherited, - SCX_use_AUX_TABLE_36, + SCX_use_AUX_TABLE_37, SCX_Unknown, SCX_Common, SCX_Greek, @@ -80293,9 +81683,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Common, SCX_Glagolitic, - SCX_Unknown, - SCX_Glagolitic, - SCX_Unknown, SCX_Latin, SCX_Coptic, SCX_Unknown, @@ -80334,78 +81721,77 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_use_AUX_TABLE_3, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_38, - SCX_Common, - SCX_use_AUX_TABLE_39, SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, SCX_Common, - SCX_use_AUX_TABLE_37, SCX_use_AUX_TABLE_40, - SCX_use_AUX_TABLE_23, SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_40, SCX_use_AUX_TABLE_42, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_Common, + SCX_use_AUX_TABLE_40, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_43, - SCX_use_AUX_TABLE_41, 
SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_41, + SCX_Unknown, + SCX_use_AUX_TABLE_42, SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, SCX_Unknown, SCX_use_AUX_TABLE_1, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_1, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_use_AUX_TABLE_38, SCX_Yi, SCX_Unknown, SCX_Yi, @@ -80418,7 +81804,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Cyrillic, SCX_Bamum, SCX_Unknown, - SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_46, SCX_Common, SCX_Latin, SCX_Common, @@ -80427,11 +81813,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Latin, SCX_Unknown, SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, SCX_Syloti_Nagri, SCX_Unknown, - SCX_use_AUX_TABLE_46, SCX_use_AUX_TABLE_47, SCX_use_AUX_TABLE_48, + SCX_use_AUX_TABLE_49, SCX_Unknown, SCX_Phags_Pa, SCX_Unknown, @@ -80440,21 +81830,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Saurashtra, SCX_Unknown, 
SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_49, + SCX_use_AUX_TABLE_50, SCX_Devanagari, SCX_Kayah_Li, - SCX_use_AUX_TABLE_50, + SCX_use_AUX_TABLE_51, SCX_Kayah_Li, SCX_Rejang, SCX_Unknown, SCX_Rejang, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Javanese, SCX_Unknown, - SCX_use_AUX_TABLE_51, + SCX_use_AUX_TABLE_52, SCX_Javanese, SCX_Unknown, SCX_Javanese, @@ -80495,15 +81885,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Meetei_Mayek, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Latin, SCX_Unknown, @@ -80523,24 +81913,25 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_Common, + SCX_use_AUX_TABLE_53, + SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_use_AUX_TABLE_52, + SCX_use_AUX_TABLE_54, + SCX_Arabic, + SCX_use_AUX_TABLE_54, SCX_Arabic, - SCX_use_AUX_TABLE_52, - SCX_Unknown, SCX_Inherited, SCX_Common, SCX_Unknown, SCX_Inherited, SCX_Cyrillic, SCX_Common, - SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, SCX_Unknown, SCX_Common, @@ -80558,20 +81949,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Common, SCX_Latin, SCX_Common, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, 
SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -80593,11 +81984,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Linear_B, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_56, SCX_Unknown, - SCX_use_AUX_TABLE_54, + SCX_use_AUX_TABLE_57, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_56, SCX_Greek, SCX_Unknown, SCX_Common, @@ -80611,7 +82003,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Carian, SCX_Unknown, - SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_58, SCX_Unknown, SCX_Old_Italic, SCX_Unknown, @@ -80642,6 +82034,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Caucasian_Albanian, SCX_Unknown, SCX_Caucasian_Albanian, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, SCX_Unknown, SCX_Linear_A, SCX_Unknown, @@ -80649,6 +82056,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Linear_A, SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Cypriot, SCX_Unknown, SCX_Cypriot, @@ -80708,6 +82121,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Manichaean, SCX_Unknown, SCX_Manichaean, + SCX_use_AUX_TABLE_59, + SCX_Manichaean, SCX_Unknown, SCX_Avestan, SCX_Unknown, @@ -80747,6 +82162,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Sogdian, SCX_Unknown, + SCX_Old_Uyghur, + SCX_Unknown, SCX_Chorasmian, SCX_Unknown, SCX_Elymaic, @@ -80793,9 +82210,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Khudawadi, SCX_Unknown, SCX_Grantha, - 
SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Unknown, SCX_Grantha, SCX_Unknown, @@ -80809,7 +82226,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Grantha, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, SCX_Unknown, SCX_Grantha, @@ -80885,6 +82302,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Soyombo, SCX_Unknown, + SCX_Canadian_Aboriginal, SCX_Pau_Cin_Hau, SCX_Unknown, SCX_Bhaiksuki, @@ -80932,9 +82350,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Lisu, SCX_Unknown, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Tamil, @@ -80946,6 +82364,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Cuneiform, SCX_Unknown, + SCX_Cypro_Minoan, + SCX_Unknown, SCX_Egyptian_Hieroglyphs, SCX_Unknown, SCX_Egyptian_Hieroglyphs, @@ -80959,6 +82379,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Mro, SCX_Unknown, SCX_Mro, + SCX_Tangsa, + SCX_Unknown, + SCX_Tangsa, SCX_Unknown, SCX_Bassa_Vah, SCX_Unknown, @@ -80984,10 +82407,10 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Tangut, SCX_Nushu, - SCX_Common, + SCX_use_AUX_TABLE_38, SCX_Khitan_Small_Script, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Tangut, SCX_Unknown, @@ -80996,12 +82419,19 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Tangut, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, SCX_Unknown, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_45, SCX_Unknown, + SCX_use_AUX_TABLE_45, SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_44, + 
SCX_Unknown, + SCX_use_AUX_TABLE_45, SCX_Unknown, SCX_Nushu, SCX_Unknown, @@ -81015,6 +82445,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Duployan, SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Common, + SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, @@ -81035,7 +82471,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, SCX_Unknown, SCX_Common, @@ -81085,6 +82521,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_SignWriting, SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Glagolitic, SCX_Unknown, SCX_Glagolitic, @@ -81103,10 +82541,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Nyiakeng_Puachue_Hmong, SCX_Unknown, + SCX_Toto, + SCX_Unknown, SCX_Wancho, SCX_Unknown, SCX_Wancho, SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, SCX_Mende_Kikakui, SCX_Unknown, SCX_Mende_Kikakui, @@ -81204,14 +82652,14 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_44, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -81267,19 +82715,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - 
SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_Unknown, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -81301,7 +82751,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ - 1695, /* Number of elements */ + 1753, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -81400,7 +82850,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x61B, 0x61C, 0x61D, - 0x61E, 0x61F, 0x620, 0x640, @@ -81436,11 +82885,11 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8E2, 0x8E3, 0x900, @@ -81612,7 +83061,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -81622,6 +83071,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -81645,7 +83096,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -81793,9 +83244,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, + 0x1716, + 0x171F, 0x1720, 0x1735, 0x1737, @@ -81818,8 +83268,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1804, 0x1805, 0x1806, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -81862,11 +83310,11 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BC0, 0x1BF4, @@ -81978,7 +83426,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 
0x20F0, 0x20F1, @@ -82006,9 +83454,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x2B96, 0x2B97, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, 0x2C60, 0x2C80, 0x2CF4, @@ -82046,7 +83491,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -82118,7 +83563,6 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, 0xA000, 0xA48D, 0xA490, @@ -82136,10 +83580,14 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA82D, 0xA830, @@ -82234,14 +83682,15 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0xFB45, 0xFB46, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDF2, 0xFDF3, @@ -82307,6 +83756,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x10080, 0x100FB, 0x10100, + 0x10102, 0x10103, 0x10107, 0x10134, @@ -82356,12 +83806,33 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x10564, 0x1056F, 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -82421,6 +83892,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x10AC0, 0x10AE7, 0x10AEB, + 0x10AF2, + 0x10AF3, 0x10AF7, 0x10B00, 0x10B36, @@ -82460,6 +83933,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -82467,10 +83942,10 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 
0x11080, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -82558,7 +84033,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -82566,7 +84041,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -82598,6 +84073,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x11A48, 0x11A50, 0x11AA3, + 0x11AB0, 0x11AC0, 0x11AF9, 0x11C00, @@ -82659,6 +84135,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -82673,6 +84151,9 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x16A6A, 0x16A6E, 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -82709,9 +84190,16 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, - 0x1B11F, + 0x1B120, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -82728,6 +84216,12 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -82741,7 +84235,7 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -82798,6 +84292,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -82816,10 +84312,20 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -82930,7 +84436,7 @@ static const UV _Perl_SCX_invlist[] = { 
/* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -82940,6 +84446,8 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -82953,27 +84461,27 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -82981,9 +84489,9 @@ static const UV _Perl_SCX_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -83045,138 +84553,143 @@ typedef enum { SCX_Coptic = 26, SCX_Cuneiform = 27, SCX_Cypriot = 28, - SCX_Cyrillic = 29, - SCX_Deseret = 30, - SCX_Devanagari = 31, - SCX_Dives_Akuru = 32, - SCX_Dogra = 33, - SCX_Duployan = 34, - SCX_Egyptian_Hieroglyphs = 35, - SCX_Elbasan = 36, - SCX_Elymaic = 37, - SCX_Ethiopic = 38, - SCX_Georgian = 39, - SCX_Glagolitic = 40, - SCX_Gothic = 41, - SCX_Grantha = 42, - SCX_Greek = 43, - SCX_Gujarati = 44, - SCX_Gunjala_Gondi = 45, - SCX_Gurmukhi = 46, - SCX_Han = 47, - SCX_Hanb = 48, - SCX_Hangul = 49, - SCX_Hanifi_Rohingya = 50, - SCX_Hanunoo = 51, - SCX_Hatran = 52, - SCX_Hebrew = 53, - SCX_Hiragana = 54, - SCX_Imperial_Aramaic = 55, - SCX_Inherited = 56, - SCX_Inscriptional_Pahlavi = 57, - SCX_Inscriptional_Parthian = 58, - SCX_INVALID = 59, - SCX_Javanese = 60, - SCX_Jpan = 61, - SCX_Kaithi = 62, - SCX_Kannada = 63, - SCX_Katakana = 64, - SCX_Kayah_Li = 65, - SCX_Kharoshthi = 66, - SCX_Khitan_Small_Script = 67, - SCX_Khmer = 68, - SCX_Khojki = 69, - SCX_Khudawadi = 70, - SCX_Kore = 71, - SCX_Lao = 72, - SCX_Latin = 73, - SCX_Lepcha = 74, - SCX_Limbu 
= 75, - SCX_Linear_A = 76, - SCX_Linear_B = 77, - SCX_Lisu = 78, - SCX_Lycian = 79, - SCX_Lydian = 80, - SCX_Mahajani = 81, - SCX_Makasar = 82, - SCX_Malayalam = 83, - SCX_Mandaic = 84, - SCX_Manichaean = 85, - SCX_Marchen = 86, - SCX_Masaram_Gondi = 87, - SCX_Medefaidrin = 88, - SCX_Meetei_Mayek = 89, - SCX_Mende_Kikakui = 90, - SCX_Meroitic_Cursive = 91, - SCX_Meroitic_Hieroglyphs = 92, - SCX_Miao = 93, - SCX_Modi = 94, - SCX_Mongolian = 95, - SCX_Mro = 96, - SCX_Multani = 97, - SCX_Myanmar = 98, - SCX_Nabataean = 99, - SCX_Nandinagari = 100, - SCX_New_Tai_Lue = 101, - SCX_Newa = 102, - SCX_Nko = 103, - SCX_Nushu = 104, - SCX_Nyiakeng_Puachue_Hmong = 105, - SCX_Ogham = 106, - SCX_Ol_Chiki = 107, - SCX_Old_Hungarian = 108, - SCX_Old_Italic = 109, - SCX_Old_North_Arabian = 110, - SCX_Old_Permic = 111, - SCX_Old_Persian = 112, - SCX_Old_Sogdian = 113, - SCX_Old_South_Arabian = 114, - SCX_Old_Turkic = 115, - SCX_Oriya = 116, - SCX_Osage = 117, - SCX_Osmanya = 118, - SCX_Pahawh_Hmong = 119, - SCX_Palmyrene = 120, - SCX_Pau_Cin_Hau = 121, - SCX_Phags_Pa = 122, - SCX_Phoenician = 123, - SCX_Psalter_Pahlavi = 124, - SCX_Rejang = 125, - SCX_Runic = 126, - SCX_Samaritan = 127, - SCX_Saurashtra = 128, - SCX_Sharada = 129, - SCX_Shavian = 130, - SCX_Siddham = 131, - SCX_SignWriting = 132, - SCX_Sinhala = 133, - SCX_Sogdian = 134, - SCX_Sora_Sompeng = 135, - SCX_Soyombo = 136, - SCX_Sundanese = 137, - SCX_Syloti_Nagri = 138, - SCX_Syriac = 139, - SCX_Tagalog = 140, - SCX_Tagbanwa = 141, - SCX_Tai_Le = 142, - SCX_Tai_Tham = 143, - SCX_Tai_Viet = 144, - SCX_Takri = 145, - SCX_Tamil = 146, - SCX_Tangut = 147, - SCX_Telugu = 148, - SCX_Thaana = 149, - SCX_Thai = 150, - SCX_Tibetan = 151, - SCX_Tifinagh = 152, - SCX_Tirhuta = 153, - SCX_Ugaritic = 154, - SCX_Vai = 155, - SCX_Wancho = 156, - SCX_Warang_Citi = 157, - SCX_Yezidi = 158, - SCX_Yi = 159, - SCX_Zanabazar_Square = 160, + SCX_Cypro_Minoan = 29, + SCX_Cyrillic = 30, + SCX_Deseret = 31, + SCX_Devanagari = 32, + 
SCX_Dives_Akuru = 33, + SCX_Dogra = 34, + SCX_Duployan = 35, + SCX_Egyptian_Hieroglyphs = 36, + SCX_Elbasan = 37, + SCX_Elymaic = 38, + SCX_Ethiopic = 39, + SCX_Georgian = 40, + SCX_Glagolitic = 41, + SCX_Gothic = 42, + SCX_Grantha = 43, + SCX_Greek = 44, + SCX_Gujarati = 45, + SCX_Gunjala_Gondi = 46, + SCX_Gurmukhi = 47, + SCX_Han = 48, + SCX_Hanb = 49, + SCX_Hangul = 50, + SCX_Hanifi_Rohingya = 51, + SCX_Hanunoo = 52, + SCX_Hatran = 53, + SCX_Hebrew = 54, + SCX_Hiragana = 55, + SCX_Imperial_Aramaic = 56, + SCX_Inherited = 57, + SCX_Inscriptional_Pahlavi = 58, + SCX_Inscriptional_Parthian = 59, + SCX_INVALID = 60, + SCX_Javanese = 61, + SCX_Jpan = 62, + SCX_Kaithi = 63, + SCX_Kannada = 64, + SCX_Katakana = 65, + SCX_Kayah_Li = 66, + SCX_Kharoshthi = 67, + SCX_Khitan_Small_Script = 68, + SCX_Khmer = 69, + SCX_Khojki = 70, + SCX_Khudawadi = 71, + SCX_Kore = 72, + SCX_Lao = 73, + SCX_Latin = 74, + SCX_Lepcha = 75, + SCX_Limbu = 76, + SCX_Linear_A = 77, + SCX_Linear_B = 78, + SCX_Lisu = 79, + SCX_Lycian = 80, + SCX_Lydian = 81, + SCX_Mahajani = 82, + SCX_Makasar = 83, + SCX_Malayalam = 84, + SCX_Mandaic = 85, + SCX_Manichaean = 86, + SCX_Marchen = 87, + SCX_Masaram_Gondi = 88, + SCX_Medefaidrin = 89, + SCX_Meetei_Mayek = 90, + SCX_Mende_Kikakui = 91, + SCX_Meroitic_Cursive = 92, + SCX_Meroitic_Hieroglyphs = 93, + SCX_Miao = 94, + SCX_Modi = 95, + SCX_Mongolian = 96, + SCX_Mro = 97, + SCX_Multani = 98, + SCX_Myanmar = 99, + SCX_Nabataean = 100, + SCX_Nandinagari = 101, + SCX_New_Tai_Lue = 102, + SCX_Newa = 103, + SCX_Nko = 104, + SCX_Nushu = 105, + SCX_Nyiakeng_Puachue_Hmong = 106, + SCX_Ogham = 107, + SCX_Ol_Chiki = 108, + SCX_Old_Hungarian = 109, + SCX_Old_Italic = 110, + SCX_Old_North_Arabian = 111, + SCX_Old_Permic = 112, + SCX_Old_Persian = 113, + SCX_Old_Sogdian = 114, + SCX_Old_South_Arabian = 115, + SCX_Old_Turkic = 116, + SCX_Old_Uyghur = 117, + SCX_Oriya = 118, + SCX_Osage = 119, + SCX_Osmanya = 120, + SCX_Pahawh_Hmong = 121, + SCX_Palmyrene = 122, + 
SCX_Pau_Cin_Hau = 123, + SCX_Phags_Pa = 124, + SCX_Phoenician = 125, + SCX_Psalter_Pahlavi = 126, + SCX_Rejang = 127, + SCX_Runic = 128, + SCX_Samaritan = 129, + SCX_Saurashtra = 130, + SCX_Sharada = 131, + SCX_Shavian = 132, + SCX_Siddham = 133, + SCX_SignWriting = 134, + SCX_Sinhala = 135, + SCX_Sogdian = 136, + SCX_Sora_Sompeng = 137, + SCX_Soyombo = 138, + SCX_Sundanese = 139, + SCX_Syloti_Nagri = 140, + SCX_Syriac = 141, + SCX_Tagalog = 142, + SCX_Tagbanwa = 143, + SCX_Tai_Le = 144, + SCX_Tai_Tham = 145, + SCX_Tai_Viet = 146, + SCX_Takri = 147, + SCX_Tamil = 148, + SCX_Tangsa = 149, + SCX_Tangut = 150, + SCX_Telugu = 151, + SCX_Thaana = 152, + SCX_Thai = 153, + SCX_Tibetan = 154, + SCX_Tifinagh = 155, + SCX_Tirhuta = 156, + SCX_Toto = 157, + SCX_Ugaritic = 158, + SCX_Vai = 159, + SCX_Vithkuqi = 160, + SCX_Wancho = 161, + SCX_Warang_Citi = 162, + SCX_Yezidi = 163, + SCX_Yi = 164, + SCX_Zanabazar_Square = 165, SCX_use_AUX_TABLE_1 = -1, SCX_use_AUX_TABLE_2 = -2, SCX_use_AUX_TABLE_3 = -3, @@ -83231,7 +84744,11 @@ typedef enum { SCX_use_AUX_TABLE_52 = -52, SCX_use_AUX_TABLE_53 = -53, SCX_use_AUX_TABLE_54 = -54, - SCX_use_AUX_TABLE_55 = -55 + SCX_use_AUX_TABLE_55 = -55, + SCX_use_AUX_TABLE_56 = -56, + SCX_use_AUX_TABLE_57 = -57, + SCX_use_AUX_TABLE_58 = -58, + SCX_use_AUX_TABLE_59 = -59 } SCX_enum; # endif /* EBCDIC 037 */ @@ -83268,6 +84785,7 @@ static const SCX_enum SCX_AUX_TABLE_4[] = { static const SCX_enum SCX_AUX_TABLE_5[] = { SCX_Arabic, SCX_Hanifi_Rohingya, + SCX_Nko, SCX_Syriac, SCX_Thaana, SCX_Yezidi @@ -83280,33 +84798,44 @@ static const SCX_enum SCX_AUX_TABLE_6[] = { }; static const SCX_enum SCX_AUX_TABLE_7[] = { + SCX_Adlam, + SCX_Arabic, + SCX_Hanifi_Rohingya, + SCX_Nko, + SCX_Syriac, + SCX_Thaana, + SCX_Yezidi +}; + +static const SCX_enum SCX_AUX_TABLE_8[] = { SCX_Adlam, SCX_Arabic, SCX_Hanifi_Rohingya, SCX_Mandaic, SCX_Manichaean, + SCX_Old_Uyghur, SCX_Psalter_Pahlavi, SCX_Sogdian, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_8[] = { +static 
const SCX_enum SCX_AUX_TABLE_9[] = { SCX_Arabic, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_9[] = { +static const SCX_enum SCX_AUX_TABLE_10[] = { SCX_Arabic, SCX_Thaana, SCX_Yezidi }; -static const SCX_enum SCX_AUX_TABLE_10[] = { +static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Arabic, SCX_Hanifi_Rohingya }; -static const SCX_enum SCX_AUX_TABLE_11[] = { +static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -83322,7 +84851,7 @@ static const SCX_enum SCX_AUX_TABLE_11[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_12[] = { +static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -83337,7 +84866,7 @@ static const SCX_enum SCX_AUX_TABLE_12[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_13[] = { +static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -83360,7 +84889,7 @@ static const SCX_enum SCX_AUX_TABLE_13[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_14[] = { +static const SCX_enum SCX_AUX_TABLE_15[] = { SCX_Bengali, SCX_Devanagari, SCX_Dogra, @@ -83384,90 +84913,90 @@ static const SCX_enum SCX_AUX_TABLE_14[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_15[] = { +static const SCX_enum SCX_AUX_TABLE_16[] = { SCX_Devanagari, SCX_Dogra, SCX_Kaithi, SCX_Mahajani }; -static const SCX_enum SCX_AUX_TABLE_16[] = { +static const SCX_enum SCX_AUX_TABLE_17[] = { SCX_Bengali, SCX_Chakma, SCX_Syloti_Nagri }; -static const SCX_enum SCX_AUX_TABLE_17[] = { +static const SCX_enum SCX_AUX_TABLE_18[] = { SCX_Gurmukhi, SCX_Multani }; -static const SCX_enum SCX_AUX_TABLE_18[] = { +static const SCX_enum SCX_AUX_TABLE_19[] = { SCX_Gujarati, SCX_Khojki }; -static const SCX_enum SCX_AUX_TABLE_19[] = { +static const SCX_enum SCX_AUX_TABLE_20[] = { SCX_Grantha, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_20[] = { +static const SCX_enum SCX_AUX_TABLE_21[] = { SCX_Kannada, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_21[] = 
{ +static const SCX_enum SCX_AUX_TABLE_22[] = { SCX_Chakma, SCX_Myanmar, SCX_Tai_Le }; -static const SCX_enum SCX_AUX_TABLE_22[] = { +static const SCX_enum SCX_AUX_TABLE_23[] = { SCX_Georgian, SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_23[] = { +static const SCX_enum SCX_AUX_TABLE_24[] = { SCX_Hangul, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_24[] = { +static const SCX_enum SCX_AUX_TABLE_25[] = { SCX_Buhid, SCX_Hanunoo, SCX_Tagalog, SCX_Tagbanwa }; -static const SCX_enum SCX_AUX_TABLE_25[] = { +static const SCX_enum SCX_AUX_TABLE_26[] = { SCX_Mongolian, SCX_Phags_Pa }; -static const SCX_enum SCX_AUX_TABLE_26[] = { +static const SCX_enum SCX_AUX_TABLE_27[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_27[] = { +static const SCX_enum SCX_AUX_TABLE_28[] = { SCX_Devanagari, SCX_Grantha }; -static const SCX_enum SCX_AUX_TABLE_28[] = { +static const SCX_enum SCX_AUX_TABLE_29[] = { SCX_Bengali, SCX_Devanagari }; -static const SCX_enum SCX_AUX_TABLE_29[] = { +static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Devanagari, SCX_Sharada }; -static const SCX_enum SCX_AUX_TABLE_30[] = { +static const SCX_enum SCX_AUX_TABLE_31[] = { SCX_Devanagari, SCX_Kannada, SCX_Malayalam, @@ -83476,12 +85005,12 @@ static const SCX_enum SCX_AUX_TABLE_30[] = { SCX_Telugu }; -static const SCX_enum SCX_AUX_TABLE_31[] = { +static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Devanagari, SCX_Nandinagari }; -static const SCX_enum SCX_AUX_TABLE_32[] = { +static const SCX_enum SCX_AUX_TABLE_33[] = { SCX_Bengali, SCX_Devanagari, SCX_Grantha, @@ -83492,36 +85021,36 @@ static const SCX_enum SCX_AUX_TABLE_32[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_33[] = { +static const SCX_enum SCX_AUX_TABLE_34[] = { SCX_Devanagari, SCX_Grantha, SCX_Kannada }; -static const SCX_enum SCX_AUX_TABLE_34[] = { +static const SCX_enum SCX_AUX_TABLE_35[] = { SCX_Cyrillic, SCX_Syriac }; -static const SCX_enum SCX_AUX_TABLE_35[] = { +static const 
SCX_enum SCX_AUX_TABLE_36[] = { SCX_Latin, SCX_Mongolian }; -static const SCX_enum SCX_AUX_TABLE_36[] = { +static const SCX_enum SCX_AUX_TABLE_37[] = { SCX_Devanagari, SCX_Grantha, SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_37[] = { +static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Han, SCX_Hanb, SCX_Jpan, SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_38[] = { +static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -83533,7 +85062,7 @@ static const SCX_enum SCX_AUX_TABLE_38[] = { SCX_Yi }; -static const SCX_enum SCX_AUX_TABLE_39[] = { +static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -83544,7 +85073,7 @@ static const SCX_enum SCX_AUX_TABLE_39[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_40[] = { +static const SCX_enum SCX_AUX_TABLE_41[] = { SCX_Bopomofo, SCX_Han, SCX_Hanb, @@ -83552,13 +85081,13 @@ static const SCX_enum SCX_AUX_TABLE_40[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_41[] = { +static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Hiragana, SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_42[] = { +static const SCX_enum SCX_AUX_TABLE_43[] = { SCX_Han, SCX_Hanb, SCX_Hiragana, @@ -83567,17 +85096,17 @@ static const SCX_enum SCX_AUX_TABLE_42[] = { SCX_Kore }; -static const SCX_enum SCX_AUX_TABLE_43[] = { +static const SCX_enum SCX_AUX_TABLE_44[] = { SCX_Hiragana, SCX_Jpan }; -static const SCX_enum SCX_AUX_TABLE_44[] = { +static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Jpan, SCX_Katakana }; -static const SCX_enum SCX_AUX_TABLE_45[] = { +static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Han, SCX_Hanb, SCX_Jpan, @@ -83585,7 +85114,7 @@ static const SCX_enum SCX_AUX_TABLE_45[] = { SCX_Latin }; -static const SCX_enum SCX_AUX_TABLE_46[] = { +static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -83602,7 +85131,7 @@ static const SCX_enum SCX_AUX_TABLE_46[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_47[] = { +static 
const SCX_enum SCX_AUX_TABLE_48[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -83618,7 +85147,7 @@ static const SCX_enum SCX_AUX_TABLE_47[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_48[] = { +static const SCX_enum SCX_AUX_TABLE_49[] = { SCX_Devanagari, SCX_Dogra, SCX_Gujarati, @@ -83632,43 +85161,59 @@ static const SCX_enum SCX_AUX_TABLE_48[] = { SCX_Tirhuta }; -static const SCX_enum SCX_AUX_TABLE_49[] = { +static const SCX_enum SCX_AUX_TABLE_50[] = { SCX_Devanagari, SCX_Tamil }; -static const SCX_enum SCX_AUX_TABLE_50[] = { +static const SCX_enum SCX_AUX_TABLE_51[] = { SCX_Kayah_Li, SCX_Latin, SCX_Myanmar }; -static const SCX_enum SCX_AUX_TABLE_51[] = { +static const SCX_enum SCX_AUX_TABLE_52[] = { SCX_Buginese, SCX_Javanese }; -static const SCX_enum SCX_AUX_TABLE_52[] = { +static const SCX_enum SCX_AUX_TABLE_53[] = { + SCX_Arabic, + SCX_Nko +}; + +static const SCX_enum SCX_AUX_TABLE_54[] = { SCX_Arabic, SCX_Thaana }; -static const SCX_enum SCX_AUX_TABLE_53[] = { +static const SCX_enum SCX_AUX_TABLE_55[] = { SCX_Cypriot, + SCX_Cypro_Minoan, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_54[] = { +static const SCX_enum SCX_AUX_TABLE_56[] = { + SCX_Cypriot, + SCX_Linear_B +}; + +static const SCX_enum SCX_AUX_TABLE_57[] = { SCX_Cypriot, SCX_Linear_A, SCX_Linear_B }; -static const SCX_enum SCX_AUX_TABLE_55[] = { +static const SCX_enum SCX_AUX_TABLE_58[] = { SCX_Arabic, SCX_Coptic }; +static const SCX_enum SCX_AUX_TABLE_59[] = { + SCX_Manichaean, + SCX_Old_Uyghur +}; + static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { NULL, /* Placeholder */ SCX_AUX_TABLE_1, @@ -83725,7 +85270,11 @@ static const SCX_enum * const SCX_AUX_TABLE_ptrs[] = { SCX_AUX_TABLE_52, SCX_AUX_TABLE_53, SCX_AUX_TABLE_54, - SCX_AUX_TABLE_55 + SCX_AUX_TABLE_55, + SCX_AUX_TABLE_56, + SCX_AUX_TABLE_57, + SCX_AUX_TABLE_58, + SCX_AUX_TABLE_59 }; /* Parallel table to the above, giving the number of elements in each table @@ -83737,57 +85286,61 @@ static const U8 
SCX_AUX_TABLE_lengths[] = { 2 /* SCX_AUX_TABLE_2 */, 2 /* SCX_AUX_TABLE_3 */, 2 /* SCX_AUX_TABLE_4 */, - 5 /* SCX_AUX_TABLE_5 */, + 6 /* SCX_AUX_TABLE_5 */, 3 /* SCX_AUX_TABLE_6 */, - 8 /* SCX_AUX_TABLE_7 */, - 2 /* SCX_AUX_TABLE_8 */, - 3 /* SCX_AUX_TABLE_9 */, - 2 /* SCX_AUX_TABLE_10 */, - 13 /* SCX_AUX_TABLE_11 */, - 12 /* SCX_AUX_TABLE_12 */, - 20 /* SCX_AUX_TABLE_13 */, - 21 /* SCX_AUX_TABLE_14 */, - 4 /* SCX_AUX_TABLE_15 */, - 3 /* SCX_AUX_TABLE_16 */, - 2 /* SCX_AUX_TABLE_17 */, + 7 /* SCX_AUX_TABLE_7 */, + 9 /* SCX_AUX_TABLE_8 */, + 2 /* SCX_AUX_TABLE_9 */, + 3 /* SCX_AUX_TABLE_10 */, + 2 /* SCX_AUX_TABLE_11 */, + 13 /* SCX_AUX_TABLE_12 */, + 12 /* SCX_AUX_TABLE_13 */, + 20 /* SCX_AUX_TABLE_14 */, + 21 /* SCX_AUX_TABLE_15 */, + 4 /* SCX_AUX_TABLE_16 */, + 3 /* SCX_AUX_TABLE_17 */, 2 /* SCX_AUX_TABLE_18 */, 2 /* SCX_AUX_TABLE_19 */, 2 /* SCX_AUX_TABLE_20 */, - 3 /* SCX_AUX_TABLE_21 */, - 2 /* SCX_AUX_TABLE_22 */, + 2 /* SCX_AUX_TABLE_21 */, + 3 /* SCX_AUX_TABLE_22 */, 2 /* SCX_AUX_TABLE_23 */, - 4 /* SCX_AUX_TABLE_24 */, - 2 /* SCX_AUX_TABLE_25 */, - 4 /* SCX_AUX_TABLE_26 */, - 2 /* SCX_AUX_TABLE_27 */, + 2 /* SCX_AUX_TABLE_24 */, + 4 /* SCX_AUX_TABLE_25 */, + 2 /* SCX_AUX_TABLE_26 */, + 4 /* SCX_AUX_TABLE_27 */, 2 /* SCX_AUX_TABLE_28 */, 2 /* SCX_AUX_TABLE_29 */, - 6 /* SCX_AUX_TABLE_30 */, - 2 /* SCX_AUX_TABLE_31 */, - 8 /* SCX_AUX_TABLE_32 */, - 3 /* SCX_AUX_TABLE_33 */, - 2 /* SCX_AUX_TABLE_34 */, + 2 /* SCX_AUX_TABLE_30 */, + 6 /* SCX_AUX_TABLE_31 */, + 2 /* SCX_AUX_TABLE_32 */, + 8 /* SCX_AUX_TABLE_33 */, + 3 /* SCX_AUX_TABLE_34 */, 2 /* SCX_AUX_TABLE_35 */, - 3 /* SCX_AUX_TABLE_36 */, - 4 /* SCX_AUX_TABLE_37 */, - 9 /* SCX_AUX_TABLE_38 */, - 8 /* SCX_AUX_TABLE_39 */, - 5 /* SCX_AUX_TABLE_40 */, - 3 /* SCX_AUX_TABLE_41 */, - 6 /* SCX_AUX_TABLE_42 */, - 2 /* SCX_AUX_TABLE_43 */, + 2 /* SCX_AUX_TABLE_36 */, + 3 /* SCX_AUX_TABLE_37 */, + 4 /* SCX_AUX_TABLE_38 */, + 9 /* SCX_AUX_TABLE_39 */, + 8 /* SCX_AUX_TABLE_40 */, + 5 /* SCX_AUX_TABLE_41 */, + 3 /* 
SCX_AUX_TABLE_42 */, + 6 /* SCX_AUX_TABLE_43 */, 2 /* SCX_AUX_TABLE_44 */, - 5 /* SCX_AUX_TABLE_45 */, - 14 /* SCX_AUX_TABLE_46 */, - 13 /* SCX_AUX_TABLE_47 */, - 11 /* SCX_AUX_TABLE_48 */, - 2 /* SCX_AUX_TABLE_49 */, - 3 /* SCX_AUX_TABLE_50 */, - 2 /* SCX_AUX_TABLE_51 */, + 2 /* SCX_AUX_TABLE_45 */, + 5 /* SCX_AUX_TABLE_46 */, + 14 /* SCX_AUX_TABLE_47 */, + 13 /* SCX_AUX_TABLE_48 */, + 11 /* SCX_AUX_TABLE_49 */, + 2 /* SCX_AUX_TABLE_50 */, + 3 /* SCX_AUX_TABLE_51 */, 2 /* SCX_AUX_TABLE_52 */, 2 /* SCX_AUX_TABLE_53 */, - 3 /* SCX_AUX_TABLE_54 */, - 2 /* SCX_AUX_TABLE_55 */ + 2 /* SCX_AUX_TABLE_54 */, + 3 /* SCX_AUX_TABLE_55 */, + 2 /* SCX_AUX_TABLE_56 */, + 3 /* SCX_AUX_TABLE_57 */, + 2 /* SCX_AUX_TABLE_58 */, + 2 /* SCX_AUX_TABLE_59 */ }; /* This table, indexed by the script enum, gives the zero code point for that @@ -83824,6 +85377,7 @@ static const UV script_zeros[] = { '0', /* Coptic */ '0', /* Cuneiform */ '0', /* Cypriot */ + '0', /* Cypro_Minoan */ '0', /* Cyrillic */ '0', /* Deseret */ 0x966, /* Devanagari */ @@ -83911,6 +85465,7 @@ static const UV script_zeros[] = { '0', /* Old_Sogdian */ '0', /* Old_South_Arabian */ '0', /* Old_Turkic */ + '0', /* Old_Uyghur */ 0xb66, /* Oriya */ '0', /* Osage */ 0x104a0, /* Osmanya */ @@ -83942,6 +85497,7 @@ static const UV script_zeros[] = { '0', /* Tai_Viet */ 0x116c0, /* Takri */ 0xbe6, /* Tamil */ + 0x16ac0, /* Tangsa */ '0', /* Tangut */ 0xc66, /* Telugu */ 0x660, /* Thaana */ @@ -83949,8 +85505,10 @@ static const UV script_zeros[] = { 0xf20, /* Tibetan */ '0', /* Tifinagh */ 0x114d0, /* Tirhuta */ + '0', /* Toto */ '0', /* Ugaritic */ 0xa620, /* Vai */ + '0', /* Vithkuqi */ 0x1e2f0, /* Wancho */ 0x118e0, /* Warang_Citi */ 0x660 /* Yezidi */ @@ -84051,9 +85609,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Arabic, SCX_use_AUX_TABLE_5, SCX_use_AUX_TABLE_6, - SCX_Unknown, - SCX_Arabic, - SCX_use_AUX_TABLE_5, SCX_Arabic, SCX_use_AUX_TABLE_7, SCX_Arabic, @@ -84061,10 +85616,12 @@ static 
const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Arabic, SCX_use_AUX_TABLE_9, SCX_Arabic, - SCX_use_AUX_TABLE_8, - SCX_Arabic, SCX_use_AUX_TABLE_10, SCX_Arabic, + SCX_use_AUX_TABLE_9, + SCX_Arabic, + SCX_use_AUX_TABLE_11, + SCX_Arabic, SCX_Common, SCX_Arabic, SCX_Syriac, @@ -84096,13 +85653,13 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Common, SCX_Arabic, SCX_Devanagari, - SCX_use_AUX_TABLE_11, SCX_use_AUX_TABLE_12, + SCX_use_AUX_TABLE_13, SCX_Inherited, SCX_Devanagari, - SCX_use_AUX_TABLE_13, SCX_use_AUX_TABLE_14, SCX_use_AUX_TABLE_15, + SCX_use_AUX_TABLE_16, SCX_Devanagari, SCX_Bengali, SCX_Unknown, @@ -84130,7 +85687,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Bengali, SCX_Unknown, - SCX_use_AUX_TABLE_16, + SCX_use_AUX_TABLE_17, SCX_Bengali, SCX_Unknown, SCX_Gurmukhi, @@ -84163,7 +85720,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Gurmukhi, SCX_Unknown, - SCX_use_AUX_TABLE_17, + SCX_use_AUX_TABLE_18, SCX_Gurmukhi, SCX_Unknown, SCX_Gujarati, @@ -84190,7 +85747,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Gujarati, SCX_Unknown, - SCX_use_AUX_TABLE_18, + SCX_use_AUX_TABLE_19, SCX_Gujarati, SCX_Unknown, SCX_Gujarati, @@ -84253,7 +85810,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Tamil, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Telugu, @@ -84279,6 +85836,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Telugu, SCX_Unknown, SCX_Telugu, + SCX_Unknown, + SCX_Telugu, SCX_Kannada, SCX_Unknown, SCX_Kannada, @@ -84301,7 +85860,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Kannada, SCX_Unknown, - SCX_use_AUX_TABLE_20, + SCX_use_AUX_TABLE_21, SCX_Unknown, SCX_Kannada, SCX_Unknown, @@ -84385,7 +85944,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { 
/* for EBCDIC 037 */ SCX_Tibetan, SCX_Unknown, SCX_Myanmar, - SCX_use_AUX_TABLE_21, + SCX_use_AUX_TABLE_22, SCX_Myanmar, SCX_Georgian, SCX_Unknown, @@ -84394,9 +85953,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Georgian, SCX_Unknown, SCX_Georgian, - SCX_use_AUX_TABLE_22, - SCX_Georgian, SCX_use_AUX_TABLE_23, + SCX_Georgian, + SCX_use_AUX_TABLE_24, SCX_Ethiopic, SCX_Unknown, SCX_Ethiopic, @@ -84447,9 +86006,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Tagalog, SCX_Unknown, SCX_Tagalog, - SCX_Unknown, SCX_Hanunoo, - SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_25, SCX_Unknown, SCX_Buhid, SCX_Unknown, @@ -84466,11 +86024,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Khmer, SCX_Unknown, SCX_Mongolian, - SCX_use_AUX_TABLE_25, - SCX_Mongolian, - SCX_use_AUX_TABLE_25, + SCX_use_AUX_TABLE_26, SCX_Mongolian, - SCX_Unknown, + SCX_use_AUX_TABLE_26, SCX_Mongolian, SCX_Unknown, SCX_Mongolian, @@ -84536,33 +86092,33 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Georgian, SCX_Sundanese, SCX_Unknown, - SCX_use_AUX_TABLE_26, - SCX_Devanagari, - SCX_use_AUX_TABLE_26, SCX_use_AUX_TABLE_27, SCX_Devanagari, + SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_28, + SCX_Devanagari, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, SCX_use_AUX_TABLE_30, + SCX_use_AUX_TABLE_31, SCX_Devanagari, - SCX_use_AUX_TABLE_29, + SCX_use_AUX_TABLE_30, SCX_Devanagari, + SCX_use_AUX_TABLE_30, SCX_use_AUX_TABLE_29, - SCX_use_AUX_TABLE_28, SCX_Devanagari, - SCX_use_AUX_TABLE_31, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_32, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_32, - SCX_use_AUX_TABLE_27, SCX_use_AUX_TABLE_33, SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_29, SCX_Bengali, - SCX_use_AUX_TABLE_27, + SCX_use_AUX_TABLE_28, SCX_Nandinagari, SCX_Unknown, 
SCX_Latin, @@ -84577,9 +86133,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Latin, SCX_Greek, SCX_Inherited, - SCX_use_AUX_TABLE_34, + SCX_use_AUX_TABLE_35, SCX_Inherited, - SCX_Unknown, + SCX_Syriac, SCX_Inherited, SCX_Latin, SCX_Greek, @@ -84617,7 +86173,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Common, SCX_Inherited, SCX_Common, - SCX_use_AUX_TABLE_35, + SCX_use_AUX_TABLE_36, SCX_Common, SCX_Unknown, SCX_Common, @@ -84632,7 +86188,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Common, SCX_Unknown, SCX_Inherited, - SCX_use_AUX_TABLE_36, + SCX_use_AUX_TABLE_37, SCX_Unknown, SCX_Common, SCX_Greek, @@ -84658,9 +86214,6 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Common, SCX_Glagolitic, - SCX_Unknown, - SCX_Glagolitic, - SCX_Unknown, SCX_Latin, SCX_Coptic, SCX_Unknown, @@ -84699,78 +86252,77 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_use_AUX_TABLE_3, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_38, - SCX_Common, - SCX_use_AUX_TABLE_39, SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_39, SCX_Common, - SCX_use_AUX_TABLE_37, SCX_use_AUX_TABLE_40, - SCX_use_AUX_TABLE_23, SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_40, SCX_Common, - SCX_use_AUX_TABLE_39, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_41, + SCX_use_AUX_TABLE_24, + SCX_use_AUX_TABLE_40, SCX_use_AUX_TABLE_42, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_Common, + SCX_use_AUX_TABLE_40, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_41, - 
SCX_use_AUX_TABLE_43, - SCX_use_AUX_TABLE_41, SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_41, + SCX_Unknown, + SCX_use_AUX_TABLE_42, SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, SCX_Unknown, SCX_use_AUX_TABLE_1, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_use_AUX_TABLE_1, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, - SCX_use_AUX_TABLE_37, - SCX_Unknown, + SCX_use_AUX_TABLE_38, SCX_Yi, SCX_Unknown, SCX_Yi, @@ -84783,7 +86335,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Cyrillic, SCX_Bamum, SCX_Unknown, - SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_46, SCX_Common, SCX_Latin, SCX_Common, @@ -84792,11 +86344,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Latin, SCX_Unknown, SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, SCX_Syloti_Nagri, SCX_Unknown, - SCX_use_AUX_TABLE_46, SCX_use_AUX_TABLE_47, SCX_use_AUX_TABLE_48, + SCX_use_AUX_TABLE_49, SCX_Unknown, SCX_Phags_Pa, SCX_Unknown, @@ -84805,21 +86361,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for 
EBCDIC 037 */ SCX_Saurashtra, SCX_Unknown, SCX_Devanagari, - SCX_use_AUX_TABLE_28, + SCX_use_AUX_TABLE_29, SCX_Devanagari, - SCX_use_AUX_TABLE_49, + SCX_use_AUX_TABLE_50, SCX_Devanagari, SCX_Kayah_Li, - SCX_use_AUX_TABLE_50, + SCX_use_AUX_TABLE_51, SCX_Kayah_Li, SCX_Rejang, SCX_Unknown, SCX_Rejang, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Javanese, SCX_Unknown, - SCX_use_AUX_TABLE_51, + SCX_use_AUX_TABLE_52, SCX_Javanese, SCX_Unknown, SCX_Javanese, @@ -84860,15 +86416,15 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Meetei_Mayek, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Latin, SCX_Unknown, @@ -84888,24 +86444,25 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_Common, + SCX_use_AUX_TABLE_53, + SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, SCX_Unknown, SCX_Arabic, - SCX_use_AUX_TABLE_52, + SCX_use_AUX_TABLE_54, + SCX_Arabic, + SCX_use_AUX_TABLE_54, SCX_Arabic, - SCX_use_AUX_TABLE_52, - SCX_Unknown, SCX_Inherited, SCX_Common, SCX_Unknown, SCX_Inherited, SCX_Cyrillic, SCX_Common, - SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_40, SCX_Common, SCX_Unknown, SCX_Common, @@ -84923,20 +86480,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Common, SCX_Latin, SCX_Common, - SCX_use_AUX_TABLE_38, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_41, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_39, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_42, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - 
SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, - SCX_use_AUX_TABLE_23, + SCX_use_AUX_TABLE_24, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -84958,11 +86515,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Linear_B, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_56, SCX_Unknown, - SCX_use_AUX_TABLE_54, + SCX_use_AUX_TABLE_57, SCX_Unknown, - SCX_use_AUX_TABLE_53, + SCX_use_AUX_TABLE_56, SCX_Greek, SCX_Unknown, SCX_Common, @@ -84976,7 +86534,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Carian, SCX_Unknown, - SCX_use_AUX_TABLE_55, + SCX_use_AUX_TABLE_58, SCX_Unknown, SCX_Old_Italic, SCX_Unknown, @@ -85007,6 +86565,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Caucasian_Albanian, SCX_Unknown, SCX_Caucasian_Albanian, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, + SCX_Unknown, + SCX_Vithkuqi, SCX_Unknown, SCX_Linear_A, SCX_Unknown, @@ -85014,6 +86587,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Linear_A, SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Cypriot, SCX_Unknown, SCX_Cypriot, @@ -85073,6 +86652,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Manichaean, SCX_Unknown, SCX_Manichaean, + SCX_use_AUX_TABLE_59, + SCX_Manichaean, SCX_Unknown, SCX_Avestan, SCX_Unknown, @@ -85112,6 +86693,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Sogdian, SCX_Unknown, + SCX_Old_Uyghur, + SCX_Unknown, SCX_Chorasmian, SCX_Unknown, SCX_Elymaic, @@ -85158,9 +86741,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Khudawadi, 
SCX_Unknown, SCX_Grantha, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Unknown, SCX_Grantha, SCX_Unknown, @@ -85174,7 +86757,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Grantha, SCX_Unknown, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Grantha, SCX_Unknown, SCX_Grantha, @@ -85250,6 +86833,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Soyombo, SCX_Unknown, + SCX_Canadian_Aboriginal, SCX_Pau_Cin_Hau, SCX_Unknown, SCX_Bhaiksuki, @@ -85297,9 +86881,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Lisu, SCX_Unknown, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, - SCX_use_AUX_TABLE_19, + SCX_use_AUX_TABLE_20, SCX_Tamil, SCX_Unknown, SCX_Tamil, @@ -85311,6 +86895,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Cuneiform, SCX_Unknown, + SCX_Cypro_Minoan, + SCX_Unknown, SCX_Egyptian_Hieroglyphs, SCX_Unknown, SCX_Egyptian_Hieroglyphs, @@ -85324,6 +86910,9 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Mro, SCX_Unknown, SCX_Mro, + SCX_Tangsa, + SCX_Unknown, + SCX_Tangsa, SCX_Unknown, SCX_Bassa_Vah, SCX_Unknown, @@ -85349,10 +86938,10 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Tangut, SCX_Nushu, - SCX_Common, + SCX_use_AUX_TABLE_38, SCX_Khitan_Small_Script, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Tangut, SCX_Unknown, @@ -85361,13 +86950,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Tangut, SCX_Unknown, - SCX_use_AUX_TABLE_44, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, SCX_Unknown, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_use_AUX_TABLE_44, + SCX_use_AUX_TABLE_45, SCX_Unknown, 
SCX_use_AUX_TABLE_44, SCX_Unknown, + SCX_use_AUX_TABLE_45, + SCX_Unknown, SCX_Nushu, SCX_Unknown, SCX_Duployan, @@ -85380,6 +86976,12 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Duployan, SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Inherited, + SCX_Unknown, + SCX_Common, + SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, @@ -85400,7 +87002,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Common, SCX_Unknown, SCX_Common, @@ -85450,6 +87052,8 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_SignWriting, SCX_Unknown, + SCX_Latin, + SCX_Unknown, SCX_Glagolitic, SCX_Unknown, SCX_Glagolitic, @@ -85468,10 +87072,20 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Nyiakeng_Puachue_Hmong, SCX_Unknown, + SCX_Toto, + SCX_Unknown, SCX_Wancho, SCX_Unknown, SCX_Wancho, SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, + SCX_Ethiopic, + SCX_Unknown, SCX_Mende_Kikakui, SCX_Unknown, SCX_Mende_Kikakui, @@ -85569,14 +87183,14 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Common, SCX_Unknown, SCX_Common, - SCX_use_AUX_TABLE_43, + SCX_use_AUX_TABLE_44, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -85632,19 +87246,21 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ SCX_Unknown, SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_Common, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + 
SCX_use_AUX_TABLE_38, SCX_Unknown, - SCX_use_AUX_TABLE_37, + SCX_use_AUX_TABLE_38, + SCX_Unknown, + SCX_use_AUX_TABLE_38, SCX_Unknown, SCX_Common, SCX_Unknown, @@ -85663,7 +87279,7 @@ static const SCX_enum _Perl_SCX_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ - 1884, /* Number of elements */ + 1949, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -85835,11 +87451,15 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -86033,6 +87653,7 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -86044,6 +87665,8 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -86072,7 +87695,7 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -86252,11 +87875,9 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1740, @@ -86312,12 +87933,12 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -86358,8 +87979,6 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1CFB, 0x1D00, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1F16, 0x1F18, @@ -86550,10 +88169,6 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x2B55, 0x2B56, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -86647,10 +88262,14 @@ static const UV 
_Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0xA6F0, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -86883,12 +88502,34 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -86974,6 +88615,9 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x10F30, 0x10F46, 0x10F51, + 0x10F70, + 0x10F82, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -86984,12 +88628,18 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x11047, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -87175,7 +88825,7 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -87235,6 +88885,8 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -87247,6 +88899,10 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -87280,8 +88936,16 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -87296,6 +88960,10 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 
0x1D16A, 0x1D16D, @@ -87382,6 +89050,8 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -87401,10 +89071,21 @@ static const UV _Perl_WB_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -87764,6 +89445,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Other, + WB_Format, + WB_Other, + WB_Extend, + WB_ALetter, WB_Extend, WB_Format, WB_Extend, @@ -87958,6 +89643,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Other, + WB_Extend, WB_ALetter, WB_Extend, WB_Other, @@ -87970,6 +89656,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Numeric, @@ -88177,8 +89865,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, WB_Extend, WB_Other, WB_ALetter, @@ -88201,7 +89887,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_Extend, WB_Format, - WB_Other, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, @@ -88283,8 +89969,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Extend, - WB_Other, - WB_Extend, WB_ALetter, WB_Other, WB_ALetter, @@ -88477,10 +90161,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, - WB_Other, - WB_ALetter, WB_Extend, WB_ALetter, WB_Other, @@ -88576,6 +90256,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_ALetter, 
WB_Extend, @@ -88843,6 +90527,28 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Extend, @@ -88900,6 +90606,9 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Extend, WB_Other, WB_ALetter, + WB_Extend, + WB_Other, + WB_ALetter, WB_Other, WB_ALetter, WB_Other, @@ -88908,6 +90617,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Extend, WB_Other, WB_Numeric, + WB_Extend, + WB_ALetter, + WB_Extend, + WB_ALetter, WB_Other, WB_Extend, WB_ALetter, @@ -88915,6 +90628,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_Format, WB_Other, + WB_Extend, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -89162,6 +90877,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -89174,6 +90891,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Other, + WB_Numeric, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -89209,6 +90930,14 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_Katakana, WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, WB_ALetter, WB_Other, WB_ALetter, @@ -89224,6 +90953,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Extend, WB_Other, WB_Extend, + WB_Other, + WB_Extend, + WB_Other, + WB_Extend, WB_Format, WB_Extend, WB_Other, @@ -89307,6 +91040,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, 
WB_Extend, WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_Extend, @@ -89328,10 +91063,21 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ WB_Other, WB_ALetter, WB_Extend, + WB_Other, + WB_ALetter, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -89490,7 +91236,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ - 1907, /* Number of elements */ + 1972, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -89685,11 +91431,15 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -89883,6 +91633,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -89894,6 +91645,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -89922,7 +91675,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -90102,11 +91855,9 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1740, @@ -90162,12 +91913,12 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -90208,8 +91959,6 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1CFB, 0x1D00, 
0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1F16, 0x1F18, @@ -90400,10 +92149,6 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x2B55, 0x2B56, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -90497,10 +92242,14 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0xA6F0, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -90733,12 +92482,34 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -90824,6 +92595,9 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x10F30, 0x10F46, 0x10F51, + 0x10F70, + 0x10F82, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -90834,12 +92608,18 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x11047, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -91025,7 +92805,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -91085,6 +92865,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -91097,6 +92879,10 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -91130,8 +92916,16 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 
0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -91146,6 +92940,10 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -91232,6 +93030,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -91251,10 +93051,21 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -91640,6 +93451,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Other, + WB_Format, + WB_Other, + WB_Extend, + WB_ALetter, WB_Extend, WB_Format, WB_Extend, @@ -91834,6 +93649,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Other, + WB_Extend, WB_ALetter, WB_Extend, WB_Other, @@ -91846,6 +93662,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Numeric, @@ -92053,8 +93871,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, WB_Extend, WB_Other, WB_ALetter, @@ -92077,7 +93893,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_Extend, WB_Format, - WB_Other, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, @@ -92159,8 +93975,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Extend, - WB_Other, - WB_Extend, WB_ALetter, WB_Other, WB_ALetter, @@ -92353,10 +94167,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, - 
WB_Other, - WB_ALetter, WB_Extend, WB_ALetter, WB_Other, @@ -92452,6 +94262,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_ALetter, WB_Extend, @@ -92719,6 +94533,28 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Extend, @@ -92776,6 +94612,9 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Extend, WB_Other, WB_ALetter, + WB_Extend, + WB_Other, + WB_ALetter, WB_Other, WB_ALetter, WB_Other, @@ -92784,6 +94623,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Extend, WB_Other, WB_Numeric, + WB_Extend, + WB_ALetter, + WB_Extend, + WB_ALetter, WB_Other, WB_Extend, WB_ALetter, @@ -92791,6 +94634,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_Format, WB_Other, + WB_Extend, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -93038,6 +94883,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -93050,6 +94897,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Other, + WB_Numeric, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -93085,6 +94936,14 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_Katakana, WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, WB_ALetter, WB_Other, WB_ALetter, @@ -93100,6 +94959,10 @@ static const WB_enum 
_Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Extend, WB_Other, WB_Extend, + WB_Other, + WB_Extend, + WB_Other, + WB_Extend, WB_Format, WB_Extend, WB_Other, @@ -93183,6 +95046,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_Extend, WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_Extend, @@ -93204,10 +95069,21 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ WB_Other, WB_ALetter, WB_Extend, + WB_Other, + WB_ALetter, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -93366,7 +95242,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ - 1903, /* Number of elements */ + 1968, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -93557,11 +95433,15 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -93755,6 +95635,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, + 0xC3C, 0xC3D, 0xC3E, 0xC45, @@ -93766,6 +95647,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC64, @@ -93794,7 +95677,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -93974,11 +95857,9 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1732, 0x1735, 0x1740, @@ -94034,12 +95915,12 @@ static const UV 
_Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -94080,8 +95961,6 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1CFB, 0x1D00, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1F16, 0x1F18, @@ -94272,10 +96151,6 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x2B55, 0x2B56, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -94369,10 +96244,14 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0xA6F0, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -94605,12 +96484,34 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -94696,6 +96597,9 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x10F30, 0x10F46, 0x10F51, + 0x10F70, + 0x10F82, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -94706,12 +96610,18 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x11047, 0x11066, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -94897,7 +96807,7 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -94957,6 +96867,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -94969,6 +96881,10 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 
*/ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -95002,8 +96918,16 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -95018,6 +96942,10 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -95104,6 +97032,8 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -95123,10 +97053,21 @@ static const UV _Perl_WB_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, + 0x1E2AF, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -95508,6 +97449,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_ALetter, WB_Other, + WB_Format, + WB_Other, + WB_Extend, + WB_ALetter, WB_Extend, WB_Format, WB_Extend, @@ -95702,6 +97647,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_ALetter, WB_Other, + WB_Extend, WB_ALetter, WB_Extend, WB_Other, @@ -95714,6 +97660,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Numeric, @@ -95921,8 +97869,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, WB_Extend, WB_Other, WB_ALetter, @@ -95945,7 +97891,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_Extend, WB_Format, - WB_Other, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, @@ -96027,8 +97973,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, 
WB_ALetter, WB_Extend, - WB_Other, - WB_Extend, WB_ALetter, WB_Other, WB_ALetter, @@ -96221,10 +98165,6 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_ALetter, WB_Other, WB_ALetter, - WB_Other, - WB_ALetter, - WB_Other, - WB_ALetter, WB_Extend, WB_ALetter, WB_Other, @@ -96320,6 +98260,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_ALetter, WB_Extend, @@ -96587,6 +98531,28 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_ALetter, WB_Other, WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, WB_Extend, WB_Other, WB_Extend, @@ -96644,6 +98610,9 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Extend, WB_Other, WB_ALetter, + WB_Extend, + WB_Other, + WB_ALetter, WB_Other, WB_ALetter, WB_Other, @@ -96652,6 +98621,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Extend, WB_Other, WB_Numeric, + WB_Extend, + WB_ALetter, + WB_Extend, + WB_ALetter, WB_Other, WB_Extend, WB_ALetter, @@ -96659,6 +98632,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_Format, WB_Other, + WB_Extend, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -96906,6 +98881,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, WB_Format, WB_Other, WB_ALetter, @@ -96918,6 +98895,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_ALetter, WB_Other, + WB_Numeric, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -96953,6 +98934,14 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ 
WB_Other, WB_Katakana, WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, + WB_Katakana, + WB_Other, WB_ALetter, WB_Other, WB_ALetter, @@ -96968,6 +98957,10 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Extend, WB_Other, WB_Extend, + WB_Other, + WB_Extend, + WB_Other, + WB_Extend, WB_Format, WB_Extend, WB_Other, @@ -97051,6 +99044,8 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_Extend, WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_Extend, @@ -97072,10 +99067,21 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ WB_Other, WB_ALetter, WB_Extend, + WB_Other, + WB_ALetter, + WB_Extend, WB_Numeric, WB_Other, WB_ALetter, WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, + WB_ALetter, + WB_Other, WB_Extend, WB_Other, WB_ALetter, @@ -97231,7 +99237,7 @@ static const WB_enum _Perl_WB_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV Simple_Case_Folding_invlist[] = { /* for ASCII/Latin1 */ - 1291, /* Number of elements */ + 1307, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -98155,7 +100161,7 @@ static const UV Simple_Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -98499,6 +100505,8 @@ static const UV Simple_Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -98508,6 +100516,12 @@ static const UV Simple_Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -98518,6 +100532,14 @@ static const UV Simple_Case_Folding_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 
0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -99801,6 +101823,8 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -99810,6 +101834,12 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0x13A0, @@ -99820,6 +101850,14 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -99842,7 +101880,7 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 1047 */ - 1309, /* Number of elements */ + 1325, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -100784,7 +102822,7 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -101128,6 +103166,8 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -101137,6 +103177,12 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -101147,6 +103193,14 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -102451,6 +104505,8 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -102460,6 +104516,12 @@ static const I32 
Simple_Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0x13A0, @@ -102470,6 +104532,14 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, + 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -102492,7 +104562,7 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 037 */ - 1305, /* Number of elements */ + 1321, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -103430,7 +105500,7 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -103774,6 +105844,8 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, @@ -103783,6 +105855,12 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -103793,6 +105871,14 @@ static const UV Simple_Case_Folding_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -105093,6 +107179,8 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BF, 0, + 0xA7C1, + 0, 0xA7C3, 0, 0xA794, @@ -105102,6 +107190,12 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7CA, 0, + 0xA7D1, + 0, + 0xA7D7, + 0, + 0xA7D9, + 0, 0xA7F6, 0, 0x13A0, @@ -105112,6 +107206,14 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 037 */ 0, 0x104D8, 0, + 0x10597, + 0, + 0x105A3, + 0, + 0x105B3, 
+ 0, + 0x105BB, + 0, 0x10CC0, 0, 0x118C0, @@ -105131,7 +107233,7 @@ static const I32 Simple_Case_Folding_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV Titlecase_Mapping_invlist[] = { /* for ASCII/Latin1 */ - 1340, /* Number of elements */ + 1356, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -106105,7 +108207,7 @@ static const UV Titlecase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -106436,12 +108538,20 @@ static const UV Titlecase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -106467,6 +108577,14 @@ static const UV Titlecase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -108182,12 +110300,20 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -108213,6 +110339,14 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -108235,7 +110369,7 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 1047 */ - 1356, /* Number of elements */ + 1372, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -109225,7 +111359,7 @@ static const UV 
Titlecase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -109556,12 +111690,20 @@ static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -109587,6 +111729,14 @@ static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -111321,12 +113471,20 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -111352,6 +113510,14 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -111374,7 +113540,7 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 037 */ - 1354, /* Number of elements */ + 1370, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -112362,7 +114528,7 @@ static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -112693,12 +114859,20 @@ static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -112724,6 +114898,14 @@ static const UV Titlecase_Mapping_invlist[] = { /* for EBCDIC 037 */ 
0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -114456,12 +116638,20 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -114487,6 +116677,14 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -114506,7 +116704,7 @@ static const I32 Titlecase_Mapping_invmap[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV Uppercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ - 1391, /* Number of elements */ + 1407, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -115531,7 +117729,7 @@ static const UV Uppercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -115862,12 +118060,20 @@ static const UV Uppercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -115893,6 +118099,14 @@ static const UV Uppercase_Mapping_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -117875,12 +120089,20 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -117906,6 +120128,14 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 
0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -117928,7 +120158,7 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ - 1407, /* Number of elements */ + 1423, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -118969,7 +121199,7 @@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -119300,12 +121530,20 @@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -119331,6 +121569,14 @@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -121332,12 +123578,20 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -121363,6 +123617,14 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -121385,7 +123647,7 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 037 */ - 1405, /* Number of elements */ + 1421, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -122424,7 +124686,7 
@@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -122755,12 +125017,20 @@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -122786,6 +125056,14 @@ static const UV Uppercase_Mapping_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -124785,12 +127063,20 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0xA7BE, 0, + 0xA7C0, + 0, 0xA7C2, 0, 0xA7C7, 0, 0xA7C9, 0, + 0xA7D0, + 0, + 0xA7D6, + 0, + 0xA7D8, + 0, 0xA7F5, 0, 0xA7B3, @@ -124816,6 +127102,14 @@ static const I32 Uppercase_Mapping_invmap[] = { /* for EBCDIC 037 */ 0, 0x104B0, 0, + 0x10570, + 0, + 0x1057C, + 0, + 0x1058C, + 0, + 0x10594, + 0, 0x10C80, 0, 0x118A0, @@ -125138,7 +127432,7 @@ static const UV UNI_ASCII_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ - 1354, /* Number of elements */ + 1396, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -125167,8 +127461,6 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -125186,11 +127478,11 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -125346,7 +127638,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -125356,6 +127648,8 @@ 
static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -125378,7 +127672,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -125513,10 +127807,8 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -125533,8 +127825,6 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -125573,11 +127863,11 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -125593,8 +127883,6 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -125635,7 +127923,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -125649,10 +127937,6 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -125683,7 +127967,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -125707,8 +127991,6 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -125717,10 +127999,14 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -125791,16 +128077,14 @@ static const UV UNI_ASSIGNED_invlist[] = { 
/* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -125887,13 +128171,33 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -125980,6 +128284,8 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -125987,9 +128293,9 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -126073,7 +128379,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -126081,7 +128387,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -126112,7 +128418,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -126168,6 +128474,8 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -126181,7 +128489,9 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -126214,8 +128524,14 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 
0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -126232,12 +128548,18 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -126292,6 +128614,8 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -126310,10 +128634,20 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -126422,7 +128756,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -126432,6 +128766,8 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -126445,27 +128781,27 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -126473,9 +128809,9 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -126501,7 +128837,7 @@ static const UV UNI_ASSIGNED_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV 
UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ - 283, /* Number of elements */ + 311, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -126661,10 +128997,6 @@ static const UV UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -126685,9 +129017,13 @@ static const UV UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA7F5, 0xA7F7, 0xA7F8, @@ -126712,6 +129048,30 @@ static const UV UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x10CC0, @@ -126780,6 +129140,10 @@ static const UV UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 0x1E944, 0x1F130, @@ -126798,7 +129162,7 @@ static const UV UNI_CASED_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ - 309, /* Number of elements */ + 337, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -126984,10 +129348,6 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -127008,9 +129368,13 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 
0xA7DA, 0xA7F5, 0xA7F7, 0xA7F8, @@ -127035,6 +129399,30 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x10CC0, @@ -127103,6 +129491,10 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 0x1E944, 0x1F130, @@ -127121,7 +129513,7 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ - 305, /* Number of elements */ + 333, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -127303,10 +129695,6 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -127327,9 +129715,13 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA7F5, 0xA7F7, 0xA7F8, @@ -127354,6 +129746,30 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x10CC0, @@ -127422,6 +129838,10 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 
0x1E944, 0x1F130, @@ -127437,7 +129857,7 @@ static const UV UNI_CASED_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ - 265, /* Number of elements */ + 285, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -127581,10 +130001,6 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C7C, 0x2C7E, 0x2CE5, @@ -127609,9 +130025,13 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA7F5, 0xA7F7, 0xA7FA, @@ -127636,6 +130056,22 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -127704,6 +130140,10 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 0x1E944 }; @@ -127716,7 +130156,7 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 1047 */ - 297, /* Number of elements */ + 317, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -127892,10 +130332,6 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 1047 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C7C, 0x2C7E, 0x2CE5, @@ -127920,9 +130356,13 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for 
EBCDIC 1047 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA7F5, 0xA7F7, 0xA7FA, @@ -127947,6 +130387,22 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 1047 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -128015,6 +130471,10 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 0x1E944 }; @@ -128027,7 +130487,7 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ - 293, /* Number of elements */ + 313, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -128199,10 +130659,6 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C7C, 0x2C7E, 0x2CE5, @@ -128227,9 +130683,13 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ 0xA78B, 0xA78F, 0xA790, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA7F5, 0xA7F7, 0xA7FA, @@ -128254,6 +130714,22 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -128322,6 +130798,10 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E900, 0x1E944 }; @@ -128331,7 
+130811,7 @@ static const UV UNI_CASEDLETTER_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ - 1291, /* Number of elements */ + 1315, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -129199,7 +131679,7 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0x2184, 0x2185, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -129536,12 +132016,24 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7FA, @@ -129562,6 +132054,14 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -129624,6 +132124,10 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -129636,7 +132140,7 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ - 1305, /* Number of elements */ + 1329, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -130518,7 +133022,7 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0x2184, 0x2185, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -130855,12 +133359,24 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, 
+ 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7FA, @@ -130881,6 +133397,14 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -130943,6 +133467,10 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -130955,7 +133483,7 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 037 */ - 1305, /* Number of elements */ + 1329, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -131837,7 +134365,7 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0x2184, 0x2185, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -132174,12 +134702,24 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7FA, @@ -132200,6 +134740,14 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -132262,6 +134810,10 @@ static const UV UNI_LOWERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -133258,7 +135810,7 @@ static const UV 
UNI_TITLE_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ - 1277, /* Number of elements */ + 1293, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -134126,7 +136678,7 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0x2183, 0x2184, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -134455,12 +137007,20 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -134469,6 +137029,14 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -134549,7 +137117,7 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ - 1295, /* Number of elements */ + 1311, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -135435,7 +138003,7 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0x2183, 0x2184, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -135764,12 +138332,20 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -135778,6 +138354,14 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 
0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -135858,7 +138442,7 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 037 */ - 1291, /* Number of elements */ + 1307, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -136740,7 +139324,7 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0x2183, 0x2184, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -137069,12 +139653,20 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -137083,6 +139675,14 @@ static const UV UNI_UPPERCASELETTER_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -137224,7 +139824,7 @@ static const UV UNI_VERTSPACE_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ - 1465, /* Number of elements */ + 1521, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -137333,10 +139933,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -137523,6 +140125,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -137547,7 
+140151,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -137710,10 +140314,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 0x1734, 0x1740, 0x1754, @@ -137771,12 +140373,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -137884,10 +140488,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -137952,8 +140552,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -137972,10 +140570,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -138145,12 +140747,34 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -138227,6 +140851,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, @@ -138235,8 +140861,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x11046, 0x11066, 0x11070, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ 
-138351,6 +140981,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1172B, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -138391,7 +141023,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -138451,6 +141083,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -138461,6 +141095,10 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16B00, @@ -138493,8 +141131,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -138573,6 +141217,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1D7CC, 0x1D7CE, 0x1D800, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -138591,10 +141237,20 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -138680,9 +141336,9 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -138703,7 +141359,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ - 1489, /* Number of elements */ + 1545, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it 
starts at the element beyond 0 */ @@ -138836,10 +141492,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -139026,6 +141684,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -139050,7 +141710,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -139213,10 +141873,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 0x1734, 0x1740, 0x1754, @@ -139274,12 +141932,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -139387,10 +142047,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -139455,8 +142111,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -139475,10 +142129,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -139648,12 +142306,34 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 
0x10806, 0x10808, @@ -139730,6 +142410,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, @@ -139738,8 +142420,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x11046, 0x11066, 0x11070, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -139854,6 +142540,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1172B, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -139894,7 +142582,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -139954,6 +142642,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -139964,6 +142654,10 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16B00, @@ -139996,8 +142690,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -140076,6 +142776,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1D7CC, 0x1D7CE, 0x1D800, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -140094,10 +142796,20 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -140183,9 +142895,9 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 
0x2B81E, 0x2B820, @@ -140206,7 +142918,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ - 1485, /* Number of elements */ + 1541, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -140335,10 +143047,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -140525,6 +143239,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -140549,7 +143265,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -140712,10 +143428,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 0x1734, 0x1740, 0x1754, @@ -140773,12 +143487,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -140886,10 +143602,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -140954,8 +143666,6 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -140974,10 +143684,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -141147,12 +143861,34 @@ static const UV 
UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -141229,6 +143965,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, @@ -141237,8 +143975,12 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x11046, 0x11066, 0x11070, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -141353,6 +144095,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1172B, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -141393,7 +144137,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -141453,6 +144197,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -141463,6 +144209,10 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16B00, @@ -141495,8 +144245,14 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -141575,6 +144331,8 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1D7CC, 0x1D7CE, 0x1D800, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -141593,10 +144351,20 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 
0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -141682,9 +144450,9 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -141702,7 +144470,7 @@ static const UV UNI_XPOSIXALNUM_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ - 1391, /* Number of elements */ + 1445, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -141811,10 +144579,12 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -141993,6 +144763,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC80, @@ -142015,7 +144787,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -142168,10 +144940,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 0x1734, 0x1740, 0x1754, @@ -142219,12 +144989,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B80, 0x1BAA, 0x1BAC, @@ -142332,10 +145104,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -142400,8 +145168,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 
*/ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -142422,10 +145188,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -142589,12 +145359,34 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -142669,14 +145461,20 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11000, 0x11046, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x11100, @@ -142777,6 +145575,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1171B, 0x1171D, 0x1172B, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -142815,7 +145615,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -142869,6 +145669,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -142877,6 +145679,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -142907,8 +145711,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ 
-142985,6 +145795,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -143001,8 +145813,18 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -143084,9 +145906,9 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ 0x1F170, 0x1F18A, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -143107,7 +145929,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ - 1417, /* Number of elements */ + 1471, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -143242,10 +146064,12 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -143424,6 +146248,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC80, @@ -143446,7 +146272,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -143599,10 +146425,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 0x1734, 0x1740, 0x1754, @@ -143650,12 +146474,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B80, 0x1BAA, 0x1BAC, @@ 
-143763,10 +146589,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -143831,8 +146653,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -143853,10 +146673,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -144020,12 +146844,34 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -144100,14 +146946,20 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11000, 0x11046, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x11100, @@ -144208,6 +147060,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1171B, 0x1171D, 0x1172B, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -144246,7 +147100,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -144300,6 +147154,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -144308,6 +147164,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 
0x16B00, @@ -144338,8 +147196,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -144416,6 +147280,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -144432,8 +147298,18 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -144515,9 +147391,9 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ 0x1F170, 0x1F18A, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -144538,7 +147414,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ - 1413, /* Number of elements */ + 1467, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -144669,10 +147545,12 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8D4, 0x8E0, 0x8E3, @@ -144851,6 +147729,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC80, @@ -144873,7 +147753,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0xCCD, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -145026,10 +147906,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1714, - 0x1720, + 0x171F, 
0x1734, 0x1740, 0x1754, @@ -145077,12 +147955,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x1AA8, 0x1ABF, 0x1AC1, + 0x1ACC, + 0x1ACF, 0x1B00, 0x1B34, 0x1B35, 0x1B44, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B80, 0x1BAA, 0x1BAC, @@ -145190,10 +148070,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -145258,8 +148134,6 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -145280,10 +148154,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA806, 0xA807, 0xA828, @@ -145447,12 +148325,34 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -145527,14 +148427,20 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11000, 0x11046, + 0x11071, + 0x11076, 0x11082, 0x110B9, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x11100, @@ -145635,6 +148541,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x1171B, 0x1171D, 0x1172B, + 0x11740, + 0x11747, 0x11800, 0x11839, 0x118A0, @@ -145673,7 +148581,7 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x11A98, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -145727,6 +148635,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 
037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -145735,6 +148645,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -145765,8 +148677,14 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -145843,6 +148761,8 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -145859,8 +148779,18 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -145942,9 +148872,9 @@ static const UV UNI_XPOSIXALPHA_invlist[] = { /* for EBCDIC 037 */ 0x1F170, 0x1F18A, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -146099,7 +149029,7 @@ static const UV UNI_XPOSIXCNTRL_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for ASCII/Latin1 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -146214,6 +149144,8 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for ASCII/Latin1 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -146236,7 +149168,7 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 1047 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* 
Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -146351,6 +149283,8 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 1047 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -146373,7 +149307,7 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 037 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -146488,6 +149422,8 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 037 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -146507,7 +149443,7 @@ static const UV UNI_XPOSIXDIGIT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ - 1365, /* Number of elements */ + 1407, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -146539,8 +149475,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -146558,11 +149492,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -146718,7 +149652,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -146728,6 +149662,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -146750,7 +149686,7 @@ static const UV 
UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -146887,10 +149823,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -146907,8 +149841,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -146947,11 +149879,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -146967,8 +149899,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -147015,7 +149945,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -147029,10 +149959,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -147063,7 +149989,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -147087,8 +150013,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -147097,10 +150021,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -147171,16 +150099,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 
0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -147267,13 +150193,33 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -147360,6 +150306,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -147367,9 +150315,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -147453,7 +150401,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -147461,7 +150409,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -147492,7 +150440,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -147548,6 +150496,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -147561,7 +150511,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -147594,8 +150546,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 
0x1B164, @@ -147612,12 +150570,18 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -147672,6 +150636,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -147690,10 +150656,20 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -147802,7 +150778,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -147812,6 +150788,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -147825,27 +150803,27 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -147853,9 +150831,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -147886,7 +150864,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ - 1365, /* Number 
of elements */ + 1407, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -147918,8 +150896,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -147937,11 +150913,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -148097,7 +151073,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -148107,6 +151083,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -148129,7 +151107,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -148266,10 +151244,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -148286,8 +151262,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -148326,11 +151300,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -148346,8 +151320,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -148394,7 +151366,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -148408,10 +151380,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { 
/* for EBCDIC 1047 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -148442,7 +151410,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -148466,8 +151434,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -148476,10 +151442,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -148550,16 +151520,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -148646,13 +151614,33 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -148739,6 +151727,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -148746,9 +151736,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -148832,7 +151822,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -148840,7 +151830,7 @@ static const UV 
UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -148871,7 +151861,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -148927,6 +151917,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -148940,7 +151932,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -148973,8 +151967,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -148991,12 +151991,18 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -149051,6 +152057,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -149069,10 +152077,20 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -149181,7 +152199,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -149191,6 +152209,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ 
-149204,27 +152224,27 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -149232,9 +152252,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -149265,7 +152285,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ - 1365, /* Number of elements */ + 1407, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -149297,8 +152317,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -149316,11 +152334,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -149476,7 +152494,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -149486,6 +152504,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -149508,7 +152528,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -149645,10 +152665,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 
0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -149665,8 +152683,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -149705,11 +152721,11 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -149725,8 +152741,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -149773,7 +152787,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -149787,10 +152801,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -149821,7 +152831,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -149845,8 +152855,6 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -149855,10 +152863,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -149929,16 +152941,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -150025,13 +153035,33 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 
0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -150118,6 +153148,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -150125,9 +153157,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -150211,7 +153243,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -150219,7 +153251,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -150250,7 +153282,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -150306,6 +153338,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -150319,7 +153353,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -150352,8 +153388,14 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -150370,12 +153412,18 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 
0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -150430,6 +153478,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -150448,10 +153498,20 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -150560,7 +153620,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -150570,6 +153630,8 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -150583,27 +153645,27 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -150611,9 +153673,9 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -150641,7 +153703,7 @@ static const UV UNI_XPOSIXGRAPH_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ - 1305, /* Number of elements */ + 1337, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -151525,7 +154587,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 
0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -151860,12 +154922,24 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -151886,6 +154960,22 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -151948,6 +155038,10 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -151960,7 +155054,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ - 1313, /* Number of elements */ + 1345, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -152852,7 +155946,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -153187,12 +156281,24 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -153213,6 +156319,22 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, 
+ 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -153275,6 +156397,10 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -153287,7 +156413,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ - 1313, /* Number of elements */ + 1345, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -154179,7 +157305,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -154514,12 +157640,24 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -154540,6 +157678,22 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -154602,6 +157756,10 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -154611,7 +157769,7 @@ static const UV UNI_XPOSIXLOWER_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ - 1359, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list 
starts at 0; 1 if it starts at the element beyond 0 */ @@ -154643,8 +157801,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -154662,11 +157818,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -154822,7 +157978,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -154832,6 +157988,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -154854,7 +158012,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -154989,10 +158147,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -155009,8 +158165,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -155049,11 +158203,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -155069,8 +158223,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -155113,7 +158265,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -155127,10 +158279,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 
0x2D26, @@ -155161,7 +158309,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -155185,8 +158333,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -155195,10 +158341,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -155269,16 +158419,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -155365,13 +158513,33 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -155458,6 +158626,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -155465,9 +158635,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -155551,7 +158721,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -155559,7 +158729,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 
0x1183C, 0x118A0, @@ -155590,7 +158760,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -155646,6 +158816,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -155659,7 +158831,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -155692,8 +158866,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -155710,12 +158890,18 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -155770,6 +158956,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -155788,10 +158976,20 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -155900,7 +159098,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -155910,6 +159108,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -155923,27 +159123,27 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 
0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -155951,9 +159151,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -155984,7 +159184,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ - 1359, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -156016,8 +159216,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -156035,11 +159233,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -156195,7 +159393,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -156205,6 +159403,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -156227,7 +159427,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -156362,10 +159562,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 
0x1754, @@ -156382,8 +159580,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -156422,11 +159618,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -156442,8 +159638,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -156486,7 +159680,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -156500,10 +159694,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -156534,7 +159724,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -156558,8 +159748,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -156568,10 +159756,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -156642,16 +159834,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -156738,13 +159928,33 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 
0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -156831,6 +160041,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -156838,9 +160050,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -156924,7 +160136,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -156932,7 +160144,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -156963,7 +160175,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -157019,6 +160231,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -157032,7 +160246,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -157065,8 +160281,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -157083,12 +160305,18 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -157143,6 +160371,8 @@ static const 
UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -157161,10 +160391,20 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -157273,7 +160513,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -157283,6 +160523,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -157296,27 +160538,27 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -157324,9 +160566,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -157357,7 +160599,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ - 1359, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -157389,8 +160631,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -157408,11 
+160648,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -157568,7 +160808,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -157578,6 +160818,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -157600,7 +160842,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -157735,10 +160977,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -157755,8 +160995,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -157795,11 +161033,11 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -157815,8 +161053,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -157859,7 +161095,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -157873,10 +161109,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -157907,7 +161139,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -157931,8 +161163,6 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for 
EBCDIC 037 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -157941,10 +161171,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -158015,16 +161249,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -158111,13 +161343,33 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -158204,6 +161456,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -158211,9 +161465,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -158297,7 +161551,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -158305,7 +161559,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -158336,7 +161590,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -158392,6 +161646,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for 
EBCDIC 037 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -158405,7 +161661,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -158438,8 +161696,14 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -158456,12 +161720,18 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -158516,6 +161786,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -158534,10 +161806,20 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -158646,7 +161928,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -158656,6 +161938,8 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -158669,27 +161953,27 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 
0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -158697,9 +161981,9 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -158727,7 +162011,7 @@ static const UV UNI_XPOSIXPRINT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ - 361, /* Number of elements */ + 369, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -158776,7 +162060,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -158854,6 +162138,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -158903,7 +162189,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -159014,6 +162300,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -159050,6 +162338,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -159074,6 +162364,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -159102,7 +162394,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ - 369, /* Number of elements */ + 377, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list 
starts at 0; 1 if it starts at the element beyond 0 */ @@ -159159,7 +162451,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -159237,6 +162529,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -159286,7 +162580,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -159397,6 +162691,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -159433,6 +162729,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -159457,6 +162755,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -159485,7 +162785,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ - 371, /* Number of elements */ + 379, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -159544,7 +162844,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -159622,6 +162922,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -159671,7 +162973,7 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -159782,6 +163084,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* 
for EBCDIC 037 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -159818,6 +163122,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -159842,6 +163148,8 @@ static const UV UNI_XPOSIXPUNCT_invlist[] = { /* for EBCDIC 037 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -159973,7 +163281,7 @@ static const UV UNI_XPOSIXSPACE_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for ASCII/Latin1 */ - 1287, /* Number of elements */ + 1303, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -160845,7 +164153,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -161174,12 +164482,20 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -161188,6 +164504,14 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -161274,7 +164598,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 1047 */ - 1305, /* Number of elements */ + 1321, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -162164,7 +165488,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 1047 */ 
0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -162493,12 +165817,20 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -162507,6 +165839,14 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -162593,7 +165933,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 037 */ - 1301, /* Number of elements */ + 1317, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -163479,7 +166819,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -163808,12 +167148,20 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -163822,6 +167170,14 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -163905,7 +167261,7 @@ static const UV UNI_XPOSIXUPPER_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ - 1467, /* Number of elements */ + 1519, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if 
it starts at the element beyond 0 */ @@ -164010,11 +167366,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -164182,7 +167538,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -164192,6 +167548,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -164216,7 +167574,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -164381,10 +167739,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -164404,7 +167760,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -164441,9 +167797,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -164467,8 +167823,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -164551,10 +167905,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -164619,8 +167969,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -164639,10 +167987,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 
0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -164820,12 +168172,34 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -164906,6 +168280,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -164913,9 +168289,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -165022,6 +168400,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -165058,7 +168438,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -165110,6 +168490,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -165120,6 +168502,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -165154,8 +168540,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -165172,6 +168564,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 
0x1D16A, 0x1D16D, @@ -165258,6 +168654,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -165276,8 +168674,18 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -165361,9 +168769,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -165386,7 +168794,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ - 1491, /* Number of elements */ + 1543, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -165515,11 +168923,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -165687,7 +169095,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -165697,6 +169105,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -165721,7 +169131,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -165886,10 +169296,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -165909,7 +169317,7 @@ static const 
UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -165946,9 +169354,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -165972,8 +169380,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -166056,10 +169462,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -166124,8 +169526,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -166144,10 +169544,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -166325,12 +169729,34 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -166411,6 +169837,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -166418,9 +169846,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -166527,6 +169957,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 
0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -166563,7 +169995,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -166615,6 +170047,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -166625,6 +170059,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -166659,8 +170097,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -166677,6 +170121,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -166763,6 +170211,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -166781,8 +170231,18 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -166866,9 +170326,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -166891,7 +170351,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ - 1487, /* Number of elements */ + 1539, /* Number of elements */ 148565664, /* Version and data structure 
type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -167016,11 +170476,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -167188,7 +170648,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -167198,6 +170658,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -167222,7 +170684,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -167387,10 +170849,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -167410,7 +170870,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -167447,9 +170907,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -167473,8 +170933,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -167557,10 +171015,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -167625,8 +171079,6 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -167645,10 +171097,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 
0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -167826,12 +171282,34 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -167912,6 +171390,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -167919,9 +171399,11 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -168028,6 +171510,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -168064,7 +171548,7 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -168116,6 +171600,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -168126,6 +171612,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -168160,8 +171650,14 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -168178,6 +171674,10 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 
0x1D165, 0x1D16A, 0x1D16D, @@ -168264,6 +171764,8 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -168282,8 +171784,18 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -168367,9 +171879,9 @@ static const UV UNI_XPOSIXWORD_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -168467,7 +171979,7 @@ static const UV UNI_XPOSIXXDIGIT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for ASCII/Latin1 */ - 269, /* Number of elements */ + 283, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -168669,10 +172181,6 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -168707,9 +172215,11 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for ASCII/Latin1 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ -168730,6 +172240,22 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for ASCII/Latin1 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -168750,7 +172276,7 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* 
for EBCDIC 1047 */ - 301, /* Number of elements */ + 315, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -168984,10 +172510,6 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -169022,9 +172544,11 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 1047 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ -169045,6 +172569,22 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 1047 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -169065,7 +172605,7 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 037 */ - 297, /* Number of elements */ + 311, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -169295,10 +172835,6 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -169333,9 +172869,11 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 037 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ -169356,6 +172894,22 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 037 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 
0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -169373,7 +172927,7 @@ static const UV UNI__PERL_ANY_FOLDS_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ - 1257, /* Number of elements */ + 1309, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -169476,10 +173030,12 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -169608,6 +173164,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -169624,7 +173182,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -169767,10 +173325,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -169813,7 +173369,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -169915,10 +173471,6 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -169977,8 +173529,6 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -169999,10 +173549,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 
+ 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -170192,12 +173746,34 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -170268,12 +173844,18 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -170356,6 +173938,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -170394,7 +173978,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -170428,6 +174012,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -170436,6 +174022,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -170464,8 +174052,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -170540,14 +174134,26 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 
0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -170621,9 +174227,9 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -170644,7 +174250,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ - 1283, /* Number of elements */ + 1335, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -170773,10 +174379,12 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -170905,6 +174513,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -170921,7 +174531,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -171064,10 +174674,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -171110,7 +174718,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -171212,10 +174820,6 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -171274,8 +174878,6 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 
0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -171296,10 +174898,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -171489,12 +175095,34 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -171565,12 +175193,18 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -171653,6 +175287,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -171691,7 +175327,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -171725,6 +175361,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -171733,6 +175371,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -171761,8 +175401,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 
0x1B164, @@ -171837,14 +175483,26 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -171918,9 +175576,9 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -171941,7 +175599,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ - 1279, /* Number of elements */ + 1331, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -172066,10 +175724,12 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -172198,6 +175858,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -172214,7 +175876,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -172357,10 +176019,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -172403,7 +176063,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -172505,10 +176165,6 @@ static const UV 
UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -172567,8 +176223,6 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -172589,10 +176243,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -172782,12 +176440,34 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -172858,12 +176538,18 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -172946,6 +176632,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -172984,7 +176672,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -173018,6 +176706,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -173026,6 +176716,8 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 
0x16AD0, 0x16AEE, 0x16B00, @@ -173054,8 +176746,14 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -173130,14 +176828,26 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -173211,9 +176921,9 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -173231,7 +176941,7 @@ static const UV UNI__PERL_CHARNAME_BEGIN_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 */ - 1481, /* Number of elements */ + 1533, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -173344,11 +177054,11 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -173516,7 +177226,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -173526,6 +177236,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -173550,7 +177262,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ 
-173715,10 +177427,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -173738,7 +177448,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -173777,9 +177487,9 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -173803,8 +177513,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -173887,10 +177595,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -173953,8 +177657,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -173973,10 +177675,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -174166,12 +177872,34 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -174252,6 +177980,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 
0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -174259,9 +177989,11 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -174368,6 +178100,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -174404,7 +178138,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -174456,6 +178190,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -174466,6 +178202,10 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -174500,8 +178240,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -174518,6 +178264,10 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -174604,6 +178354,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -174622,8 +178374,18 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -174701,9 +178463,9 @@ static const UV 
UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -174726,7 +178488,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for ASCII/Latin1 * && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ - 1507, /* Number of elements */ + 1559, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -174865,11 +178627,11 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -175037,7 +178799,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -175047,6 +178809,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -175071,7 +178835,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -175236,10 +179000,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -175259,7 +179021,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -175298,9 +179060,9 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -175324,8 +179086,6 @@ static const UV 
UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -175408,10 +179168,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -175474,8 +179230,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -175494,10 +179248,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -175687,12 +179445,34 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -175773,6 +179553,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -175780,9 +179562,11 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -175889,6 +179673,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -175925,7 +179711,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ 
-175977,6 +179763,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -175987,6 +179775,10 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -176021,8 +179813,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -176039,6 +179837,10 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -176125,6 +179927,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -176143,8 +179947,18 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -176222,9 +180036,9 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -176247,7 +180061,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ - 1503, /* Number of elements */ + 1555, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -176382,11 +180196,11 @@ static 
const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -176554,7 +180368,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -176564,6 +180378,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -176588,7 +180404,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -176753,10 +180569,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -176776,7 +180590,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -176815,9 +180629,9 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -176841,8 +180655,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -176925,10 +180737,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -176991,8 +180799,6 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -177011,10 +180817,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 
0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -177204,12 +181014,34 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -177290,6 +181122,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -177297,9 +181131,11 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -177406,6 +181242,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -177442,7 +181280,7 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -177494,6 +181332,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -177504,6 +181344,10 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -177538,8 +181382,14 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -177556,6 +181406,10 @@ static const UV 
UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -177642,6 +181496,8 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -177660,8 +181516,18 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -177739,9 +181605,9 @@ static const UV UNI__PERL_CHARNAME_CONTINUE_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -177977,7 +181843,7 @@ static const UV UNI__PERL_FOLDS_TO_MULTI_CHAR_invlist[] = { /* for EBCDIC 037 * # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ - 1475, /* Number of elements */ + 1527, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -178084,11 +181950,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -178256,7 +182122,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -178266,6 +182132,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -178290,7 +182158,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -178455,10 +182323,8 @@ static const UV 
UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -178478,7 +182344,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -178517,9 +182383,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -178543,8 +182409,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -178627,10 +182491,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -178693,8 +182553,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -178713,10 +182571,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -178906,12 +182768,34 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -178992,6 +182876,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -178999,9 +182885,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 
*/ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -179108,6 +182996,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -179144,7 +183034,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -179196,6 +183086,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -179206,6 +183098,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -179240,8 +183136,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -179258,6 +183160,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -179344,6 +183250,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -179362,8 +183270,18 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -179441,9 +183359,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -179466,7 +183384,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { 
/* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ - 1499, /* Number of elements */ + 1551, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -179597,11 +183515,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -179769,7 +183687,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -179779,6 +183697,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -179803,7 +183723,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -179968,10 +183888,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -179991,7 +183909,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -180030,9 +183948,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -180056,8 +183974,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -180140,10 +184056,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -180206,8 +184118,6 @@ static const UV 
UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -180226,10 +184136,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -180419,12 +184333,34 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -180505,6 +184441,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -180512,9 +184450,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -180621,6 +184561,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -180657,7 +184599,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -180709,6 +184651,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -180719,6 +184663,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -180753,8 +184701,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 
1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -180771,6 +184725,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -180857,6 +184815,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -180875,8 +184835,18 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -180954,9 +184924,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -180979,7 +184949,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ - 1495, /* Number of elements */ + 1547, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -181106,11 +185076,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -181278,7 +185248,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -181288,6 +185258,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -181312,7 +185284,7 @@ static const UV 
UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -181477,10 +185449,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -181500,7 +185470,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -181539,9 +185509,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -181565,8 +185535,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -181649,10 +185617,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -181715,8 +185679,6 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -181735,10 +185697,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -181928,12 +185894,34 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -182014,6 +186002,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 
0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -182021,9 +186011,11 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -182130,6 +186122,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -182166,7 +186160,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -182218,6 +186212,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -182228,6 +186224,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -182262,8 +186262,14 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -182280,6 +186286,10 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -182366,6 +186376,8 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -182384,8 +186396,18 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -182463,9 +186485,9 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, 
- 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -182485,7 +186507,7 @@ static const UV UNI__PERL_IDCONT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ - 1263, /* Number of elements */ + 1315, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -182590,10 +186612,12 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -182722,6 +186746,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -182738,7 +186764,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -182881,10 +186907,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -182925,7 +186949,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -183027,10 +187051,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -183091,8 +187111,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -183113,10 +187131,14 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -183308,12 +187330,34 @@ static const UV 
UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -183384,12 +187428,18 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -183472,6 +187522,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -183510,7 +187562,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -183546,6 +187598,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -183554,6 +187608,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -183582,8 +187638,14 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -183658,14 +187720,26 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -183739,9 +187813,9 
@@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -183762,7 +187836,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ - 1289, /* Number of elements */ + 1341, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -183893,10 +187967,12 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -184025,6 +188101,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -184041,7 +188119,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -184184,10 +188262,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -184228,7 +188304,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -184330,10 +188406,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -184394,8 +188466,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -184416,10 +188486,14 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, 
+ 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -184611,12 +188685,34 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -184687,12 +188783,18 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -184775,6 +188877,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -184813,7 +188917,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -184849,6 +188953,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -184857,6 +188963,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -184885,8 +188993,14 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -184961,14 +189075,26 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 
0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -185042,9 +189168,9 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -185065,7 +189191,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ - 1285, /* Number of elements */ + 1337, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -185192,10 +189318,12 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -185324,6 +189452,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -185340,7 +189470,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -185483,10 +189613,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -185527,7 +189655,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -185629,10 +189757,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -185693,8 +189817,6 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -185715,10 +189837,14 @@ static const UV 
UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -185910,12 +190036,34 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -185986,12 +190134,18 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -186074,6 +190228,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -186112,7 +190268,7 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -186148,6 +190304,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -186156,6 +190314,8 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -186184,8 +190344,14 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -186260,14 +190426,26 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 
0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -186341,9 +190519,9 @@ static const UV UNI__PERL_IDSTART_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -186748,7 +190926,7 @@ static const UV UNI__PERL_QUOTEMETA_invlist[] = { /* for ASCII/Latin1 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x2000, 0x203F, 0x2041, @@ -186854,7 +191032,7 @@ static const UV UNI__PERL_QUOTEMETA_invlist[] = { /* for EBCDIC 1047 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x2000, 0x203F, 0x2041, @@ -186958,7 +191136,7 @@ static const UV UNI__PERL_QUOTEMETA_invlist[] = { /* for EBCDIC 037 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x2000, 0x203F, 0x2041, @@ -187004,11 +191182,13 @@ static const UV UNI__PERL_QUOTEMETA_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_ADLM_invlist[] = { /* for all charsets */ - 9, /* Number of elements */ + 11, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, + 0x61F, + 0x620, 0x640, 0x641, 0x1E900, @@ -187507,6 +191687,170 @@ static const UV UNI_AGE__13_invlist[] = { /* for all charsets */ 0x3134B }; +static const UV UNI_AGE__14_invlist[] = { /* for all charsets */ + 157, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x61D, + 0x61E, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8B5, + 0x8B6, + 0x8C8, + 0x8D3, + 0xC3C, + 0xC3D, + 0xC5D, + 0xC5E, + 0xCDD, + 0xCDE, + 0x170D, + 0x170E, + 0x1715, + 0x1716, + 0x171F, + 0x1720, + 0x180F, + 0x1810, + 0x1AC1, + 0x1ACF, + 0x1B4C, + 0x1B4D, + 0x1B7D, + 0x1B7F, + 0x1DFA, + 0x1DFB, + 
0x20C0, + 0x20C1, + 0x2C2F, + 0x2C30, + 0x2C5F, + 0x2C60, + 0x2E53, + 0x2E5E, + 0x9FFD, + 0xA000, + 0xA7C0, + 0xA7C2, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, + 0xA7F5, + 0xFBC2, + 0xFBC3, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, + 0xFDFE, + 0xFE00, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x10F70, + 0x10F8A, + 0x11070, + 0x11076, + 0x110C2, + 0x110C3, + 0x116B9, + 0x116BA, + 0x11740, + 0x11747, + 0x11AB0, + 0x11AC0, + 0x12F90, + 0x12FF3, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, + 0x1B11F, + 0x1B123, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, + 0x1D1E9, + 0x1D1EB, + 0x1DF00, + 0x1DF1F, + 0x1E290, + 0x1E2AF, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, + 0x1F6DD, + 0x1F6E0, + 0x1F7F0, + 0x1F7F1, + 0x1F979, + 0x1F97A, + 0x1F9CC, + 0x1F9CD, + 0x1FA7B, + 0x1FA7D, + 0x1FAA9, + 0x1FAAD, + 0x1FAB7, + 0x1FABB, + 0x1FAC3, + 0x1FAC6, + 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, + 0x2A6DE, + 0x2A6E0, + 0x2B735, + 0x2B739 +}; + static const UV UNI_AGE__2_invlist[] = { /* for all charsets */ 59, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -189792,7 +194136,7 @@ static const UV UNI_AGE__9_invlist[] = { /* for all charsets */ }; static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ - 1372, /* Number of elements */ + 1412, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -189821,8 +194165,6 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -189840,11 +194182,11 @@ static const 
UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -190000,7 +194342,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -190010,6 +194352,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -190032,7 +194376,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -190167,10 +194511,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -190187,8 +194529,6 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -190227,11 +194567,11 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -190247,8 +194587,6 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -190289,7 +194627,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -190303,10 +194641,6 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -190337,7 +194671,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -190361,8 +194695,6 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 
0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -190371,10 +194703,14 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -190445,16 +194781,12 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, - 0xFDD0, - 0xFDFE, - 0xFE00, + 0xFDCF, 0xFE1A, 0xFE20, 0xFE53, @@ -190539,13 +194871,33 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -190632,6 +194984,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -190639,9 +194993,9 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -190725,7 +195079,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -190733,7 +195087,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -190764,7 +195118,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -190820,6 +195174,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 
0x1342F, 0x13430, @@ -190833,7 +195189,9 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -190866,8 +195224,14 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -190884,12 +195248,18 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -190944,6 +195314,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -190962,10 +195334,20 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -191074,7 +195456,7 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -191084,6 +195466,8 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -191097,27 +195481,27 @@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -191125,9 +195509,9 
@@ static const UV UNI_AGE__NA_invlist[] = { /* for all charsets */ 0x1FBF0, 0x1FBFA, 0x1FFFE, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -191193,7 +195577,7 @@ static const UV UNI_AHOM_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740 + 0x11747 }; static const UV UNI_ALCHEMICAL_invlist[] = { /* for all charsets */ @@ -191264,7 +195648,7 @@ static const UV UNI_ANY_invlist[] = { /* for all charsets */ }; static const UV UNI_ARAB_invlist[] = { /* for all charsets */ - 105, /* Number of elements */ + 103, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -191272,31 +195656,29 @@ static const UV UNI_ARAB_invlist[] = { /* for all charsets */ 0x600, 0x605, 0x606, - 0x61D, - 0x61E, 0x6DD, 0x6DE, 0x700, 0x750, 0x780, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8E2, 0x8E3, 0x900, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD3E, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, + 0xFE00, 0xFE70, 0xFE75, 0xFE76, @@ -191385,6 +195767,16 @@ static const UV UNI_ARABICEXTA_invlist[] = { /* for all charsets */ 0x900 }; +static const UV UNI_ARABICEXTB_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x870, + 0x8A0 +}; + static const UV UNI_ARABICMATH_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -191482,9 +195874,9 @@ static const UV UNI_BALI_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D + 0x1B7F }; static const UV UNI_BAMU_invlist[] = { /* for all charsets */ @@ -191564,17 +195956,17 @@ static const UV UNI_BC__AL_invlist[] = { /* for all charsets 
*/ 0x7B1, 0x7C0, 0x860, - 0x870, + 0x890, + 0x892, + 0x898, 0x8A0, - 0x8D3, + 0x8CA, 0xFB50, 0xFD3E, - 0xFD40, - 0xFDD0, + 0xFD50, + 0xFDCF, 0xFDF0, 0xFDFD, - 0xFDFE, - 0xFE00, 0xFE70, 0xFEFF, 0x10D00, @@ -191598,7 +195990,7 @@ static const UV UNI_BC__AL_invlist[] = { /* for all charsets */ }; static const UV UNI_BC__AN_invlist[] = { /* for all charsets */ - 15, /* Number of elements */ + 17, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -191611,6 +196003,8 @@ static const UV UNI_BC__AN_invlist[] = { /* for all charsets */ 0x66D, 0x6DD, 0x6DE, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x10D30, @@ -192489,7 +196883,7 @@ static const UV UNI_BC__FSI_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ - 926, /* Number of elements */ + 942, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -192621,6 +197015,8 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -192728,7 +197124,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -192748,7 +197144,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -192786,7 +197182,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -192832,8 +197228,6 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -192916,7 +197310,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x2D7F, 0x2D80, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 
0x2E9B, @@ -193089,12 +197483,18 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x11047, 0x11052, 0x11066, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -193261,6 +197661,10 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -193269,6 +197673,8 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D300, @@ -193309,6 +197715,8 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FF, @@ -193337,7 +197745,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -193347,6 +197755,8 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -193360,27 +197770,27 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -193429,7 +197839,7 @@ static const UV UNI_BC__L_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ - 952, /* Number of elements */ + 968, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -193587,6 +197997,8 @@ static 
const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -193694,7 +198106,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -193714,7 +198126,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -193752,7 +198164,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -193798,8 +198210,6 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -193882,7 +198292,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x2D7F, 0x2D80, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -194055,12 +198465,18 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x11047, 0x11052, 0x11066, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -194227,6 +198643,10 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -194235,6 +198655,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D300, @@ -194275,6 +198697,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FF, @@ -194303,7 +198727,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -194313,6 +198737,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 
0x1F810, @@ -194326,27 +198752,27 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -194395,7 +198821,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ - 948, /* Number of elements */ + 964, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -194549,6 +198975,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -194656,7 +199084,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -194676,7 +199104,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x17F0, 0x17FA, 0x1800, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -194714,7 +199142,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -194760,8 +199188,6 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -194844,7 +199270,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x2D7F, 0x2D80, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -195017,12 +199443,18 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x11047, 0x11052, 0x11066, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 
0x110C3, 0x11100, 0x11103, 0x11127, @@ -195189,6 +199621,10 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -195197,6 +199633,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D300, @@ -195237,6 +199675,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E2FF, @@ -195265,7 +199705,7 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -195275,6 +199715,8 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -195288,27 +199730,27 @@ static const UV UNI_BC__L_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -195382,7 +199824,7 @@ static const UV UNI_BC__LRO_invlist[] = { /* for all charsets */ }; static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ - 645, /* Number of elements */ + 663, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -195435,7 +199877,9 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -195517,6 +199961,8 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ 
-195612,7 +200058,7 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -195629,6 +200075,8 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -195660,7 +200108,7 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -195706,8 +200154,6 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x20D0, 0x20F1, @@ -195821,16 +200267,24 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -195989,6 +200443,10 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x16FE5, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D17B, @@ -196023,6 +200481,8 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -196036,7 +200496,7 @@ static const UV UNI_BC__NSM_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ - 377, /* Number of elements */ + 383, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -196204,7 +200664,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0x2CF9, 0x2D00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -196268,9 +200728,11 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0xAB6A, 0xAB6C, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 
0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -196327,6 +200789,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0x11FF2, 0x16FE2, 0x16FE3, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -196369,7 +200833,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -196379,6 +200843,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -196392,27 +200858,27 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -196427,7 +200893,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ - 385, /* Number of elements */ + 391, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -196603,7 +201069,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ 0x2CF9, 0x2D00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -196667,9 +201133,11 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ 0xAB6A, 0xAB6C, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -196726,6 +201194,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ 0x11FF2, 0x16FE2, 0x16FE3, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -196768,7 +201238,7 @@ static const UV UNI_BC__ON_invlist[] = 
{ /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -196778,6 +201248,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -196791,27 +201263,27 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -196826,7 +201298,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ - 381, /* Number of elements */ + 387, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -196998,7 +201470,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0x2CF9, 0x2D00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -197062,9 +201534,11 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0xAB6A, 0xAB6C, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -197121,6 +201595,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0x11FF2, 0x16FE2, 0x16FE3, + 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -197163,7 +201639,7 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -197173,6 +201649,8 @@ static const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -197186,27 +201664,27 @@ static 
const UV UNI_BC__ON_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -197271,8 +201749,6 @@ static const UV UNI_BC__R_invlist[] = { /* for all charsets */ 0x859, 0x85C, 0x860, - 0x870, - 0x8A0, 0x200F, 0x2010, 0xFB1D, @@ -197306,6 +201782,8 @@ static const UV UNI_BC__R_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F30, 0x10F70, + 0x10F82, + 0x10F86, 0x11000, 0x1E800, 0x1E8D0, @@ -197590,7 +202068,7 @@ static const UV UNI_BIDIC_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BIDIM_invlist[] = { /* for ASCII/Latin1 */ - 227, /* Number of elements */ + 229, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -197785,6 +202263,8 @@ static const UV UNI_BIDIM_invlist[] = { /* for ASCII/Latin1 */ 0x2E1E, 0x2E20, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -197831,7 +202311,7 @@ static const UV UNI_BIDIM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BIDIM_invlist[] = { /* for EBCDIC 1047 */ - 225, /* Number of elements */ + 227, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198024,6 +202504,8 @@ static const UV UNI_BIDIM_invlist[] = { /* for EBCDIC 1047 */ 0x2E1E, 0x2E20, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -198070,7 +202552,7 @@ static const UV UNI_BIDIM_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BIDIM_invlist[] = { /* 
for EBCDIC 037 */ - 223, /* Number of elements */ + 225, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198261,6 +202743,8 @@ static const UV UNI_BIDIM_invlist[] = { /* for EBCDIC 037 */ 0x2E1E, 0x2E20, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -198366,7 +202850,7 @@ static const UV UNI_BOXDRAWING_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BPT__C_invlist[] = { /* for ASCII/Latin1 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198457,6 +202941,14 @@ static const UV UNI_BPT__C_invlist[] = { /* for ASCII/Latin1 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -198501,7 +202993,7 @@ static const UV UNI_BPT__C_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 1047 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198592,6 +203084,14 @@ static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 1047 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -198636,7 +203136,7 @@ static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 037 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198727,6 +203227,14 @@ 
static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 037 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -198768,7 +203276,7 @@ static const UV UNI_BPT__C_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BPT__N_invlist[] = { /* for ASCII/Latin1 */ - 59, /* Number of elements */ + 61, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198811,6 +203319,8 @@ static const UV UNI_BPT__N_invlist[] = { /* for ASCII/Latin1 */ 0x29FE, 0x2E22, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -198841,7 +203351,7 @@ static const UV UNI_BPT__N_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 1047 */ - 61, /* Number of elements */ + 63, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198886,6 +203396,8 @@ static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 1047 */ 0x29FE, 0x2E22, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -198916,7 +203428,7 @@ static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 037 */ - 59, /* Number of elements */ + 61, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -198959,6 +203471,8 @@ static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 037 */ 0x29FE, 0x2E22, 0x2E2A, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -198986,7 +203500,7 @@ static const UV UNI_BPT__N_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_BPT__O_invlist[] = { /* for 
ASCII/Latin1 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -199077,6 +203591,14 @@ static const UV UNI_BPT__O_invlist[] = { /* for ASCII/Latin1 */ 0x2E27, 0x2E28, 0x2E29, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -199121,7 +203643,7 @@ static const UV UNI_BPT__O_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_BPT__O_invlist[] = { /* for EBCDIC 1047 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -199212,6 +203734,14 @@ static const UV UNI_BPT__O_invlist[] = { /* for EBCDIC 1047 */ 0x2E27, 0x2E28, 0x2E29, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -199256,7 +203786,7 @@ static const UV UNI_BPT__O_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_BPT__O_invlist[] = { /* for EBCDIC 037 */ - 121, /* Number of elements */ + 129, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -199347,6 +203877,14 @@ static const UV UNI_BPT__O_invlist[] = { /* for EBCDIC 037 */ 0x2E27, 0x2E28, 0x2E29, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -199394,7 +203932,7 @@ static const UV UNI_BRAH_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x11080 }; @@ -199448,7 +203986,7 @@ static const UV UNI_BYZANTINEMUSIC_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ - 
1357, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -199483,7 +204021,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x5F5, 0x606, 0x61C, - 0x61E, + 0x61D, 0x6DD, 0x6DE, 0x70E, @@ -199503,11 +204041,9 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x984, @@ -199665,7 +204201,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -199675,6 +204211,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -199697,7 +204235,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -199832,10 +204370,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -199853,7 +204389,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x17FA, 0x1800, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -199892,11 +204428,11 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -199912,8 +204448,6 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -199958,7 +204492,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -199972,10 +204506,6 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 
0x2D26, @@ -200006,7 +204536,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -200030,8 +204560,6 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -200040,10 +204568,14 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -200114,16 +204646,14 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -200208,13 +204738,33 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -200301,6 +204851,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -200308,11 +204860,11 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BD, 0x110BE, - 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -200394,7 +204946,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -200402,7 +204954,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -200433,7 +204985,7 @@ static const UV 
UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -200489,6 +205041,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -200500,7 +205054,9 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -200533,8 +205089,14 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -200551,6 +205113,12 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9C, 0x1BCA0, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -200558,7 +205126,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1D129, 0x1D173, 0x1D17B, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -200613,6 +205181,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -200631,10 +205201,20 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -200743,7 +205323,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -200753,6 +205333,8 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -200766,27 +205348,27 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 
0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -200794,9 +205376,9 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -200819,7 +205401,7 @@ static const UV UNI_C_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ - 1357, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -200854,7 +205436,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x5F5, 0x606, 0x61C, - 0x61E, + 0x61D, 0x6DD, 0x6DE, 0x70E, @@ -200874,11 +205456,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x984, @@ -201036,7 +205616,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -201046,6 +205626,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -201068,7 +205650,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -201203,10 +205785,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -201224,7 +205804,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x17FA, 0x1800, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ 
-201263,11 +205843,11 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -201283,8 +205863,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -201329,7 +205907,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -201343,10 +205921,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -201377,7 +205951,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -201401,8 +205975,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -201411,10 +205983,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -201485,16 +206061,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -201579,13 +206153,33 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -201672,6 +206266,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 
1047 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -201679,11 +206275,11 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BD, 0x110BE, - 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -201765,7 +206361,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -201773,7 +206369,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -201804,7 +206400,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -201860,6 +206456,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -201871,7 +206469,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -201904,8 +206504,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -201922,6 +206528,12 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9C, 0x1BCA0, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -201929,7 +206541,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1D129, 0x1D173, 0x1D17B, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -201984,6 +206596,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -202002,10 +206616,20 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E150, + 
0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -202114,7 +206738,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -202124,6 +206748,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -202137,27 +206763,27 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -202165,9 +206791,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -202190,7 +206816,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ - 1357, /* Number of elements */ + 1401, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -202225,7 +206851,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x5F5, 0x606, 0x61C, - 0x61E, + 0x61D, 0x6DD, 0x6DE, 0x70E, @@ -202245,11 +206871,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x984, @@ -202407,7 +207031,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, 
@@ -202417,6 +207041,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -202439,7 +207065,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -202574,10 +207200,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -202595,7 +207219,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x17FA, 0x1800, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -202634,11 +207258,11 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -202654,8 +207278,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -202700,7 +207322,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -202714,10 +207336,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -202748,7 +207366,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -202772,8 +207390,6 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -202782,10 +207398,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -202856,16 +207476,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 
0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -202950,13 +207568,33 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -203043,6 +207681,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -203050,11 +207690,11 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BD, 0x110BE, - 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -203136,7 +207776,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -203144,7 +207784,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -203175,7 +207815,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -203231,6 +207871,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -203242,7 +207884,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -203275,8 +207919,14 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -203293,6 +207943,12 @@ 
static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9C, 0x1BCA0, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -203300,7 +207956,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1D129, 0x1D173, 0x1D17B, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -203355,6 +208011,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -203373,10 +208031,20 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -203485,7 +208153,7 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -203495,6 +208163,8 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -203508,27 +208178,27 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -203536,9 +208206,9 @@ static const UV UNI_C_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -203572,7 +208242,7 @@ static const UV UNI_CAKM_invlist[] = { /* for all charsets */ }; static const UV UNI_CANS_invlist[] = { /* for all charsets */ - 5, /* Number of elements */ + 7, /* Number of elements */ 148565664, /* Version and data structure type */ 1, 
/* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -203580,7 +208250,9 @@ static const UV UNI_CANS_invlist[] = { /* for all charsets */ 0x1400, 0x1680, 0x18B0, - 0x18F6 + 0x18F6, + 0x11AB0, + 0x11AC0 }; static const UV UNI_CARI_invlist[] = { /* for all charsets */ @@ -203594,7 +208266,7 @@ static const UV UNI_CARI_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ - 369, /* Number of elements */ + 377, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -203647,7 +208319,9 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x900, @@ -203677,6 +208351,8 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0xB4E, 0xBCD, 0xBCE, + 0xC3C, + 0xC3D, 0xC4D, 0xC4E, 0xC55, @@ -203730,7 +208406,7 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x135D, 0x1360, 0x1714, - 0x1715, + 0x1716, 0x1734, 0x1735, 0x17D2, @@ -203752,7 +208428,7 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B34, 0x1B35, 0x1B44, @@ -203780,8 +208456,6 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x20D0, 0x20DD, @@ -203863,8 +208537,12 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11046, 0x11047, + 0x11070, + 0x11071, 0x1107F, 0x11080, 0x110B9, @@ -203961,6 +208639,8 @@ static const UV UNI_CCC__0_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -204408,7 +209088,7 @@ static const UV UNI_CCC__6_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__7_invlist[] = { /* for all charsets */ - 51, /* Number of elements */ + 53, /* 
Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -204423,6 +209103,8 @@ static const UV UNI_CCC__7_invlist[] = { /* for all charsets */ 0xABD, 0xB3C, 0xB3D, + 0xC3C, + 0xC3D, 0xCBC, 0xCBD, 0x1037, @@ -204486,7 +209168,7 @@ static const UV UNI_CCC__84_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__9_invlist[] = { /* for all charsets */ - 109, /* Number of elements */ + 111, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -204522,7 +209204,7 @@ static const UV UNI_CCC__9_invlist[] = { /* for all charsets */ 0x1039, 0x103B, 0x1714, - 0x1715, + 0x1716, 0x1734, 0x1735, 0x17D2, @@ -204555,6 +209237,8 @@ static const UV UNI_CCC__9_invlist[] = { /* for all charsets */ 0x10A40, 0x11046, 0x11047, + 0x11070, + 0x11071, 0x1107F, 0x11080, 0x110B9, @@ -204612,7 +209296,7 @@ static const UV UNI_CCC__91_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__A_invlist[] = { /* for all charsets */ - 237, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -204699,6 +209383,12 @@ static const UV UNI_CCC__A_invlist[] = { /* for all charsets */ 0x828, 0x829, 0x82E, + 0x898, + 0x899, + 0x89C, + 0x8A0, + 0x8CA, + 0x8CF, 0x8D4, 0x8E2, 0x8E4, @@ -204737,6 +209427,12 @@ static const UV UNI_CCC__A_invlist[] = { /* for all charsets */ 0x1AB5, 0x1ABB, 0x1ABD, + 0x1AC1, + 0x1AC3, + 0x1AC5, + 0x1ACA, + 0x1ACB, + 0x1ACF, 0x1B6B, 0x1B6C, 0x1B6D, @@ -204821,6 +209517,10 @@ static const UV UNI_CCC__A_invlist[] = { /* for all charsets */ 0x10F4B, 0x10F4C, 0x10F4D, + 0x10F82, + 0x10F83, + 0x10F84, + 0x10F85, 0x11100, 0x11103, 0x11366, @@ -204849,6 +209549,8 @@ static const UV UNI_CCC__A_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 
0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E944, @@ -204890,7 +209592,7 @@ static const UV UNI_CCC__AR_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__B_invlist[] = { /* for all charsets */ - 157, /* Number of elements */ + 167, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -204961,7 +209663,9 @@ static const UV UNI_CCC__B_invlist[] = { /* for all charsets */ 0x7FE, 0x859, 0x85C, - 0x8D3, + 0x899, + 0x89C, + 0x8CF, 0x8D4, 0x8E3, 0x8E4, @@ -204999,6 +209703,10 @@ static const UV UNI_CCC__B_invlist[] = { /* for all charsets */ 0x1ABE, 0x1ABF, 0x1AC1, + 0x1AC3, + 0x1AC5, + 0x1ACA, + 0x1ACB, 0x1B6C, 0x1B6D, 0x1CD5, @@ -205045,6 +209753,10 @@ static const UV UNI_CCC__B_invlist[] = { /* for all charsets */ 0x10F4C, 0x10F4D, 0x10F51, + 0x10F83, + 0x10F84, + 0x10F85, + 0x10F86, 0x1D17B, 0x1D183, 0x1D18A, @@ -205054,11 +209766,13 @@ static const UV UNI_CCC__B_invlist[] = { /* for all charsets */ }; static const UV UNI_CCC__BL_invlist[] = { /* for all charsets */ - 3, /* Number of elements */ + 5, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, + 0x1DFA, + 0x1DFB, 0x302A, 0x302B }; @@ -205216,7 +209930,7 @@ static const UV UNI_CE_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CF_invlist[] = { /* for ASCII/Latin1 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -205231,6 +209945,8 @@ static const UV UNI_CF_invlist[] = { /* for ASCII/Latin1 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -205271,7 +209987,7 @@ static const UV UNI_CF_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV 
UNI_CF_invlist[] = { /* for EBCDIC 1047 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -205286,6 +210002,8 @@ static const UV UNI_CF_invlist[] = { /* for EBCDIC 1047 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -205326,7 +210044,7 @@ static const UV UNI_CF_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CF_invlist[] = { /* for EBCDIC 037 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -205341,6 +210059,8 @@ static const UV UNI_CF_invlist[] = { /* for EBCDIC 037 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -205438,7 +210158,7 @@ static const UV UNI_CHRS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ - 821, /* Number of elements */ + 855, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -205527,7 +210247,13 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x888, + 0x889, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8C9, 0x903, 0x93A, 0x93B, @@ -205609,6 +210335,8 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -205712,7 +210440,7 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -205730,7 +210458,7 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1843, 0x1844, 0x1885, @@ -205766,7 +210494,7 @@ static const UV UNI_CI_invlist[] = { /* for 
ASCII/Latin1 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -205818,8 +210546,6 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x1D78, 0x1D79, 0x1D9B, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -205901,6 +210627,8 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0xA771, 0xA788, 0xA78B, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xA802, @@ -205980,7 +210708,7 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0xFB1E, 0xFB1F, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFE00, 0xFE10, 0xFE13, @@ -206017,6 +210745,12 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x102E1, 0x10376, 0x1037B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10A01, 0x10A04, 0x10A05, @@ -206035,10 +210769,16 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, @@ -206047,6 +210787,8 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -206211,10 +210953,20 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x16FE2, 0x16FE3, 0x16FE5, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC9D, 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -206249,6 +211001,8 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E13E, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -206273,7 +211027,7 @@ static const UV UNI_CI_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ - 819, /* Number of elements */ + 853, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ 
-206360,7 +211114,13 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x888, + 0x889, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8C9, 0x903, 0x93A, 0x93B, @@ -206442,6 +211202,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -206545,7 +211307,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -206563,7 +211325,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1843, 0x1844, 0x1885, @@ -206599,7 +211361,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -206651,8 +211413,6 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x1D78, 0x1D79, 0x1D9B, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -206734,6 +211494,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0xA771, 0xA788, 0xA78B, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xA802, @@ -206813,7 +211575,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0xFB1E, 0xFB1F, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFE00, 0xFE10, 0xFE13, @@ -206850,6 +211612,12 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x102E1, 0x10376, 0x1037B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10A01, 0x10A04, 0x10A05, @@ -206868,10 +211636,16 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, @@ -206880,6 +211654,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -207044,10 +211820,20 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x16FE2, 0x16FE3, 0x16FE5, + 0x1AFF0, + 
0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC9D, 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -207082,6 +211868,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E13E, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -207106,7 +211894,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ - 817, /* Number of elements */ + 851, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -207191,7 +211979,13 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x888, + 0x889, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8C9, 0x903, 0x93A, 0x93B, @@ -207273,6 +212067,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -207376,7 +212172,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -207394,7 +212190,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1843, 0x1844, 0x1885, @@ -207430,7 +212226,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x1AA7, 0x1AA8, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -207482,8 +212278,6 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x1D78, 0x1D79, 0x1D9B, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1FBD, 0x1FBE, @@ -207565,6 +212359,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0xA771, 0xA788, 0xA78B, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xA802, @@ -207644,7 +212440,7 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0xFB1E, 0xFB1F, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFE00, 0xFE10, 0xFE13, @@ -207681,6 +212477,12 @@ static 
const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x102E1, 0x10376, 0x1037B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10A01, 0x10A04, 0x10A05, @@ -207699,10 +212501,16 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, @@ -207711,6 +212519,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -207875,10 +212685,20 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x16FE2, 0x16FE3, 0x16FE5, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC9D, 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -207913,6 +212733,8 @@ static const UV UNI_CI_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E13E, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -208082,7 +212904,7 @@ static const UV UNI_CJKSYMBOLS_invlist[] = { /* for all charsets */ }; static const UV UNI_CN_invlist[] = { /* for all charsets */ - 1354, /* Number of elements */ + 1396, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -208111,8 +212933,6 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -208130,11 +212950,11 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -208290,7 +213110,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -208300,6 +213120,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 
0xC5E, 0xC60, 0xC64, 0xC66, @@ -208322,7 +213144,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -208457,10 +213279,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -208477,8 +213297,6 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -208517,11 +213335,11 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -208537,8 +213355,6 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -208579,7 +213395,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -208593,10 +213409,6 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -208627,7 +213439,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -208651,8 +213463,6 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -208661,10 +213471,14 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -208735,16 +213549,14 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 
0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -208831,13 +213643,33 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -208924,6 +213756,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -208931,9 +213765,9 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -209017,7 +213851,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -209025,7 +213859,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -209056,7 +213890,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -209112,6 +213946,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -209125,7 +213961,9 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -209158,8 +213996,14 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -209176,12 +214020,18 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1BC9A, 
0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -209236,6 +214086,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -209254,10 +214106,20 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -209366,7 +214228,7 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -209376,6 +214238,8 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -209389,27 +214253,27 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -209417,9 +214281,9 @@ static const UV UNI_CN_invlist[] = { /* for all charsets */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -209666,6 +214530,18 @@ static const UV UNI_COUNTINGROD_invlist[] = { /* for all charsets */ 0x1D380 }; +static const UV UNI_CPMN_invlist[] = { /* for all charsets */ + 5, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10100, + 0x10102, + 0x12F90, + 0x12FF3 +}; + static const UV 
UNI_CPRT_invlist[] = { /* for all charsets */ 19, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -209715,7 +214591,7 @@ static const UV UNI_CURRENCYSYMBOLS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWCF_invlist[] = { /* for ASCII/Latin1 */ - 1229, /* Number of elements */ + 1245, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -210591,7 +215467,7 @@ static const UV UNI_CWCF_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -210920,12 +215796,20 @@ static const UV UNI_CWCF_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -210940,6 +215824,14 @@ static const UV UNI_CWCF_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -210958,7 +215850,7 @@ static const UV UNI_CWCF_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 1047 */ - 1249, /* Number of elements */ + 1265, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -211854,7 +216746,7 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -212183,12 +217075,20 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -212203,6 +217103,14 
@@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -212221,7 +217129,7 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 037 */ - 1245, /* Number of elements */ + 1261, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -213113,7 +218021,7 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -213442,12 +218350,20 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xAB70, @@ -213462,6 +218378,14 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -213477,7 +218401,7 @@ static const UV UNI_CWCF_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWCM_invlist[] = { /* for ASCII/Latin1 */ - 249, /* Number of elements */ + 263, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -213659,10 +218583,6 @@ static const UV UNI_CWCM_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -213697,9 +218617,11 @@ static const UV UNI_CWCM_invlist[] = { /* for ASCII/Latin1 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ 
-213720,6 +218642,22 @@ static const UV UNI_CWCM_invlist[] = { /* for ASCII/Latin1 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -213740,7 +218678,7 @@ static const UV UNI_CWCM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 1047 */ - 281, /* Number of elements */ + 295, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -213954,10 +218892,6 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -213992,9 +218926,11 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 1047 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ -214015,6 +218951,22 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 1047 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -214035,7 +218987,7 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 037 */ - 277, /* Number of elements */ + 291, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -214245,10 +219197,6 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2C71, 0x2C72, 0x2C74, @@ -214283,9 +219231,11 @@ 
static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 037 */ 0xA796, 0xA7AF, 0xA7B0, - 0xA7C0, - 0xA7C2, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D6, + 0xA7DA, 0xA7F5, 0xA7F7, 0xAB53, @@ -214306,6 +219256,22 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 037 */ 0x104D4, 0x104D8, 0x104FC, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10C80, 0x10CB3, 0x10CC0, @@ -214323,7 +219289,7 @@ static const UV UNI_CWCM_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ - 1655, /* Number of elements */ + 1677, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -214969,7 +219935,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x1C80, 0x1C89, 0x1C90, @@ -215371,7 +220337,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ 0x2ADC, 0x2ADD, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -215736,13 +220702,21 @@ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, - 0xA7F5, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7F2, 0xA7F6, 0xA7F8, 0xA7FA, @@ -215834,6 +220808,20 @@ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x118A0, @@ -215992,7 +220980,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ - 1665, /* Number of 
elements */ + 1687, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -216648,7 +221636,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x1C80, 0x1C89, 0x1C90, @@ -217050,7 +222038,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ 0x2ADC, 0x2ADD, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -217415,13 +222403,21 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, - 0xA7F5, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7F2, 0xA7F6, 0xA7F8, 0xA7FA, @@ -217513,6 +222509,20 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x118A0, @@ -217671,7 +222681,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ - 1663, /* Number of elements */ + 1685, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -218325,7 +223335,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x1C80, 0x1C89, 0x1C90, @@ -218727,7 +223737,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ 0x2ADC, 0x2ADD, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -219092,13 +224102,21 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, - 0xA7F5, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, 
+ 0xA7D8, + 0xA7D9, + 0xA7F2, 0xA7F6, 0xA7F8, 0xA7FA, @@ -219190,6 +224208,20 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10C80, 0x10CB3, 0x118A0, @@ -219345,7 +224377,7 @@ static const UV UNI_CWKCF_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWL_invlist[] = { /* for ASCII/Latin1 */ - 1203, /* Number of elements */ + 1219, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -220201,7 +225233,7 @@ static const UV UNI_CWL_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -220530,12 +225562,20 @@ static const UV UNI_CWL_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -220544,6 +225584,14 @@ static const UV UNI_CWL_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -220562,7 +225610,7 @@ static const UV UNI_CWL_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWL_invlist[] = { /* for EBCDIC 1047 */ - 1221, /* Number of elements */ + 1237, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -221436,7 +226484,7 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -221765,12 +226813,20 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 
1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -221779,6 +226835,14 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -221797,7 +226861,7 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWL_invlist[] = { /* for EBCDIC 037 */ - 1217, /* Number of elements */ + 1233, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -222667,7 +227731,7 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -222996,12 +228060,20 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -223010,6 +228082,14 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -223025,7 +228105,7 @@ static const UV UNI_CWL_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWT_invlist[] = { /* for ASCII/Latin1 */ - 1237, /* Number of elements */ + 1253, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -223907,7 +228987,7 @@ static const UV UNI_CWT_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -224236,12 +229316,20 @@ 
static const UV UNI_CWT_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -224258,6 +229346,14 @@ static const UV UNI_CWT_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -224276,7 +229372,7 @@ static const UV UNI_CWT_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWT_invlist[] = { /* for EBCDIC 1047 */ - 1251, /* Number of elements */ + 1267, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -225172,7 +230268,7 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -225501,12 +230597,20 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -225523,6 +230627,14 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -225541,7 +230653,7 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWT_invlist[] = { /* for EBCDIC 037 */ - 1251, /* Number of elements */ + 1267, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -226437,7 +231549,7 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 
0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -226766,12 +231878,20 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -226788,6 +231908,14 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -226803,7 +231931,7 @@ static const UV UNI_CWT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_CWU_invlist[] = { /* for ASCII/Latin1 */ - 1239, /* Number of elements */ + 1255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -227687,7 +232815,7 @@ static const UV UNI_CWU_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -228016,12 +233144,20 @@ static const UV UNI_CWU_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -228038,6 +233174,14 @@ static const UV UNI_CWU_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -228056,7 +233200,7 @@ static const UV UNI_CWU_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_CWU_invlist[] = { /* for EBCDIC 1047 */ - 1253, /* Number of elements */ + 1269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -228954,7 +234098,7 @@ static const UV 
UNI_CWU_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -229283,12 +234427,20 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -229305,6 +234457,14 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -229323,7 +234483,7 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_CWU_invlist[] = { /* for EBCDIC 037 */ - 1253, /* Number of elements */ + 1269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -230221,7 +235381,7 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -230550,12 +235710,20 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xAB53, @@ -230572,6 +235740,14 @@ static const UV UNI_CWU_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10CC0, 0x10CF3, 0x118C0, @@ -230663,7 +235839,7 @@ static const UV UNI_CYRL_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_DASH_invlist[] = { /* for ASCII/Latin1 */ - 45, /* Number of elements */ + 47, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element 
beyond 0 */ @@ -230696,6 +235872,8 @@ static const UV UNI_DASH_invlist[] = { /* for ASCII/Latin1 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -230722,7 +235900,7 @@ static const UV UNI_DASH_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_DASH_invlist[] = { /* for EBCDIC 1047 */ - 45, /* Number of elements */ + 47, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -230755,6 +235933,8 @@ static const UV UNI_DASH_invlist[] = { /* for EBCDIC 1047 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -230781,7 +235961,7 @@ static const UV UNI_DASH_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_DASH_invlist[] = { /* for EBCDIC 037 */ - 45, /* Number of elements */ + 47, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -230814,6 +235994,8 @@ static const UV UNI_DASH_invlist[] = { /* for EBCDIC 037 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -230909,7 +236091,7 @@ static const UV UNI_DI_invlist[] = { /* for ASCII/Latin1 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x2010, 0x202A, @@ -230958,7 +236140,7 @@ static const UV UNI_DI_invlist[] = { /* for EBCDIC 1047 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x2010, 0x202A, @@ -231007,7 +236189,7 @@ static const UV UNI_DI_invlist[] = { /* for EBCDIC 037 */ 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x2010, 0x202A, @@ -231037,7 +236219,7 @@ static const UV UNI_DI_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ - 353, /* Number of elements */ + 385, /* Number of elements */ 148565664, /* Version and data structure 
type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -231098,6 +236280,10 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x7F6, 0x818, 0x81A, + 0x898, + 0x8A0, + 0x8C9, + 0x8D3, 0x8E3, 0x8FF, 0x93C, @@ -231130,6 +236316,8 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0xB56, 0xBCD, 0xBCE, + 0xC3C, + 0xC3D, 0xC4D, 0xC4E, 0xCBC, @@ -231182,6 +236370,8 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x109C, 0x135D, 0x1360, + 0x1714, + 0x1716, 0x17C9, 0x17D4, 0x17DD, @@ -231193,7 +236383,9 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1ABE, + 0x1ABF, + 0x1AC1, + 0x1ACC, 0x1B34, 0x1B35, 0x1B44, @@ -231219,8 +236411,6 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x1DC4, 0x1DD0, 0x1DF5, - 0x1DFA, - 0x1DFD, 0x1E00, 0x1FBD, 0x1FBE, @@ -231302,12 +236492,24 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0xFFE4, 0x102E0, 0x102E1, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10AE5, 0x10AE7, 0x10D22, 0x10D28, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, + 0x11046, + 0x11047, + 0x11070, + 0x11071, 0x110B9, 0x110BB, 0x11133, @@ -231374,6 +236576,16 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x16FA0, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D16D, @@ -231386,6 +236598,8 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ 0x1D1AE, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -231404,7 +236618,7 @@ static const UV UNI_DIA_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ - 353, /* Number of elements */ + 385, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the 
element beyond 0 */ @@ -231465,6 +236679,10 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x7F6, 0x818, 0x81A, + 0x898, + 0x8A0, + 0x8C9, + 0x8D3, 0x8E3, 0x8FF, 0x93C, @@ -231497,6 +236715,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0xB56, 0xBCD, 0xBCE, + 0xC3C, + 0xC3D, 0xC4D, 0xC4E, 0xCBC, @@ -231549,6 +236769,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x109C, 0x135D, 0x1360, + 0x1714, + 0x1716, 0x17C9, 0x17D4, 0x17DD, @@ -231560,7 +236782,9 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1ABE, + 0x1ABF, + 0x1AC1, + 0x1ACC, 0x1B34, 0x1B35, 0x1B44, @@ -231586,8 +236810,6 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x1DC4, 0x1DD0, 0x1DF5, - 0x1DFA, - 0x1DFD, 0x1E00, 0x1FBD, 0x1FBE, @@ -231669,12 +236891,24 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0xFFE4, 0x102E0, 0x102E1, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10AE5, 0x10AE7, 0x10D22, 0x10D28, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, + 0x11046, + 0x11047, + 0x11070, + 0x11071, 0x110B9, 0x110BB, 0x11133, @@ -231741,6 +236975,16 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x16FA0, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D16D, @@ -231753,6 +236997,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ 0x1D1AE, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -231771,7 +237017,7 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ - 351, /* Number of elements */ + 383, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -231830,6 +237076,10 @@ static const UV 
UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x7F6, 0x818, 0x81A, + 0x898, + 0x8A0, + 0x8C9, + 0x8D3, 0x8E3, 0x8FF, 0x93C, @@ -231862,6 +237112,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0xB56, 0xBCD, 0xBCE, + 0xC3C, + 0xC3D, 0xC4D, 0xC4E, 0xCBC, @@ -231914,6 +237166,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x109C, 0x135D, 0x1360, + 0x1714, + 0x1716, 0x17C9, 0x17D4, 0x17DD, @@ -231925,7 +237179,9 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1ABE, + 0x1ABF, + 0x1AC1, + 0x1ACC, 0x1B34, 0x1B35, 0x1B44, @@ -231951,8 +237207,6 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x1DC4, 0x1DD0, 0x1DF5, - 0x1DFA, - 0x1DFD, 0x1E00, 0x1FBD, 0x1FBE, @@ -232034,12 +237288,24 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0xFFE4, 0x102E0, 0x102E1, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10AE5, 0x10AE7, 0x10D22, 0x10D28, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, + 0x11046, + 0x11047, + 0x11070, + 0x11071, 0x110B9, 0x110BB, 0x11133, @@ -232106,6 +237372,16 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x16FA0, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D16D, @@ -232118,6 +237394,8 @@ static const UV UNI_DIA_invlist[] = { /* for EBCDIC 037 */ 0x1D1AE, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -235199,7 +240477,7 @@ static const UV UNI_DT__NB_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_DT__NONCANON_invlist[] = { /* for ASCII/Latin1 */ - 375, /* Number of elements */ + 383, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -235398,6 +240676,8 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 
0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -235450,6 +240730,12 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for ASCII/Latin1 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D400, 0x1D455, 0x1D456, @@ -235588,7 +240874,7 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 1047 */ - 381, /* Number of elements */ + 389, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -235793,6 +241079,8 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -235845,6 +241133,12 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D400, 0x1D455, 0x1D456, @@ -235983,7 +241277,7 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 037 */ - 379, /* Number of elements */ + 387, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -236186,6 +241480,8 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -236238,6 +241534,12 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D400, 0x1D455, 0x1D456, @@ -236373,7 +241675,7 @@ static const UV UNI_DT__NONCANON_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_DT__NONE_invlist[] = { /* for 
ASCII/Latin1 */ - 785, /* Number of elements */ + 793, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -236928,6 +242230,8 @@ static const UV UNI_DT__NONE_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -237010,6 +242314,12 @@ static const UV UNI_DT__NONE_invlist[] = { /* for ASCII/Latin1 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -237172,7 +242482,7 @@ static const UV UNI_DT__NONE_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 1047 */ - 783, /* Number of elements */ + 791, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -237725,6 +243035,8 @@ static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -237807,6 +243119,12 @@ static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -237969,7 +243287,7 @@ static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 037 */ - 785, /* Number of elements */ + 793, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -238524,6 +243842,8 @@ static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -238606,6 +243926,12 @@ static const UV UNI_DT__NONE_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 
0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -238821,7 +244147,7 @@ static const UV UNI_DT__SUB_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_DT__SUP_invlist[] = { /* for ASCII/Latin1 */ - 51, /* Number of elements */ + 59, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -238868,12 +244194,20 @@ static const UV UNI_DT__SUP_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, 0xAB60, 0xAB69, 0xAB6A, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1F16A, 0x1F16D }; @@ -238886,7 +244220,7 @@ static const UV UNI_DT__SUP_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_DT__SUP_invlist[] = { /* for EBCDIC 1047 */ - 53, /* Number of elements */ + 61, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -238935,12 +244269,20 @@ static const UV UNI_DT__SUP_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, 0xAB60, 0xAB69, 0xAB6A, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1F16A, 0x1F16D }; @@ -238953,7 +244295,7 @@ static const UV UNI_DT__SUP_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_DT__SUP_invlist[] = { /* for EBCDIC 037 */ - 53, /* Number of elements */ + 61, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -239002,12 +244344,20 @@ static const UV UNI_DT__SUP_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, 0xAB60, 0xAB69, 0xAB6A, 
+ 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1F16A, 0x1F16D }; @@ -240211,7 +245561,7 @@ static const UV UNI_EA__H_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_EA__N_invlist[] = { /* for ASCII/Latin1 */ - 553, /* Number of elements */ + 563, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -240654,8 +246004,14 @@ static const UV UNI_EA__N_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -240728,36 +246084,40 @@ static const UV UNI_EA__N_invlist[] = { /* for ASCII/Latin1 */ 0x1F6D3, 0x1F6D5, 0x1F6D8, + 0x1F6DD, + 0x1F6E0, 0x1F6EB, 0x1F6ED, 0x1F6F4, 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x20000, 0x2FFFE, 0x30000, @@ -240778,7 +246138,7 @@ static const UV UNI_EA__N_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 1047 */ - 551, /* Number of elements */ + 561, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -241219,8 +246579,14 @@ static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -241293,36 +246659,40 @@ static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 1047 
*/ 0x1F6D3, 0x1F6D5, 0x1F6D8, + 0x1F6DD, + 0x1F6E0, 0x1F6EB, 0x1F6ED, 0x1F6F4, 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x20000, 0x2FFFE, 0x30000, @@ -241343,7 +246713,7 @@ static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 037 */ - 551, /* Number of elements */ + 561, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -241784,8 +247154,14 @@ static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -241858,36 +247234,40 @@ static const UV UNI_EA__N_invlist[] = { /* for EBCDIC 037 */ 0x1F6D3, 0x1F6D5, 0x1F6D8, + 0x1F6DD, + 0x1F6E0, 0x1F6EB, 0x1F6ED, 0x1F6F4, 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x20000, 0x2FFFE, 0x30000, @@ -242029,7 +247409,7 @@ static const UV UNI_EA__NA_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_EA__W_invlist[] = { /* for all charsets */ - 229, /* Number of elements */ + 239, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the 
list starts at 0; 1 if it starts at the element beyond 0 */ @@ -242158,8 +247538,14 @@ static const UV UNI_EA__W_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -242228,36 +247614,40 @@ static const UV UNI_EA__W_invlist[] = { /* for all charsets */ 0x1F6D3, 0x1F6D5, 0x1F6D8, + 0x1F6DD, + 0x1F6E0, 0x1F6EB, 0x1F6ED, 0x1F6F4, 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x20000, 0x2FFFE, 0x30000, @@ -242275,7 +247665,7 @@ static const UV UNI_EARLYDYNASTICCUNEIFORM_invlist[] = { /* for all charsets */ }; static const UV UNI_EBASE_invlist[] = { /* for all charsets */ - 77, /* Number of elements */ + 81, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -242355,7 +247745,11 @@ static const UV UNI_EBASE_invlist[] = { /* for all charsets */ 0x1F9CD, 0x1F9D0, 0x1F9D1, - 0x1F9DE + 0x1F9DE, + 0x1FAC3, + 0x1FAC6, + 0x1FAF0, + 0x1FAF7 }; # if 'A' == 65 /* ASCII/Latin1 */ @@ -242515,7 +247909,7 @@ static const UV UNI_EMOD_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_EMOJI_invlist[] = { /* for ASCII/Latin1 */ - 305, /* Number of elements */ + 307, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -242788,7 +248182,7 @@ static const UV UNI_EMOJI_invlist[] = { /* for ASCII/Latin1 */ 0x1F6D3, 0x1F6D5, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6E6, 0x1F6E9, 0x1F6EA, @@ 
-242800,30 +248194,32 @@ static const UV UNI_EMOJI_invlist[] = { /* for ASCII/Latin1 */ 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7 + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7 }; # endif /* ASCII/Latin1 */ @@ -242834,7 +248230,7 @@ static const UV UNI_EMOJI_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 1047 */ - 305, /* Number of elements */ + 307, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243107,7 +248503,7 @@ static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 1047 */ 0x1F6D3, 0x1F6D5, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6E6, 0x1F6E9, 0x1F6EA, @@ -243119,30 +248515,32 @@ static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 1047 */ 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7 + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7 }; # endif /* EBCDIC 1047 */ @@ -243153,7 +248551,7 @@ static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 037 */ - 305, /* Number of elements */ + 307, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243426,7 +248824,7 @@ static const UV 
UNI_EMOJI_invlist[] = { /* for EBCDIC 037 */ 0x1F6D3, 0x1F6D5, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6E6, 0x1F6E9, 0x1F6EA, @@ -243438,30 +248836,32 @@ static const UV UNI_EMOJI_invlist[] = { /* for EBCDIC 037 */ 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7 + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7 }; # endif /* EBCDIC 037 */ @@ -243517,7 +248917,7 @@ static const UV UNI_ENCLOSEDIDEOGRAPHICSUP_invlist[] = { /* for all charsets */ }; static const UV UNI_EPRES_invlist[] = { /* for all charsets */ - 163, /* Number of elements */ + 167, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243654,40 +249054,44 @@ static const UV UNI_EPRES_invlist[] = { /* for all charsets */ 0x1F6D3, 0x1F6D5, 0x1F6D8, + 0x1F6DD, + 0x1F6E0, 0x1F6EB, 0x1F6ED, 0x1F6F4, 0x1F6FD, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F90C, 0x1F93B, 0x1F93C, 0x1F946, 0x1F947, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA00, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7 + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7 }; static const UV UNI_ETHI_invlist[] = { /* for all charsets */ - 65, /* Number of elements */ + 73, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243755,7 +249159,15 @@ static const UV UNI_ETHI_invlist[] = { /* for all charsets */ 0xAB20, 0xAB27, 0xAB28, - 0xAB2F + 0xAB2F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF }; 
static const UV UNI_ETHIOPICEXT_invlist[] = { /* for all charsets */ @@ -243778,6 +249190,16 @@ static const UV UNI_ETHIOPICEXTA_invlist[] = { /* for all charsets */ 0xAB30 }; +static const UV UNI_ETHIOPICEXTB_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1E7E0, + 0x1E800 +}; + static const UV UNI_ETHIOPICSUP_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -243791,7 +249213,7 @@ static const UV UNI_ETHIOPICSUP_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_EXT_invlist[] = { /* for ASCII/Latin1 */ - 65, /* Number of elements */ + 67, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243844,6 +249266,8 @@ static const UV UNI_EXT_invlist[] = { /* for ASCII/Latin1 */ 0xAAF5, 0xFF70, 0xFF71, + 0x10781, + 0x10783, 0x1135D, 0x1135E, 0x115C6, @@ -243870,7 +249294,7 @@ static const UV UNI_EXT_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_EXT_invlist[] = { /* for EBCDIC 1047 */ - 65, /* Number of elements */ + 67, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -243923,6 +249347,8 @@ static const UV UNI_EXT_invlist[] = { /* for EBCDIC 1047 */ 0xAAF5, 0xFF70, 0xFF71, + 0x10781, + 0x10783, 0x1135D, 0x1135E, 0x115C6, @@ -243949,7 +249375,7 @@ static const UV UNI_EXT_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_EXT_invlist[] = { /* for EBCDIC 037 */ - 65, /* Number of elements */ + 67, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the 
list starts at 0; 1 if it starts at the element beyond 0 */ @@ -244002,6 +249428,8 @@ static const UV UNI_EXT_invlist[] = { /* for EBCDIC 037 */ 0xAAF5, 0xFF70, 0xFF71, + 0x10781, + 0x10783, 0x1135D, 0x1135E, 0x115C6, @@ -244686,7 +250114,7 @@ static const UV UNI_GCB__CN_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ - 691, /* Number of elements */ + 709, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -244739,7 +250167,9 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -244829,6 +250259,8 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -244940,7 +250372,7 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -244957,6 +250389,8 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -244988,7 +250422,7 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -245032,8 +250466,6 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -245151,16 +250583,24 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -245331,6 +250771,10 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x16FE5, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 
0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D166, 0x1D167, @@ -245369,6 +250813,8 @@ static const UV UNI_GCB__EX_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -245396,7 +250842,7 @@ static const UV UNI_GCB__L_invlist[] = { /* for all charsets */ }; static const UV UNI_GCB__PP_invlist[] = { /* for all charsets */ - 27, /* Number of elements */ + 29, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -245407,6 +250853,8 @@ static const UV UNI_GCB__PP_invlist[] = { /* for all charsets */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0xD4E, @@ -245430,7 +250878,7 @@ static const UV UNI_GCB__PP_invlist[] = { /* for all charsets */ }; static const UV UNI_GCB__SM_invlist[] = { /* for all charsets */ - 319, /* Number of elements */ + 321, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -245529,6 +250977,10 @@ static const UV UNI_GCB__SM_invlist[] = { /* for all charsets */ 0x1058, 0x1084, 0x1085, + 0x1715, + 0x1716, + 0x1734, + 0x1735, 0x17B6, 0x17B7, 0x17BE, @@ -245697,8 +251149,6 @@ static const UV UNI_GCB__SM_invlist[] = { /* for all charsets */ 0x116B0, 0x116B6, 0x116B7, - 0x11720, - 0x11722, 0x11726, 0x11727, 0x1182C, @@ -245782,7 +251232,7 @@ static const UV UNI_GCB__V_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ - 620, /* Number of elements */ + 640, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -245846,7 +251296,11 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -245928,6 
+251382,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -246033,7 +251489,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -246045,7 +251501,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -246067,7 +251523,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -246093,8 +251549,6 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x2010, @@ -246220,16 +251674,24 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -246291,6 +251753,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x116AB, 0x116B8, 0x1171D, + 0x11720, + 0x11722, 0x1172C, 0x1182C, 0x1183B, @@ -246360,6 +251824,10 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -246394,6 +251862,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -246416,7 +251886,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ - 620, /* Number of elements */ + 640, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at 
the element beyond 0 */ @@ -246480,7 +251950,11 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -246562,6 +252036,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -246667,7 +252143,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -246679,7 +252155,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -246701,7 +252177,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -246727,8 +252203,6 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x2010, @@ -246854,16 +252328,24 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -246925,6 +252407,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x116AB, 0x116B8, 0x1171D, + 0x11720, + 0x11722, 0x1172C, 0x1182C, 0x1183B, @@ -246994,6 +252478,10 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -247028,6 +252516,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -247050,7 +252540,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV 
UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ - 620, /* Number of elements */ + 640, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -247114,7 +252604,11 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x890, + 0x892, + 0x898, + 0x8A0, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -247196,6 +252690,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -247301,7 +252797,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -247313,7 +252809,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x17DD, 0x17DE, 0x180B, - 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -247335,7 +252831,7 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -247361,8 +252857,6 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x2010, @@ -247488,16 +252982,24 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x11100, @@ -247559,6 +253061,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x116AB, 0x116B8, 0x1171D, + 0x11720, + 0x11722, 0x1172C, 0x1182C, 0x1183B, @@ -247628,6 +253132,10 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -247662,6 +253170,8 @@ static const UV UNI_GCB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 
0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -247745,7 +253255,7 @@ static const UV UNI_GEORGIANSUP_invlist[] = { /* for all charsets */ }; static const UV UNI_GLAG_invlist[] = { /* for all charsets */ - 23, /* Number of elements */ + 21, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -247755,9 +253265,7 @@ static const UV UNI_GLAG_invlist[] = { /* for all charsets */ 0x487, 0x488, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, + 0x2C60, 0x2E43, 0x2E44, 0xA66F, @@ -247901,7 +253409,7 @@ static const UV UNI_GRAN_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ - 1669, /* Number of elements */ + 1723, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -247948,7 +253456,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x64B, 0x660, 0x670, @@ -247990,10 +253498,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x903, 0x93A, 0x93B, @@ -248170,6 +253678,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0xC45, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -248196,7 +253706,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0xCC9, 0xCCA, 0xCCC, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -248375,12 +253885,12 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x1715, + 0x1716, + 0x171F, 0x1732, - 0x1735, + 0x1734, 0x1737, 0x1740, 0x1752, @@ -248465,11 +253975,11 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1B3D, 0x1B42, 0x1B43, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B6B, 0x1B74, - 0x1B7D, + 
0x1B7F, 0x1B82, 0x1BA2, 0x1BA6, @@ -248557,7 +254067,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x218C, 0x2190, @@ -248569,10 +254079,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -248605,7 +254111,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x2DD8, 0x2DDF, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -248631,8 +254137,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -248649,10 +254153,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0xA6F2, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -248773,15 +254281,15 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -248869,13 +254377,33 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -248960,6 +254488,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -248972,6 +254504,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1104E, 0x11052, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11082, 
0x110B3, 0x110B7, @@ -249117,7 +254653,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x116B6, 0x116B7, 0x116B8, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -249127,7 +254663,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x11726, 0x11727, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1182F, 0x11838, @@ -249184,7 +254720,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x11A98, 0x11A9A, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -249244,6 +254780,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -249255,7 +254793,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF5, @@ -249290,8 +254830,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -249310,6 +254856,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -249325,7 +254873,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -249386,6 +254934,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1DA84, 0x1DA85, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, @@ -249394,12 +254944,22 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -249510,7 +255070,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for 
ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -249520,6 +255080,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -249533,27 +255095,27 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -249561,9 +255123,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -249584,7 +255146,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ - 1669, /* Number of elements */ + 1723, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -249631,7 +255193,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x64B, 0x660, 0x670, @@ -249673,10 +255235,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x903, 0x93A, 0x93B, @@ -249853,6 +255415,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0xC45, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -249879,7 +255443,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0xCC9, 0xCCA, 0xCCC, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -250058,12 +255622,12 @@ static const UV 
UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x1715, + 0x1716, + 0x171F, 0x1732, - 0x1735, + 0x1734, 0x1737, 0x1740, 0x1752, @@ -250148,11 +255712,11 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1B3D, 0x1B42, 0x1B43, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B6B, 0x1B74, - 0x1B7D, + 0x1B7F, 0x1B82, 0x1BA2, 0x1BA6, @@ -250240,7 +255804,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x218C, 0x2190, @@ -250252,10 +255816,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -250288,7 +255848,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x2DD8, 0x2DDF, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -250314,8 +255874,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -250332,10 +255890,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0xA6F2, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -250456,15 +256018,15 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -250552,13 +256114,33 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ 
-250643,6 +256225,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -250655,6 +256241,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1104E, 0x11052, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11082, 0x110B3, 0x110B7, @@ -250800,7 +256390,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x116B6, 0x116B7, 0x116B8, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -250810,7 +256400,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x11726, 0x11727, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1182F, 0x11838, @@ -250867,7 +256457,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x11A98, 0x11A9A, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -250927,6 +256517,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -250938,7 +256530,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF5, @@ -250973,8 +256567,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -250993,6 +256593,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -251008,7 +256610,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -251069,6 +256671,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1DA84, 0x1DA85, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, @@ -251077,12 +256681,22 @@ static const UV 
UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -251193,7 +256807,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -251203,6 +256817,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -251216,27 +256832,27 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -251244,9 +256860,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -251267,7 +256883,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ - 1669, /* Number of elements */ + 1723, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -251314,7 +256930,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x64B, 0x660, 0x670, @@ -251356,10 +256972,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x903, 0x93A, 0x93B, @@ -251536,6 
+257152,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0xC45, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -251562,7 +257180,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0xCC9, 0xCCA, 0xCCC, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -251741,12 +257359,12 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x1715, + 0x1716, + 0x171F, 0x1732, - 0x1735, + 0x1734, 0x1737, 0x1740, 0x1752, @@ -251831,11 +257449,11 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1B3D, 0x1B42, 0x1B43, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B6B, 0x1B74, - 0x1B7D, + 0x1B7F, 0x1B82, 0x1BA2, 0x1BA6, @@ -251923,7 +257541,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x218C, 0x2190, @@ -251935,10 +257553,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -251971,7 +257585,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x2DD8, 0x2DDF, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -251997,8 +257611,6 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -252015,10 +257627,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0xA6F2, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -252139,15 +257755,15 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, + 0xFE00, 0xFE10, 0xFE1A, 0xFE30, @@ -252235,13 +257851,33 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 
0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -252326,6 +257962,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -252338,6 +257978,10 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1104E, 0x11052, 0x11070, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11082, 0x110B3, 0x110B7, @@ -252483,7 +258127,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x116B6, 0x116B7, 0x116B8, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -252493,7 +258137,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x11726, 0x11727, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1182F, 0x11838, @@ -252550,7 +258194,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x11A98, 0x11A9A, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -252610,6 +258254,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x14400, @@ -252621,7 +258267,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF5, @@ -252656,8 +258304,14 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -252676,6 +258330,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -252691,7 +258347,7 @@ static const UV UNI_GRBASE_invlist[] = { /* 
for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -252752,6 +258408,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1DA84, 0x1DA85, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, @@ -252760,12 +258418,22 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, 0x1E2F0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -252876,7 +258544,7 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -252886,6 +258554,8 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -252899,27 +258569,27 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -252927,9 +258597,9 @@ static const UV UNI_GRBASE_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -253039,7 +258709,7 @@ static const UV UNI_GREK_invlist[] = { /* for all charsets */ }; static const UV UNI_GREXT_invlist[] = { /* for all charsets */ - 689, /* Number of elements */ + 707, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -253092,7 +258762,9 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, 
+ 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -253182,6 +258854,8 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -253293,7 +258967,7 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -253310,6 +258984,8 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -253341,7 +259017,7 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -253385,8 +259061,6 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -253504,16 +259178,24 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -253684,6 +259366,10 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x16FE5, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D166, 0x1D167, @@ -253722,6 +259408,8 @@ static const UV UNI_GREXT_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -253843,7 +259531,7 @@ static const UV UNI_HALFMARKS_invlist[] = { /* for all charsets */ }; static const UV UNI_HAN_invlist[] = { /* for all charsets */ - 73, /* Number of elements */ + 75, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -253889,7 +259577,7 @@ static const UV UNI_HAN_invlist[] = { /* for all charsets */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA700, 0xA708, 0xF900, 
@@ -253900,6 +259588,8 @@ static const UV UNI_HAN_invlist[] = { /* for all charsets */ 0xFE47, 0xFF61, 0xFF66, + 0x16FE2, + 0x16FE4, 0x16FF0, 0x16FF2, 0x1D360, @@ -253907,9 +259597,9 @@ static const UV UNI_HAN_invlist[] = { /* for all charsets */ 0x1F250, 0x1F252, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -254075,7 +259765,7 @@ static const UV UNI_HIRA_invlist[] = { /* for all charsets */ 0xFF9E, 0xFFA0, 0x1B001, - 0x1B11F, + 0x1B120, 0x1B150, 0x1B153, 0x1F200, @@ -254263,7 +259953,7 @@ static const UV UNI_HYPHEN_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ - 1461, /* Number of elements */ + 1513, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -254370,11 +260060,11 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -254542,7 +260232,7 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -254552,6 +260242,8 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -254576,7 +260268,7 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -254743,10 +260435,8 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -254766,7 +260456,7 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -254805,9 +260495,9 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1AB0, 
0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -254831,8 +260521,6 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -254913,10 +260601,6 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -254977,8 +260661,6 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -254997,10 +260679,14 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -255178,12 +260864,34 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -255264,6 +260972,8 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -255271,9 +260981,11 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -255380,6 +261092,8 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -255416,7 +261130,7 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -255468,6 +261182,8 @@ static const UV 
UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -255478,6 +261194,10 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -255512,8 +261232,14 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -255530,6 +261256,10 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -255616,6 +261346,8 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -255634,8 +261366,18 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -255713,9 +261455,9 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -255738,7 +261480,7 @@ static const UV UNI_IDC_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ - 1485, /* Number of elements */ + 1537, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -255869,11 +261611,11 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -256041,7 +261783,7 @@ 
static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -256051,6 +261793,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -256075,7 +261819,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -256242,10 +261986,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -256265,7 +262007,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -256304,9 +262046,9 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -256330,8 +262072,6 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -256412,10 +262152,6 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -256476,8 +262212,6 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -256496,10 +262230,14 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -256677,12 +262415,34 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 
0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -256763,6 +262523,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -256770,9 +262532,11 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -256879,6 +262643,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -256915,7 +262681,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -256967,6 +262733,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -256977,6 +262745,10 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -257011,8 +262783,14 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -257029,6 +262807,10 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -257115,6 +262897,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -257133,8 +262917,18 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 
0x1E8D0, @@ -257212,9 +263006,9 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -257237,7 +263031,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ - 1481, /* Number of elements */ + 1533, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -257364,11 +263158,11 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -257536,7 +263330,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -257546,6 +263340,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -257570,7 +263366,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -257737,10 +263533,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -257760,7 +263554,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -257799,9 +263593,9 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -257825,8 +263619,6 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -257907,10 +263699,6 @@ static const UV UNI_IDC_invlist[] = { /* for 
EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -257971,8 +263759,6 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -257991,10 +263777,14 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -258172,12 +263962,34 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -258258,6 +264070,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -258265,9 +264079,11 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -258374,6 +264190,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -258410,7 +264228,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -258462,6 +264280,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -258472,6 +264292,10 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -258506,8 +264330,14 @@ static 
const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -258524,6 +264354,10 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -258610,6 +264444,8 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -258628,8 +264464,18 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -258707,9 +264553,9 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -258729,7 +264575,7 @@ static const UV UNI_IDC_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 */ - 749, /* Number of elements */ + 777, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -258870,12 +264716,16 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -259044,7 +264894,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -259052,6 +264902,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -259078,6 
+264930,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -259275,7 +265129,9 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -259405,7 +265261,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -259422,8 +265278,14 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -259466,14 +265328,26 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -259492,7 +265366,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for ASCII/Latin1 && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 */ - 783, /* Number of elements */ + 811, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -259667,12 +265541,16 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -259841,7 +265719,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 
0xC49, @@ -259849,6 +265727,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -259875,6 +265755,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -260072,7 +265954,9 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -260202,7 +266086,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -260219,8 +266103,14 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -260263,14 +266153,26 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -260289,7 +266191,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 1047 && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 */ - 779, /* Number of elements */ + 807, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -260460,12 +266362,16 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 
0x901, 0x94E, 0x94F, @@ -260634,7 +266540,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -260642,6 +266548,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -260668,6 +266576,8 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -260865,7 +266775,9 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -260995,7 +266907,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -261012,8 +266924,14 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -261056,14 +266974,26 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -261079,7 +267009,7 @@ static const UV UNI_IDENTIFIERSTATUS__ALLOWED_invlist[] = { /* for EBCDIC 037 * # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Latin1 */ - 749, /* Number of elements */ + 777, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -261220,12 +267150,16 @@ static const UV 
UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -261394,7 +267328,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -261402,6 +267336,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -261428,6 +267364,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -261625,7 +267563,9 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -261755,7 +267695,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -261772,8 +267712,14 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -261816,14 +267762,26 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -261842,7 +267800,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for ASCII/Lat && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 1047 */ - 783, /* Number of elements */ + 811, /* 
Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -262017,12 +267975,16 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -262191,7 +268153,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -262199,6 +268161,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -262225,6 +268189,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -262422,7 +268388,9 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -262552,7 +268520,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -262569,8 +268537,14 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -262613,14 +268587,26 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 10 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -262639,7 +268625,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 
10 && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 037 */ - 779, /* Number of elements */ + 807, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -262810,12 +268796,16 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -262984,7 +268974,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -262992,6 +268982,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -263018,6 +269010,8 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -263215,7 +269209,9 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -263345,7 +269341,7 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -263362,8 +269358,14 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -263406,14 +269408,26 @@ static const UV UNI_IDENTIFIERSTATUS__RESTRICTED_invlist[] = { /* for EBCDIC 03 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 
0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -263445,7 +269459,7 @@ static const UV UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE_invlist[] = { /* for ASCII 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x200C, 0x200E, @@ -263498,7 +269512,7 @@ static const UV UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE_invlist[] = { /* for EBCDI 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x200C, 0x200E, @@ -263551,7 +269565,7 @@ static const UV UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE_invlist[] = { /* for EBCDI 0x17B4, 0x17B6, 0x180B, - 0x180F, + 0x1810, 0x200B, 0x200C, 0x200E, @@ -263583,7 +269597,7 @@ static const UV UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE_invlist[] = { /* for EBCDI # endif /* EBCDIC 037 */ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets */ - 425, /* Number of elements */ + 443, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -263601,10 +269615,8 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -263629,9 +269641,7 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x1CFA, 0x1CFB, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, + 0x2C60, 0x2C80, 0x2CF4, 0x2CF9, @@ -263689,7 +269699,21 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, @@ -263778,6 +269802,8 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -263785,9 +269811,9 @@ static const UV 
UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -263863,7 +269889,7 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -263871,7 +269897,7 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -263942,6 +269968,8 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -263953,7 +269981,9 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -264008,6 +270038,8 @@ static const UV UNI_IDENTIFIERTYPE__EXCLUSION_invlist[] = { /* for all charsets 0x1E025, 0x1E026, 0x1E02B, + 0x1E290, + 0x1E2AF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -264151,7 +270183,7 @@ static const UV UNI_IDENTIFIERTYPE__INCLUSION_invlist[] = { /* for EBCDIC 037 * # endif /* EBCDIC 037 */ static const UV UNI_IDENTIFIERTYPE__LIMITEDUSE_invlist[] = { /* for all charsets */ - 171, /* Number of elements */ + 175, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -264211,9 +270243,9 @@ static const UV UNI_IDENTIFIERTYPE__LIMITEDUSE_invlist[] = { /* for all charset 0x1AA0, 0x1AAE, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -264224,6 +270256,8 @@ static const UV UNI_IDENTIFIERTYPE__LIMITEDUSE_invlist[] = { /* for all charset 0x1C80, 0x1CC0, 0x1CC8, + 0x1DFA, + 0x1DFB, 0x2D30, 0x2D68, 0x2D70, @@ -264286,6 +270320,8 @@ static const UV UNI_IDENTIFIERTYPE__LIMITEDUSE_invlist[] = { /* for all charset 0x1145C, 
0x1145D, 0x11462, + 0x11AB0, + 0x11AC0, 0x11D60, 0x11D66, 0x11D67, @@ -264331,7 +270367,7 @@ static const UV UNI_IDENTIFIERTYPE__LIMITEDUSE_invlist[] = { /* for all charset # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Latin1 */ - 1357, /* Number of elements */ + 1399, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -264367,8 +270403,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -264386,11 +270420,11 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -264546,7 +270580,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -264556,6 +270590,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -264578,7 +270614,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -264713,10 +270749,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -264733,8 +270767,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -264773,11 +270805,11 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 
0x1BFC, @@ -264793,8 +270825,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -264835,7 +270865,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -264849,10 +270879,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -264883,7 +270909,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -264907,8 +270933,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -264917,10 +270941,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -264991,16 +271019,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -265087,13 +271113,33 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -265180,6 +271226,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for 
ASCII/Lat 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -265187,9 +271235,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -265273,7 +271321,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -265281,7 +271329,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -265312,7 +271360,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -265368,6 +271416,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -265381,7 +271431,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -265414,8 +271466,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -265432,12 +271490,18 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -265492,6 +271556,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -265510,10 +271576,20 @@ 
static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -265622,7 +271698,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -265632,6 +271708,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -265645,27 +271723,27 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -265673,9 +271751,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -265702,7 +271780,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for ASCII/Lat && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 1047 */ - 1361, /* Number of elements */ + 1403, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -265742,8 +271820,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -265761,11 +271837,11 @@ static const UV 
UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -265921,7 +271997,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -265931,6 +272007,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -265953,7 +272031,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -266088,10 +272166,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -266108,8 +272184,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -266148,11 +272222,11 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -266168,8 +272242,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -266210,7 +272282,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -266224,10 +272296,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -266258,7 +272326,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 
0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -266282,8 +272350,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -266292,10 +272358,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -266366,16 +272436,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -266462,13 +272530,33 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -266555,6 +272643,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -266562,9 +272652,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -266648,7 +272738,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -266656,7 +272746,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -266687,7 +272777,7 @@ static 
const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -266743,6 +272833,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -266756,7 +272848,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -266789,8 +272883,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -266807,12 +272907,18 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -266867,6 +272973,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -266885,10 +272993,20 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -266997,7 +273115,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -267007,6 +273125,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -267020,27 +273140,27 @@ static const UV 
UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -267048,9 +273168,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -267077,7 +273197,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 10 && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 037 */ - 1361, /* Number of elements */ + 1403, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -267117,8 +273237,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -267136,11 +273254,11 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -267296,7 +273414,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -267306,6 +273424,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -267328,7 +273448,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -267463,10 +273583,8 
@@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -267483,8 +273601,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -267523,11 +273639,11 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -267543,8 +273659,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -267585,7 +273699,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -267599,10 +273713,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -267633,7 +273743,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -267657,8 +273767,6 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -267667,10 +273775,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -267741,16 +273853,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 
0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -267837,13 +273947,33 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -267930,6 +274060,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -267937,9 +274069,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -268023,7 +274155,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -268031,7 +274163,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -268062,7 +274194,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -268118,6 +274250,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -268131,7 +274265,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -268164,8 +274300,14 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 
0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -268182,12 +274324,18 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -268242,6 +274390,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -268260,10 +274410,20 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -268372,7 +274532,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -268382,6 +274542,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -268395,27 +274557,27 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -268423,9 +274585,9 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* for EBCDIC 03 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -268449,7 +274611,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTCHARACTER_invlist[] = { /* 
for EBCDIC 03 # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for ASCII/Latin1 */ - 503, /* Number of elements */ + 511, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -268740,6 +274902,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for ASCII/Latin1 * 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -268822,6 +274986,12 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for ASCII/Latin1 * 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -268966,7 +275136,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for ASCII/Latin1 * && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 1047 */ - 509, /* Number of elements */ + 517, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -269263,6 +275433,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -269345,6 +275517,12 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -269489,7 +275667,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 037 */ - 507, /* Number of elements */ + 515, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -269784,6 +275962,8 @@ 
static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -269866,6 +276046,12 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -270007,7 +276193,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTNFKC_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ - 691, /* Number of elements */ + 707, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -270086,7 +276272,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -270108,6 +276294,10 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x83F, 0x85E, 0x85F, + 0x888, + 0x889, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x964, @@ -270217,7 +276407,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1B5A, 0x1B6B, 0x1B74, - 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -270255,7 +276445,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x20A0, 0x20A8, 0x20A9, - 0x20C0, + 0x20C1, 0x20DD, 0x20E1, 0x20E2, @@ -270317,7 +276507,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x2D70, 0x2D71, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -270399,11 +276589,13 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0xABEB, 0xABEC, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE45, 0xFE47, 0xFFF9, @@ -270484,6 +276676,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for 
ASCII/Latin1 */ 0x10F27, 0x10F51, 0x10F5A, + 0x10F86, + 0x10F8A, 0x10FC5, 0x10FCC, 0x11047, @@ -270526,6 +276720,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173A, 0x11740, 0x1183B, @@ -270556,6 +276752,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x13430, 0x13439, 0x16A6E, @@ -270576,6 +276774,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -270591,7 +276791,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1D1AE, 0x1D1BB, 0x1D1C1, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -270654,7 +276854,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -270664,6 +276864,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -270677,27 +276879,27 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -270712,7 +276914,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ - 705, /* Number of elements */ + 721, /* Number of elements */ 148565664, /* Version and data structure 
type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -270805,7 +277007,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -270827,6 +277029,10 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x83F, 0x85E, 0x85F, + 0x888, + 0x889, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x964, @@ -270936,7 +277142,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1B5A, 0x1B6B, 0x1B74, - 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -270974,7 +277180,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x20A0, 0x20A8, 0x20A9, - 0x20C0, + 0x20C1, 0x20DD, 0x20E1, 0x20E2, @@ -271036,7 +277242,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x2D70, 0x2D71, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -271118,11 +277324,13 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0xABEB, 0xABEC, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE45, 0xFE47, 0xFFF9, @@ -271203,6 +277411,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x10F27, 0x10F51, 0x10F5A, + 0x10F86, + 0x10F8A, 0x10FC5, 0x10FCC, 0x11047, @@ -271245,6 +277455,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173A, 0x11740, 0x1183B, @@ -271275,6 +277487,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x13430, 0x13439, 0x16A6E, @@ -271295,6 +277509,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -271310,7 +277526,7 @@ static const UV 
UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1D1AE, 0x1D1BB, 0x1D1C1, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -271373,7 +277589,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -271383,6 +277599,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -271396,27 +277614,27 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -271431,7 +277649,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ - 703, /* Number of elements */ + 719, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -271522,7 +277740,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x610, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -271544,6 +277762,10 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x83F, 0x85E, 0x85F, + 0x888, + 0x889, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x964, @@ -271653,7 +277875,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1B5A, 0x1B6B, 0x1B74, - 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -271691,7 +277913,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* 
for EBCDIC 037 */ 0x20A0, 0x20A8, 0x20A9, - 0x20C0, + 0x20C1, 0x20DD, 0x20E1, 0x20E2, @@ -271753,7 +277975,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x2D70, 0x2D71, 0x2E00, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -271835,11 +278057,13 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0xABEB, 0xABEC, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE45, 0xFE47, 0xFFF9, @@ -271920,6 +278144,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x10F27, 0x10F51, 0x10F5A, + 0x10F86, + 0x10F8A, 0x10FC5, 0x10FCC, 0x11047, @@ -271962,6 +278188,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173A, 0x11740, 0x1183B, @@ -271992,6 +278220,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x13430, 0x13439, 0x16A6E, @@ -272012,6 +278242,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1BC9D, 0x1BC9F, 0x1BCA0, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -272027,7 +278259,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1D1AE, 0x1D1BB, 0x1D1C1, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -272090,7 +278322,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -272100,6 +278332,8 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -272113,27 +278347,27 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, 
- 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -272143,7 +278377,7 @@ static const UV UNI_IDENTIFIERTYPE__NOTXID_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_IDENTIFIERTYPE__OBSOLETE_invlist[] = { /* for all charsets */ - 207, /* Number of elements */ + 209, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -272298,6 +278532,8 @@ static const UV UNI_IDENTIFIERTYPE__OBSOLETE_invlist[] = { /* for all charsets 0x3030, 0x312E, 0x312F, + 0x31F0, + 0x3200, 0xA610, 0xA613, 0xA62A, @@ -272359,7 +278595,7 @@ static const UV UNI_IDENTIFIERTYPE__OBSOLETE_invlist[] = { /* for all charsets # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Latin1 */ - 733, /* Number of elements */ + 761, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -272492,12 +278728,16 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -272666,7 +278906,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -272674,6 +278914,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -272700,6 +278942,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -272895,7 +279139,9 @@ static 
const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -273019,7 +279265,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -273036,8 +279282,14 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -273080,14 +279332,26 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -273106,7 +279370,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for ASCII/Lati && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 1047 */ - 763, /* Number of elements */ + 791, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -273269,12 +279533,16 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -273443,7 +279711,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -273451,6 +279719,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -273477,6 
+279747,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -273672,7 +279944,9 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -273796,7 +280070,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -273813,8 +280087,14 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -273857,14 +280137,26 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -273883,7 +280175,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 104 && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 */ - 759, /* Number of elements */ + 787, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -274042,12 +280334,16 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0x700, 0x750, 0x7B2, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8B2, 0x8B3, - 0x8B6, - 0x8C8, + 0x8B5, + 0x8CA, 0x901, 0x94E, 0x94F, @@ -274216,7 +280512,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0xC34, 0xC35, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 
0xC49, @@ -274224,6 +280520,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0xC4E, 0xC55, 0xC57, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC66, @@ -274250,6 +280548,8 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0xCCE, 0xCD5, 0xCD7, + 0xCDD, + 0xCDE, 0xCE0, 0xCE4, 0xCE6, @@ -274445,7 +280745,9 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0x17A9, 0x17B4, 0x17B6, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17D3, 0x17D7, @@ -274569,7 +280871,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xA67F, 0xA680, 0xA717, @@ -274586,8 +280888,14 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0xA7AF, 0xA7B8, 0xA7BA, - 0xA7C2, + 0xA7C0, 0xA7CB, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 0xA9E7, 0xA9FF, 0xAA60, @@ -274630,14 +280938,26 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 0x1133D, 0x16FF0, 0x16FF2, + 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, 0x1B168, + 0x1DF00, + 0x1DF1F, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -274651,7 +280971,7 @@ static const UV UNI_IDENTIFIERTYPE__RECOMMENDED_invlist[] = { /* for EBCDIC 037 # endif /* EBCDIC 037 */ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets */ - 191, /* Number of elements */ + 199, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -274740,12 +281060,16 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets 0xDF4, 0xF18, 0xF1A, - 0x17CB, + 0x17CE, + 0x17D0, + 0x17D1, 0x17D2, 0x17DD, 0x17DE, 0x1ABF, 0x1AC1, + 0x1B6B, + 0x1B74, 0x1D00, 0x1D2C, 0x1D2F, @@ 
-274759,8 +281083,6 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets 0x1D79, 0x1D9B, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x1E9C, 0x1E9E, @@ -274796,8 +281118,6 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets 0x3036, 0x303B, 0x303D, - 0x31F0, - 0x3200, 0x327F, 0x3280, 0x4DC0, @@ -274819,17 +281139,25 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets 0xFB1E, 0xFB1F, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFD3E, - 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE20, 0xFE30, 0xFE45, 0xFE47, 0xFE73, 0xFE74, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -274841,7 +281169,7 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets 0x1D17B, 0x1D1BB, 0x1D1C1, - 0x1D1E9, + 0x1D1EB, 0x1D242, 0x1D245, 0x1D300, @@ -274849,7 +281177,7 @@ static const UV UNI_IDENTIFIERTYPE__TECHNICAL_invlist[] = { /* for all charsets }; static const UV UNI_IDENTIFIERTYPE__UNCOMMONUSE_invlist[] = { /* for all charsets */ - 153, /* Number of elements */ + 165, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -274932,9 +281260,11 @@ static const UV UNI_IDENTIFIERTYPE__UNCOMMONUSE_invlist[] = { /* for all charse 0x6E9, 0x6EA, 0x6EE, + 0x898, + 0x8A0, 0x8B3, 0x8B5, - 0x8D3, + 0x8CA, 0x8E2, 0x8E3, 0x901, @@ -274970,6 +281300,8 @@ static const UV UNI_IDENTIFIERTYPE__UNCOMMONUSE_invlist[] = { /* for all charse 0xF3A, 0x18A9, 0x18AA, + 0x1AC1, + 0x1ACF, 0x2054, 0x2055, 0x218A, @@ -274998,10 +281330,18 @@ static const UV UNI_IDENTIFIERTYPE__UNCOMMONUSE_invlist[] = { /* for all charse 0xFB1F, 0xFE2E, 0xFE30, + 0x10780, + 0x10781, 0x16A40, 0x16A5F, 0x16A60, 0x16A6A, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1D1DE, 0x1D1E9, 0x1F54F, @@ -275023,7 +281363,7 @@ static const UV UNI_IDEO_invlist[] = { 
/* for all charsets */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xF900, 0xFA6E, 0xFA70, @@ -275039,9 +281379,9 @@ static const UV UNI_IDEO_invlist[] = { /* for all charsets */ 0x1B170, 0x1B2FC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -275067,7 +281407,7 @@ static const UV UNI_IDEOGRAPHICSYMBOLS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ - 1245, /* Number of elements */ + 1297, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -275170,10 +281510,12 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -275302,6 +281644,8 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -275318,7 +281662,7 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -275461,10 +281805,8 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -275505,7 +281847,7 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -275605,10 +281947,6 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -275669,8 +282007,6 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -275691,10 +282027,14 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 
0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -275872,12 +282212,34 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -275948,12 +282310,18 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -276036,6 +282404,8 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -276074,7 +282444,7 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -276110,6 +282480,8 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -276118,6 +282490,8 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -276146,8 +282520,14 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -276222,14 +282602,26 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 
0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -276303,9 +282695,9 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -276326,7 +282718,7 @@ static const UV UNI_IDS_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ - 1271, /* Number of elements */ + 1323, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -276455,10 +282847,12 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -276587,6 +282981,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -276603,7 +282999,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -276746,10 +283142,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -276790,7 +283184,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -276890,10 +283284,6 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -276954,8 +283344,6 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -276976,10 +283364,14 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, 
+ 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -277157,12 +283549,34 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -277233,12 +283647,18 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -277321,6 +283741,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -277359,7 +283781,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -277395,6 +283817,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -277403,6 +283827,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -277431,8 +283857,14 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -277507,14 +283939,26 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -277588,9 +284032,9 @@ static 
const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -277611,7 +284055,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ - 1267, /* Number of elements */ + 1319, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -277736,10 +284180,12 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -277868,6 +284314,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -277884,7 +284332,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -278027,10 +284475,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -278071,7 +284517,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -278171,10 +284617,6 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -278235,8 +284677,6 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -278257,10 +284697,14 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -278438,12 +284882,34 @@ static const UV 
UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -278514,12 +284980,18 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -278602,6 +285074,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -278640,7 +285114,7 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -278676,6 +285150,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -278684,6 +285160,8 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -278712,8 +285190,14 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -278788,14 +285272,26 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -278869,9 +285365,9 @@ static const UV UNI_IDS_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 
0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -280412,7 +286908,1326 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x11334, 0x11335, 0x1133A, - 0x1133C, + 0x1133C, + 0x11345, + 0x11347, + 0x11349, + 0x1134B, + 0x1134E, + 0x11350, + 0x11351, + 0x11357, + 0x11358, + 0x1135D, + 0x11364, + 0x11366, + 0x1136D, + 0x11370, + 0x11375, + 0x11400, + 0x1145A, + 0x1145B, + 0x1145C, + 0x1145D, + 0x1145E, + 0x11480, + 0x114C8, + 0x114D0, + 0x114DA, + 0x11580, + 0x115B6, + 0x115B8, + 0x115DE, + 0x11600, + 0x11645, + 0x11650, + 0x1165A, + 0x11660, + 0x1166D, + 0x11680, + 0x116B8, + 0x116C0, + 0x116CA, + 0x11700, + 0x1171A, + 0x1171D, + 0x1172C, + 0x11730, + 0x11740, + 0x118A0, + 0x118F3, + 0x118FF, + 0x11900, + 0x11A00, + 0x11A48, + 0x11A50, + 0x11A84, + 0x11A86, + 0x11A9D, + 0x11A9E, + 0x11AA3, + 0x11AC0, + 0x11AF9, + 0x11C00, + 0x11C09, + 0x11C0A, + 0x11C37, + 0x11C38, + 0x11C46, + 0x11C50, + 0x11C6D, + 0x11C70, + 0x11C90, + 0x11C92, + 0x11CA8, + 0x11CA9, + 0x11CB7, + 0x11D00, + 0x11D07, + 0x11D08, + 0x11D0A, + 0x11D0B, + 0x11D37, + 0x11D3A, + 0x11D3B, + 0x11D3C, + 0x11D3E, + 0x11D3F, + 0x11D48, + 0x11D50, + 0x11D5A, + 0x12000, + 0x1239A, + 0x12400, + 0x1246F, + 0x12470, + 0x12475, + 0x12480, + 0x12544, + 0x13000, + 0x1342F, + 0x14400, + 0x14647, + 0x16800, + 0x16A39, + 0x16A40, + 0x16A5F, + 0x16A60, + 0x16A6A, + 0x16A6E, + 0x16A70, + 0x16AD0, + 0x16AEE, + 0x16AF0, + 0x16AF6, + 0x16B00, + 0x16B46, + 0x16B50, + 0x16B5A, + 0x16B5B, + 0x16B62, + 0x16B63, + 0x16B78, + 0x16B7D, + 0x16B90, + 0x16F00, + 0x16F45, + 0x16F50, + 0x16F7F, + 0x16F8F, + 0x16FA0, + 0x16FE0, + 0x16FE2, + 0x17000, + 0x187ED, + 0x18800, + 0x18AF3, + 0x1B000, + 0x1B11F, + 0x1B170, + 0x1B2FC, + 0x1BC00, + 0x1BC6B, + 0x1BC70, + 0x1BC7D, + 0x1BC80, + 0x1BC89, + 0x1BC90, + 0x1BC9A, + 0x1BC9C, + 0x1BCA4, + 0x1D000, + 0x1D0F6, + 0x1D100, + 0x1D127, + 0x1D129, + 0x1D1E9, + 0x1D200, + 0x1D246, + 0x1D300, + 0x1D357, + 0x1D360, + 0x1D372, + 0x1D400, + 0x1D455, + 
0x1D456, + 0x1D49D, + 0x1D49E, + 0x1D4A0, + 0x1D4A2, + 0x1D4A3, + 0x1D4A5, + 0x1D4A7, + 0x1D4A9, + 0x1D4AD, + 0x1D4AE, + 0x1D4BA, + 0x1D4BB, + 0x1D4BC, + 0x1D4BD, + 0x1D4C4, + 0x1D4C5, + 0x1D506, + 0x1D507, + 0x1D50B, + 0x1D50D, + 0x1D515, + 0x1D516, + 0x1D51D, + 0x1D51E, + 0x1D53A, + 0x1D53B, + 0x1D53F, + 0x1D540, + 0x1D545, + 0x1D546, + 0x1D547, + 0x1D54A, + 0x1D551, + 0x1D552, + 0x1D6A6, + 0x1D6A8, + 0x1D7CC, + 0x1D7CE, + 0x1DA8C, + 0x1DA9B, + 0x1DAA0, + 0x1DAA1, + 0x1DAB0, + 0x1E000, + 0x1E007, + 0x1E008, + 0x1E019, + 0x1E01B, + 0x1E022, + 0x1E023, + 0x1E025, + 0x1E026, + 0x1E02B, + 0x1E800, + 0x1E8C5, + 0x1E8C7, + 0x1E8D7, + 0x1E900, + 0x1E94B, + 0x1E950, + 0x1E95A, + 0x1E95E, + 0x1E960, + 0x1EE00, + 0x1EE04, + 0x1EE05, + 0x1EE20, + 0x1EE21, + 0x1EE23, + 0x1EE24, + 0x1EE25, + 0x1EE27, + 0x1EE28, + 0x1EE29, + 0x1EE33, + 0x1EE34, + 0x1EE38, + 0x1EE39, + 0x1EE3A, + 0x1EE3B, + 0x1EE3C, + 0x1EE42, + 0x1EE43, + 0x1EE47, + 0x1EE48, + 0x1EE49, + 0x1EE4A, + 0x1EE4B, + 0x1EE4C, + 0x1EE4D, + 0x1EE50, + 0x1EE51, + 0x1EE53, + 0x1EE54, + 0x1EE55, + 0x1EE57, + 0x1EE58, + 0x1EE59, + 0x1EE5A, + 0x1EE5B, + 0x1EE5C, + 0x1EE5D, + 0x1EE5E, + 0x1EE5F, + 0x1EE60, + 0x1EE61, + 0x1EE63, + 0x1EE64, + 0x1EE65, + 0x1EE67, + 0x1EE6B, + 0x1EE6C, + 0x1EE73, + 0x1EE74, + 0x1EE78, + 0x1EE79, + 0x1EE7D, + 0x1EE7E, + 0x1EE7F, + 0x1EE80, + 0x1EE8A, + 0x1EE8B, + 0x1EE9C, + 0x1EEA1, + 0x1EEA4, + 0x1EEA5, + 0x1EEAA, + 0x1EEAB, + 0x1EEBC, + 0x1EEF0, + 0x1EEF2, + 0x1F000, + 0x1F02C, + 0x1F030, + 0x1F094, + 0x1F0A0, + 0x1F0AF, + 0x1F0B1, + 0x1F0C0, + 0x1F0C1, + 0x1F0D0, + 0x1F0D1, + 0x1F0F6, + 0x1F100, + 0x1F10D, + 0x1F110, + 0x1F12F, + 0x1F130, + 0x1F16C, + 0x1F170, + 0x1F1AD, + 0x1F1E6, + 0x1F203, + 0x1F210, + 0x1F23C, + 0x1F240, + 0x1F249, + 0x1F250, + 0x1F252, + 0x1F260, + 0x1F266, + 0x1F300, + 0x1F6D5, + 0x1F6E0, + 0x1F6ED, + 0x1F6F0, + 0x1F6F9, + 0x1F700, + 0x1F774, + 0x1F780, + 0x1F7D5, + 0x1F800, + 0x1F80C, + 0x1F810, + 0x1F848, + 0x1F850, + 0x1F85A, + 0x1F860, + 0x1F888, + 0x1F890, + 0x1F8AE, 
+ 0x1F900, + 0x1F90C, + 0x1F910, + 0x1F93F, + 0x1F940, + 0x1F94D, + 0x1F950, + 0x1F96C, + 0x1F980, + 0x1F998, + 0x1F9C0, + 0x1F9C1, + 0x1F9D0, + 0x1F9E7, + 0x1FFFE, + 0x2A6D7, + 0x2A700, + 0x2B735, + 0x2B740, + 0x2B81E, + 0x2B820, + 0x2CEA2, + 0x2CEB0, + 0x2EBE1, + 0x2F800, + 0x2FA1E, + 0x2FFFE, + 0x30000, + 0x3FFFE, + 0x40000, + 0x4FFFE, + 0x50000, + 0x5FFFE, + 0x60000, + 0x6FFFE, + 0x70000, + 0x7FFFE, + 0x80000, + 0x8FFFE, + 0x90000, + 0x9FFFE, + 0xA0000, + 0xAFFFE, + 0xB0000, + 0xBFFFE, + 0xC0000, + 0xCFFFE, + 0xD0000, + 0xDFFFE, + 0xE0000, + 0xE0001, + 0xE0002, + 0xE0020, + 0xE0080, + 0xE0100, + 0xE01F0, + 0xEFFFE, + 0x110000 +}; + +static const UV UNI_IN__11_invlist[] = { /* for all charsets */ + 1336, /* Number of elements */ + 148565664, /* Version and data structure type */ + 0, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x378, + 0x37A, + 0x380, + 0x384, + 0x38B, + 0x38C, + 0x38D, + 0x38E, + 0x3A2, + 0x3A3, + 0x530, + 0x531, + 0x557, + 0x559, + 0x58B, + 0x58D, + 0x590, + 0x591, + 0x5C8, + 0x5D0, + 0x5EB, + 0x5EF, + 0x5F5, + 0x600, + 0x61D, + 0x61E, + 0x70E, + 0x70F, + 0x74B, + 0x74D, + 0x7B2, + 0x7C0, + 0x7FB, + 0x7FD, + 0x82E, + 0x830, + 0x83F, + 0x840, + 0x85C, + 0x85E, + 0x85F, + 0x860, + 0x86B, + 0x8A0, + 0x8B5, + 0x8B6, + 0x8BE, + 0x8D3, + 0x984, + 0x985, + 0x98D, + 0x98F, + 0x991, + 0x993, + 0x9A9, + 0x9AA, + 0x9B1, + 0x9B2, + 0x9B3, + 0x9B6, + 0x9BA, + 0x9BC, + 0x9C5, + 0x9C7, + 0x9C9, + 0x9CB, + 0x9CF, + 0x9D7, + 0x9D8, + 0x9DC, + 0x9DE, + 0x9DF, + 0x9E4, + 0x9E6, + 0x9FF, + 0xA01, + 0xA04, + 0xA05, + 0xA0B, + 0xA0F, + 0xA11, + 0xA13, + 0xA29, + 0xA2A, + 0xA31, + 0xA32, + 0xA34, + 0xA35, + 0xA37, + 0xA38, + 0xA3A, + 0xA3C, + 0xA3D, + 0xA3E, + 0xA43, + 0xA47, + 0xA49, + 0xA4B, + 0xA4E, + 0xA51, + 0xA52, + 0xA59, + 0xA5D, + 0xA5E, + 0xA5F, + 0xA66, + 0xA77, + 0xA81, + 0xA84, + 0xA85, + 0xA8E, + 0xA8F, + 0xA92, + 0xA93, + 0xAA9, + 0xAAA, + 0xAB1, + 0xAB2, + 0xAB4, + 0xAB5, + 0xABA, + 0xABC, + 0xAC6, + 0xAC7, + 
0xACA, + 0xACB, + 0xACE, + 0xAD0, + 0xAD1, + 0xAE0, + 0xAE4, + 0xAE6, + 0xAF2, + 0xAF9, + 0xB00, + 0xB01, + 0xB04, + 0xB05, + 0xB0D, + 0xB0F, + 0xB11, + 0xB13, + 0xB29, + 0xB2A, + 0xB31, + 0xB32, + 0xB34, + 0xB35, + 0xB3A, + 0xB3C, + 0xB45, + 0xB47, + 0xB49, + 0xB4B, + 0xB4E, + 0xB56, + 0xB58, + 0xB5C, + 0xB5E, + 0xB5F, + 0xB64, + 0xB66, + 0xB78, + 0xB82, + 0xB84, + 0xB85, + 0xB8B, + 0xB8E, + 0xB91, + 0xB92, + 0xB96, + 0xB99, + 0xB9B, + 0xB9C, + 0xB9D, + 0xB9E, + 0xBA0, + 0xBA3, + 0xBA5, + 0xBA8, + 0xBAB, + 0xBAE, + 0xBBA, + 0xBBE, + 0xBC3, + 0xBC6, + 0xBC9, + 0xBCA, + 0xBCE, + 0xBD0, + 0xBD1, + 0xBD7, + 0xBD8, + 0xBE6, + 0xBFB, + 0xC00, + 0xC0D, + 0xC0E, + 0xC11, + 0xC12, + 0xC29, + 0xC2A, + 0xC3A, + 0xC3D, + 0xC45, + 0xC46, + 0xC49, + 0xC4A, + 0xC4E, + 0xC55, + 0xC57, + 0xC58, + 0xC5B, + 0xC60, + 0xC64, + 0xC66, + 0xC70, + 0xC78, + 0xC8D, + 0xC8E, + 0xC91, + 0xC92, + 0xCA9, + 0xCAA, + 0xCB4, + 0xCB5, + 0xCBA, + 0xCBC, + 0xCC5, + 0xCC6, + 0xCC9, + 0xCCA, + 0xCCE, + 0xCD5, + 0xCD7, + 0xCDE, + 0xCDF, + 0xCE0, + 0xCE4, + 0xCE6, + 0xCF0, + 0xCF1, + 0xCF3, + 0xD00, + 0xD04, + 0xD05, + 0xD0D, + 0xD0E, + 0xD11, + 0xD12, + 0xD45, + 0xD46, + 0xD49, + 0xD4A, + 0xD50, + 0xD54, + 0xD64, + 0xD66, + 0xD80, + 0xD82, + 0xD84, + 0xD85, + 0xD97, + 0xD9A, + 0xDB2, + 0xDB3, + 0xDBC, + 0xDBD, + 0xDBE, + 0xDC0, + 0xDC7, + 0xDCA, + 0xDCB, + 0xDCF, + 0xDD5, + 0xDD6, + 0xDD7, + 0xDD8, + 0xDE0, + 0xDE6, + 0xDF0, + 0xDF2, + 0xDF5, + 0xE01, + 0xE3B, + 0xE3F, + 0xE5C, + 0xE81, + 0xE83, + 0xE84, + 0xE85, + 0xE87, + 0xE89, + 0xE8A, + 0xE8B, + 0xE8D, + 0xE8E, + 0xE94, + 0xE98, + 0xE99, + 0xEA0, + 0xEA1, + 0xEA4, + 0xEA5, + 0xEA6, + 0xEA7, + 0xEA8, + 0xEAA, + 0xEAC, + 0xEAD, + 0xEBA, + 0xEBB, + 0xEBE, + 0xEC0, + 0xEC5, + 0xEC6, + 0xEC7, + 0xEC8, + 0xECE, + 0xED0, + 0xEDA, + 0xEDC, + 0xEE0, + 0xF00, + 0xF48, + 0xF49, + 0xF6D, + 0xF71, + 0xF98, + 0xF99, + 0xFBD, + 0xFBE, + 0xFCD, + 0xFCE, + 0xFDB, + 0x1000, + 0x10C6, + 0x10C7, + 0x10C8, + 0x10CD, + 0x10CE, + 0x10D0, + 0x1249, + 0x124A, + 0x124E, + 
0x1250, + 0x1257, + 0x1258, + 0x1259, + 0x125A, + 0x125E, + 0x1260, + 0x1289, + 0x128A, + 0x128E, + 0x1290, + 0x12B1, + 0x12B2, + 0x12B6, + 0x12B8, + 0x12BF, + 0x12C0, + 0x12C1, + 0x12C2, + 0x12C6, + 0x12C8, + 0x12D7, + 0x12D8, + 0x1311, + 0x1312, + 0x1316, + 0x1318, + 0x135B, + 0x135D, + 0x137D, + 0x1380, + 0x139A, + 0x13A0, + 0x13F6, + 0x13F8, + 0x13FE, + 0x1400, + 0x169D, + 0x16A0, + 0x16F9, + 0x1700, + 0x170D, + 0x170E, + 0x1715, + 0x1720, + 0x1737, + 0x1740, + 0x1754, + 0x1760, + 0x176D, + 0x176E, + 0x1771, + 0x1772, + 0x1774, + 0x1780, + 0x17DE, + 0x17E0, + 0x17EA, + 0x17F0, + 0x17FA, + 0x1800, + 0x180F, + 0x1810, + 0x181A, + 0x1820, + 0x1879, + 0x1880, + 0x18AB, + 0x18B0, + 0x18F6, + 0x1900, + 0x191F, + 0x1920, + 0x192C, + 0x1930, + 0x193C, + 0x1940, + 0x1941, + 0x1944, + 0x196E, + 0x1970, + 0x1975, + 0x1980, + 0x19AC, + 0x19B0, + 0x19CA, + 0x19D0, + 0x19DB, + 0x19DE, + 0x1A1C, + 0x1A1E, + 0x1A5F, + 0x1A60, + 0x1A7D, + 0x1A7F, + 0x1A8A, + 0x1A90, + 0x1A9A, + 0x1AA0, + 0x1AAE, + 0x1AB0, + 0x1ABF, + 0x1B00, + 0x1B4C, + 0x1B50, + 0x1B7D, + 0x1B80, + 0x1BF4, + 0x1BFC, + 0x1C38, + 0x1C3B, + 0x1C4A, + 0x1C4D, + 0x1C89, + 0x1C90, + 0x1CBB, + 0x1CBD, + 0x1CC8, + 0x1CD0, + 0x1CFA, + 0x1D00, + 0x1DFA, + 0x1DFB, + 0x1F16, + 0x1F18, + 0x1F1E, + 0x1F20, + 0x1F46, + 0x1F48, + 0x1F4E, + 0x1F50, + 0x1F58, + 0x1F59, + 0x1F5A, + 0x1F5B, + 0x1F5C, + 0x1F5D, + 0x1F5E, + 0x1F5F, + 0x1F7E, + 0x1F80, + 0x1FB5, + 0x1FB6, + 0x1FC5, + 0x1FC6, + 0x1FD4, + 0x1FD6, + 0x1FDC, + 0x1FDD, + 0x1FF0, + 0x1FF2, + 0x1FF5, + 0x1FF6, + 0x1FFF, + 0x2000, + 0x2065, + 0x2066, + 0x2072, + 0x2074, + 0x208F, + 0x2090, + 0x209D, + 0x20A0, + 0x20C0, + 0x20D0, + 0x20F1, + 0x2100, + 0x218C, + 0x2190, + 0x2427, + 0x2440, + 0x244B, + 0x2460, + 0x2B74, + 0x2B76, + 0x2B96, + 0x2B98, + 0x2BC9, + 0x2BCA, + 0x2BFF, + 0x2C00, + 0x2C2F, + 0x2C30, + 0x2C5F, + 0x2C60, + 0x2CF4, + 0x2CF9, + 0x2D26, + 0x2D27, + 0x2D28, + 0x2D2D, + 0x2D2E, + 0x2D30, + 0x2D68, + 0x2D6F, + 0x2D71, + 0x2D7F, + 0x2D97, + 0x2DA0, + 0x2DA7, + 
0x2DA8, + 0x2DAF, + 0x2DB0, + 0x2DB7, + 0x2DB8, + 0x2DBF, + 0x2DC0, + 0x2DC7, + 0x2DC8, + 0x2DCF, + 0x2DD0, + 0x2DD7, + 0x2DD8, + 0x2DDF, + 0x2DE0, + 0x2E4F, + 0x2E80, + 0x2E9A, + 0x2E9B, + 0x2EF4, + 0x2F00, + 0x2FD6, + 0x2FF0, + 0x2FFC, + 0x3000, + 0x3040, + 0x3041, + 0x3097, + 0x3099, + 0x3100, + 0x3105, + 0x3130, + 0x3131, + 0x318F, + 0x3190, + 0x31BB, + 0x31C0, + 0x31E4, + 0x31F0, + 0x321F, + 0x3220, + 0x32FF, + 0x3300, + 0x4DB6, + 0x4DC0, + 0x9FF0, + 0xA000, + 0xA48D, + 0xA490, + 0xA4C7, + 0xA4D0, + 0xA62C, + 0xA640, + 0xA6F8, + 0xA700, + 0xA7BA, + 0xA7F7, + 0xA82C, + 0xA830, + 0xA83A, + 0xA840, + 0xA878, + 0xA880, + 0xA8C6, + 0xA8CE, + 0xA8DA, + 0xA8E0, + 0xA954, + 0xA95F, + 0xA97D, + 0xA980, + 0xA9CE, + 0xA9CF, + 0xA9DA, + 0xA9DE, + 0xA9FF, + 0xAA00, + 0xAA37, + 0xAA40, + 0xAA4E, + 0xAA50, + 0xAA5A, + 0xAA5C, + 0xAAC3, + 0xAADB, + 0xAAF7, + 0xAB01, + 0xAB07, + 0xAB09, + 0xAB0F, + 0xAB11, + 0xAB17, + 0xAB20, + 0xAB27, + 0xAB28, + 0xAB2F, + 0xAB30, + 0xAB66, + 0xAB70, + 0xABEE, + 0xABF0, + 0xABFA, + 0xAC00, + 0xD7A4, + 0xD7B0, + 0xD7C7, + 0xD7CB, + 0xD7FC, + 0xD800, + 0xFA6E, + 0xFA70, + 0xFADA, + 0xFB00, + 0xFB07, + 0xFB13, + 0xFB18, + 0xFB1D, + 0xFB37, + 0xFB38, + 0xFB3D, + 0xFB3E, + 0xFB3F, + 0xFB40, + 0xFB42, + 0xFB43, + 0xFB45, + 0xFB46, + 0xFBC2, + 0xFBD3, + 0xFD40, + 0xFD50, + 0xFD90, + 0xFD92, + 0xFDC8, + 0xFDD0, + 0xFDFE, + 0xFE00, + 0xFE1A, + 0xFE20, + 0xFE53, + 0xFE54, + 0xFE67, + 0xFE68, + 0xFE6C, + 0xFE70, + 0xFE75, + 0xFE76, + 0xFEFD, + 0xFEFF, + 0xFF00, + 0xFF01, + 0xFFBF, + 0xFFC2, + 0xFFC8, + 0xFFCA, + 0xFFD0, + 0xFFD2, + 0xFFD8, + 0xFFDA, + 0xFFDD, + 0xFFE0, + 0xFFE7, + 0xFFE8, + 0xFFEF, + 0xFFF9, + 0x1000C, + 0x1000D, + 0x10027, + 0x10028, + 0x1003B, + 0x1003C, + 0x1003E, + 0x1003F, + 0x1004E, + 0x10050, + 0x1005E, + 0x10080, + 0x100FB, + 0x10100, + 0x10103, + 0x10107, + 0x10134, + 0x10137, + 0x1018F, + 0x10190, + 0x1019C, + 0x101A0, + 0x101A1, + 0x101D0, + 0x101FE, + 0x10280, + 0x1029D, + 0x102A0, + 0x102D1, + 0x102E0, + 0x102FC, + 0x10300, 
+ 0x10324, + 0x1032D, + 0x1034B, + 0x10350, + 0x1037B, + 0x10380, + 0x1039E, + 0x1039F, + 0x103C4, + 0x103C8, + 0x103D6, + 0x10400, + 0x1049E, + 0x104A0, + 0x104AA, + 0x104B0, + 0x104D4, + 0x104D8, + 0x104FC, + 0x10500, + 0x10528, + 0x10530, + 0x10564, + 0x1056F, + 0x10570, + 0x10600, + 0x10737, + 0x10740, + 0x10756, + 0x10760, + 0x10768, + 0x10800, + 0x10806, + 0x10808, + 0x10809, + 0x1080A, + 0x10836, + 0x10837, + 0x10839, + 0x1083C, + 0x1083D, + 0x1083F, + 0x10856, + 0x10857, + 0x1089F, + 0x108A7, + 0x108B0, + 0x108E0, + 0x108F3, + 0x108F4, + 0x108F6, + 0x108FB, + 0x1091C, + 0x1091F, + 0x1093A, + 0x1093F, + 0x10940, + 0x10980, + 0x109B8, + 0x109BC, + 0x109D0, + 0x109D2, + 0x10A04, + 0x10A05, + 0x10A07, + 0x10A0C, + 0x10A14, + 0x10A15, + 0x10A18, + 0x10A19, + 0x10A36, + 0x10A38, + 0x10A3B, + 0x10A3F, + 0x10A49, + 0x10A50, + 0x10A59, + 0x10A60, + 0x10AA0, + 0x10AC0, + 0x10AE7, + 0x10AEB, + 0x10AF7, + 0x10B00, + 0x10B36, + 0x10B39, + 0x10B56, + 0x10B58, + 0x10B73, + 0x10B78, + 0x10B92, + 0x10B99, + 0x10B9D, + 0x10BA9, + 0x10BB0, + 0x10C00, + 0x10C49, + 0x10C80, + 0x10CB3, + 0x10CC0, + 0x10CF3, + 0x10CFA, + 0x10D28, + 0x10D30, + 0x10D3A, + 0x10E60, + 0x10E7F, + 0x10F00, + 0x10F28, + 0x10F30, + 0x10F5A, + 0x11000, + 0x1104E, + 0x11052, + 0x11070, + 0x1107F, + 0x110C2, + 0x110CD, + 0x110CE, + 0x110D0, + 0x110E9, + 0x110F0, + 0x110FA, + 0x11100, + 0x11135, + 0x11136, + 0x11147, + 0x11150, + 0x11177, + 0x11180, + 0x111CE, + 0x111D0, + 0x111E0, + 0x111E1, + 0x111F5, + 0x11200, + 0x11212, + 0x11213, + 0x1123F, + 0x11280, + 0x11287, + 0x11288, + 0x11289, + 0x1128A, + 0x1128E, + 0x1128F, + 0x1129E, + 0x1129F, + 0x112AA, + 0x112B0, + 0x112EB, + 0x112F0, + 0x112FA, + 0x11300, + 0x11304, + 0x11305, + 0x1130D, + 0x1130F, + 0x11311, + 0x11313, + 0x11329, + 0x1132A, + 0x11331, + 0x11332, + 0x11334, + 0x11335, + 0x1133A, + 0x1133B, 0x11345, 0x11347, 0x11349, @@ -280433,7 +288248,7 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1145B, 0x1145C, 0x1145D, - 
0x1145E, + 0x1145F, 0x11480, 0x114C8, 0x114D0, @@ -280453,11 +288268,13 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x116C0, 0x116CA, 0x11700, - 0x1171A, + 0x1171B, 0x1171D, 0x1172C, 0x11730, 0x11740, + 0x11800, + 0x1183C, 0x118A0, 0x118F3, 0x118FF, @@ -280467,8 +288284,6 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x11A50, 0x11A84, 0x11A86, - 0x11A9D, - 0x11A9E, 0x11AA3, 0x11AC0, 0x11AF9, @@ -280500,6 +288315,20 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x11D48, 0x11D50, 0x11D5A, + 0x11D60, + 0x11D66, + 0x11D67, + 0x11D69, + 0x11D6A, + 0x11D8F, + 0x11D90, + 0x11D92, + 0x11D93, + 0x11D99, + 0x11DA0, + 0x11DAA, + 0x11EE0, + 0x11EF9, 0x12000, 0x1239A, 0x12400, @@ -280534,6 +288363,8 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x16B78, 0x16B7D, 0x16B90, + 0x16E40, + 0x16E9B, 0x16F00, 0x16F45, 0x16F50, @@ -280543,7 +288374,7 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x16FE0, 0x16FE2, 0x17000, - 0x187ED, + 0x187F2, 0x18800, 0x18AF3, 0x1B000, @@ -280568,10 +288399,12 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1D1E9, 0x1D200, 0x1D246, + 0x1D2E0, + 0x1D2F4, 0x1D300, 0x1D357, 0x1D360, - 0x1D372, + 0x1D379, 0x1D400, 0x1D455, 0x1D456, @@ -280638,6 +288471,8 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1E95A, 0x1E95E, 0x1E960, + 0x1EC71, + 0x1ECB5, 0x1EE00, 0x1EE04, 0x1EE05, @@ -280721,8 +288556,6 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1F100, 0x1F10D, 0x1F110, - 0x1F12F, - 0x1F130, 0x1F16C, 0x1F170, 0x1F1AD, @@ -280741,11 +288574,11 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1F6E0, 0x1F6ED, 0x1F6F0, - 0x1F6F9, + 0x1F6FA, 0x1F700, 0x1F774, 0x1F780, - 0x1F7D5, + 0x1F7D9, 0x1F800, 0x1F80C, 0x1F810, @@ -280761,15 +288594,21 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x1F910, 0x1F93F, 0x1F940, - 0x1F94D, - 0x1F950, - 0x1F96C, - 0x1F980, 
- 0x1F998, + 0x1F971, + 0x1F973, + 0x1F977, + 0x1F97A, + 0x1F97B, + 0x1F97C, + 0x1F9A3, + 0x1F9B0, + 0x1F9BA, 0x1F9C0, - 0x1F9C1, + 0x1F9C3, 0x1F9D0, - 0x1F9E7, + 0x1FA00, + 0x1FA60, + 0x1FA6E, 0x1FFFE, 0x2A6D7, 0x2A700, @@ -280816,8 +288655,8 @@ static const UV UNI_IN__10_invlist[] = { /* for all charsets */ 0x110000 }; -static const UV UNI_IN__11_invlist[] = { /* for all charsets */ - 1336, /* Number of elements */ +static const UV UNI_IN__12_invlist[] = { /* for all charsets */ + 1354, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -281039,7 +288878,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0xC64, 0xC66, 0xC70, - 0xC78, + 0xC77, 0xC8D, 0xC8E, 0xC91, @@ -281113,27 +288952,13 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0xE83, 0xE84, 0xE85, - 0xE87, - 0xE89, - 0xE8A, + 0xE86, 0xE8B, - 0xE8D, - 0xE8E, - 0xE94, - 0xE98, - 0xE99, - 0xEA0, - 0xEA1, + 0xE8C, 0xEA4, 0xEA5, 0xEA6, 0xEA7, - 0xEA8, - 0xEAA, - 0xEAC, - 0xEAD, - 0xEBA, - 0xEBB, 0xEBE, 0xEC0, 0xEC5, @@ -281286,7 +289111,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1CBD, 0x1CC8, 0x1CD0, - 0x1CFA, + 0x1CFB, 0x1D00, 0x1DFA, 0x1DFB, @@ -281344,10 +289169,6 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B98, - 0x2BC9, - 0x2BCA, - 0x2BFF, - 0x2C00, 0x2C2F, 0x2C30, 0x2C5F, @@ -281382,7 +289203,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E4F, + 0x2E50, 0x2E80, 0x2E9A, 0x2E9B, @@ -281422,7 +289243,9 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7BA, + 0xA7C0, + 0xA7C2, + 0xA7C7, 0xA7F7, 0xA82C, 0xA830, @@ -281464,7 +289287,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0xAB28, 0xAB2F, 0xAB30, - 0xAB66, + 0xAB68, 0xAB70, 0xABEE, 0xABF0, @@ -281675,6 +289498,8 @@ static const UV 
UNI_IN__11_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10FE0, + 0x10FF7, 0x11000, 0x1104E, 0x11052, @@ -281752,7 +289577,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1145B, 0x1145C, 0x1145D, - 0x1145F, + 0x11460, 0x11480, 0x114C8, 0x114D0, @@ -281768,7 +289593,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B8, + 0x116B9, 0x116C0, 0x116CA, 0x11700, @@ -281783,11 +289608,15 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x118F3, 0x118FF, 0x11900, + 0x119A0, + 0x119A8, + 0x119AA, + 0x119D8, + 0x119DA, + 0x119E5, 0x11A00, 0x11A48, 0x11A50, - 0x11A84, - 0x11A86, 0x11AA3, 0x11AC0, 0x11AF9, @@ -281833,7 +289662,9 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x11DAA, 0x11EE0, 0x11EF9, - 0x12000, + 0x11FC0, + 0x11FF2, + 0x11FFF, 0x1239A, 0x12400, 0x1246F, @@ -281843,6 +289674,8 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x12544, 0x13000, 0x1342F, + 0x13430, + 0x13439, 0x14400, 0x14647, 0x16800, @@ -281870,19 +289703,23 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x16E40, 0x16E9B, 0x16F00, - 0x16F45, - 0x16F50, - 0x16F7F, + 0x16F4B, + 0x16F4F, + 0x16F88, 0x16F8F, 0x16FA0, 0x16FE0, - 0x16FE2, + 0x16FE4, 0x17000, - 0x187F2, + 0x187F8, 0x18800, 0x18AF3, 0x1B000, 0x1B11F, + 0x1B150, + 0x1B153, + 0x1B164, + 0x1B168, 0x1B170, 0x1B2FC, 0x1BC00, @@ -281965,18 +289802,32 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1E025, 0x1E026, 0x1E02B, + 0x1E100, + 0x1E12D, + 0x1E130, + 0x1E13E, + 0x1E140, + 0x1E14A, + 0x1E14E, + 0x1E150, + 0x1E2C0, + 0x1E2FA, + 0x1E2FF, + 0x1E300, 0x1E800, 0x1E8C5, 0x1E8C7, 0x1E8D7, 0x1E900, - 0x1E94B, + 0x1E94C, 0x1E950, 0x1E95A, 0x1E95E, 0x1E960, 0x1EC71, 0x1ECB5, + 0x1ED01, + 0x1ED3E, 0x1EE00, 0x1EE04, 0x1EE05, @@ -282060,7 +289911,7 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1F100, 0x1F10D, 0x1F110, - 0x1F16C, + 
0x1F16D, 0x1F170, 0x1F1AD, 0x1F1E6, @@ -282074,15 +289925,17 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1F260, 0x1F266, 0x1F300, - 0x1F6D5, + 0x1F6D6, 0x1F6E0, 0x1F6ED, 0x1F6F0, - 0x1F6FA, + 0x1F6FB, 0x1F700, 0x1F774, 0x1F780, 0x1F7D9, + 0x1F7E0, + 0x1F7EC, 0x1F800, 0x1F80C, 0x1F810, @@ -282095,24 +289948,28 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x1F8AE, 0x1F900, 0x1F90C, - 0x1F910, - 0x1F93F, - 0x1F940, - 0x1F971, + 0x1F90D, + 0x1F972, 0x1F973, 0x1F977, 0x1F97A, - 0x1F97B, - 0x1F97C, 0x1F9A3, - 0x1F9B0, - 0x1F9BA, - 0x1F9C0, - 0x1F9C3, - 0x1F9D0, - 0x1FA00, + 0x1F9A5, + 0x1F9AB, + 0x1F9AE, + 0x1F9CB, + 0x1F9CD, + 0x1FA54, 0x1FA60, 0x1FA6E, + 0x1FA70, + 0x1FA74, + 0x1FA78, + 0x1FA7B, + 0x1FA80, + 0x1FA83, + 0x1FA90, + 0x1FA96, 0x1FFFE, 0x2A6D7, 0x2A700, @@ -282159,8 +290016,8 @@ static const UV UNI_IN__11_invlist[] = { /* for all charsets */ 0x110000 }; -static const UV UNI_IN__12_invlist[] = { /* for all charsets */ - 1354, /* Number of elements */ +static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ + 1352, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -282733,8 +290590,6 @@ static const UV UNI_IN__12_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x32FF, - 0x3300, 0x4DB6, 0x4DC0, 0x9FF0, @@ -283520,8 +291375,8 @@ static const UV UNI_IN__12_invlist[] = { /* for all charsets */ 0x110000 }; -static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ - 1352, /* Number of elements */ +static const UV UNI_IN__13_invlist[] = { /* for all charsets */ + 1372, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -283572,7 +291427,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x8A0, 0x8B5, 0x8B6, - 0x8BE, + 0x8C8, 0x8D3, 0x984, 0x985, @@ 
-283681,7 +291536,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0xB49, 0xB4B, 0xB4E, - 0xB56, + 0xB55, 0xB58, 0xB5C, 0xB5E, @@ -283770,8 +291625,6 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0xCF1, 0xCF3, 0xD00, - 0xD04, - 0xD05, 0xD0D, 0xD0E, 0xD11, @@ -283785,7 +291638,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0xD64, 0xD66, 0xD80, - 0xD82, + 0xD81, 0xD84, 0xD85, 0xD97, @@ -283958,7 +291811,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1ABF, + 0x1AC1, 0x1B00, 0x1B4C, 0x1B50, @@ -284033,7 +291886,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x2B74, 0x2B76, 0x2B96, - 0x2B98, + 0x2B97, 0x2C2F, 0x2C30, 0x2C5F, @@ -284068,7 +291921,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E50, + 0x2E53, 0x2E80, 0x2E9A, 0x2E9B, @@ -284088,15 +291941,11 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x3131, 0x318F, 0x3190, - 0x31BB, - 0x31C0, 0x31E4, 0x31F0, 0x321F, 0x3220, - 0x4DB6, - 0x4DC0, - 0x9FF0, + 0x9FFD, 0xA000, 0xA48D, 0xA490, @@ -284108,9 +291957,9 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0xA700, 0xA7C0, 0xA7C2, - 0xA7C7, - 0xA7F7, - 0xA82C, + 0xA7CB, + 0xA7F5, + 0xA82D, 0xA830, 0xA83A, 0xA840, @@ -284150,7 +291999,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0xAB28, 0xAB2F, 0xAB30, - 0xAB68, + 0xAB6C, 0xAB70, 0xABEE, 0xABF0, @@ -284238,7 +292087,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x10137, 0x1018F, 0x10190, - 0x1019C, + 0x1019D, 0x101A0, 0x101A1, 0x101D0, @@ -284357,10 +292206,18 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x10D3A, 0x10E60, 0x10E7F, + 0x10E80, + 0x10EAA, + 0x10EAB, + 0x10EAE, + 0x10EB0, + 0x10EB2, 0x10F00, 0x10F28, 0x10F30, 0x10F5A, + 0x10FB0, + 0x10FCC, 0x10FE0, 
0x10FF7, 0x11000, @@ -284378,12 +292235,10 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x11100, 0x11135, 0x11136, - 0x11147, + 0x11148, 0x11150, 0x11177, 0x11180, - 0x111CE, - 0x111D0, 0x111E0, 0x111E1, 0x111F5, @@ -284436,11 +292291,9 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x11370, 0x11375, 0x11400, - 0x1145A, - 0x1145B, 0x1145C, 0x1145D, - 0x11460, + 0x11462, 0x11480, 0x114C8, 0x114D0, @@ -284470,7 +292323,21 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x118A0, 0x118F3, 0x118FF, - 0x11900, + 0x11907, + 0x11909, + 0x1190A, + 0x1190C, + 0x11914, + 0x11915, + 0x11917, + 0x11918, + 0x11936, + 0x11937, + 0x11939, + 0x1193B, + 0x11947, + 0x11950, + 0x1195A, 0x119A0, 0x119A8, 0x119AA, @@ -284525,6 +292392,8 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x11DAA, 0x11EE0, 0x11EF9, + 0x11FB0, + 0x11FB1, 0x11FC0, 0x11FF2, 0x11FFF, @@ -284572,11 +292441,15 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x16F8F, 0x16FA0, 0x16FE0, - 0x16FE4, + 0x16FE5, + 0x16FF0, + 0x16FF2, 0x17000, 0x187F8, 0x18800, - 0x18AF3, + 0x18CD6, + 0x18D00, + 0x18D09, 0x1B000, 0x1B11F, 0x1B150, @@ -284772,11 +292645,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x1F0D1, 0x1F0F6, 0x1F100, - 0x1F10D, - 0x1F110, - 0x1F16D, - 0x1F170, - 0x1F1AD, + 0x1F1AE, 0x1F1E6, 0x1F203, 0x1F210, @@ -284788,11 +292657,11 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x1F260, 0x1F266, 0x1F300, - 0x1F6D6, + 0x1F6D8, 0x1F6E0, 0x1F6ED, 0x1F6F0, - 0x1F6FB, + 0x1F6FD, 0x1F700, 0x1F774, 0x1F780, @@ -284809,32 +292678,38 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x1F888, 0x1F890, 0x1F8AE, + 0x1F8B0, + 0x1F8B2, 0x1F900, - 0x1F90C, - 0x1F90D, - 0x1F972, - 0x1F973, - 0x1F977, + 0x1F979, 0x1F97A, - 0x1F9A3, - 0x1F9A5, - 0x1F9AB, - 0x1F9AE, - 0x1F9CB, + 0x1F9CC, 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 
0x1FA70, - 0x1FA74, + 0x1FA75, 0x1FA78, 0x1FA7B, 0x1FA80, - 0x1FA83, + 0x1FA87, 0x1FA90, - 0x1FA96, + 0x1FAA9, + 0x1FAB0, + 0x1FAB7, + 0x1FAC0, + 0x1FAC3, + 0x1FAD0, + 0x1FAD7, + 0x1FB00, + 0x1FB93, + 0x1FB94, + 0x1FBCB, + 0x1FBF0, + 0x1FBFA, 0x1FFFE, - 0x2A6D7, + 0x2A6DE, 0x2A700, 0x2B735, 0x2B740, @@ -284846,7 +292721,7 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x2F800, 0x2FA1E, 0x2FFFE, - 0x30000, + 0x3134B, 0x3FFFE, 0x40000, 0x4FFFE, @@ -284879,8 +292754,8 @@ static const UV UNI_IN__12_DOT_1_invlist[] = { /* for all charsets */ 0x110000 }; -static const UV UNI_IN__13_invlist[] = { /* for all charsets */ - 1372, /* Number of elements */ +static const UV UNI_IN__14_invlist[] = { /* for all charsets */ + 1412, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -284909,8 +292784,6 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -284928,11 +292801,11 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -285088,7 +292961,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -285098,6 +292971,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -285120,7 +292995,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -285255,10 +293130,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -285275,8 +293148,6 @@ static const UV UNI_IN__13_invlist[] = { /* for 
all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -285315,11 +293186,11 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -285335,8 +293206,6 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -285377,7 +293246,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -285391,10 +293260,6 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -285425,7 +293290,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -285449,8 +293314,6 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -285459,10 +293322,14 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -285533,16 +293400,12 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, - 0xFDD0, - 0xFDFE, - 0xFE00, + 0xFDCF, 0xFE1A, 0xFE20, 0xFE53, @@ -285627,13 +293490,33 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 
0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -285720,6 +293603,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -285727,9 +293612,9 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -285813,7 +293698,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -285821,7 +293706,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -285852,7 +293737,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -285908,6 +293793,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -285921,7 +293808,9 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -285954,8 +293843,14 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -285972,12 +293867,18 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -286032,6 +293933,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -286050,10 +293953,20 @@ static 
const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -286162,7 +294075,7 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -286172,6 +294085,8 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -286185,27 +294100,27 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -286213,9 +294128,9 @@ static const UV UNI_IN__13_invlist[] = { /* for all charsets */ 0x1FBF0, 0x1FBFA, 0x1FFFE, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -302520,7 +310435,7 @@ static const UV UNI_INAHOM_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x11700, - 0x11740 + 0x11750 }; static const UV UNI_INANATOLIANHIEROGLYPHS_invlist[] = { /* for all charsets */ @@ -302743,6 +310658,16 @@ static const UV UNI_INCUNEIFORM_invlist[] = { /* for all charsets */ 0x12400 }; +static const UV UNI_INCYPROMINOAN_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x12F90, + 0x13000 +}; + static const UV UNI_INCYRILLIC_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure 
type */ @@ -303503,6 +311428,16 @@ static const UV UNI_INOLDTURKIC_invlist[] = { /* for all charsets */ 0x10C50 }; +static const UV UNI_INOLDUYGHUR_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10F70, + 0x10FB0 +}; + static const UV UNI_INORIYA_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -303554,7 +311489,7 @@ static const UV UNI_INPAUCINHAU_invlist[] = { /* for all charsets */ }; static const UV UNI_INPC__BOTTOM_invlist[] = { /* for all charsets */ - 287, /* Number of elements */ + 291, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -303605,6 +311540,8 @@ static const UV UNI_INPC__BOTTOM_invlist[] = { /* for all charsets */ 0xB4E, 0xB62, 0xB64, + 0xC3C, + 0xC3D, 0xC56, 0xC57, 0xC62, @@ -303662,7 +311599,7 @@ static const UV UNI_INPC__BOTTOM_invlist[] = { /* for all charsets */ 0x1713, 0x1715, 0x1733, - 0x1735, + 0x1734, 0x1753, 0x1754, 0x1773, @@ -303751,6 +311688,8 @@ static const UV UNI_INPC__BOTTOM_invlist[] = { /* for all charsets */ 0x110B5, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x1112A, 0x1112C, 0x11131, @@ -304012,7 +311951,7 @@ static const UV UNI_INPC__LEFTANDRIGHT_invlist[] = { /* for all charsets */ }; static const UV UNI_INPC__NA_invlist[] = { /* for all charsets */ - 421, /* Number of elements */ + 429, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -304099,6 +312038,8 @@ static const UV UNI_INPC__NA_invlist[] = { /* for all charsets */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -304202,7 +312143,7 @@ static const UV UNI_INPC__NA_invlist[] = { /* for all charsets */ 0x109A, 0x109E, 0x1712, - 
0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -304321,10 +312262,16 @@ static const UV UNI_INPC__NA_invlist[] = { /* for all charsets */ 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x11080, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -304456,7 +312403,7 @@ static const UV UNI_INPC__OVERSTRUCK_invlist[] = { /* for all charsets */ }; static const UV UNI_INPC__RIGHT_invlist[] = { /* for all charsets */ - 329, /* Number of elements */ + 333, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -304569,6 +312516,10 @@ static const UV UNI_INPC__RIGHT_invlist[] = { /* for all charsets */ 0x1090, 0x109A, 0x109D, + 0x1715, + 0x1716, + 0x1734, + 0x1735, 0x17B6, 0x17B7, 0x17C7, @@ -304792,7 +312743,7 @@ static const UV UNI_INPC__RIGHT_invlist[] = { /* for all charsets */ }; static const UV UNI_INPC__TOP_invlist[] = { /* for all charsets */ - 387, /* Number of elements */ + 391, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -305055,6 +313006,10 @@ static const UV UNI_INPC__TOP_invlist[] = { /* for all charsets */ 0x1103C, 0x11042, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x11080, 0x11082, 0x110B5, @@ -305574,7 +313529,7 @@ static const UV UNI_INSC__CANTILLATIONMARK_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ - 307, /* Number of elements */ + 311, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -305714,9 +313669,9 @@ static const UV UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ 0x108E, 0x108F, 0x1703, - 0x170D, - 0x170E, 0x1712, + 0x171F, + 0x1720, 0x1723, 0x1732, 0x1743, @@ -305742,7 +313697,7 @@ static const UV 
UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ 0x1B13, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B8A, 0x1BA1, 0x1BAE, @@ -305811,6 +313766,8 @@ static const UV UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ 0x10A36, 0x11013, 0x11038, + 0x11075, + 0x11076, 0x1108D, 0x110B0, 0x11107, @@ -305861,6 +313818,8 @@ static const UV UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x1180A, 0x1182C, 0x1190C, @@ -305888,13 +313847,17 @@ static const UV UNI_INSC__CONSONANT_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__CONSONANTDEAD_invlist[] = { /* for all charsets */ - 9, /* Number of elements */ + 13, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, 0x9CE, 0x9CF, + 0xC5D, + 0xC5E, + 0xCDD, + 0xCDE, 0xD54, 0xD57, 0xD7A, @@ -305904,7 +313867,7 @@ static const UV UNI_INSC__CONSONANTDEAD_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__CONSONANTFINAL_invlist[] = { /* for all charsets */ - 23, /* Number of elements */ + 29, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -305917,6 +313880,10 @@ static const UV UNI_INSC__CONSONANTFINAL_invlist[] = { /* for all charsets */ 0x19C8, 0x1A58, 0x1A5A, + 0x1B03, + 0x1B04, + 0x1B81, + 0x1B82, 0x1BBE, 0x1BC0, 0x1BF0, @@ -305925,6 +313892,8 @@ static const UV UNI_INSC__CONSONANTFINAL_invlist[] = { /* for all charsets */ 0x1C34, 0xA94F, 0xA953, + 0xA982, + 0xA983, 0xAA40, 0xAA4E, 0xABDB, @@ -306196,19 +314165,13 @@ static const UV UNI_INSC__CONSONANTSUBJOINED_invlist[] = { /* for all charsets }; static const UV UNI_INSC__CONSONANTSUCCEEDINGREPHA_invlist[] = { /* for all charsets */ - 9, /* Number of elements */ + 3, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it 
starts at the element beyond 0 */ 0x0, 0x17CC, - 0x17CD, - 0x1B03, - 0x1B04, - 0x1B81, - 0x1B82, - 0xA982, - 0xA983 + 0x17CD }; static const UV UNI_INSC__CONSONANTWITHSTACKER_invlist[] = { /* for all charsets */ @@ -306294,7 +314257,7 @@ static const UV UNI_INSC__NONJOINER_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__NUKTA_invlist[] = { /* for all charsets */ - 53, /* Number of elements */ + 55, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -306311,6 +314274,8 @@ static const UV UNI_INSC__NUKTA_invlist[] = { /* for all charsets */ 0xB00, 0xB3C, 0xB3D, + 0xC3C, + 0xC3D, 0xCBC, 0xCBD, 0xF39, @@ -306678,7 +314643,7 @@ static const UV UNI_INSC__NUMBERJOINER_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ - 643, /* Number of elements */ + 647, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -306861,7 +314826,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -306871,6 +314836,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -306895,7 +314862,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -307008,10 +314975,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0x1050, 0x109E, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -307056,7 +315021,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0x1A90, 0x1A9A, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -307150,9 +315115,11 @@ static const UV 
UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11047, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11135, 0x11136, @@ -307247,6 +315214,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ 0x1172C, 0x11730, 0x1173C, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x11900, @@ -307335,7 +315304,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ - 643, /* Number of elements */ + 647, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -307518,7 +315487,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -307528,6 +315497,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -307552,7 +315523,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -307665,10 +315636,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0x1050, 0x109E, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -307713,7 +315682,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0x1A90, 0x1A9A, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -307807,9 +315776,11 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11135, 0x11136, @@ -307904,6 +315875,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 0x11730, 0x1173C, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x11900, @@ -307992,7 +315965,7 @@ static const UV 
UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ - 643, /* Number of elements */ + 647, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -308175,7 +316148,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -308185,6 +316158,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -308209,7 +316184,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -308322,10 +316297,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0x1050, 0x109E, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -308370,7 +316343,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0x1A90, 0x1A9A, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B80, @@ -308464,9 +316437,11 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11052, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11135, 0x11136, @@ -308561,6 +316536,8 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173C, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x11900, @@ -308644,7 +316621,7 @@ static const UV UNI_INSC__OTHER_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_INSC__PUREKILLER_invlist[] = { /* for all charsets */ - 43, /* Number of elements */ + 45, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -308662,7 +316639,7 @@ static const UV 
UNI_INSC__PUREKILLER_invlist[] = { /* for all charsets */ 0x103A, 0x103B, 0x1714, - 0x1715, + 0x1716, 0x1734, 0x1735, 0x17D1, @@ -308679,6 +316656,8 @@ static const UV UNI_INSC__PUREKILLER_invlist[] = { /* for all charsets */ 0xA954, 0xABED, 0xABEE, + 0x11070, + 0x11071, 0x11134, 0x11135, 0x112EA, @@ -309074,7 +317053,7 @@ static const UV UNI_INSC__VOWEL_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__VOWELDEPENDENT_invlist[] = { /* for all charsets */ - 265, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -309259,8 +317238,12 @@ static const UV UNI_INSC__VOWELDEPENDENT_invlist[] = { /* for all charsets */ 0x10A0E, 0x11038, 0x11046, + 0x11073, + 0x11075, 0x110B0, 0x110B9, + 0x110C2, + 0x110C3, 0x11127, 0x11133, 0x11145, @@ -309346,7 +317329,7 @@ static const UV UNI_INSC__VOWELDEPENDENT_invlist[] = { /* for all charsets */ }; static const UV UNI_INSC__VOWELINDEPENDENT_invlist[] = { /* for all charsets */ - 175, /* Number of elements */ + 177, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -309463,6 +317446,8 @@ static const UV UNI_INSC__VOWELINDEPENDENT_invlist[] = { /* for all charsets */ 0xABD2, 0x11005, 0x11013, + 0x11071, + 0x11073, 0x11083, 0x1108D, 0x11103, @@ -309677,6 +317662,16 @@ static const UV UNI_INTAMIL_invlist[] = { /* for all charsets */ 0xC00 }; +static const UV UNI_INTANGSA_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x16A70, + 0x16AD0 +}; + static const UV UNI_INTANGUT_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -309747,6 +317742,16 @@ static const UV 
UNI_INTIRHUTA_invlist[] = { /* for all charsets */ 0x114E0 }; +static const UV UNI_INTOTO_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1E290, + 0x1E2C0 +}; + static const UV UNI_INUGARITIC_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -309767,6 +317772,16 @@ static const UV UNI_INVAI_invlist[] = { /* for all charsets */ 0xA640 }; +static const UV UNI_INVITHKUQI_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10570, + 0x105C0 +}; + static const UV UNI_INVS_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -309946,7 +317961,7 @@ static const UV UNI_JG__ALAPH_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__ALEF_invlist[] = { /* for all charsets */ - 13, /* Number of elements */ + 15, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -309962,7 +317977,9 @@ static const UV UNI_JG__ALEF_invlist[] = { /* for all charsets */ 0x675, 0x676, 0x773, - 0x775 + 0x775, + 0x870, + 0x883 }; static const UV UNI_JG__BEH_invlist[] = { /* for all charsets */ @@ -310106,7 +318123,7 @@ static const UV UNI_JG__FINALSEMKATH_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__GAF_invlist[] = { /* for all charsets */ - 15, /* Number of elements */ + 19, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -310121,10 +318138,14 @@ static const UV UNI_JG__GAF_invlist[] = { /* for all charsets */ 0x6B5, 0x762, 0x765, 
+ 0x88D, + 0x88E, 0x8B0, 0x8B1, 0x8C2, - 0x8C3 + 0x8C3, + 0x8C8, + 0x8C9 }; static const UV UNI_JG__GAMAL_invlist[] = { /* for all charsets */ @@ -310140,7 +318161,7 @@ static const UV UNI_JG__GAMAL_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__HAH_invlist[] = { /* for all charsets */ - 21, /* Number of elements */ + 23, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -310159,6 +318180,8 @@ static const UV UNI_JG__HAH_invlist[] = { /* for all charsets */ 0x773, 0x77C, 0x77D, + 0x88A, + 0x88B, 0x8A2, 0x8A3, 0x8C1, @@ -310728,7 +318751,7 @@ static const UV UNI_JG__MIM_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__NOJOININGGROUP_invlist[] = { /* for all charsets */ - 61, /* Number of elements */ + 65, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -310761,12 +318784,16 @@ static const UV UNI_JG__NOJOININGGROUP_invlist[] = { /* for all charsets */ 0x780, 0x860, 0x86B, + 0x870, + 0x883, + 0x886, + 0x887, + 0x889, + 0x88F, 0x8A0, 0x8AD, 0x8AE, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8C9, 0x10AC0, 0x10AC6, 0x10AC7, @@ -310796,7 +318823,7 @@ static const UV UNI_JG__NOJOININGGROUP_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__NOON_invlist[] = { /* for all charsets */ - 7, /* Number of elements */ + 9, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -310806,7 +318833,9 @@ static const UV UNI_JG__NOON_invlist[] = { /* for all charsets */ 0x6B9, 0x6BD, 0x767, - 0x76A + 0x76A, + 0x889, + 0x88A }; static const UV UNI_JG__NUN_invlist[] = { /* for all charsets */ @@ -310840,7 +318869,7 @@ static const UV UNI_JG__PE_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__QAF_invlist[] = { /* for all charsets */ - 9, /* 
Number of elements */ + 11, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -310852,7 +318881,9 @@ static const UV UNI_JG__QAF_invlist[] = { /* for all charsets */ 0x6A7, 0x6A9, 0x8A5, - 0x8A6 + 0x8A6, + 0x8B5, + 0x8B6 }; static const UV UNI_JG__QAPH_invlist[] = { /* for all charsets */ @@ -311010,7 +319041,7 @@ static const UV UNI_JG__SYRIACWAW_invlist[] = { /* for all charsets */ }; static const UV UNI_JG__TAH_invlist[] = { /* for all charsets */ - 7, /* Number of elements */ + 9, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -311019,6 +319050,8 @@ static const UV UNI_JG__TAH_invlist[] = { /* for all charsets */ 0x639, 0x69F, 0x6A0, + 0x88B, + 0x88D, 0x8A3, 0x8A4 }; @@ -311057,6 +319090,26 @@ static const UV UNI_JG__TETH_invlist[] = { /* for all charsets */ 0x71D }; +static const UV UNI_JG__THINYEH_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x886, + 0x887 +}; + +static const UV UNI_JG__VERTICALTAIL_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x88E, + 0x88F +}; + static const UV UNI_JG__WAW_invlist[] = { /* for all charsets */ 15, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -311174,7 +319227,7 @@ static const UV UNI_JOINC_invlist[] = { /* for all charsets */ }; static const UV UNI_JT__C_invlist[] = { /* for all charsets */ - 9, /* Number of elements */ + 11, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ 
-311183,6 +319236,8 @@ static const UV UNI_JT__C_invlist[] = { /* for all charsets */ 0x641, 0x7FA, 0x7FB, + 0x883, + 0x886, 0x180A, 0x180B, 0x200D, @@ -311190,7 +319245,7 @@ static const UV UNI_JT__C_invlist[] = { /* for all charsets */ }; static const UV UNI_JT__D_invlist[] = { /* for all charsets */ - 145, /* Number of elements */ + 151, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -311267,16 +319322,18 @@ static const UV UNI_JT__D_invlist[] = { /* for all charsets */ 0x866, 0x868, 0x869, + 0x886, + 0x887, + 0x889, + 0x88E, 0x8A0, 0x8AA, 0x8AF, 0x8B1, 0x8B3, - 0x8B5, - 0x8B6, 0x8B9, 0x8BA, - 0x8C8, + 0x8C9, 0x1807, 0x1808, 0x1820, @@ -311321,6 +319378,10 @@ static const UV UNI_JT__D_invlist[] = { /* for all charsets */ 0x10F45, 0x10F51, 0x10F54, + 0x10F70, + 0x10F74, + 0x10F76, + 0x10F82, 0x10FB0, 0x10FB1, 0x10FB2, @@ -311360,7 +319421,7 @@ static const UV UNI_JT__L_invlist[] = { /* for all charsets */ }; static const UV UNI_JT__R_invlist[] = { /* for all charsets */ - 125, /* Number of elements */ + 131, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -311435,6 +319496,10 @@ static const UV UNI_JT__R_invlist[] = { /* for all charsets */ 0x868, 0x869, 0x86B, + 0x870, + 0x883, + 0x88E, + 0x88F, 0x8AA, 0x8AD, 0x8AE, @@ -311479,6 +319544,8 @@ static const UV UNI_JT__R_invlist[] = { /* for all charsets */ 0x10F34, 0x10F54, 0x10F55, + 0x10F74, + 0x10F76, 0x10FB4, 0x10FB7, 0x10FB9, @@ -311494,7 +319561,7 @@ static const UV UNI_JT__R_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ - 677, /* Number of elements */ + 695, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -311553,7 
+319620,9 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -311635,6 +319704,8 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -311734,7 +319805,7 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -311751,6 +319822,8 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -311782,7 +319855,7 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -311828,8 +319901,6 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -311957,16 +320028,24 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -312129,6 +320208,10 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -312163,6 +320246,8 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -312185,7 +320270,7 @@ static const UV UNI_JT__T_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ - 677, /* Number of elements */ + 695, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 
*/ @@ -312244,7 +320329,9 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -312326,6 +320413,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -312425,7 +320514,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -312442,6 +320531,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -312473,7 +320564,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -312519,8 +320610,6 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -312648,16 +320737,24 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -312820,6 +320917,10 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -312854,6 +320955,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -312876,7 +320979,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ - 677, /* Number of elements */ + 695, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element 
beyond 0 */ @@ -312935,7 +321038,9 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -313017,6 +321122,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -313116,7 +321223,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -313133,6 +321240,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -313164,7 +321273,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -313210,8 +321319,6 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -313339,16 +321446,24 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -313511,6 +321626,10 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -313545,6 +321664,8 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -313564,7 +321685,7 @@ static const UV UNI_JT__T_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ - 727, /* Number of elements */ + 745, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -313637,13 
+321758,15 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x866, 0x867, 0x86B, - 0x8A0, + 0x870, + 0x887, + 0x889, + 0x88F, + 0x898, 0x8AD, 0x8AE, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8C9, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -313725,6 +321848,8 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -313824,7 +321949,7 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -313843,6 +321968,8 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1808, 0x180A, 0x180E, + 0x180F, + 0x1810, 0x1820, 0x1879, 0x1885, @@ -313874,7 +322001,7 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -313920,8 +322047,6 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -314067,6 +322192,8 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x10F45, 0x10F46, 0x10F55, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FB1, 0x10FB2, @@ -314081,12 +322208,18 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -314249,6 +322382,10 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -314283,6 +322420,8 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -314305,7 +322444,7 @@ static const UV UNI_JT__U_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 
1047 */ - 727, /* Number of elements */ + 745, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -314378,13 +322517,15 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x866, 0x867, 0x86B, - 0x8A0, + 0x870, + 0x887, + 0x889, + 0x88F, + 0x898, 0x8AD, 0x8AE, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8C9, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -314466,6 +322607,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -314565,7 +322708,7 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -314584,6 +322727,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1808, 0x180A, 0x180E, + 0x180F, + 0x1810, 0x1820, 0x1879, 0x1885, @@ -314615,7 +322760,7 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -314661,8 +322806,6 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -314808,6 +322951,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x10F45, 0x10F46, 0x10F55, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FB1, 0x10FB2, @@ -314822,12 +322967,18 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -314990,6 +323141,10 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -315024,6 +323179,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 
0x1E8D0, @@ -315046,7 +323203,7 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ - 727, /* Number of elements */ + 745, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -315119,13 +323276,15 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x866, 0x867, 0x86B, - 0x8A0, + 0x870, + 0x887, + 0x889, + 0x88F, + 0x898, 0x8AD, 0x8AE, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x8C9, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -315207,6 +323366,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -315306,7 +323467,7 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -315325,6 +323486,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1808, 0x180A, 0x180E, + 0x180F, + 0x1810, 0x1820, 0x1879, 0x1885, @@ -315356,7 +323519,7 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -315402,8 +323565,6 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200B, 0x200C, @@ -315549,6 +323710,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x10F45, 0x10F46, 0x10F55, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FB1, 0x10FB2, @@ -315563,12 +323726,18 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -315731,6 +323900,10 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 
0x1CF47, 0x1D167, 0x1D16A, 0x1D173, @@ -315765,6 +323938,8 @@ static const UV UNI_JT__U_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -315792,7 +323967,7 @@ static const UV UNI_KALI_invlist[] = { /* for all charsets */ }; static const UV UNI_KANA_invlist[] = { /* for all charsets */ - 31, /* Number of elements */ + 39, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -315823,8 +323998,16 @@ static const UV UNI_KANA_invlist[] = { /* for all charsets */ 0xFE47, 0xFF61, 0xFFA0, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168 }; @@ -315839,6 +324022,16 @@ static const UV UNI_KANAEXTA_invlist[] = { /* for all charsets */ 0x1B130 }; +static const UV UNI_KANAEXTB_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1AFF0, + 0x1B000 +}; + static const UV UNI_KANASUP_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -315985,7 +324178,7 @@ static const UV UNI_KNDA_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -316018,7 +324211,7 @@ static const UV UNI_KTHI_invlist[] = { /* for all charsets */ 0xA830, 0xA83A, 0x11080, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE }; @@ -316026,7 +324219,7 @@ static const UV UNI_KTHI_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ - 1245, /* Number of elements */ + 1297, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -316129,10 +324322,12 @@ static const 
UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -316261,6 +324456,8 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -316277,7 +324474,7 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -316420,10 +324617,8 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -316466,7 +324661,7 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -316568,10 +324763,6 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -316632,8 +324823,6 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -316654,10 +324843,14 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -316833,12 +325026,34 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -316909,12 +325124,18 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, 
+ 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -316997,6 +325218,8 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -317035,7 +325258,7 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -317069,6 +325292,8 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -317077,6 +325302,8 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -317105,8 +325332,14 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -317181,14 +325414,26 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -317262,9 +325507,9 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -317285,7 +325530,7 @@ static const UV UNI_L_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ - 1271, /* Number of elements */ + 1323, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -317414,10 +325659,12 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, 
+ 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -317546,6 +325793,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -317562,7 +325811,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -317705,10 +325954,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -317751,7 +325998,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -317853,10 +326100,6 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -317917,8 +326160,6 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -317939,10 +326180,14 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -318118,12 +326363,34 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -318194,12 +326461,18 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -318282,6 +326555,8 @@ static const UV 
UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -318320,7 +326595,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -318354,6 +326629,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -318362,6 +326639,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -318390,8 +326669,14 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -318466,14 +326751,26 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -318547,9 +326844,9 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -318570,7 +326867,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ - 1267, /* Number of elements */ + 1319, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -318695,10 +326992,12 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -318827,6 +327126,8 @@ static const 
UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -318843,7 +327144,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -318986,10 +327287,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -319032,7 +327331,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -319134,10 +327433,6 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x2183, 0x2185, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -319198,8 +327493,6 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -319220,10 +327513,14 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -319399,12 +327696,34 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -319475,12 +327794,18 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -319563,6 +327888,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ 
-319601,7 +327928,7 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -319635,6 +327962,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -319643,6 +327972,8 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -319671,8 +328002,14 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -319747,14 +328084,26 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -319828,9 +328177,9 @@ static const UV UNI_L_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -320107,10 +328456,30 @@ static const UV UNI_LATINEXTE_invlist[] = { /* for all charsets */ 0xAB70 }; +static const UV UNI_LATINEXTF_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10780, + 0x107C0 +}; + +static const UV UNI_LATINEXTG_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1DF00, + 0x1E000 +}; + # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LATN_invlist[] = { /* for ASCII/Latin1 */ - 81, /* Number of elements */ + 
93, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -320176,10 +328545,14 @@ static const UV UNI_LATN_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA92E, 0xA92F, @@ -320194,7 +328567,15 @@ static const UV UNI_LATN_invlist[] = { /* for ASCII/Latin1 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* ASCII/Latin1 */ @@ -320205,7 +328586,7 @@ static const UV UNI_LATN_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LATN_invlist[] = { /* for EBCDIC 1047 */ - 107, /* Number of elements */ + 119, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -320297,10 +328678,14 @@ static const UV UNI_LATN_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA92E, 0xA92F, @@ -320315,7 +328700,15 @@ static const UV UNI_LATN_invlist[] = { /* for EBCDIC 1047 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* EBCDIC 1047 */ @@ -320326,7 +328719,7 @@ static const UV UNI_LATN_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LATN_invlist[] = { /* for EBCDIC 037 */ - 103, /* Number of elements */ + 115, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -320414,10 +328807,14 @@ static const UV UNI_LATN_invlist[] = { /* for 
EBCDIC 037 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xA92E, 0xA92F, @@ -320432,7 +328829,15 @@ static const UV UNI_LATN_invlist[] = { /* for EBCDIC 037 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* EBCDIC 037 */ @@ -321148,7 +329553,7 @@ static const UV UNI_LB__AI_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ - 1541, /* Number of elements */ + 1597, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -321273,10 +329678,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, + 0x890, + 0x892, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -321419,6 +329826,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC78, @@ -321435,7 +329844,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -321564,10 +329973,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -321606,7 +330013,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B5C, 0x1B5D, 0x1B61, @@ -321904,10 +330311,6 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -321982,10 +330385,14 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0xA6F2, 0xA6F3, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 
0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -322056,17 +330463,19 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0xFB29, 0xFB2A, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, - 0xFD50, + 0xFD40, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDFC, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE70, 0xFE75, 0xFE76, @@ -322128,13 +330537,33 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -322215,6 +330644,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -322225,6 +330658,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1104E, 0x11052, 0x11066, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110BB, @@ -322324,7 +330761,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x11680, 0x116AB, 0x116B8, - 0x116B9, + 0x116BA, 0x11800, 0x1182C, 0x1183B, @@ -322371,7 +330808,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -322415,6 +330852,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x13258, 0x1325E, @@ -322433,6 +330872,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -322459,6 +330900,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x16FA0, 0x18B00, 0x18CD6, + 0x1AFF0, + 0x1AFF4, + 
0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC00, 0x1BC6B, 0x1BC70, @@ -322469,6 +330916,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -322482,7 +330931,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -322545,14 +330994,26 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ 0x1DA87, 0x1DA8B, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -322703,7 +331164,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ - 1569, /* Number of elements */ + 1625, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -322856,10 +331317,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, + 0x890, + 0x892, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -323002,6 +331465,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC78, @@ -323018,7 +331483,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -323147,10 +331612,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -323189,7 +331652,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B5C, 0x1B5D, 
0x1B61, @@ -323487,10 +331950,6 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -323565,10 +332024,14 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0xA6F2, 0xA6F3, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -323639,17 +332102,19 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0xFB29, 0xFB2A, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, - 0xFD50, + 0xFD40, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDFC, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE70, 0xFE75, 0xFE76, @@ -323711,13 +332176,33 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -323798,6 +332283,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -323808,6 +332297,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1104E, 0x11052, 0x11066, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110BB, @@ -323907,7 +332400,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x11680, 0x116AB, 0x116B8, - 0x116B9, + 0x116BA, 0x11800, 0x1182C, 0x1183B, @@ -323954,7 +332447,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -323998,6 +332491,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 
0x12FF3, 0x13000, 0x13258, 0x1325E, @@ -324016,6 +332511,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -324042,6 +332539,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x16FA0, 0x18B00, 0x18CD6, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC00, 0x1BC6B, 0x1BC70, @@ -324052,6 +332555,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -324065,7 +332570,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -324128,14 +332633,26 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ 0x1DA87, 0x1DA8B, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -324286,7 +332803,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ - 1565, /* Number of elements */ + 1621, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -324435,10 +332952,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x85F, 0x860, 0x86B, + 0x870, + 0x88F, + 0x890, + 0x892, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -324581,6 +333100,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC78, @@ -324597,7 +333118,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ 
-324726,10 +333247,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -324768,7 +333287,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B5C, 0x1B5D, 0x1B61, @@ -325066,10 +333585,6 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CEF, 0x2CF2, 0x2CF4, @@ -325144,10 +333659,14 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0xA6F2, 0xA6F3, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -325218,17 +333737,19 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0xFB29, 0xFB2A, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, - 0xFD50, + 0xFD40, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, 0xFDFC, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFE70, 0xFE75, 0xFE76, @@ -325290,13 +333811,33 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -325377,6 +333918,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x10F46, 0x10F51, 0x10F5A, + 0x10F70, + 0x10F82, + 0x10F86, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -325387,6 +333932,10 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1104E, 0x11052, 0x11066, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110BB, @@ -325486,7 +334035,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x11680, 0x116AB, 0x116B8, - 0x116B9, + 0x116BA, 
0x11800, 0x1182C, 0x1183B, @@ -325533,7 +334082,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -325577,6 +334126,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x13258, 0x1325E, @@ -325595,6 +334146,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -325621,6 +334174,12 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x16FA0, 0x18B00, 0x18CD6, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1BC00, 0x1BC6B, 0x1BC70, @@ -325631,6 +334190,8 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -325644,7 +334205,7 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -325707,14 +334268,26 @@ static const UV UNI_LB__AL_invlist[] = { /* for EBCDIC 037 */ 0x1DA87, 0x1DA8B, 0x1DA8C, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -325874,7 +334447,7 @@ static const UV UNI_LB__B2_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__BA_invlist[] = { /* for ASCII/Latin1 */ - 197, /* Number of elements */ + 201, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -325929,6 +334502,8 @@ static const UV UNI_LB__BA_invlist[] = { /* for ASCII/Latin1 */ 0x1B5C, 0x1B5D, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -325977,6 +334552,8 @@ static const UV 
UNI_LB__BA_invlist[] = { /* for ASCII/Latin1 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E5D, + 0x2E5E, 0x3000, 0x3001, 0xA4FE, @@ -326085,7 +334662,7 @@ static const UV UNI_LB__BA_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 1047 */ - 197, /* Number of elements */ + 201, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -326140,6 +334717,8 @@ static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 1047 */ 0x1B5C, 0x1B5D, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -326188,6 +334767,8 @@ static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 1047 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E5D, + 0x2E5E, 0x3000, 0x3001, 0xA4FE, @@ -326296,7 +334877,7 @@ static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 037 */ - 197, /* Number of elements */ + 201, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -326351,6 +334932,8 @@ static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 037 */ 0x1B5C, 0x1B5D, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -326399,6 +334982,8 @@ static const UV UNI_LB__BA_invlist[] = { /* for EBCDIC 037 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E5D, + 0x2E5E, 0x3000, 0x3001, 0xA4FE, @@ -326816,7 +335401,7 @@ static const UV UNI_LB__CJ_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__CL_invlist[] = { /* for ASCII/Latin1 */ - 167, /* Number of elements */ + 175, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -326903,6 +335488,14 @@ static const UV UNI_LB__CL_invlist[] = { /* for ASCII/Latin1 */ 
0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3001, 0x3003, 0x3009, @@ -326997,7 +335590,7 @@ static const UV UNI_LB__CL_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 1047 */ - 167, /* Number of elements */ + 175, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -327084,6 +335677,14 @@ static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 1047 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3001, 0x3003, 0x3009, @@ -327178,7 +335779,7 @@ static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 037 */ - 167, /* Number of elements */ + 175, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -327265,6 +335866,14 @@ static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 037 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3001, 0x3003, 0x3009, @@ -327356,7 +335965,7 @@ static const UV UNI_LB__CL_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ - 556, /* Number of elements */ + 574, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -327422,7 +336031,9 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -327506,6 +336117,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0xBD8, 0xC00, 
0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -327581,7 +336194,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -327590,6 +336203,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x1774, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -327603,7 +336218,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -327629,8 +336244,6 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -327734,14 +336347,22 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -327870,6 +336491,10 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -327904,6 +336529,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -327926,7 +336553,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ - 560, /* Number of elements */ + 578, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -327996,7 +336623,9 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -328080,6 +336709,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0xBD8, 
0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -328155,7 +336786,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -328164,6 +336795,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x1774, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -328177,7 +336810,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -328203,8 +336836,6 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -328308,14 +336939,22 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -328444,6 +337083,10 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -328478,6 +337121,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -328500,7 +337145,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ - 560, /* Number of elements */ + 578, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -328570,7 +337215,9 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -328654,6 +337301,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0xBD8, 
0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -328729,7 +337378,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -328738,6 +337387,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x1774, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -328751,7 +337402,7 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -328777,8 +337428,6 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -328882,14 +337531,22 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -329018,6 +337675,10 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -329052,6 +337713,8 @@ static const UV UNI_LB__CM_invlist[] = { /* for EBCDIC 037 */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -329173,7 +337836,7 @@ static const UV UNI_LB__CR_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__EX_invlist[] = { /* for ASCII/Latin1 */ - 49, /* Number of elements */ + 51, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -329186,7 +337849,7 @@ static const UV UNI_LB__EX_invlist[] = { /* for ASCII/Latin1 */ 0x5C7, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -329210,6 +337873,8 @@ static const UV UNI_LB__EX_invlist[] = { /* for ASCII/Latin1 */ 0x2CFF, 0x2E2E, 0x2E2F, + 0x2E53, + 0x2E55, 0xA60E, 
0xA60F, 0xA876, @@ -329236,7 +337901,7 @@ static const UV UNI_LB__EX_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 1047 */ - 49, /* Number of elements */ + 51, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -329249,7 +337914,7 @@ static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 1047 */ 0x5C7, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -329273,6 +337938,8 @@ static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 1047 */ 0x2CFF, 0x2E2E, 0x2E2F, + 0x2E53, + 0x2E55, 0xA60E, 0xA60F, 0xA876, @@ -329299,7 +337966,7 @@ static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 037 */ - 49, /* Number of elements */ + 51, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -329312,7 +337979,7 @@ static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 037 */ 0x5C7, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -329336,6 +338003,8 @@ static const UV UNI_LB__EX_invlist[] = { /* for EBCDIC 037 */ 0x2CFF, 0x2E2E, 0x2E2F, + 0x2E53, + 0x2E55, 0xA60E, 0xA60F, 0xA876, @@ -331165,7 +339834,7 @@ static const UV UNI_LB__HY_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_LB__ID_invlist[] = { /* for all charsets */ - 331, /* Number of elements */ + 335, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -331367,7 +340036,7 @@ static const UV UNI_LB__ID_invlist[] = { /* for all charsets */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B170, 0x1B2FC, 0x1F000, @@ -331493,6 +340162,10 @@ static const UV 
UNI_LB__ID_invlist[] = { /* for all charsets */ 0x1F9DE, 0x1FA00, 0x1FA54, + 0x1FAC3, + 0x1FAC6, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FC00, 0x1FFFE, @@ -331765,7 +340438,7 @@ static const UV UNI_LB__NS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__NU_invlist[] = { /* for ASCII/Latin1 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -331880,6 +340553,8 @@ static const UV UNI_LB__NU_invlist[] = { /* for ASCII/Latin1 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -331902,7 +340577,7 @@ static const UV UNI_LB__NU_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 1047 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332017,6 +340692,8 @@ static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 1047 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -332039,7 +340716,7 @@ static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 037 */ - 123, /* Number of elements */ + 125, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332154,6 +340831,8 @@ static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 037 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -332173,7 +340852,7 @@ static const UV UNI_LB__NU_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__OP_invlist[] = { /* for ASCII/Latin1 */ - 171, 
/* Number of elements */ + 179, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332276,6 +340955,14 @@ static const UV UNI_LB__OP_invlist[] = { /* for ASCII/Latin1 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -332358,7 +341045,7 @@ static const UV UNI_LB__OP_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 1047 */ - 169, /* Number of elements */ + 177, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332459,6 +341146,14 @@ static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 1047 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -332541,7 +341236,7 @@ static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 037 */ - 169, /* Number of elements */ + 177, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332642,6 +341337,14 @@ static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 037 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -332721,7 +341424,7 @@ static const UV UNI_LB__OP_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__PO_invlist[] = { /* for ASCII/Latin1 */ - 47, /* Number of elements */ + 49, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ 
-332752,6 +341455,8 @@ static const UV UNI_LB__PO_invlist[] = { /* for ASCII/Latin1 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x2103, 0x2104, 0x2109, @@ -332782,7 +341487,7 @@ static const UV UNI_LB__PO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 1047 */ - 47, /* Number of elements */ + 49, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332813,6 +341518,8 @@ static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 1047 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x2103, 0x2104, 0x2109, @@ -332843,7 +341550,7 @@ static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 037 */ - 47, /* Number of elements */ + 49, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332874,6 +341581,8 @@ static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 037 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x2103, 0x2104, 0x2109, @@ -332901,7 +341610,7 @@ static const UV UNI_LB__PO_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LB__PR_invlist[] = { /* for ASCII/Latin1 */ - 49, /* Number of elements */ + 51, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -332939,6 +341648,8 @@ static const UV UNI_LB__PR_invlist[] = { /* for ASCII/Latin1 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x2116, 0x2117, @@ -332964,7 +341675,7 @@ static const UV UNI_LB__PR_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LB__PR_invlist[] = { /* for EBCDIC 1047 */ - 51, 
/* Number of elements */ + 53, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -333004,6 +341715,8 @@ static const UV UNI_LB__PR_invlist[] = { /* for EBCDIC 1047 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x2116, 0x2117, @@ -333029,7 +341742,7 @@ static const UV UNI_LB__PR_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LB__PR_invlist[] = { /* for EBCDIC 037 */ - 51, /* Number of elements */ + 53, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -333069,6 +341782,8 @@ static const UV UNI_LB__PR_invlist[] = { /* for EBCDIC 037 */ 0x20BC, 0x20BE, 0x20BF, + 0x20C0, + 0x20C1, 0x20D0, 0x2116, 0x2117, @@ -333279,7 +341994,7 @@ static const UV UNI_LB__SA_invlist[] = { /* for all charsets */ 0x1173A, 0x1173C, 0x1173F, - 0x11740 + 0x11747 }; static const UV UNI_LB__SG_invlist[] = { /* for all charsets */ @@ -333401,7 +342116,7 @@ static const UV UNI_LB__WJ_invlist[] = { /* for all charsets */ }; static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ - 1266, /* Number of elements */ + 1308, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -333430,8 +342145,6 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -333449,11 +342162,11 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -333609,7 +342322,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -333619,6 +342332,8 @@ static const 
UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -333641,7 +342356,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -333776,10 +342491,8 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -333796,8 +342509,6 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -333836,11 +342547,11 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1BFC, @@ -333856,8 +342567,6 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -333910,10 +342619,6 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -333944,7 +342649,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -333976,10 +342681,14 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -334048,16 +342757,14 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -334144,13 +342851,33 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, 
+ 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -334237,6 +342964,8 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -334244,9 +342973,9 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -334330,7 +343059,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -334338,7 +343067,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -334369,7 +343098,7 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -334425,6 +343154,8 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -334438,7 +343169,9 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -334471,8 +343204,14 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -334489,12 +343228,18 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 
0x1D246, 0x1D2E0, @@ -334549,6 +343294,8 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -334567,10 +343314,20 @@ static const UV UNI_LB__XX_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -334824,7 +343581,7 @@ static const UV UNI_LISUSUP_invlist[] = { /* for all charsets */ }; static const UV UNI_LM_invlist[] = { /* for all charsets */ - 123, /* Number of elements */ + 139, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -334859,6 +343616,8 @@ static const UV UNI_LM_invlist[] = { /* for all charsets */ 0x825, 0x828, 0x829, + 0x8C9, + 0x8CA, 0x971, 0x972, 0xE46, @@ -334919,6 +343678,8 @@ static const UV UNI_LM_invlist[] = { /* for all charsets */ 0xA771, 0xA788, 0xA789, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xA9CF, @@ -334939,6 +343700,12 @@ static const UV UNI_LM_invlist[] = { /* for all charsets */ 0xFF71, 0xFF9E, 0xFFA0, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x16B40, 0x16B44, 0x16F93, @@ -334947,6 +343714,12 @@ static const UV UNI_LM_invlist[] = { /* for all charsets */ 0x16FE2, 0x16FE3, 0x16FE4, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1E137, 0x1E13E, 0x1E94B, @@ -334956,7 +343729,7 @@ static const UV UNI_LM_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ - 979, /* Number of elements */ + 1003, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -335007,10 +343780,12 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 
0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8C9, 0x904, 0x93A, 0x93D, @@ -335139,6 +343914,8 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -335155,7 +343932,7 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -335284,10 +344061,8 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -335328,7 +344103,7 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -335394,8 +344169,6 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA015, 0xA016, 0xA48D, @@ -335651,12 +344424,18 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -335739,6 +344518,8 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118FF, @@ -335775,7 +344556,7 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -335809,6 +344590,8 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -335817,6 +344600,8 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -335836,7 +344621,7 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -335851,12 +344636,24 @@ static 
const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x1BC89, 0x1BC90, 0x1BC9A, + 0x1DF0A, + 0x1DF0B, 0x1E100, 0x1E12D, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1EE00, @@ -335926,9 +344723,9 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -335949,7 +344746,7 @@ static const UV UNI_LO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ - 977, /* Number of elements */ + 1001, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -335998,10 +344795,12 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8C9, 0x904, 0x93A, 0x93D, @@ -336130,6 +344929,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -336146,7 +344947,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -336275,10 +345076,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -336319,7 +345118,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -336385,8 +345184,6 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA015, 0xA016, 0xA48D, @@ -336642,12 +345439,18 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 
0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -336730,6 +345533,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118FF, @@ -336766,7 +345571,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -336800,6 +345605,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -336808,6 +345615,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -336827,7 +345636,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -336842,12 +345651,24 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x1BC89, 0x1BC90, 0x1BC9A, + 0x1DF0A, + 0x1DF0B, 0x1E100, 0x1E12D, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1EE00, @@ -336917,9 +345738,9 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -336940,7 +345761,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ - 977, /* Number of elements */ + 1001, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -336989,10 +345810,12 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 
0x8B6, - 0x8C8, + 0x8C9, 0x904, 0x93A, 0x93D, @@ -337121,6 +345944,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -337137,7 +345962,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -337266,10 +346091,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x16F1, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -337310,7 +346133,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -337376,8 +346199,6 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA015, 0xA016, 0xA48D, @@ -337633,12 +346454,18 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -337721,6 +346548,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118FF, @@ -337757,7 +346586,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -337791,6 +346620,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x1239A, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -337799,6 +346630,8 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -337818,7 +346651,7 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x18D00, 0x18D09, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -337833,12 +346666,24 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x1BC89, 0x1BC90, 0x1BC9A, + 
0x1DF0A, + 0x1DF0B, 0x1E100, 0x1E12D, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1EE00, @@ -337908,9 +346753,9 @@ static const UV UNI_LO_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -337980,7 +346825,7 @@ static const UV UNI_LYDI_invlist[] = { /* for all charsets */ }; static const UV UNI_M_invlist[] = { /* for all charsets */ - 581, /* Number of elements */ + 599, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -338033,7 +346878,9 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -338117,6 +346964,8 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -338220,7 +347069,7 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -338233,6 +347082,8 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -338250,7 +347101,7 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -338276,8 +347127,6 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x20D0, 0x20F1, @@ -338383,14 +347232,22 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -338521,6 +347378,10 @@ static 
const UV UNI_M_invlist[] = { /* for all charsets */ 0x16FF2, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -338557,6 +347418,8 @@ static const UV UNI_M_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -339548,7 +348411,7 @@ static const UV UNI_MAYANNUMERALS_invlist[] = { /* for all charsets */ }; static const UV UNI_MC_invlist[] = { /* for all charsets */ - 351, /* Number of elements */ + 355, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -339667,6 +348530,10 @@ static const UV UNI_MC_invlist[] = { /* for all charsets */ 0x1090, 0x109A, 0x109D, + 0x1715, + 0x1716, + 0x1734, + 0x1735, 0x17B6, 0x17B7, 0x17BE, @@ -340084,7 +348951,7 @@ static const UV UNI_MLYM_invlist[] = { /* for all charsets */ }; static const UV UNI_MN_invlist[] = { /* for all charsets */ - 655, /* Number of elements */ + 673, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -340137,7 +349004,9 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x903, @@ -340219,6 +349088,8 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0xC01, 0xC04, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC41, 0xC46, @@ -340318,7 +349189,7 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x1712, 0x1715, 0x1732, - 0x1735, + 0x1734, 0x1752, 0x1754, 0x1772, @@ -340335,6 +349206,8 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -340368,7 +349241,7 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B04, 0x1B34, @@ -340414,8 +349287,6 @@ static const UV 
UNI_MN_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x20D0, 0x20DD, @@ -340533,16 +349404,24 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11001, 0x11002, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11082, 0x110B3, 0x110B7, 0x110B9, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -340701,6 +349580,10 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x16FE5, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D17B, @@ -340735,6 +349618,8 @@ static const UV UNI_MN_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -340780,14 +349665,12 @@ static const UV UNI_MODIFIERTONELETTERS_invlist[] = { /* for all charsets */ }; static const UV UNI_MONG_invlist[] = { /* for all charsets */ - 13, /* Number of elements */ + 11, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -340906,7 +349789,7 @@ static const UV UNI_MYMR_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_N_invlist[] = { /* for ASCII/Latin1 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -341143,6 +350026,8 @@ static const UV UNI_N_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -341187,7 +350072,7 @@ static const UV UNI_N_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_N_invlist[] = { /* for EBCDIC 1047 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* 
Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -341424,6 +350309,8 @@ static const UV UNI_N_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -341468,7 +350355,7 @@ static const UV UNI_N_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_N_invlist[] = { /* for EBCDIC 037 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -341705,6 +350592,8 @@ static const UV UNI_N_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -341780,22 +350669,20 @@ static const UV UNI_NARB_invlist[] = { /* for all charsets */ }; static const UV UNI_NB_invlist[] = { /* for all charsets */ - 110, /* Number of elements */ + 104, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, - 0x870, - 0x8A0, 0x2FE0, 0x2FF0, 0x10200, 0x10280, 0x103E0, 0x10400, - 0x10570, + 0x105C0, 0x10600, - 0x10780, + 0x107C0, 0x10800, 0x108B0, 0x108E0, @@ -341811,8 +350698,6 @@ static const UV UNI_NB_invlist[] = { /* for all charsets */ 0x10E60, 0x10EC0, 0x10F00, - 0x10F70, - 0x10FB0, 0x11250, 0x11280, 0x11380, @@ -341821,14 +350706,12 @@ static const UV UNI_NB_invlist[] = { /* for all charsets */ 0x11580, 0x116D0, 0x11700, - 0x11740, + 0x11750, 0x11800, 0x11850, 0x118A0, 0x11960, 0x119A0, - 0x11AB0, - 0x11AC0, 0x11B00, 0x11C00, 0x11CC0, @@ -341838,37 +350721,37 @@ static const UV UNI_NB_invlist[] = { /* for all charsets */ 0x11F00, 0x11FB0, 0x12550, - 0x13000, + 0x12F90, 0x13440, 0x14400, 0x14680, 0x16800, - 0x16A70, - 0x16AD0, 0x16B90, 0x16E40, 0x16EA0, 0x16F00, 0x16FA0, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 
0x1B300, 0x1BC00, 0x1BCB0, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D250, 0x1D2E0, 0x1D380, 0x1D400, 0x1DAB0, - 0x1E000, + 0x1DF00, 0x1E030, 0x1E100, 0x1E150, - 0x1E2C0, + 0x1E290, 0x1E300, - 0x1E800, + 0x1E7E0, 0x1E8E0, 0x1E900, 0x1E960, @@ -343689,7 +352572,7 @@ static const UV UNI_NFDQC__Y_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NFKCQC__N_invlist[] = { /* for ASCII/Latin1 */ - 501, /* Number of elements */ + 509, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -343980,6 +352863,8 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -344060,6 +352945,12 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for ASCII/Latin1 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -344204,7 +353095,7 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 1047 */ - 507, /* Number of elements */ + 515, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -344501,6 +353392,8 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -344581,6 +353474,12 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -344725,7 +353624,7 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 037 */ - 505, /* Number of elements */ 
+ 513, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -345020,6 +353919,8 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -345100,6 +354001,12 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1D15E, 0x1D165, 0x1D1BB, @@ -345241,7 +354148,7 @@ static const UV UNI_NFKCQC__N_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NFKCQC__Y_invlist[] = { /* for ASCII/Latin1 */ - 577, /* Number of elements */ + 585, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -345590,6 +354497,8 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -345670,6 +354579,12 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for ASCII/Latin1 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x110BA, 0x110BB, 0x11127, @@ -345832,7 +354747,7 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 1047 */ - 583, /* Number of elements */ + 591, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -346187,6 +355102,8 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -346267,6 +355184,12 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, 
+ 0x107B2, + 0x107BB, 0x110BA, 0x110BB, 0x11127, @@ -346429,7 +355352,7 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 037 */ - 581, /* Number of elements */ + 589, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -346782,6 +355705,8 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -346862,6 +355787,12 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x110BA, 0x110BB, 0x11127, @@ -347021,7 +355952,7 @@ static const UV UNI_NFKCQC__Y_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NFKDQC__N_invlist[] = { /* for ASCII/Latin1 */ - 785, /* Number of elements */ + 793, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -347576,6 +356507,8 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for ASCII/Latin1 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -347658,6 +356591,12 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for ASCII/Latin1 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -347820,7 +356759,7 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 1047 */ - 783, /* Number of elements */ + 791, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -348373,6 +357312,8 @@ 
static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 1047 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -348455,6 +357396,12 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 1047 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -348617,7 +357564,7 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 037 */ - 785, /* Number of elements */ + 793, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -349172,6 +358119,8 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 037 */ 0xA69E, 0xA770, 0xA771, + 0xA7F2, + 0xA7F5, 0xA7F8, 0xA7FA, 0xAB5C, @@ -349254,6 +358203,12 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 037 */ 0xFFE7, 0xFFE8, 0xFFEF, + 0x10781, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x1109A, 0x1109B, 0x1109C, @@ -349411,15 +358366,23 @@ static const UV UNI_NFKDQC__N_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_NKO_invlist[] = { /* for all charsets */ - 5, /* Number of elements */ + 13, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, + 0x60C, + 0x60D, + 0x61B, + 0x61C, + 0x61F, + 0x620, 0x7C0, 0x7FB, 0x7FD, - 0x800 + 0x800, + 0xFD3E, + 0xFD40 }; static const UV UNI_NL_invlist[] = { /* for all charsets */ @@ -351075,7 +360038,7 @@ static const UV UNI_NV___MINUS_1_SLASH_2_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__0_invlist[] = { /* for ASCII/Latin1 */ - 163, /* Number of elements */ + 165, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 
0; 1 if it starts at the element beyond 0 */ @@ -351214,6 +360177,8 @@ static const UV UNI_NV__0_invlist[] = { /* for ASCII/Latin1 */ 0x11DA1, 0x16A60, 0x16A61, + 0x16AC0, + 0x16AC1, 0x16B50, 0x16B51, 0x16E80, @@ -351252,7 +360217,7 @@ static const UV UNI_NV__0_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 1047 */ - 163, /* Number of elements */ + 165, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -351391,6 +360356,8 @@ static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 1047 */ 0x11DA1, 0x16A60, 0x16A61, + 0x16AC0, + 0x16AC1, 0x16B50, 0x16B51, 0x16E80, @@ -351429,7 +360396,7 @@ static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 037 */ - 163, /* Number of elements */ + 165, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -351568,6 +360535,8 @@ static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 037 */ 0x11DA1, 0x16A60, 0x16A61, + 0x16AC0, + 0x16AC1, 0x16B50, 0x16B51, 0x16E80, @@ -351603,7 +360572,7 @@ static const UV UNI_NV__0_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__1_invlist[] = { /* for ASCII/Latin1 */ - 275, /* Number of elements */ + 277, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -351836,6 +360805,8 @@ static const UV UNI_NV__1_invlist[] = { /* for ASCII/Latin1 */ 0x12459, 0x16A61, 0x16A62, + 0x16AC1, + 0x16AC2, 0x16B51, 0x16B52, 0x16E81, @@ -351892,7 +360863,7 @@ static const UV UNI_NV__1_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' 
== 21 static const UV UNI_NV__1_invlist[] = { /* for EBCDIC 1047 */ - 275, /* Number of elements */ + 277, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -352125,6 +361096,8 @@ static const UV UNI_NV__1_invlist[] = { /* for EBCDIC 1047 */ 0x12459, 0x16A61, 0x16A62, + 0x16AC1, + 0x16AC2, 0x16B51, 0x16B52, 0x16E81, @@ -352181,7 +361154,7 @@ static const UV UNI_NV__1_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__1_invlist[] = { /* for EBCDIC 037 */ - 275, /* Number of elements */ + 277, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -352414,6 +361387,8 @@ static const UV UNI_NV__1_invlist[] = { /* for EBCDIC 037 */ 0x12459, 0x16A61, 0x16A62, + 0x16AC1, + 0x16AC2, 0x16B51, 0x16B52, 0x16E81, @@ -353549,7 +362524,7 @@ static const UV UNI_NV__19_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__2_invlist[] = { /* for ASCII/Latin1 */ - 273, /* Number of elements */ + 275, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -353780,6 +362755,8 @@ static const UV UNI_NV__2_invlist[] = { /* for ASCII/Latin1 */ 0x1245A, 0x16A62, 0x16A63, + 0x16AC2, + 0x16AC3, 0x16B52, 0x16B53, 0x16E82, @@ -353836,7 +362813,7 @@ static const UV UNI_NV__2_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__2_invlist[] = { /* for EBCDIC 1047 */ - 273, /* Number of elements */ + 275, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -354067,6 +363044,8 @@ static const UV UNI_NV__2_invlist[] = { /* for EBCDIC 1047 */ 
0x1245A, 0x16A62, 0x16A63, + 0x16AC2, + 0x16AC3, 0x16B52, 0x16B53, 0x16E82, @@ -354123,7 +363102,7 @@ static const UV UNI_NV__2_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__2_invlist[] = { /* for EBCDIC 037 */ - 273, /* Number of elements */ + 275, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -354354,6 +363333,8 @@ static const UV UNI_NV__2_invlist[] = { /* for EBCDIC 037 */ 0x1245A, 0x16A62, 0x16A63, + 0x16AC2, + 0x16AC3, 0x16B52, 0x16B53, 0x16E82, @@ -354695,7 +363676,7 @@ static const UV UNI_NV__29_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__3_invlist[] = { /* for ASCII/Latin1 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -354916,6 +363897,8 @@ static const UV UNI_NV__3_invlist[] = { /* for ASCII/Latin1 */ 0x12458, 0x16A63, 0x16A64, + 0x16AC3, + 0x16AC4, 0x16B53, 0x16B54, 0x16E83, @@ -354976,7 +363959,7 @@ static const UV UNI_NV__3_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__3_invlist[] = { /* for EBCDIC 1047 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -355197,6 +364180,8 @@ static const UV UNI_NV__3_invlist[] = { /* for EBCDIC 1047 */ 0x12458, 0x16A63, 0x16A64, + 0x16AC3, + 0x16AC4, 0x16B53, 0x16B54, 0x16E83, @@ -355257,7 +364242,7 @@ static const UV UNI_NV__3_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__3_invlist[] = { /* for EBCDIC 037 */ - 267, /* Number of elements */ + 269, /* Number of elements */ 
148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -355478,6 +364463,8 @@ static const UV UNI_NV__3_invlist[] = { /* for EBCDIC 037 */ 0x12458, 0x16A63, 0x16A64, + 0x16AC3, + 0x16AC4, 0x16B53, 0x16B54, 0x16E83, @@ -355913,7 +364900,7 @@ static const UV UNI_NV__39_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__4_invlist[] = { /* for ASCII/Latin1 */ - 253, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -356124,6 +365111,8 @@ static const UV UNI_NV__4_invlist[] = { /* for ASCII/Latin1 */ 0x1246A, 0x16A64, 0x16A65, + 0x16AC4, + 0x16AC5, 0x16B54, 0x16B55, 0x16E84, @@ -356180,7 +365169,7 @@ static const UV UNI_NV__4_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__4_invlist[] = { /* for EBCDIC 1047 */ - 253, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -356391,6 +365380,8 @@ static const UV UNI_NV__4_invlist[] = { /* for EBCDIC 1047 */ 0x1246A, 0x16A64, 0x16A65, + 0x16AC4, + 0x16AC5, 0x16B54, 0x16B55, 0x16E84, @@ -356447,7 +365438,7 @@ static const UV UNI_NV__4_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__4_invlist[] = { /* for EBCDIC 037 */ - 253, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -356658,6 +365649,8 @@ static const UV UNI_NV__4_invlist[] = { /* for EBCDIC 037 */ 0x1246A, 0x16A64, 0x16A65, + 0x16AC4, + 0x16AC5, 0x16B54, 0x16B55, 0x16E84, @@ -356929,7 +365922,7 @@ static const UV 
UNI_NV__49_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__5_invlist[] = { /* for ASCII/Latin1 */ - 257, /* Number of elements */ + 259, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -357146,6 +366139,8 @@ static const UV UNI_NV__5_invlist[] = { /* for ASCII/Latin1 */ 0x1246B, 0x16A65, 0x16A66, + 0x16AC5, + 0x16AC6, 0x16B55, 0x16B56, 0x16E85, @@ -357200,7 +366195,7 @@ static const UV UNI_NV__5_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__5_invlist[] = { /* for EBCDIC 1047 */ - 257, /* Number of elements */ + 259, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -357417,6 +366412,8 @@ static const UV UNI_NV__5_invlist[] = { /* for EBCDIC 1047 */ 0x1246B, 0x16A65, 0x16A66, + 0x16AC5, + 0x16AC6, 0x16B55, 0x16B56, 0x16E85, @@ -357471,7 +366468,7 @@ static const UV UNI_NV__5_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__5_invlist[] = { /* for EBCDIC 037 */ - 257, /* Number of elements */ + 259, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -357688,6 +366685,8 @@ static const UV UNI_NV__5_invlist[] = { /* for EBCDIC 037 */ 0x1246B, 0x16A65, 0x16A66, + 0x16AC5, + 0x16AC6, 0x16B55, 0x16B56, 0x16E85, @@ -357931,7 +366930,7 @@ static const UV UNI_NV__500000_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__6_invlist[] = { /* for ASCII/Latin1 */ - 227, /* Number of elements */ + 229, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ 
-358122,6 +367121,8 @@ static const UV UNI_NV__6_invlist[] = { /* for ASCII/Latin1 */ 0x1246C, 0x16A66, 0x16A67, + 0x16AC6, + 0x16AC7, 0x16B56, 0x16B57, 0x16E86, @@ -358172,7 +367173,7 @@ static const UV UNI_NV__6_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__6_invlist[] = { /* for EBCDIC 1047 */ - 227, /* Number of elements */ + 229, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -358363,6 +367364,8 @@ static const UV UNI_NV__6_invlist[] = { /* for EBCDIC 1047 */ 0x1246C, 0x16A66, 0x16A67, + 0x16AC6, + 0x16AC7, 0x16B56, 0x16B57, 0x16E86, @@ -358413,7 +367416,7 @@ static const UV UNI_NV__6_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__6_invlist[] = { /* for EBCDIC 037 */ - 227, /* Number of elements */ + 229, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -358604,6 +367607,8 @@ static const UV UNI_NV__6_invlist[] = { /* for EBCDIC 037 */ 0x1246C, 0x16A66, 0x16A67, + 0x16AC6, + 0x16AC7, 0x16B56, 0x16B57, 0x16E86, @@ -358749,7 +367754,7 @@ static const UV UNI_NV__600000_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__7_invlist[] = { /* for ASCII/Latin1 */ - 221, /* Number of elements */ + 223, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -358934,6 +367939,8 @@ static const UV UNI_NV__7_invlist[] = { /* for ASCII/Latin1 */ 0x1246D, 0x16A67, 0x16A68, + 0x16AC7, + 0x16AC8, 0x16B57, 0x16B58, 0x16E87, @@ -358984,7 +367991,7 @@ static const UV UNI_NV__7_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__7_invlist[] 
= { /* for EBCDIC 1047 */ - 221, /* Number of elements */ + 223, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -359169,6 +368176,8 @@ static const UV UNI_NV__7_invlist[] = { /* for EBCDIC 1047 */ 0x1246D, 0x16A67, 0x16A68, + 0x16AC7, + 0x16AC8, 0x16B57, 0x16B58, 0x16E87, @@ -359219,7 +368228,7 @@ static const UV UNI_NV__7_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__7_invlist[] = { /* for EBCDIC 037 */ - 221, /* Number of elements */ + 223, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -359404,6 +368413,8 @@ static const UV UNI_NV__7_invlist[] = { /* for EBCDIC 037 */ 0x1246D, 0x16A67, 0x16A68, + 0x16AC7, + 0x16AC8, 0x16B57, 0x16B58, 0x16E87, @@ -359577,7 +368588,7 @@ static const UV UNI_NV__700000_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__8_invlist[] = { /* for ASCII/Latin1 */ - 215, /* Number of elements */ + 217, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -359758,6 +368769,8 @@ static const UV UNI_NV__8_invlist[] = { /* for ASCII/Latin1 */ 0x1246E, 0x16A68, 0x16A69, + 0x16AC8, + 0x16AC9, 0x16B58, 0x16B59, 0x16E88, @@ -359806,7 +368819,7 @@ static const UV UNI_NV__8_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__8_invlist[] = { /* for EBCDIC 1047 */ - 215, /* Number of elements */ + 217, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -359987,6 +369000,8 @@ static const UV UNI_NV__8_invlist[] = { /* for EBCDIC 1047 */ 0x1246E, 0x16A68, 0x16A69, + 0x16AC8, + 
0x16AC9, 0x16B58, 0x16B59, 0x16E88, @@ -360035,7 +369050,7 @@ static const UV UNI_NV__8_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__8_invlist[] = { /* for EBCDIC 037 */ - 215, /* Number of elements */ + 217, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -360216,6 +369231,8 @@ static const UV UNI_NV__8_invlist[] = { /* for EBCDIC 037 */ 0x1246E, 0x16A68, 0x16A69, + 0x16AC8, + 0x16AC9, 0x16B58, 0x16B59, 0x16E88, @@ -360355,7 +369372,7 @@ static const UV UNI_NV__800000_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__9_invlist[] = { /* for ASCII/Latin1 */ - 219, /* Number of elements */ + 221, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -360538,6 +369555,8 @@ static const UV UNI_NV__9_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x16A69, 0x16A6A, + 0x16AC9, + 0x16ACA, 0x16B59, 0x16B5A, 0x16E89, @@ -360588,7 +369607,7 @@ static const UV UNI_NV__9_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__9_invlist[] = { /* for EBCDIC 1047 */ - 219, /* Number of elements */ + 221, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -360771,6 +369790,8 @@ static const UV UNI_NV__9_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x16A69, 0x16A6A, + 0x16AC9, + 0x16ACA, 0x16B59, 0x16B5A, 0x16E89, @@ -360821,7 +369842,7 @@ static const UV UNI_NV__9_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__9_invlist[] = { /* for EBCDIC 037 */ - 219, /* Number of elements */ + 221, /* Number of elements */ 148565664, /* Version and data 
structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -361004,6 +370025,8 @@ static const UV UNI_NV__9_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x16A69, 0x16A6A, + 0x16AC9, + 0x16ACA, 0x16B59, 0x16B5A, 0x16E89, @@ -361157,7 +370180,7 @@ static const UV UNI_NV__900000_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_NV__NAN_invlist[] = { /* for ASCII/Latin1 */ - 411, /* Number of elements */ + 413, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -361506,6 +370529,8 @@ static const UV UNI_NV__NAN_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -361582,7 +370607,7 @@ static const UV UNI_NV__NAN_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_NV__NAN_invlist[] = { /* for EBCDIC 1047 */ - 411, /* Number of elements */ + 413, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -361931,6 +370956,8 @@ static const UV UNI_NV__NAN_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -362007,7 +371034,7 @@ static const UV UNI_NV__NAN_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_NV__NAN_invlist[] = { /* for EBCDIC 037 */ - 411, /* Number of elements */ + 413, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -362356,6 +371383,8 @@ static const UV UNI_NV__NAN_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x16B5B, @@ -362554,10 +371583,24 @@ static const UV 
UNI_OTTOMANSIYAQNUMBERS_invlist[] = { /* for all charsets */ 0x1ED50 }; +static const UV UNI_OUGR_invlist[] = { /* for all charsets */ + 7, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x640, + 0x641, + 0x10AF2, + 0x10AF3, + 0x10F70, + 0x10F8A +}; + # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ - 371, /* Number of elements */ + 379, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -362616,7 +371659,7 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -362694,6 +371737,8 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -362743,7 +371788,7 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -362854,6 +371899,8 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -362890,6 +371937,8 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -362914,6 +371963,8 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -362942,7 +371993,7 @@ static const UV UNI_P_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ - 379, /* Number of elements */ + 387, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -363009,7 +372060,7 @@ 
static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -363087,6 +372138,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -363136,7 +372189,7 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -363247,6 +372300,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -363283,6 +372338,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -363307,6 +372364,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -363335,7 +372394,7 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ - 377, /* Number of elements */ + 385, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -363400,7 +372459,7 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -363478,6 +372537,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -363527,7 +372588,7 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x2E30, 0x2E50, 0x2E52, - 0x2E53, + 0x2E5E, 0x3001, 0x3004, 0x3008, @@ -363638,6 +372699,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x10EAE, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -363674,6 +372737,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x11644, 0x11660, 0x1166D, 
+ 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -363698,6 +372763,8 @@ static const UV UNI_P_invlist[] = { /* for EBCDIC 037 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -364035,7 +373102,7 @@ static const UV UNI_PC_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_PCM_invlist[] = { /* for all charsets */ - 13, /* Number of elements */ + 15, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364046,6 +373113,8 @@ static const UV UNI_PCM_invlist[] = { /* for all charsets */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x110BD, @@ -364057,7 +373126,7 @@ static const UV UNI_PCM_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_PD_invlist[] = { /* for ASCII/Latin1 */ - 37, /* Number of elements */ + 39, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364082,6 +373151,8 @@ static const UV UNI_PD_invlist[] = { /* for ASCII/Latin1 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -364108,7 +373179,7 @@ static const UV UNI_PD_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_PD_invlist[] = { /* for EBCDIC 1047 */ - 37, /* Number of elements */ + 39, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364133,6 +373204,8 @@ static const UV UNI_PD_invlist[] = { /* for EBCDIC 1047 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -364159,7 +373232,7 @@ static const UV UNI_PD_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_PD_invlist[] = { /* for EBCDIC 037 */ - 37, /* Number of elements 
*/ + 39, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364184,6 +373257,8 @@ static const UV UNI_PD_invlist[] = { /* for EBCDIC 037 */ 0x2E3C, 0x2E40, 0x2E41, + 0x2E5D, + 0x2E5E, 0x301C, 0x301D, 0x3030, @@ -364207,7 +373282,7 @@ static const UV UNI_PD_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_PE_invlist[] = { /* for ASCII/Latin1 */ - 145, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364298,6 +373373,14 @@ static const UV UNI_PE_invlist[] = { /* for ASCII/Latin1 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -364366,7 +373449,7 @@ static const UV UNI_PE_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_PE_invlist[] = { /* for EBCDIC 1047 */ - 145, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364457,6 +373540,14 @@ static const UV UNI_PE_invlist[] = { /* for EBCDIC 1047 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -364525,7 +373616,7 @@ static const UV UNI_PE_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_PE_invlist[] = { /* for EBCDIC 037 */ - 145, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -364616,6 +373707,14 @@ static const UV UNI_PE_invlist[] = { /* for EBCDIC 037 */ 0x2E28, 0x2E29, 0x2E2A, + 0x2E56, + 
0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, + 0x2E5D, 0x3009, 0x300A, 0x300B, @@ -364997,7 +374096,7 @@ static const UV UNI_PLAYINGCARDS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ - 363, /* Number of elements */ + 371, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -365048,7 +374147,7 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -365122,6 +374221,8 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -365179,7 +374280,7 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x2E43, 0x2E50, 0x2E52, - 0x2E53, + 0x2E55, 0x3001, 0x3004, 0x303D, @@ -365286,6 +374387,8 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -365322,6 +374425,8 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -365346,6 +374451,8 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -365374,7 +374481,7 @@ static const UV UNI_PO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ - 367, /* Number of elements */ + 375, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -365429,7 +374536,7 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -365503,6 +374610,8 @@ static const UV 
UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -365560,7 +374669,7 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x2E43, 0x2E50, 0x2E52, - 0x2E53, + 0x2E55, 0x3001, 0x3004, 0x303D, @@ -365667,6 +374776,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -365703,6 +374814,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -365727,6 +374840,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ 0x12000, 0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -365755,7 +374870,7 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ - 367, /* Number of elements */ + 375, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -365810,7 +374925,7 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x60E, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x66A, 0x66E, @@ -365884,6 +374999,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x1AAE, 0x1B5A, 0x1B61, + 0x1B7D, + 0x1B7F, 0x1BFC, 0x1C00, 0x1C3B, @@ -365941,7 +375058,7 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x2E43, 0x2E50, 0x2E52, - 0x2E53, + 0x2E55, 0x3001, 0x3004, 0x303D, @@ -366048,6 +375165,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BB, @@ -366084,6 +375203,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x11644, 0x11660, 0x1166D, + 0x116B9, + 0x116BA, 0x1173C, 0x1173F, 0x1183B, @@ -366108,6 +375229,8 @@ static const UV UNI_PO_invlist[] = { /* for EBCDIC 037 */ 0x12000, 
0x12470, 0x12475, + 0x12FF1, + 0x12FF3, 0x16A6E, 0x16A70, 0x16AF5, @@ -366145,7 +375268,7 @@ static const UV UNI_PRTI_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_PS_invlist[] = { /* for ASCII/Latin1 */ - 151, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -366242,6 +375365,14 @@ static const UV UNI_PS_invlist[] = { /* for ASCII/Latin1 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -366310,7 +375441,7 @@ static const UV UNI_PS_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_PS_invlist[] = { /* for EBCDIC 1047 */ - 151, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -366407,6 +375538,14 @@ static const UV UNI_PS_invlist[] = { /* for EBCDIC 1047 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -366475,7 +375614,7 @@ static const UV UNI_PS_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_PS_invlist[] = { /* for EBCDIC 037 */ - 151, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -366572,6 +375711,14 @@ static const UV UNI_PS_invlist[] = { /* for EBCDIC 037 */ 0x2E29, 0x2E42, 0x2E43, + 0x2E55, + 0x2E56, + 0x2E57, + 0x2E58, + 0x2E59, + 0x2E5A, + 0x2E5B, + 0x2E5C, 0x3008, 0x3009, 0x300A, @@ -366645,7 +375792,7 @@ static const UV UNI_PUA_invlist[] = { /* for all charsets */ }; static const UV UNI_QAAI_invlist[] = { /* for all 
charsets */ - 37, /* Number of elements */ + 41, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -366659,7 +375806,7 @@ static const UV UNI_QAAI_invlist[] = { /* for all charsets */ 0x953, 0x955, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1DC2, 0x1DF8, 0x1DF9, @@ -366676,6 +375823,10 @@ static const UV UNI_QAAI_invlist[] = { /* for all charsets */ 0xFE2E, 0x101FD, 0x101FE, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D17B, @@ -366887,7 +376038,7 @@ static const UV UNI_RUNR_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ - 459, /* Number of elements */ + 469, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -366958,6 +376109,8 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x7F7, 0x7FE, 0x800, + 0x888, + 0x889, 0x9F2, 0x9F4, 0x9FA, @@ -367035,7 +376188,7 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x208A, 0x208D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2102, 0x2103, @@ -367159,9 +376312,13 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0xFB29, 0xFB2A, 0xFBB2, - 0xFBC2, + 0xFBC3, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFC, - 0xFDFE, + 0xFE00, 0xFE62, 0xFE63, 0xFE64, @@ -367214,6 +376371,8 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -367227,7 +376386,7 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -367302,7 +376461,7 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -367312,6 +376471,8 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 
0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -367325,27 +376486,27 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -367360,7 +376521,7 @@ static const UV UNI_S_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ - 465, /* Number of elements */ + 475, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -367437,6 +376598,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x7F7, 0x7FE, 0x800, + 0x888, + 0x889, 0x9F2, 0x9F4, 0x9FA, @@ -367514,7 +376677,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x208A, 0x208D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2102, 0x2103, @@ -367638,9 +376801,13 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0xFB29, 0xFB2A, 0xFBB2, - 0xFBC2, + 0xFBC3, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFC, - 0xFDFE, + 0xFE00, 0xFE62, 0xFE63, 0xFE64, @@ -367693,6 +376860,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -367706,7 +376875,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -367781,7 +376950,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -367791,6 +376960,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 
0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -367804,27 +376975,27 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -367839,7 +377010,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ - 463, /* Number of elements */ + 473, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -367914,6 +377085,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x7F7, 0x7FE, 0x800, + 0x888, + 0x889, 0x9F2, 0x9F4, 0x9FA, @@ -367991,7 +377164,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x208A, 0x208D, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2102, 0x2103, @@ -368115,9 +377288,13 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0xFB29, 0xFB2A, 0xFBB2, - 0xFBC2, + 0xFBC3, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFC, - 0xFDFE, + 0xFE00, 0xFE62, 0xFE63, 0xFE64, @@ -368170,6 +377347,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -368183,7 +377362,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -368258,7 +377437,7 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -368268,6 +377447,8 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 
0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -368281,27 +377462,27 @@ static const UV UNI_S_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -368413,7 +377594,7 @@ static const UV UNI_SB__AT_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__CL_invlist[] = { /* for ASCII/Latin1 */ - 89, /* Number of elements */ + 91, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -368474,6 +377655,8 @@ static const UV UNI_SB__CL_invlist[] = { /* for ASCII/Latin1 */ 0x2E2A, 0x2E42, 0x2E43, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -368516,7 +377699,7 @@ static const UV UNI_SB__CL_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 1047 */ - 91, /* Number of elements */ + 93, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -368579,6 +377762,8 @@ static const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 1047 */ 0x2E2A, 0x2E42, 0x2E43, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -368621,7 +377806,7 @@ static const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 037 */ - 89, /* Number of elements */ + 91, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -368682,6 +377867,8 @@ static 
const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 037 */ 0x2E2A, 0x2E42, 0x2E43, + 0x2E55, + 0x2E5D, 0x3008, 0x3012, 0x3014, @@ -368719,7 +377906,7 @@ static const UV UNI_SB__CL_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ - 587, /* Number of elements */ + 605, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -368772,7 +377959,9 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -368856,6 +378045,8 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -368959,7 +378150,7 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -368972,6 +378163,8 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -368989,7 +378182,7 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -369015,8 +378208,6 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200E, @@ -369126,14 +378317,22 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -369264,6 +378463,10 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ 0x16FF2, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -369300,6 +378503,8 @@ static const UV UNI_SB__EX_invlist[] = { 
/* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -369315,7 +378520,7 @@ static const UV UNI_SB__EX_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__FO_invlist[] = { /* for ASCII/Latin1 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -369330,6 +378535,8 @@ static const UV UNI_SB__FO_invlist[] = { /* for ASCII/Latin1 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -369370,7 +378577,7 @@ static const UV UNI_SB__FO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 1047 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -369385,6 +378592,8 @@ static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 1047 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -369425,7 +378634,7 @@ static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 037 */ - 41, /* Number of elements */ + 43, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -369440,6 +378649,8 @@ static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 037 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -369475,7 +378686,7 @@ static const UV UNI_SB__FO_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ - 1039, /* Number of elements */ + 1073, /* Number of elements */ 148565664, /* Version and data structure type 
*/ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -369544,10 +378755,12 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -369676,6 +378889,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -369692,7 +378907,7 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -369825,10 +379040,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -369871,7 +379084,7 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -369953,8 +379166,6 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -369976,6 +379187,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0xA789, 0xA78F, 0xA790, + 0xA7F2, + 0xA7F5, 0xA7F7, 0xA7F8, 0xA7FB, @@ -370150,6 +379363,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x10756, 0x10760, 0x10768, + 0x10781, + 0x10783, 0x10800, 0x10806, 0x10808, @@ -370216,12 +379431,18 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -370304,6 +379525,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118FF, @@ -370340,7 +379563,7 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 
0x11C00, 0x11C09, @@ -370376,6 +379599,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -370384,6 +379609,8 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -370410,8 +379637,14 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -370426,14 +379659,26 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x1BC89, 0x1BC90, 0x1BC9A, + 0x1DF0A, + 0x1DF0B, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E94B, @@ -370505,9 +379750,9 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -370523,7 +379768,7 @@ static const UV UNI_SB__LE_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ - 1299, /* Number of elements */ + 1331, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -371401,7 +380646,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -371736,12 +380981,24 @@ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -371762,6 
+381019,22 @@ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -371824,6 +381097,10 @@ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -371836,7 +381113,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ - 1307, /* Number of elements */ + 1339, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -372722,7 +381999,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -373057,12 +382334,24 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -373083,6 +382372,22 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -373145,6 +382450,10 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -373157,7 +382466,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 
static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ - 1307, /* Number of elements */ + 1339, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -374043,7 +383352,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ 0x24D0, 0x24EA, 0x2C30, - 0x2C5F, + 0x2C60, 0x2C61, 0x2C62, 0x2C65, @@ -374378,12 +383687,24 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ 0xA7BE, 0xA7BF, 0xA7C0, + 0xA7C1, + 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, 0xA7CB, + 0xA7D1, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, + 0xA7DA, 0xA7F6, 0xA7F7, 0xA7F8, @@ -374404,6 +383725,22 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ 0x10450, 0x104D8, 0x104FC, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, + 0x10780, + 0x10781, + 0x10783, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10CC0, 0x10CF3, 0x118C0, @@ -374466,6 +383803,10 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ 0x1D7CA, 0x1D7CB, 0x1D7CC, + 0x1DF00, + 0x1DF0A, + 0x1DF0B, + 0x1DF1F, 0x1E922, 0x1E944 }; @@ -374475,7 +383816,7 @@ static const UV UNI_SB__LO_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__NU_invlist[] = { /* for ASCII/Latin1 */ - 125, /* Number of elements */ + 127, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -374592,6 +383933,8 @@ static const UV UNI_SB__NU_invlist[] = { /* for ASCII/Latin1 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -374614,7 +383957,7 @@ static const UV UNI_SB__NU_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__NU_invlist[] = { /* for EBCDIC 1047 */ - 125, /* Number of elements */ + 127, 
/* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -374731,6 +384074,8 @@ static const UV UNI_SB__NU_invlist[] = { /* for EBCDIC 1047 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -374753,7 +384098,7 @@ static const UV UNI_SB__NU_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__NU_invlist[] = { /* for EBCDIC 037 */ - 125, /* Number of elements */ + 127, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -374870,6 +384215,8 @@ static const UV UNI_SB__NU_invlist[] = { /* for EBCDIC 037 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -375195,7 +384542,7 @@ static const UV UNI_SB__SP_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ - 147, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -375206,7 +384553,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ 0x40, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -375244,6 +384591,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ -375256,6 +384605,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -375292,6 +384643,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -375356,7 +384709,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && 
'`' == 121 && '\n' == 21 static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ - 147, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -375367,7 +384720,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ 0x70, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -375405,6 +384758,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ -375417,6 +384772,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -375453,6 +384810,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -375517,7 +384876,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 037 */ - 147, /* Number of elements */ + 153, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -375528,7 +384887,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 037 */ 0x70, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -375566,6 +384925,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 037 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ -375578,6 +384939,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 037 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -375614,6 +384977,8 @@ static const UV UNI_SB__ST_invlist[] = { /* for EBCDIC 037 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -375675,7 +385040,7 @@ static const UV UNI_SB__ST_invlist[] = { /* for 
EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__UP_invlist[] = { /* for ASCII/Latin1 */ - 1289, /* Number of elements */ + 1305, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -376549,7 +385914,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -376878,12 +386243,20 @@ static const UV UNI_SB__UP_invlist[] = { /* for ASCII/Latin1 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -376892,6 +386265,14 @@ static const UV UNI_SB__UP_invlist[] = { /* for ASCII/Latin1 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -376978,7 +386359,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 1047 */ - 1307, /* Number of elements */ + 1323, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -377870,7 +387251,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -378199,12 +387580,20 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 1047 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -378213,6 +387602,14 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 1047 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 
0x10CB3, 0x118A0, @@ -378299,7 +387696,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 037 */ - 1303, /* Number of elements */ + 1319, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -379187,7 +388584,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24D0, 0x2C00, - 0x2C2F, + 0x2C30, 0x2C60, 0x2C61, 0x2C62, @@ -379516,12 +388913,20 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 037 */ 0xA7BD, 0xA7BE, 0xA7BF, + 0xA7C0, + 0xA7C1, 0xA7C2, 0xA7C3, 0xA7C4, 0xA7C8, 0xA7C9, 0xA7CA, + 0xA7D0, + 0xA7D1, + 0xA7D6, + 0xA7D7, + 0xA7D8, + 0xA7D9, 0xA7F5, 0xA7F6, 0xFF21, @@ -379530,6 +388935,14 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 037 */ 0x10428, 0x104B0, 0x104D4, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, 0x10C80, 0x10CB3, 0x118A0, @@ -379613,7 +389026,7 @@ static const UV UNI_SB__UP_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ - 1611, /* Number of elements */ + 1661, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -379715,8 +389128,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x610, 0x61B, 0x61C, - 0x61D, - 0x61E, 0x66A, 0x66B, 0x66D, @@ -379750,11 +389161,13 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x970, 0x971, 0x984, @@ -379918,7 +389331,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -379928,6 
+389341,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -379952,7 +389367,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -380117,10 +389532,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -380143,8 +389556,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1808, 0x180A, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -380181,15 +389592,17 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1AA7, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5C, 0x1B5E, 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1C00, @@ -380209,8 +389622,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -380327,10 +389738,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -380374,6 +389781,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 0x2E5D, 0x3000, 0x3003, 0x3005, @@ -380409,8 +389818,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -380433,10 +389840,14 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -380642,12 +390053,34 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 
0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -380732,6 +390165,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -380739,11 +390174,11 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11049, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -380858,6 +390293,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -380898,7 +390335,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9B, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -380950,6 +390387,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -380963,7 +390402,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -381000,8 +390441,14 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -381018,6 +390465,10 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9D, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -381104,6 +390555,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -381122,8 +390575,18 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 
*/ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -381209,9 +390672,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -381238,7 +390701,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ - 1631, /* Number of elements */ + 1681, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -381360,8 +390823,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x610, 0x61B, 0x61C, - 0x61D, - 0x61E, 0x66A, 0x66B, 0x66D, @@ -381395,11 +390856,13 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x970, 0x971, 0x984, @@ -381563,7 +391026,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -381573,6 +391036,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -381597,7 +391062,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -381762,10 +391227,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -381788,8 +391251,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1808, 0x180A, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -381826,15 +391287,17 @@ 
static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1AA7, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5C, 0x1B5E, 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1C00, @@ -381854,8 +391317,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -381972,10 +391433,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -382019,6 +391476,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 0x2E5D, 0x3000, 0x3003, 0x3005, @@ -382054,8 +391513,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -382078,10 +391535,14 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -382287,12 +391748,34 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -382377,6 +391860,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -382384,11 +391869,11 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11049, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -382503,6 +391988,8 @@ static const UV 
UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -382543,7 +392030,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9B, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -382595,6 +392082,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -382608,7 +392097,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -382645,8 +392136,14 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -382663,6 +392160,10 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -382749,6 +392250,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -382767,8 +392270,18 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -382854,9 +392367,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -382883,7 +392396,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ - 1629, /* Number of elements */ + 1679, /* Number of elements */ 148565664, /* Version and 
data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -383003,8 +392516,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x610, 0x61B, 0x61C, - 0x61D, - 0x61E, 0x66A, 0x66B, 0x66D, @@ -383038,11 +392549,13 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x970, 0x971, 0x984, @@ -383206,7 +392719,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -383216,6 +392729,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -383240,7 +392755,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -383405,10 +392920,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -383431,8 +392944,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1808, 0x180A, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -383469,15 +392980,17 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1AA7, 0x1AAC, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5C, 0x1B5E, 0x1B60, 0x1B6B, 0x1B74, + 0x1B7D, + 0x1B7F, 0x1B80, 0x1BF4, 0x1C00, @@ -383497,8 +393010,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -383615,10 +393126,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x29FC, 0x29FE, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -383662,6 +393169,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x2E3D, 0x2E42, 0x2E43, + 0x2E53, + 
0x2E5D, 0x3000, 0x3003, 0x3005, @@ -383697,8 +393206,6 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -383721,10 +393228,14 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -383930,12 +393441,34 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -384020,6 +393553,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x10F51, 0x10F55, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FC5, 0x10FE0, @@ -384027,11 +393562,11 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11049, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -384146,6 +393681,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1173A, 0x1173C, 0x1173F, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -384186,7 +393723,7 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9B, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -384238,6 +393775,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -384251,7 +393790,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -384288,8 +393829,14 @@ static const UV UNI_SB__XX_invlist[] = { 
/* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -384306,6 +393853,10 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -384392,6 +393943,8 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -384410,8 +393963,18 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -384497,9 +394060,9 @@ static const UV UNI_SB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -384551,7 +394114,7 @@ static const UV UNI_SC_invlist[] = { /* for ASCII/Latin1 */ 0x17DB, 0x17DC, 0x20A0, - 0x20C0, + 0x20C1, 0xA838, 0xA839, 0xFDFC, @@ -384612,7 +394175,7 @@ static const UV UNI_SC_invlist[] = { /* for EBCDIC 1047 */ 0x17DB, 0x17DC, 0x20A0, - 0x20C0, + 0x20C1, 0xA838, 0xA839, 0xFDFC, @@ -384673,7 +394236,7 @@ static const UV UNI_SC_invlist[] = { /* for EBCDIC 037 */ 0x17DB, 0x17DC, 0x20A0, - 0x20C0, + 0x20C1, 0xA838, 0xA839, 0xFDFC, @@ -384723,8 +394286,6 @@ static const UV UNI_SC__ARAB_invlist[] = { /* for all charsets */ 0x60D, 0x61B, 0x61C, - 0x61D, - 0x61E, 0x61F, 0x620, 0x640, @@ -384738,24 +394299,26 @@ static const UV UNI_SC__ARAB_invlist[] = { /* for all charsets */ 0x700, 0x750, 0x780, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x8E2, 0x8E3, 0x900, 0xFB50, - 0xFBC2, + 0xFBC3, 0xFBD3, 0xFD3E, - 0xFD50, + 0xFD40, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, + 0xFE00, 0xFE70, 0xFE75, 0xFE76, @@ -384930,6 
+394493,16 @@ static const UV UNI_SC__COPT_invlist[] = { /* for all charsets */ 0x2D00 }; +static const UV UNI_SC__CPMN_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x12F90, + 0x12FF3 +}; + static const UV UNI_SC__CPRT_invlist[] = { /* for all charsets */ 13, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -385047,15 +394620,13 @@ static const UV UNI_SC__GEOR_invlist[] = { /* for all charsets */ }; static const UV UNI_SC__GLAG_invlist[] = { /* for all charsets */ - 15, /* Number of elements */ + 13, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, + 0x2C60, 0x1E000, 0x1E007, 0x1E008, @@ -385305,7 +394876,7 @@ static const UV UNI_SC__GURU_invlist[] = { /* for all charsets */ }; static const UV UNI_SC__HAN_invlist[] = { /* for all charsets */ - 39, /* Number of elements */ + 41, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385327,17 +394898,19 @@ static const UV UNI_SC__HAN_invlist[] = { /* for all charsets */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xF900, 0xFA6E, 0xFA70, 0xFADA, + 0x16FE2, + 0x16FE4, 0x16FF0, 0x16FF2, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -385407,7 +394980,7 @@ static const UV UNI_SC__HIRA_invlist[] = { /* for all charsets */ 0x309D, 0x30A0, 0x1B001, - 0x1B11F, + 0x1B120, 0x1B150, 0x1B153, 0x1F200, @@ -385441,7 +395014,7 @@ static const UV UNI_SC__KALI_invlist[] = { /* for all charsets */ }; static const UV UNI_SC__KANA_invlist[] = { /* for all charsets */ - 19, /* Number of elements */ + 27, /* Number of elements */ 148565664, /* Version and data structure 
type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385460,8 +395033,16 @@ static const UV UNI_SC__KANA_invlist[] = { /* for all charsets */ 0xFF70, 0xFF71, 0xFF9E, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168 }; @@ -385502,7 +395083,7 @@ static const UV UNI_SC__KNDA_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -385519,7 +395100,7 @@ static const UV UNI_SC__KTHI_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x11080, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE }; @@ -385527,7 +395108,7 @@ static const UV UNI_SC__KTHI_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SC__LATN_invlist[] = { /* for ASCII/Latin1 */ - 65, /* Number of elements */ + 77, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385579,10 +395160,14 @@ static const UV UNI_SC__LATN_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xAB30, 0xAB5B, @@ -385595,7 +395180,15 @@ static const UV UNI_SC__LATN_invlist[] = { /* for ASCII/Latin1 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* ASCII/Latin1 */ @@ -385606,7 +395199,7 @@ static const UV UNI_SC__LATN_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 1047 */ - 91, /* Number of elements */ + 103, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385684,10 +395277,14 @@ static const UV 
UNI_SC__LATN_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xAB30, 0xAB5B, @@ -385700,7 +395297,15 @@ static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 1047 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* EBCDIC 1047 */ @@ -385711,7 +395316,7 @@ static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 037 */ - 87, /* Number of elements */ + 99, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385785,10 +395390,14 @@ static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA788, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA800, 0xAB30, 0xAB5B, @@ -385801,7 +395410,15 @@ static const UV UNI_SC__LATN_invlist[] = { /* for EBCDIC 037 */ 0xFF21, 0xFF3B, 0xFF41, - 0xFF5B + 0xFF5B, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, + 0x1DF00, + 0x1DF1F }; # endif /* EBCDIC 037 */ @@ -385929,7 +395546,7 @@ static const UV UNI_SC__MODI_invlist[] = { /* for all charsets */ }; static const UV UNI_SC__MONG_invlist[] = { /* for all charsets */ - 15, /* Number of elements */ + 13, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -385939,8 +395556,6 @@ static const UV UNI_SC__MONG_invlist[] = { /* for all charsets */ 0x1804, 0x1805, 0x1806, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -385996,6 +395611,18 @@ static const UV UNI_SC__NAND_invlist[] = { /* for all charsets */ 0x119E5 }; +static const UV UNI_SC__NKO_invlist[] 
= { /* for all charsets */ + 5, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x7C0, + 0x7FB, + 0x7FD, + 0x800 +}; + static const UV UNI_SC__ORYA_invlist[] = { /* for all charsets */ 29, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -386032,6 +395659,16 @@ static const UV UNI_SC__ORYA_invlist[] = { /* for all charsets */ 0xB78 }; +static const UV UNI_SC__OUGR_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10F70, + 0x10F8A +}; + static const UV UNI_SC__PERM_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -386067,7 +395704,7 @@ static const UV UNI_SC__PHLP_invlist[] = { /* for all charsets */ }; static const UV UNI_SC__QAAI_invlist[] = { /* for all charsets */ - 57, /* Number of elements */ + 59, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -386083,7 +395720,7 @@ static const UV UNI_SC__QAAI_invlist[] = { /* for all charsets */ 0x951, 0x955, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1CD0, 0x1CD3, 0x1CD4, @@ -386097,8 +395734,6 @@ static const UV UNI_SC__QAAI_invlist[] = { /* for all charsets */ 0x1CF8, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200E, @@ -386118,6 +395753,10 @@ static const UV UNI_SC__QAAI_invlist[] = { /* for all charsets */ 0x102E1, 0x1133B, 0x1133C, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D167, 0x1D16A, 0x1D17B, @@ -386255,7 +395894,7 @@ static const UV UNI_SC__TAKR_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA }; @@ -386317,7 +395956,7 @@ static const UV UNI_SC__TAML_invlist[] = { 
/* for all charsets */ }; static const UV UNI_SC__TELU_invlist[] = { /* for all charsets */ - 25, /* Number of elements */ + 27, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -386330,7 +395969,7 @@ static const UV UNI_SC__TELU_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -386340,6 +395979,8 @@ static const UV UNI_SC__TELU_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -386355,9 +395996,9 @@ static const UV UNI_SC__TGLG_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x1700, - 0x170D, - 0x170E, - 0x1715 + 0x1716, + 0x171F, + 0x1720 }; static const UV UNI_SC__THAA_invlist[] = { /* for all charsets */ @@ -386411,7 +396052,7 @@ static const UV UNI_SC__YI_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ - 346, /* Number of elements */ + 348, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -386496,7 +396137,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -386522,7 +396163,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x2B97, 0x2C00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -386609,10 +396250,10 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x101FD, 0x102E1, 0x102FC, - 0x16FE2, - 0x16FE4, 0x1BCA0, 0x1BCA4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -386626,7 +396267,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -386707,7 +396348,7 @@ static const UV UNI_SC__ZYYY_invlist[] = 
{ /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -386717,6 +396358,8 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -386730,27 +396373,27 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -386771,7 +396414,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ - 372, /* Number of elements */ + 374, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -386882,7 +396525,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -386908,7 +396551,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x2B97, 0x2C00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -386995,10 +396638,10 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x101FD, 0x102E1, 0x102FC, - 0x16FE2, - 0x16FE4, 0x1BCA0, 0x1BCA4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -387012,7 +396655,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -387093,7 +396736,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -387103,6 
+396746,8 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -387116,27 +396761,27 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -387157,7 +396802,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ - 368, /* Number of elements */ + 370, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -387264,7 +396909,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -387290,7 +396935,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x2B97, 0x2C00, 0x2E00, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -387377,10 +397022,10 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x101FD, 0x102E1, 0x102FC, - 0x16FE2, - 0x16FE4, 0x1BCA0, 0x1BCA4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -387394,7 +397039,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -387475,7 +397120,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -387485,6 +397130,8 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 
0x1F800, 0x1F80C, 0x1F810, @@ -387498,27 +397145,27 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -387536,7 +397183,7 @@ static const UV UNI_SC__ZYYY_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SD_invlist[] = { /* for ASCII/Latin1 */ - 63, /* Number of elements */ + 65, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -387602,7 +397249,9 @@ static const UV UNI_SD_invlist[] = { /* for ASCII/Latin1 */ 0x1D65E, 0x1D660, 0x1D692, - 0x1D694 + 0x1D694, + 0x1DF1A, + 0x1DF1B }; # endif /* ASCII/Latin1 */ @@ -387613,7 +397262,7 @@ static const UV UNI_SD_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SD_invlist[] = { /* for EBCDIC 1047 */ - 65, /* Number of elements */ + 67, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -387681,7 +397330,9 @@ static const UV UNI_SD_invlist[] = { /* for EBCDIC 1047 */ 0x1D65E, 0x1D660, 0x1D692, - 0x1D694 + 0x1D694, + 0x1DF1A, + 0x1DF1B }; # endif /* EBCDIC 1047 */ @@ -387692,7 +397343,7 @@ static const UV UNI_SD_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SD_invlist[] = { /* for EBCDIC 037 */ - 65, /* Number of elements */ + 67, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -387760,7 
+397411,9 @@ static const UV UNI_SD_invlist[] = { /* for EBCDIC 037 */ 0x1D65E, 0x1D660, 0x1D692, - 0x1D694 + 0x1D694, + 0x1DF1A, + 0x1DF1B }; # endif /* EBCDIC 037 */ @@ -387896,7 +397549,7 @@ static const UV UNI_SINHALAARCHAICNUMBERS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SK_invlist[] = { /* for ASCII/Latin1 */ - 61, /* Number of elements */ + 63, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -387927,6 +397580,8 @@ static const UV UNI_SK_invlist[] = { /* for ASCII/Latin1 */ 0x376, 0x384, 0x386, + 0x888, + 0x889, 0x1FBD, 0x1FBE, 0x1FBF, @@ -387952,7 +397607,7 @@ static const UV UNI_SK_invlist[] = { /* for ASCII/Latin1 */ 0xAB6A, 0xAB6C, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFF3E, 0xFF3F, 0xFF40, @@ -387971,7 +397626,7 @@ static const UV UNI_SK_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SK_invlist[] = { /* for EBCDIC 1047 */ - 59, /* Number of elements */ + 61, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -388000,6 +397655,8 @@ static const UV UNI_SK_invlist[] = { /* for EBCDIC 1047 */ 0x376, 0x384, 0x386, + 0x888, + 0x889, 0x1FBD, 0x1FBE, 0x1FBF, @@ -388025,7 +397682,7 @@ static const UV UNI_SK_invlist[] = { /* for EBCDIC 1047 */ 0xAB6A, 0xAB6C, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFF3E, 0xFF3F, 0xFF40, @@ -388044,7 +397701,7 @@ static const UV UNI_SK_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SK_invlist[] = { /* for EBCDIC 037 */ - 57, /* Number of elements */ + 59, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -388071,6 +397728,8 @@ static const UV UNI_SK_invlist[] = { /* for 
EBCDIC 037 */ 0x376, 0x384, 0x386, + 0x888, + 0x889, 0x1FBD, 0x1FBE, 0x1FBF, @@ -388096,7 +397755,7 @@ static const UV UNI_SK_invlist[] = { /* for EBCDIC 037 */ 0xAB6A, 0xAB6C, 0xFBB2, - 0xFBC2, + 0xFBC3, 0xFF3E, 0xFF3F, 0xFF40, @@ -388562,7 +398221,7 @@ static const UV UNI_SMALLKANAEXT_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ - 365, /* Number of elements */ + 373, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -388781,8 +398440,12 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0xA83A, 0xAA77, 0xAA7A, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFFE4, 0xFFE5, 0xFFE8, @@ -388819,6 +398482,8 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -388832,7 +398497,7 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -388883,7 +398548,7 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0x1F3FB, 0x1F400, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -388893,6 +398558,8 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -388906,27 +398573,27 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -388941,7 +398608,7 @@ static const UV UNI_SO_invlist[] = { /* for ASCII/Latin1 */ && '$' 
== 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ - 365, /* Number of elements */ + 373, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -389160,8 +398827,12 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0xA83A, 0xAA77, 0xAA7A, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFFE4, 0xFFE5, 0xFFE8, @@ -389198,6 +398869,8 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -389211,7 +398884,7 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -389262,7 +398935,7 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0x1F3FB, 0x1F400, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -389272,6 +398945,8 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -389285,27 +398960,27 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -389320,7 +398995,7 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ - 365, /* Number of elements */ + 373, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -389539,8 +399214,12 
@@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0xA83A, 0xAA77, 0xAA7A, + 0xFD40, + 0xFD50, + 0xFDCF, + 0xFDD0, 0xFDFD, - 0xFDFE, + 0xFE00, 0xFFE4, 0xFFE5, 0xFFE8, @@ -389577,6 +399256,8 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0x16B46, 0x1BC9C, 0x1BC9D, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -389590,7 +399271,7 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D242, 0x1D245, @@ -389641,7 +399322,7 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0x1F3FB, 0x1F400, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -389651,6 +399332,8 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -389664,27 +399347,27 @@ static const UV UNI_SO_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -389750,7 +399433,7 @@ static const UV UNI_SPECIALS_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ - 153, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -389763,7 +399446,7 @@ static const UV UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ 0x40, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -389801,6 +399484,8 @@ static const UV UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ -389813,6 +399498,8 @@ static const UV 
UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -389853,6 +399540,8 @@ static const UV UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -389917,7 +399606,7 @@ static const UV UNI_STERM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ - 153, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -389930,7 +399619,7 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ 0x70, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -389968,6 +399657,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ -389980,6 +399671,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -390020,6 +399713,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -390084,7 +399779,7 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_STERM_invlist[] = { /* for EBCDIC 037 */ - 153, /* Number of elements */ + 159, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -390097,7 +399792,7 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 037 */ 0x70, 0x589, 0x58A, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -390135,6 +399830,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 037 */ 0x1B5C, 0x1B5E, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C3D, 0x1C7E, @@ 
-390147,6 +399844,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 037 */ 0x2E2F, 0x2E3C, 0x2E3D, + 0x2E53, + 0x2E55, 0x3002, 0x3003, 0xA4FF, @@ -390187,6 +399886,8 @@ static const UV UNI_STERM_invlist[] = { /* for EBCDIC 037 */ 0x10A58, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x11049, 0x110BE, @@ -390402,7 +400103,7 @@ static const UV UNI_SYMBOLSFORLEGACYCOMPUTING_invlist[] = { /* for all charsets }; static const UV UNI_SYRC_invlist[] = { /* for all charsets */ - 23, /* Number of elements */ + 25, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -390428,7 +400129,9 @@ static const UV UNI_SYRC_invlist[] = { /* for all charsets */ 0x860, 0x86B, 0x1DF8, - 0x1DF9 + 0x1DF9, + 0x1DFA, + 0x1DFB }; static const UV UNI_SYRIACSUP_invlist[] = { /* for all charsets */ @@ -390488,7 +400191,7 @@ static const UV UNI_TAKR_invlist[] = { /* for all charsets */ 0xA830, 0xA83A, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA }; @@ -390624,7 +400327,7 @@ static const UV UNI_TANGUTSUP_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x18D00, - 0x18D90 + 0x18D80 }; static const UV UNI_TAVT_invlist[] = { /* for all charsets */ @@ -390640,7 +400343,7 @@ static const UV UNI_TAVT_invlist[] = { /* for all charsets */ }; static const UV UNI_TELU_invlist[] = { /* for all charsets */ - 33, /* Number of elements */ + 35, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -390657,7 +400360,7 @@ static const UV UNI_TELU_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -390667,6 +400370,8 @@ static const UV UNI_TELU_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -390682,7 +400387,7 @@ static const UV UNI_TELU_invlist[] = { /* for all charsets 
*/ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ - 209, /* Number of elements */ + 215, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -390709,7 +400414,7 @@ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ 0x60D, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -390757,6 +400462,8 @@ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ 0x1B5C, 0x1B5D, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -390775,6 +400482,8 @@ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, 0x3001, 0x3003, 0xA4FE, @@ -390835,6 +400544,8 @@ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BE, @@ -390905,7 +400616,7 @@ static const UV UNI_TERM_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_TERM_invlist[] = { /* for EBCDIC 1047 */ - 211, /* Number of elements */ + 217, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -390934,7 +400645,7 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 1047 */ 0x60D, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -390982,6 +400693,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 1047 */ 0x1B5C, 0x1B5D, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -391000,6 +400713,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 1047 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, 0x3001, 0x3003, 0xA4FE, @@ -391060,6 +400775,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 1047 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BE, @@ -391130,7 +400847,7 @@ static const UV UNI_TERM_invlist[] = { /* for 
EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_TERM_invlist[] = { /* for EBCDIC 037 */ - 211, /* Number of elements */ + 217, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -391159,7 +400876,7 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 037 */ 0x60D, 0x61B, 0x61C, - 0x61E, + 0x61D, 0x620, 0x6D4, 0x6D5, @@ -391207,6 +400924,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 037 */ 0x1B5C, 0x1B5D, 0x1B60, + 0x1B7D, + 0x1B7F, 0x1C3B, 0x1C40, 0x1C7E, @@ -391225,6 +400944,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 037 */ 0x2E4D, 0x2E4E, 0x2E50, + 0x2E53, + 0x2E55, 0x3001, 0x3003, 0xA4FE, @@ -391285,6 +401006,8 @@ static const UV UNI_TERM_invlist[] = { /* for EBCDIC 037 */ 0x10B9D, 0x10F55, 0x10F5A, + 0x10F86, + 0x10F8A, 0x11047, 0x1104E, 0x110BE, @@ -391370,9 +401093,9 @@ static const UV UNI_TGLG_invlist[] = { /* for all charsets */ 1 if it starts at the element beyond 0 */ 0x0, 0x1700, - 0x170D, - 0x170E, - 0x1715, + 0x1716, + 0x171F, + 0x1720, 0x1735, 0x1737 }; @@ -391453,6 +401176,28 @@ static const UV UNI_TIRH_invlist[] = { /* for all charsets */ 0x114DA }; +static const UV UNI_TNSA_invlist[] = { /* for all charsets */ + 5, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA +}; + +static const UV UNI_TOTO_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1E290, + 0x1E2AF +}; + static const UV UNI_TRANSPORTANDMAP_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -391483,6 +401228,16 @@ static const UV 
UNI_UCASEXT_invlist[] = { /* for all charsets */ 0x1900 }; +static const UV UNI_UCASEXTA_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x11AB0, + 0x11AC0 +}; + static const UV UNI_UGAR_invlist[] = { /* for all charsets */ 5, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -391504,7 +401259,7 @@ static const UV UNI_UIDEO_invlist[] = { /* for all charsets */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, + 0xA000, 0xFA0E, 0xFA10, 0xFA11, @@ -391520,9 +401275,9 @@ static const UV UNI_UIDEO_invlist[] = { /* for all charsets */ 0xFA27, 0xFA2A, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -391563,10 +401318,34 @@ static const UV UNI_VERTICALFORMS_invlist[] = { /* for all charsets */ 0xFE20 }; +static const UV UNI_VITH_invlist[] = { /* for all charsets */ + 17, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD +}; + # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_VO__R_invlist[] = { /* for ASCII/Latin1 */ - 177, /* Number of elements */ + 179, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -391720,15 +401499,17 @@ static const UV UNI_VO__R_invlist[] = { /* for ASCII/Latin1 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -391757,7 +401538,7 @@ static const UV UNI_VO__R_invlist[] = { /* for ASCII/Latin1 */ && '$' 
== 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_VO__R_invlist[] = { /* for EBCDIC 1047 */ - 175, /* Number of elements */ + 177, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -391909,15 +401690,17 @@ static const UV UNI_VO__R_invlist[] = { /* for EBCDIC 1047 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -391946,7 +401729,7 @@ static const UV UNI_VO__R_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_VO__R_invlist[] = { /* for EBCDIC 037 */ - 175, /* Number of elements */ + 177, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -392098,15 +401881,17 @@ static const UV UNI_VO__R_invlist[] = { /* for EBCDIC 037 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -392244,7 +402029,7 @@ static const UV UNI_VO__TU_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_VO__U_invlist[] = { /* for ASCII/Latin1 */ - 255, /* Number of elements */ + 257, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -392474,15 +402259,17 @@ static const UV UNI_VO__U_invlist[] = { /* for ASCII/Latin1 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -392513,7 +402300,7 @@ static const UV UNI_VO__U_invlist[] = { /* for 
ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 1047 */ - 253, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -392741,15 +402528,17 @@ static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 1047 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -392780,7 +402569,7 @@ static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 037 */ - 253, /* Number of elements */ + 255, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393008,15 +402797,17 @@ static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 037 */ 0x11580, 0x11600, 0x11A00, - 0x11AB0, + 0x11AC0, 0x13000, 0x13440, 0x14400, 0x14680, 0x16FE0, - 0x18D90, - 0x1B000, + 0x18D80, + 0x1AFF0, 0x1B300, + 0x1CF00, + 0x1CFD0, 0x1D000, 0x1D200, 0x1D2E0, @@ -393042,13 +402833,15 @@ static const UV UNI_VO__U_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_VS_invlist[] = { /* for all charsets */ - 7, /* Number of elements */ + 9, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ 0x0, 0x180B, 0x180E, + 0x180F, + 0x1810, 0xFE00, 0xFE10, 0xE0100, @@ -393217,7 +403010,7 @@ static const UV UNI_WB__EX_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ - 589, /* Number of elements */ + 607, /* Number of elements */ 148565664, /* Version and data structure type 
*/ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393270,7 +403063,9 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x82E, 0x859, 0x85C, - 0x8D3, + 0x898, + 0x8A0, + 0x8CA, 0x8E2, 0x8E3, 0x904, @@ -393354,6 +403149,8 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0xBD8, 0xC00, 0xC05, + 0xC3C, + 0xC3D, 0xC3E, 0xC45, 0xC46, @@ -393457,7 +403254,7 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x135D, 0x1360, 0x1712, - 0x1715, + 0x1716, 0x1732, 0x1735, 0x1752, @@ -393470,6 +403267,8 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x17DE, 0x180B, 0x180E, + 0x180F, + 0x1810, 0x1885, 0x1887, 0x18A9, @@ -393487,7 +403286,7 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x1A7F, 0x1A80, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, 0x1B05, 0x1B34, @@ -393513,8 +403312,6 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x1CF7, 0x1CFA, 0x1DC0, - 0x1DFA, - 0x1DFB, 0x1E00, 0x200C, 0x200D, @@ -393624,14 +403421,22 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x10EAD, 0x10F46, 0x10F51, + 0x10F82, + 0x10F86, 0x11000, 0x11003, 0x11038, 0x11047, + 0x11070, + 0x11071, + 0x11073, + 0x11075, 0x1107F, 0x11083, 0x110B0, 0x110BB, + 0x110C2, + 0x110C3, 0x11100, 0x11103, 0x11127, @@ -393762,6 +403567,10 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x16FF2, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -393798,6 +403607,8 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ 0x1E02B, 0x1E130, 0x1E137, + 0x1E2AE, + 0x1E2AF, 0x1E2EC, 0x1E2F0, 0x1E8D0, @@ -393815,7 +403626,7 @@ static const UV UNI_WB__EXTEND_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_WB__FO_invlist[] = { /* for ASCII/Latin1 */ - 39, /* Number of elements */ + 41, /* Number of elements */ 148565664, /* 
Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393830,6 +403641,8 @@ static const UV UNI_WB__FO_invlist[] = { /* for ASCII/Latin1 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -393868,7 +403681,7 @@ static const UV UNI_WB__FO_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 1047 */ - 39, /* Number of elements */ + 41, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393883,6 +403696,8 @@ static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 1047 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -393921,7 +403736,7 @@ static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 037 */ - 39, /* Number of elements */ + 41, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393936,6 +403751,8 @@ static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 037 */ 0x6DE, 0x70F, 0x710, + 0x890, + 0x892, 0x8E2, 0x8E3, 0x180E, @@ -393969,7 +403786,7 @@ static const UV UNI_WB__FO_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_WB__KA_invlist[] = { /* for all charsets */ - 21, /* Number of elements */ + 29, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -393990,8 +403807,16 @@ static const UV UNI_WB__KA_invlist[] = { /* for all charsets */ 0x3358, 0xFF66, 0xFF9E, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168 }; @@ -393999,7 +403824,7 @@ static const UV 
UNI_WB__KA_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ - 1095, /* Number of elements */ + 1141, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -394098,10 +403923,12 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -394230,6 +404057,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -394246,7 +404075,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -394343,10 +404172,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -394371,7 +404198,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -394475,10 +404302,6 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -394541,10 +404364,14 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0xA6A0, 0xA6F0, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -394678,12 +404505,34 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 
0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -394754,12 +404603,18 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -394878,7 +404733,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -394914,6 +404769,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -394922,6 +404779,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -395012,14 +404871,26 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -395108,7 +404979,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ - 1121, /* Number of elements */ + 1167, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -395233,10 +405104,12 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -395365,6 +405238,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -395381,7 +405256,7 @@ static const UV 
UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -395478,10 +405353,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -395506,7 +405379,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -395610,10 +405483,6 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -395676,10 +405545,14 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0xA6A0, 0xA6F0, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -395813,12 +405686,34 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -395889,12 +405784,18 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -396013,7 +405914,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -396049,6 +405950,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -396057,6 +405960,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 
0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -396147,14 +406052,26 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -396243,7 +406160,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ - 1117, /* Number of elements */ + 1163, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -396364,10 +406281,12 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -396496,6 +406415,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -396512,7 +406433,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -396609,10 +406530,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -396637,7 +406556,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -396741,10 +406660,6 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -396807,10 +406722,14 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0xA6A0, 0xA6F0, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 
0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -396944,12 +406863,34 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -397020,12 +406961,18 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -397144,7 +407091,7 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -397180,6 +407127,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -397188,6 +407137,8 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -397278,14 +407229,26 @@ static const UV UNI_WB__LE_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -397731,7 +407694,7 @@ static const UV UNI_WB__NL_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_WB__NU_invlist[] = { /* for ASCII/Latin1 */ - 125, /* Number of elements */ + 127, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element 
beyond 0 */ @@ -397848,6 +407811,8 @@ static const UV UNI_WB__NU_invlist[] = { /* for ASCII/Latin1 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -397870,7 +407835,7 @@ static const UV UNI_WB__NU_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_WB__NU_invlist[] = { /* for EBCDIC 1047 */ - 125, /* Number of elements */ + 127, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -397987,6 +407952,8 @@ static const UV UNI_WB__NU_invlist[] = { /* for EBCDIC 1047 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -398009,7 +407976,7 @@ static const UV UNI_WB__NU_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_WB__NU_invlist[] = { /* for EBCDIC 037 */ - 125, /* Number of elements */ + 127, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -398126,6 +408093,8 @@ static const UV UNI_WB__NU_invlist[] = { /* for EBCDIC 037 */ 0x11DAA, 0x16A60, 0x16A6A, + 0x16AC0, + 0x16ACA, 0x16B50, 0x16B5A, 0x1D7CE, @@ -398271,7 +408240,7 @@ static const UV UNI_WB__WSEGSPACE_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ - 1487, /* Number of elements */ + 1541, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -398392,11 +408361,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x964, 0x966, 0x970, @@ -398562,7 +408533,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for 
ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -398572,6 +408543,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -398596,7 +408569,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -398761,10 +408734,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -398781,8 +408752,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x17E0, 0x17EA, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -398811,9 +408780,9 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -398837,8 +408806,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -398937,10 +408904,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -399019,10 +408982,14 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0xA67F, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -399218,12 +409185,34 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -399304,6 +409293,8 @@ static const UV 
UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -399311,11 +409302,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -399458,7 +409451,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -399510,6 +409503,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -399522,6 +409517,10 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -399550,8 +409549,16 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -399566,6 +409573,10 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -399650,6 +409661,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -399668,8 +409681,18 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -399772,7 +409795,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ - 1511, /* Number of elements */ + 1565, 
/* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -399917,11 +409940,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x964, 0x966, 0x970, @@ -400087,7 +410112,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -400097,6 +410122,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -400121,7 +410148,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -400286,10 +410313,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -400306,8 +410331,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x17E0, 0x17EA, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -400336,9 +410359,9 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -400362,8 +410385,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -400462,10 +410483,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -400544,10 +410561,14 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0xA67F, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -400743,12 +410764,34 @@ static const 
UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -400829,6 +410872,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -400836,11 +410881,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -400983,7 +411030,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -401035,6 +411082,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -401047,6 +411096,10 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -401075,8 +411128,16 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -401091,6 +411152,10 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -401175,6 +411240,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -401193,8 +411260,18 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 
*/ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -401297,7 +411374,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ - 1507, /* Number of elements */ + 1561, /* Number of elements */ 148565664, /* Version and data structure type */ 0, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -401438,11 +411515,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x890, + 0x892, + 0x898, 0x964, 0x966, 0x970, @@ -401608,7 +411687,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -401618,6 +411697,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -401642,7 +411723,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -401807,10 +411888,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -401827,8 +411906,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x17E0, 0x17EA, 0x180B, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -401857,9 +411934,9 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1A90, 0x1A9A, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -401883,8 +411960,6 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -401983,10 +412058,6 @@ static const 
UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x24B6, 0x24EA, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -402065,10 +412136,14 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0xA67F, 0xA6F2, 0xA708, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -402264,12 +412339,34 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -402350,6 +412447,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -402357,11 +412456,13 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, 0x110BD, 0x110BE, + 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -402504,7 +412605,7 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -402556,6 +412657,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x13430, @@ -402568,6 +412671,10 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -402596,8 +412703,16 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x16FE5, 0x16FF0, 0x16FF2, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, 0x1B001, + 0x1B120, + 0x1B123, 0x1B164, 0x1B168, 0x1BC00, @@ -402612,6 +412727,10 
@@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1BC9F, 0x1BCA0, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -402696,6 +412815,8 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -402714,8 +412835,18 @@ static const UV UNI_WB__XX_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -402827,7 +412958,7 @@ static const UV UNI_WCHO_invlist[] = { /* for all charsets */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ - 1475, /* Number of elements */ + 1527, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -402934,11 +413065,11 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -403106,7 +413237,7 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -403116,6 +413247,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -403140,7 +413273,7 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -403307,10 +413440,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -403330,7 +413461,7 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ 
-403369,9 +413500,9 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -403395,8 +413526,6 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -403477,10 +413606,6 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -403543,8 +413668,6 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -403563,10 +413686,14 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -403756,12 +413883,34 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -403842,6 +413991,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -403849,9 +414000,11 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -403958,6 +414111,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -403994,7 +414149,7 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x11A9A, 0x11A9D, 
0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -404046,6 +414201,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -404056,6 +414213,10 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -404090,8 +414251,14 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -404108,6 +414275,10 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -404194,6 +414365,8 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -404212,8 +414385,18 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -404291,9 +414474,9 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -404316,7 +414499,7 @@ static const UV UNI_XIDC_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ - 1499, /* Number of elements */ + 1551, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -404447,11 +414630,11 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 
0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -404619,7 +414802,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -404629,6 +414812,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -404653,7 +414838,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -404820,10 +415005,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -404843,7 +415026,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -404882,9 +415065,9 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -404908,8 +415091,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -404990,10 +415171,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -405056,8 +415233,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -405076,10 +415251,14 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -405269,12 +415448,34 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 
0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -405355,6 +415556,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -405362,9 +415565,11 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -405471,6 +415676,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -405507,7 +415714,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -405559,6 +415766,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -405569,6 +415778,10 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -405603,8 +415816,14 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -405621,6 +415840,10 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -405707,6 +415930,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -405725,8 +415950,18 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 
0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -405804,9 +416039,9 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -405829,7 +416064,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ - 1495, /* Number of elements */ + 1547, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -405956,11 +416191,11 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x85C, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x888, + 0x889, + 0x88F, + 0x898, 0x8E2, 0x8E3, 0x964, @@ -406128,7 +416363,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -406138,6 +416373,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -406162,7 +416399,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -406329,10 +416566,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1735, 0x1740, 0x1754, @@ -406352,7 +416587,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x17EA, 0x180B, 0x180E, - 0x1810, + 0x180F, 0x181A, 0x1820, 0x1879, @@ -406391,9 +416626,9 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1AB0, 0x1ABE, 0x1ABF, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, 0x1B5A, 0x1B6B, @@ -406417,8 +416652,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 
0x1CD4, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -406499,10 +416732,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CF4, @@ -406565,8 +416794,6 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -406585,10 +416812,14 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA828, 0xA82C, 0xA82D, @@ -406778,12 +417009,34 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -406864,6 +417117,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F51, + 0x10F70, + 0x10F86, 0x10FB0, 0x10FC5, 0x10FE0, @@ -406871,9 +417126,11 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x11000, 0x11047, 0x11066, - 0x11070, + 0x11076, 0x1107F, 0x110BB, + 0x110C2, + 0x110C3, 0x110D0, 0x110E9, 0x110F0, @@ -406980,6 +417237,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1172C, 0x11730, 0x1173A, + 0x11740, + 0x11747, 0x11800, 0x1183B, 0x118A0, @@ -407016,7 +417275,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x11A9A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -407068,6 +417327,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -407078,6 +417339,10 @@ static const UV UNI_XIDC_invlist[] = { /* 
for EBCDIC 037 */ 0x16A5F, 0x16A60, 0x16A6A, + 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -407112,8 +417377,14 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -407130,6 +417401,10 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1BC9A, 0x1BC9D, 0x1BC9F, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, 0x1D165, 0x1D16A, 0x1D16D, @@ -407216,6 +417491,8 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -407234,8 +417511,18 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1E14A, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8D0, @@ -407313,9 +417600,9 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -407335,7 +417622,7 @@ static const UV UNI_XIDC_invlist[] = { /* for EBCDIC 037 */ # if 'A' == 65 /* ASCII/Latin1 */ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ - 1259, /* Number of elements */ + 1311, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -407438,10 +417725,12 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -407570,6 +417859,8 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -407586,7 +417877,7 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0xCBA, 0xCBD, 
0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -407729,10 +418020,8 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -407773,7 +418062,7 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -407873,10 +418162,6 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -407937,8 +418222,6 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -407959,10 +418242,14 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -408154,12 +418441,34 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -408230,12 +418539,18 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -408318,6 +418633,8 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -408356,7 +418673,7 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, 
@@ -408392,6 +418709,8 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -408400,6 +418719,8 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -408428,8 +418749,14 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -408504,14 +418831,26 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -408585,9 +418924,9 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -408608,7 +418947,7 @@ static const UV UNI_XIDS_invlist[] = { /* for ASCII/Latin1 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 21 static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ - 1285, /* Number of elements */ + 1337, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -408737,10 +419076,12 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -408869,6 +419210,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -408885,7 +419228,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 
0xCE0, 0xCE2, @@ -409028,10 +419371,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -409072,7 +419413,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -409172,10 +419513,6 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -409236,8 +419573,6 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -409258,10 +419593,14 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -409453,12 +419792,34 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -409529,12 +419890,18 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -409617,6 +419984,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -409655,7 +420024,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -409691,6 +420060,8 @@ static const UV 
UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x1246F, 0x12480, 0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -409699,6 +420070,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -409727,8 +420100,14 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -409803,14 +420182,26 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -409884,9 +420275,9 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -409907,7 +420298,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 1047 */ && '$' == 91 && '@' == 124 && '`' == 121 && '\n' == 37 static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ - 1281, /* Number of elements */ + 1333, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -410032,10 +420423,12 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x859, 0x860, 0x86B, + 0x870, + 0x888, + 0x889, + 0x88F, 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, + 0x8CA, 0x904, 0x93A, 0x93D, @@ -410164,6 +420557,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0xC3E, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC62, 0xC80, @@ -410180,7 +420575,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0xCBA, 0xCBD, 0xCBE, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE2, @@ -410323,10 +420718,8 @@ static const UV 
UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x16EE, 0x16F9, 0x1700, - 0x170D, - 0x170E, 0x1712, - 0x1720, + 0x171F, 0x1732, 0x1740, 0x1752, @@ -410367,7 +420760,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x1B05, 0x1B34, 0x1B45, - 0x1B4C, + 0x1B4D, 0x1B83, 0x1BA1, 0x1BAE, @@ -410467,10 +420860,6 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x2160, 0x2189, 0x2C00, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CE5, 0x2CEB, 0x2CEF, @@ -410531,8 +420920,6 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x3400, 0x4DC0, 0x4E00, - 0x9FFD, - 0xA000, 0xA48D, 0xA4D0, 0xA4FE, @@ -410553,10 +420940,14 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0xA722, 0xA789, 0xA78B, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA802, 0xA803, 0xA806, @@ -410748,12 +421139,34 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x10528, 0x10530, 0x10564, + 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -410824,12 +421237,18 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x10F28, 0x10F30, 0x10F46, + 0x10F70, + 0x10F82, 0x10FB0, 0x10FC5, 0x10FE0, 0x10FF7, 0x11003, 0x11038, + 0x11071, + 0x11073, + 0x11075, + 0x11076, 0x11083, 0x110B0, 0x110D0, @@ -410912,6 +421331,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x116B9, 0x11700, 0x1171B, + 0x11740, + 0x11747, 0x11800, 0x1182C, 0x118A0, @@ -410950,7 +421371,7 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x11A8A, 0x11A9D, 0x11A9E, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -410986,6 +421407,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x1246F, 0x12480, 
0x12544, + 0x12F90, + 0x12FF1, 0x13000, 0x1342F, 0x14400, @@ -410994,6 +421417,8 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x16A39, 0x16A40, 0x16A5F, + 0x16A70, + 0x16ABF, 0x16AD0, 0x16AEE, 0x16B00, @@ -411022,8 +421447,14 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -411098,14 +421529,26 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x1D7C3, 0x1D7C4, 0x1D7CC, + 0x1DF00, + 0x1DF1F, 0x1E100, 0x1E12D, 0x1E137, 0x1E13E, 0x1E14E, 0x1E14F, + 0x1E290, + 0x1E2AE, 0x1E2C0, 0x1E2EC, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E900, @@ -411179,9 +421622,9 @@ static const UV UNI_XIDS_invlist[] = { /* for EBCDIC 037 */ 0x1EEAB, 0x1EEBC, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -411404,6 +421847,16 @@ static const UV UNI_ZL_invlist[] = { /* for all charsets */ 0x2029 }; +static const UV UNI_ZNAMENNYMUSIC_invlist[] = { /* for all charsets */ + 3, /* Number of elements */ + 148565664, /* Version and data structure type */ + 1, /* 0 if the list starts at 0; + 1 if it starts at the element beyond 0 */ + 0x0, + 0x1CF00, + 0x1CFD0 +}; + static const UV UNI_ZP_invlist[] = { /* for all charsets */ 3, /* Number of elements */ 148565664, /* Version and data structure type */ @@ -411554,7 +422007,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -411582,7 +422035,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -411619,8 +422072,6 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0xAB5C, 0xAB6A, 0xAB6C, - 0xFD3E, - 0xFD40, 0xFE10, 0xFE1A, 0xFE30, @@ -411649,8 +422100,8 @@ static 
const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1019D, 0x101D0, 0x101FD, - 0x16FE2, - 0x16FE4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -411664,7 +422115,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -411743,7 +422194,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -411753,6 +422204,8 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -411766,27 +422219,27 @@ static const UV UNI_ZYYY_invlist[] = { /* for ASCII/Latin1 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -411890,7 +422343,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -411918,7 +422371,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -411955,8 +422408,6 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0xAB5C, 0xAB6A, 0xAB6C, - 0xFD3E, - 0xFD40, 0xFE10, 0xFE1A, 0xFE30, @@ -411985,8 +422436,8 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1019D, 0x101D0, 0x101FD, - 0x16FE2, - 0x16FE4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -412000,7 +422451,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -412079,7 +422530,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 
0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -412089,6 +422540,8 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -412102,27 +422555,27 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 1047 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -412222,7 +422675,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x2080, 0x208F, 0x20A0, - 0x20C0, + 0x20C1, 0x2100, 0x2126, 0x2127, @@ -412250,7 +422703,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x2E00, 0x2E43, 0x2E44, - 0x2E53, + 0x2E5E, 0x2FF0, 0x2FFC, 0x3000, @@ -412287,8 +422740,6 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0xAB5C, 0xAB6A, 0xAB6C, - 0xFD3E, - 0xFD40, 0xFE10, 0xFE1A, 0xFE30, @@ -412317,8 +422768,8 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1019D, 0x101D0, 0x101FD, - 0x16FE2, - 0x16FE4, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, @@ -412332,7 +422783,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1D18C, 0x1D1AA, 0x1D1AE, - 0x1D1E9, + 0x1D1EB, 0x1D2E0, 0x1D2F4, 0x1D300, @@ -412411,7 +422862,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -412421,6 +422872,8 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -412434,27 +422887,27 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 
0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -412470,7 +422923,7 @@ static const UV UNI_ZYYY_invlist[] = { /* for EBCDIC 037 */ # endif /* EBCDIC 037 */ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ - 1350, /* Number of elements */ + 1392, /* Number of elements */ 148565664, /* Version and data structure type */ 1, /* 0 if the list starts at 0; 1 if it starts at the element beyond 0 */ @@ -412499,8 +422952,6 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x5EF, 0x5F5, 0x600, - 0x61D, - 0x61E, 0x70E, 0x70F, 0x74B, @@ -412518,11 +422969,11 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x85F, 0x860, 0x86B, - 0x8A0, - 0x8B5, - 0x8B6, - 0x8C8, - 0x8D3, + 0x870, + 0x88F, + 0x890, + 0x892, + 0x898, 0x984, 0x985, 0x98D, @@ -412678,7 +423129,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0xC29, 0xC2A, 0xC3A, - 0xC3D, + 0xC3C, 0xC45, 0xC46, 0xC49, @@ -412688,6 +423139,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0xC57, 0xC58, 0xC5B, + 0xC5D, + 0xC5E, 0xC60, 0xC64, 0xC66, @@ -412710,7 +423163,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0xCCE, 0xCD5, 0xCD7, - 0xCDE, + 0xCDD, 0xCDF, 0xCE0, 0xCE4, @@ -412845,10 +423298,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x16A0, 0x16F9, 0x1700, - 0x170D, - 0x170E, - 0x1715, - 0x1720, + 0x1716, + 0x171F, 0x1737, 0x1740, 0x1754, @@ -412865,8 +423316,6 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x17F0, 0x17FA, 0x1800, - 0x180F, - 0x1810, 0x181A, 0x1820, 0x1879, @@ -412905,11 +423354,11 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1AA0, 0x1AAE, 0x1AB0, - 0x1AC1, + 0x1ACF, 0x1B00, - 0x1B4C, + 0x1B4D, 0x1B50, - 0x1B7D, + 0x1B7F, 0x1B80, 
0x1BF4, 0x1BFC, @@ -412925,8 +423374,6 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1CD0, 0x1CFB, 0x1D00, - 0x1DFA, - 0x1DFB, 0x1F16, 0x1F18, 0x1F1E, @@ -412967,7 +423414,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x2090, 0x209D, 0x20A0, - 0x20C0, + 0x20C1, 0x20D0, 0x20F1, 0x2100, @@ -412981,10 +423428,6 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x2B76, 0x2B96, 0x2B97, - 0x2C2F, - 0x2C30, - 0x2C5F, - 0x2C60, 0x2CF4, 0x2CF9, 0x2D26, @@ -413015,7 +423458,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x2DD8, 0x2DDF, 0x2DE0, - 0x2E53, + 0x2E5E, 0x2E80, 0x2E9A, 0x2E9B, @@ -413039,8 +423482,6 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x31F0, 0x321F, 0x3220, - 0x9FFD, - 0xA000, 0xA48D, 0xA490, 0xA4C7, @@ -413049,10 +423490,14 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0xA640, 0xA6F8, 0xA700, - 0xA7C0, - 0xA7C2, 0xA7CB, - 0xA7F5, + 0xA7D0, + 0xA7D2, + 0xA7D3, + 0xA7D4, + 0xA7D5, + 0xA7DA, + 0xA7F2, 0xA82D, 0xA830, 0xA83A, @@ -413123,16 +423568,14 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0xFB43, 0xFB45, 0xFB46, - 0xFBC2, + 0xFBC3, 0xFBD3, - 0xFD40, - 0xFD50, 0xFD90, 0xFD92, 0xFDC8, + 0xFDCF, + 0xFDD0, 0xFDF0, - 0xFDFE, - 0xFE00, 0xFE1A, 0xFE20, 0xFE53, @@ -413219,13 +423662,33 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x10530, 0x10564, 0x1056F, - 0x10570, + 0x1057B, + 0x1057C, + 0x1058B, + 0x1058C, + 0x10593, + 0x10594, + 0x10596, + 0x10597, + 0x105A2, + 0x105A3, + 0x105B2, + 0x105B3, + 0x105BA, + 0x105BB, + 0x105BD, 0x10600, 0x10737, 0x10740, 0x10756, 0x10760, 0x10768, + 0x10780, + 0x10786, + 0x10787, + 0x107B1, + 0x107B2, + 0x107BB, 0x10800, 0x10806, 0x10808, @@ -413312,6 +423775,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x10F28, 0x10F30, 0x10F5A, + 0x10F70, + 0x10F8A, 0x10FB0, 0x10FCC, 0x10FE0, @@ -413319,9 +423784,9 @@ static const UV UNI_ZZZZ_invlist[] = { /* for 
all charsets */ 0x11000, 0x1104E, 0x11052, - 0x11070, + 0x11076, 0x1107F, - 0x110C2, + 0x110C3, 0x110CD, 0x110CE, 0x110D0, @@ -413405,7 +423870,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x11660, 0x1166D, 0x11680, - 0x116B9, + 0x116BA, 0x116C0, 0x116CA, 0x11700, @@ -413413,7 +423878,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1171D, 0x1172C, 0x11730, - 0x11740, + 0x11747, 0x11800, 0x1183C, 0x118A0, @@ -413444,7 +423909,7 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x11A48, 0x11A50, 0x11AA3, - 0x11AC0, + 0x11AB0, 0x11AF9, 0x11C00, 0x11C09, @@ -413500,6 +423965,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x12475, 0x12480, 0x12544, + 0x12F90, + 0x12FF3, 0x13000, 0x1342F, 0x13430, @@ -413513,7 +423980,9 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x16A60, 0x16A6A, 0x16A6E, - 0x16A70, + 0x16ABF, + 0x16AC0, + 0x16ACA, 0x16AD0, 0x16AEE, 0x16AF0, @@ -413546,8 +424015,14 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x18CD6, 0x18D00, 0x18D09, + 0x1AFF0, + 0x1AFF4, + 0x1AFF5, + 0x1AFFC, + 0x1AFFD, + 0x1AFFF, 0x1B000, - 0x1B11F, + 0x1B123, 0x1B150, 0x1B153, 0x1B164, @@ -413564,12 +424039,18 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1BC9A, 0x1BC9C, 0x1BCA4, + 0x1CF00, + 0x1CF2E, + 0x1CF30, + 0x1CF47, + 0x1CF50, + 0x1CFC4, 0x1D000, 0x1D0F6, 0x1D100, 0x1D127, 0x1D129, - 0x1D1E9, + 0x1D1EB, 0x1D200, 0x1D246, 0x1D2E0, @@ -413624,6 +424105,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1DAA0, 0x1DAA1, 0x1DAB0, + 0x1DF00, + 0x1DF1F, 0x1E000, 0x1E007, 0x1E008, @@ -413642,10 +424125,20 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1E14A, 0x1E14E, 0x1E150, + 0x1E290, + 0x1E2AF, 0x1E2C0, 0x1E2FA, 0x1E2FF, 0x1E300, + 0x1E7E0, + 0x1E7E7, + 0x1E7E8, + 0x1E7EC, + 0x1E7ED, + 0x1E7EF, + 0x1E7F0, + 0x1E7FF, 0x1E800, 0x1E8C5, 0x1E8C7, @@ -413754,7 +424247,7 @@ static const UV UNI_ZZZZ_invlist[] = 
{ /* for all charsets */ 0x1F266, 0x1F300, 0x1F6D8, - 0x1F6E0, + 0x1F6DD, 0x1F6ED, 0x1F6F0, 0x1F6FD, @@ -413764,6 +424257,8 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1F7D9, 0x1F7E0, 0x1F7EC, + 0x1F7F0, + 0x1F7F1, 0x1F800, 0x1F80C, 0x1F810, @@ -413777,27 +424272,27 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1F8B0, 0x1F8B2, 0x1F900, - 0x1F979, - 0x1F97A, - 0x1F9CC, - 0x1F9CD, 0x1FA54, 0x1FA60, 0x1FA6E, 0x1FA70, 0x1FA75, 0x1FA78, - 0x1FA7B, + 0x1FA7D, 0x1FA80, 0x1FA87, 0x1FA90, - 0x1FAA9, + 0x1FAAD, 0x1FAB0, - 0x1FAB7, + 0x1FABB, 0x1FAC0, - 0x1FAC3, + 0x1FAC6, 0x1FAD0, - 0x1FAD7, + 0x1FADA, + 0x1FAE0, + 0x1FAE8, + 0x1FAF0, + 0x1FAF7, 0x1FB00, 0x1FB93, 0x1FB94, @@ -413805,9 +424300,9 @@ static const UV UNI_ZZZZ_invlist[] = { /* for all charsets */ 0x1FBF0, 0x1FBFA, 0x20000, - 0x2A6DE, + 0x2A6E0, 0x2A700, - 0x2B735, + 0x2B739, 0x2B740, 0x2B81E, 0x2B820, @@ -413982,6 +424477,7 @@ typedef enum { UNI_AGE__12, UNI_AGE__12_DOT_1, UNI_AGE__13, + UNI_AGE__14, UNI_AGE__2, UNI_AGE__2_DOT_1, UNI_AGE__3, @@ -414011,6 +424507,7 @@ typedef enum { UNI_ANY, UNI_ARAB, UNI_ARABICEXTA, + UNI_ARABICEXTB, UNI_ARABICMATH, UNI_ARABICPFA, UNI_ARABICPFB, @@ -414158,6 +424655,7 @@ typedef enum { UNI_COPT, UNI_COPTICEPACTNUMBERS, UNI_COUNTINGROD, + UNI_CPMN, UNI_CPRT, UNI_CUNEIFORMNUMBERS, UNI_CURRENCYSYMBOLS, @@ -414231,6 +424729,7 @@ typedef enum { UNI_ETHI, UNI_ETHIOPICEXT, UNI_ETHIOPICEXTA, + UNI_ETHIOPICEXTB, UNI_ETHIOPICSUP, UNI_EXT, UNI_EXTPICT, @@ -414318,6 +424817,7 @@ typedef enum { UNI_INCHORASMIAN, UNI_INCOPTIC, UNI_INCUNEIFORM, + UNI_INCYPROMINOAN, UNI_INCYRILLIC, UNI_INDEVANAGARI, UNI_INDICNUMBERFORMS, @@ -414394,6 +424894,7 @@ typedef enum { UNI_INOLDPERSIAN, UNI_INOLDSOGDIAN, UNI_INOLDTURKIC, + UNI_INOLDUYGHUR, UNI_INORIYA, UNI_INOSAGE, UNI_INOSMANYA, @@ -414472,6 +424973,7 @@ typedef enum { UNI_INTAIVIET, UNI_INTAKRI, UNI_INTAMIL, + UNI_INTANGSA, UNI_INTANGUT, UNI_INTELUGU, UNI_INTHAANA, @@ -414479,8 +424981,10 @@ typedef enum { 
UNI_INTIBETAN, UNI_INTIFINAGH, UNI_INTIRHUTA, + UNI_INTOTO, UNI_INUGARITIC, UNI_INVAI, + UNI_INVITHKUQI, UNI_INVS, UNI_INWANCHO, UNI_INWARANGCITI, @@ -414491,6 +424995,7 @@ typedef enum { UNI_IN__12, UNI_IN__12_DOT_1, UNI_IN__13, + UNI_IN__14, UNI_IN__1_DOT_1, UNI_IN__2, UNI_IN__2_DOT_1, @@ -414609,6 +425114,8 @@ typedef enum { UNI_JG__TAW, UNI_JG__TEHMARBUTA, UNI_JG__TETH, + UNI_JG__THINYEH, + UNI_JG__VERTICALTAIL, UNI_JG__WAW, UNI_JG__YEH, UNI_JG__YEHBARREE, @@ -414627,6 +425134,7 @@ typedef enum { UNI_KALI, UNI_KANA, UNI_KANAEXTA, + UNI_KANAEXTB, UNI_KANASUP, UNI_KANBUN, UNI_KANGXI, @@ -414648,6 +425156,8 @@ typedef enum { UNI_LATINEXTC, UNI_LATINEXTD, UNI_LATINEXTE, + UNI_LATINEXTF, + UNI_LATINEXTG, UNI_LATN, UNI_LB__AI, UNI_LB__AL, @@ -414912,6 +425422,7 @@ typedef enum { UNI_OSGE, UNI_OSMA, UNI_OTTOMANSIYAQNUMBERS, + UNI_OUGR, UNI_P, UNI_PALM, UNI_PATSYN, @@ -414982,6 +425493,7 @@ typedef enum { UNI_SC__BUHD, UNI_SC__CAKM, UNI_SC__COPT, + UNI_SC__CPMN, UNI_SC__CPRT, UNI_SC__CYRL, UNI_SC__DEVA, @@ -415018,7 +425530,9 @@ typedef enum { UNI_SC__MULT, UNI_SC__MYMR, UNI_SC__NAND, + UNI_SC__NKO, UNI_SC__ORYA, + UNI_SC__OUGR, UNI_SC__PERM, UNI_SC__PHAG, UNI_SC__PHLP, @@ -415099,9 +425613,12 @@ typedef enum { UNI_TIBT, UNI_TIRH, UNI_TITLE, + UNI_TNSA, + UNI_TOTO, UNI_TRANSPORTANDMAP, UNI_UCAS, UNI_UCASEXT, + UNI_UCASEXTA, UNI_UGAR, UNI_UIDEO, UNI_UPPERCASELETTER, @@ -415109,6 +425626,7 @@ typedef enum { UNI_VEDICEXT, UNI_VERTICALFORMS, UNI_VERTSPACE, + UNI_VITH, UNI_VO__R, UNI_VO__TR, UNI_VO__TU, @@ -415157,6 +425675,7 @@ typedef enum { UNI_Z, UNI_ZANB, UNI_ZL, + UNI_ZNAMENNYMUSIC, UNI_ZP, UNI_ZS, UNI_ZYYY, @@ -415191,6 +425710,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_AGE__12_invlist, UNI_AGE__12_DOT_1_invlist, UNI_AGE__13_invlist, + UNI_AGE__14_invlist, UNI_AGE__2_invlist, UNI_AGE__2_DOT_1_invlist, UNI_AGE__3_invlist, @@ -415220,6 +425740,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_ANY_invlist, UNI_ARAB_invlist, UNI_ARABICEXTA_invlist, + 
UNI_ARABICEXTB_invlist, UNI_ARABICMATH_invlist, UNI_ARABICPFA_invlist, UNI_ARABICPFB_invlist, @@ -415367,6 +425888,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_COPT_invlist, UNI_COPTICEPACTNUMBERS_invlist, UNI_COUNTINGROD_invlist, + UNI_CPMN_invlist, UNI_CPRT_invlist, UNI_CUNEIFORMNUMBERS_invlist, UNI_CURRENCYSYMBOLS_invlist, @@ -415440,6 +425962,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_ETHI_invlist, UNI_ETHIOPICEXT_invlist, UNI_ETHIOPICEXTA_invlist, + UNI_ETHIOPICEXTB_invlist, UNI_ETHIOPICSUP_invlist, UNI_EXT_invlist, UNI_EXTPICT_invlist, @@ -415527,6 +426050,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_INCHORASMIAN_invlist, UNI_INCOPTIC_invlist, UNI_INCUNEIFORM_invlist, + UNI_INCYPROMINOAN_invlist, UNI_INCYRILLIC_invlist, UNI_INDEVANAGARI_invlist, UNI_INDICNUMBERFORMS_invlist, @@ -415603,6 +426127,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_INOLDPERSIAN_invlist, UNI_INOLDSOGDIAN_invlist, UNI_INOLDTURKIC_invlist, + UNI_INOLDUYGHUR_invlist, UNI_INORIYA_invlist, UNI_INOSAGE_invlist, UNI_INOSMANYA_invlist, @@ -415681,6 +426206,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_INTAIVIET_invlist, UNI_INTAKRI_invlist, UNI_INTAMIL_invlist, + UNI_INTANGSA_invlist, UNI_INTANGUT_invlist, UNI_INTELUGU_invlist, UNI_INTHAANA_invlist, @@ -415688,8 +426214,10 @@ static const UV * const uni_prop_ptrs[] = { UNI_INTIBETAN_invlist, UNI_INTIFINAGH_invlist, UNI_INTIRHUTA_invlist, + UNI_INTOTO_invlist, UNI_INUGARITIC_invlist, UNI_INVAI_invlist, + UNI_INVITHKUQI_invlist, UNI_INVS_invlist, UNI_INWANCHO_invlist, UNI_INWARANGCITI_invlist, @@ -415700,6 +426228,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_IN__12_invlist, UNI_IN__12_DOT_1_invlist, UNI_IN__13_invlist, + UNI_IN__14_invlist, UNI_IN__1_DOT_1_invlist, UNI_IN__2_invlist, UNI_IN__2_DOT_1_invlist, @@ -415818,6 +426347,8 @@ static const UV * const uni_prop_ptrs[] = { UNI_JG__TAW_invlist, UNI_JG__TEHMARBUTA_invlist, UNI_JG__TETH_invlist, + UNI_JG__THINYEH_invlist, + 
UNI_JG__VERTICALTAIL_invlist, UNI_JG__WAW_invlist, UNI_JG__YEH_invlist, UNI_JG__YEHBARREE_invlist, @@ -415836,6 +426367,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_KALI_invlist, UNI_KANA_invlist, UNI_KANAEXTA_invlist, + UNI_KANAEXTB_invlist, UNI_KANASUP_invlist, UNI_KANBUN_invlist, UNI_KANGXI_invlist, @@ -415857,6 +426389,8 @@ static const UV * const uni_prop_ptrs[] = { UNI_LATINEXTC_invlist, UNI_LATINEXTD_invlist, UNI_LATINEXTE_invlist, + UNI_LATINEXTF_invlist, + UNI_LATINEXTG_invlist, UNI_LATN_invlist, UNI_LB__AI_invlist, UNI_LB__AL_invlist, @@ -416121,6 +426655,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_OSGE_invlist, UNI_OSMA_invlist, UNI_OTTOMANSIYAQNUMBERS_invlist, + UNI_OUGR_invlist, UNI_P_invlist, UNI_PALM_invlist, UNI_PATSYN_invlist, @@ -416191,6 +426726,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_SC__BUHD_invlist, UNI_SC__CAKM_invlist, UNI_SC__COPT_invlist, + UNI_SC__CPMN_invlist, UNI_SC__CPRT_invlist, UNI_SC__CYRL_invlist, UNI_SC__DEVA_invlist, @@ -416227,7 +426763,9 @@ static const UV * const uni_prop_ptrs[] = { UNI_SC__MULT_invlist, UNI_SC__MYMR_invlist, UNI_SC__NAND_invlist, + UNI_SC__NKO_invlist, UNI_SC__ORYA_invlist, + UNI_SC__OUGR_invlist, UNI_SC__PERM_invlist, UNI_SC__PHAG_invlist, UNI_SC__PHLP_invlist, @@ -416308,9 +426846,12 @@ static const UV * const uni_prop_ptrs[] = { UNI_TIBT_invlist, UNI_TIRH_invlist, UNI_TITLE_invlist, + UNI_TNSA_invlist, + UNI_TOTO_invlist, UNI_TRANSPORTANDMAP_invlist, UNI_UCAS_invlist, UNI_UCASEXT_invlist, + UNI_UCASEXTA_invlist, UNI_UGAR_invlist, UNI_UIDEO_invlist, UNI_UPPERCASELETTER_invlist, @@ -416318,6 +426859,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_VEDICEXT_invlist, UNI_VERTICALFORMS_invlist, UNI_VERTSPACE_invlist, + UNI_VITH_invlist, UNI_VO__R_invlist, UNI_VO__TR_invlist, UNI_VO__TU_invlist, @@ -416366,6 +426908,7 @@ static const UV * const uni_prop_ptrs[] = { UNI_Z_invlist, UNI_ZANB_invlist, UNI_ZL_invlist, + UNI_ZNAMENNYMUSIC_invlist, UNI_ZP_invlist, UNI_ZS_invlist, 
UNI_ZYYY_invlist, @@ -416460,6 +427003,7 @@ static const char * const UNI_age_values[] = { "12.0", "12.1", "13.0", + "14.0", "NA", "na", "Unassigned", @@ -416469,6 +427013,7 @@ static const char * const UNI_age_values[] = { "V12_0", "V12_1", "V13_0", + "V14_0", "V1_1", "V2_0", "V2_1", @@ -416493,6 +427038,7 @@ static const char * const UNI_age_values[] = { "v120", "v121", "v130", + "v140", "v20", "v21", "v30", @@ -416665,9 +427211,14 @@ static const char * const UNI_blk_values[] = { "arabic", "Arabic_Ext_A", "arabicexta", + "Arabic_Ext_B", + "arabicextb", "Arabic Extended-A", "Arabic_Extended_A", "arabicextendeda", + "Arabic Extended-B", + "Arabic_Extended_B", + "arabicextendedb", "Arabic_Math", "arabicmath", "Arabic Mathematical Alphabetic Symbols", @@ -416890,6 +427441,9 @@ static const char * const UNI_blk_values[] = { "Cypriot Syllabary", "Cypriot_Syllabary", "cypriotsyllabary", + "Cypro-Minoan", + "Cypro_Minoan", + "cyprominoan", "Cyrillic", "cyrillic", "Cyrillic_Ext_A", @@ -416986,12 +427540,17 @@ static const char * const UNI_blk_values[] = { "ethiopicext", "Ethiopic_Ext_A", "ethiopicexta", + "Ethiopic_Ext_B", + "ethiopicextb", "Ethiopic Extended", "Ethiopic_Extended", "ethiopicextended", "Ethiopic Extended-A", "Ethiopic_Extended_A", "ethiopicextendeda", + "Ethiopic Extended-B", + "Ethiopic_Extended_B", + "ethiopicextendedb", "Ethiopic_Sup", "ethiopicsup", "Ethiopic Supplement", @@ -417132,9 +427691,14 @@ static const char * const UNI_blk_values[] = { "kaithi", "Kana_Ext_A", "kanaexta", + "Kana_Ext_B", + "kanaextb", "Kana Extended-A", "Kana_Extended_A", "kanaextendeda", + "Kana Extended-B", + "Kana_Extended_B", + "kanaextendedb", "Kana_Sup", "kanasup", "Kana Supplement", @@ -417207,6 +427771,16 @@ static const char * const UNI_blk_values[] = { "Latin Extended-E", "Latin_Extended_E", "latinextendede", + "Latin Extended-F", + "Latin_Extended_F", + "latinextendedf", + "Latin Extended-G", + "Latin_Extended_G", + "latinextendedg", + "Latin_Ext_F", + "latinextf", 
+ "Latin_Ext_G", + "latinextg", "Latin_1_Sup", "latin1sup", "Latin-1 Supplement", @@ -417415,6 +427989,9 @@ static const char * const UNI_blk_values[] = { "Old Turkic", "Old_Turkic", "oldturkic", + "Old Uyghur", + "Old_Uyghur", + "olduyghur", "Optical Character Recognition", "Optical_Character_Recognition", "opticalcharacterrecognition", @@ -417624,6 +428201,8 @@ static const char * const UNI_blk_values[] = { "Tamil Supplement", "Tamil_Supplement", "tamilsupplement", + "Tangsa", + "tangsa", "Tangut", "tangut", "Tangut Components", @@ -417646,6 +428225,8 @@ static const char * const UNI_blk_values[] = { "tifinagh", "Tirhuta", "tirhuta", + "Toto", + "toto", "Transport_And_Map", "transportandmap", "Transport and Map Symbols", @@ -417655,6 +428236,8 @@ static const char * const UNI_blk_values[] = { "ucas", "UCAS_Ext", "ucasext", + "UCAS_Ext_A", + "ucasexta", "Ugaritic", "ugaritic", "Unified Canadian Aboriginal Syllabics", @@ -417663,6 +428246,9 @@ static const char * const UNI_blk_values[] = { "Unified Canadian Aboriginal Syllabics Extended", "Unified_Canadian_Aboriginal_Syllabics_Extended", "unifiedcanadianaboriginalsyllabicsextended", + "Unified Canadian Aboriginal Syllabics Extended-A", + "Unified_Canadian_Aboriginal_Syllabics_Extended_A", + "unifiedcanadianaboriginalsyllabicsextendeda", "Vai", "vai", "Variation Selectors", @@ -417679,6 +428265,8 @@ static const char * const UNI_blk_values[] = { "Vertical Forms", "Vertical_Forms", "verticalforms", + "Vithkuqi", + "vithkuqi", "VS", "vs", "VS_Sup", @@ -417704,6 +428292,11 @@ static const char * const UNI_blk_values[] = { "Zanabazar Square", "Zanabazar_Square", "zanabazarsquare", + "Znamenny_Music", + "znamennymusic", + "Znamenny Musical Notation", + "Znamenny_Musical_Notation", + "znamennymusicalnotation", NULL }; @@ -418352,6 +428945,7 @@ static const char * const UNI_in_values[] = { "12.0", "12.1", "13.0", + "14.0", "Unassigned", "unassigned", "V10_0", @@ -418359,6 +428953,7 @@ static const char * const 
UNI_in_values[] = { "V12_0", "V12_1", "V13_0", + "V14_0", "V2_0", "V2_1", "V3_0", @@ -418381,6 +428976,7 @@ static const char * const UNI_in_values[] = { "v120", "v121", "v130", + "v140", "v20", "v21", "v30", @@ -418704,6 +429300,10 @@ static const char * const UNI_jg_values[] = { "tehmarbutagoal", "Teth", "teth", + "Thin_Yeh", + "thinyeh", + "Vertical_Tail", + "verticaltail", "Waw", "waw", "Yeh", @@ -419269,12 +429869,16 @@ static const char * const UNI_sc_values[] = { "copt", "Coptic", "coptic", + "Cpmn", + "cpmn", "Cprt", "cprt", "Cuneiform", "cuneiform", "Cypriot", "cypriot", + "Cypro_Minoan", + "cyprominoan", "Cyrillic", "cyrillic", "Cyrl", @@ -419581,6 +430185,8 @@ static const char * const UNI_sc_values[] = { "oldsoutharabian", "Old_Turkic", "oldturkic", + "Old_Uyghur", + "olduyghur", "Oriya", "oriya", "Orkh", @@ -419595,6 +430201,8 @@ static const char * const UNI_sc_values[] = { "osma", "Osmanya", "osmanya", + "Ougr", + "ougr", "Pahawh_Hmong", "pahawhhmong", "Palm", @@ -419723,6 +430331,8 @@ static const char * const UNI_sc_values[] = { "taml", "Tang", "tang", + "Tangsa", + "tangsa", "Tangut", "tangut", "Tavt", @@ -419751,6 +430361,10 @@ static const char * const UNI_sc_values[] = { "tirh", "Tirhuta", "tirhuta", + "Tnsa", + "tnsa", + "Toto", + "toto", "Ugar", "ugar", "Ugaritic", @@ -419761,6 +430375,10 @@ static const char * const UNI_sc_values[] = { "vai", "Vaii", "vaii", + "Vith", + "vith", + "Vithkuqi", + "vithkuqi", "Wancho", "wancho", "Wara", @@ -420102,7 +430720,7 @@ static const U8 LB_table[42][42] = { /* RI */ { 1, 1, 0, 1, 0, 1, 2, 0, 2, 0, 1, 1, 1, 1, 2, 0, 1, 1, 1, 0, 1, 0, 2, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0,15, 0, 2, 1, 0, 0, 0, 2 }, /* SP */ { 7, 7, 7, 7, 0, 7, 8, 7, 8, 0, 7, 7, 1, 7, 8, 7, 7, 7, 7, 7, 7, 7, 8, 7, 7, 7, 0, 0, 7, 7, 7, 7, 7, 7, 7, 0, 8, 7, 8, 0, 7, 8 }, /* SY */ { 1, 1, 0, 1, 0, 1, 2, 0, 2, 0, 1, 1, 1, 1, 2, 0, 1, 1, 0, 0, 1, 0, 2, 1, 1, 1, 0, 0, 0,12, 1,33,33, 0, 1, 0, 2, 1, 0, 0, 0, 2 }, -/* UEP*/ { 1, 1, 0, 1, 0, 1, 2, 0, 2, 
0, 1, 1, 1, 1, 2, 0, 1, 1, 1, 0, 1, 0, 2, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 2, 1, 0, 0, 0, 2 }, +/* UEP*/ { 1, 1, 0, 1, 0, 1, 2, 0, 2, 0, 1, 1, 1, 0, 2, 0, 1, 1, 1, 0, 1, 0, 2, 1, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 2, 1, 0, 0, 0, 2 }, /* WJ */ { 0, 0, 0, 0, 0, 0, 2, 0, 2, 0, 0, 0, 1, 0, 2, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 0, 0, 0, 0, 2 }, /* ZW */ { 1, 1, 1, 1, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1 }, /* ZWJ*/ { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }, @@ -420163,56 +430781,56 @@ static const U8 WB_table[23][23] = { /* Generated from: * 688d673ec947f7ccf898b4eae9848139d4d33676b688dee54f449f8bf9d3bbd2 lib/Unicode/UCD.pm - * ce96627d4fc91b4fd886c409caeb9b76cf7bd345e12f05c6701add7f233f6437 lib/unicore/ArabicShaping.txt - * 0e69eef3da722cc104522d8372e86d5b86bb7afcc761b0c991e39e832294946d lib/unicore/BidiBrackets.txt - * a00d9d21585106a52113fb7b1d3d0373a5835be72e76862fb559ebddd474d70e lib/unicore/BidiMirroring.txt - * 81a82b6a9fcf1a9c12f588d7a1decd73a9afdc4cac95b0eb7e576e7942d6c19f lib/unicore/Blocks.txt - * 99d231d7c91688bbe8ca8ccebcc2f46b5b222f844babe4827295bae11e2abe5f lib/unicore/CaseFolding.txt - * 38badafd818d8405324fe298c0676be0c95186368c84b5368375fd871a645144 lib/unicore/CompositionExclusions.txt - * e779a443d3aa2a3166a15becaa2b737c922480e32c0453d5956093633555078f lib/unicore/DAge.txt - * a5d45f59b39deaab3c72ce8c1a2e212a5e086dff11b1f9d5bb0e352642e82248 lib/unicore/DCoreProperties.txt - * 3ac44e11c84bdaf6b207d2c2c20eed857ae17052393fc7f71b0fe951186ba906 lib/unicore/DNormalizationProps.txt - * 4f822ec7a9ebbb3138ad29bade8b9688d25b39c7a3c0b7431f01e7229e4fcb6e lib/unicore/EastAsianWidth.txt - * fc535aa1047a70105ab9a22c2b4c3f363a2ff02fe48ebbc5eeb9873b2752ff0b lib/unicore/EquivalentUnifiedIdeograph.txt - * b9c5158ce944d2fec57e0e4ecb716bdabfc3bdde73525f1772fe03f61a30d473 
lib/unicore/HangulSyllableType.txt - * 36c1b2a626ff1fb23b8b21e6ea8712698f8ce668dded1cb48b8ddf6a6a1b04e9 lib/unicore/IdStatus.txt - * 4857c4ffa3898e6128b2d46b0a02e499a663fb91464a69ef3611096f01293acc lib/unicore/IdType.txt - * 69197b019fa5f2fb0d8c6ed1ed8acb9f2e8b5b8f45a947953ffa652f3bf54983 lib/unicore/IndicPositionalCategory.txt - * 6604e2f0fde7428675364aa0006bc686b79488dcc60ae8cb29800af2be3352e8 lib/unicore/IndicSyllabicCategory.txt - * 84ead63924aaa74b988b2eaf254a8733276ed108633ce2ef77a9ee1de7818162 lib/unicore/Jamo.txt - * d5abcd8f54c8a2aa912924c485ccf7f968ad98feaa303d8e9a29ad89172f1faf lib/unicore/LineBreak.txt - * 985128e8c8b2540233331d9b27d897d2c23bd5bcf1d05da960befce6efc59542 lib/unicore/NameAliases.txt - * 27282b8aa01d4d0c44aef436cb74195ae8639ffa187aeee4e6247af76febea76 lib/unicore/NamedSequences.txt - * 485b5a3ed25dbf1f94dfa5a9b69d8b4550ffd0c33045ccc55ccfd7c80b2a40cf lib/unicore/PropList.txt - * 6b3902e9268cd843fe65cbdea992108c9528343ec0679f800b96f356bb553e5a lib/unicore/PropValueAliases.txt - * 2bd5777847e3d6add3c7e5c0d1393ddcab89e5a0ac3ff498cb0c53041f0b86e4 lib/unicore/PropertyAliases.txt - * 03a61dc89422e44cc2b73e8e893321007880ab69e2a4d281c0f1bc29c602b9d0 lib/unicore/ScriptExtensions.txt - * 9a5ed1ec9b5f0d7147e9371ad792ab39203611af7637cff2aa4a5c663b172cde lib/unicore/Scripts.txt - * 6424312f1dc39b22e0ff9c0ffb13dfad424d9b03e6a6dc6bca941f6bf5ef1ffd lib/unicore/SpecialCasing.txt - * bdbffbbfc8ad4d3a6d01b5891510458f3d36f7170422af4ea2bed3211a73e8bb lib/unicore/UnicodeData.txt - * 160f41816234addb511901d5f21febd69574578dd93de6ef8153e35693325575 lib/unicore/VerticalOrientation.txt - * 32dfb37d21db530529a6ec3dc13d96f21f8e7c7faf7ff3db8a9760cd76cec81d lib/unicore/auxiliary/GCBTest.txt - * 2bd3c5e2d62701ff81fb3ec318e179a4618cabb1493b1e0dd2b4e7e56c5437c4 lib/unicore/auxiliary/GraphemeBreakProperty.txt - * c51fbebfa82a0f36473b44bfd71d5ef6cb6a1f81fb313375dc9a1910d79bb2b6 lib/unicore/auxiliary/LBTest.txt - * 
80b0107750818d8f370bd120b6fe56b6855b60581f72affe8b60409a469b4b65 lib/unicore/auxiliary/SBTest.txt - * 09e3166ebab166ac630a227f77f4e794ebd433271abd5588f5a67e7f199c71ee lib/unicore/auxiliary/SentenceBreakProperty.txt - * bf5373ce28a5df06796c93dc159dd15a997bb2950c92704b40ae8190cfc3716d lib/unicore/auxiliary/WBTest.txt - * a2b7373cf2fe3fa3b26dbb53405ca849985f771ff47f1c61743978003ff80499 lib/unicore/auxiliary/WordBreakProperty.txt - * d2686f400a638c80775d7c662556fb8fa8dd3bbe4aa548d9d31624264c6e1bb1 lib/unicore/emoji/emoji.txt - * b827ae5da8c2b08947cc9a120a7b7fd2f1676fb160b508df78075381635b127c lib/unicore/extracted/DBidiClass.txt - * 6fdc5b5ef40444a8f0c772e6b67c00498d4216fe0c0fdf76744ce338f2ad3810 lib/unicore/extracted/DBinaryProperties.txt - * e14928a5bf6ad5958a80332bd42e96e14420080a95c660e5da29384e496755d0 lib/unicore/extracted/DCombiningClass.txt - * 579a03281fbe87b78d5d9a8523de4d255edd7e4ca6eab0e4c7729de97e9b89b1 lib/unicore/extracted/DDecompositionType.txt - * ad83c59b257e9d480ffd3001d4ac240c5fed7cb1919453e1c4e8877035256bcd lib/unicore/extracted/DEastAsianWidth.txt - * 4502f0969e4e6558c4b4c6ca4c23dad70b863d61dd3d5eed1a62a6c3c99fd570 lib/unicore/extracted/DGeneralCategory.txt - * 00bb88b89e2adb646f3177f9444e2d3192386b81a5de9556104b338274b253e1 lib/unicore/extracted/DJoinGroup.txt - * ac835b6e11a60c9820d3cf2d1cb0558dd68efb8f53f404a51632e4726690a6d7 lib/unicore/extracted/DJoinType.txt - * baba9dfc133e3cb770a89aaf0973b1341fa61c2da6c176baf6428898b3b568d8 lib/unicore/extracted/DLineBreak.txt - * 6d4a8c945dd7db83ed617cbb7d937de7f4ecf016ff22970d846e996a7c9a2a5d lib/unicore/extracted/DNumType.txt - * 5b7c14380d5cceeaffcfbc18db1ed936391d2af2d51f5a41f1a17b692c77e59b lib/unicore/extracted/DNumValues.txt - * 4e169849b96b76987a8fc443ef421b44d2dcebbd981bb457f6a13e8af77cdbe2 lib/unicore/mktables - * 50b85a67451145545a65cea370dab8d3444fbfe07e9c34cef560c5b7da9d3eef lib/unicore/version + * c7698811e9adb6cc98fb996a7de4be2b6532f2ac67e76055cc8afdbf6ee18af3 lib/unicore/ArabicShaping.txt 
+ * 24a74555f918bbe99f5b3f1b83cf36fc0e205bb8a600a6a3aa539c710a3dcf27 lib/unicore/BidiBrackets.txt + * 7a5c74cedc1616a9af0a9d22e108ae592d86fe93649c144ae6ba49f193a44122 lib/unicore/BidiMirroring.txt + * 598870dddef7b34b5a972916528c456aff2765b79cd4f9647fb58ceb767e7f17 lib/unicore/Blocks.txt + * a566cd48687b2cd897e02501118b2413c14ae86d318f9abbbba97feb84189f0f lib/unicore/CaseFolding.txt + * 3360762fc3295cea54ab251c31df621d05ba4b94d46c60eaac29aa16d70ad1e0 lib/unicore/CompositionExclusions.txt + * 7e058dec02147098bc9c28d86209f0f251bba0538f3b5a705ad02ea3bb709fe0 lib/unicore/DAge.txt + * e3eddd7d469cd1b0feed7528defad1a1cc7c6a9ceb0ae4446a6d10921ed2e7bc lib/unicore/DCoreProperties.txt + * b2c444c20730b097787fdf50bd7d6dd3fc5256ab8084f5b35b11c8776eca674c lib/unicore/DNormalizationProps.txt + * f901ac011aa32a09224d6555da71e2532c59c1d3381322829de0e3b880507250 lib/unicore/EastAsianWidth.txt + * 5995522f01633073911dad1edb74d13aa832f42862c0392a79627b85d52f2391 lib/unicore/EquivalentUnifiedIdeograph.txt + * cd1c9367cba438afa965fcb5edc6ed3ec6e685fd5dd21c0cc20c026f04beb0e5 lib/unicore/HangulSyllableType.txt + * 3f3f368fccdb37f350ecedc20b37fa71ab31c04e847884c77780d34283539f73 lib/unicore/IdStatus.txt + * 45a150c23961b58d7784704af6c4daccd6517d97b6489e53d13bbdbf9e4f065f lib/unicore/IdType.txt + * d8704c8725568813a947ff2ef38bcf1f05e2a6fbea6876ba384890f187a8bf61 lib/unicore/IndicPositionalCategory.txt + * c7b969b653dc278fb66ab4136223d320e30ad19367eb791ae60dcc6d92071b16 lib/unicore/IndicSyllabicCategory.txt + * 39ff89e0a329e1ccce6d54fad8cf82e90926901928c0ca9b9a2ad5681f330dd9 lib/unicore/Jamo.txt + * 9e06e9f35c6959fb91dcc7993f90d58523c3079bc62c6b25f828b4cdebc5d70c lib/unicore/LineBreak.txt + * 14b3b677d33f95c51423dce6eef4a6a28b4b160451ecedee4b91edb6745cf4a3 lib/unicore/NameAliases.txt + * db5745688affcdc0c3927a1ee0667018a96a7b24513f866d5235e98fef6c2436 lib/unicore/NamedSequences.txt + * 6bddfdb850417a5bee6deff19290fd1b138589909afb50f5a049f343bf2c6722 lib/unicore/PropList.txt + * 
eb755757e20b72b330b2948df3cf2ff7adb0e31bb060140dc09dafb132ace2cd lib/unicore/PropValueAliases.txt + * 859d7225f2d2a460b3ccb1d61a7945f8cc219acdf5aa53b66b7a1e4bf6ebfc87 lib/unicore/PropertyAliases.txt + * d37eedf63ff9c48bac863d5f76862373d6cf5269fd21253d499e2430d638c01d lib/unicore/ScriptExtensions.txt + * 52db475c4ec445e73b0b16915448c357614946ad7062843c563e00d7535c6510 lib/unicore/Scripts.txt + * c667b45908fd269af25fd55d2fc5bbc157fb1b77675936e25c513ce32e080334 lib/unicore/SpecialCasing.txt + * 36018e68657fdcb3485f636630ffe8c8532e01c977703d2803f5b89d6c5feafb lib/unicore/UnicodeData.txt + * 869ff43dd012f924d03c89fc268c88f0e7eea72f0228b91ca30455afdb84f8fd lib/unicore/VerticalOrientation.txt + * ddc7d4d1f3838573b94fc5d83ff7217e63c47b22ae1cd40c5fe1a54efc15589b lib/unicore/auxiliary/GCBTest.txt + * 97e79f1f8d9cd76d120f2420381a01abc00a7c78a2aa583fa3f9627264a99742 lib/unicore/auxiliary/GraphemeBreakProperty.txt + * 488dbb6a7e1d0070d4aa7c175352c818ff6425172850d1b40c6177726658cb05 lib/unicore/auxiliary/LBTest.txt + * 7e42dd749dbb94aa44b13faf9df6319d9a16ce2ea09a3a094fcfbb5962168040 lib/unicore/auxiliary/SBTest.txt + * 7092ca4117cec891c25c7724132efc519e1dece01ae9fd6068035a9db04d526e lib/unicore/auxiliary/SentenceBreakProperty.txt + * 8094b544ec1580c7e41ac0187805cc1aeb330a90301ec7505563e1a59318284e lib/unicore/auxiliary/WBTest.txt + * 7716752aad296d4ab23ff4ed0a2746fc5328750ff84e9e7d6f3828ee9eaef742 lib/unicore/auxiliary/WordBreakProperty.txt + * b597836124298b8f7fa076273802840cfc3271a25f5c397a082e120954b82c3c lib/unicore/emoji/emoji.txt + * e5fe51acc74e3e83b4fb4c7b25f3c34491d6eb8095c9955d0712dafbca7b3c2b lib/unicore/extracted/DBidiClass.txt + * cd0a14176d93bf440b77a582a0d678190fc0688b15442d4cfb250bf2e27956af lib/unicore/extracted/DBinaryProperties.txt + * 12b0c3af9b600b49488d66545a3e7844ea980809627201bf9afeebe1c9f16f4e lib/unicore/extracted/DCombiningClass.txt + * f76064b298cfbd715ba542e7894f7a507d32da2f011070d1d01df95cad9817d6 lib/unicore/extracted/DDecompositionType.txt + * 
f9bef074cc916db57fece99d54a4505f8e7c7b17481619e3f0005211f7717d4b lib/unicore/extracted/DEastAsianWidth.txt + * cde679c8461976ed40d7edf61ae98cbb947540831f06f5bc7da7decbf91a1420 lib/unicore/extracted/DGeneralCategory.txt + * 9bb891831328713603a486a4a03df7f7987c3e1e8144a6d1ac71fd061ef3f732 lib/unicore/extracted/DJoinGroup.txt + * e97c65bbea0a69d2fae6ec4182b09e519e13232e20bd804b3004edc0f36bb0d4 lib/unicore/extracted/DJoinType.txt + * 43f6df50e4878f501b417e366b0ee097ae5ccb2d4ce942026bed3d62d78e7887 lib/unicore/extracted/DLineBreak.txt + * a04502ebb36a45d83cbe48a7d8132ea8143edb7b3d34d0aa6afe4a9685049741 lib/unicore/extracted/DNumType.txt + * 11075771b112e8e7ccf6ffa637c4c91eadc3ef3db0517b24e605df8fd3624239 lib/unicore/extracted/DNumValues.txt + * 24b7b7bda1a2ab4684ba53355d82ad227c1624b337b37c3b96f2e4b902eea1f2 lib/unicore/mktables + * c72bbdeda99714db1c8024d3311da4aef3c0db3b9b9f11455a7cfe10d5e9aba3 lib/unicore/version * 0a6b5ab33bb1026531f816efe81aea1a8ffcd34a27cbea37dd6a70a63d73c844 regen/charset_translations.pl * 5f8520d3a17ade6317fc0c423f5091470924b1ef425bca0c41ce8e4a9f8460fe regen/mk_PL_charclass.pl - * 04a5294218c412e5ee2e0d9f8d22af1d95bbfd2cafae3935cbb6b5871e9f9704 regen/mk_invlists.pl + * 6defb8383a69034f8279fea4ff66e09bf58049c4cbecf2331b9b245c45d4f2d5 regen/mk_invlists.pl * ex: set ro: */ diff --git a/lib/Unicode/UCD.t b/lib/Unicode/UCD.t index c7e3ecb046..3d39121217 100644 --- a/lib/Unicode/UCD.t +++ b/lib/Unicode/UCD.t @@ -19,7 +19,7 @@ use Test::More; use Unicode::UCD qw(charinfo charprop charprops_all); -my $expected_version = '13.0.0'; +my $expected_version = '14.0.0'; my $current_version = Unicode::UCD::UnicodeVersion; my $v_unicode_version = pack "C*", split /\./, $current_version; my $unknown_script = ($v_unicode_version lt v5.0.0) @@ -786,7 +786,7 @@ SKIP: skip("Latin range count will be wrong when using older Unicode release", 2) if $current_version lt $expected_version; my $n1 = @$r1; - is($n1, 32, "number of ranges in Latin script (Unicode 
$expected_version)") if $::IS_ASCII; + is($n1, 38, "number of ranges in Latin script (Unicode $expected_version)") if $::IS_ASCII; shift @$r1 while @$r1; my $r2 = charscript('Latin'); is(@$r2, $n1, "modifying results should not mess up internal caches"); diff --git a/lib/unicore/ArabicShaping.txt b/lib/unicore/ArabicShaping.txt index 9a93adc12f..bfb6b47a55 100644 --- a/lib/unicore/ArabicShaping.txt +++ b/lib/unicore/ArabicShaping.txt @@ -1,6 +1,6 @@ -# ArabicShaping-13.0.0.txt -# Date: 2020-01-31, 23:55:00 GMT [KW, RP] -# © 2020 Unicode®, Inc. +# ArabicShaping-14.0.0.txt +# Date: 2021-05-21, 01:54:00 GMT [KW, RP] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -13,11 +13,12 @@ # exemplified in Tables 9-3, 9-8, 9-9, 9-10, 9-14, 9-15, 9-16, 9-19, # 9-20, 10-4, 10-5, 10-6, 10-7, and 19-5 of The Unicode Standard core # specification. This file also defines Joining_Type values for -# Mongolian, Phags-pa, Psalter Pahlavi, Sogdian, Chorasmian, and Adlam positional shaping, +# Mongolian, Phags-pa, Psalter Pahlavi, Sogdian, Old Uyghur, Chorasmian, +# and Adlam positional shaping, # and Joining_Type and Joining_Group values for Hanifi Rohingya positional shaping, # which are not listed in tables in the standard. # -# See Sections 9.2, 9.3, 9.5, 10.5, 10.6, 13.4, 14.3, 14.10, 16.14, 19.4, and 19.9 +# See Sections 9.2, 9.3, 9.5, 10.5, 10.6, 13.5, 14.4, 14.10, 14.11, 16.14, 19.4, and 19.9 # of The Unicode Standard core specification for more information. # # Each line contains four fields, separated by a semicolon. @@ -44,7 +45,7 @@ # Note that for cursive joining scripts which are typically rendered # top-to-bottom, rather than right-to-left, Joining_Type=L conventionally # refers to bottom joining, and Joining_Type=R conventionally refers -# to top joining. 
See Section 14.3, Phags-pa for more information on the +# to top joining. See Section 14.4, Phags-pa for more information on the # interpretation of joining types in vertical layout. # # Field 3: defines the joining group (property name: Joining_Group) @@ -79,7 +80,7 @@ # joining group values will be defined only if an explicit proposal # to define those values exactly has been approved by the UTC. This # is the convention exemplified by the N'Ko, Mandaic, Mongolian, -# Phags-pa, Psalter Pahlavi, Sogdian, Chorasmian, and Adlam scripts. +# Phags-pa, Psalter Pahlavi, Sogdian, Old Uyghur, Chorasmian, and Adlam scripts. # Only the Arabic, Manichaean, and Syriac scripts currently have # explicit joining group values defined for all characters, including # those which have only a single character in a particular Joining_Group @@ -162,7 +163,7 @@ 0674; HIGH HAMZA; U; No_Joining_Group 0675; HIGH HAMZA ALEF; R; ALEF 0676; HIGH HAMZA WAW; R; WAW -0677; HIGH HAMZA WAW WITH DAMMA ABOVE; R; WAW +0677; HIGH HAMZA WAW WITH COMMA ABOVE; R; WAW 0678; HIGH HAMZA DOTLESS YEH; D; YEH 0679; DOTLESS BEH WITH TAH ABOVE; D; BEH 067A; DOTLESS BEH WITH VERTICAL 2 DOTS ABOVE; D; BEH @@ -240,9 +241,9 @@ 06C2; HEH GOAL WITH HAMZA ABOVE; D; HEH GOAL 06C3; TEH MARBUTA GOAL; R; TEH MARBUTA GOAL 06C4; WAW WITH ATTACHED RING WITHIN; R; WAW -06C5; WAW WITH BAR; R; WAW +06C5; WAW WITH LOOP; R; WAW 06C6; WAW WITH V ABOVE; R; WAW -06C7; WAW WITH DAMMA ABOVE; R; WAW +06C7; WAW WITH COMMA ABOVE; R; WAW 06C8; WAW WITH ALEF ABOVE; R; WAW 06C9; WAW WITH INVERTED V ABOVE; R; WAW 06CA; WAW WITH 2 DOTS ABOVE; R; WAW @@ -432,6 +433,42 @@ 0869; MALAYALAM LLLA; R; MALAYALAM LLLA 086A; MALAYALAM SSA; R; MALAYALAM SSA +# Arabic Extended-B Characters + +0870; ALEF WITH ATTACHED FATHA; R; ALEF +0871; ALEF WITH ATTACHED TOP RIGHT FATHA; R; ALEF +0872; ALEF WITH RIGHT MIDDLE STROKE; R; ALEF +0873; ALEF WITH LEFT MIDDLE STROKE; R; ALEF +0874; ALEF WITH ATTACHED KASRA; R; ALEF +0875; ALEF WITH ATTACHED BOTTOM RIGHT 
KASRA; R; ALEF +0876; ALEF WITH ATTACHED ROUND DOT ABOVE; R; ALEF +0877; ALEF WITH ATTACHED RIGHT ROUND DOT; R; ALEF +0878; ALEF WITH ATTACHED LEFT ROUND DOT; R; ALEF +0879; ALEF WITH ATTACHED ROUND DOT BELOW; R; ALEF +087A; ALEF WITH DOT ABOVE; R; ALEF +087B; ALEF WITH ATTACHED TOP RIGHT FATHA AND DOT ABOVE; R; ALEF +087C; ALEF WITH RIGHT MIDDLE STROKE AND DOT ABOVE; R; ALEF +087D; ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND DOT ABOVE; R; ALEF +087E; ALEF WITH ATTACHED TOP RIGHT FATHA AND LEFT RING; R; ALEF +087F; ALEF WITH RIGHT MIDDLE STROKE AND LEFT RING; R; ALEF +0880; ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND LEFT RING; R; ALEF +0881; ALEF WITH ATTACHED RIGHT HAMZA; R; ALEF +0882; ALEF WITH ATTACHED LEFT HAMZA; R; ALEF +0883; TATWEEL WITH OVERSTRUCK HAMZA; C; No_Joining_Group +0884; TATWEEL WITH OVERSTRUCK WAW; C; No_Joining_Group +0885; TATWEEL WITH TWO DOTS BELOW; C; No_Joining_Group +0886; THIN YEH; D; THIN YEH +0887; ARABIC BASELINE ROUND DOT; U; No_Joining_Group +0888; ARABIC RAISED ROUND DOT; U; No_Joining_Group +0889; DOTLESS NOON WITH INVERTED V ABOVE; D; NOON +088A; HAH WITH INVERTED V BELOW; D; HAH +088B; TAH WITH DOT BELOW; D; TAH +088C; TAH WITH 3 DOTS BELOW; D; TAH +088D; KEHEH WITH VERTICAL 2 DOTS BELOW; D; GAF +088E; VERTICAL TAIL; R; VERTICAL TAIL +0890; ARABIC POUND MARK ABOVE; U; No_Joining_Group +0891; ARABIC PIASTRE MARK ABOVE; U; No_Joining_Group + # Arabic Extended-A Characters 08A0; DOTLESS BEH WITH V BELOW; D; BEH @@ -455,6 +492,7 @@ 08B2; REH WITH DOT AND INVERTED V ABOVE; R; REH 08B3; AIN WITH 3 DOTS BELOW; D; AIN 08B4; KAF WITH DOT BELOW; D; KAF +08B5; DOTLESS QAF WITH DOT BELOW; D; QAF 08B6; BEH WITH MEEM ABOVE; D; BEH 08B7; DOTLESS BEH WITH 3 DOTS BELOW AND MEEM ABOVE; D; BEH 08B8; DOTLESS BEH WITH TEH ABOVE; D; BEH @@ -473,6 +511,7 @@ 08C5; HAH WITH DOT BELOW AND 3 DOTS ABOVE; D; HAH 08C6; HAH WITH DIAMOND 4 DOTS BELOW; D; HAH 08C7; LAM WITH TAH ABOVE; D; LAM +08C8; KEHEH WITH ELONGATED HAMZA ABOVE; D; GAF 08E2; ARABIC DISPUTED END 
OF AYAH; U; No_Joining_Group # Mongolian Characters @@ -819,6 +858,27 @@ A873; PHAGS-PA CANDRABINDU; U; No_Joining_Group 10F53; SOGDIAN TWENTY; D; No_Joining_Group 10F54; SOGDIAN ONE HUNDRED; R; No_Joining_Group +# Old Uyghur Characters + +10F70; OLD UYGHUR ALEPH; D; No_Joining_Group +10F71; OLD UYGHUR BETH; D; No_Joining_Group +10F72; OLD UYGHUR GIMEL-HETH; D; No_Joining_Group +10F73; OLD UYGHUR WAW; D; No_Joining_Group +10F74; OLD UYGHUR ZAYIN; R; No_Joining_Group +10F75; OLD UYGHUR FINAL HETH; R; No_Joining_Group +10F76; OLD UYGHUR YODH; D; No_Joining_Group +10F77; OLD UYGHUR KAPH; D; No_Joining_Group +10F78; OLD UYGHUR LAMEDH; D; No_Joining_Group +10F79; OLD UYGHUR MEM; D; No_Joining_Group +10F7A; OLD UYGHUR NUN; D; No_Joining_Group +10F7B; OLD UYGHUR SAMEKH; D; No_Joining_Group +10F7C; OLD UYGHUR PE; D; No_Joining_Group +10F7D; OLD UYGHUR SADHE; D; No_Joining_Group +10F7E; OLD UYGHUR RESH; D; No_Joining_Group +10F7F; OLD UYGHUR SHIN; D; No_Joining_Group +10F80; OLD UYGHUR TAW; D; No_Joining_Group +10F81; OLD UYGHUR LESH; D; No_Joining_Group + # Chorasmian Characters 10FB0; CHORASMIAN ALEPH; D; No_Joining_Group diff --git a/lib/unicore/BidiBrackets.txt b/lib/unicore/BidiBrackets.txt index a95e5ca5ca..89698f588a 100644 --- a/lib/unicore/BidiBrackets.txt +++ b/lib/unicore/BidiBrackets.txt @@ -1,11 +1,11 @@ -# BidiBrackets-13.0.0.txt -# Date: 2019-09-09, 19:31:00 GMT [AG, LI, KW] -# © 2019 Unicode®, Inc. +# BidiBrackets-14.0.0.txt +# Date: 2021-06-30, 23:59:00 GMT [AG, LI, KW] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
-# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Bidi_Paired_Bracket and Bidi_Paired_Bracket_Type Properties # @@ -56,7 +56,7 @@ # of each line. # # For information on bidirectional paired brackets, see UAX #9: Unicode -# Bidirectional Algorithm, at http://www.unicode.org/unicode/reports/tr9/ +# Bidirectional Algorithm, at https://www.unicode.org/reports/tr9/ # # This file was originally created by Andrew Glass and Laurentiu Iancu # for Unicode 6.3. @@ -147,6 +147,14 @@ 2E27; 2E26; c # RIGHT SIDEWAYS U BRACKET 2E28; 2E29; o # LEFT DOUBLE PARENTHESIS 2E29; 2E28; c # RIGHT DOUBLE PARENTHESIS +2E55; 2E56; o # LEFT SQUARE BRACKET WITH STROKE +2E56; 2E55; c # RIGHT SQUARE BRACKET WITH STROKE +2E57; 2E58; o # LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58; 2E57; c # RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59; 2E5A; o # TOP HALF LEFT PARENTHESIS +2E5A; 2E59; c # TOP HALF RIGHT PARENTHESIS +2E5B; 2E5C; o # BOTTOM HALF LEFT PARENTHESIS +2E5C; 2E5B; c # BOTTOM HALF RIGHT PARENTHESIS 3008; 3009; o # LEFT ANGLE BRACKET 3009; 3008; c # RIGHT ANGLE BRACKET 300A; 300B; o # LEFT DOUBLE ANGLE BRACKET diff --git a/lib/unicore/BidiMirroring.txt b/lib/unicore/BidiMirroring.txt index 34e42ae8dc..bd8e2c5d00 100644 --- a/lib/unicore/BidiMirroring.txt +++ b/lib/unicore/BidiMirroring.txt @@ -1,10 +1,10 @@ -# BidiMirroring-13.0.0.txt -# Date: 2019-09-09, 19:34:00 GMT [KW, LI, RP] -# © 2019 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# BidiMirroring-14.0.0.txt +# Date: 2021-08-08, 22:55:00 GMT [KW, RP] +# © 2021 Unicode®, Inc. 
+# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Bidi_Mirroring_Glyph Property # @@ -15,7 +15,7 @@ # value, for which there is another Unicode character that typically has a glyph # that is the mirror image of the original character's glyph. # -# The repertoire covered by the file is Unicode 13.0.0. +# The repertoire covered by the file is Unicode 14.0.0. # # The file contains a list of lines with mappings from one code point # to another one for character-based mirroring. @@ -40,7 +40,7 @@ # for character-based mirroring. # # For information on bidi mirroring, see UAX #9: Unicode Bidirectional Algorithm, -# at http://www.unicode.org/unicode/reports/tr9/ +# at https://www.unicode.org/reports/tr9/ # # This file was originally created by Markus Scherer. # Extended for Unicode 3.2, 4.0, 4.1, 5.0, 5.1, 5.2, and 6.0 by Ken Whistler, @@ -96,10 +96,10 @@ 208D; 208E # SUBSCRIPT LEFT PARENTHESIS 208E; 208D # SUBSCRIPT RIGHT PARENTHESIS 2208; 220B # ELEMENT OF -2209; 220C # NOT AN ELEMENT OF +2209; 220C # [BEST FIT] NOT AN ELEMENT OF 220A; 220D # SMALL ELEMENT OF 220B; 2208 # CONTAINS AS MEMBER -220C; 2209 # DOES NOT CONTAIN AS MEMBER +220C; 2209 # [BEST FIT] DOES NOT CONTAIN AS MEMBER 220D; 220A # SMALL CONTAINS AS MEMBER 2215; 29F5 # DIVISION SLASH 221F; 2BFE # RIGHT ANGLE @@ -453,6 +453,14 @@ 2E27; 2E26 # RIGHT SIDEWAYS U BRACKET 2E28; 2E29 # LEFT DOUBLE PARENTHESIS 2E29; 2E28 # RIGHT DOUBLE PARENTHESIS +2E55; 2E56 # LEFT SQUARE BRACKET WITH STROKE +2E56; 2E55 # RIGHT SQUARE BRACKET WITH STROKE +2E57; 2E58 # LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58; 2E57 # RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59; 2E5A # TOP HALF LEFT PARENTHESIS +2E5A; 2E59 # TOP HALF RIGHT PARENTHESIS +2E5B; 2E5C # BOTTOM HALF LEFT PARENTHESIS +2E5C; 2E5B # BOTTOM HALF RIGHT PARENTHESIS 3008; 3009 # LEFT ANGLE BRACKET 
3009; 3008 # RIGHT ANGLE BRACKET 300A; 300B # LEFT DOUBLE ANGLE BRACKET diff --git a/lib/unicore/Blocks.txt b/lib/unicore/Blocks.txt index 56877db10f..cc5d61988b 100644 --- a/lib/unicore/Blocks.txt +++ b/lib/unicore/Blocks.txt @@ -1,6 +1,6 @@ -# Blocks-13.0.0.txt -# Date: 2019-07-10, 19:06:00 GMT [KW] -# © 2019 Unicode®, Inc. +# Blocks-14.0.0.txt +# Date: 2021-01-22, 23:29:00 GMT [KW] +# © 2021 Unicode®, Inc. # For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database @@ -52,6 +52,7 @@ 0800..083F; Samaritan 0840..085F; Mandaic 0860..086F; Syriac Supplement +0870..089F; Arabic Extended-B 08A0..08FF; Arabic Extended-A 0900..097F; Devanagari 0980..09FF; Bengali @@ -215,7 +216,9 @@ FFF0..FFFF; Specials 104B0..104FF; Osage 10500..1052F; Elbasan 10530..1056F; Caucasian Albanian +10570..105BF; Vithkuqi 10600..1077F; Linear A +10780..107BF; Latin Extended-F 10800..1083F; Cypriot Syllabary 10840..1085F; Imperial Aramaic 10860..1087F; Palmyrene @@ -240,6 +243,7 @@ FFF0..FFFF; Specials 10E80..10EBF; Yezidi 10F00..10F2F; Old Sogdian 10F30..10F6F; Sogdian +10F70..10FAF; Old Uyghur 10FB0..10FDF; Chorasmian 10FE0..10FFF; Elymaic 11000..1107F; Brahmi @@ -259,13 +263,14 @@ FFF0..FFFF; Specials 11600..1165F; Modi 11660..1167F; Mongolian Supplement 11680..116CF; Takri -11700..1173F; Ahom +11700..1174F; Ahom 11800..1184F; Dogra 118A0..118FF; Warang Citi 11900..1195F; Dives Akuru 119A0..119FF; Nandinagari 11A00..11A4F; Zanabazar Square 11A50..11AAF; Soyombo +11AB0..11ABF; Unified Canadian Aboriginal Syllabics Extended-A 11AC0..11AFF; Pau Cin Hau 11C00..11C6F; Bhaiksuki 11C70..11CBF; Marchen @@ -277,11 +282,13 @@ FFF0..FFFF; Specials 12000..123FF; Cuneiform 12400..1247F; Cuneiform Numbers and Punctuation 12480..1254F; Early Dynastic Cuneiform +12F90..12FFF; Cypro-Minoan 13000..1342F; Egyptian Hieroglyphs 13430..1343F; Egyptian Hieroglyph Format Controls 14400..1467F; Anatolian Hieroglyphs 16800..16A3F; Bamum Supplement 16A40..16A6F; Mro +16A70..16ACF; 
Tangsa 16AD0..16AFF; Bassa Vah 16B00..16B8F; Pahawh Hmong 16E40..16E9F; Medefaidrin @@ -290,13 +297,15 @@ FFF0..FFFF; Specials 17000..187FF; Tangut 18800..18AFF; Tangut Components 18B00..18CFF; Khitan Small Script -18D00..18D8F; Tangut Supplement +18D00..18D7F; Tangut Supplement +1AFF0..1AFFF; Kana Extended-B 1B000..1B0FF; Kana Supplement 1B100..1B12F; Kana Extended-A 1B130..1B16F; Small Kana Extension 1B170..1B2FF; Nushu 1BC00..1BC9F; Duployan 1BCA0..1BCAF; Shorthand Format Controls +1CF00..1CFCF; Znamenny Musical Notation 1D000..1D0FF; Byzantine Musical Symbols 1D100..1D1FF; Musical Symbols 1D200..1D24F; Ancient Greek Musical Notation @@ -305,9 +314,12 @@ FFF0..FFFF; Specials 1D360..1D37F; Counting Rod Numerals 1D400..1D7FF; Mathematical Alphanumeric Symbols 1D800..1DAAF; Sutton SignWriting +1DF00..1DFFF; Latin Extended-G 1E000..1E02F; Glagolitic Supplement 1E100..1E14F; Nyiakeng Puachue Hmong +1E290..1E2BF; Toto 1E2C0..1E2FF; Wancho +1E7E0..1E7FF; Ethiopic Extended-B 1E800..1E8DF; Mende Kikakui 1E900..1E95F; Adlam 1EC70..1ECBF; Indic Siyaq Numbers diff --git a/lib/unicore/CJKRadicals.txt b/lib/unicore/CJKRadicals.txt index 231361591f..61a45878ef 100644 --- a/lib/unicore/CJKRadicals.txt +++ b/lib/unicore/CJKRadicals.txt @@ -1,6 +1,6 @@ -# CJKRadicals-13.0.0.txt -# Date: 2019-09-09, 19:38:00 GMT [RC, KW, LI] -# © 2019 Unicode®, Inc. +# CJKRadicals-14.0.0.txt +# Date: 2021-03-16, 21:39:00 GMT [RC, KW, LI] +# © 2021 Unicode®, Inc. # For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database diff --git a/lib/unicore/CaseFolding.txt b/lib/unicore/CaseFolding.txt index 033788b253..932ace29e6 100644 --- a/lib/unicore/CaseFolding.txt +++ b/lib/unicore/CaseFolding.txt @@ -1,6 +1,6 @@ -# CaseFolding-13.0.0.txt -# Date: 2019-09-08, 23:30:59 GMT -# © 2019 Unicode®, Inc. +# CaseFolding-14.0.0.txt +# Date: 2021-03-08, 19:35:41 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. 
and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -1050,6 +1050,7 @@ 2C2C; C; 2C5C; # GLAGOLITIC CAPITAL LETTER SHTAPIC 2C2D; C; 2C5D; # GLAGOLITIC CAPITAL LETTER TROKUTASTI A 2C2E; C; 2C5E; # GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C2F; C; 2C5F; # GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60; C; 2C61; # LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62; C; 026B; # LATIN CAPITAL LETTER L WITH MIDDLE TILDE 2C63; C; 1D7D; # LATIN CAPITAL LETTER P WITH STROKE @@ -1230,12 +1231,16 @@ A7B8; C; A7B9; # LATIN CAPITAL LETTER U WITH STROKE A7BA; C; A7BB; # LATIN CAPITAL LETTER GLOTTAL A A7BC; C; A7BD; # LATIN CAPITAL LETTER GLOTTAL I A7BE; C; A7BF; # LATIN CAPITAL LETTER GLOTTAL U +A7C0; C; A7C1; # LATIN CAPITAL LETTER OLD POLISH O A7C2; C; A7C3; # LATIN CAPITAL LETTER ANGLICANA W A7C4; C; A794; # LATIN CAPITAL LETTER C WITH PALATAL HOOK A7C5; C; 0282; # LATIN CAPITAL LETTER S WITH HOOK A7C6; C; 1D8E; # LATIN CAPITAL LETTER Z WITH PALATAL HOOK A7C7; C; A7C8; # LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9; C; A7CA; # LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0; C; A7D1; # LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6; C; A7D7; # LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8; C; A7D9; # LATIN CAPITAL LETTER SIGMOID S A7F5; C; A7F6; # LATIN CAPITAL LETTER REVERSED HALF H AB70; C; 13A0; # CHEROKEE SMALL LETTER A AB71; C; 13A1; # CHEROKEE SMALL LETTER E @@ -1431,6 +1436,41 @@ FF3A; C; FF5A; # FULLWIDTH LATIN CAPITAL LETTER Z 104D1; C; 104F9; # OSAGE CAPITAL LETTER GHA 104D2; C; 104FA; # OSAGE CAPITAL LETTER ZA 104D3; C; 104FB; # OSAGE CAPITAL LETTER ZHA +10570; C; 10597; # VITHKUQI CAPITAL LETTER A +10571; C; 10598; # VITHKUQI CAPITAL LETTER BBE +10572; C; 10599; # VITHKUQI CAPITAL LETTER BE +10573; C; 1059A; # VITHKUQI CAPITAL LETTER CE +10574; C; 1059B; # VITHKUQI CAPITAL LETTER CHE +10575; C; 1059C; # VITHKUQI CAPITAL LETTER DE +10576; C; 1059D; # VITHKUQI CAPITAL LETTER DHE +10577; C; 1059E; # VITHKUQI CAPITAL LETTER EI 
+10578; C; 1059F; # VITHKUQI CAPITAL LETTER E +10579; C; 105A0; # VITHKUQI CAPITAL LETTER FE +1057A; C; 105A1; # VITHKUQI CAPITAL LETTER GA +1057C; C; 105A3; # VITHKUQI CAPITAL LETTER HA +1057D; C; 105A4; # VITHKUQI CAPITAL LETTER HHA +1057E; C; 105A5; # VITHKUQI CAPITAL LETTER I +1057F; C; 105A6; # VITHKUQI CAPITAL LETTER IJE +10580; C; 105A7; # VITHKUQI CAPITAL LETTER JE +10581; C; 105A8; # VITHKUQI CAPITAL LETTER KA +10582; C; 105A9; # VITHKUQI CAPITAL LETTER LA +10583; C; 105AA; # VITHKUQI CAPITAL LETTER LLA +10584; C; 105AB; # VITHKUQI CAPITAL LETTER ME +10585; C; 105AC; # VITHKUQI CAPITAL LETTER NE +10586; C; 105AD; # VITHKUQI CAPITAL LETTER NJE +10587; C; 105AE; # VITHKUQI CAPITAL LETTER O +10588; C; 105AF; # VITHKUQI CAPITAL LETTER PE +10589; C; 105B0; # VITHKUQI CAPITAL LETTER QA +1058A; C; 105B1; # VITHKUQI CAPITAL LETTER RE +1058C; C; 105B3; # VITHKUQI CAPITAL LETTER SE +1058D; C; 105B4; # VITHKUQI CAPITAL LETTER SHE +1058E; C; 105B5; # VITHKUQI CAPITAL LETTER TE +1058F; C; 105B6; # VITHKUQI CAPITAL LETTER THE +10590; C; 105B7; # VITHKUQI CAPITAL LETTER U +10591; C; 105B8; # VITHKUQI CAPITAL LETTER VE +10592; C; 105B9; # VITHKUQI CAPITAL LETTER XE +10594; C; 105BB; # VITHKUQI CAPITAL LETTER Y +10595; C; 105BC; # VITHKUQI CAPITAL LETTER ZE 10C80; C; 10CC0; # OLD HUNGARIAN CAPITAL LETTER A 10C81; C; 10CC1; # OLD HUNGARIAN CAPITAL LETTER AA 10C82; C; 10CC2; # OLD HUNGARIAN CAPITAL LETTER EB diff --git a/lib/unicore/CompositionExclusions.txt b/lib/unicore/CompositionExclusions.txt index 52bbb465bc..74e425e2a0 100644 --- a/lib/unicore/CompositionExclusions.txt +++ b/lib/unicore/CompositionExclusions.txt @@ -1,10 +1,10 @@ -# CompositionExclusions-13.0.0.txt -# Date: 2019-10-15, 18:27:00 GMT [KW, LI] -# © 2019 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# CompositionExclusions-14.0.0.txt +# Date: 2021-03-30, 23:59:00 GMT [KW, LI] +# © 2021 Unicode®, Inc. 
+# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # This file lists the characters for the Composition Exclusion Table # defined in UAX #15, Unicode Normalization Forms. @@ -13,7 +13,7 @@ # Unicode Character Database. # # For more information, see -# http://www.unicode.org/unicode/reports/tr15/#Primary_Exclusion_List_Table +# https://www.unicode.org/reports/tr15/#Primary_Exclusion_List_Table # # For a full derivation of composition exclusions, see the derived property # Full_Composition_Exclusion in DerivedNormalizationProps.txt diff --git a/lib/unicore/DAge.txt b/lib/unicore/DAge.txt index 0d2bd10f8d..c8ee531b8a 100644 --- a/lib/unicore/DAge.txt +++ b/lib/unicore/DAge.txt @@ -1,6 +1,6 @@ -# DerivedAge-13.0.0.txt -# Date: 2019-09-08, 23:30:59 GMT -# © 2019 Unicode®, Inc. +# DerivedAge-14.0.0.txt +# Date: 2021-07-10, 00:35:00 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -40,7 +40,7 @@ # an expression such as "\p{age=3.0}" matches all of the code points # assigned in Version 3.0--that is, all the code points with a value # less than or equal to 3.0 for the Age property. -# For more information, see [http://www.unicode.org/reports/tr18/]. +# For more information, see [https://www.unicode.org/reports/tr18/]. # All code points not explicitly listed for Age # have the value Unassigned (NA). 
@@ -1862,4 +1862,91 @@ AB68..AB6B ; 13.0 # [4] LATIN SMALL LETTER TURNED R WITH MIDDLE TILDE..MODI # Total code points: 5930 +# ================================================ + +# Age=V14_0 + +# Newly assigned in Unicode 14.0.0 (September, 2021) + +061D ; 14.0 # ARABIC END OF TEXT MARK +0870..088E ; 14.0 # [31] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC VERTICAL TAIL +0890..0891 ; 14.0 # [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F ; 14.0 # [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08B5 ; 14.0 # ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE +08C8..08D2 ; 14.0 # [11] ARABIC LETTER GRAF..ARABIC LARGE ROUND DOT INSIDE CIRCLE BELOW +0C3C ; 14.0 # TELUGU SIGN NUKTA +0C5D ; 14.0 # TELUGU LETTER NAKAARA POLLU +0CDD ; 14.0 # KANNADA LETTER NAKAARA POLLU +170D ; 14.0 # TAGALOG LETTER RA +1715 ; 14.0 # TAGALOG SIGN PAMUDPOD +171F ; 14.0 # TAGALOG LETTER ARCHAIC RA +180F ; 14.0 # MONGOLIAN FREE VARIATION SELECTOR FOUR +1AC1..1ACE ; 14.0 # [14] COMBINING LEFT PARENTHESIS ABOVE LEFT..COMBINING LATIN SMALL LETTER INSULAR T +1B4C ; 14.0 # BALINESE LETTER ARCHAIC JNYA +1B7D..1B7E ; 14.0 # [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG +1DFA ; 14.0 # COMBINING DOT BELOW LEFT +20C0 ; 14.0 # SOM SIGN +2C2F ; 14.0 # GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI +2C5F ; 14.0 # GLAGOLITIC SMALL LETTER CAUDATE CHRIVI +2E53..2E5D ; 14.0 # [11] MEDIEVAL EXCLAMATION MARK..OBLIQUE HYPHEN +9FFD..9FFF ; 14.0 # [3] CJK UNIFIED IDEOGRAPH-9FFD..CJK UNIFIED IDEOGRAPH-9FFF +A7C0..A7C1 ; 14.0 # [2] LATIN CAPITAL LETTER OLD POLISH O..LATIN SMALL LETTER OLD POLISH O +A7D0..A7D1 ; 14.0 # [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; 14.0 # LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; 14.0 # [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; 14.0 # [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q +FBC2 ; 14.0 # ARABIC SYMBOL WASLA ABOVE +FD40..FD4F ; 14.0 # [16] ARABIC 
LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH +FDCF ; 14.0 # ARABIC LIGATURE SALAAMUHU ALAYNAA +FDFE..FDFF ; 14.0 # [2] ARABIC LIGATURE SUBHAANAHU WA TAAALAA..ARABIC LIGATURE AZZA WA JALL +10570..1057A ; 14.0 # [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; 14.0 # [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; 14.0 # [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; 14.0 # [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; 14.0 # [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; 14.0 # [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; 14.0 # [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; 14.0 # [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE +10780..10785 ; 14.0 # [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; 14.0 # [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; 14.0 # [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL +10F70..10F89 ; 14.0 # [26] OLD UYGHUR LETTER ALEPH..OLD UYGHUR PUNCTUATION FOUR DOTS +11070..11075 ; 14.0 # [6] BRAHMI SIGN OLD TAMIL VIRAMA..BRAHMI LETTER OLD TAMIL LLA +110C2 ; 14.0 # KAITHI VOWEL SIGN VOCALIC R +116B9 ; 14.0 # TAKRI ABBREVIATION SIGN +11740..11746 ; 14.0 # [7] AHOM LETTER CA..AHOM LETTER LLA +11AB0..11ABF ; 14.0 # [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA +12F90..12FF2 ; 14.0 # [99] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM302 +16A70..16ABE ; 14.0 # [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; 14.0 # [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE +1AFF0..1AFF3 ; 14.0 # [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; 14.0 # [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; 14.0 # [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA 
LETTER MINNAN NASALIZED TONE-8 +1B11F..1B122 ; 14.0 # [4] HIRAGANA LETTER ARCHAIC WU..KATAKANA LETTER ARCHAIC WU +1CF00..1CF2D ; 14.0 # [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; 14.0 # [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF50..1CFC3 ; 14.0 # [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK +1D1E9..1D1EA ; 14.0 # [2] MUSICAL SYMBOL SORI..MUSICAL SYMBOL KORON +1DF00..1DF1E ; 14.0 # [31] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL +1E290..1E2AE ; 14.0 # [31] TOTO LETTER PA..TOTO SIGN RISING TONE +1E7E0..1E7E6 ; 14.0 # [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; 14.0 # [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; 14.0 # [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; 14.0 # [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE +1F6DD..1F6DF ; 14.0 # [3] PLAYGROUND SLIDE..RING BUOY +1F7F0 ; 14.0 # HEAVY EQUALS SIGN +1F979 ; 14.0 # FACE HOLDING BACK TEARS +1F9CC ; 14.0 # TROLL +1FA7B..1FA7C ; 14.0 # [2] X-RAY..CRUTCH +1FAA9..1FAAC ; 14.0 # [4] MIRROR BALL..HAMSA +1FAB7..1FABA ; 14.0 # [4] LOTUS..NEST WITH EGGS +1FAC3..1FAC5 ; 14.0 # [3] PREGNANT MAN..PERSON WITH CROWN +1FAD7..1FAD9 ; 14.0 # [3] POURING LIQUID..JAR +1FAE0..1FAE7 ; 14.0 # [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; 14.0 # [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS +2A6DE..2A6DF ; 14.0 # [2] CJK UNIFIED IDEOGRAPH-2A6DE..CJK UNIFIED IDEOGRAPH-2A6DF +2B735..2B738 ; 14.0 # [4] CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 + +# Total code points: 838 + # EOF diff --git a/lib/unicore/DCoreProperties.txt b/lib/unicore/DCoreProperties.txt index bc97e2173d..afc2abd97e 100644 --- a/lib/unicore/DCoreProperties.txt +++ b/lib/unicore/DCoreProperties.txt @@ -1,6 +1,6 @@ -# DerivedCoreProperties-13.0.0.txt -# Date: 2020-01-22, 00:07:19 GMT -# © 2020 
Unicode®, Inc. +# DerivedCoreProperties-14.0.0.txt +# Date: 2021-08-12, 23:12:53 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -341,8 +341,10 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 0829..082C ; Alphabetic # Mn [4] SAMARITAN VOWEL SIGN LONG I..SAMARITAN VOWEL SIGN SUKUN 0840..0858 ; Alphabetic # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; Alphabetic # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; Alphabetic # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; Alphabetic # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; Alphabetic # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; Alphabetic # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +08A0..08C8 ; Alphabetic # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; Alphabetic # Lm ARABIC SMALL FARSI YEH 08D4..08DF ; Alphabetic # Mn [12] ARABIC SMALL HIGH WORD AR-RUB..ARABIC SMALL HIGH WORD WAQFA 08E3..08E9 ; Alphabetic # Mn [7] ARABIC TURNED DAMMA BELOW..ARABIC CURLY KASRATAN 08F0..0902 ; Alphabetic # Mn [19] ARABIC OPEN FATHATAN..DEVANAGARI SIGN ANUSVARA @@ -471,6 +473,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 0C4A..0C4C ; Alphabetic # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU 0C55..0C56 ; Alphabetic # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; Alphabetic # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; Alphabetic # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; Alphabetic # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; Alphabetic # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN 
VOCALIC LL 0C80 ; Alphabetic # Lo KANNADA SIGN SPACING CANDRABINDU @@ -490,7 +493,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 0CCA..0CCB ; Alphabetic # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC ; Alphabetic # Mn KANNADA VOWEL SIGN AU 0CD5..0CD6 ; Alphabetic # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; Alphabetic # Lo KANNADA LETTER FA +0CDD..0CDE ; Alphabetic # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; Alphabetic # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; Alphabetic # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CF1..0CF2 ; Alphabetic # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA @@ -614,10 +617,9 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 16A0..16EA ; Alphabetic # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; Alphabetic # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; Alphabetic # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; Alphabetic # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; Alphabetic # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; Alphabetic # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1713 ; Alphabetic # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U -1720..1731 ; Alphabetic # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +171F..1731 ; Alphabetic # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1732..1733 ; Alphabetic # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1740..1751 ; Alphabetic # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753 ; Alphabetic # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U @@ -670,6 +672,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 1A73..1A74 ; Alphabetic # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG 1AA7 ; Alphabetic # Lm TAI THAM SIGN MAI YAMOK 1ABF..1AC0 ; Alphabetic # Mn [2] 
COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ACC..1ACE ; Alphabetic # Mn [3] COMBINING LATIN SMALL LETTER INSULAR G..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Alphabetic # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; Alphabetic # Mc BALINESE SIGN BISAH 1B05..1B33 ; Alphabetic # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -680,7 +683,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 1B3D..1B41 ; Alphabetic # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; Alphabetic # Mn BALINESE VOWEL SIGN PEPET 1B43 ; Alphabetic # Mc BALINESE VOWEL SIGN PEPET TEDUNG -1B45..1B4B ; Alphabetic # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; Alphabetic # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B80..1B81 ; Alphabetic # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82 ; Alphabetic # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0 ; Alphabetic # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -760,9 +763,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 2183..2184 ; Alphabetic # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 2185..2188 ; Alphabetic # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND 24B6..24E9 ; Alphabetic # So [52] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C00..2C2E ; Alphabetic # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; Alphabetic # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; Alphabetic # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; Alphabetic # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; Alphabetic # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 
2C7E..2CE4 ; Alphabetic # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; Alphabetic # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -802,8 +803,7 @@ FFE9..FFEC ; Math # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS A 31A0..31BF ; Alphabetic # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; Alphabetic # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; Alphabetic # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; Alphabetic # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; Alphabetic # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; Alphabetic # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; Alphabetic # Lm YI SYLLABLE WU A016..A48C ; Alphabetic # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; Alphabetic # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -828,8 +828,11 @@ A771..A787 ; Alphabetic # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER A788 ; Alphabetic # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; Alphabetic # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; Alphabetic # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; Alphabetic # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; Alphabetic # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; Alphabetic # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Alphabetic # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Alphabetic # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; Alphabetic # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; Alphabetic # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Alphabetic 
# L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; Alphabetic # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; Alphabetic # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -985,9 +988,20 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 104D8..104FB ; Alphabetic # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; Alphabetic # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; Alphabetic # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; Alphabetic # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Alphabetic # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Alphabetic # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Alphabetic # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; Alphabetic # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Alphabetic # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Alphabetic # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Alphabetic # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; Alphabetic # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; Alphabetic # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; Alphabetic # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; Alphabetic # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Alphabetic # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Alphabetic # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; Alphabetic # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; Alphabetic # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; Alphabetic 
# Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1028,6 +1042,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 10F00..10F1C ; Alphabetic # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; Alphabetic # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; Alphabetic # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; Alphabetic # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; Alphabetic # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; Alphabetic # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11000 ; Alphabetic # Mc BRAHMI SIGN CANDRABINDU @@ -1035,11 +1050,15 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 11002 ; Alphabetic # Mc BRAHMI SIGN VISARGA 11003..11037 ; Alphabetic # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA 11038..11045 ; Alphabetic # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11071..11072 ; Alphabetic # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; Alphabetic # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; Alphabetic # Lo BRAHMI LETTER OLD TAMIL LLA 11082 ; Alphabetic # Mc KAITHI SIGN VISARGA 11083..110AF ; Alphabetic # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110B0..110B2 ; Alphabetic # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; Alphabetic # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; Alphabetic # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Alphabetic # Mn KAITHI VOWEL SIGN VOCALIC R 110D0..110E8 ; Alphabetic # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11100..11102 ; Alphabetic # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11103..11126 ; Alphabetic # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -1144,6 +1163,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER 
EU..HALFWIDTH HANG 11722..11725 ; Alphabetic # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU 11726 ; Alphabetic # Mc AHOM VOWEL SIGN E 11727..1172A ; Alphabetic # Mn [4] AHOM VOWEL SIGN AW..AHOM VOWEL SIGN AM +11740..11746 ; Alphabetic # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; Alphabetic # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; Alphabetic # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; Alphabetic # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -1185,7 +1205,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 11A8A..11A96 ; Alphabetic # Mn [13] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO SIGN ANUSVARA 11A97 ; Alphabetic # Mc SOYOMBO SIGN VISARGA 11A9D ; Alphabetic # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; Alphabetic # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; Alphabetic # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; Alphabetic # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; Alphabetic # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; Alphabetic # Mc BHAIKSUKI VOWEL SIGN AA @@ -1227,10 +1247,12 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 12000..12399 ; Alphabetic # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; Alphabetic # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; Alphabetic # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; Alphabetic # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; Alphabetic # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; Alphabetic # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; Alphabetic # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; Alphabetic # Lo [31] MRO LETTER TA..MRO LETTER TEK 
+16A70..16ABE ; Alphabetic # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; Alphabetic # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; Alphabetic # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B40..16B43 ; Alphabetic # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM @@ -1249,7 +1271,10 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 17000..187F7 ; Alphabetic # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; Alphabetic # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; Alphabetic # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; Alphabetic # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; Alphabetic # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Alphabetic # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Alphabetic # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; Alphabetic # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; Alphabetic # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; Alphabetic # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; Alphabetic # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -1288,6 +1313,9 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 1D78A..1D7A8 ; Alphabetic # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7AA..1D7C2 ; Alphabetic # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7CB ; Alphabetic # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; Alphabetic # L& [10] LATIN SMALL LETTER FENG DIGRAPH 
WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; Alphabetic # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; Alphabetic # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006 ; Alphabetic # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; Alphabetic # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; Alphabetic # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -1296,7 +1324,12 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 1E100..1E12C ; Alphabetic # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; Alphabetic # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; Alphabetic # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; Alphabetic # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; Alphabetic # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; Alphabetic # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; Alphabetic # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; Alphabetic # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; Alphabetic # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; Alphabetic # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E900..1E943 ; Alphabetic # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1E947 ; Alphabetic # Mn ADLAM HAMZA @@ -1337,15 +1370,15 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 1F130..1F149 ; Alphabetic # So [26] SQUARED LATIN CAPITAL LETTER A..SQUARED LATIN CAPITAL LETTER Z 1F150..1F169 ; Alphabetic # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; 
Alphabetic # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -20000..2A6DD ; Alphabetic # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; Alphabetic # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; Alphabetic # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; Alphabetic # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Alphabetic # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Alphabetic # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Alphabetic # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; Alphabetic # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; Alphabetic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 132875 +# Total code points: 133396 # ================================================ @@ -1798,7 +1831,7 @@ FFDA..FFDC ; Alphabetic # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANG 2170..217F ; Lowercase # Nl [16] SMALL ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2184 ; Lowercase # L& LATIN SMALL LETTER REVERSED C 24D0..24E9 ; Lowercase # So [26] CIRCLED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C30..2C5E ; Lowercase # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C30..2C5F ; Lowercase # L& [48] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C61 ; Lowercase # L& LATIN SMALL LETTER L WITH DOUBLE BAR 2C65..2C66 ; Lowercase # L& [2] LATIN SMALL LETTER A WITH STROKE..LATIN SMALL LETTER T WITH DIAGONAL STROKE 2C68 ; Lowercase # L& LATIN SMALL LETTER H WITH DESCENDER @@ -1970,9 +2003,15 @@ A7B9 ; Lowercase # L& LATIN SMALL LETTER U WITH STROKE A7BB ; Lowercase # L& LATIN SMALL LETTER GLOTTAL A A7BD ; Lowercase # L& 
LATIN SMALL LETTER GLOTTAL I A7BF ; Lowercase # L& LATIN SMALL LETTER GLOTTAL U +A7C1 ; Lowercase # L& LATIN SMALL LETTER OLD POLISH O A7C3 ; Lowercase # L& LATIN SMALL LETTER ANGLICANA W A7C8 ; Lowercase # L& LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY A7CA ; Lowercase # L& LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D1 ; Lowercase # L& LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Lowercase # L& LATIN SMALL LETTER DOUBLE THORN +A7D5 ; Lowercase # L& LATIN SMALL LETTER DOUBLE WYNN +A7D7 ; Lowercase # L& LATIN SMALL LETTER MIDDLE SCOTS S +A7D9 ; Lowercase # L& LATIN SMALL LETTER SIGMOID S A7F6 ; Lowercase # L& LATIN SMALL LETTER REVERSED HALF H A7F8..A7F9 ; Lowercase # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE A7FA ; Lowercase # L& LATIN LETTER SMALL CAPITAL TURNED M @@ -1985,6 +2024,14 @@ FB13..FB17 ; Lowercase # L& [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN S FF41..FF5A ; Lowercase # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z 10428..1044F ; Lowercase # L& [40] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER EW 104D8..104FB ; Lowercase # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10597..105A1 ; Lowercase # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Lowercase # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Lowercase # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Lowercase # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE +10780 ; Lowercase # Lm MODIFIER LETTER SMALL CAPITAL AA +10783..10785 ; Lowercase # Lm [3] MODIFIER LETTER SMALL AE..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Lowercase # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Lowercase # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10CC0..10CF2 ; Lowercase # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 
118C0..118DF ; Lowercase # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Lowercase # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y @@ -2016,9 +2063,11 @@ FF41..FF5A ; Lowercase # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L 1D7AA..1D7C2 ; Lowercase # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7C9 ; Lowercase # L& [6] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC PI SYMBOL 1D7CB ; Lowercase # L& MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; Lowercase # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0B..1DF1E ; Lowercase # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E922..1E943 ; Lowercase # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2344 +# Total code points: 2471 # ================================================ @@ -2458,7 +2507,7 @@ FF41..FF5A ; Lowercase # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L 2160..216F ; Uppercase # Nl [16] ROMAN NUMERAL ONE..ROMAN NUMERAL ONE THOUSAND 2183 ; Uppercase # L& ROMAN NUMERAL REVERSED ONE HUNDRED 24B6..24CF ; Uppercase # So [26] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN CAPITAL LETTER Z -2C00..2C2E ; Uppercase # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C00..2C2F ; Uppercase # L& [48] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; Uppercase # L& LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62..2C64 ; Uppercase # L& [3] LATIN CAPITAL LETTER L WITH MIDDLE TILDE..LATIN CAPITAL LETTER R WITH TAIL 2C67 ; Uppercase # L& LATIN CAPITAL LETTER H WITH DESCENDER @@ -2623,13 +2672,21 @@ A7B8 ; Uppercase # L& LATIN CAPITAL LETTER U WITH STROKE A7BA ; Uppercase # L& LATIN CAPITAL LETTER GLOTTAL A A7BC ; Uppercase # L& LATIN CAPITAL LETTER GLOTTAL I A7BE ; 
Uppercase # L& LATIN CAPITAL LETTER GLOTTAL U +A7C0 ; Uppercase # L& LATIN CAPITAL LETTER OLD POLISH O A7C2 ; Uppercase # L& LATIN CAPITAL LETTER ANGLICANA W A7C4..A7C7 ; Uppercase # L& [4] LATIN CAPITAL LETTER C WITH PALATAL HOOK..LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; Uppercase # L& LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; Uppercase # L& LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; Uppercase # L& LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; Uppercase # L& LATIN CAPITAL LETTER SIGMOID S A7F5 ; Uppercase # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Uppercase # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Uppercase # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; Uppercase # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Uppercase # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Uppercase # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Uppercase # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Uppercase # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 10C80..10CB2 ; Uppercase # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Uppercase # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Uppercase # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y @@ -2669,7 +2726,7 @@ FF21..FF3A ; Uppercase # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH 1F150..1F169 ; Uppercase # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Uppercase # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 1911 +# Total code points: 1951 # ================================================ @@ -2761,9 +2818,7 @@ FF21..FF3A ; Uppercase # L& 
[26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH 2160..217F ; Cased # Nl [32] ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2183..2184 ; Cased # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 24B6..24E9 ; Cased # So [52] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C00..2C2E ; Cased # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; Cased # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; Cased # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; Cased # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; Cased # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; Cased # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; Cased # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -2778,8 +2833,10 @@ A722..A76F ; Cased # L& [78] LATIN CAPITAL LETTER EGYPTOLOGICAL ALEF..LATIN A770 ; Cased # Lm MODIFIER LETTER US A771..A787 ; Cased # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR T A78B..A78E ; Cased # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT -A790..A7BF ; Cased # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; Cased # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; Cased # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Cased # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Cased # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; Cased # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S A7F5..A7F6 ; Cased # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED 
HALF H A7F8..A7F9 ; Cased # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE A7FA ; Cased # L& LATIN LETTER SMALL CAPITAL TURNED M @@ -2794,6 +2851,18 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 10400..1044F ; Cased # L& [80] DESERET CAPITAL LETTER LONG I..DESERET SMALL LETTER EW 104B0..104D3 ; Cased # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA 104D8..104FB ; Cased # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10570..1057A ; Cased # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Cased # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Cased # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Cased # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; Cased # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Cased # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Cased # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Cased # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE +10780 ; Cased # Lm MODIFIER LETTER SMALL CAPITAL AA +10783..10785 ; Cased # Lm [3] MODIFIER LETTER SMALL AE..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Cased # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Cased # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10C80..10CB2 ; Cased # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 10CC0..10CF2 ; Cased # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118A0..118DF ; Cased # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO @@ -2828,12 +2897,14 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1D78A..1D7A8 ; Cased # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL 
SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7AA..1D7C2 ; Cased # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7CB ; Cased # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; Cased # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0B..1DF1E ; Cased # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E900..1E943 ; Cased # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1F130..1F149 ; Cased # So [26] SQUARED LATIN CAPITAL LETTER A..SQUARED LATIN CAPITAL LETTER Z 1F150..1F169 ; Cased # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Cased # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 4286 +# Total code points: 4453 # ================================================ @@ -2908,7 +2979,11 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 0828 ; Case_Ignorable # Lm SAMARITAN MODIFIER LETTER I 0829..082D ; Case_Ignorable # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; Case_Ignorable # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; Case_Ignorable # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0888 ; Case_Ignorable # Sk ARABIC RAISED ROUND DOT +0890..0891 ; Case_Ignorable # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F ; Case_Ignorable # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08C9 ; Case_Ignorable # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; Case_Ignorable # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E2 ; Case_Ignorable # Cf ARABIC DISPUTED END OF AYAH 08E3..0902 ; Case_Ignorable # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 093A ; Case_Ignorable # Mn 
DEVANAGARI VOWEL SIGN OE @@ -2951,6 +3026,7 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 0BCD ; Case_Ignorable # Mn TAMIL SIGN VIRAMA 0C00 ; Case_Ignorable # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C04 ; Case_Ignorable # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; Case_Ignorable # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; Case_Ignorable # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C46..0C48 ; Case_Ignorable # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; Case_Ignorable # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA @@ -3003,7 +3079,7 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 10FC ; Case_Ignorable # Lm MODIFIER LETTER GEORGIAN NAR 135D..135F ; Case_Ignorable # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; Case_Ignorable # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; Case_Ignorable # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; Case_Ignorable # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1752..1753 ; Case_Ignorable # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; Case_Ignorable # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; Case_Ignorable # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -3014,6 +3090,7 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 17DD ; Case_Ignorable # Mn KHMER SIGN ATTHACAN 180B..180D ; Case_Ignorable # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; Case_Ignorable # Cf MONGOLIAN VOWEL SEPARATOR +180F ; Case_Ignorable # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1843 ; Case_Ignorable # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN 1885..1886 ; Case_Ignorable # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; Case_Ignorable # Mn MONGOLIAN LETTER ALI GALI DAGALGA @@ -3033,7 +3110,7 @@ FF41..FF5A 
; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1AA7 ; Case_Ignorable # Lm TAI THAM SIGN MAI YAMOK 1AB0..1ABD ; Case_Ignorable # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; Case_Ignorable # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; Case_Ignorable # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Case_Ignorable # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Case_Ignorable # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B34 ; Case_Ignorable # Mn BALINESE SIGN REREKAN 1B36..1B3A ; Case_Ignorable # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA @@ -3060,8 +3137,7 @@ FF41..FF5A ; Cased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1D2C..1D6A ; Case_Ignorable # Lm [63] MODIFIER LETTER CAPITAL A..GREEK SUBSCRIPT SMALL LETTER CHI 1D78 ; Case_Ignorable # Lm MODIFIER LETTER CYRILLIC EN 1D9B..1DBF ; Case_Ignorable # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9 ; Case_Ignorable # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Case_Ignorable # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Case_Ignorable # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1FBD ; Case_Ignorable # Sk GREEK KORONIS 1FBF..1FC1 ; Case_Ignorable # Sk [3] GREEK PSILI..GREEK DIALYTIKA AND PERISPOMENI 1FCD..1FCF ; Case_Ignorable # Sk [3] GREEK PSILI AND VARIA..GREEK PSILI AND PERISPOMENI @@ -3114,6 +3190,7 @@ A720..A721 ; Case_Ignorable # Sk [2] MODIFIER LETTER STRESS AND HIGH TONE.. 
A770 ; Case_Ignorable # Lm MODIFIER LETTER US A788 ; Case_Ignorable # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; Case_Ignorable # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN +A7F2..A7F4 ; Case_Ignorable # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F8..A7F9 ; Case_Ignorable # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE A802 ; Case_Ignorable # Mn SYLOTI NAGRI SIGN DVISVARA A806 ; Case_Ignorable # Mn SYLOTI NAGRI SIGN HASANTA @@ -3156,7 +3233,7 @@ ABE5 ; Case_Ignorable # Mn MEETEI MAYEK VOWEL SIGN ANAP ABE8 ; Case_Ignorable # Mn MEETEI MAYEK VOWEL SIGN UNAP ABED ; Case_Ignorable # Mn MEETEI MAYEK APUN IYEK FB1E ; Case_Ignorable # Mn HEBREW POINT JUDEO-SPANISH VARIKA -FBB2..FBC1 ; Case_Ignorable # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; Case_Ignorable # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FE00..FE0F ; Case_Ignorable # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 FE13 ; Case_Ignorable # Po PRESENTATION FORM FOR VERTICAL COLON FE20..FE2F ; Case_Ignorable # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITLO RIGHT HALF @@ -3175,6 +3252,9 @@ FFF9..FFFB ; Case_Ignorable # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLI 101FD ; Case_Ignorable # Mn PHAISTOS DISC SIGN COMBINING OBLIQUE STROKE 102E0 ; Case_Ignorable # Mn COPTIC EPACT THOUSANDS MARK 10376..1037A ; Case_Ignorable # Mn [5] COMBINING OLD PERMIC LETTER AN..COMBINING OLD PERMIC LETTER SII +10780..10785 ; Case_Ignorable # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Case_Ignorable # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Case_Ignorable # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10A01..10A03 ; Case_Ignorable # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R 10A05..10A06 ; Case_Ignorable # Mn [2] KHAROSHTHI 
VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O 10A0C..10A0F ; Case_Ignorable # Mn [4] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN VISARGA @@ -3184,12 +3264,16 @@ FFF9..FFFB ; Case_Ignorable # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLI 10D24..10D27 ; Case_Ignorable # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; Case_Ignorable # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; Case_Ignorable # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Case_Ignorable # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11001 ; Case_Ignorable # Mn BRAHMI SIGN ANUSVARA 11038..11046 ; Case_Ignorable # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; Case_Ignorable # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Case_Ignorable # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; Case_Ignorable # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 110B3..110B6 ; Case_Ignorable # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B9..110BA ; Case_Ignorable # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA 110BD ; Case_Ignorable # Cf KAITHI NUMBER SIGN +110C2 ; Case_Ignorable # Mn KAITHI VOWEL SIGN VOCALIC R 110CD ; Case_Ignorable # Cf KAITHI NUMBER SIGN ABOVE 11100..11102 ; Case_Ignorable # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Case_Ignorable # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU @@ -3274,8 +3358,13 @@ FFF9..FFFB ; Case_Ignorable # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLI 16FE0..16FE1 ; Case_Ignorable # Lm [2] TANGUT ITERATION MARK..NUSHU ITERATION MARK 16FE3 ; Case_Ignorable # Lm OLD CHINESE ITERATION MARK 16FE4 ; Case_Ignorable # Mn KHITAN SMALL SCRIPT FILLER +1AFF0..1AFF3 ; Case_Ignorable # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Case_Ignorable # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 
+1AFFD..1AFFE ; Case_Ignorable # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1BC9D..1BC9E ; Case_Ignorable # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BCA0..1BCA3 ; Case_Ignorable # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; Case_Ignorable # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Case_Ignorable # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D167..1D169 ; Case_Ignorable # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D173..1D17A ; Case_Ignorable # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1D17B..1D182 ; Case_Ignorable # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE @@ -3295,6 +3384,7 @@ FFF9..FFFB ; Case_Ignorable # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLI 1E026..1E02A ; Case_Ignorable # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; Case_Ignorable # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D 1E137..1E13D ; Case_Ignorable # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER +1E2AE ; Case_Ignorable # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; Case_Ignorable # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Case_Ignorable # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; Case_Ignorable # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA @@ -3304,7 +3394,7 @@ E0001 ; Case_Ignorable # Cf LANGUAGE TAG E0020..E007F ; Case_Ignorable # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Case_Ignorable # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2413 +# Total code points: 2602 # ================================================ @@ -3738,7 +3828,7 @@ E0100..E01EF ; Case_Ignorable # Mn [240] VARIATION 
SELECTOR-17..VARIATION SELEC 2160..216F ; Changes_When_Lowercased # Nl [16] ROMAN NUMERAL ONE..ROMAN NUMERAL ONE THOUSAND 2183 ; Changes_When_Lowercased # L& ROMAN NUMERAL REVERSED ONE HUNDRED 24B6..24CF ; Changes_When_Lowercased # So [26] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN CAPITAL LETTER Z -2C00..2C2E ; Changes_When_Lowercased # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C00..2C2F ; Changes_When_Lowercased # L& [48] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62..2C64 ; Changes_When_Lowercased # L& [3] LATIN CAPITAL LETTER L WITH MIDDLE TILDE..LATIN CAPITAL LETTER R WITH TAIL 2C67 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER H WITH DESCENDER @@ -3903,19 +3993,27 @@ A7B8 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER U WITH S A7BA ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER GLOTTAL A A7BC ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER GLOTTAL I A7BE ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER GLOTTAL U +A7C0 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER OLD POLISH O A7C2 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER ANGLICANA W A7C4..A7C7 ; Changes_When_Lowercased # L& [4] LATIN CAPITAL LETTER C WITH PALATAL HOOK..LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER SIGMOID S A7F5 ; Changes_When_Lowercased # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Changes_When_Lowercased # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Changes_When_Lowercased # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; 
Changes_When_Lowercased # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Changes_When_Lowercased # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Changes_When_Lowercased # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Changes_When_Lowercased # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Changes_When_Lowercased # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 10C80..10CB2 ; Changes_When_Lowercased # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Changes_When_Lowercased # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Changes_When_Lowercased # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y 1E900..1E921 ; Changes_When_Lowercased # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1393 +# Total code points: 1433 # ================================================ @@ -4363,7 +4461,7 @@ FF21..FF3A ; Changes_When_Lowercased # L& [26] FULLWIDTH LATIN CAPITAL LETTE 2170..217F ; Changes_When_Uppercased # Nl [16] SMALL ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2184 ; Changes_When_Uppercased # L& LATIN SMALL LETTER REVERSED C 24D0..24E9 ; Changes_When_Uppercased # So [26] CIRCLED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C30..2C5E ; Changes_When_Uppercased # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C30..2C5F ; Changes_When_Uppercased # L& [48] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C61 ; Changes_When_Uppercased # L& LATIN SMALL LETTER L WITH DOUBLE BAR 2C65..2C66 ; Changes_When_Uppercased # L& [2] LATIN SMALL LETTER A WITH STROKE..LATIN SMALL LETTER T WITH DIAGONAL STROKE 2C68 ; Changes_When_Uppercased # L& LATIN SMALL LETTER H WITH DESCENDER @@ -4528,9 +4626,13 @@ A7B9 ; Changes_When_Uppercased # L& LATIN SMALL LETTER U 
WITH STR A7BB ; Changes_When_Uppercased # L& LATIN SMALL LETTER GLOTTAL A A7BD ; Changes_When_Uppercased # L& LATIN SMALL LETTER GLOTTAL I A7BF ; Changes_When_Uppercased # L& LATIN SMALL LETTER GLOTTAL U +A7C1 ; Changes_When_Uppercased # L& LATIN SMALL LETTER OLD POLISH O A7C3 ; Changes_When_Uppercased # L& LATIN SMALL LETTER ANGLICANA W A7C8 ; Changes_When_Uppercased # L& LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY A7CA ; Changes_When_Uppercased # L& LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D1 ; Changes_When_Uppercased # L& LATIN SMALL LETTER CLOSED INSULAR G +A7D7 ; Changes_When_Uppercased # L& LATIN SMALL LETTER MIDDLE SCOTS S +A7D9 ; Changes_When_Uppercased # L& LATIN SMALL LETTER SIGMOID S A7F6 ; Changes_When_Uppercased # L& LATIN SMALL LETTER REVERSED HALF H AB53 ; Changes_When_Uppercased # L& LATIN SMALL LETTER CHI AB70..ABBF ; Changes_When_Uppercased # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA @@ -4539,12 +4641,16 @@ FB13..FB17 ; Changes_When_Uppercased # L& [5] ARMENIAN SMALL LIGATURE MEN N FF41..FF5A ; Changes_When_Uppercased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z 10428..1044F ; Changes_When_Uppercased # L& [40] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER EW 104D8..104FB ; Changes_When_Uppercased # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10597..105A1 ; Changes_When_Uppercased # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Changes_When_Uppercased # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Changes_When_Uppercased # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Changes_When_Uppercased # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10CC0..10CF2 ; Changes_When_Uppercased # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118C0..118DF ; Changes_When_Uppercased # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; 
Changes_When_Uppercased # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y 1E922..1E943 ; Changes_When_Uppercased # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 1485 +# Total code points: 1525 # ================================================ @@ -4991,7 +5097,7 @@ FF41..FF5A ; Changes_When_Uppercased # L& [26] FULLWIDTH LATIN SMALL LETTER 2170..217F ; Changes_When_Titlecased # Nl [16] SMALL ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2184 ; Changes_When_Titlecased # L& LATIN SMALL LETTER REVERSED C 24D0..24E9 ; Changes_When_Titlecased # So [26] CIRCLED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C30..2C5E ; Changes_When_Titlecased # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C30..2C5F ; Changes_When_Titlecased # L& [48] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C61 ; Changes_When_Titlecased # L& LATIN SMALL LETTER L WITH DOUBLE BAR 2C65..2C66 ; Changes_When_Titlecased # L& [2] LATIN SMALL LETTER A WITH STROKE..LATIN SMALL LETTER T WITH DIAGONAL STROKE 2C68 ; Changes_When_Titlecased # L& LATIN SMALL LETTER H WITH DESCENDER @@ -5156,9 +5262,13 @@ A7B9 ; Changes_When_Titlecased # L& LATIN SMALL LETTER U WITH STR A7BB ; Changes_When_Titlecased # L& LATIN SMALL LETTER GLOTTAL A A7BD ; Changes_When_Titlecased # L& LATIN SMALL LETTER GLOTTAL I A7BF ; Changes_When_Titlecased # L& LATIN SMALL LETTER GLOTTAL U +A7C1 ; Changes_When_Titlecased # L& LATIN SMALL LETTER OLD POLISH O A7C3 ; Changes_When_Titlecased # L& LATIN SMALL LETTER ANGLICANA W A7C8 ; Changes_When_Titlecased # L& LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY A7CA ; Changes_When_Titlecased # L& LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D1 ; Changes_When_Titlecased # L& LATIN SMALL LETTER CLOSED INSULAR G +A7D7 ; Changes_When_Titlecased # L& LATIN SMALL LETTER MIDDLE SCOTS S +A7D9 ; Changes_When_Titlecased # L& LATIN SMALL LETTER SIGMOID S A7F6 ; Changes_When_Titlecased # L& 
LATIN SMALL LETTER REVERSED HALF H AB53 ; Changes_When_Titlecased # L& LATIN SMALL LETTER CHI AB70..ABBF ; Changes_When_Titlecased # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA @@ -5167,12 +5277,16 @@ FB13..FB17 ; Changes_When_Titlecased # L& [5] ARMENIAN SMALL LIGATURE MEN N FF41..FF5A ; Changes_When_Titlecased # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z 10428..1044F ; Changes_When_Titlecased # L& [40] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER EW 104D8..104FB ; Changes_When_Titlecased # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10597..105A1 ; Changes_When_Titlecased # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Changes_When_Titlecased # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Changes_When_Titlecased # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Changes_When_Titlecased # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10CC0..10CF2 ; Changes_When_Titlecased # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118C0..118DF ; Changes_When_Titlecased # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Changes_When_Titlecased # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y 1E922..1E943 ; Changes_When_Titlecased # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 1412 +# Total code points: 1452 # ================================================ @@ -5616,7 +5730,7 @@ FF41..FF5A ; Changes_When_Titlecased # L& [26] FULLWIDTH LATIN SMALL LETTER 2160..216F ; Changes_When_Casefolded # Nl [16] ROMAN NUMERAL ONE..ROMAN NUMERAL ONE THOUSAND 2183 ; Changes_When_Casefolded # L& ROMAN NUMERAL REVERSED ONE HUNDRED 24B6..24CF ; Changes_When_Casefolded # So [26] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN CAPITAL LETTER Z -2C00..2C2E ; Changes_When_Casefolded # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER 
LATINATE MYSLITE +2C00..2C2F ; Changes_When_Casefolded # L& [48] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62..2C64 ; Changes_When_Casefolded # L& [3] LATIN CAPITAL LETTER L WITH MIDDLE TILDE..LATIN CAPITAL LETTER R WITH TAIL 2C67 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER H WITH DESCENDER @@ -5781,9 +5895,13 @@ A7B8 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER U WITH S A7BA ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER GLOTTAL A A7BC ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER GLOTTAL I A7BE ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER GLOTTAL U +A7C0 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER OLD POLISH O A7C2 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER ANGLICANA W A7C4..A7C7 ; Changes_When_Casefolded # L& [4] LATIN CAPITAL LETTER C WITH PALATAL HOOK..LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER SIGMOID S A7F5 ; Changes_When_Casefolded # L& LATIN CAPITAL LETTER REVERSED HALF H AB70..ABBF ; Changes_When_Casefolded # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA FB00..FB06 ; Changes_When_Casefolded # L& [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST @@ -5791,12 +5909,16 @@ FB13..FB17 ; Changes_When_Casefolded # L& [5] ARMENIAN SMALL LIGATURE MEN N FF21..FF3A ; Changes_When_Casefolded # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Changes_When_Casefolded # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; Changes_When_Casefolded # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Changes_When_Casefolded # 
L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Changes_When_Casefolded # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Changes_When_Casefolded # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Changes_When_Casefolded # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 10C80..10CB2 ; Changes_When_Casefolded # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Changes_When_Casefolded # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Changes_When_Casefolded # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y 1E900..1E921 ; Changes_When_Casefolded # L& [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1466 +# Total code points: 1506 # ================================================ @@ -5893,9 +6015,7 @@ FF21..FF3A ; Changes_When_Casefolded # L& [26] FULLWIDTH LATIN CAPITAL LETTE 2160..217F ; Changes_When_Casemapped # Nl [32] ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2183..2184 ; Changes_When_Casemapped # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 24B6..24E9 ; Changes_When_Casemapped # So [52] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C00..2C2E ; Changes_When_Casemapped # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; Changes_When_Casemapped # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C70 ; Changes_When_Casemapped # L& [17] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN CAPITAL LETTER TURNED ALPHA +2C00..2C70 ; Changes_When_Casemapped # L& [113] GLAGOLITIC CAPITAL LETTER AZU..LATIN CAPITAL LETTER TURNED ALPHA 2C72..2C73 ; Changes_When_Casemapped # L& [2] LATIN CAPITAL LETTER W WITH HOOK..LATIN SMALL LETTER W WITH HOOK 2C75..2C76 ; Changes_When_Casemapped # L& [2] LATIN CAPITAL LETTER HALF 
H..LATIN SMALL LETTER HALF H 2C7E..2CE3 ; Changes_When_Casemapped # L& [102] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SMALL LETTER OLD NUBIAN WAU @@ -5912,8 +6032,9 @@ A779..A787 ; Changes_When_Casemapped # L& [15] LATIN CAPITAL LETTER INSULAR A78B..A78D ; Changes_When_Casemapped # L& [3] LATIN CAPITAL LETTER SALTILLO..LATIN CAPITAL LETTER TURNED H A790..A794 ; Changes_When_Casemapped # L& [5] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER C WITH PALATAL HOOK A796..A7AE ; Changes_When_Casemapped # L& [25] LATIN CAPITAL LETTER B WITH FLOURISH..LATIN CAPITAL LETTER SMALL CAPITAL I -A7B0..A7BF ; Changes_When_Casemapped # L& [16] LATIN CAPITAL LETTER TURNED K..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; Changes_When_Casemapped # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7B0..A7CA ; Changes_When_Casemapped # L& [27] LATIN CAPITAL LETTER TURNED K..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Changes_When_Casemapped # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D6..A7D9 ; Changes_When_Casemapped # L& [4] LATIN CAPITAL LETTER MIDDLE SCOTS S..LATIN SMALL LETTER SIGMOID S A7F5..A7F6 ; Changes_When_Casemapped # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H AB53 ; Changes_When_Casemapped # L& LATIN SMALL LETTER CHI AB70..ABBF ; Changes_When_Casemapped # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA @@ -5924,13 +6045,21 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 10400..1044F ; Changes_When_Casemapped # L& [80] DESERET CAPITAL LETTER LONG I..DESERET SMALL LETTER EW 104B0..104D3 ; Changes_When_Casemapped # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA 104D8..104FB ; Changes_When_Casemapped # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10570..1057A ; Changes_When_Casemapped # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; 
Changes_When_Casemapped # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Changes_When_Casemapped # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Changes_When_Casemapped # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; Changes_When_Casemapped # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Changes_When_Casemapped # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Changes_When_Casemapped # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Changes_When_Casemapped # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10C80..10CB2 ; Changes_When_Casemapped # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 10CC0..10CF2 ; Changes_When_Casemapped # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118A0..118DF ; Changes_When_Casemapped # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E40..16E7F ; Changes_When_Casemapped # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y 1E900..1E943 ; Changes_When_Casemapped # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2847 +# Total code points: 2927 # ================================================ @@ -6003,8 +6132,10 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 0828 ; ID_Start # Lm SAMARITAN MODIFIER LETTER I 0840..0858 ; ID_Start # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; ID_Start # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; ID_Start # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; ID_Start # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; ID_Start # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; 
ID_Start # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +08A0..08C8 ; ID_Start # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; ID_Start # Lm ARABIC SMALL FARSI YEH 0904..0939 ; ID_Start # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; ID_Start # Lo DEVANAGARI SIGN AVAGRAHA 0950 ; ID_Start # Lo DEVANAGARI OM @@ -6070,6 +6201,7 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 0C2A..0C39 ; ID_Start # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; ID_Start # Lo TELUGU SIGN AVAGRAHA 0C58..0C5A ; ID_Start # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; ID_Start # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; ID_Start # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C80 ; ID_Start # Lo KANNADA SIGN SPACING CANDRABINDU 0C85..0C8C ; ID_Start # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L @@ -6078,7 +6210,7 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 0CAA..0CB3 ; ID_Start # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; ID_Start # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; ID_Start # Lo KANNADA SIGN AVAGRAHA -0CDE ; ID_Start # Lo KANNADA LETTER FA +0CDD..0CDE ; ID_Start # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; ID_Start # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; ID_Start # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; ID_Start # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -6153,9 +6285,8 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 16A0..16EA ; ID_Start # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; ID_Start # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; ID_Start # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; ID_Start # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; ID_Start # Lo [4] 
TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; ID_Start # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; ID_Start # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; ID_Start # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; ID_Start # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; ID_Start # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; ID_Start # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -6179,7 +6310,7 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 1A20..1A54 ; ID_Start # Lo [53] TAI THAM LETTER HIGH KA..TAI THAM LETTER GREAT SA 1AA7 ; ID_Start # Lm TAI THAM SIGN MAI YAMOK 1B05..1B33 ; ID_Start # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; ID_Start # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; ID_Start # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B83..1BA0 ; ID_Start # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BAE..1BAF ; ID_Start # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBA..1BE5 ; ID_Start # Lo [44] SUNDANESE AVAGRAHA..BATAK LETTER U @@ -6242,9 +6373,7 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 2160..2182 ; ID_Start # Nl [35] ROMAN NUMERAL ONE..ROMAN NUMERAL TEN THOUSAND 2183..2184 ; ID_Start # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 2185..2188 ; ID_Start # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND -2C00..2C2E ; ID_Start # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; ID_Start # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; ID_Start # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; ID_Start # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; ID_Start # Lm [2] LATIN SUBSCRIPT SMALL LETTER 
J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; ID_Start # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; ID_Start # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -6283,8 +6412,7 @@ FF41..FF5A ; Changes_When_Casemapped # L& [26] FULLWIDTH LATIN SMALL LETTER 31A0..31BF ; ID_Start # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; ID_Start # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; ID_Start # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; ID_Start # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; ID_Start # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; ID_Start # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; ID_Start # Lm YI SYLLABLE WU A016..A48C ; ID_Start # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; ID_Start # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -6307,8 +6435,11 @@ A771..A787 ; ID_Start # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER I A788 ; ID_Start # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; ID_Start # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ID_Start # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; ID_Start # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; ID_Start # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; ID_Start # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; ID_Start # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; ID_Start # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; ID_Start # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; ID_Start # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ID_Start # L& [2] 
LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ID_Start # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; ID_Start # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -6418,9 +6549,20 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 104D8..104FB ; ID_Start # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; ID_Start # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; ID_Start # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; ID_Start # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; ID_Start # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; ID_Start # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; ID_Start # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; ID_Start # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; ID_Start # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; ID_Start # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; ID_Start # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; ID_Start # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; ID_Start # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; ID_Start # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; ID_Start # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; ID_Start # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; ID_Start # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; ID_Start # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; ID_Start # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; ID_Start # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO 
@@ -6456,9 +6598,12 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 10F00..10F1C ; ID_Start # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; ID_Start # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; ID_Start # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; ID_Start # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; ID_Start # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; ID_Start # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; ID_Start # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA +11071..11072 ; ID_Start # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; ID_Start # Lo BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; ID_Start # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110D0..110E8 ; ID_Start # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11103..11126 ; ID_Start # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -6500,6 +6645,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 11680..116AA ; ID_Start # Lo [43] TAKRI LETTER A..TAKRI LETTER RRA 116B8 ; ID_Start # Lo TAKRI LETTER ARCHAIC KHA 11700..1171A ; ID_Start # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; ID_Start # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; ID_Start # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 118A0..118DF ; ID_Start # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 118FF..11906 ; ID_Start # Lo [8] WARANG CITI OM..DIVES AKURU LETTER E @@ -6519,7 +6665,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 11A50 ; ID_Start # Lo SOYOMBO LETTER A 11A5C..11A89 ; ID_Start # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; ID_Start # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; ID_Start # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 
+11AB0..11AF8 ; ID_Start # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; ID_Start # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; ID_Start # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; ID_Start # Lo BHAIKSUKI SIGN AVAGRAHA @@ -6537,10 +6683,12 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 12000..12399 ; ID_Start # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; ID_Start # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; ID_Start # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; ID_Start # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; ID_Start # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; ID_Start # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; ID_Start # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; ID_Start # Lo [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; ID_Start # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; ID_Start # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; ID_Start # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B40..16B43 ; ID_Start # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM @@ -6555,7 +6703,10 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 17000..187F7 ; ID_Start # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; ID_Start # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; ID_Start # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; ID_Start # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; ID_Start # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; ID_Start # Lm 
[7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; ID_Start # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; ID_Start # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; ID_Start # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; ID_Start # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; ID_Start # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -6593,10 +6744,18 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1D78A..1D7A8 ; ID_Start # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7AA..1D7C2 ; ID_Start # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7CB ; ID_Start # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; ID_Start # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; ID_Start # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; ID_Start # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; ID_Start # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; ID_Start # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; ID_Start # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; ID_Start # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; ID_Start # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; ID_Start # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; ID_Start # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; ID_Start # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; 
ID_Start # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; ID_Start # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E900..1E943 ; ID_Start # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1E94B ; ID_Start # Lm ADLAM NASALIZATION MARK @@ -6633,15 +6792,15 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1EEA1..1EEA3 ; ID_Start # Lo [3] ARABIC MATHEMATICAL DOUBLE-STRUCK BEH..ARABIC MATHEMATICAL DOUBLE-STRUCK DAL 1EEA5..1EEA9 ; ID_Start # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 1EEAB..1EEBB ; ID_Start # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN -20000..2A6DD ; ID_Start # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; ID_Start # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; ID_Start # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; ID_Start # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; ID_Start # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; ID_Start # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; ID_Start # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; ID_Start # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; ID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 131482 +# Total code points: 131997 # ================================================ @@ -6746,9 +6905,12 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 0840..0858 ; ID_Continue # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0859..085B ; ID_Continue # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 0860..086A ; ID_Continue # Lo [11] 
SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; ID_Continue # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; ID_Continue # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1 ; ID_Continue # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887 ; ID_Continue # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; ID_Continue # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0898..089F ; ID_Continue # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8 ; ID_Continue # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; ID_Continue # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; ID_Continue # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; ID_Continue # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; ID_Continue # Mc DEVANAGARI SIGN VISARGA 0904..0939 ; ID_Continue # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA @@ -6886,6 +7048,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 0C0E..0C10 ; ID_Continue # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28 ; ID_Continue # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39 ; ID_Continue # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C3C ; ID_Continue # Mn TELUGU SIGN NUKTA 0C3D ; ID_Continue # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40 ; ID_Continue # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; ID_Continue # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -6893,6 +7056,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 0C4A..0C4D ; ID_Continue # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; ID_Continue # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; ID_Continue # Lo [3] TELUGU LETTER TSA..TELUGU LETTER 
RRRA +0C5D ; ID_Continue # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; ID_Continue # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; ID_Continue # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; ID_Continue # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -6914,7 +7078,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 0CCA..0CCB ; ID_Continue # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD ; ID_Continue # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6 ; ID_Continue # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; ID_Continue # Lo KANNADA LETTER FA +0CDD..0CDE ; ID_Continue # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; ID_Continue # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; ID_Continue # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; ID_Continue # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -7058,11 +7222,12 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 16A0..16EA ; ID_Continue # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; ID_Continue # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; ID_Continue # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; ID_Continue # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; ID_Continue # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; ID_Continue # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714 ; ID_Continue # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1720..1731 ; ID_Continue # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734 ; ID_Continue # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; ID_Continue # Mc TAGALOG SIGN PAMUDPOD +171F..1731 ; ID_Continue # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA +1732..1733 ; ID_Continue # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL 
SIGN U +1734 ; ID_Continue # Mc HANUNOO SIGN PAMUDPOD 1740..1751 ; ID_Continue # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753 ; ID_Continue # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1760..176C ; ID_Continue # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA @@ -7081,6 +7246,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 17DD ; ID_Continue # Mn KHMER SIGN ATTHACAN 17E0..17E9 ; ID_Continue # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE 180B..180D ; ID_Continue # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; ID_Continue # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; ID_Continue # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; ID_Continue # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; ID_Continue # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -7128,7 +7294,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1A90..1A99 ; ID_Continue # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE 1AA7 ; ID_Continue # Lm TAI THAM SIGN MAI YAMOK 1AB0..1ABD ; ID_Continue # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW -1ABF..1AC0 ; ID_Continue # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; ID_Continue # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; ID_Continue # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; ID_Continue # Mc BALINESE SIGN BISAH 1B05..1B33 ; ID_Continue # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -7140,7 +7306,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1B3D..1B41 ; ID_Continue # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; ID_Continue # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44 ; ID_Continue # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; 
ID_Continue # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; ID_Continue # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; ID_Continue # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B6B..1B73 ; ID_Continue # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B80..1B81 ; ID_Continue # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR @@ -7194,8 +7360,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1D78 ; ID_Continue # Lm MODIFIER LETTER CYRILLIC EN 1D79..1D9A ; ID_Continue # L& [34] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF ; ID_Continue # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9 ; ID_Continue # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; ID_Continue # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; ID_Continue # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1F15 ; ID_Continue # L& [278] LATIN CAPITAL LETTER A WITH RING BELOW..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D ; ID_Continue # L& [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA 1F20..1F45 ; ID_Continue # L& [38] GREEK SMALL LETTER ETA WITH PSILI..GREEK SMALL LETTER OMICRON WITH DASIA AND OXIA @@ -7243,9 +7408,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 2160..2182 ; ID_Continue # Nl [35] ROMAN NUMERAL ONE..ROMAN NUMERAL TEN THOUSAND 2183..2184 ; ID_Continue # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 2185..2188 ; ID_Continue # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND -2C00..2C2E ; ID_Continue # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; 
ID_Continue # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; ID_Continue # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; ID_Continue # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; ID_Continue # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; ID_Continue # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; ID_Continue # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -7290,8 +7453,7 @@ FFDA..FFDC ; ID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 31A0..31BF ; ID_Continue # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; ID_Continue # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; ID_Continue # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; ID_Continue # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; ID_Continue # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; ID_Continue # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; ID_Continue # Lm YI SYLLABLE WU A016..A48C ; ID_Continue # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; ID_Continue # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -7319,8 +7481,11 @@ A771..A787 ; ID_Continue # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTE A788 ; ID_Continue # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; ID_Continue # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ID_Continue # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; ID_Continue # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; ID_Continue # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; ID_Continue # L& [59] LATIN CAPITAL LETTER N WITH 
DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; ID_Continue # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; ID_Continue # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; ID_Continue # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; ID_Continue # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ID_Continue # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ID_Continue # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; ID_Continue # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -7499,9 +7664,20 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 104D8..104FB ; ID_Continue # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; ID_Continue # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; ID_Continue # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; ID_Continue # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; ID_Continue # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; ID_Continue # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; ID_Continue # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; ID_Continue # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; ID_Continue # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; ID_Continue # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; ID_Continue # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; ID_Continue # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; ID_Continue # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; ID_Continue # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 
+10780..10785 ; ID_Continue # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; ID_Continue # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; ID_Continue # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; ID_Continue # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; ID_Continue # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; ID_Continue # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -7547,6 +7723,8 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 10F27 ; ID_Continue # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; ID_Continue # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 10F46..10F50 ; ID_Continue # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F70..10F81 ; ID_Continue # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85 ; ID_Continue # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 10FB0..10FC4 ; ID_Continue # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; ID_Continue # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11000 ; ID_Continue # Mc BRAHMI SIGN CANDRABINDU @@ -7555,6 +7733,10 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 11003..11037 ; ID_Continue # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA 11038..11046 ; ID_Continue # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA 11066..1106F ; ID_Continue # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070 ; ID_Continue # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072 ; ID_Continue # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; ID_Continue # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; ID_Continue # Lo BRAHMI LETTER OLD TAMIL LLA 1107F..11081 ; ID_Continue # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN 
ANUSVARA 11082 ; ID_Continue # Mc KAITHI SIGN VISARGA 11083..110AF ; ID_Continue # Lo [45] KAITHI LETTER A..KAITHI LETTER HA @@ -7562,6 +7744,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 110B3..110B6 ; ID_Continue # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; ID_Continue # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU 110B9..110BA ; ID_Continue # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; ID_Continue # Mn KAITHI VOWEL SIGN VOCALIC R 110D0..110E8 ; ID_Continue # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; ID_Continue # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE 11100..11102 ; ID_Continue # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA @@ -7687,6 +7870,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 11726 ; ID_Continue # Mc AHOM VOWEL SIGN E 11727..1172B ; ID_Continue # Mn [5] AHOM VOWEL SIGN AW..AHOM SIGN KILLER 11730..11739 ; ID_Continue # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +11740..11746 ; ID_Continue # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; ID_Continue # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; ID_Continue # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; ID_Continue # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -7737,7 +7921,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 11A97 ; ID_Continue # Mc SOYOMBO SIGN VISARGA 11A98..11A99 ; ID_Continue # Mn [2] SOYOMBO GEMINATION MARK..SOYOMBO SUBJOINER 11A9D ; ID_Continue # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; ID_Continue # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; ID_Continue # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; ID_Continue # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; ID_Continue # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; ID_Continue # Mc BHAIKSUKI VOWEL 
SIGN AA @@ -7783,11 +7967,14 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 12000..12399 ; ID_Continue # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; ID_Continue # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; ID_Continue # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; ID_Continue # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; ID_Continue # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; ID_Continue # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; ID_Continue # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; ID_Continue # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; ID_Continue # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16A70..16ABE ; ID_Continue # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; ID_Continue # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; ID_Continue # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4 ; ID_Continue # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B00..16B2F ; ID_Continue # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU @@ -7810,7 +7997,10 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 17000..187F7 ; ID_Continue # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; ID_Continue # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; ID_Continue # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; ID_Continue # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; ID_Continue # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; ID_Continue # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 
+1AFFD..1AFFE ; ID_Continue # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; ID_Continue # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; ID_Continue # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; ID_Continue # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; ID_Continue # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -7819,6 +8009,8 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 1BC80..1BC88 ; ID_Continue # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; ID_Continue # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1BC9D..1BC9E ; ID_Continue # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; ID_Continue # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; ID_Continue # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D166 ; ID_Continue # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D167..1D169 ; ID_Continue # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; ID_Continue # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 @@ -7863,6 +8055,9 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 1DA84 ; ID_Continue # Mn SIGNWRITING LOCATION HEAD NECK 1DA9B..1DA9F ; ID_Continue # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA1..1DAAF ; ID_Continue # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09 ; ID_Continue # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; ID_Continue # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; ID_Continue # L& 
[20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006 ; ID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; ID_Continue # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; ID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -7873,9 +8068,15 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 1E137..1E13D ; ID_Continue # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E140..1E149 ; ID_Continue # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; ID_Continue # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; ID_Continue # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE ; ID_Continue # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB ; ID_Continue # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF ; ID_Continue # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9 ; ID_Continue # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE +1E7E0..1E7E6 ; ID_Continue # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; ID_Continue # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; ID_Continue # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; ID_Continue # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; ID_Continue # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8D0..1E8D6 ; ID_Continue # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E900..1E943 ; ID_Continue # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA @@ -7916,8 +8117,8 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 1EEA5..1EEA9 ; ID_Continue # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 
1EEAB..1EEBB ; ID_Continue # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN 1FBF0..1FBF9 ; ID_Continue # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -20000..2A6DD ; ID_Continue # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; ID_Continue # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; ID_Continue # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; ID_Continue # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; ID_Continue # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; ID_Continue # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; ID_Continue # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 @@ -7925,7 +8126,7 @@ FFDA..FFDC ; ID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HAN 30000..3134A ; ID_Continue # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 134434 +# Total code points: 135072 # ================================================ @@ -7995,8 +8196,10 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 0828 ; XID_Start # Lm SAMARITAN MODIFIER LETTER I 0840..0858 ; XID_Start # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; XID_Start # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; XID_Start # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; XID_Start # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; XID_Start # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; XID_Start # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC 
VERTICAL TAIL +08A0..08C8 ; XID_Start # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; XID_Start # Lm ARABIC SMALL FARSI YEH 0904..0939 ; XID_Start # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; XID_Start # Lo DEVANAGARI SIGN AVAGRAHA 0950 ; XID_Start # Lo DEVANAGARI OM @@ -8062,6 +8265,7 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 0C2A..0C39 ; XID_Start # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; XID_Start # Lo TELUGU SIGN AVAGRAHA 0C58..0C5A ; XID_Start # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; XID_Start # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; XID_Start # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C80 ; XID_Start # Lo KANNADA SIGN SPACING CANDRABINDU 0C85..0C8C ; XID_Start # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L @@ -8070,7 +8274,7 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 0CAA..0CB3 ; XID_Start # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; XID_Start # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; XID_Start # Lo KANNADA SIGN AVAGRAHA -0CDE ; XID_Start # Lo KANNADA LETTER FA +0CDD..0CDE ; XID_Start # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; XID_Start # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; XID_Start # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; XID_Start # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -8145,9 +8349,8 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 16A0..16EA ; XID_Start # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; XID_Start # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; XID_Start # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; XID_Start # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; XID_Start # Lo [4] TAGALOG LETTER LA..TAGALOG 
LETTER HA -1720..1731 ; XID_Start # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; XID_Start # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; XID_Start # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; XID_Start # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; XID_Start # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; XID_Start # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -8171,7 +8374,7 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 1A20..1A54 ; XID_Start # Lo [53] TAI THAM LETTER HIGH KA..TAI THAM LETTER GREAT SA 1AA7 ; XID_Start # Lm TAI THAM SIGN MAI YAMOK 1B05..1B33 ; XID_Start # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; XID_Start # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; XID_Start # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B83..1BA0 ; XID_Start # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BAE..1BAF ; XID_Start # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBA..1BE5 ; XID_Start # Lo [44] SUNDANESE AVAGRAHA..BATAK LETTER U @@ -8234,9 +8437,7 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 2160..2182 ; XID_Start # Nl [35] ROMAN NUMERAL ONE..ROMAN NUMERAL TEN THOUSAND 2183..2184 ; XID_Start # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 2185..2188 ; XID_Start # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND -2C00..2C2E ; XID_Start # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; XID_Start # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; XID_Start # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; XID_Start # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; XID_Start # Lm [2] LATIN SUBSCRIPT SMALL LETTER 
J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; XID_Start # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; XID_Start # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -8274,8 +8475,7 @@ E0100..E01EF ; ID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR 31A0..31BF ; XID_Start # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; XID_Start # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; XID_Start # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; XID_Start # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; XID_Start # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; XID_Start # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; XID_Start # Lm YI SYLLABLE WU A016..A48C ; XID_Start # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; XID_Start # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -8298,8 +8498,11 @@ A771..A787 ; XID_Start # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER A788 ; XID_Start # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; XID_Start # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; XID_Start # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; XID_Start # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; XID_Start # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; XID_Start # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; XID_Start # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; XID_Start # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; XID_Start # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; XID_Start # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q 
A7F5..A7F6 ; XID_Start # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; XID_Start # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; XID_Start # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -8414,9 +8617,20 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 104D8..104FB ; XID_Start # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; XID_Start # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; XID_Start # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; XID_Start # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; XID_Start # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; XID_Start # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; XID_Start # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; XID_Start # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; XID_Start # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; XID_Start # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; XID_Start # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; XID_Start # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; XID_Start # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; XID_Start # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; XID_Start # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; XID_Start # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; XID_Start # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; XID_Start # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; XID_Start # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; 
XID_Start # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -8452,9 +8666,12 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 10F00..10F1C ; XID_Start # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; XID_Start # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; XID_Start # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; XID_Start # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; XID_Start # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; XID_Start # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; XID_Start # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA +11071..11072 ; XID_Start # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; XID_Start # Lo BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; XID_Start # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110D0..110E8 ; XID_Start # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11103..11126 ; XID_Start # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -8496,6 +8713,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 11680..116AA ; XID_Start # Lo [43] TAKRI LETTER A..TAKRI LETTER RRA 116B8 ; XID_Start # Lo TAKRI LETTER ARCHAIC KHA 11700..1171A ; XID_Start # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; XID_Start # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; XID_Start # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 118A0..118DF ; XID_Start # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 118FF..11906 ; XID_Start # Lo [8] WARANG CITI OM..DIVES AKURU LETTER E @@ -8515,7 +8733,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 11A50 ; XID_Start # Lo SOYOMBO LETTER A 11A5C..11A89 ; XID_Start # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; XID_Start # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 
; XID_Start # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; XID_Start # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; XID_Start # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; XID_Start # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; XID_Start # Lo BHAIKSUKI SIGN AVAGRAHA @@ -8533,10 +8751,12 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 12000..12399 ; XID_Start # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; XID_Start # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; XID_Start # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; XID_Start # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; XID_Start # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; XID_Start # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; XID_Start # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; XID_Start # Lo [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; XID_Start # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; XID_Start # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; XID_Start # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B40..16B43 ; XID_Start # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM @@ -8551,7 +8771,10 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 17000..187F7 ; XID_Start # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; XID_Start # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; XID_Start # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; XID_Start # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; XID_Start # Lm 
[4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; XID_Start # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; XID_Start # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; XID_Start # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; XID_Start # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; XID_Start # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; XID_Start # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -8589,10 +8812,18 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1D78A..1D7A8 ; XID_Start # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7AA..1D7C2 ; XID_Start # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7CB ; XID_Start # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; XID_Start # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; XID_Start # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; XID_Start # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; XID_Start # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; XID_Start # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; XID_Start # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; XID_Start # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; XID_Start # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; XID_Start # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; XID_Start # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE 
HHWE +1E7ED..1E7EE ; XID_Start # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; XID_Start # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; XID_Start # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E900..1E943 ; XID_Start # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1E94B ; XID_Start # Lm ADLAM NASALIZATION MARK @@ -8629,15 +8860,15 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1EEA1..1EEA3 ; XID_Start # Lo [3] ARABIC MATHEMATICAL DOUBLE-STRUCK BEH..ARABIC MATHEMATICAL DOUBLE-STRUCK DAL 1EEA5..1EEA9 ; XID_Start # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 1EEAB..1EEBB ; XID_Start # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN -20000..2A6DD ; XID_Start # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; XID_Start # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; XID_Start # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; XID_Start # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; XID_Start # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; XID_Start # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; XID_Start # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; XID_Start # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; XID_Start # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 131459 +# Total code points: 131974 # ================================================ @@ -8738,9 +8969,12 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 0840..0858 ; XID_Continue # Lo [25] MANDAIC LETTER 
HALQA..MANDAIC LETTER AIN 0859..085B ; XID_Continue # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 0860..086A ; XID_Continue # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; XID_Continue # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; XID_Continue # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1 ; XID_Continue # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887 ; XID_Continue # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; XID_Continue # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0898..089F ; XID_Continue # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8 ; XID_Continue # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; XID_Continue # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; XID_Continue # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; XID_Continue # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; XID_Continue # Mc DEVANAGARI SIGN VISARGA 0904..0939 ; XID_Continue # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA @@ -8878,6 +9112,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 0C0E..0C10 ; XID_Continue # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28 ; XID_Continue # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39 ; XID_Continue # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C3C ; XID_Continue # Mn TELUGU SIGN NUKTA 0C3D ; XID_Continue # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40 ; XID_Continue # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; XID_Continue # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -8885,6 +9120,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 0C4A..0C4D ; XID_Continue # Mn [4] TELUGU VOWEL SIGN 
O..TELUGU SIGN VIRAMA 0C55..0C56 ; XID_Continue # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; XID_Continue # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; XID_Continue # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; XID_Continue # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; XID_Continue # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; XID_Continue # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -8906,7 +9142,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 0CCA..0CCB ; XID_Continue # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD ; XID_Continue # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6 ; XID_Continue # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; XID_Continue # Lo KANNADA LETTER FA +0CDD..0CDE ; XID_Continue # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; XID_Continue # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; XID_Continue # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; XID_Continue # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -9050,11 +9286,12 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 16A0..16EA ; XID_Continue # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; XID_Continue # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; XID_Continue # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; XID_Continue # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; XID_Continue # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; XID_Continue # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714 ; XID_Continue # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1720..1731 ; XID_Continue # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734 ; XID_Continue # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; 
XID_Continue # Mc TAGALOG SIGN PAMUDPOD +171F..1731 ; XID_Continue # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA +1732..1733 ; XID_Continue # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; XID_Continue # Mc HANUNOO SIGN PAMUDPOD 1740..1751 ; XID_Continue # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753 ; XID_Continue # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1760..176C ; XID_Continue # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA @@ -9073,6 +9310,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 17DD ; XID_Continue # Mn KHMER SIGN ATTHACAN 17E0..17E9 ; XID_Continue # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE 180B..180D ; XID_Continue # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; XID_Continue # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; XID_Continue # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; XID_Continue # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; XID_Continue # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -9120,7 +9358,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1A90..1A99 ; XID_Continue # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE 1AA7 ; XID_Continue # Lm TAI THAM SIGN MAI YAMOK 1AB0..1ABD ; XID_Continue # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW -1ABF..1AC0 ; XID_Continue # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; XID_Continue # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; XID_Continue # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; XID_Continue # Mc BALINESE SIGN BISAH 1B05..1B33 ; XID_Continue # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -9132,7 +9370,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1B3D..1B41 ; XID_Continue # Mc [5] BALINESE VOWEL 
SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; XID_Continue # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44 ; XID_Continue # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; XID_Continue # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; XID_Continue # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; XID_Continue # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B6B..1B73 ; XID_Continue # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B80..1B81 ; XID_Continue # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR @@ -9186,8 +9424,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 1D78 ; XID_Continue # Lm MODIFIER LETTER CYRILLIC EN 1D79..1D9A ; XID_Continue # L& [34] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF ; XID_Continue # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9 ; XID_Continue # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; XID_Continue # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; XID_Continue # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1F15 ; XID_Continue # L& [278] LATIN CAPITAL LETTER A WITH RING BELOW..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D ; XID_Continue # L& [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA 1F20..1F45 ; XID_Continue # L& [38] GREEK SMALL LETTER ETA WITH PSILI..GREEK SMALL LETTER OMICRON WITH DASIA AND OXIA @@ -9235,9 +9472,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 2160..2182 ; XID_Continue # Nl [35] ROMAN NUMERAL ONE..ROMAN NUMERAL TEN THOUSAND 2183..2184 ; XID_Continue # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER 
REVERSED C 2185..2188 ; XID_Continue # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND -2C00..2C2E ; XID_Continue # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; XID_Continue # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; XID_Continue # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; XID_Continue # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; XID_Continue # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; XID_Continue # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; XID_Continue # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -9281,8 +9516,7 @@ FFDA..FFDC ; XID_Start # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGU 31A0..31BF ; XID_Continue # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; XID_Continue # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; XID_Continue # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; XID_Continue # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; XID_Continue # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; XID_Continue # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; XID_Continue # Lm YI SYLLABLE WU A016..A48C ; XID_Continue # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; XID_Continue # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -9310,8 +9544,11 @@ A771..A787 ; XID_Continue # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETT A788 ; XID_Continue # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78B..A78E ; XID_Continue # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; XID_Continue # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; XID_Continue # L& [48] 
LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; XID_Continue # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; XID_Continue # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; XID_Continue # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; XID_Continue # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; XID_Continue # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; XID_Continue # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; XID_Continue # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; XID_Continue # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; XID_Continue # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -9496,9 +9733,20 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 104D8..104FB ; XID_Continue # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; XID_Continue # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; XID_Continue # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; XID_Continue # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; XID_Continue # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; XID_Continue # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; XID_Continue # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; XID_Continue # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; XID_Continue # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; XID_Continue # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; XID_Continue # L& [2] VITHKUQI SMALL LETTER 
Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; XID_Continue # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; XID_Continue # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; XID_Continue # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; XID_Continue # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; XID_Continue # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; XID_Continue # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; XID_Continue # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; XID_Continue # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; XID_Continue # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -9544,6 +9792,8 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 10F27 ; XID_Continue # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; XID_Continue # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 10F46..10F50 ; XID_Continue # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F70..10F81 ; XID_Continue # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85 ; XID_Continue # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 10FB0..10FC4 ; XID_Continue # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; XID_Continue # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11000 ; XID_Continue # Mc BRAHMI SIGN CANDRABINDU @@ -9552,6 +9802,10 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 11003..11037 ; XID_Continue # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA 11038..11046 ; XID_Continue # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA 11066..1106F ; XID_Continue # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070 ; XID_Continue # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072 ; XID_Continue # Lo [2] BRAHMI LETTER OLD 
TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; XID_Continue # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; XID_Continue # Lo BRAHMI LETTER OLD TAMIL LLA 1107F..11081 ; XID_Continue # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 11082 ; XID_Continue # Mc KAITHI SIGN VISARGA 11083..110AF ; XID_Continue # Lo [45] KAITHI LETTER A..KAITHI LETTER HA @@ -9559,6 +9813,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 110B3..110B6 ; XID_Continue # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; XID_Continue # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU 110B9..110BA ; XID_Continue # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; XID_Continue # Mn KAITHI VOWEL SIGN VOCALIC R 110D0..110E8 ; XID_Continue # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; XID_Continue # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE 11100..11102 ; XID_Continue # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA @@ -9684,6 +9939,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 11726 ; XID_Continue # Mc AHOM VOWEL SIGN E 11727..1172B ; XID_Continue # Mn [5] AHOM VOWEL SIGN AW..AHOM SIGN KILLER 11730..11739 ; XID_Continue # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +11740..11746 ; XID_Continue # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; XID_Continue # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; XID_Continue # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; XID_Continue # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -9734,7 +9990,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 11A97 ; XID_Continue # Mc SOYOMBO SIGN VISARGA 11A98..11A99 ; XID_Continue # Mn [2] SOYOMBO GEMINATION MARK..SOYOMBO SUBJOINER 11A9D ; XID_Continue # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; XID_Continue # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 
+11AB0..11AF8 ; XID_Continue # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; XID_Continue # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; XID_Continue # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; XID_Continue # Mc BHAIKSUKI VOWEL SIGN AA @@ -9780,11 +10036,14 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 12000..12399 ; XID_Continue # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; XID_Continue # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; XID_Continue # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; XID_Continue # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; XID_Continue # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; XID_Continue # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; XID_Continue # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; XID_Continue # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; XID_Continue # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16A70..16ABE ; XID_Continue # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; XID_Continue # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; XID_Continue # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4 ; XID_Continue # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B00..16B2F ; XID_Continue # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU @@ -9807,7 +10066,10 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 17000..187F7 ; XID_Continue # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; XID_Continue # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; XID_Continue # Lo [9] TANGUT 
IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; XID_Continue # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; XID_Continue # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; XID_Continue # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; XID_Continue # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; XID_Continue # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; XID_Continue # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; XID_Continue # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; XID_Continue # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -9816,6 +10078,8 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 1BC80..1BC88 ; XID_Continue # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; XID_Continue # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1BC9D..1BC9E ; XID_Continue # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; XID_Continue # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; XID_Continue # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D166 ; XID_Continue # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D167..1D169 ; XID_Continue # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; XID_Continue # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 @@ -9860,6 +10124,9 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 1DA84 ; XID_Continue # Mn SIGNWRITING LOCATION HEAD NECK 1DA9B..1DA9F ; XID_Continue # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING 
FILL MODIFIER-6 1DAA1..1DAAF ; XID_Continue # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09 ; XID_Continue # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; XID_Continue # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; XID_Continue # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006 ; XID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; XID_Continue # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; XID_Continue # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -9870,9 +10137,15 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 1E137..1E13D ; XID_Continue # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E140..1E149 ; XID_Continue # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; XID_Continue # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; XID_Continue # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE ; XID_Continue # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB ; XID_Continue # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF ; XID_Continue # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9 ; XID_Continue # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE +1E7E0..1E7E6 ; XID_Continue # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; XID_Continue # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; XID_Continue # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; XID_Continue # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; XID_Continue # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8D0..1E8D6 ; XID_Continue # Mn [7] 
MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E900..1E943 ; XID_Continue # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA @@ -9913,8 +10186,8 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 1EEA5..1EEA9 ; XID_Continue # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 1EEAB..1EEBB ; XID_Continue # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN 1FBF0..1FBF9 ; XID_Continue # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -20000..2A6DD ; XID_Continue # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; XID_Continue # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; XID_Continue # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; XID_Continue # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; XID_Continue # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; XID_Continue # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; XID_Continue # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 @@ -9922,7 +10195,7 @@ FFDA..FFDC ; XID_Continue # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HA 30000..3134A ; XID_Continue # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A E0100..E01EF ; XID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 134415 +# Total code points: 135053 # ================================================ @@ -9943,6 +10216,7 @@ E0100..E01EF ; XID_Continue # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTO 17B4..17B5 ; Default_Ignorable_Code_Point # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 180B..180D ; Default_Ignorable_Code_Point # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; 
Default_Ignorable_Code_Point # Cf MONGOLIAN VOWEL SEPARATOR +180F ; Default_Ignorable_Code_Point # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 200B..200F ; Default_Ignorable_Code_Point # Cf [5] ZERO WIDTH SPACE..RIGHT-TO-LEFT MARK 202A..202E ; Default_Ignorable_Code_Point # Cf [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE 2060..2064 ; Default_Ignorable_Code_Point # Cf [5] WORD JOINER..INVISIBLE PLUS @@ -9963,7 +10237,7 @@ E0080..E00FF ; Default_Ignorable_Code_Point # Cn [128] .... -# Total code points: 4173 +# Total code points: 4174 # ================================================ @@ -9997,7 +10271,8 @@ E01F0..E0FFF ; Default_Ignorable_Code_Point # Cn [3600] ............ @@ -3523,6 +3534,7 @@ FFE3 ; Expands_On_NFKC # Sk FULLWIDTH MACRON 17B4..17B5 ; NFKC_CF; # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 180B..180D ; NFKC_CF; # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; NFKC_CF; # Cf MONGOLIAN VOWEL SEPARATOR +180F ; NFKC_CF; # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1C80 ; NFKC_CF; 0432 # L& CYRILLIC SMALL LETTER ROUNDED VE 1C81 ; NFKC_CF; 0434 # L& CYRILLIC SMALL LETTER LONG-LEGGED DE 1C82 ; NFKC_CF; 043E # L& CYRILLIC SMALL LETTER NARROW O @@ -4318,6 +4330,7 @@ FFE3 ; Expands_On_NFKC # Sk FULLWIDTH MACRON 2C2C ; NFKC_CF; 2C5C # L& GLAGOLITIC CAPITAL LETTER SHTAPIC 2C2D ; NFKC_CF; 2C5D # L& GLAGOLITIC CAPITAL LETTER TROKUTASTI A 2C2E ; NFKC_CF; 2C5E # L& GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C2F ; NFKC_CF; 2C5F # L& GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; NFKC_CF; 2C61 # L& LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62 ; NFKC_CF; 026B # L& LATIN CAPITAL LETTER L WITH MIDDLE TILDE 2C63 ; NFKC_CF; 1D7D # L& LATIN CAPITAL LETTER P WITH STROKE @@ -5339,12 +5352,19 @@ A7B8 ; NFKC_CF; A7B9 # L& LATIN CAPITAL LETTER U WITH S A7BA ; NFKC_CF; A7BB # L& LATIN CAPITAL LETTER GLOTTAL A A7BC ; NFKC_CF; A7BD # L& LATIN CAPITAL LETTER GLOTTAL I A7BE ; NFKC_CF; A7BF # L& LATIN CAPITAL LETTER 
GLOTTAL U +A7C0 ; NFKC_CF; A7C1 # L& LATIN CAPITAL LETTER OLD POLISH O A7C2 ; NFKC_CF; A7C3 # L& LATIN CAPITAL LETTER ANGLICANA W A7C4 ; NFKC_CF; A794 # L& LATIN CAPITAL LETTER C WITH PALATAL HOOK A7C5 ; NFKC_CF; 0282 # L& LATIN CAPITAL LETTER S WITH HOOK A7C6 ; NFKC_CF; 1D8E # L& LATIN CAPITAL LETTER Z WITH PALATAL HOOK A7C7 ; NFKC_CF; A7C8 # L& LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; NFKC_CF; A7CA # L& LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; NFKC_CF; A7D1 # L& LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; NFKC_CF; A7D7 # L& LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; NFKC_CF; A7D9 # L& LATIN CAPITAL LETTER SIGMOID S +A7F2 ; NFKC_CF; 0063 # Lm MODIFIER LETTER CAPITAL C +A7F3 ; NFKC_CF; 0066 # Lm MODIFIER LETTER CAPITAL F +A7F4 ; NFKC_CF; 0071 # Lm MODIFIER LETTER CAPITAL Q A7F5 ; NFKC_CF; A7F6 # L& LATIN CAPITAL LETTER REVERSED HALF H A7F8 ; NFKC_CF; 0127 # Lm MODIFIER LETTER CAPITAL H WITH STROKE A7F9 ; NFKC_CF; 0153 # Lm MODIFIER LETTER SMALL LIGATURE OE @@ -6845,6 +6865,97 @@ FFF0..FFF8 ; NFKC_CF; # Cn [9] ...... -# Total code points: 10329 +# Total code points: 10429 # ================================================ @@ -9164,6 +9275,7 @@ E01F0..E0FFF ; NFKC_CF; # Cn [3600] ...... 
10400..10427 ; Changes_When_NFKC_Casefolded # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; Changes_When_NFKC_Casefolded # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Changes_When_NFKC_Casefolded # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Changes_When_NFKC_Casefolded # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Changes_When_NFKC_Casefolded # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Changes_When_NFKC_Casefolded # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10781..10785 ; Changes_When_NFKC_Casefolded # Lm [5] MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Changes_When_NFKC_Casefolded # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Changes_When_NFKC_Casefolded # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10C80..10CB2 ; Changes_When_NFKC_Casefolded # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Changes_When_NFKC_Casefolded # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Changes_When_NFKC_Casefolded # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y @@ -9824,6 +9948,6 @@ E0080..E00FF ; Changes_When_NFKC_Casefolded # Cn [128] .... -# Total code points: 10329 +# Total code points: 10429 # EOF diff --git a/lib/unicore/EastAsianWidth.txt b/lib/unicore/EastAsianWidth.txt index b43aec9273..e04f705178 100644 --- a/lib/unicore/EastAsianWidth.txt +++ b/lib/unicore/EastAsianWidth.txt @@ -1,11 +1,11 @@ -# EastAsianWidth-13.0.0.txt -# Date: 2020-01-21, 18:14:00 GMT [KW, LI] -# © 2020 Unicode®, Inc. +# EastAsianWidth-14.0.0.txt +# Date: 2021-07-06, 09:58:53 GMT [KW, LI] +# © 2021 Unicode®, Inc.
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # East_Asian_Width Property # @@ -37,7 +37,7 @@ # with ranges of code points, the code point count in square brackets. # # For more information, see UAX #11: East Asian Width, -# at http://www.unicode.org/reports/tr11/ +# at https://www.unicode.org/reports/tr11/ # # @missing: 0000..10FFFF; N 0000..001F;N # Cc [32] .. @@ -273,7 +273,7 @@ 0610..061A;N # Mn [11] ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA 061B;N # Po ARABIC SEMICOLON 061C;N # Cf ARABIC LETTER MARK -061E..061F;N # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F;N # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F;N # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640;N # Lm ARABIC TATWEEL 0641..064A;N # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -331,9 +331,14 @@ 0859..085B;N # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 085E;N # Po MANDAIC PUNCTUATION 0860..086A;N # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4;N # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7;N # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1;N # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887;N # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888;N # Sk ARABIC RAISED ROUND DOT +0889..088E;N # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891;N # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 
+0898..089F;N # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8;N # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9;N # Lm ARABIC SMALL FARSI YEH +08CA..08E1;N # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E2;N # Cf ARABIC DISPUTED END OF AYAH 08E3..08FF;N # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA 0900..0902;N # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA @@ -490,6 +495,7 @@ 0C0E..0C10;N # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28;N # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39;N # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C3C;N # Mn TELUGU SIGN NUKTA 0C3D;N # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40;N # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44;N # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -497,6 +503,7 @@ 0C4A..0C4D;N # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56;N # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A;N # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D;N # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61;N # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63;N # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F;N # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -522,7 +529,7 @@ 0CCA..0CCB;N # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD;N # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6;N # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE;N # Lo KANNADA LETTER FA +0CDD..0CDE;N # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1;N # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3;N # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF;N # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -709,11 +716,13 @@ 16EB..16ED;N # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0;N # Nl [3] 
RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8;N # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C;N # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711;N # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711;N # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714;N # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA +1715;N # Mc TAGALOG SIGN PAMUDPOD +171F;N # Lo TAGALOG LETTER ARCHAIC RA 1720..1731;N # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734;N # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733;N # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734;N # Mc HANUNOO SIGN PAMUDPOD 1735..1736;N # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 1740..1751;N # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753;N # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U @@ -741,6 +750,7 @@ 1807..180A;N # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU 180B..180D;N # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E;N # Cf MONGOLIAN VOWEL SEPARATOR +180F;N # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819;N # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842;N # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843;N # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -796,7 +806,7 @@ 1AA8..1AAD;N # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1AB0..1ABD;N # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE;N # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0;N # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE;N # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03;N # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04;N # Mc BALINESE SIGN BISAH 1B05..1B33;N # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -808,12 +818,13 @@ 1B3D..1B41;N # Mc [5] BALINESE VOWEL SIGN LA LENGA 
TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42;N # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44;N # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B;N # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C;N # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59;N # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60;N # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A;N # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B6B..1B73;N # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B74..1B7C;N # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E;N # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B80..1B81;N # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82;N # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0;N # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -872,8 +883,7 @@ 1D79..1D7F;N # Ll [7] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER UPSILON WITH STROKE 1D80..1D9A;N # Ll [27] LATIN SMALL LETTER B WITH PALATAL HOOK..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF;N # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9;N # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF;N # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF;N # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1EFF;N # L& [256] LATIN CAPITAL LETTER A WITH RING BELOW..LATIN SMALL LETTER Y WITH LOOP 1F00..1F15;N # L& [22] GREEK SMALL LETTER ALPHA WITH PSILI..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D;N # Lu [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA @@ -965,7 +975,7 @@ 20A9;H # Sc WON SIGN 20AA..20AB;N # Sc [2] NEW SHEQEL SIGN..DONG SIGN 20AC;A # Sc 
EURO SIGN -20AD..20BF;N # Sc [19] KIP SIGN..BITCOIN SIGN +20AD..20C0;N # Sc [20] KIP SIGN..SOM SIGN 20D0..20DC;N # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0;N # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E1;N # Mn COMBINING LEFT RIGHT ARROW ABOVE @@ -1338,8 +1348,7 @@ 2B5A..2B73;N # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR 2B76..2B95;N # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW 2B97..2BFF;N # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL -2C00..2C2E;N # Lu [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E;N # Ll [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C00..2C5F;N # L& [96] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C60..2C7B;N # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D;N # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2C7F;N # Lu [2] LATIN CAPITAL LETTER S WITH SWASH TAIL..LATIN CAPITAL LETTER Z WITH SWASH TAIL @@ -1407,7 +1416,16 @@ 2E42;N # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F;N # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51;N # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52;N # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54;N # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55;N # Ps LEFT SQUARE BRACKET WITH STROKE +2E56;N # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57;N # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58;N # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59;N # Ps TOP HALF LEFT PARENTHESIS +2E5A;N # Pe TOP HALF RIGHT PARENTHESIS +2E5B;N # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C;N # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D;N # Pd OBLIQUE HYPHEN 2E80..2E99;W # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3;W # So [89] CJK RADICAL CHOKE..CJK 
RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5;W # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1485,8 +1503,7 @@ 3300..33FF;W # So [256] SQUARE APAATO..SQUARE GAL 3400..4DBF;W # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF 4DC0..4DFF;N # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION -4E00..9FFC;W # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -9FFD..9FFF;W # Cn [3] .. +4E00..9FFF;W # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF A000..A014;W # Lo [21] YI SYLLABLE IT..YI SYLLABLE E A015;W # Lm YI SYLLABLE WU A016..A48C;W # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR @@ -1525,8 +1542,11 @@ A788;N # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A;N # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E;N # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F;N # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF;N # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA;N # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA;N # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1;N # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3;N # Ll LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9;N # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4;N # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6;N # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7;N # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9;N # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -1682,15 +1702,17 @@ FB40..FB41;N # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAMEK FB43..FB44;N # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH FB46..FB4F;N 
# Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE ALEF LAMED FB50..FBB1;N # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1;N # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2;N # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D;N # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM FD3E;N # Pe ORNATE LEFT PARENTHESIS FD3F;N # Ps ORNATE RIGHT PARENTHESIS +FD40..FD4F;N # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F;N # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7;N # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF;N # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB;N # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC;N # Sc RIAL SIGN -FDFD;N # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF;N # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE00..FE0F;A # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 FE10..FE16;W # Po [7] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL QUESTION MARK FE17;W # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET @@ -1839,9 +1861,20 @@ FFFD;A # So REPLACEMENT CHARACTER 10500..10527;N # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563;N # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F;N # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A;N # Lu [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A;N # Lu [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592;N # Lu [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595;N # Lu [2] VITHKUQI CAPITAL LETTER 
Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1;N # Ll [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1;N # Ll [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9;N # Ll [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC;N # Ll [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736;N # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755;N # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767;N # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785;N # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0;N # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA;N # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805;N # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808;N # Lo CYPRIOT SYLLABLE JO 1080A..10835;N # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1920,6 +1953,9 @@ FFFD;A # So REPLACEMENT CHARACTER 10F46..10F50;N # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 10F51..10F54;N # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59;N # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81;N # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85;N # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +10F86..10F89;N # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4;N # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB;N # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6;N # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH @@ -1931,6 +1967,10 @@ FFFD;A # So REPLACEMENT CHARACTER 11047..1104D;N # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065;N # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F;N # Nd [10] BRAHMI 
DIGIT ZERO..BRAHMI DIGIT NINE +11070;N # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072;N # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074;N # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075;N # Lo BRAHMI LETTER OLD TAMIL LLA 1107F;N # Mn BRAHMI NUMBER JOINER 11080..11081;N # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA 11082;N # Mc KAITHI SIGN VISARGA @@ -1942,6 +1982,7 @@ FFFD;A # So REPLACEMENT CHARACTER 110BB..110BC;N # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD;N # Cf KAITHI NUMBER SIGN 110BE..110C1;N # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA +110C2;N # Mn KAITHI VOWEL SIGN VOCALIC R 110CD;N # Cf KAITHI NUMBER SIGN ABOVE 110D0..110E8;N # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9;N # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE @@ -2076,6 +2117,7 @@ FFFD;A # So REPLACEMENT CHARACTER 116B6;N # Mc TAKRI SIGN VIRAMA 116B7;N # Mn TAKRI SIGN NUKTA 116B8;N # Lo TAKRI LETTER ARCHAIC KHA +116B9;N # Po TAKRI ABBREVIATION SIGN 116C0..116C9;N # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A;N # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 1171D..1171F;N # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA @@ -2087,6 +2129,7 @@ FFFD;A # So REPLACEMENT CHARACTER 1173A..1173B;N # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E;N # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F;N # So AHOM SYMBOL VI +11740..11746;N # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B;N # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E;N # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837;N # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -2145,6 +2188,7 @@ FFFD;A # So REPLACEMENT CHARACTER 11A9A..11A9C;N # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD 11A9D;N # Lo SOYOMBO MARK PLUTA 11A9E..11AA2;N # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE 
FLAME..SOYOMBO TERMINAL MARK-2 +11AB0..11ABF;N # Lo [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA 11AC0..11AF8;N # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08;N # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E;N # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA @@ -2201,6 +2245,8 @@ FFFD;A # So REPLACEMENT CHARACTER 12400..1246E;N # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474;N # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543;N # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0;N # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2;N # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..1342E;N # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 13430..13438;N # Cf [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT 14400..14646;N # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 @@ -2208,6 +2254,8 @@ FFFD;A # So REPLACEMENT CHARACTER 16A40..16A5E;N # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69;N # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F;N # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE;N # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9;N # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED;N # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4;N # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16AF5;N # Po BASSA VAH FULL STOP @@ -2240,8 +2288,11 @@ FFFD;A # So REPLACEMENT CHARACTER 18800..18AFF;W # Lo [768] TANGUT COMPONENT-001..TANGUT COMPONENT-768 18B00..18CD5;W # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08;W # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 +1AFF0..1AFF3;W # Lm [4] KATAKANA LETTER MINNAN 
TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB;W # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE;W # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1B000..1B0FF;W # Lo [256] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER RE-2 -1B100..1B11E;W # Lo [31] HENTAIGANA LETTER RE-3..HENTAIGANA LETTER N-MU-MO-2 +1B100..1B122;W # Lo [35] HENTAIGANA LETTER RE-3..KATAKANA LETTER ARCHAIC WU 1B150..1B152;W # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167;W # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB;W # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -2253,6 +2304,9 @@ FFFD;A # So REPLACEMENT CHARACTER 1BC9D..1BC9E;N # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BC9F;N # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1BCA0..1BCA3;N # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D;N # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46;N # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF50..1CFC3;N # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5;N # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126;N # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164;N # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -2266,7 +2320,7 @@ FFFD;A # So REPLACEMENT CHARACTER 1D185..1D18B;N # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D18C..1D1A9;N # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 1D1AA..1D1AD;N # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -1D1AE..1D1E8;N # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA;N # So [61] MUSICAL SYMBOL 
PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241;N # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D242..1D244;N # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME 1D245;N # So GREEK MUSICAL LEIMMA @@ -2326,6 +2380,9 @@ FFFD;A # So REPLACEMENT CHARACTER 1DA87..1DA8B;N # Po [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS 1DA9B..1DA9F;N # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA1..1DAAF;N # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09;N # Ll [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A;N # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E;N # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006;N # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018;N # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021;N # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -2337,10 +2394,16 @@ FFFD;A # So REPLACEMENT CHARACTER 1E140..1E149;N # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E;N # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F;N # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD;N # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE;N # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB;N # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF;N # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9;N # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1E2FF;N # Sc WANCHO NGUN SIGN +1E7E0..1E7E6;N # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB;N # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE;N # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE;N # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4;N # Lo 
[197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF;N # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E8D0..1E8D6;N # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS @@ -2465,6 +2528,7 @@ FFFD;A # So REPLACEMENT CHARACTER 1F6D0..1F6D2;W # So [3] PLACE OF WORSHIP..SHOPPING TROLLEY 1F6D3..1F6D4;N # So [2] STUPA..PAGODA 1F6D5..1F6D7;W # So [3] HINDU TEMPLE..ELEVATOR +1F6DD..1F6DF;W # So [3] PLAYGROUND SLIDE..RING BUOY 1F6E0..1F6EA;N # So [11] HAMMER AND WRENCH..NORTHEAST-POINTING AIRPLANE 1F6EB..1F6EC;W # So [2] AIRPLANE DEPARTURE..AIRPLANE ARRIVING 1F6F0..1F6F3;N # So [4] SATELLITE..PASSENGER SHIP @@ -2472,6 +2536,7 @@ FFFD;A # So REPLACEMENT CHARACTER 1F700..1F773;N # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE 1F780..1F7D8;N # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB;W # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0;W # So HEAVY EQUALS SIGN 1F800..1F80B;N # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847;N # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859;N # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW @@ -2483,25 +2548,25 @@ FFFD;A # So REPLACEMENT CHARACTER 1F93B;N # So MODERN PENTATHLON 1F93C..1F945;W # So [10] WRESTLERS..GOAL NET 1F946;N # So RIFLE -1F947..1F978;W # So [50] FIRST PLACE MEDAL..DISGUISED FACE -1F97A..1F9CB;W # So [82] FACE WITH PLEADING EYES..BUBBLE TEA -1F9CD..1F9FF;W # So [51] STANDING PERSON..NAZAR AMULET +1F947..1F9FF;W # So [185] FIRST PLACE MEDAL..NAZAR AMULET 1FA00..1FA53;N # So [84] NEUTRAL CHESS KING..BLACK CHESS KNIGHT-BISHOP 1FA60..1FA6D;N # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA74;W # So [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A;W # So [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C;W # So [5] DROP OF BLOOD..CRUTCH 
1FA80..1FA86;W # So [7] YO-YO..NESTING DOLLS -1FA90..1FAA8;W # So [25] RINGED PLANET..ROCK -1FAB0..1FAB6;W # So [7] FLY..FEATHER -1FAC0..1FAC2;W # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6;W # So [7] BLUEBERRIES..TEAPOT +1FA90..1FAAC;W # So [29] RINGED PLANET..HAMSA +1FAB0..1FABA;W # So [11] FLY..NEST WITH EGGS +1FAC0..1FAC5;W # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9;W # So [10] BLUEBERRIES..JAR +1FAE0..1FAE7;W # So [8] MELTING FACE..BUBBLES +1FAF0..1FAF6;W # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92;N # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA;N # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON 1FBF0..1FBF9;N # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -20000..2A6DD;W # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A6DE..2A6FF;W # Cn [34] .. -2A700..2B734;W # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 -2B735..2B73F;W # Cn [11] .. +20000..2A6DF;W # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A6E0..2A6FF;W # Cn [32] .. +2A700..2B738;W # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 +2B739..2B73F;W # Cn [7] .. 2B740..2B81D;W # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F;W # Cn [2] .. 2B820..2CEA1;W # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 diff --git a/lib/unicore/EmojiSources.txt b/lib/unicore/EmojiSources.txt index b2a526160c..391a7e0750 100644 --- a/lib/unicore/EmojiSources.txt +++ b/lib/unicore/EmojiSources.txt @@ -1,6 +1,6 @@ -# EmojiSources-13.0.0.txt -# Date: 2019-09-09, 19:40:00 GMT [MS, KW] -# © 2019 Unicode®, Inc. +# EmojiSources-14.0.0.txt +# Date: 2021-03-16, 21:39:00 GMT [MS, KW] +# © 2021 Unicode®, Inc. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database diff --git a/lib/unicore/EquivalentUnifiedIdeograph.txt b/lib/unicore/EquivalentUnifiedIdeograph.txt index 98dc294b19..340ec3a71e 100644 --- a/lib/unicore/EquivalentUnifiedIdeograph.txt +++ b/lib/unicore/EquivalentUnifiedIdeograph.txt @@ -1,6 +1,6 @@ -# EquivalentUnifiedIdeograph-13.0.0.txt -# Date: 2019-09-09, 19:41:00 GMT [KL, KW] -# © 2019 Unicode®, Inc. +# EquivalentUnifiedIdeograph-14.0.0.txt +# Date: 2021-03-16, 21:41:00 GMT [KL, KW] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/HangulSyllableType.txt b/lib/unicore/HangulSyllableType.txt index 90aa56964e..8e7ca091f6 100644 --- a/lib/unicore/HangulSyllableType.txt +++ b/lib/unicore/HangulSyllableType.txt @@ -1,6 +1,6 @@ -# HangulSyllableType-13.0.0.txt -# Date: 2019-09-08, 23:31:10 GMT -# © 2019 Unicode®, Inc. +# HangulSyllableType-14.0.0.txt +# Date: 2021-03-08, 19:35:46 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/IdStatus.txt b/lib/unicore/IdStatus.txt index e699176ca9..29043bc846 100644 --- a/lib/unicore/IdStatus.txt +++ b/lib/unicore/IdStatus.txt @@ -1,11 +1,11 @@ # IdentifierStatus.txt -# Date: 2020-02-07, 22:02:47 GMT -# © 2020 Unicode®, Inc. +# Date: 2021-08-12, 01:13:34 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 13.0.0 +# Version: 14.0.0 # # For documentation and usage, see http://www.unicode.org/reports/tr39 # @@ -140,12 +140,16 @@ 076E..077F ; Allowed # 5.1 [18] ARABIC LETTER HAH WITH SMALL ARABIC LETTER TAH BELOW..ARABIC LETTER KAF WITH TWO DOTS ABOVE 0780..07B0 ; Allowed # 3.0 [49] THAANA LETTER HAA..THAANA SUKUN 07B1 ; Allowed # 3.2 THAANA LETTER NAA +0870..0887 ; Allowed # 14.0 [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; Allowed # 14.0 [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL 08A0 ; Allowed # 6.1 ARABIC LETTER BEH WITH SMALL V BELOW 08A1 ; Allowed # 7.0 ARABIC LETTER BEH WITH HAMZA ABOVE 08A2..08AC ; Allowed # 6.1 [11] ARABIC LETTER JEEM WITH TWO DOTS ABOVE..ARABIC LETTER ROHINGYA YEH 08B2 ; Allowed # 7.0 ARABIC LETTER ZAIN WITH INVERTED V ABOVE +08B5 ; Allowed # 14.0 ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE 08B6..08BD ; Allowed # 9.0 [8] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER AFRICAN NOON 08BE..08C7 ; Allowed # 13.0 [10] ARABIC LETTER PEH WITH SMALL V..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +08C8..08C9 ; Allowed # 14.0 [2] ARABIC LETTER GRAF..ARABIC SMALL FARSI YEH 0901..0903 ; Allowed # 1.1 [3] DEVANAGARI SIGN CANDRABINDU..DEVANAGARI SIGN VISARGA 0904 ; Allowed # 4.0 DEVANAGARI LETTER SHORT A 0905..0939 ; Allowed # 1.1 [53] DEVANAGARI LETTER A..DEVANAGARI LETTER HA @@ -254,11 +258,13 @@ 0C12..0C28 ; Allowed # 1.1 [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C33 ; Allowed # 1.1 [10] TELUGU LETTER PA..TELUGU LETTER LLA 0C35..0C39 ; Allowed # 1.1 [5] TELUGU LETTER VA..TELUGU LETTER HA +0C3C ; Allowed # 14.0 TELUGU SIGN NUKTA 0C3D ; Allowed # 5.1 TELUGU SIGN AVAGRAHA 0C3E..0C44 ; Allowed # 1.1 [7] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN VOCALIC RR 0C46..0C48 ; Allowed # 1.1 [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; Allowed # 
1.1 [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; Allowed # 1.1 [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C5D ; Allowed # 14.0 TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; Allowed # 1.1 [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C66..0C6F ; Allowed # 1.1 [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE 0C80 ; Allowed # 9.0 KANNADA SIGN SPACING CANDRABINDU @@ -273,6 +279,7 @@ 0CC6..0CC8 ; Allowed # 1.1 [3] KANNADA VOWEL SIGN E..KANNADA VOWEL SIGN AI 0CCA..0CCD ; Allowed # 1.1 [4] KANNADA VOWEL SIGN O..KANNADA SIGN VIRAMA 0CD5..0CD6 ; Allowed # 1.1 [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CDD ; Allowed # 14.0 KANNADA LETTER NAKAARA POLLU 0CE0..0CE1 ; Allowed # 1.1 [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; Allowed # 5.0 [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; Allowed # 1.1 [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -434,7 +441,8 @@ 1780..17A2 ; Allowed # 3.0 [35] KHMER LETTER KA..KHMER LETTER QA 17A5..17A7 ; Allowed # 3.0 [3] KHMER INDEPENDENT VOWEL QI..KHMER INDEPENDENT VOWEL QU 17A9..17B3 ; Allowed # 3.0 [11] KHMER INDEPENDENT VOWEL QUU..KHMER INDEPENDENT VOWEL QAU -17B6..17CA ; Allowed # 3.0 [21] KHMER VOWEL SIGN AA..KHMER SIGN TRIISAP +17B6..17CD ; Allowed # 3.0 [24] KHMER VOWEL SIGN AA..KHMER SIGN TOANDAKHIAT +17D0 ; Allowed # 3.0 KHMER SIGN SAMYOK SANNYA 17D2 ; Allowed # 3.0 KHMER SIGN COENG 17D7 ; Allowed # 3.0 KHMER SIGN LEK TOO 17DC ; Allowed # 3.0 KHMER SIGN AVAKRAHASANYA @@ -514,6 +522,7 @@ 9FD6..9FEA ; Allowed # 10.0 [21] CJK UNIFIED IDEOGRAPH-9FD6..CJK UNIFIED IDEOGRAPH-9FEA 9FEB..9FEF ; Allowed # 11.0 [5] CJK UNIFIED IDEOGRAPH-9FEB..CJK UNIFIED IDEOGRAPH-9FEF 9FF0..9FFC ; Allowed # 13.0 [13] CJK UNIFIED IDEOGRAPH-9FF0..CJK UNIFIED IDEOGRAPH-9FFC +9FFD..9FFF ; Allowed # 14.0 [3] CJK UNIFIED IDEOGRAPH-9FFD..CJK UNIFIED IDEOGRAPH-9FFF A67F ; Allowed # 5.1 CYRILLIC PAYEROK A717..A71A ; Allowed # 5.0 [4] MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOWER 
RIGHT CORNER ANGLE A71B..A71F ; Allowed # 5.1 [5] MODIFIER LETTER RAISED UP ARROW..MODIFIER LETTER LOW INVERTED EXCLAMATION MARK @@ -523,8 +532,12 @@ A792..A793 ; Allowed # 6.1 [2] LATIN CAPITAL LETTER C WITH BAR..LATIN S A7AA ; Allowed # 6.1 LATIN CAPITAL LETTER H WITH HOOK A7AE ; Allowed # 9.0 LATIN CAPITAL LETTER SMALL CAPITAL I A7B8..A7B9 ; Allowed # 11.0 [2] LATIN CAPITAL LETTER U WITH STROKE..LATIN SMALL LETTER U WITH STROKE +A7C0..A7C1 ; Allowed # 14.0 [2] LATIN CAPITAL LETTER OLD POLISH O..LATIN SMALL LETTER OLD POLISH O A7C2..A7C6 ; Allowed # 12.0 [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK A7C7..A7CA ; Allowed # 13.0 [4] LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Allowed # 14.0 [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Allowed # 14.0 LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; Allowed # 14.0 [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S A9E7..A9FE ; Allowed # 7.0 [24] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING BHA AA60..AA76 ; Allowed # 5.2 [23] MYANMAR LETTER KHAMTI GA..MYANMAR LOGOGRAM KHAMTI HM AA7A..AA7B ; Allowed # 5.2 [2] MYANMAR LETTER AITON RA..MYANMAR SIGN PAO KAREN TONE @@ -548,14 +561,22 @@ FA27..FA29 ; Allowed # 1.1 [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK CO 1133B ; Allowed # 11.0 COMBINING BINDU BELOW 1133C ; Allowed # 7.0 GRANTHA SIGN NUKTA 16FF0..16FF1 ; Allowed # 13.0 [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY +1B11F..1B122 ; Allowed # 14.0 [4] HIRAGANA LETTER ARCHAIC WU..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; Allowed # 12.0 [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; Allowed # 12.0 [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N +1DF00..1DF1E ; Allowed # 14.0 [31] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL +1E7E0..1E7E6 ; Allowed # 14.0 [7] ETHIOPIC 
SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; Allowed # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; Allowed # 14.0 [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; Allowed # 14.0 [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 20000..2A6D6 ; Allowed # 3.1 [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6 2A6D7..2A6DD ; Allowed # 13.0 [7] CJK UNIFIED IDEOGRAPH-2A6D7..CJK UNIFIED IDEOGRAPH-2A6DD +2A6DE..2A6DF ; Allowed # 14.0 [2] CJK UNIFIED IDEOGRAPH-2A6DE..CJK UNIFIED IDEOGRAPH-2A6DF 2A700..2B734 ; Allowed # 5.2 [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +2B735..2B738 ; Allowed # 14.0 [4] CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Allowed # 6.0 [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Allowed # 8.0 [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Allowed # 10.0 [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 30000..3134A ; Allowed # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 107835 +# Total code points: 107957 diff --git a/lib/unicore/IdType.txt b/lib/unicore/IdType.txt index f71717465a..dc2f735451 100644 --- a/lib/unicore/IdType.txt +++ b/lib/unicore/IdType.txt @@ -1,11 +1,11 @@ # IdentifierType.txt -# Date: 2020-02-07, 22:02:47 GMT -# © 2020 Unicode®, Inc. +# Date: 2021-08-12, 01:13:33 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Security Mechanisms for UTS #39 -# Version: 13.0.0 +# Version: 14.0.0 # # For documentation and usage, see http://www.unicode.org/reports/tr39 # @@ -137,12 +137,16 @@ 076E..077F ; Recommended # 5.1 [18] ARABIC LETTER HAH WITH SMALL ARABIC LETTER TAH BELOW..ARABIC LETTER KAF WITH TWO DOTS ABOVE 0780..07B0 ; Recommended # 3.0 [49] THAANA LETTER HAA..THAANA SUKUN 07B1 ; Recommended # 3.2 THAANA LETTER NAA +0870..0887 ; Recommended # 14.0 [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; Recommended # 14.0 [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL 08A0 ; Recommended # 6.1 ARABIC LETTER BEH WITH SMALL V BELOW 08A1 ; Recommended # 7.0 ARABIC LETTER BEH WITH HAMZA ABOVE 08A2..08AC ; Recommended # 6.1 [11] ARABIC LETTER JEEM WITH TWO DOTS ABOVE..ARABIC LETTER ROHINGYA YEH 08B2 ; Recommended # 7.0 ARABIC LETTER ZAIN WITH INVERTED V ABOVE +08B5 ; Recommended # 14.0 ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE 08B6..08BD ; Recommended # 9.0 [8] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER AFRICAN NOON 08BE..08C7 ; Recommended # 13.0 [10] ARABIC LETTER PEH WITH SMALL V..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +08C8..08C9 ; Recommended # 14.0 [2] ARABIC LETTER GRAF..ARABIC SMALL FARSI YEH 0901..0903 ; Recommended # 1.1 [3] DEVANAGARI SIGN CANDRABINDU..DEVANAGARI SIGN VISARGA 0904 ; Recommended # 4.0 DEVANAGARI LETTER SHORT A 0905..0939 ; Recommended # 1.1 [53] DEVANAGARI LETTER A..DEVANAGARI LETTER HA @@ -251,11 +255,13 @@ 0C12..0C28 ; Recommended # 1.1 [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C33 ; Recommended # 1.1 [10] TELUGU LETTER PA..TELUGU LETTER LLA 0C35..0C39 ; Recommended # 1.1 [5] TELUGU LETTER VA..TELUGU LETTER HA +0C3C ; Recommended # 14.0 TELUGU SIGN NUKTA 0C3D ; Recommended # 5.1 TELUGU SIGN AVAGRAHA 0C3E..0C44 ; Recommended # 1.1 [7] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN VOCALIC RR 0C46..0C48 
; Recommended # 1.1 [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; Recommended # 1.1 [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; Recommended # 1.1 [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK +0C5D ; Recommended # 14.0 TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; Recommended # 1.1 [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C66..0C6F ; Recommended # 1.1 [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE 0C80 ; Recommended # 9.0 KANNADA SIGN SPACING CANDRABINDU @@ -270,6 +276,7 @@ 0CC6..0CC8 ; Recommended # 1.1 [3] KANNADA VOWEL SIGN E..KANNADA VOWEL SIGN AI 0CCA..0CCD ; Recommended # 1.1 [4] KANNADA VOWEL SIGN O..KANNADA SIGN VIRAMA 0CD5..0CD6 ; Recommended # 1.1 [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK +0CDD ; Recommended # 14.0 KANNADA LETTER NAKAARA POLLU 0CE0..0CE1 ; Recommended # 1.1 [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; Recommended # 5.0 [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; Recommended # 1.1 [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -430,7 +437,8 @@ 1780..17A2 ; Recommended # 3.0 [35] KHMER LETTER KA..KHMER LETTER QA 17A5..17A7 ; Recommended # 3.0 [3] KHMER INDEPENDENT VOWEL QI..KHMER INDEPENDENT VOWEL QU 17A9..17B3 ; Recommended # 3.0 [11] KHMER INDEPENDENT VOWEL QUU..KHMER INDEPENDENT VOWEL QAU -17B6..17CA ; Recommended # 3.0 [21] KHMER VOWEL SIGN AA..KHMER SIGN TRIISAP +17B6..17CD ; Recommended # 3.0 [24] KHMER VOWEL SIGN AA..KHMER SIGN TOANDAKHIAT +17D0 ; Recommended # 3.0 KHMER SIGN SAMYOK SANNYA 17D2 ; Recommended # 3.0 KHMER SIGN COENG 17D7 ; Recommended # 3.0 KHMER SIGN LEK TOO 17DC ; Recommended # 3.0 KHMER SIGN AVAKRAHASANYA @@ -506,6 +514,7 @@ 9FD6..9FEA ; Recommended # 10.0 [21] CJK UNIFIED IDEOGRAPH-9FD6..CJK UNIFIED IDEOGRAPH-9FEA 9FEB..9FEF ; Recommended # 11.0 [5] CJK UNIFIED IDEOGRAPH-9FEB..CJK UNIFIED IDEOGRAPH-9FEF 9FF0..9FFC ; Recommended # 13.0 [13] CJK UNIFIED IDEOGRAPH-9FF0..CJK UNIFIED IDEOGRAPH-9FFC +9FFD..9FFF ; Recommended # 
14.0 [3] CJK UNIFIED IDEOGRAPH-9FFD..CJK UNIFIED IDEOGRAPH-9FFF A67F ; Recommended # 5.1 CYRILLIC PAYEROK A717..A71A ; Recommended # 5.0 [4] MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOWER RIGHT CORNER ANGLE A71B..A71F ; Recommended # 5.1 [5] MODIFIER LETTER RAISED UP ARROW..MODIFIER LETTER LOW INVERTED EXCLAMATION MARK @@ -515,8 +524,12 @@ A792..A793 ; Recommended # 6.1 [2] LATIN CAPITAL LETTER A7AA ; Recommended # 6.1 LATIN CAPITAL LETTER H WITH HOOK A7AE ; Recommended # 9.0 LATIN CAPITAL LETTER SMALL CAPITAL I A7B8..A7B9 ; Recommended # 11.0 [2] LATIN CAPITAL LETTER U WITH STROKE..LATIN SMALL LETTER U WITH STROKE +A7C0..A7C1 ; Recommended # 14.0 [2] LATIN CAPITAL LETTER OLD POLISH O..LATIN SMALL LETTER OLD POLISH O A7C2..A7C6 ; Recommended # 12.0 [5] LATIN CAPITAL LETTER ANGLICANA W..LATIN CAPITAL LETTER Z WITH PALATAL HOOK A7C7..A7CA ; Recommended # 13.0 [4] LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Recommended # 14.0 [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Recommended # 14.0 LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; Recommended # 14.0 [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S A9E7..A9FE ; Recommended # 7.0 [24] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING BHA AA60..AA76 ; Recommended # 5.2 [23] MYANMAR LETTER KHAMTI GA..MYANMAR LOGOGRAM KHAMTI HM AA7A..AA7B ; Recommended # 5.2 [2] MYANMAR LETTER AITON RA..MYANMAR SIGN PAO KAREN TONE @@ -540,17 +553,25 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID 1133B ; Recommended # 11.0 COMBINING BINDU BELOW 1133C ; Recommended # 7.0 GRANTHA SIGN NUKTA 16FF0..16FF1 ; Recommended # 13.0 [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY +1B11F..1B122 ; Recommended # 14.0 [4] HIRAGANA LETTER ARCHAIC WU..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; Recommended # 12.0 [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 
1B164..1B167 ; Recommended # 12.0 [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N +1DF00..1DF1E ; Recommended # 14.0 [31] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER S WITH CURL +1E7E0..1E7E6 ; Recommended # 14.0 [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; Recommended # 14.0 [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; Recommended # 14.0 [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; Recommended # 14.0 [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 20000..2A6D6 ; Recommended # 3.1 [42711] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6D6 2A6D7..2A6DD ; Recommended # 13.0 [7] CJK UNIFIED IDEOGRAPH-2A6D7..CJK UNIFIED IDEOGRAPH-2A6DD +2A6DE..2A6DF ; Recommended # 14.0 [2] CJK UNIFIED IDEOGRAPH-2A6DE..CJK UNIFIED IDEOGRAPH-2A6DF 2A700..2B734 ; Recommended # 5.2 [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +2B735..2B738 ; Recommended # 14.0 [4] CJK UNIFIED IDEOGRAPH-2B735..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Recommended # 6.0 [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Recommended # 8.0 [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Recommended # 10.0 [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 30000..3134A ; Recommended # 13.0 [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 107816 +# Total code points: 107938 # Identifier_Type: Inclusion @@ -607,8 +628,8 @@ FA27..FA29 ; Recommended # 1.1 [3] CJK COMPATIBILITY ID 1A90..1A99 ; Limited_Use # 5.2 [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE 1AA7 ; Limited_Use # 5.2 TAI THAM SIGN MAI YAMOK 1B00..1B4B ; Limited_Use # 5.0 [76] BALINESE SIGN ULU RICEM..BALINESE LETTER ASYURA SASAK +1B4C ; Limited_Use # 14.0 BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; Limited_Use # 5.0 [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE -1B6B..1B73 ; Limited_Use 
# 5.0 [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B80..1BAA ; Limited_Use # 5.1 [43] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PAMAAEH 1BAB..1BAD ; Limited_Use # 6.1 [3] SUNDANESE SIGN VIRAMA..SUNDANESE CONSONANT SIGN PASANGAN WA 1BAE..1BB9 ; Limited_Use # 5.1 [12] SUNDANESE LETTER KHA..SUNDANESE DIGIT NINE @@ -657,6 +678,7 @@ ABF0..ABF9 ; Limited_Use # 5.2 [10] MEETEI MAYEK DIGIT Z 1145E ; Limited_Use # 11.0 NEWA SANDHI MARK 1145F ; Limited_Use # 12.0 NEWA LETTER VEDIC ANUSVARA 11460..11461 ; Limited_Use # 13.0 [2] NEWA SIGN JIHVAMULIYA..NEWA SIGN UPADHMANIYA +11AB0..11ABF ; Limited_Use # 14.0 [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA 11D60..11D65 ; Limited_Use # 11.0 [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU 11D67..11D68 ; Limited_Use # 11.0 [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI 11D6A..11D8E ; Limited_Use # 11.0 [37] GUNJALA GONDI LETTER OO..GUNJALA GONDI VOWEL SIGN UU @@ -680,13 +702,15 @@ ABF0..ABF9 ; Limited_Use # 5.2 [10] MEETEI MAYEK DIGIT Z 1E94B ; Limited_Use # 12.0 ADLAM NASALIZATION MARK 1E950..1E959 ; Limited_Use # 9.0 [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE -# Total code points: 5025 +# Total code points: 5033 # Identifier_Type: Limited_Use Technical 0740..074A ; Limited_Use Technical # 3.0 [11] SYRIAC FEMININE DOT..SYRIAC BARREKH +1B6B..1B73 ; Limited_Use Technical # 5.0 [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG +1DFA ; Limited_Use Technical # 14.0 COMBINING DOT BELOW LEFT -# Total code points: 11 +# Total code points: 21 # Identifier_Type: Limited_Use Exclusion @@ -719,6 +743,7 @@ A62A..A62B ; Limited_Use Obsolete # 5.1 [2] VAI SYLLABLE NDOLE M 1AA8..1AAD ; Limited_Use Not_XID # 5.2 [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1B5A..1B6A ; Limited_Use Not_XID # 5.0 [17] BALINESE PANTI..BALINESE MUSICAL SYMBOL DANG GEDE 1B74..1B7C ; Limited_Use Not_XID # 5.0 [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL 
LEFT-HAND OPEN PING +1B7D..1B7E ; Limited_Use Not_XID # 14.0 [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1BFC..1BFF ; Limited_Use Not_XID # 6.0 [4] BATAK SYMBOL BINDU NA METEK..BATAK SYMBOL BINDU PANGOLAT 1C3B..1C3F ; Limited_Use Not_XID # 5.1 [5] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION TSHOOK 1C7E..1C7F ; Limited_Use Not_XID # 5.1 [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD @@ -754,7 +779,7 @@ ABEB ; Limited_Use Not_XID # 5.2 MEETEI MAYEK CHEIKHE 1E2FF ; Limited_Use Not_XID # 12.0 WANCHO NGUN SIGN 1E95E..1E95F ; Limited_Use Not_XID # 9.0 [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK -# Total code points: 202 +# Total code points: 204 # Identifier_Type: Uncommon_Use @@ -798,7 +823,9 @@ ABEB ; Limited_Use Not_XID # 5.2 MEETEI MAYEK CHEIKHE 06DF..06E4 ; Uncommon_Use # 1.1 [6] ARABIC SMALL HIGH ROUNDED ZERO..ARABIC SMALL HIGH MADDA 06E7..06E8 ; Uncommon_Use # 1.1 [2] ARABIC SMALL HIGH YEH..ARABIC SMALL HIGH NOON 06EA..06ED ; Uncommon_Use # 1.1 [4] ARABIC EMPTY CENTRE LOW STOP..ARABIC SMALL LOW MEEM +0898..089F ; Uncommon_Use # 14.0 [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA 08B3..08B4 ; Uncommon_Use # 8.0 [2] ARABIC LETTER AIN WITH THREE DOTS BELOW..ARABIC LETTER KAF WITH DOT BELOW +08CA..08D2 ; Uncommon_Use # 14.0 [9] ARABIC SMALL HIGH FARSI YEH..ARABIC LARGE ROUND DOT INSIDE CIRCLE BELOW 08D3 ; Uncommon_Use # 11.0 ARABIC SMALL LOW WAW 08D4..08E1 ; Uncommon_Use # 9.0 [14] ARABIC SMALL HIGH WORD AR-RUB..ARABIC SMALL HIGH SIGN SAFHA 08E3 ; Uncommon_Use # 8.0 ARABIC TURNED DAMMA BELOW @@ -816,6 +843,7 @@ ABEB ; Limited_Use Not_XID # 5.2 MEETEI MAYEK CHEIKHE 0D44 ; Uncommon_Use # 5.1 MALAYALAM VOWEL SIGN VOCALIC RR 0D62..0D63 ; Uncommon_Use # 5.1 [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL 0F39 ; Uncommon_Use # 2.0 TIBETAN MARK TSA -PHRU +1AC1..1ACE ; Uncommon_Use # 14.0 [14] COMBINING LEFT PARENTHESIS ABOVE LEFT..COMBINING LATIN SMALL LETTER INSULAR T 2054 ; Uncommon_Use 
# 4.0 INVERTED UNDERTIE 2C68..2C6C ; Uncommon_Use # 5.0 [5] LATIN SMALL LETTER H WITH DESCENDER..LATIN SMALL LETTER Z WITH DESCENDER A66F ; Uncommon_Use # 5.1 COMBINING CYRILLIC VZMET @@ -824,8 +852,12 @@ A78B..A78C ; Uncommon_Use # 5.1 [2] LATIN CAPITAL LETTER A78F ; Uncommon_Use # 8.0 LATIN LETTER SINOLOGICAL DOT A7B2..A7B7 ; Uncommon_Use # 8.0 [6] LATIN CAPITAL LETTER J WITH CROSSED-TAIL..LATIN SMALL LETTER OMEGA AB60..AB63 ; Uncommon_Use # 8.0 [4] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER UO +10780 ; Uncommon_Use # 14.0 MODIFIER LETTER SMALL CAPITAL AA +1AFF0..1AFF3 ; Uncommon_Use # 14.0 [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Uncommon_Use # 14.0 [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Uncommon_Use # 14.0 [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 -# Total code points: 263 +# Total code points: 308 # Identifier_Type: Uncommon_Use Technical @@ -931,7 +963,7 @@ A8FC ; Uncommon_Use Obsolete Not_XID # 8.0 DEVANAGARI SIGN SIDD 0953..0954 ; Technical # 1.1 [2] DEVANAGARI GRAVE ACCENT..DEVANAGARI ACUTE ACCENT 0D81 ; Technical # 13.0 SINHALA SIGN CANDRABINDU 0F18..0F19 ; Technical # 2.0 [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS -17CB..17D0 ; Technical # 3.0 [6] KHMER SIGN BANTOC..KHMER SIGN SAMYOK SANNYA +17CE..17CF ; Technical # 3.0 [2] KHMER SIGN KAKABAT..KHMER SIGN AHSDA 1ABF..1AC0 ; Technical # 13.0 [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW 1D00..1D2B ; Technical # 4.0 [44] LATIN LETTER SMALL CAPITAL A..CYRILLIC LETTER SMALL CAPITAL EL 1D2F ; Technical # 4.0 MODIFIER LETTER CAPITAL BARRED B @@ -967,7 +999,6 @@ A8FC ; Uncommon_Use Obsolete Not_XID # 8.0 DEVANAGARI SIGN SIDD 3021..302D ; Technical # 1.1 [13] HANGZHOU NUMERAL ONE..IDEOGRAPHIC ENTERING TONE MARK 3031..3035 ; Technical # 1.1 [5] VERTICAL KANA REPEAT MARK..VERTICAL KANA REPEAT MARK 
LOWER HALF 303B..303C ; Technical # 3.2 [2] VERTICAL IDEOGRAPHIC ITERATION MARK..MASU MARK -31F0..31FF ; Technical # 3.2 [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO A78E ; Technical # 6.0 LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A7AF ; Technical # 11.0 LATIN LETTER SMALL CAPITAL Q A7BA..A7BF ; Technical # 12.0 [6] LATIN CAPITAL LETTER GLOTTAL A..LATIN SMALL LETTER GLOTTAL U @@ -977,13 +1008,15 @@ FE20..FE23 ; Technical # 1.1 [4] COMBINING LIGATURE L FE24..FE26 ; Technical # 5.1 [3] COMBINING MACRON LEFT HALF..COMBINING CONJOINING MACRON FE27..FE2D ; Technical # 7.0 [7] COMBINING LIGATURE LEFT HALF BELOW..COMBINING CONJOINING MACRON BELOW FE73 ; Technical # 3.2 ARABIC TAIL FRAGMENT +1CF00..1CF2D ; Technical # 14.0 [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Technical # 14.0 [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D169 ; Technical # 3.1 [5] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; Technical # 3.1 [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 1D17B..1D182 ; Technical # 3.1 [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D185..1D18B ; Technical # 3.1 [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D1AA..1D1AD ; Technical # 3.1 [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -# Total code points: 451 +# Total code points: 500 # Identifier_Type: Technical Exclusion @@ -1035,9 +1068,14 @@ A722..A72F ; Technical Obsolete # 5.1 [14] LATIN CAPITAL LETTER 4DC0..4DFF ; Technical Not_XID # 4.0 [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION A708..A716 ; Technical Not_XID # 4.1 [15] MODIFIER LETTER EXTRA-HIGH DOTTED TONE BAR..MODIFIER LETTER EXTRA-LOW LEFT-STEM TONE BAR FBB2..FBC1 ; Technical Not_XID # 6.0 [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW 
+FBC2 ; Technical Not_XID # 14.0 ARABIC SYMBOL WASLA ABOVE FD3E..FD3F ; Technical Not_XID # 1.1 [2] ORNATE LEFT PARENTHESIS..ORNATE RIGHT PARENTHESIS +FD40..FD4F ; Technical Not_XID # 14.0 [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH +FDCF ; Technical Not_XID # 14.0 ARABIC LIGATURE SALAAMUHU ALAYNAA FDFD ; Technical Not_XID # 4.0 ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFE..FDFF ; Technical Not_XID # 14.0 [2] ARABIC LIGATURE SUBHAANAHU WA TAAALAA..ARABIC LIGATURE AZZA WA JALL FE45..FE46 ; Technical Not_XID # 3.2 [2] SESAME DOT..WHITE SESAME DOT +1CF50..1CFC3 ; Technical Not_XID # 14.0 [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; Technical Not_XID # 3.1 [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; Technical Not_XID # 3.1 [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129 ; Technical Not_XID # 5.1 MUSICAL SYMBOL MULTIPLE MEASURE REST @@ -1047,9 +1085,10 @@ FE45..FE46 ; Technical Not_XID # 3.2 [2] SESAME DOT..WHITE SE 1D18C..1D1A9 ; Technical Not_XID # 3.1 [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 1D1AE..1D1BA ; Technical Not_XID # 3.1 [13] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL SEMIBREVIS BLACK 1D1C1..1D1DD ; Technical Not_XID # 3.1 [29] MUSICAL SYMBOL LONGA PERFECTA REST..MUSICAL SYMBOL PES SUBPUNCTIS +1D1E9..1D1EA ; Technical Not_XID # 14.0 [2] MUSICAL SYMBOL SORI..MUSICAL SYMBOL KORON 1D300..1D356 ; Technical Not_XID # 4.0 [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING -# Total code points: 887 +# Total code points: 1025 # Identifier_Type: Exclusion @@ -1060,7 +1099,10 @@ FE45..FE46 ; Technical Not_XID # 3.2 [2] SESAME DOT..WHITE SE 16EE..16F0 ; Exclusion # 3.0 [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; Exclusion # 7.0 [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC 1700..170C ; Exclusion # 3.2 [13] TAGALOG LETTER A..TAGALOG LETTER YA +170D ; Exclusion # 14.0 TAGALOG LETTER RA 170E..1714 ; Exclusion # 
3.2 [7] TAGALOG LETTER LA..TAGALOG SIGN VIRAMA +1715 ; Exclusion # 14.0 TAGALOG SIGN PAMUDPOD +171F ; Exclusion # 14.0 TAGALOG LETTER ARCHAIC RA 1720..1734 ; Exclusion # 3.2 [21] HANUNOO LETTER A..HANUNOO SIGN PAMUDPOD 1740..1753 ; Exclusion # 3.2 [20] BUHID LETTER A..BUHID VOWEL SIGN U 1760..176C ; Exclusion # 3.2 [13] TAGBANWA LETTER A..TAGBANWA LETTER YA @@ -1074,7 +1116,9 @@ FE45..FE46 ; Technical Not_XID # 3.2 [2] SESAME DOT..WHITE SE 1A00..1A1B ; Exclusion # 4.1 [28] BUGINESE LETTER KA..BUGINESE VOWEL SIGN AE 1CFA ; Exclusion # 12.0 VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA 2C00..2C2E ; Exclusion # 4.1 [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C2F ; Exclusion # 14.0 GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C30..2C5E ; Exclusion # 4.1 [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C5F ; Exclusion # 14.0 GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C80..2CE4 ; Exclusion # 4.1 [101] COPTIC CAPITAL LETTER ALFA..COPTIC SYMBOL KAI 2CEB..2CEF ; Exclusion # 5.2 [5] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC COMBINING NI ABOVE 2CF2..2CF3 ; Exclusion # 6.1 [2] COPTIC CAPITAL LETTER BOHAIRIC KHEI..COPTIC SMALL LETTER BOHAIRIC KHEI @@ -1105,6 +1149,14 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 104A0..104A9 ; Exclusion # 4.0 [10] OSMANYA DIGIT ZERO..OSMANYA DIGIT NINE 10500..10527 ; Exclusion # 7.0 [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; Exclusion # 7.0 [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; Exclusion # 14.0 [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Exclusion # 14.0 [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Exclusion # 14.0 [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Exclusion # 14.0 [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; Exclusion # 14.0 [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA 
+105A3..105B1 ; Exclusion # 14.0 [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Exclusion # 14.0 [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Exclusion # 14.0 [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; Exclusion # 7.0 [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; Exclusion # 7.0 [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; Exclusion # 7.0 [8] LINEAR A SIGN A800..LINEAR A SIGN A807 @@ -1148,12 +1200,15 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 10F00..10F1C ; Exclusion # 11.0 [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; Exclusion # 11.0 OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F50 ; Exclusion # 11.0 [33] SOGDIAN LETTER ALEPH..SOGDIAN COMBINING STROKE BELOW +10F70..10F85 ; Exclusion # 14.0 [22] OLD UYGHUR LETTER ALEPH..OLD UYGHUR COMBINING TWO DOTS BELOW 10FB0..10FC4 ; Exclusion # 13.0 [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; Exclusion # 12.0 [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11000..11046 ; Exclusion # 6.0 [71] BRAHMI SIGN CANDRABINDU..BRAHMI VIRAMA 11066..1106F ; Exclusion # 6.0 [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070..11075 ; Exclusion # 14.0 [6] BRAHMI SIGN OLD TAMIL VIRAMA..BRAHMI LETTER OLD TAMIL LLA 1107F ; Exclusion # 7.0 BRAHMI NUMBER JOINER 11080..110BA ; Exclusion # 5.2 [59] KAITHI SIGN CANDRABINDU..KAITHI SIGN NUKTA +110C2 ; Exclusion # 14.0 KAITHI VOWEL SIGN VOCALIC R 110D0..110E8 ; Exclusion # 6.1 [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; Exclusion # 6.1 [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE 11150..11173 ; Exclusion # 7.0 [36] MAHAJANI LETTER A..MAHAJANI SIGN NUKTA @@ -1206,6 +1261,7 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 1171A ; Exclusion # 11.0 AHOM LETTER ALTERNATE BA 1171D..1172B ; Exclusion # 8.0 [15] AHOM CONSONANT SIGN MEDIAL LA..AHOM SIGN KILLER 11730..11739 ; 
Exclusion # 8.0 [10] AHOM DIGIT ZERO..AHOM DIGIT NINE +11740..11746 ; Exclusion # 14.0 [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1183A ; Exclusion # 11.0 [59] DOGRA LETTER A..DOGRA SIGN NUKTA 118A0..118E9 ; Exclusion # 7.0 [74] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI DIGIT NINE 118FF ; Exclusion # 7.0 WARANG CITI OM @@ -1249,8 +1305,11 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 12400..12462 ; Exclusion # 5.0 [99] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN OLD ASSYRIAN ONE QUARTER 12463..1246E ; Exclusion # 7.0 [12] CUNEIFORM NUMERIC SIGN ONE QUARTER GUR..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; Exclusion # 8.0 [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; Exclusion # 14.0 [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; Exclusion # 5.2 [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; Exclusion # 8.0 [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 +16A70..16ABE ; Exclusion # 14.0 [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; Exclusion # 14.0 [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; Exclusion # 7.0 [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4 ; Exclusion # 7.0 [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16B00..16B36 ; Exclusion # 7.0 [55] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG MARK CIM TAUM @@ -1285,10 +1344,11 @@ A930..A953 ; Exclusion # 5.1 [36] REJANG LETTER KA..RE 1E01B..1E021 ; Exclusion # 9.0 [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI 1E023..1E024 ; Exclusion # 9.0 [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Exclusion # 9.0 [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA +1E290..1E2AE ; Exclusion # 14.0 [31] TOTO LETTER PA..TOTO SIGN RISING TONE 1E800..1E8C4 ; Exclusion # 7.0 [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 
1E8D0..1E8D6 ; Exclusion # 7.0 [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS -# Total code points: 15602 +# Total code points: 15930 # Identifier_Type: Exclusion Not_XID @@ -1336,6 +1396,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 10EAD ; Exclusion Not_XID # 13.0 YEZIDI HYPHENATION MARK 10F1D..10F26 ; Exclusion Not_XID # 11.0 [10] OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF 10F51..10F59 ; Exclusion Not_XID # 11.0 [9] SOGDIAN NUMBER ONE..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F86..10F89 ; Exclusion Not_XID # 14.0 [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FC5..10FCB ; Exclusion Not_XID # 13.0 [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 11047..1104D ; Exclusion Not_XID # 6.0 [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065 ; Exclusion Not_XID # 6.0 [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND @@ -1355,6 +1416,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 115CA..115D7 ; Exclusion Not_XID # 8.0 [14] SIDDHAM SECTION MARK WITH TRIDENT AND U-SHAPED ORNAMENTS..SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES 11641..11643 ; Exclusion Not_XID # 7.0 [3] MODI DANDA..MODI ABBREVIATION SIGN 11660..1166C ; Exclusion Not_XID # 9.0 [13] MONGOLIAN BIRGA WITH ORNAMENT..MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT +116B9 ; Exclusion Not_XID # 14.0 TAKRI ABBREVIATION SIGN 1173A..1173F ; Exclusion Not_XID # 8.0 [6] AHOM NUMBER TEN..AHOM SYMBOL VI 1183B ; Exclusion Not_XID # 11.0 DOGRA ABBREVIATION SIGN 118EA..118F2 ; Exclusion Not_XID # 7.0 [9] WARANG CITI NUMBER TEN..WARANG CITI NUMBER NINETY @@ -1369,6 +1431,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 11EF7..11EF8 ; Exclusion Not_XID # 11.0 [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION 12470..12473 ; Exclusion Not_XID # 5.0 [4] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL TRICOLON 12474 ; Exclusion Not_XID # 7.0 CUNEIFORM PUNCTUATION SIGN DIAGONAL 
QUADCOLON +12FF1..12FF2 ; Exclusion Not_XID # 14.0 [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13430..13438 ; Exclusion Not_XID # 12.0 [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT 16A6E..16A6F ; Exclusion Not_XID # 7.0 [2] MRO DANDA..MRO DOUBLE DANDA 16AF5 ; Exclusion Not_XID # 7.0 BASSA VAH FULL STOP @@ -1385,7 +1448,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 1DA85..1DA8B ; Exclusion Not_XID # 8.0 [7] SIGNWRITING LOCATION TORSO..SIGNWRITING PARENTHESIS 1E8C7..1E8CF ; Exclusion Not_XID # 7.0 [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE -# Total code points: 1098 +# Total code points: 1105 # Identifier_Type: Obsolete @@ -1461,6 +1524,7 @@ A95F ; Exclusion Not_XID # 5.1 REJANG SECTION MARK 2D00..2D25 ; Obsolete # 4.1 [38] GEORGIAN SMALL LETTER AN..GEORGIAN SMALL LETTER HOE 2DE0..2DFF ; Obsolete # 5.1 [32] COMBINING CYRILLIC LETTER BE..COMBINING CYRILLIC LETTER IOTIFIED BIG YUS 312E ; Obsolete # 10.0 BOPOMOFO LETTER O WITH DOT ABOVE +31F0..31FF ; Obsolete # 3.2 [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO A640..A65F ; Obsolete # 5.1 [32] CYRILLIC CAPITAL LETTER ZEMLYA..CYRILLIC SMALL LETTER YN A660..A661 ; Obsolete # 6.0 [2] CYRILLIC CAPITAL LETTER REVERSED TSE..CYRILLIC SMALL LETTER REVERSED TSE A662..A66E ; Obsolete # 5.1 [13] CYRILLIC CAPITAL LETTER SOFT DE..CYRILLIC LETTER MULTIOCULAR O @@ -1494,7 +1558,7 @@ D7CB..D7FB ; Obsolete # 5.2 [49] HANGUL JONGSEONG NIE 1B000..1B001 ; Obsolete # 6.0 [2] KATAKANA LETTER ARCHAIC E..HIRAGANA LETTER ARCHAIC YE 1B002..1B11E ; Obsolete # 10.0 [285] HENTAIGANA LETTER A-1..HENTAIGANA LETTER N-MU-MO-2 -# Total code points: 1325 +# Total code points: 1341 # Identifier_Type: Obsolete Not_XID @@ -1569,6 +1633,7 @@ A8F8..A8FA ; Obsolete Not_XID # 5.2 [3] DEVANAGARI SIGN PUSH 060C ; Not_XID # 1.1 ARABIC COMMA 060D..060F ; Not_XID # 4.0 [3] ARABIC DATE SEPARATOR..ARABIC SIGN MISRA 061B ; Not_XID # 1.1 ARABIC SEMICOLON +061D ; Not_XID # 14.0 ARABIC END OF TEXT MARK 061E 
; Not_XID # 4.1 ARABIC TRIPLE DOT PUNCTUATION MARK 061F ; Not_XID # 1.1 ARABIC QUESTION MARK 066A..066D ; Not_XID # 1.1 [4] ARABIC PERCENT SIGN..ARABIC FIVE POINTED STAR @@ -1576,6 +1641,8 @@ A8F8..A8FA ; Obsolete Not_XID # 5.2 [3] DEVANAGARI SIGN PUSH 06DD ; Not_XID # 1.1 ARABIC END OF AYAH 06DE ; Not_XID # 1.1 ARABIC START OF RUB EL HIZB 06E9 ; Not_XID # 1.1 ARABIC PLACE OF SAJDAH +0888 ; Not_XID # 14.0 ARABIC RAISED ROUND DOT +0890..0891 ; Not_XID # 14.0 [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Not_XID # 9.0 ARABIC DISPUTED END OF AYAH 0964..0965 ; Not_XID # 1.1 [2] DEVANAGARI DANDA..DEVANAGARI DOUBLE DANDA 0970 ; Not_XID # 1.1 DEVANAGARI ABBREVIATION SIGN @@ -1656,6 +1723,7 @@ A8F8..A8FA ; Obsolete Not_XID # 5.2 [3] DEVANAGARI SIGN PUSH 20BB..20BD ; Not_XID # 7.0 [3] NORDIC MARK SIGN..RUBLE SIGN 20BE ; Not_XID # 8.0 LARI SIGN 20BF ; Not_XID # 10.0 BITCOIN SIGN +20C0 ; Not_XID # 14.0 SOM SIGN 2104 ; Not_XID # 1.1 CENTRE LINE SYMBOL 2108 ; Not_XID # 1.1 SCRUPLE 2114 ; Not_XID # 1.1 L B BAR SYMBOL @@ -1799,6 +1867,7 @@ A8F8..A8FA ; Obsolete Not_XID # 5.2 [3] DEVANAGARI SIGN PUSH 2E4A..2E4E ; Not_XID # 11.0 [5] DOTTED SOLIDUS..PUNCTUS ELEVATUS MARK 2E4F ; Not_XID # 12.0 CORNISH VERSE DIVIDER 2E50..2E52 ; Not_XID # 13.0 [3] CROSS PATTY WITH RIGHT CROSSBAR..TIRONIAN SIGN CAPITAL ET +2E53..2E5D ; Not_XID # 14.0 [11] MEDIEVAL EXCLAMATION MARK..OBLIQUE HYPHEN 2E80..2E99 ; Not_XID # 3.0 [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2E9E ; Not_XID # 3.0 [4] CJK RADICAL CHOKE..CJK RADICAL DEATH 2EA0..2EF2 ; Not_XID # 3.0 [83] CJK RADICAL CIVILIAN..CJK RADICAL J-SIMPLIFIED TURTLE @@ -1947,6 +2016,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F6D3..1F6D4 ; Not_XID # 10.0 [2] STUPA..PAGODA 1F6D5 ; Not_XID # 12.0 HINDU TEMPLE 1F6D6..1F6D7 ; Not_XID # 13.0 [2] HUT..ELEVATOR +1F6DD..1F6DF ; Not_XID # 14.0 [3] PLAYGROUND SLIDE..RING BUOY 1F6E0..1F6EC ; Not_XID # 7.0 [13] HAMMER AND WRENCH..AIRPLANE ARRIVING 1F6F0..1F6F3 ; Not_XID # 7.0 [4] 
SATELLITE..PASSENGER SHIP 1F6F4..1F6F6 ; Not_XID # 9.0 [3] SCOOTER..CANOE @@ -1958,6 +2028,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F780..1F7D4 ; Not_XID # 7.0 [85] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..HEAVY TWELVE POINTED PINWHEEL STAR 1F7D5..1F7D8 ; Not_XID # 11.0 [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB ; Not_XID # 12.0 [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; Not_XID # 14.0 HEAVY EQUALS SIGN 1F800..1F80B ; Not_XID # 7.0 [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; Not_XID # 7.0 [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; Not_XID # 7.0 [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW @@ -1986,6 +2057,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F972 ; Not_XID # 13.0 SMILING FACE WITH TEAR 1F973..1F976 ; Not_XID # 11.0 [4] FACE WITH PARTY HORN AND PARTY HAT..FREEZING FACE 1F977..1F978 ; Not_XID # 13.0 [2] NINJA..DISGUISED FACE +1F979 ; Not_XID # 14.0 FACE HOLDING BACK TEARS 1F97A ; Not_XID # 11.0 FACE WITH PLEADING EYES 1F97B ; Not_XID # 12.0 SARI 1F97C..1F97F ; Not_XID # 11.0 [4] LAB COAT..FLAT SHOE @@ -2003,6 +2075,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1F9C1..1F9C2 ; Not_XID # 11.0 [2] CUPCAKE..SALT SHAKER 1F9C3..1F9CA ; Not_XID # 12.0 [8] BEVERAGE BOX..ICE CUBE 1F9CB ; Not_XID # 13.0 BUBBLE TEA +1F9CC ; Not_XID # 14.0 TROLL 1F9CD..1F9CF ; Not_XID # 12.0 [3] STANDING PERSON..DEAF PERSON 1F9D0..1F9E6 ; Not_XID # 10.0 [23] FACE WITH MONOCLE..SOCKS 1F9E7..1F9FF ; Not_XID # 11.0 [25] RED GIFT ENVELOPE..NAZAR AMULET @@ -2011,17 +2084,24 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 1FA70..1FA73 ; Not_XID # 12.0 [4] BALLET SHOES..SHORTS 1FA74 ; Not_XID # 13.0 THONG SANDAL 1FA78..1FA7A ; Not_XID # 12.0 [3] DROP OF BLOOD..STETHOSCOPE +1FA7B..1FA7C ; Not_XID # 14.0 [2] X-RAY..CRUTCH 1FA80..1FA82 ; Not_XID # 12.0 [3] YO-YO..PARACHUTE 1FA83..1FA86 ; Not_XID # 13.0 [4] BOOMERANG..NESTING DOLLS 
1FA90..1FA95 ; Not_XID # 12.0 [6] RINGED PLANET..BANJO 1FA96..1FAA8 ; Not_XID # 13.0 [19] MILITARY HELMET..ROCK +1FAA9..1FAAC ; Not_XID # 14.0 [4] MIRROR BALL..HAMSA 1FAB0..1FAB6 ; Not_XID # 13.0 [7] FLY..FEATHER +1FAB7..1FABA ; Not_XID # 14.0 [4] LOTUS..NEST WITH EGGS 1FAC0..1FAC2 ; Not_XID # 13.0 [3] ANATOMICAL HEART..PEOPLE HUGGING +1FAC3..1FAC5 ; Not_XID # 14.0 [3] PREGNANT MAN..PERSON WITH CROWN 1FAD0..1FAD6 ; Not_XID # 13.0 [7] BLUEBERRIES..TEAPOT +1FAD7..1FAD9 ; Not_XID # 14.0 [3] POURING LIQUID..JAR +1FAE0..1FAE7 ; Not_XID # 14.0 [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; Not_XID # 14.0 [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92 ; Not_XID # 13.0 [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; Not_XID # 13.0 [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON -# Total code points: 5587 +# Total code points: 5640 # Identifier_Type: Not_NFKC @@ -2193,6 +2273,7 @@ FFFD ; Not_XID # 1.1 REPLACEMENT CHARACTE 33FF ; Not_NFKC # 4.0 SQUARE GAL A69C..A69D ; Not_NFKC # 7.0 [2] MODIFIER LETTER CYRILLIC HARD SIGN..MODIFIER LETTER CYRILLIC SOFT SIGN A770 ; Not_NFKC # 5.1 MODIFIER LETTER US +A7F2..A7F4 ; Not_NFKC # 14.0 [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F8..A7F9 ; Not_NFKC # 6.1 [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE AB5C..AB5F ; Not_NFKC # 7.0 [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK AB69 ; Not_NFKC # 13.0 MODIFIER LETTER SMALL TURNED W @@ -2241,6 +2322,9 @@ FFD2..FFD7 ; Not_NFKC # 1.1 [6] HALFWIDTH HANGUL LET FFDA..FFDC ; Not_NFKC # 1.1 [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I FFE0..FFE6 ; Not_NFKC # 1.1 [7] FULLWIDTH CENT SIGN..FULLWIDTH WON SIGN FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGHT VERTICAL..HALFWIDTH WHITE CIRCLE +10781..10785 ; Not_NFKC # 14.0 [5] MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; 
Not_NFKC # 14.0 [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Not_NFKC # 14.0 [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 1D15E..1D164 ; Not_NFKC # 3.1 [7] MUSICAL SYMBOL HALF NOTE..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE 1D1BB..1D1C0 ; Not_NFKC # 3.1 [6] MUSICAL SYMBOL MINIMA..MUSICAL SYMBOL FUSA BLACK 1D400..1D454 ; Not_NFKC # 3.1 [85] MATHEMATICAL BOLD CAPITAL A..MATHEMATICAL ITALIC SMALL G @@ -2329,7 +2413,7 @@ FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGH 1FBF0..1FBF9 ; Not_NFKC # 13.0 [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE 2F800..2FA1D ; Not_NFKC # 3.1 [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D -# Total code points: 4800 +# Total code points: 4859 # Identifier_Type: Default_Ignorable @@ -2340,6 +2424,7 @@ FFE8..FFEE ; Not_NFKC # 1.1 [7] HALFWIDTH FORMS LIGH 17B4..17B5 ; Default_Ignorable # 3.0 [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA 180B..180D ; Default_Ignorable # 3.0 [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; Default_Ignorable # 3.0 MONGOLIAN VOWEL SEPARATOR +180F ; Default_Ignorable # 14.0 MONGOLIAN FREE VARIATION SELECTOR FOUR 200B ; Default_Ignorable # 1.1 ZERO WIDTH SPACE 200E..200F ; Default_Ignorable # 1.1 [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK 202A..202E ; Default_Ignorable # 1.1 [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE @@ -2355,7 +2440,7 @@ FFA0 ; Default_Ignorable # 1.1 HALFWIDTH HANGUL FIL E0020..E007F ; Default_Ignorable # 3.1 [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Default_Ignorable # 4.0 [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 395 +# Total code points: 396 # Identifier_Type: Deprecated diff --git a/lib/unicore/Index.txt b/lib/unicore/Index.txt index 498519f58b..451255cd83 100644 --- a/lib/unicore/Index.txt +++ b/lib/unicore/Index.txt @@ -1036,6 +1036,7 @@ combining counterclockwise ring overlay 20DA 
Combining Diacritical Marks 0300 Combining Diacritical Marks Extended 1AB0 Combining Diacritical Marks for Symbols 20D0 +Combining Diacritical Marks Supplement 1DC0 COMBINING DIAERESIS 0308 COMBINING DIAERESIS BELOW 0324 COMBINING DOT ABOVE 0307 @@ -1937,6 +1938,7 @@ Equality and Inequality Signs 22D5 EQUALS COLON 2255 EQUALS SIGN 003D EQUALS SIGN BELOW, COMBINING 0347 +EQUALS SIGN, HEAVY 1F7F0 EQUALS, CIRCLED 229C EQUALS, COLON 2254 equals, nearly 2252 @@ -2032,6 +2034,7 @@ FACE, WHITE FROWNING 2639 FACE, WHITE SMILING 263A Faces 1F600 Faces 1F920 +Faces 1FAE0 Facial Parts Symbols 1F440 FACSIMILE SIGN 213B factorial 0021 @@ -2429,6 +2432,7 @@ han-daku-on, japanese 309C Hand Symbols 1F446 Hand Symbols 1F58E Hand Symbols 1F918 +Hand Symbols 1FAF0 Hand Symbols, Pointing 261A Hand, Index Finger Pointing 1F446 HAND, RAISED 270B @@ -2478,6 +2482,7 @@ HEADPHONE 1F3A7 HEADSTONE GRAVEYARD SYMBOL 26FC HEART BULLET, REVERSED ROTATED FLORAL 2619 Heart Dingbats 2763 +HEART HANDS 1FAF6 Heart Ornaments 2763 Heart Symbols 1F493 HEART, BLACK 1F5A4 @@ -2567,6 +2572,7 @@ HYPHEN, DOUBLE 2E40 HYPHEN, KATAKANA-HIRAGANA DOUBLE 30A0 HYPHEN, MONGOLIAN TODO SOFT 1806 HYPHEN, NON-BREAKING 2011 +HYPHEN, OBLIQUE 2E5D hyphen, papyrological 035C HYPHEN, SOFT 00AD HYPHEN-MINUS 002D diff --git a/lib/unicore/IndicPositionalCategory.txt b/lib/unicore/IndicPositionalCategory.txt index ee74dbe0fa..69109ac51f 100644 --- a/lib/unicore/IndicPositionalCategory.txt +++ b/lib/unicore/IndicPositionalCategory.txt @@ -1,6 +1,6 @@ -# IndicPositionalCategory-13.0.0.txt -# Date: 2019-07-23, 00:01:00 GMT [KW, RP] -# © 2019 Unicode®, Inc. +# IndicPositionalCategory-14.0.0.txt +# Date: 2021-05-22, 01:01:00 GMT [KW, RP] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -25,8 +25,8 @@ # # In addition to combining marks associated with Indic scripts, the # Indic_Positional_Category has non-trivial values for special signs -# associated with Indic_Syllabic_Category=Consonant_Prefixed or -# Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs +# associated with Indic_Syllabic_Category=Consonant_Prefixed +# or Indic_Syllabic_Category=Consonant_Preceding_Repha. Those signs # have General_Category=Lo, rather than being combining marks. # They occur in initial position in syllabic structure. However, when # rendered, they appear as marks positioned with respect to another @@ -184,6 +184,8 @@ 1087..108C ; Right # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 108F ; Right # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 109A..109C ; Right # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Right # Mc TAGALOG SIGN PAMUDPOD +1734 ; Right # Mc HANUNOO SIGN PAMUDPOD 17B6 ; Right # Mc KHMER VOWEL SIGN AA 17C7..17C8 ; Right # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU 1923..1924 ; Right # Mc [2] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AI @@ -512,6 +514,8 @@ ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP 11001 ; Top # Mn BRAHMI SIGN ANUSVARA 11038..1103B ; Top # Mn [4] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN II 11042..11046 ; Top # Mn [5] BRAHMI VOWEL SIGN E..BRAHMI VIRAMA +11070 ; Top # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Top # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 11080..11081 ; Top # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA 110B5..110B6 ; Top # Mn [2] KAITHI VOWEL SIGN E..KAITHI VOWEL SIGN AI 11100..11102 ; Top # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA @@ -602,6 +606,7 @@ ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP 0B41..0B44 ; Bottom # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR 0B4D ; Bottom # Mn ORIYA SIGN VIRAMA 0B62..0B63 ; Bottom # Mn 
[2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL +0C3C ; Bottom # Mn TELUGU SIGN NUKTA 0C56 ; Bottom # Mn TELUGU AI LENGTH MARK 0C62..0C63 ; Bottom # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0CBC ; Bottom # Mn KANNADA SIGN NUKTA @@ -630,7 +635,7 @@ ABE5 ; Top # Mn MEETEI MAYEK VOWEL SIGN ANAP 1082 ; Bottom # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA 108D ; Bottom # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE 1713..1714 ; Bottom # Mn [2] TAGALOG VOWEL SIGN U..TAGALOG SIGN VIRAMA -1733..1734 ; Bottom # Mn [2] HANUNOO VOWEL SIGN U..HANUNOO SIGN PAMUDPOD +1733 ; Bottom # Mn HANUNOO VOWEL SIGN U 1753 ; Bottom # Mn BUHID VOWEL SIGN U 1773 ; Bottom # Mn TAGBANWA VOWEL SIGN U 17BB..17BD ; Bottom # Mn [3] KHMER VOWEL SIGN U..KHMER VOWEL SIGN UA @@ -675,6 +680,7 @@ ABED ; Bottom # Mn MEETEI MAYEK APUN IYEK 1103C..11041 ; Bottom # Mn [6] BRAHMI VOWEL SIGN U..BRAHMI VOWEL SIGN VOCALIC LL 110B3..110B4 ; Bottom # Mn [2] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN UU 110B9..110BA ; Bottom # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Bottom # Mn KAITHI VOWEL SIGN VOCALIC R 1112A..1112B ; Bottom # Mn [2] CHAKMA VOWEL SIGN U..CHAKMA VOWEL SIGN UU 11131..11132 ; Bottom # Mn [2] CHAKMA O MARK..CHAKMA AU MARK 11173 ; Bottom # Mn MAHAJANI SIGN NUKTA diff --git a/lib/unicore/IndicSyllabicCategory.txt b/lib/unicore/IndicSyllabicCategory.txt index 8297578d18..23b86372ae 100644 --- a/lib/unicore/IndicSyllabicCategory.txt +++ b/lib/unicore/IndicSyllabicCategory.txt @@ -1,6 +1,6 @@ -# IndicSyllabicCategory-13.0.0.txt -# Date: 2019-07-22, 19:55:00 GMT [KW, RP] -# © 2019 Unicode®, Inc. +# IndicSyllabicCategory-14.0.0.txt +# Date: 2021-05-22, 01:01:00 GMT [KW, RP] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -225,6 +225,7 @@ AAF5 ; Visarga # Mc MEETEI MAYEK VOWEL SIGN VISARGA 0ABC ; Nukta # Mn GUJARATI SIGN NUKTA 0AFD..0AFF ; Nukta # Mn [3] GUJARATI SIGN THREE-DOT NUKTA ABOVE..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE 0B3C ; Nukta # Mn ORIYA SIGN NUKTA +0C3C ; Nukta # Mn TELUGU SIGN NUKTA 0CBC ; Nukta # Mn KANNADA SIGN NUKTA 0F39 ; Nukta # Mn TIBETAN MARK TSA -PHRU 1B34 ; Nukta # Mn BALINESE SIGN REREKAN @@ -303,7 +304,8 @@ A9C0 ; Virama # Mc JAVANESE PANGKON 0F84 ; Pure_Killer # Mn TIBETAN MARK HALANTA 103A ; Pure_Killer # Mn MYANMAR SIGN ASAT 1714 ; Pure_Killer # Mn TAGALOG SIGN VIRAMA -1734 ; Pure_Killer # Mn HANUNOO SIGN PAMUDPOD +1715 ; Pure_Killer # Mc TAGALOG SIGN PAMUDPOD +1734 ; Pure_Killer # Mc HANUNOO SIGN PAMUDPOD 17D1 ; Pure_Killer # Mn KHMER SIGN VIRIAM 1A7A ; Pure_Killer # Mn TAI THAM SIGN RA HAAM 1BAA ; Pure_Killer # Mc SUNDANESE SIGN PAMAAEH @@ -311,6 +313,7 @@ A9C0 ; Virama # Mc JAVANESE PANGKON A82C ; Pure_Killer # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA A953 ; Pure_Killer # Mc REJANG VIRAMA ABED ; Pure_Killer # Mn MEETEI MAYEK APUN IYEK +11070 ; Pure_Killer # Mn BRAHMI SIGN OLD TAMIL VIRAMA 11134 ; Pure_Killer # Mn CHAKMA MAAYYAA 112EA ; Pure_Killer # Mn KHUDAWADI SIGN VIRAMA 1172B ; Pure_Killer # Mn AHOM SIGN KILLER @@ -408,6 +411,7 @@ AAE0..AAE1 ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER E..MEETEI MAYEK ABCE..ABCF ; Vowel_Independent # Lo [2] MEETEI MAYEK LETTER UN..MEETEI MAYEK LETTER I ABD1 ; Vowel_Independent # Lo MEETEI MAYEK LETTER ATIYA 11005..11012 ; Vowel_Independent # Lo [14] BRAHMI LETTER A..BRAHMI LETTER AU +11071..11072 ; Vowel_Independent # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O 11083..1108C ; Vowel_Independent # Lo [10] KAITHI LETTER A..KAITHI LETTER AU 11103..11106 ; Vowel_Independent # Lo [4] CHAKMA LETTER AA..CHAKMA LETTER E 11183..11190 ; Vowel_Independent # Lo [14] SHARADA LETTER A..SHARADA LETTER AU @@ -617,9 +621,11 @@ 
ABE9..ABEA ; Vowel_Dependent # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEET 10A05..10A06 ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O 10A0C..10A0D ; Vowel_Dependent # Mn [2] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN DOUBLE RING BELOW 11038..11045 ; Vowel_Dependent # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Vowel_Dependent # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 110B0..110B2 ; Vowel_Dependent # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; Vowel_Dependent # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; Vowel_Dependent # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Vowel_Dependent # Mn KAITHI VOWEL SIGN VOCALIC R 11127..1112B ; Vowel_Dependent # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112C ; Vowel_Dependent # Mc CHAKMA VOWEL SIGN E 1112D..11132 ; Vowel_Dependent # Mn [6] CHAKMA VOWEL SIGN AI..CHAKMA AU MARK @@ -813,8 +819,8 @@ AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MY 106E..1070 ; Consonant # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA 1075..1081 ; Consonant # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA 108E ; Consonant # Lo MYANMAR LETTER RUMAI PALAUNG FA -1703..170C ; Consonant # Lo [10] TAGALOG LETTER KA..TAGALOG LETTER YA -170E..1711 ; Consonant # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1703..1711 ; Consonant # Lo [15] TAGALOG LETTER KA..TAGALOG LETTER HA +171F ; Consonant # Lo TAGALOG LETTER ARCHAIC RA 1723..1731 ; Consonant # Lo [15] HANUNOO LETTER KA..HANUNOO LETTER HA 1743..1751 ; Consonant # Lo [15] BUHID LETTER KA..BUHID LETTER HA 1763..176C ; Consonant # Lo [10] TAGBANWA LETTER KA..TAGBANWA LETTER YA @@ -827,7 +833,7 @@ AA74..AA76 ; Consonant_Placeholder # Lo [3] MYANMAR LOGOGRAM KHAMTI OAY..MY 1A20..1A4C ; Consonant # Lo [45] TAI THAM LETTER HIGH KA..TAI THAM LETTER LOW HA 1A53..1A54 ; Consonant # Lo [2] TAI 
THAM LETTER LAE..TAI THAM LETTER GREAT SA 1B13..1B33 ; Consonant # Lo [33] BALINESE LETTER KA..BALINESE LETTER HA -1B45..1B4B ; Consonant # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; Consonant # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B8A..1BA0 ; Consonant # Lo [23] SUNDANESE LETTER KA..SUNDANESE LETTER HA 1BAE..1BAF ; Consonant # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBB..1BBD ; Consonant # Lo [3] SUNDANESE LETTER REU..SUNDANESE LETTER BHA @@ -863,6 +869,7 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE 10A15..10A17 ; Consonant # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA 10A19..10A35 ; Consonant # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA 11013..11037 ; Consonant # Lo [37] BRAHMI LETTER KA..BRAHMI LETTER OLD TAMIL NNNA +11075 ; Consonant # Lo BRAHMI LETTER OLD TAMIL LLA 1108D..110AF ; Consonant # Lo [35] KAITHI LETTER KA..KAITHI LETTER HA 11107..11126 ; Consonant # Lo [32] CHAKMA LETTER KAA..CHAKMA LETTER HAA 11144 ; Consonant # Lo CHAKMA LETTER LHAA @@ -888,6 +895,7 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE 1168A..116AA ; Consonant # Lo [33] TAKRI LETTER KA..TAKRI LETTER RRA 116B8 ; Consonant # Lo TAKRI LETTER ARCHAIC KHA 11700..1171A ; Consonant # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Consonant # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 1180A..1182B ; Consonant # Lo [34] DOGRA LETTER KA..DOGRA LETTER RRA 1190C..11913 ; Consonant # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA 11915..11916 ; Consonant # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA @@ -910,6 +918,8 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE # [Not derivable] 09CE ; Consonant_Dead # Lo BENGALI LETTER KHANDA TA +0C5D ; Consonant_Dead # Lo TELUGU LETTER NAKAARA POLLU +0CDD ; Consonant_Dead # Lo KANNADA LETTER NAKAARA POLLU 0D54..0D56 ; Consonant_Dead # Lo [3] MALAYALAM 
LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL 0D7A..0D7F ; Consonant_Dead # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K 1CF2..1CF3 ; Consonant_Dead # Lo [2] VEDIC SIGN ARDHAVISARGA..VEDIC SIGN ROTATED ARDHAVISARGA @@ -975,9 +985,6 @@ ABD2..ABDA ; Consonant # Lo [9] MEETEI MAYEK LETTER GOK..MEETEI MAYEK LETTE # [Not derivable] 17CC ; Consonant_Succeeding_Repha # Mn KHMER SIGN ROBAT -1B03 ; Consonant_Succeeding_Repha # Mn BALINESE SIGN SURANG -1B81 ; Consonant_Succeeding_Repha # Mn SUNDANESE SIGN PANGLAYAR -A982 ; Consonant_Succeeding_Repha # Mn JAVANESE SIGN LAYAR # ================================================ @@ -1043,11 +1050,14 @@ AA35..AA36 ; Consonant_Medial # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONA 1939 ; Consonant_Final # Mn LIMBU SIGN MUKPHRENG 19C1..19C7 ; Consonant_Final # Lo [7] NEW TAI LUE LETTER FINAL V..NEW TAI LUE LETTER FINAL B 1A58..1A59 ; Consonant_Final # Mn [2] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN FINAL NGA +1B03 ; Consonant_Final # Mn BALINESE SIGN SURANG +1B81 ; Consonant_Final # Mn SUNDANESE SIGN PANGLAYAR 1BBE..1BBF ; Consonant_Final # Lo [2] SUNDANESE LETTER FINAL K..SUNDANESE LETTER FINAL M 1BF0..1BF1 ; Consonant_Final # Mn [2] BATAK CONSONANT SIGN NG..BATAK CONSONANT SIGN H 1C2D..1C33 ; Consonant_Final # Mn [7] LEPCHA CONSONANT SIGN K..LEPCHA CONSONANT SIGN T A94F..A951 ; Consonant_Final # Mn [3] REJANG CONSONANT SIGN NG..REJANG CONSONANT SIGN R A952 ; Consonant_Final # Mc REJANG CONSONANT SIGN H +A982 ; Consonant_Final # Mn JAVANESE SIGN LAYAR AA40..AA42 ; Consonant_Final # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG AA43 ; Consonant_Final # Mn CHAM CONSONANT SIGN FINAL NG AA44..AA4B ; Consonant_Final # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS diff --git a/lib/unicore/Jamo.txt b/lib/unicore/Jamo.txt index 7e171e1cda..298d9df988 100644 --- a/lib/unicore/Jamo.txt +++ b/lib/unicore/Jamo.txt @@ -1,6 +1,6 @@ -# Jamo-13.0.0.txt -# Date: 2019-09-09, 19:46:00 GMT [KW, LI] -# © 2019 Unicode®, 
Inc. +# Jamo-14.0.0.txt +# Date: 2021-03-16, 21:43:00 GMT [KW, LI] +# © 2021 Unicode®, Inc. # For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database @@ -8,7 +8,7 @@ # # This file defines the Jamo_Short_Name property. # -# See Section 3.12 of The Unicode Standard, Version 13.0 +# See Section 3.12 of The Unicode Standard, Version 14.0 # for more information. # # Each line contains two fields, separated by a semicolon. diff --git a/lib/unicore/LineBreak.txt b/lib/unicore/LineBreak.txt index 22abddcd90..aa5985b8f0 100644 --- a/lib/unicore/LineBreak.txt +++ b/lib/unicore/LineBreak.txt @@ -1,11 +1,11 @@ -# LineBreak-13.0.0.txt -# Date: 2020-02-17, 07:43:02 GMT [KW, LI] -# © 2020 Unicode®, Inc. +# LineBreak-14.0.0.txt +# Date: 2021-07-06, 09:58:55 GMT [KW, LI] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Line_Break Property # @@ -49,7 +49,7 @@ # with ranges of code points, the code point count in square brackets. # # For more information, see UAX #14: Unicode Line Breaking Algorithm, -# at http://www.unicode.org/reports/tr14/ +# at https://www.unicode.org/reports/tr14/ # # @missing: 0000..10FFFF; XX 0000..0008;CM # Cc [9] .. 
@@ -215,7 +215,7 @@ 0610..061A;CM # Mn [11] ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA 061B;EX # Po ARABIC SEMICOLON 061C;CM # Cf ARABIC LETTER MARK -061E..061F;EX # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F;EX # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F;AL # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640;AL # Lm ARABIC TATWEEL 0641..064A;AL # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -277,9 +277,14 @@ 0859..085B;CM # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 085E;AL # Po MANDAIC PUNCTUATION 0860..086A;AL # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4;AL # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7;AL # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1;CM # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887;AL # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888;AL # Sk ARABIC RAISED ROUND DOT +0889..088E;AL # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891;AL # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F;CM # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8;AL # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9;AL # Lm ARABIC SMALL FARSI YEH +08CA..08E1;CM # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E2;AL # Cf ARABIC DISPUTED END OF AYAH 08E3..08FF;CM # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA 0900..0902;CM # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA @@ -437,6 +442,7 @@ 0C0E..0C10;AL # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28;AL # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39;AL # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C3C;CM # Mn 
TELUGU SIGN NUKTA 0C3D;AL # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40;CM # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44;CM # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -444,6 +450,7 @@ 0C4A..0C4D;CM # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56;CM # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A;AL # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D;AL # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61;AL # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63;CM # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F;NU # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -469,7 +476,7 @@ 0CCA..0CCB;CM # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD;CM # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6;CM # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE;AL # Lo KANNADA LETTER FA +0CDD..0CDE;AL # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1;AL # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3;CM # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF;NU # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -672,11 +679,13 @@ 16EB..16ED;BA # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0;AL # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8;AL # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C;AL # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711;AL # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711;AL # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714;CM # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA +1715;CM # Mc TAGALOG SIGN PAMUDPOD +171F;AL # Lo TAGALOG LETTER ARCHAIC RA 1720..1731;AL # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734;CM # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733;CM # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734;CM # Mc HANUNOO SIGN PAMUDPOD 
1735..1736;BA # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 1740..1751;AL # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753;CM # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U @@ -711,6 +720,7 @@ 180A;AL # Po MONGOLIAN NIRUGU 180B..180D;CM # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E;GL # Cf MONGOLIAN VOWEL SEPARATOR +180F;CM # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819;NU # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842;AL # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843;AL # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -766,7 +776,7 @@ 1AA8..1AAD;SA # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1AB0..1ABD;CM # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE;CM # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0;CM # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE;CM # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03;CM # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04;CM # Mc BALINESE SIGN BISAH 1B05..1B33;AL # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -778,7 +788,7 @@ 1B3D..1B41;CM # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42;CM # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44;CM # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B;AL # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C;AL # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59;NU # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B5B;BA # Po [2] BALINESE PANTI..BALINESE PAMADA 1B5C;AL # Po BALINESE WINDU @@ -786,6 +796,7 @@ 1B61..1B6A;AL # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B6B..1B73;CM # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B74..1B7C;AL # So [9] 
BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E;BA # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B80..1B81;CM # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82;CM # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0;AL # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -844,8 +855,7 @@ 1D79..1D7F;AL # Ll [7] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER UPSILON WITH STROKE 1D80..1D9A;AL # Ll [27] LATIN SMALL LETTER B WITH PALATAL HOOK..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF;AL # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9;CM # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF;CM # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF;CM # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1EFF;AL # L& [256] LATIN CAPITAL LETTER A WITH RING BELOW..LATIN SMALL LETTER Y WITH LOOP 1F00..1F15;AL # L& [22] GREEK SMALL LETTER ALPHA WITH PSILI..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D;AL # Lu [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA @@ -953,7 +963,8 @@ 20BC..20BD;PR # Sc [2] MANAT SIGN..RUBLE SIGN 20BE;PO # Sc LARI SIGN 20BF;PR # Sc BITCOIN SIGN -20C0..20CF;PR # Cn [16] .. +20C0;PO # Sc SOM SIGN +20C1..20CF;PR # Cn [15] .. 
20D0..20DC;CM # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0;CM # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E1;CM # Mn COMBINING LEFT RIGHT ARROW ABOVE @@ -1307,8 +1318,7 @@ 2B5A..2B73;AL # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR 2B76..2B95;AL # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW 2B97..2BFF;AL # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL -2C00..2C2E;AL # Lu [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E;AL # Ll [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C00..2C5F;AL # L& [96] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C60..2C7B;AL # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D;AL # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2C7F;AL # Lu [2] LATIN CAPITAL LETTER S WITH SWASH TAIL..LATIN CAPITAL LETTER Z WITH SWASH TAIL @@ -1390,6 +1400,16 @@ 2E4E..2E4F;BA # Po [2] PUNCTUS ELEVATUS MARK..CORNISH VERSE DIVIDER 2E50..2E51;AL # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR 2E52;AL # Po TIRONIAN SIGN CAPITAL ET +2E53..2E54;EX # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK +2E55;OP # Ps LEFT SQUARE BRACKET WITH STROKE +2E56;CL # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57;OP # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58;CL # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59;OP # Ps TOP HALF LEFT PARENTHESIS +2E5A;CL # Pe TOP HALF RIGHT PARENTHESIS +2E5B;OP # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C;CL # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D;BA # Pd OBLIQUE HYPHEN 2E80..2E99;ID # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3;ID # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5;ID # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1510,8 +1530,7 @@ 
3300..33FF;ID # So [256] SQUARE APAATO..SQUARE GAL 3400..4DBF;ID # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF 4DC0..4DFF;AL # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION -4E00..9FFC;ID # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -9FFD..9FFF;ID # Cn [3] .. +4E00..9FFF;ID # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF A000..A014;ID # Lo [21] YI SYLLABLE IT..YI SYLLABLE E A015;NS # Lm YI SYLLABLE WU A016..A48C;ID # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR @@ -1553,8 +1572,11 @@ A788;AL # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A;AL # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E;AL # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F;AL # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF;AL # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA;AL # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA;AL # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1;AL # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3;AL # Ll LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9;AL # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4;AL # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6;AL # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7;AL # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9;AL # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -2511,15 +2533,17 @@ FB40..FB41;HL # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAME FB43..FB44;HL # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH FB46..FB4F;HL # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE ALEF LAMED FB50..FBB1;AL # Lo 
[98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1;AL # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2;AL # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D;AL # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM FD3E;CL # Pe ORNATE LEFT PARENTHESIS FD3F;OP # Ps ORNATE RIGHT PARENTHESIS +FD40..FD4F;AL # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F;AL # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7;AL # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF;AL # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB;AL # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC;PO # Sc RIAL SIGN -FDFD;AL # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF;AL # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE00..FE0F;CM # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 FE10;IS # Po PRESENTATION FORM FOR VERTICAL COMMA FE11..FE12;CL # Po [2] PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC COMMA..PRESENTATION FORM FOR VERTICAL IDEOGRAPHIC FULL STOP @@ -2682,9 +2706,20 @@ FFFD;AI # So REPLACEMENT CHARACTER 10500..10527;AL # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563;AL # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F;AL # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A;AL # Lu [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A;AL # Lu [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592;AL # Lu [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595;AL # Lu [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1;AL # Ll [11] VITHKUQI 
SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1;AL # Ll [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9;AL # Ll [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC;AL # Ll [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736;AL # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755;AL # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767;AL # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785;AL # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0;AL # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA;AL # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805;AL # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808;AL # Lo CYPRIOT SYLLABLE JO 1080A..10835;AL # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -2765,6 +2800,9 @@ FFFD;AI # So REPLACEMENT CHARACTER 10F46..10F50;CM # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 10F51..10F54;AL # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59;AL # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81;AL # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85;CM # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +10F86..10F89;AL # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4;AL # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB;AL # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6;AL # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH @@ -2777,6 +2815,10 @@ FFFD;AI # So REPLACEMENT CHARACTER 11049..1104D;AL # Po [5] BRAHMI PUNCTUATION DOT..BRAHMI PUNCTUATION LOTUS 11052..11065;AL # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F;NU # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE 
+11070;CM # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072;AL # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074;CM # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075;AL # Lo BRAHMI LETTER OLD TAMIL LLA 1107F;CM # Mn BRAHMI NUMBER JOINER 11080..11081;CM # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA 11082;CM # Mc KAITHI SIGN VISARGA @@ -2788,6 +2830,7 @@ FFFD;AI # So REPLACEMENT CHARACTER 110BB..110BC;AL # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD;AL # Cf KAITHI NUMBER SIGN 110BE..110C1;BA # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA +110C2;CM # Mn KAITHI VOWEL SIGN VOCALIC R 110CD;AL # Cf KAITHI NUMBER SIGN ABOVE 110D0..110E8;AL # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9;NU # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE @@ -2934,6 +2977,7 @@ FFFD;AI # So REPLACEMENT CHARACTER 116B6;CM # Mc TAKRI SIGN VIRAMA 116B7;CM # Mn TAKRI SIGN NUKTA 116B8;AL # Lo TAKRI LETTER ARCHAIC KHA +116B9;AL # Po TAKRI ABBREVIATION SIGN 116C0..116C9;NU # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A;SA # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 1171D..1171F;SA # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA @@ -2945,6 +2989,7 @@ FFFD;AI # So REPLACEMENT CHARACTER 1173A..1173B;SA # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E;BA # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F;SA # So AHOM SYMBOL VI +11740..11746;SA # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B;AL # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E;CM # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837;CM # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -3008,6 +3053,7 @@ FFFD;AI # So REPLACEMENT CHARACTER 11A9D;AL # Lo SOYOMBO MARK PLUTA 11A9E..11AA0;BB # Po [3] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO HEAD MARK WITH MOON AND SUN 11AA1..11AA2;BA # Po [2] SOYOMBO 
TERMINAL MARK-1..SOYOMBO TERMINAL MARK-2 +11AB0..11ABF;AL # Lo [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA 11AC0..11AF8;AL # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08;AL # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E;AL # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA @@ -3065,6 +3111,8 @@ FFFD;AI # So REPLACEMENT CHARACTER 12400..1246E;AL # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474;BA # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543;AL # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0;AL # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2;AL # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..13257;AL # Lo [600] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH O006 13258..1325A;OP # Lo [3] EGYPTIAN HIEROGLYPH O006A..EGYPTIAN HIEROGLYPH O006C 1325B..1325D;CL # Lo [3] EGYPTIAN HIEROGLYPH O006D..EGYPTIAN HIEROGLYPH O006F @@ -3090,6 +3138,8 @@ FFFD;AI # So REPLACEMENT CHARACTER 16A40..16A5E;AL # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69;NU # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F;BA # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE;AL # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9;NU # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED;AL # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4;CM # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16AF5;BA # Po BASSA VAH FULL STOP @@ -3124,8 +3174,11 @@ FFFD;AI # So REPLACEMENT CHARACTER 18800..18AFF;ID # Lo [768] TANGUT COMPONENT-001..TANGUT COMPONENT-768 18B00..18CD5;AL # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08;ID # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 +1AFF0..1AFF3;AL # Lm [4] KATAKANA LETTER 
MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB;AL # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE;AL # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1B000..1B0FF;ID # Lo [256] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER RE-2 -1B100..1B11E;ID # Lo [31] HENTAIGANA LETTER RE-3..HENTAIGANA LETTER N-MU-MO-2 +1B100..1B122;ID # Lo [35] HENTAIGANA LETTER RE-3..KATAKANA LETTER ARCHAIC WU 1B150..1B152;CJ # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167;CJ # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB;ID # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -3137,6 +3190,9 @@ FFFD;AI # So REPLACEMENT CHARACTER 1BC9D..1BC9E;CM # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BC9F;BA # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1BCA0..1BCA3;CM # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D;CM # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46;CM # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF50..1CFC3;AL # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5;AL # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126;AL # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164;AL # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -3150,7 +3206,7 @@ FFFD;AI # So REPLACEMENT CHARACTER 1D185..1D18B;CM # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D18C..1D1A9;AL # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 1D1AA..1D1AD;CM # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -1D1AE..1D1E8;AL # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN 
+1D1AE..1D1EA;AL # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241;AL # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D242..1D244;CM # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME 1D245;AL # So GREEK MUSICAL LEIMMA @@ -3211,6 +3267,9 @@ FFFD;AI # So REPLACEMENT CHARACTER 1DA8B;AL # Po SIGNWRITING PARENTHESIS 1DA9B..1DA9F;CM # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA1..1DAAF;CM # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09;AL # Ll [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A;AL # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E;AL # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006;CM # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018;CM # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021;CM # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -3222,10 +3281,16 @@ FFFD;AI # So REPLACEMENT CHARACTER 1E140..1E149;NU # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E;AL # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F;AL # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD;AL # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE;CM # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB;AL # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF;CM # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9;NU # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1E2FF;PR # Sc WANCHO NGUN SIGN +1E7E0..1E7E6;AL # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB;AL # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE;AL # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE;AL # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC 
SYLLABLE GURAGE PWEE 1E800..1E8C4;AL # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF;AL # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E8D0..1E8D6;CM # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS @@ -3389,8 +3454,8 @@ FFFD;AI # So REPLACEMENT CHARACTER 1F6C1..1F6CB;ID # So [11] BATHTUB..COUCH AND LAMP 1F6CC;EB # So SLEEPING ACCOMMODATION 1F6CD..1F6D7;ID # So [11] SHOPPING BAGS..ELEVATOR -1F6D8..1F6DF;ID # Cn [8] .. -1F6E0..1F6EC;ID # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6D8..1F6DC;ID # Cn [5] .. +1F6DD..1F6EC;ID # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6ED..1F6EF;ID # Cn [3] .. 1F6F0..1F6FC;ID # So [13] SATELLITE..ROLLER SKATE 1F6FD..1F6FF;ID # Cn [3] .. @@ -3400,7 +3465,9 @@ FFFD;AI # So REPLACEMENT CHARACTER 1F7D5..1F7D8;ID # So [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7D9..1F7DF;ID # Cn [7] .. 1F7E0..1F7EB;ID # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE -1F7EC..1F7FF;ID # Cn [20] .. +1F7EC..1F7EF;ID # Cn [4] .. +1F7F0;ID # So HEAVY EQUALS SIGN +1F7F1..1F7FF;ID # Cn [15] .. 1F800..1F80B;AL # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F80C..1F80F;ID # Cn [4] .. 
1F810..1F847;AL # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW @@ -3427,16 +3494,13 @@ FFFD;AI # So REPLACEMENT CHARACTER 1F93C..1F93E;EB # So [3] WRESTLERS..HANDBALL 1F93F..1F976;ID # So [56] DIVING MASK..FREEZING FACE 1F977;EB # So NINJA -1F978;ID # So DISGUISED FACE -1F979;ID # Cn -1F97A..1F9B4;ID # So [59] FACE WITH PLEADING EYES..BONE +1F978..1F9B4;ID # So [61] DISGUISED FACE..BONE 1F9B5..1F9B6;EB # So [2] LEG..FOOT 1F9B7;ID # So TOOTH 1F9B8..1F9B9;EB # So [2] SUPERHERO..SUPERVILLAIN 1F9BA;ID # So SAFETY VEST 1F9BB;EB # So EAR WITH HEARING AID -1F9BC..1F9CB;ID # So [16] MOTORIZED WHEELCHAIR..BUBBLE TEA -1F9CC;ID # Cn +1F9BC..1F9CC;ID # So [17] MOTORIZED WHEELCHAIR..TROLL 1F9CD..1F9CF;EB # So [3] STANDING PERSON..DEAF PERSON 1F9D0;ID # So FACE WITH MONOCLE 1F9D1..1F9DD;EB # So [13] ADULT..ELF @@ -3447,26 +3511,31 @@ FFFD;AI # So REPLACEMENT CHARACTER 1FA6E..1FA6F;ID # Cn [2] .. 1FA70..1FA74;ID # So [5] BALLET SHOES..THONG SANDAL 1FA75..1FA77;ID # Cn [3] .. -1FA78..1FA7A;ID # So [3] DROP OF BLOOD..STETHOSCOPE -1FA7B..1FA7F;ID # Cn [5] .. +1FA78..1FA7C;ID # So [5] DROP OF BLOOD..CRUTCH +1FA7D..1FA7F;ID # Cn [3] .. 1FA80..1FA86;ID # So [7] YO-YO..NESTING DOLLS 1FA87..1FA8F;ID # Cn [9] .. -1FA90..1FAA8;ID # So [25] RINGED PLANET..ROCK -1FAA9..1FAAF;ID # Cn [7] .. -1FAB0..1FAB6;ID # So [7] FLY..FEATHER -1FAB7..1FABF;ID # Cn [9] .. +1FA90..1FAAC;ID # So [29] RINGED PLANET..HAMSA +1FAAD..1FAAF;ID # Cn [3] .. +1FAB0..1FABA;ID # So [11] FLY..NEST WITH EGGS +1FABB..1FABF;ID # Cn [5] .. 1FAC0..1FAC2;ID # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAC3..1FACF;ID # Cn [13] .. -1FAD0..1FAD6;ID # So [7] BLUEBERRIES..TEAPOT -1FAD7..1FAFF;ID # Cn [41] .. +1FAC3..1FAC5;EB # So [3] PREGNANT MAN..PERSON WITH CROWN +1FAC6..1FACF;ID # Cn [10] .. +1FAD0..1FAD9;ID # So [10] BLUEBERRIES..JAR +1FADA..1FADF;ID # Cn [6] .. +1FAE0..1FAE7;ID # So [8] MELTING FACE..BUBBLES +1FAE8..1FAEF;ID # Cn [8] .. 
+1FAF0..1FAF6;EB # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS +1FAF7..1FAFF;ID # Cn [9] .. 1FB00..1FB92;AL # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA;AL # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON 1FBF0..1FBF9;NU # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE 1FC00..1FFFD;ID # Cn [1022] .. -20000..2A6DD;ID # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A6DE..2A6FF;ID # Cn [34] .. -2A700..2B734;ID # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 -2B735..2B73F;ID # Cn [11] .. +20000..2A6DF;ID # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A6E0..2A6FF;ID # Cn [32] .. +2A700..2B738;ID # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 +2B739..2B73F;ID # Cn [7] .. 2B740..2B81D;ID # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F;ID # Cn [2] .. 2B820..2CEA1;ID # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 diff --git a/lib/unicore/NameAliases.txt b/lib/unicore/NameAliases.txt index 0e62632db5..8519284d89 100644 --- a/lib/unicore/NameAliases.txt +++ b/lib/unicore/NameAliases.txt @@ -1,6 +1,6 @@ -# NameAliases-13.0.0.txt -# Date: 2019-09-09, 19:47:00 GMT [KW, LI] -# © 2019 Unicode®, Inc. +# NameAliases-14.0.0.txt +# Date: 2020-10-21, 22:28:00 GMT [KW, LI] +# © 2020 Unicode®, Inc. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database @@ -270,6 +270,7 @@ 180C;FVS2;abbreviation 180D;FVS3;abbreviation 180E;MVS;abbreviation +180F;FVS4;abbreviation 200B;ZWSP;abbreviation 200C;ZWNJ;abbreviation 200D;ZWJ;abbreviation @@ -293,6 +294,7 @@ 2B7A;LEFTWARDS TRIANGLE-HEADED ARROW WITH DOUBLE VERTICAL STROKE;correction 2B7C;RIGHTWARDS TRIANGLE-HEADED ARROW WITH DOUBLE VERTICAL STROKE;correction A015;YI SYLLABLE ITERATION MARK;correction +AA6E;MYANMAR LETTER KHAMTI LLA;correction FE00;VS1;abbreviation FE01;VS2;abbreviation FE02;VS3;abbreviation diff --git a/lib/unicore/NamedSequences.txt b/lib/unicore/NamedSequences.txt index b3c64f18c2..fa05c6a7d8 100644 --- a/lib/unicore/NamedSequences.txt +++ b/lib/unicore/NamedSequences.txt @@ -1,10 +1,10 @@ -# NamedSequences-13.0.0.txt -# Date: 2020-01-22, 19:12:00 GMT [KW, LI] -# © 2020 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# NamedSequences-14.0.0.txt +# Date: 2021-08-03, 23:04:00 GMT [KW] +# © 2021 Unicode®, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Unicode Named Character Sequences # @@ -28,7 +28,7 @@ # <1000, 1001, 1002> # # For more information, see UAX #34: Unicode Named Character -# Sequences, at http://www.unicode.org/unicode/reports/tr34/ +# Sequences, at https://www.unicode.org/reports/tr34/ # # Note: The order of entries in this file is not significant. # However, entries are generally in script order corresponding @@ -168,6 +168,35 @@ ARABIC SEQUENCE YEH WITH HAMZA ABOVE WITH E;0626 06D0 ARABIC SEQUENCE YEH WITH HAMZA ABOVE WITH AE;0626 06D5 ARABIC SEQUENCE NOON WITH KEHEH;0646 06A9 +# Entries that correspond to Indic characters with nuktas +# that are also listed in CompositionExclusions.txt. 
+# These characters decompose for normalized text, even +# in NFC. Having named sequences for these helps in +# certain specifications, including Label Generation Rules (LGR) +# for Internationalized Domain Names (IDN). +# +# Provisional 2020-01-16, Approved 2021-07-27 + +DEVANAGARI SEQUENCE FOR LETTER QA; 0915 093C +DEVANAGARI SEQUENCE FOR LETTER KHHA; 0916 093C +DEVANAGARI SEQUENCE FOR LETTER GHHA; 0917 093C +DEVANAGARI SEQUENCE FOR LETTER ZA; 091C 093C +DEVANAGARI SEQUENCE FOR LETTER DDDHA; 0921 093C +DEVANAGARI SEQUENCE FOR LETTER RHA; 0922 093C +DEVANAGARI SEQUENCE FOR LETTER FA; 092B 093C +DEVANAGARI SEQUENCE FOR LETTER YYA; 092F 093C +BENGALI SEQUENCE FOR LETTER RRA; 09A1 09BC +BENGALI SEQUENCE FOR LETTER RHA; 09A2 09BC +BENGALI SEQUENCE FOR LETTER YYA; 09AF 09BC +GURMUKHI SEQUENCE FOR LETTER LLA; 0A32 0A3C +GURMUKHI SEQUENCE FOR LETTER SHA; 0A38 0A3C +GURMUKHI SEQUENCE FOR LETTER KHHA; 0A16 0A3C +GURMUKHI SEQUENCE FOR LETTER GHHA; 0A17 0A3C +GURMUKHI SEQUENCE FOR LETTER ZA; 0A1C 0A3C +GURMUKHI SEQUENCE FOR LETTER FA; 0A2B 0A3C +ORIYA SEQUENCE FOR LETTER RRA; 0B21 0B3C +ORIYA SEQUENCE FOR LETTER RHA; 0B22 0B3C + # Entry for a Bangla entity. # Provisional 2009-08-10, Approved 2010-05-14 # @@ -180,7 +209,7 @@ BENGALI LETTER KHINYA;0995 09CD 09B7 # # A visual display of the Tamil named character sequences is available # in the documentation for the Unicode Standard. See Section 12.6, Tamil in -# http://www.unicode.org/versions/latest/ +# https://www.unicode.org/versions/latest/ TAMIL CONSONANT K; 0B95 0BCD TAMIL CONSONANT NG; 0B99 0BCD diff --git a/lib/unicore/NamedSqProv.txt b/lib/unicore/NamedSqProv.txt index a4e4fdc2e4..6c74798e65 100644 --- a/lib/unicore/NamedSqProv.txt +++ b/lib/unicore/NamedSqProv.txt @@ -1,10 +1,10 @@ -# NamedSequencesProv-13.0.0.txt -# Date: 2020-01-22, 19:32:00 GMT [KW, LI] -# © 2020 Unicode®, Inc. 
-# For terms of use, see http://www.unicode.org/terms_of_use.html +# NamedSequencesProv-14.0.0.txt +# Date: 2021-08-03, 23:04:00 GMT [KW] +# © 2021 Unicode®, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Provisional Unicode Named Character Sequences # @@ -29,7 +29,7 @@ # <1000, 1001, 1002> # # For more information, see UAX #34: Unicode Named Character -# Sequences, at http://www.unicode.org/unicode/reports/tr34/ +# Sequences, at https://www.unicode.org/reports/tr34/ # # Note: The order of entries in this file is not significant. # However, entries are generally in script order corresponding @@ -40,34 +40,7 @@ # Provisional entries for NamedSequences.txt. -# Entries that correspond to Indic characters with nuktas -# that are also listed in CompositionExclusions.txt. -# These characters decompose for normalized text, even -# in NFC. Having named sequences for these helps in -# certain specifications, including Label Generation Rules (LGR) -# for Internationalized Domain Names (IDN). 
-# -# Provisional 2020-01-16 - -DEVANAGARI SEQUENCE FOR LETTER QA; 0915 093C -DEVANAGARI SEQUENCE FOR LETTER KHHA; 0916 093C -DEVANAGARI SEQUENCE FOR LETTER GHHA; 0917 093C -DEVANAGARI SEQUENCE FOR LETTER ZA; 091C 093C -DEVANAGARI SEQUENCE FOR LETTER DDDHA; 0921 093C -DEVANAGARI SEQUENCE FOR LETTER RHA; 0922 093C -DEVANAGARI SEQUENCE FOR LETTER FA; 092B 093C -DEVANAGARI SEQUENCE FOR LETTER YYA; 092F 093C -BENGALI SEQUENCE FOR LETTER RRA; 09A1 09BC -BENGALI SEQUENCE FOR LETTER RHA; 09A2 09BC -BENGALI SEQUENCE FOR LETTER YYA; 09AF 09BC -GURMUKHI SEQUENCE FOR LETTER LLA; 0A32 0A3C -GURMUKHI SEQUENCE FOR LETTER SHA; 0A38 0A3C -GURMUKHI SEQUENCE FOR LETTER KHHA; 0A16 0A3C -GURMUKHI SEQUENCE FOR LETTER GHHA; 0A17 0A3C -GURMUKHI SEQUENCE FOR LETTER ZA; 0A1C 0A3C -GURMUKHI SEQUENCE FOR LETTER FA; 0A2B 0A3C -ORIYA SEQUENCE FOR LETTER RRA; 0B21 0B3C -ORIYA SEQUENCE FOR LETTER RHA; 0B22 0B3C +# No provisional entries are currently defined. # ================================================ diff --git a/lib/unicore/NamesList.txt b/lib/unicore/NamesList.txt index 6b856885b8..a5618d9e13 100644 --- a/lib/unicore/NamesList.txt +++ b/lib/unicore/NamesList.txt @@ -1,28 +1,15 @@ ; charset=UTF-8 -@@@ The Unicode Standard 13.0.0 -@@@+ U13M200203.lst - Unicode 13.0.0 names list, eighth delta. - Repertoire synched with UnicodeData-13.0.0d6.txt - Eighth delta of annotation fixes. - Added xrefs for 27C7, 27D1, 2227, 2228. Adjusted subhead for 27C7. - Updated aliases for 26A5, 26A4, 26A2, 263F. - Updated subheads and annotations for 1DF8 through 1DFB. - Updated title of UTR #54 in notice at 1800. - Added xref to 202F for 0020. - Added annotations about abbreviations for 2066 through 2069 for consistency. - Separated aliases for 0009 and 000A onto separate lines. - Removed superfluous xrefs for 2011. - Adjusted subheads for 2028 and 202A. - Added notices for the sets of composition exclusions in four Indic scripts. - Added xrefs for 029C, 1D34, 1D78, A7F8 and a notice at A7F8. 
+@@@ The Unicode Standard 14.0.0 +@@@+ U14M210804.lst + Unicode 14.0.0 final names list. This file is semi-automatically derived from UnicodeData.txt and a set of manually created annotations using a script to select or suppress information from the data file. The rules used for this process are aimed at readability for the human reader, at the expense of some details; therefore, this file should not be parsed for machine-readable information. -@+ © 2020 Unicode®, Inc. - For terms of use, see http://www.unicode.org/terms_of_use.html +@+ © 2021 Unicode®, Inc. + For terms of use, see https://www.unicode.org/terms_of_use.html @@ 0000 C0 Controls and Basic Latin (Basic Latin) 007F @@+ @ C0 controls @@ -112,6 +99,9 @@ x (zero width space - 200B) x (narrow no-break space - 202F) x (word joiner - 2060) + x (symbol for space - 2420) + x (blank symbol - 2422) + x (open box - 2423) x (ideographic space - 3000) x (zero width no-break space - FEFF) 0021 EXCLAMATION MARK @@ -121,27 +111,42 @@ x (latin letter retroflex click - 01C3) x (double exclamation mark - 203C) x (interrobang - 203D) + x (warning sign - 26A0) + x (heavy exclamation mark symbol - 2757) x (heavy exclamation mark ornament - 2762) + x (medieval exclamation mark - 2E53) + x (modifier letter raised exclamation mark - A71D) 0022 QUOTATION MARK + = double quote * neutral (vertical), used as opening or closing quotation mark * preferred characters in English for paired quotation marks are 201C & 201D * 05F4 is preferred for gershayim when writing Hebrew x (modifier letter double prime - 02BA) + x (double acute accent - 02DD) + x (modifier letter double apostrophe - 02EE) x (combining double acute accent - 030B) x (combining double vertical line above - 030E) x (hebrew punctuation gershayim - 05F4) + x (left double quotation mark - 201C) + x (right double quotation mark - 201D) x (double prime - 2033) x (ditto mark - 3003) 0023 NUMBER SIGN - = pound sign, hash, crosshatch, octothorpe + = pound sign (weight) + = 
hashtag, hash + = crosshatch, octothorpe + * for denoting musical sharp 266F is preferred x (l b bar symbol - 2114) + x (numero sign - 2116) x (viewdata square - 2317) x (music sharp sign - 266F) + x (equals sign and slanted parallel - 29E3) 0024 DOLLAR SIGN = milréis, escudo * used for many peso currencies in Latin America and elsewhere * glyph may have one or two vertical bars * other currency symbol characters start at 20A0 + x (cent sign - 00A2) x (currency sign - 00A4) x (peso sign - 20B1) x (heavy dollar sign - 1F4B2) @@ -151,11 +156,14 @@ x (per ten thousand sign - 2031) x (commercial minus sign - 2052) 0026 AMPERSAND + = and + * originally derived from a ligature of 'e' and 't' x (tironian sign et - 204A) x (turned ampersand - 214B) x (heavy ampersand ornament - 1F674) 0027 APOSTROPHE = apostrophe-quote (1.0) + = single quote = APL quote * neutral (vertical) glyph with mixed usage * 2019 is preferred for apostrophe @@ -165,7 +173,10 @@ x (modifier letter apostrophe - 02BC) x (modifier letter vertical line - 02C8) x (combining acute accent - 0301) + x (combining vertical line above - 030D) x (hebrew punctuation geresh - 05F3) + x (left single quotation mark - 2018) + x (right single quotation mark - 2019) x (prime - 2032) x (latin small letter saltillo - A78C) 0028 LEFT PARENTHESIS @@ -174,43 +185,65 @@ = closing parenthesis (1.0) * see discussion on semantics of paired bracketing characters 002A ASTERISK - = star (on phone keypads) + = star + * can have five or six spokes x (arabic five pointed star - 066D) + x (asterism - 2042) x (low asterisk - 204E) + x (two asterisks aligned vertically - 2051) + x (combining asterisk above - 20F0) x (asterisk operator - 2217) x (sextile - 26B9) x (heavy asterisk - 2731) + x (slavonic asterisk - A673) + x (medium six spoked asterisk - 1F7B6) +@ ASCII math operator 002B PLUS SIGN + x (modifier letter plus sign - 02D6) + x (minus sign - 2212) x (heavy plus sign - 2795) + x (hebrew letter alternative plus sign - FB29) + x 
(light greek cross - 1F7A2) +@ ASCII punctuation 002C COMMA = decimal separator x (arabic comma - 060C) + x (arabic decimal separator - 066B) x (single low-9 quotation mark - 201A) x (reversed comma - 2E41) x (medieval comma - 2E4C) x (ideographic comma - 3001) 002D HYPHEN-MINUS - = hyphen or minus sign - * used for either hyphen or minus sign + = hyphen, dash + = minus sign + * used generically for hyphen, minus sign or en dash, all of which have dedicated alternatives + x (soft hyphen - 00AD) + x (modifier letter minus sign - 02D7) x (hyphen - 2010) x (non-breaking hyphen - 2011) x (figure dash - 2012) x (en dash - 2013) + x (hyphenation point - 2027) x (hyphen bullet - 2043) x (minus sign - 2212) x (roman uncia sign - 10191) 002E FULL STOP = period, dot, decimal point + * the use as decimal point is locale dependent * may be rendered as a raised decimal point in old style numbers x (arabic full stop - 06D4) + x (one dot leader - 2024) + x (horizontal ellipsis - 2026) + x (raised dot - 2E33) x (stenographic full stop - 2E3C) x (ideographic full stop - 3002) 002F SOLIDUS - = slash, virgule - x (latin letter dental click - 01C0) + = slash,forward slash, virgule x (combining long solidus overlay - 0338) x (fraction slash - 2044) x (division slash - 2215) + x (mathematical rising diagonal - 27CB) + x (big solidus - 29F8) x (dotted solidus - 2E4A) @ ASCII digits 0030 DIGIT ZERO @@ -224,41 +257,65 @@ 0037 DIGIT SEVEN 0038 DIGIT EIGHT 0039 DIGIT NINE -@ ASCII punctuation and symbols +@ ASCII punctuation 003A COLON * also used to denote division or scale; for that mathematical use 2236 is preferred + * in Finnish and Swedish, also used as intra-word punctation (abbreviation mark) + x (modifier letter triangular colon - 02D0) + x (modifier letter raised colon - 02F8) x (armenian full stop - 0589) x (hebrew punctuation sof pasuq - 05C3) + x (ethiopic wordspace - 1361) + x (ethiopic colon - 1365) + x (two dot punctuation - 205A) + x (tricolon - 205D) x (ratio - 2236) x 
(modifier letter colon - A789) + x (presentation form for vertical two dot leader - FE30) 003B SEMICOLON * this, and not 037E, is the preferred character for 'Greek question mark' x (greek question mark - 037E) x (arabic semicolon - 061B) x (reversed semicolon - 204F) + x (turned semicolon - 2E35) +@ ASCII mathematical operators +@+ Other mathematical operators start at 2200. 003C LESS-THAN SIGN + * paired with 003E for ASCII-based angle bracket markup conventions + x (modifier letter left arrowhead - 02C2) x (single left-pointing angle quotation mark - 2039) x (left-pointing angle bracket - 2329) x (mathematical left angle bracket - 27E8) x (left angle bracket - 3008) 003D EQUALS SIGN * other related characters: 2241-2263 + x (canadian syllabics hyphen - 1400) + x (almost equal to - 2248) x (not equal to - 2260) x (identical to - 2261) + x (double hyphen - 2E40) + x (katakana-hiragana double hyphen - 30A0) x (modifier letter short equals sign - A78A) x (roman sextans sign - 10190) + x (heavy equals sign - 1F7F0) 003E GREATER-THAN SIGN + x (modifier letter right arrowhead - 02C3) x (single right-pointing angle quotation mark - 203A) x (right-pointing angle bracket - 232A) x (mathematical right angle bracket - 27E9) x (right angle bracket - 3009) +@ ASCII punctuation 003F QUESTION MARK x (inverted question mark - 00BF) x (greek question mark - 037E) x (arabic question mark - 061F) x (interrobang - 203D) - x (question exclamation mark - 2048) - x (exclamation question mark - 2049) + x (double question mark - 2047) + x (black question mark ornament - 2753) + x (uncertainty sign - 2BD1) + x (reversed question mark - 2E2E) + x (medieval question mark - 2E54) + x (replacement character - FFFD) 0040 COMMERCIAL AT = at sign @ Uppercase Latin alphabet @@ -267,12 +324,16 @@ x (script capital b - 212C) 0043 LATIN CAPITAL LETTER C x (double-struck capital c - 2102) + x (degree celsius - 2103) x (black-letter capital c - 212D) + x (roman numeral one hundred - 216D) 0044 LATIN 
CAPITAL LETTER D + x (roman numeral five hundred - 216E) 0045 LATIN CAPITAL LETTER E x (euler constant - 2107) x (script capital e - 2130) 0046 LATIN CAPITAL LETTER F + x (degree fahrenheit - 2109) x (script capital f - 2131) x (turned capital f - 2132) 0047 LATIN CAPITAL LETTER G @@ -283,8 +344,6 @@ 0049 LATIN CAPITAL LETTER I * Turkish and Azerbaijani use 0131 for lowercase x (latin capital letter i with dot above - 0130) - x (cyrillic capital letter byelorussian-ukrainian i - 0406) - x (cyrillic letter palochka - 04C0) x (script capital i - 2110) x (black-letter capital i - 2111) x (roman numeral one - 2160) @@ -295,13 +354,16 @@ x (script capital l - 2112) 004D LATIN CAPITAL LETTER M x (script capital m - 2133) + x (roman numeral one thousand - 216F) 004E LATIN CAPITAL LETTER N x (double-struck capital n - 2115) 004F LATIN CAPITAL LETTER O 0050 LATIN CAPITAL LETTER P + x (script capital p - 2118) x (double-struck capital p - 2119) 0051 LATIN CAPITAL LETTER Q x (double-struck capital q - 211A) + x (rotated capital q - 213A) 0052 LATIN CAPITAL LETTER R x (script capital r - 211B) x (black-letter capital r - 211C) @@ -313,6 +375,7 @@ x (roman numeral five - 2164) 0057 LATIN CAPITAL LETTER W 0058 LATIN CAPITAL LETTER X + x (roman numeral ten - 2169) 0059 LATIN CAPITAL LETTER Y 005A LATIN CAPITAL LETTER Z x (double-struck capital z - 2124) @@ -325,10 +388,13 @@ = backslash x (combining reverse solidus overlay - 20E5) x (set minus - 2216) + x (mathematical falling diagonal - 27CD) + x (big reverse solidus - 29F9) 005D RIGHT SQUARE BRACKET = closing square bracket (1.0) 005E CIRCUMFLEX ACCENT * this is a spacing character + * used in ASCII-based representation of exponentiation x (modifier letter up arrowhead - 02C4) x (modifier letter circumflex accent - 02C6) x (combining circumflex accent - 0302) @@ -337,10 +403,12 @@ 005F LOW LINE = spacing underscore (1.0) * this is a spacing character + * joins with adjacent instances of itself x (modifier letter low macron - 
02CD) x (combining macron below - 0331) x (combining low line - 0332) x (double low line - 2017) + x (combining conjoining macron below - FE2D) 0060 GRAVE ACCENT * this is a spacing character x (modifier letter grave accent - 02CB) @@ -354,6 +422,7 @@ 0065 LATIN SMALL LETTER E x (estimated symbol - 212E) x (script small e - 212F) + x (latin small letter blackletter e - AB32) 0066 LATIN SMALL LETTER F 0067 LATIN SMALL LETTER G x (latin small letter script g - 0261) @@ -364,6 +433,7 @@ 0069 LATIN SMALL LETTER I * Turkish and Azerbaijani use 0130 for uppercase x (latin small letter dotless i - 0131) + x (superscript latin small letter i - 2071) x (mathematical italic small dotless i - 1D6A4) 006A LATIN SMALL LETTER J x (latin small letter dotless j - 0237) @@ -377,15 +447,18 @@ x (superscript latin small letter n - 207F) 006F LATIN SMALL LETTER O x (script small o - 2134) + x (latin small letter blackletter o - AB3D) 0070 LATIN SMALL LETTER P 0071 LATIN SMALL LETTER Q 0072 LATIN SMALL LETTER R 0073 LATIN SMALL LETTER S + x (latin small letter long s - 017F) 0074 LATIN SMALL LETTER T 0075 LATIN SMALL LETTER U 0076 LATIN SMALL LETTER V 0077 LATIN SMALL LETTER W 0078 LATIN SMALL LETTER X + x (multiplication sign - 00D7) 0079 LATIN SMALL LETTER Y 007A LATIN SMALL LETTER Z x (latin small letter z with stroke - 01B6) @@ -394,10 +467,14 @@ = opening curly bracket (1.0) = left brace 007C VERTICAL LINE - = vertical bar + = vertical bar, pipe * used in pairs to indicate absolute value + * also used as an unpaired separator or as a fence + x (broken bar - 00A6) x (latin letter dental click - 01C0) x (hebrew punctuation paseq - 05C0) + x (devanagari danda - 0964) + x (combining long vertical line overlay - 20D2) x (divides - 2223) x (light vertical bar - 2758) 007D RIGHT CURLY BRACKET @@ -407,8 +484,12 @@ * this is a spacing character x (small tilde - 02DC) x (combining tilde - 0303) + x (combining tilde overlay - 0334) x (swung dash - 2053) x (tilde operator - 223C) + x (tilde 
with ring above - 2E1B) + x (vertical tilde - 2E2F) + x (wave dash - 301C) x (fullwidth tilde - FF5E) @ Control character 007F @@ -488,30 +569,42 @@ x (figure space - 2007) x (narrow no-break space - 202F) x (word joiner - 2060) + x (shouldered open box - 237D) x (zero width no-break space - FEFF) # 0020 00A1 INVERTED EXCLAMATION MARK * Spanish, Asturian, Galician + * used in extended IPA to represent sublaminal lower alveolar percussive x (exclamation mark - 0021) + x (modifier letter raised inverted exclamation mark - A71E) 00A2 CENT SIGN + x (latin small letter c with stroke - 023C) + x (mill sign - 20A5) + x (cedi sign - 20B5) + x (musical symbol cut time - 1D135) 00A3 POUND SIGN - = pound sterling, Irish punt, Italian lira, Turkish lira, etc. + = pound sterling, Irish punt, lira, etc. + * glyph may have one or two crossbars, in distinction from 20A4 x (lira sign - 20A4) x (turkish lira sign - 20BA) x (roman semuncia sign - 10192) 00A4 CURRENCY SIGN - * other currency symbol characters: 20A0-20BF + * generic or unknown currency + * other currency symbol characters start at 20A0 x (dollar sign - 0024) 00A5 YEN SIGN - = yuan sign + = yuan sign (renminbi) * glyph may have one or two crossbars, but the official symbol in Japan and China has two + * in native context, specific ideographs may be used for units of these currencies x 5143 x 5186 00A6 BROKEN BAR = broken vertical bar (1.0) = parted rule (in typography) + x (vertical line - 007C) 00A7 SECTION SIGN - * paragraph sign in some European usage + * used in referencing numbered sections or paragraphs + x (top half section sign - 2E39) 00A8 DIAERESIS * this is a spacing character x (combining diaeresis - 0308) @@ -523,6 +616,7 @@ x (mask work symbol - 1F1AD) 00AA FEMININE ORDINAL INDICATOR * Spanish + x (modifier letter small a - 1D43) # 0061 00AB LEFT-POINTING DOUBLE ANGLE QUOTATION MARK = left guillemet @@ -533,26 +627,37 @@ 00AC NOT SIGN = angled dash (in typography) x (reversed not sign - 2310) + x (turned 
not sign - 2319) 00AD SOFT HYPHEN = discretionary hyphen * commonly abbreviated as SHY + * an invisible format character indicating a possible hyphenation location 00AE REGISTERED SIGN = registered trade mark sign (1.0) + x (trade mark sign - 2122) x (circled latin capital letter r - 24C7) + x (raised md sign - 1F16B) + x (raised mr sign - 1F16C) 00AF MACRON = overline, APL overbar * this is a spacing character + * unlike 203E, adjacent instances of this character do not join x (modifier letter macron - 02C9) x (combining macron - 0304) x (combining overline - 0305) + x (overline - 203E) + x (combining conjoining macron - FE26) # 0020 0304 00B0 DEGREE SIGN * this is a spacing character x (ring above - 02DA) x (combining ring above - 030A) x (superscript zero - 2070) + x (degree celsius - 2103) + x (degree fahrenheit - 2109) x (ring operator - 2218) 00B1 PLUS-MINUS SIGN + = biquintile (astrological aspect: 144°) x (minus-or-plus sign - 2213) 00B2 SUPERSCRIPT TWO = squared @@ -568,6 +673,8 @@ x (modifier letter prime - 02B9) x (modifier letter acute accent - 02CA) x (combining acute accent - 0301) + x (greek tonos - 0384) + x (greek oxia - 1FFD) x (prime - 2032) # 0020 0301 00B5 MICRO SIGN @@ -583,6 +690,8 @@ = Georgian comma = Greek middle dot (ano teleia) * also used as a raised decimal point or to denote multiplication; for multiplication 22C5 is preferred + x (full stop - 002E) + x (dot above - 02D9) x (greek ano teleia - 0387) x (runic single punctuation - 16EB) x (bullet - 2022) @@ -602,9 +711,12 @@ 00B9 SUPERSCRIPT ONE x (superscript two - 00B2) x (superscript three - 00B3) + x (superscript zero - 2070) # 0031 00BA MASCULINE ORDINAL INDICATOR * Spanish + x (modifier letter small o - 1D52) + x (numero sign - 2116) # 006F 00BB RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK = right guillemet @@ -663,6 +775,7 @@ * lowercase is 00F0 x (latin capital letter d with stroke - 0110) x (latin capital letter african d - 0189) + x (latin capital letter d with short stroke 
overlay - A7C7) 00D1 LATIN CAPITAL LETTER N WITH TILDE : 004E 0303 00D2 LATIN CAPITAL LETTER O WITH GRAVE @@ -678,9 +791,14 @@ @ Mathematical operator 00D7 MULTIPLICATION SIGN = z notation Cartesian product + x (latin small letter x - 0078) + x (saltire - 2613) x (multiplication x - 2715) + x (heavy ballot x - 2718) x (cross mark - 274C) x (vector or cross product - 2A2F) + x (cancellation x - 1F5D9) + x (light saltire - 1F7A9) @ Letters 00D8 LATIN CAPITAL LETTER O WITH STROKE = o slash @@ -700,9 +818,12 @@ = Eszett * German * not used in Swiss High German - * uppercase is "SS" or 1E9E + * uppercase is "SS" (standard case mapping), alternatively 1E9E * typographically the glyph for this character can be based on a ligature of 017F with either 0073 or with an old-style glyph for 007A (the latter similar in appearance to 0292). Both forms exist interchangeably today. + x (latin small letter long s - 017F) + x (latin small letter ezh - 0292) x (greek small letter beta - 03B2) + x (latin capital letter sharp s - 1E9E) 00E0 LATIN SMALL LETTER A WITH GRAVE : 0061 0300 00E1 LATIN SMALL LETTER A WITH ACUTE @@ -745,6 +866,7 @@ 00F0 LATIN SMALL LETTER ETH * Icelandic, Faroese, Old English, IPA * uppercase is 00D0 + x (latin small letter d with stroke - 0111) x (greek small letter delta - 03B4) x (partial differential - 2202) 00F1 LATIN SMALL LETTER N WITH TILDE @@ -763,7 +885,7 @@ @ Mathematical operator 00F7 DIVISION SIGN = obelus - * occasionally used as an alternate, more visually distinct version of 2212 or 2011 in some contexts + * occasionally used as an alternate, more visually distinct shape for a hyphen in some contexts * historically used as a punctuation mark to denote questionable passages in manuscripts x (syriac harklean obelus - 070B) x (commercial minus sign - 2052) @@ -772,6 +894,8 @@ x (divides - 2223) x (ratio - 2236) x (heavy division sign - 2797) + x (long division - 27CC) + x (dotted obelos - 2E13) @ Letters 00F8 LATIN SMALL LETTER O WITH STROKE = o 
slash @@ -1543,7 +1667,7 @@ : 00D8 0301 01FF LATIN SMALL LETTER O WITH STROKE AND ACUTE : 00F8 0301 -@ Additions for Slovenian and Croatian +@ Additions for Slovenian 0200 LATIN CAPITAL LETTER A WITH DOUBLE GRAVE : 0041 030F 0201 LATIN SMALL LETTER A WITH DOUBLE GRAVE @@ -2090,7 +2214,7 @@ # 0079 @ Miscellaneous phonetic modifiers 02B9 MODIFIER LETTER PRIME - * primary stress, emphasis + * stress, emphasis * transliteration of mjagkij znak (Cyrillic soft sign: palatalization) * transliteration of Hebrew geresh x (apostrophe - 0027) @@ -2431,6 +2555,7 @@ 031F COMBINING PLUS SIGN BELOW * IPA: advanced or fronted articulation x (modifier letter plus sign - 02D6) + x (combining plus sign above - 1AC8) 0320 COMBINING MINUS SIGN BELOW * IPA: retracted or backed articulation * glyph may have small end-serifs @@ -2477,6 +2602,7 @@ 032B COMBINING INVERTED DOUBLE ARCH BELOW * IPA: labialization x (modifier letter small w - 02B7) + x (combining inverted double arch above - 1AC7) 032C COMBINING CARON BELOW * IPA: voiced 032D COMBINING CIRCUMFLEX ACCENT BELOW @@ -2961,6 +3087,7 @@ 0416 CYRILLIC CAPITAL LETTER ZHE 0417 CYRILLIC CAPITAL LETTER ZE 0418 CYRILLIC CAPITAL LETTER I +@+ This letter is also used to represent electrolarynx phonation in the Voice Quality Symbols for extended IPA. 0419 CYRILLIC CAPITAL LETTER SHORT I : 0418 0306 041A CYRILLIC CAPITAL LETTER KA @@ -3365,6 +3492,7 @@ 04FF CYRILLIC SMALL LETTER HA WITH STROKE @@ 0500 Cyrillic Supplement 052F @ Komi letters +@+ These letters are for the obsolete Molodtsov alphabet, used in the 1920s. 0500 CYRILLIC CAPITAL LETTER KOMI DE 0501 CYRILLIC SMALL LETTER KOMI DE 0502 CYRILLIC CAPITAL LETTER KOMI DJE @@ -3427,9 +3555,10 @@ 0528 CYRILLIC CAPITAL LETTER EN WITH LEFT HOOK 0529 CYRILLIC SMALL LETTER EN WITH LEFT HOOK @ Komi letters +@+ These are obsolete letters attested in a 19th century grammar of Komi. 
052A CYRILLIC CAPITAL LETTER DZZHE 052B CYRILLIC SMALL LETTER DZZHE - * also used for Ossetian + * also used for Ossetian until 1924 052C CYRILLIC CAPITAL LETTER DCHE 052D CYRILLIC SMALL LETTER DCHE @ Khanty letters @@ -3741,15 +3870,18 @@ * represents sallallahu alayhe wasallam "may God's peace and blessings be upon him" 0611 ARABIC SIGN ALAYHE ASSALLAM * represents alayhe assalam "upon him be peace" + x (arabic ligature alayhi as-salaam - FD47) 0612 ARABIC SIGN RAHMATULLAH ALAYHE * represents rahmatullah alayhe "may God have mercy upon him" + x (arabic ligature rahimahu allaah - FD40) 0613 ARABIC SIGN RADI ALLAHOU ANHU * represents radi allahu 'anhu "may God be pleased with him" + x (arabic ligature radi allaahu anh - FD41) 0614 ARABIC SIGN TAKHALLUS * sign placed over the name or nom-de-plume of a poet, or in some writings used to mark all proper names @ Quranic annotation sign 0615 ARABIC SMALL HIGH TAH - * marks a recommended pause position in some Korans published in Iran and Pakistan + * marks a recommended pause position in some Qurans published in Iran and Pakistan * should not be confused with the small TAH sign used as a diacritic for some letters such as 0679 @ Extended Arabic mark 0616 ARABIC SMALL HIGH LIGATURE ALEF WITH LAM WITH YEH @@ -3773,6 +3905,7 @@ * commonly abbreviated ALM x (right-to-left mark - 200F) @ Punctuation +061D ARABIC END OF TEXT MARK 061E ARABIC TRIPLE DOT PUNCTUATION MARK 061F ARABIC QUESTION MARK * also used with Thaana and Syriac in modern text @@ -3793,6 +3926,7 @@ 0625 ARABIC LETTER ALEF WITH HAMZA BELOW : 0627 0655 0626 ARABIC LETTER YEH WITH HAMZA ABOVE + * in Kyrgyz the hamza is consistently positioned to the top right in isolate and final forms : 064A 0654 0627 ARABIC LETTER ALEF 0628 ARABIC LETTER BEH @@ -3833,6 +3967,7 @@ 0643 ARABIC LETTER KAF 0644 ARABIC LETTER LAM 0645 ARABIC LETTER MEEM + * Sindhi uses a shape with a short tail 0646 ARABIC LETTER NOON 0647 ARABIC LETTER HEH 0648 ARABIC LETTER WAW @@ -3855,11 
+3990,15 @@ 0651 ARABIC SHADDA 0652 ARABIC SUKUN * marks absence of a vowel after the base consonant - * used in some Korans to mark a long vowel as ignored + * used in some Qurans to mark a long vowel as ignored * can have a variety of shapes, including a circular one and a shape that looks like '06E1' x (arabic small high dotless head of khah - 06E1) @ Combining maddah and hamza 0653 ARABIC MADDAH ABOVE + * used for madd jaa'iz in South Asian and Indonesian orthographies + x (arabic madda waajib - 089C) + x (arabic doubled madda - 089E) + x (arabic half madda over madda - 089F) 0654 ARABIC HAMZA ABOVE * restricted to hamza and ezafe semantics * is not used as a diacritic to form new letters @@ -3925,22 +4064,21 @@ * Kashmiri * this character is deprecated and its use is strongly discouraged * use the sequence 0627 065F instead -@ Extended Arabic letters +@ High hamza 0674 ARABIC LETTER HIGH HAMZA - * Kazakh + * Kazakh, Jawi * forms digraphs +@ Digraphic letters for Kazakh +@+ Use of these characters is discouraged. They were encoded for Kazakh digraphs, but their decompositions do not reflect the preferred order of representation. 
0675 ARABIC LETTER HIGH HAMZA ALEF - * Kazakh # 0627 0674 0676 ARABIC LETTER HIGH HAMZA WAW - * Kazakh # 0648 0674 0677 ARABIC LETTER U WITH HAMZA ABOVE - * Kazakh # 06C7 0674 0678 ARABIC LETTER HIGH HAMZA YEH - * Kazakh # 064A 0674 +@ Extended Arabic letters 0679 ARABIC LETTER TTEH * Urdu 067A ARABIC LETTER TTEHEH @@ -4039,7 +4177,7 @@ 06A6 ARABIC LETTER PEHEH * Sindhi 06A7 ARABIC LETTER QAF WITH DOT ABOVE - * Maghrib Arabic, Uighur + * Maghrib Arabic, Uyghur 06A8 ARABIC LETTER QAF WITH THREE DOTS ABOVE * Tunisian Arabic 06A9 ARABIC LETTER KEHEH @@ -4054,9 +4192,10 @@ * use for the Jawi gaf is not recommended, although it may be found in some existing text data; recommended character for Jawi gaf is 0762 x (arabic letter keheh with dot above - 0762) 06AD ARABIC LETTER NG - * Uighur, Kazakh, Moroccan Arabic, early Jawi, early Persian, ... + * Uyghur, Kazakh, Moroccan Arabic, early Jawi, early Persian, ... 06AE ARABIC LETTER KAF WITH THREE DOTS BELOW * Berber, early Persian + * Pegon alternative for 068A 06AF ARABIC LETTER GAF * Persian, Urdu, ... 
06B0 ARABIC LETTER GAF WITH RING @@ -4088,7 +4227,7 @@ * Jawi 06BE ARABIC LETTER HEH DOACHASHMEE * forms aspirate digraphs in Urdu and other languages of South Asia - * represents the glottal fricative /h/ in Uighur + * represents the glottal fricative /h/ in Uyghur 06BF ARABIC LETTER TCHEH WITH DOT ABOVE 06C0 ARABIC LETTER HEH WITH YEH ABOVE = arabic letter hamzah on ha (1.0) @@ -4106,19 +4245,20 @@ 06C4 ARABIC LETTER WAW WITH RING * Kashmiri 06C5 ARABIC LETTER KIRGHIZ OE - * Kirghiz + * Kyrgyz + * a glyph variant occurs which replaces the looped tail with a horizontal bar through the tail 06C6 ARABIC LETTER OE - * Uighur, Kurdish, Kazakh, Azerbaijani, Bosnian + * Uyghur, Kurdish, Kazakh, Azerbaijani, Bosnian 06C7 ARABIC LETTER U - * Kirghiz, Azerbaijani + * Azerbaijani, Kazakh, Kyrgyz, Uyghur 06C8 ARABIC LETTER YU - * Uighur + * Uyghur 06C9 ARABIC LETTER KIRGHIZ YU - * Kazakh, Kirghiz, Bosnian + * Kazakh, Kyrgyz, Bosnian 06CA ARABIC LETTER WAW WITH TWO DOTS ABOVE * Kurdish 06CB ARABIC LETTER VE - * Uighur, Kazakh + * Uyghur, Kazakh 06CC ARABIC LETTER FARSI YEH * Arabic, Persian, Urdu, Kashmiri, ... 
* initial and medial forms of this letter have dots @@ -4130,7 +4270,7 @@ * Kurdish 06CF ARABIC LETTER WAW WITH DOT ABOVE 06D0 ARABIC LETTER E - * Pashto, Uighur + * Pashto, Uyghur * used as the letter bbeh in Sindhi 06D1 ARABIC LETTER YEH WITH THREE DOTS BELOW * Mende languages, Hausa @@ -4145,7 +4285,7 @@ * Urdu @ Extended Arabic letter 06D5 ARABIC LETTER AE - * Uighur, Kazakh, Kirghiz + * Uyghur, Kazakh, Kyrgyz @ Quranic annotation signs 06D6 ARABIC SMALL HIGH LIGATURE SAD WITH LAM WITH ALEF MAKSURA 06D7 ARABIC SMALL HIGH LIGATURE QAF WITH LAM WITH ALEF MAKSURA @@ -4159,10 +4299,11 @@ 06DF ARABIC SMALL HIGH ROUNDED ZERO * smaller than the typical circular shape used for 0652 06E0 ARABIC SMALL HIGH UPRIGHT RECTANGULAR ZERO + * the term "rectangular zero" is a translation of the Arabic name of this sign 06E1 ARABIC SMALL HIGH DOTLESS HEAD OF KHAH = Arabic jazm * presentation form of 0652, using font technology to select the variant is preferred - * used in some Korans to mark absence of a vowel + * used in some Qurans to mark absence of a vowel x (arabic sukun - 0652) 06E2 ARABIC SMALL HIGH MEEM ISOLATED FORM 06E3 ARABIC SMALL LOW SEEN @@ -4308,6 +4449,7 @@ @ Syriac marks 0740 SYRIAC FEMININE DOT * feminine marker used with the Taw feminine suffix + x (combining dot above left - 1DF8) 0741 SYRIAC QUSHSHAYA * indicates a plosive pronunciation 0742 SYRIAC RUKKAKHA @@ -4701,6 +4843,63 @@ x (malayalam letter llla - 0D34) 086A SYRIAC LETTER MALAYALAM SSA x (malayalam letter ssa - 0D37) +@@ 0870 Arabic Extended-B 089F +@ Additions for Quranic orthographies +0870 ARABIC LETTER ALEF WITH ATTACHED FATHA +0871 ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA +0872 ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE +0873 ARABIC LETTER ALEF WITH LEFT MIDDLE STROKE +0874 ARABIC LETTER ALEF WITH ATTACHED KASRA +0875 ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA +0876 ARABIC LETTER ALEF WITH ATTACHED ROUND DOT ABOVE +0877 ARABIC LETTER ALEF WITH ATTACHED RIGHT ROUND DOT +0878 
ARABIC LETTER ALEF WITH ATTACHED LEFT ROUND DOT +0879 ARABIC LETTER ALEF WITH ATTACHED ROUND DOT BELOW +087A ARABIC LETTER ALEF WITH DOT ABOVE +087B ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA AND DOT ABOVE +087C ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE AND DOT ABOVE +087D ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND DOT ABOVE +087E ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA AND LEFT RING +087F ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE AND LEFT RING +0880 ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND LEFT RING +0881 ARABIC LETTER ALEF WITH ATTACHED RIGHT HAMZA +0882 ARABIC LETTER ALEF WITH ATTACHED LEFT HAMZA +0883 ARABIC TATWEEL WITH OVERSTRUCK HAMZA +0884 ARABIC TATWEEL WITH OVERSTRUCK WAW +0885 ARABIC TATWEEL WITH TWO DOTS BELOW +0886 ARABIC LETTER THIN YEH + * no final or isolated forms are attested +0887 ARABIC BASELINE ROUND DOT +0888 ARABIC RAISED ROUND DOT +@ Additions for Bosnian orthographies +0889 ARABIC LETTER NOON WITH INVERTED SMALL V +088A ARABIC LETTER HAH WITH INVERTED SMALL V BELOW +@ Additions for Pegon orthographies +088B ARABIC LETTER TAH WITH DOT BELOW + * Pegon, Malagasy +088C ARABIC LETTER TAH WITH THREE DOTS BELOW + * Pegon alternative for 088B +088D ARABIC LETTER KEHEH WITH TWO DOTS VERTICALLY BELOW + * Sundanese Pegon +@ Abbreviation mark +088E ARABIC VERTICAL TAIL + * mark used to indicate abbreviations in early movable type texts from Iran + * only attested in final form +@ Supertending currency symbols +0890 ARABIC POUND MARK ABOVE + * Egyptian pound +0891 ARABIC PIASTRE MARK ABOVE + * Egyptian piastre +@ Additions for Quranic orthographies +0898 ARABIC SMALL HIGH WORD AL-JUZ +0899 ARABIC SMALL LOW WORD ISHMAAM +089A ARABIC SMALL LOW WORD IMAALA +089B ARABIC SMALL LOW WORD TASHEEL +089C ARABIC MADDA WAAJIB + x (arabic maddah above - 0653) +089D ARABIC SUPERSCRIPT ALEF MOKHASSAS +089E ARABIC DOUBLED MADDA +089F ARABIC HALF MADDA OVER MADDA @@ 08A0 Arabic Extended-A 08FF @ Arabic letters for African 
languages 08A0 ARABIC LETTER BEH WITH SMALL V BELOW @@ -4746,6 +4945,8 @@ @ Arabic letters for Arwi 08B3 ARABIC LETTER AIN WITH THREE DOTS BELOW 08B4 ARABIC LETTER KAF WITH DOT BELOW +@ Early Arabic letter +08B5 ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE @ Arabic letters for Bravanese 08B6 ARABIC LETTER BEH WITH SMALL MEEM ABOVE 08B7 ARABIC LETTER PEH WITH SMALL MEEM ABOVE @@ -4782,6 +4983,20 @@ 08C6 ARABIC LETTER JEEM WITH THREE DOTS BELOW @ Arabic letter for Punjabi 08C7 ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +@ Arabic letter for Balti +08C8 ARABIC LETTER GRAF +@ Additions for Quranic orthographies +08C9 ARABIC SMALL FARSI YEH +08CA ARABIC SMALL HIGH FARSI YEH +08CB ARABIC SMALL HIGH YEH BARREE WITH TWO DOTS BELOW +08CC ARABIC SMALL HIGH WORD SAH + = sign of waqf +08CD ARABIC SMALL HIGH ZAH +08CE ARABIC LARGE ROUND DOT ABOVE +08CF ARABIC LARGE ROUND DOT BELOW +08D0 ARABIC SUKUN BELOW +08D1 ARABIC LARGE CIRCLE BELOW +08D2 ARABIC LARGE ROUND DOT INSIDE CIRCLE BELOW @ Quranic annotation signs 08D3 ARABIC SMALL LOW WAW 08D4 ARABIC SMALL HIGH WORD AR-RUB @@ -4834,8 +5049,8 @@ 08F9 ARABIC LEFT ARROWHEAD BELOW 08FA ARABIC RIGHT ARROWHEAD BELOW 08FB ARABIC DOUBLE RIGHT ARROWHEAD ABOVE -08FC ARABIC DOUBLE RIGHT ARROWHEAD ABOVE WITH DOT * also used in Quranic text in African and other orthographies to represent dammatan +08FC ARABIC DOUBLE RIGHT ARROWHEAD ABOVE WITH DOT 08FD ARABIC RIGHT ARROWHEAD ABOVE WITH DOT @ Extended vowel signs 08FE ARABIC DAMMA WITH DOT @@ -5792,6 +6007,10 @@ 0C37 TELUGU LETTER SSA 0C38 TELUGU LETTER SA 0C39 TELUGU LETTER HA +@ Sign +0C3C TELUGU SIGN NUKTA + * used for Tamil transliteration and Perso-Arabic phonemes + * can also appear as a large dot, should be placed sufficiently below the baseline of a consonant to avoid confusion/collision with the aspiration marker @ Addition for Sanskrit 0C3D TELUGU SIGN AVAGRAHA @ Dependent vowel signs @@ -5820,6 +6039,11 @@ 0C59 TELUGU LETTER DZA 0C5A TELUGU LETTER RRRA * letter for an 
alveolar consonant whose exact phonetic value is not known +@ Consonant +0C5D TELUGU LETTER NAKAARA POLLU + * vowelless form of na + x (kannada letter nakaara pollu - 0CDD) + x (malayalam letter chillu n - 0D7B) @ Additional vowels for Sanskrit 0C60 TELUGU LETTER VOCALIC RR 0C61 TELUGU LETTER VOCALIC LL @@ -5949,6 +6173,10 @@ 0CD5 KANNADA LENGTH MARK 0CD6 KANNADA AI LENGTH MARK @ Additional consonants +0CDD KANNADA LETTER NAKAARA POLLU + * vowelless form of na + x (telugu letter nakaara pollu - 0C5D) + x (malayalam letter chillu n - 0D7B) 0CDE KANNADA LETTER FA % KANNADA LETTER LLLA * obsolete historic letter @@ -7759,9 +7987,12 @@ 1247 ETHIOPIC SYLLABLE QOA 1248 ETHIOPIC SYLLABLE QWA 124A ETHIOPIC SYLLABLE QWI + x (ethiopic syllable gurage qwi - 1E7F0) 124B ETHIOPIC SYLLABLE QWAA 124C ETHIOPIC SYLLABLE QWEE + x (ethiopic syllable gurage qwee - 1E7F1) 124D ETHIOPIC SYLLABLE QWE + x (ethiopic syllable gurage qwe - 1E7F2) 1250 ETHIOPIC SYLLABLE QHA 1251 ETHIOPIC SYLLABLE QHU 1252 ETHIOPIC SYLLABLE QHI @@ -7853,9 +8084,12 @@ 12AF ETHIOPIC SYLLABLE KOA 12B0 ETHIOPIC SYLLABLE KWA 12B2 ETHIOPIC SYLLABLE KWI + x (ethiopic syllable gurage kwi - 1E7F5) 12B3 ETHIOPIC SYLLABLE KWAA 12B4 ETHIOPIC SYLLABLE KWEE + x (ethiopic syllable gurage kwee - 1E7F6) 12B5 ETHIOPIC SYLLABLE KWE + x (ethiopic syllable gurage kwe - 1E7F7) 12B8 ETHIOPIC SYLLABLE KXA 12B9 ETHIOPIC SYLLABLE KXU 12BA ETHIOPIC SYLLABLE KXI @@ -7864,10 +8098,14 @@ 12BD ETHIOPIC SYLLABLE KXE 12BE ETHIOPIC SYLLABLE KXO 12C0 ETHIOPIC SYLLABLE KXWA + x (ethiopic syllable gurage hhwa - 1E7E8) 12C2 ETHIOPIC SYLLABLE KXWI + x (ethiopic syllable hhwi - 1E7E9) 12C3 ETHIOPIC SYLLABLE KXWAA 12C4 ETHIOPIC SYLLABLE KXWEE + x (ethiopic syllable hhwee - 1E7EA) 12C5 ETHIOPIC SYLLABLE KXWE + x (ethiopic syllable hhwe - 1E7EB) 12C8 ETHIOPIC SYLLABLE WA 12C9 ETHIOPIC SYLLABLE WU 12CA ETHIOPIC SYLLABLE WI @@ -7941,9 +8179,12 @@ 130F ETHIOPIC SYLLABLE GOA 1310 ETHIOPIC SYLLABLE GWA 1312 ETHIOPIC SYLLABLE GWI + x (ethiopic syllable 
gurage gwi - 1E7F8) 1313 ETHIOPIC SYLLABLE GWAA 1314 ETHIOPIC SYLLABLE GWEE + x (ethiopic syllable gurage gwee - 1E7F9) 1315 ETHIOPIC SYLLABLE GWE + x (ethiopic syllable gurage gwe - 1E7FA) 1318 ETHIOPIC SYLLABLE GGA 1319 ETHIOPIC SYLLABLE GGU 131A ETHIOPIC SYLLABLE GGI @@ -8050,22 +8291,30 @@ 137B ETHIOPIC NUMBER HUNDRED 137C ETHIOPIC NUMBER TEN THOUSAND @@ 1380 Ethiopic Supplement 139F -@ Syllables for Sebatbeit +@ Syllables for Gurage 1380 ETHIOPIC SYLLABLE SEBATBEIT MWA 1381 ETHIOPIC SYLLABLE MWI + x (ethiopic syllable gurage mwi - 1E7ED) 1382 ETHIOPIC SYLLABLE MWEE + x (ethiopic syllable gurage mwee - 1E7EE) 1383 ETHIOPIC SYLLABLE MWE 1384 ETHIOPIC SYLLABLE SEBATBEIT BWA 1385 ETHIOPIC SYLLABLE BWI + x (ethiopic syllable gurage bwi - 1E7F3) 1386 ETHIOPIC SYLLABLE BWEE + x (ethiopic syllable gurage bwee - 1E7F4) 1387 ETHIOPIC SYLLABLE BWE 1388 ETHIOPIC SYLLABLE SEBATBEIT FWA 1389 ETHIOPIC SYLLABLE FWI + x (ethiopic syllable gurage fwi - 1E7FB) 138A ETHIOPIC SYLLABLE FWEE + x (ethiopic syllable gurage fwee - 1E7FC) 138B ETHIOPIC SYLLABLE FWE 138C ETHIOPIC SYLLABLE SEBATBEIT PWA 138D ETHIOPIC SYLLABLE PWI + x (ethiopic syllable gurage pwi - 1E7FD) 138E ETHIOPIC SYLLABLE PWEE + x (ethiopic syllable gurage pwee - 1E7FE) 138F ETHIOPIC SYLLABLE PWE @ Tonal marks @+ Intended for use with a multiline scored layout @@ -8745,6 +8994,7 @@ 15C2 CANADIAN SYLLABICS SAYISI HO * Sayisi (HU) 15C3 CANADIAN SYLLABICS SAYISI HA +@ Syllables for Carrier 15C4 CANADIAN SYLLABICS CARRIER GHU 15C5 CANADIAN SYLLABICS CARRIER GHO 15C6 CANADIAN SYLLABICS CARRIER GHE @@ -9101,6 +9351,8 @@ 170A TAGALOG LETTER BA 170B TAGALOG LETTER MA 170C TAGALOG LETTER YA +170D TAGALOG LETTER RA + * modern adaptation, not found in Old Tagalog 170E TAGALOG LETTER LA 170F TAGALOG LETTER WA 1710 TAGALOG LETTER SA @@ -9108,8 +9360,14 @@ @ Dependent vowel signs 1712 TAGALOG VOWEL SIGN I 1713 TAGALOG VOWEL SIGN U -@ Virama +@ Viramas 1714 TAGALOG SIGN VIRAMA +1715 TAGALOG SIGN PAMUDPOD + x (hanunoo sign pamudpod 
- 1734) +@ Archaic letter +171F TAGALOG LETTER ARCHAIC RA + = Zambales ra + * modern adaptation, not found in Old Tagalog @@ 1720 Hanunoo 173F @ Independent vowels 1720 HANUNOO LETTER A @@ -9136,6 +9394,7 @@ 1733 HANUNOO VOWEL SIGN U @ Virama 1734 HANUNOO SIGN PAMUDPOD + x (tagalog sign pamudpod - 1715) @ Generic punctuation for Philippine scripts 1735 PHILIPPINE SINGLE PUNCTUATION x (devanagari danda - 0964) @@ -9424,6 +9683,8 @@ * abbreviated FVS3 180E MONGOLIAN VOWEL SEPARATOR * abbreviated MVS +180F MONGOLIAN FREE VARIATION SELECTOR FOUR + * abbreviated FVS4 @ Digits 1810 MONGOLIAN DIGIT ZERO 1811 MONGOLIAN DIGIT ONE @@ -10150,7 +10411,8 @@ * used in combinations with other punctuation marks at ends of sections 1AAD TAI THAM SIGN CAANG @@ 1AB0 Combining Diacritical Marks Extended 1AFF -@ Used for German dialectology +@+ This block contains many specialized combining marks, often derived from European dialectology transcriptional conventions. +@ Used in German dialectology 1AB0 COMBINING DOUBLED CIRCUMFLEX ACCENT 1AB1 COMBINING DIAERESIS-RING 1AB2 COMBINING INFINITY @@ -10164,6 +10426,8 @@ 1AB8 COMBINING DOUBLE OPEN MARK BELOW 1AB9 COMBINING LIGHT CENTRALIZATION STROKE BELOW 1ABA COMBINING STRONG CENTRALIZATION STROKE BELOW +@ Marks surrounding other diacritics or letters +@+ These marks are often intended to indicate partial or uncertain applicability of another diacritic. 
1ABB COMBINING PARENTHESES ABOVE * intended to surround a diacritic above 1ABC COMBINING DOUBLE PARENTHESES ABOVE @@ -10172,11 +10436,39 @@ 1ABE COMBINING PARENTHESES OVERLAY * intended to surround a base letter * exact placement is font dependent -@ Used for Scots dialectology +@ Used in Scots dialectology 1ABF COMBINING LATIN SMALL LETTER W BELOW * indicates voiced labialization + x (modifier letter small w - 02B7) 1AC0 COMBINING LATIN SMALL LETTER TURNED W BELOW * indicates voiceless labialization +@ Marks next to or surrounding other diacritics +@+ The left or right parentheses marks are used in extended IPA in combination with voicing or devoicing diacritics to indicate initial or final partial applicability. +1AC1 COMBINING LEFT PARENTHESIS ABOVE LEFT +1AC2 COMBINING RIGHT PARENTHESIS ABOVE RIGHT +1AC3 COMBINING LEFT PARENTHESIS BELOW LEFT +1AC4 COMBINING RIGHT PARENTHESIS BELOW RIGHT +1AC5 COMBINING SQUARE BRACKETS ABOVE + * intended to surround a diacritic above + * used to indicate cancellation of an accent in Japanese transliteration +@ Phonetic sign +1AC6 COMBINING NUMBER SIGN ABOVE + = superscript octothorp + * used extensively in J.P. 
Harrington's transcriptional notation +@ Used in extended IPA +1AC7 COMBINING INVERTED DOUBLE ARCH ABOVE + x (combining inverted double arch below - 032B) + x (combining latin small letter w - 1DF1) +1AC8 COMBINING PLUS SIGN ABOVE + x (combining plus sign below - 031F) +1AC9 COMBINING DOUBLE PLUS SIGN ABOVE +1ACA COMBINING DOUBLE PLUS SIGN BELOW +@ Used in Middle English Ormulum +1ACB COMBINING TRIPLE ACUTE ACCENT + x (combining double acute accent - 030B) +1ACC COMBINING LATIN SMALL LETTER INSULAR G +1ACD COMBINING LATIN SMALL LETTER INSULAR R +1ACE COMBINING LATIN SMALL LETTER INSULAR T @@ 1B00 Balinese 1B7F @ Various signs 1B00 BALINESE SIGN ULU RICEM @@ -10186,7 +10478,9 @@ 1B02 BALINESE SIGN CECEK = anusvara 1B03 BALINESE SIGN SURANG - = repha + = final r + * also used for repha in transliteration of Kawi + x (javanese sign layar - A982) 1B04 BALINESE SIGN BISAH = visarga @ Independent vowels @@ -10323,6 +10617,9 @@ 1B49 BALINESE LETTER VE SASAK 1B4A BALINESE LETTER ZAL SASAK 1B4B BALINESE LETTER ASYURA SASAK +1B4C BALINESE LETTER ARCHAIC JNYA + * used in older texts in place of the ja + nya conjunct + x (javanese letter nya murda - A998) @ Digits 1B50 BALINESE DIGIT ZERO 1B51 BALINESE DIGIT ONE @@ -10382,12 +10679,17 @@ 1B7A BALINESE MUSICAL SYMBOL LEFT-HAND CLOSED PLAK 1B7B BALINESE MUSICAL SYMBOL LEFT-HAND CLOSED PLUK 1B7C BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +@ Punctuation +1B7D BALINESE PANTI LANTANG + = end of text +1B7E BALINESE PAMADA LANTANG + = end of text @@ 1B80 Sundanese 1BBF @ Various signs 1B80 SUNDANESE SIGN PANYECEK = anusvara 1B81 SUNDANESE SIGN PANGLAYAR - = repha + = final r 1B82 SUNDANESE SIGN PANGWISAD = visarga @ Vowels @@ -10982,9 +11284,11 @@ 1D33 MODIFIER LETTER CAPITAL G # 0047 1D34 MODIFIER LETTER CAPITAL H + # 0048 +@+ A typographical distinction between a capital form and a small capital form is not distinctive for this character in IPA usage. 
+ * voiceless epiglottalized release (extended IPA) x (latin letter small capital h - 029C) x (modifier letter cyrillic en - 1D78) - # 0048 1D35 MODIFIER LETTER CAPITAL I # 0049 1D36 MODIFIER LETTER CAPITAL J @@ -11117,6 +11421,7 @@ * Georgian transcription x (georgian letter turned gan - 10F9) 1D78 MODIFIER LETTER CYRILLIC EN + * sometimes substituted for 1D34 in extended IPA x (modifier letter capital h - 1D34) # 043D @ Other phonetic symbols @@ -11127,6 +11432,7 @@ x (latin small letter yogh - 021D) x (latin small letter script g - 0261) x (latin small letter gamma - 0263) + x (latin small letter closed insular g - A7D1) 1D7A LATIN SMALL LETTER TH WITH STRIKETHROUGH * American dictionary usage x (greek small letter theta - 03B8) @@ -11345,6 +11651,8 @@ 1DEF COMBINING LATIN SMALL LETTER ESH 1DF0 COMBINING LATIN SMALL LETTER U WITH LIGHT CENTRALIZATION STROKE 1DF1 COMBINING LATIN SMALL LETTER W + x (combining latin small letter w below - 1ABF) + x (combining inverted double arch above - 1AC7) 1DF2 COMBINING LATIN SMALL LETTER A WITH DIAERESIS 1DF3 COMBINING LATIN SMALL LETTER O WITH DIAERESIS 1DF4 COMBINING LATIN SMALL LETTER U WITH DIAERESIS @@ -11359,9 +11667,12 @@ * used in Syriac as a disambiguation dot * used in Typicon Cyrillic, where the dot may have a square appearance x (combining dot above right - 0358) + x (syriac feminine dot - 0740) 1DF9 COMBINING WIDE INVERTED BRIDGE BELOW * used as a Typicon mark x (combining inverted bridge below - 033A) +1DFA COMBINING DOT BELOW LEFT + * used in Syriac as a disambiguation dot 1DFB COMBINING DELETION MARK * used for "mhusaa" in Newa scribal tradition @ Double diacritic mark for UPA @@ -12633,7 +12944,7 @@ = Japanese kome = Urdu paragraph separator x (tibetan ku ru kha bzhi mig can - 0FBF) - x (cjk unified ideograph-200AD - 200AD) + x 200AD @ Double punctuation for vertical text 203C DOUBLE EXCLAMATION MARK x (exclamation mark - 0021) @@ -12667,6 +12978,7 @@ @ Brackets 2045 LEFT SQUARE BRACKET WITH QUILL x (left 
vertical bar with quill - 2E20) + x (left square bracket with stroke - 2E55) 2046 RIGHT SQUARE BRACKET WITH QUILL @ Double punctuation for vertical text 2047 DOUBLE QUESTION MARK @@ -12895,10 +13207,10 @@ x (thai currency symbol baht - 0E3F) x (khmer currency symbol riel - 17DB) x (script capital m - 2133) - x (cjk unified ideograph-5143 - 5143) - x (cjk unified ideograph-5186 - 5186) - x (cjk unified ideograph-5706 - 5706) - x (cjk unified ideograph-5713 - 5713) + x 5143 + x 5186 + x 5706 + x 5713 x (rial sign - FDFC) x (wancho ngun sign - 1E2FF) 20A0 EURO-CURRENCY SIGN @@ -12991,6 +13303,8 @@ * Georgia 20BF BITCOIN SIGN * a cryptocurrency +20C0 SOM SIGN + * Kyrgyzstan @@ 20D0 Combining Diacritical Marks for Symbols 20FF @ Combining diacritical marks for symbols 20D0 COMBINING LEFT HARPOON ABOVE @@ -13093,6 +13407,8 @@ # 0067 latin small letter g 210B SCRIPT CAPITAL H = Hamiltonian operator + ~ 210B FE00 chancery style + ~ 210B FE01 roundhand style # 0048 latin capital letter h 210C BLACK-LETTER CAPITAL H = Hilbert space @@ -13108,12 +13424,16 @@ x (cyrillic small letter tshe - 045B) # 0127 latin small letter h with stroke 2110 SCRIPT CAPITAL I + ~ 2110 FE00 chancery style + ~ 2110 FE01 roundhand style # 0049 latin capital letter i 2111 BLACK-LETTER CAPITAL I = imaginary part # 0049 latin capital letter i 2112 SCRIPT CAPITAL L = Laplace transform + ~ 2112 FE00 chancery style + ~ 2112 FE01 roundhand style # 004C latin capital letter l 2113 SCRIPT SMALL L = mathematical symbol 'ell' @@ -13148,6 +13468,8 @@ # 0051 latin capital letter q 211B SCRIPT CAPITAL R = Riemann Integral + ~ 211B FE00 chancery style + ~ 211B FE01 roundhand style # 0052 latin capital letter r 211C BLACK-LETTER CAPITAL R = real part @@ -13202,6 +13524,8 @@ : 00C5 latin capital letter a with ring above 212C SCRIPT CAPITAL B = Bernoulli function + ~ 212C FE00 chancery style + ~ 212C FE01 roundhand style # 0042 latin capital letter b 212D BLACK-LETTER CAPITAL C # 0043 latin capital letter c @@ 
-13214,9 +13538,13 @@ # 0065 latin small letter e 2130 SCRIPT CAPITAL E = emf (electromotive force) + ~ 2130 FE00 chancery style + ~ 2130 FE01 roundhand style # 0045 latin capital letter e 2131 SCRIPT CAPITAL F = Fourier transform + ~ 2131 FE00 chancery style + ~ 2131 FE01 roundhand style # 0046 latin capital letter f 2132 TURNED CAPITAL F = Claudian digamma inversum @@ -13228,6 +13556,8 @@ = German Mark currency symbol, before WWII * when used for the Mark symbol, the range of glyph variation is restricted x (nordic mark sign - 20BB) + ~ 2133 FE00 chancery style + ~ 2133 FE01 roundhand style # 004D latin capital letter m 2134 SCRIPT SMALL O = order, of inferior order to @@ -13311,6 +13641,7 @@ x (greek small letter digamma - 03DD) @ Biblical editorial symbol 214F SYMBOL FOR SAMARITAN SOURCE +@~ Standardized Variation Sequences @@ 2150 Number Forms 218F @ Fractions @+ Other fraction number forms are found in the Latin-1 Supplement block. @@ -13890,7 +14221,9 @@ : 2261 0338 2263 STRICTLY EQUIVALENT TO 2264 LESS-THAN OR EQUAL TO + x (less-than sign - 003C) 2265 GREATER-THAN OR EQUAL TO + x (greater-than sign - 003E) 2266 LESS-THAN OVER EQUAL TO 2267 GREATER-THAN OVER EQUAL TO 2268 LESS-THAN BUT NOT EQUAL TO @@ -14110,6 +14443,9 @@ x (black star - 2605) x (white medium star - 2B50) 22C7 DIVISION TIMES + x (multiplication sign - 00D7) + x (division sign - 00F7) + x (multiplication x - 2715) @ Relation 22C8 BOWTIE x (ocr bow tie - 2445) @@ -18275,6 +18611,8 @@ 2C2C GLAGOLITIC CAPITAL LETTER SHTAPIC 2C2D GLAGOLITIC CAPITAL LETTER TROKUTASTI A 2C2E GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C2F GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI +@+ This is used as an alternative to Glagolitic letter chrivi, combined with 0303 combining tilde or with 0483 combining Cyrillic titlo as an et cetera sign. 
@ Small letters 2C30 GLAGOLITIC SMALL LETTER AZU 2C31 GLAGOLITIC SMALL LETTER BUKY @@ -18324,6 +18662,7 @@ 2C5C GLAGOLITIC SMALL LETTER SHTAPIC 2C5D GLAGOLITIC SMALL LETTER TROKUTASTI A 2C5E GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C5F GLAGOLITIC SMALL LETTER CAUDATE CHRIVI @@ 2C60 Latin Extended-C 2C7F @ Orthographic Latin additions 2C60 LATIN CAPITAL LETTER L WITH DOUBLE BAR @@ -18338,7 +18677,7 @@ * uppercase is 023A 2C66 LATIN SMALL LETTER T WITH DIAGONAL STROKE * uppercase is 023E -@ Additions for Uighur +@ Additions for Uyghur 2C67 LATIN CAPITAL LETTER H WITH DESCENDER 2C68 LATIN SMALL LETTER H WITH DESCENDER 2C69 LATIN CAPITAL LETTER K WITH DESCENDER @@ -18705,7 +19044,7 @@ 2DBC ETHIOPIC SYLLABLE CCHEE 2DBD ETHIOPIC SYLLABLE CCHE 2DBE ETHIOPIC SYLLABLE CCHO -@ Syllables for Sebatbeit +@ Syllables for Gurage 2DC0 ETHIOPIC SYLLABLE QYA 2DC1 ETHIOPIC SYLLABLE QYU 2DC2 ETHIOPIC SYLLABLE QYI @@ -18721,12 +19060,19 @@ 2DCD ETHIOPIC SYLLABLE KYE 2DCE ETHIOPIC SYLLABLE KYO 2DD0 ETHIOPIC SYLLABLE XYA + x (ethiopic syllable hhya - 1E7E0) 2DD1 ETHIOPIC SYLLABLE XYU + x (ethiopic syllable hhyu - 1E7E1) 2DD2 ETHIOPIC SYLLABLE XYI + x (ethiopic syllable hhyi - 1E7E2) 2DD3 ETHIOPIC SYLLABLE XYAA + x (ethiopic syllable hhyaa - 1E7E3) 2DD4 ETHIOPIC SYLLABLE XYEE + x (ethiopic syllable hhyee - 1E7E4) 2DD5 ETHIOPIC SYLLABLE XYE + x (ethiopic syllable hhye - 1E7E5) 2DD6 ETHIOPIC SYLLABLE XYO + x (ethiopic syllable hhyo - 1E7E6) 2DD8 ETHIOPIC SYLLABLE GYA 2DD9 ETHIOPIC SYLLABLE GYU 2DDA ETHIOPIC SYLLABLE GYI @@ -18821,6 +19167,7 @@ x (equals sign - 003D) x (hyphen - 2010) x (double hyphen - 2E40) + x (oblique hyphen - 2E5D) @ General punctuation 2E18 INVERTED INTERROBANG = gnaborretni @@ -18978,13 +19325,37 @@ x (paragraphos - 2E0F) x (capitulum - 2E3F) 2E4E PUNCTUS ELEVATUS MARK - * indicates a major medial pause where the sense is complete but the meaning is not +@+ This mark indicates a major intermediate pause where the sensus is complete but the sentence is not; this is 
similar in some regards to the modern use of a semicolon. 2E4F CORNISH VERSE DIVIDER 2E50 CROSS PATTY WITH RIGHT CROSSBAR x (maltese cross - 2720) + x (latin capital letter half h - 2C75) 2E51 CROSS PATTY WITH LEFT CROSSBAR + x (latin capital letter reversed half h - A7F5) 2E52 TIRONIAN SIGN CAPITAL ET x (tironian sign et - 204A) +2E53 MEDIEVAL EXCLAMATION MARK +2E54 MEDIEVAL QUESTION MARK +@ Brackets +@+ These brackets indicate ellipsis in certain conventions for Japanese transliteration. +2E55 LEFT SQUARE BRACKET WITH STROKE + * optional ellipsis + x (left square bracket with quill - 2045) +2E56 RIGHT SQUARE BRACKET WITH STROKE +2E57 LEFT SQUARE BRACKET WITH DOUBLE STROKE + * obligatory ellipsis +2E58 RIGHT SQUARE BRACKET WITH DOUBLE STROKE +@ Parentheses top and bottom halves +@+ These are used in pairs in extended IPA to indicate dubious phonemes or questionable presence of a sound. +2E59 TOP HALF LEFT PARENTHESIS +2E5A TOP HALF RIGHT PARENTHESIS +2E5B BOTTOM HALF LEFT PARENTHESIS +2E5C BOTTOM HALF RIGHT PARENTHESIS +@ Oblique hyphen +@+ The oblique hyphen is historic punctuation seen in some medieval and Renaissance manuscripts. In some modern lexicography an oblique hyphen is used distinctly to indicate hyphenation which is retained when a word is not broken at a line boundary. +2E5D OBLIQUE HYPHEN + x (hyphen - 2010) + x (double oblique hyphen - 2E17) @@ 2E80 CJK Radicals Supplement 2EFF @+ For the characters in this block whose representative glyph takes up only a portion of the em-box, the placement relative to the em-box is either centered or respects prototypical usage. The placement of the representative glyph is for informational purposes only, and should not be considered a recommendation for implementations. 
@ CJK radicals supplement @@ -19090,6 +19461,7 @@ x 4E2C 2EA7 CJK RADICAL COW x 725B + x 20092 2EA8 CJK RADICAL DOG * form used on left side x 72AD @@ -19790,6 +20162,7 @@ * substitute for ideograph not in font * editorial convention to represent ideographic lacuna x (white square - 25A1) + x (heavy equals sign - 1F7F0) @ CJK brackets 3014 LEFT TORTOISE SHELL BRACKET 3015 RIGHT TORTOISE SHELL BRACKET @@ -21844,7 +22217,7 @@ 4DFD HEXAGRAM FOR SMALL PREPONDERANCE 4DFE HEXAGRAM FOR AFTER COMPLETION 4DFF HEXAGRAM FOR BEFORE COMPLETION -@@ 4E00 CJK Unified Ideographs 9FFC +@@ 4E00 CJK Unified Ideographs 9FFF @@ A000 Yi Syllables A48F @@+ @ Syllables @@ -23791,6 +24164,7 @@ A72F LATIN SMALL LETTER CUATRILLO WITH COMMA A730 LATIN LETTER SMALL CAPITAL F A731 LATIN LETTER SMALL CAPITAL S A732 LATIN CAPITAL LETTER AA + x (modifier letter small capital aa - 10780) A733 LATIN SMALL LETTER AA A734 LATIN CAPITAL LETTER AO A735 LATIN SMALL LETTER AO @@ -23976,6 +24350,7 @@ A7AE LATIN CAPITAL LETTER SMALL CAPITAL I @ Letter for Japanese phonemic transcription A7AF LATIN LETTER SMALL CAPITAL Q * used to represent gemination + x (modifier letter capital q - A7F4) @ Letters for Americanist orthographies A7B0 LATIN CAPITAL LETTER TURNED K * lowercase is 029E @@ -23996,7 +24371,7 @@ A7B5 LATIN SMALL LETTER BETA A7B6 LATIN CAPITAL LETTER OMEGA A7B7 LATIN SMALL LETTER OMEGA x (greek small letter omega - 03C9) -@ Letters for Mazahua (Mexico) +@ Letters for Mazahua (México) A7B8 LATIN CAPITAL LETTER U WITH STROKE A7B9 LATIN SMALL LETTER U WITH STROKE @ Letters for Ugaritic and Egyptological transliteration @@ -24010,7 +24385,11 @@ A7BD LATIN SMALL LETTER GLOTTAL I x (latin small letter egyptological ain - A725) A7BE LATIN CAPITAL LETTER GLOTTAL U A7BF LATIN SMALL LETTER GLOTTAL U -@ Additional letters +@ Additional medieval letters +A7C0 LATIN CAPITAL LETTER OLD POLISH O +A7C1 LATIN SMALL LETTER OLD POLISH O + * used in Old Polish as a nasal vowel + x (latin small letter o with stroke - 
00F8) A7C2 LATIN CAPITAL LETTER ANGLICANA W A7C3 LATIN SMALL LETTER ANGLICANA W * used in medieval English and Cornish @@ -24028,6 +24407,31 @@ A7C8 LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY * indicates a dental affricate A7C9 LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY A7CA LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +@ Letters used in the Middle English Ormulum +A7D0 LATIN CAPITAL LETTER CLOSED INSULAR G +A7D1 LATIN SMALL LETTER CLOSED INSULAR G + x (latin small letter insular g - 1D79) +A7D3 LATIN SMALL LETTER DOUBLE THORN + x (latin small letter thorn - 00FE) +A7D5 LATIN SMALL LETTER DOUBLE WYNN + x (latin letter wynn - 01BF) +@ Letters used in medieval palaeography +A7D6 LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D7 LATIN SMALL LETTER MIDDLE SCOTS S + * used in Middle Scots for s, ss, ser, sir, is, sis, etc. + x (latin small letter sharp s - 00DF) +A7D8 LATIN CAPITAL LETTER SIGMOID S +A7D9 LATIN SMALL LETTER SIGMOID S + * used in Middle Cornish, Middle English, and Middle Scots +@ Modifier letters for Chatino (México) +A7F2 MODIFIER LETTER CAPITAL C + # 0043 +A7F3 MODIFIER LETTER CAPITAL F + # 0046 +@ Modifier letter for Japanese phonemic transcription +A7F4 MODIFIER LETTER CAPITAL Q + x (latin letter small capital q - A7AF) + # 0051 @ Ancient Gaulish and Celtic epigraphic letters A7F5 LATIN CAPITAL LETTER REVERSED HALF H = H dimidié @@ -24039,7 +24443,7 @@ A7F7 LATIN EPIGRAPHIC LETTER SIDEWAYS I @ Additions for Extended IPA A7F8 MODIFIER LETTER CAPITAL H WITH STROKE # 0126 -@+ A typographical distinction between a capital form and a small capital form is not distinctive for this IPA usage. +@+ A typographical distinction between a capital form and a small capital form is not distinctive for this character in IPA usage. 
* faucalized x (latin letter small capital h - 029C) A7F9 MODIFIER LETTER SMALL LIGATURE OE @@ -24129,7 +24533,7 @@ A838 NORTH INDIC RUPEE MARK A839 NORTH INDIC QUANTITY MARK * a unit mark for various weights and measures @@ A840 Phags-pa A87F -@+ Phags-pa letters are used for Mongolian, Chinese, Uighur, Tibetan, and Sanskrit unless annotated with a more restricted list of languages. +@+ Phags-pa letters are used for Mongolian, Chinese, Uyghur, Tibetan, and Sanskrit unless annotated with a more restricted list of languages. @ Consonants A840 PHAGS-PA LETTER KA * Mongolian, Chinese, Tibetan, Sanskrit @@ -24145,10 +24549,10 @@ A844 PHAGS-PA LETTER CA * Chinese, Tibetan x (tibetan letter ca - 0F45) A845 PHAGS-PA LETTER CHA - * Mongolian, Chinese, Uighur, Tibetan + * Mongolian, Chinese, Uyghur, Tibetan x (tibetan letter cha - 0F46) A846 PHAGS-PA LETTER JA - * Mongolian, Chinese, Uighur, Tibetan + * Mongolian, Chinese, Uyghur, Tibetan x (tibetan letter ja - 0F47) A847 PHAGS-PA LETTER NYA * Chinese, Tibetan, Sanskrit @@ -24195,7 +24599,7 @@ A856 PHAGS-PA LETTER SMALL A A857 PHAGS-PA LETTER YA x (tibetan letter ya - 0F61) A858 PHAGS-PA LETTER RA - * Mongolian, Uighur, Tibetan, Sanskrit + * Mongolian, Uyghur, Tibetan, Sanskrit x (tibetan letter ra - 0F62) A859 PHAGS-PA LETTER LA x (tibetan letter la - 0F63) @@ -24223,18 +24627,18 @@ A861 PHAGS-PA LETTER O x (tibetan vowel sign o - 0F7C) @ Consonants A862 PHAGS-PA LETTER QA - * Mongolian, Uighur + * Mongolian, Uyghur A863 PHAGS-PA LETTER XA * Mongolian, Chinese A864 PHAGS-PA LETTER FA - * Chinese, Uighur + * Chinese, Uyghur x (phags-pa letter ha - A85C) A865 PHAGS-PA LETTER GGA * language usage unknown * created by reversal of A862 @ Vowel A866 PHAGS-PA LETTER EE - * Mongolian, Chinese, Uighur + * Mongolian, Chinese, Uyghur @ Subjoined consonants A867 PHAGS-PA SUBJOINED LETTER WA * Chinese, Tibetan, Sanskrit @@ -24620,7 +25024,9 @@ A980 JAVANESE SIGN PANYANGGA A981 JAVANESE SIGN CECAK = anusvara A982 JAVANESE SIGN LAYAR - = 
repha + = final r + * also used for repha in transliteration of Kawi + x (balinese sign surang - 1B03) A983 JAVANESE SIGN WIGNYAN = visarga @ Letters @@ -24656,6 +25062,7 @@ A996 JAVANESE LETTER CA MURDA A997 JAVANESE LETTER JA A998 JAVANESE LETTER NYA MURDA = jnya + x (balinese letter archaic jnya - 1B4C) A999 JAVANESE LETTER JA MAHAPRANA = jha A99A JAVANESE LETTER NYA @@ -24915,6 +25322,7 @@ AA6C MYANMAR LETTER KHAMTI SA ~ AA6C FE00 dotted form AA6D MYANMAR LETTER KHAMTI HA AA6E MYANMAR LETTER KHAMTI HHA + % MYANMAR LETTER KHAMTI LLA AA6F MYANMAR LETTER KHAMTI FA ~ AA6F FE00 dotted form AA70 MYANMAR MODIFIER LETTER KHAMTI REDUPLICATION @@ -25586,7 +25994,7 @@ F92B CJK COMPATIBILITY IDEOGRAPH-F92B : 72FC F92C CJK COMPATIBILITY IDEOGRAPH-F92C * a mapping change removed the original K0 source - x (cjk unified ideograph-90DE - 90DE) + x 90DE x (cjk compatibility ideograph-FA2E - FA2E) : 90CE F92D CJK COMPATIBILITY IDEOGRAPH-F92D @@ -25869,7 +26277,7 @@ F9B7 CJK COMPATIBILITY IDEOGRAPH-F9B7 : 91B4 F9B8 CJK COMPATIBILITY IDEOGRAPH-F9B8 * a mapping change removed the original K0 source - x (cjk unified ideograph-96B7 - 96B7) + x 96B7 x (cjk compatibility ideograph-FA2F - FA2F) : 96B8 F9B9 CJK COMPATIBILITY IDEOGRAPH-F9B9 @@ -26805,6 +27213,8 @@ FBC0 ARABIC SYMBOL SMALL TAH ABOVE * Urdu FBC1 ARABIC SYMBOL SMALL TAH BELOW * Urdu +FBC2 ARABIC SYMBOL WASLA ABOVE + x (arabic letter alef wasla - 0671) @ Glyphs for contextual forms of letters for Central Asian languages FBD3 ARABIC LETTER NG ISOLATED FORM # 06AD @@ -27538,6 +27948,29 @@ FD3D ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM @+ These parentheses also do not have compatibility decompositions and should not be considered presentation forms. 
FD3E ORNATE LEFT PARENTHESIS FD3F ORNATE RIGHT PARENTHESIS +@ Honorific word ligatures +FD40 ARABIC LIGATURE RAHIMAHU ALLAAH + x (arabic sign rahmatullah alayhe - 0612) +FD41 ARABIC LIGATURE RADI ALLAAHU ANH + x (arabic sign radi allahou anhu - 0613) +FD42 ARABIC LIGATURE RADI ALLAAHU ANHAA +FD43 ARABIC LIGATURE RADI ALLAAHU ANHUM +FD44 ARABIC LIGATURE RADI ALLAAHU ANHUMAA +FD45 ARABIC LIGATURE RADI ALLAAHU ANHUNNA +FD46 ARABIC LIGATURE SALLALLAAHU ALAYHI WA-AALIH + x (arabic ligature sallallahou alayhe wasallam - FDFA) +FD47 ARABIC LIGATURE ALAYHI AS-SALAAM + x (arabic sign alayhe assallam - 0611) +FD48 ARABIC LIGATURE ALAYHIM AS-SALAAM +FD49 ARABIC LIGATURE ALAYHIMAA AS-SALAAM +FD4A ARABIC LIGATURE ALAYHI AS-SALAATU WAS-SALAAM +FD4B ARABIC LIGATURE QUDDISA SIRRAH +FD4C ARABIC LIGATURE SALLALLAHU ALAYHI WAAALIHEE WA-SALLAM + x (arabic ligature sallallahou alayhe wasallam - FDFA) + x (arabic ligature sallallaahu alayhi wa-aalih - FD46) +FD4D ARABIC LIGATURE ALAYHAA AS-SALAAM +FD4E ARABIC LIGATURE TABAARAKA WA-TAAALAA +FD4F ARABIC LIGATURE RAHIMAHUM ALLAAH @ Ligatures (three elements) FD50 ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM # 062A 062C 0645 @@ -27775,6 +28208,10 @@ FDC6 ARABIC LIGATURE SEEN WITH KHAH WITH YEH FINAL FORM # 0633 062E 064A FDC7 ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM # 0646 062C 064A +@ Honorific word ligature +FDCF ARABIC LIGATURE SALAAMUHU ALAYNAA + * his blessing on us + * used in Christian texts @ Noncharacters @+ These codes are intended for process-internal uses. FDD0 @@ -27839,9 +28276,11 @@ FDFB ARABIC LIGATURE JALLAJALALOUHOU @ Currency symbol FDFC RIAL SIGN # 0631 06CC 0627 0644 -@ Symbol -@+ The bismillah is treated as an atomic symbol, rather than as a word ligature. It has no decomposition. +@ Honorific word ligatures +@+ These word ligatures have no decompositions. 
FDFD ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFE ARABIC LIGATURE SUBHAANAHU WA TAAALAA +FDFF ARABIC LIGATURE AZZA WA JALL @@ FE00 Variation Selectors FE0F @ Variation selectors @+ These are combining characters; in conjunction with the preceding character they indicate a predetermined choice of variant glyph. @@ -30036,6 +30475,83 @@ FFFF 10563 CAUCASIAN ALBANIAN LETTER KIW @ Punctuation 1056F CAUCASIAN ALBANIAN CITATION MARK +@@ 10570 Vithkuqi 105BF +@ Capital letters +10570 VITHKUQI CAPITAL LETTER A +10571 VITHKUQI CAPITAL LETTER BBE +10572 VITHKUQI CAPITAL LETTER BE +10573 VITHKUQI CAPITAL LETTER CE +10574 VITHKUQI CAPITAL LETTER CHE +10575 VITHKUQI CAPITAL LETTER DE +10576 VITHKUQI CAPITAL LETTER DHE +10577 VITHKUQI CAPITAL LETTER EI +10578 VITHKUQI CAPITAL LETTER E +10579 VITHKUQI CAPITAL LETTER FE +1057A VITHKUQI CAPITAL LETTER GA +1057C VITHKUQI CAPITAL LETTER HA +1057D VITHKUQI CAPITAL LETTER HHA + * used in 19th-century orthography +1057E VITHKUQI CAPITAL LETTER I +1057F VITHKUQI CAPITAL LETTER IJE + * used in 19th-century orthography +10580 VITHKUQI CAPITAL LETTER JE +10581 VITHKUQI CAPITAL LETTER KA +10582 VITHKUQI CAPITAL LETTER LA +10583 VITHKUQI CAPITAL LETTER LLA +10584 VITHKUQI CAPITAL LETTER ME +10585 VITHKUQI CAPITAL LETTER NE +10586 VITHKUQI CAPITAL LETTER NJE +10587 VITHKUQI CAPITAL LETTER O +10588 VITHKUQI CAPITAL LETTER PE +10589 VITHKUQI CAPITAL LETTER QA +1058A VITHKUQI CAPITAL LETTER RE +1058C VITHKUQI CAPITAL LETTER SE +1058D VITHKUQI CAPITAL LETTER SHE +1058E VITHKUQI CAPITAL LETTER TE +1058F VITHKUQI CAPITAL LETTER THE +10590 VITHKUQI CAPITAL LETTER U +10591 VITHKUQI CAPITAL LETTER VE +10592 VITHKUQI CAPITAL LETTER XE +10594 VITHKUQI CAPITAL LETTER Y +10595 VITHKUQI CAPITAL LETTER ZE +@ Small letters +10597 VITHKUQI SMALL LETTER A +10598 VITHKUQI SMALL LETTER BBE +10599 VITHKUQI SMALL LETTER BE +1059A VITHKUQI SMALL LETTER CE +1059B VITHKUQI SMALL LETTER CHE +1059C VITHKUQI SMALL LETTER DE +1059D VITHKUQI SMALL LETTER DHE +1059E 
VITHKUQI SMALL LETTER EI +1059F VITHKUQI SMALL LETTER E +105A0 VITHKUQI SMALL LETTER FE +105A1 VITHKUQI SMALL LETTER GA +105A3 VITHKUQI SMALL LETTER HA +105A4 VITHKUQI SMALL LETTER HHA + * used in 19th-century orthography +105A5 VITHKUQI SMALL LETTER I +105A6 VITHKUQI SMALL LETTER IJE + * used in 19th-century orthography +105A7 VITHKUQI SMALL LETTER JE +105A8 VITHKUQI SMALL LETTER KA +105A9 VITHKUQI SMALL LETTER LA +105AA VITHKUQI SMALL LETTER LLA +105AB VITHKUQI SMALL LETTER ME +105AC VITHKUQI SMALL LETTER NE +105AD VITHKUQI SMALL LETTER NJE +105AE VITHKUQI SMALL LETTER O +105AF VITHKUQI SMALL LETTER PE +105B0 VITHKUQI SMALL LETTER QA +105B1 VITHKUQI SMALL LETTER RE +105B3 VITHKUQI SMALL LETTER SE +105B4 VITHKUQI SMALL LETTER SHE +105B5 VITHKUQI SMALL LETTER TE +105B6 VITHKUQI SMALL LETTER THE +105B7 VITHKUQI SMALL LETTER U +105B8 VITHKUQI SMALL LETTER VE +105B9 VITHKUQI SMALL LETTER XE +105BB VITHKUQI SMALL LETTER Y +105BC VITHKUQI SMALL LETTER ZE @@ 10600 Linear A 1077F @ Simple signs 10600 LINEAR A SIGN AB001 @@ -30587,6 +31103,124 @@ FFFF * 10668 a316, 10601 ab002 10767 LINEAR A SIGN A807 * 10668 a316, 10742 a703 d +@@ 10780 Latin Extended-F 107BF +@ Modifier letter for VoQS +10780 MODIFIER LETTER SMALL CAPITAL AA + * actually a small capital in VoQS (voice quality symbol) usage, with no semantic distinction from a full capital + x (latin capital letter aa - A732) +@ Modifier letters for IPA +10781 MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON + # 02D0 +10782 MODIFIER LETTER SUPERSCRIPT HALF TRIANGULAR COLON + # 02D1 +10783 MODIFIER LETTER SMALL AE + # 00E6 +10784 MODIFIER LETTER SMALL CAPITAL B + # 0299 +10785 MODIFIER LETTER SMALL B WITH HOOK + # 0253 +10787 MODIFIER LETTER SMALL DZ DIGRAPH + # 02A3 +10788 MODIFIER LETTER SMALL DZ DIGRAPH WITH RETROFLEX HOOK + # AB66 +10789 MODIFIER LETTER SMALL DZ DIGRAPH WITH CURL + # 02A5 +1078A MODIFIER LETTER SMALL DEZH DIGRAPH + # 02A4 +1078B MODIFIER LETTER SMALL D WITH TAIL + # 0256 +1078C MODIFIER LETTER SMALL D WITH 
HOOK + # 0257 +1078D MODIFIER LETTER SMALL D WITH HOOK AND TAIL + # 1D91 +1078E MODIFIER LETTER SMALL REVERSED E + # 0258 +1078F MODIFIER LETTER SMALL CLOSED REVERSED OPEN E + # 025E +10790 MODIFIER LETTER SMALL FENG DIGRAPH + # 02A9 +10791 MODIFIER LETTER SMALL RAMS HORN + # 0264 +10792 MODIFIER LETTER SMALL CAPITAL G + # 0262 +10793 MODIFIER LETTER SMALL G WITH HOOK + # 0260 +10794 MODIFIER LETTER SMALL CAPITAL G WITH HOOK + # 029B +10795 MODIFIER LETTER SMALL H WITH STROKE + # 0127 +10796 MODIFIER LETTER SMALL CAPITAL H + # 029C +10797 MODIFIER LETTER SMALL HENG WITH HOOK + # 0267 +10798 MODIFIER LETTER SMALL DOTLESS J WITH STROKE AND HOOK + # 0284 +10799 MODIFIER LETTER SMALL LS DIGRAPH + # 02AA +1079A MODIFIER LETTER SMALL LZ DIGRAPH + # 02AB +1079B MODIFIER LETTER SMALL L WITH BELT + # 026C +1079C MODIFIER LETTER SMALL CAPITAL L WITH BELT + # 1DF04 +1079D MODIFIER LETTER SMALL L WITH RETROFLEX HOOK AND BELT + # A78E +1079E MODIFIER LETTER SMALL LEZH + # 026E +1079F MODIFIER LETTER SMALL LEZH WITH RETROFLEX HOOK + # 1DF05 +107A0 MODIFIER LETTER SMALL TURNED Y + # 028E +107A1 MODIFIER LETTER SMALL TURNED Y WITH BELT + # 1DF06 +107A2 MODIFIER LETTER SMALL O WITH STROKE + # 00F8 +107A3 MODIFIER LETTER SMALL CAPITAL OE + # 0276 +107A4 MODIFIER LETTER SMALL CLOSED OMEGA + # 0277 +107A5 MODIFIER LETTER SMALL Q + # 0071 +107A6 MODIFIER LETTER SMALL TURNED R WITH LONG LEG + # 027A +107A7 MODIFIER LETTER SMALL TURNED R WITH LONG LEG AND RETROFLEX HOOK + # 1DF08 +107A8 MODIFIER LETTER SMALL R WITH TAIL + # 027D +107A9 MODIFIER LETTER SMALL R WITH FISHHOOK + # 027E +107AA MODIFIER LETTER SMALL CAPITAL R + # 0280 +107AB MODIFIER LETTER SMALL TC DIGRAPH WITH CURL + # 02A8 +107AC MODIFIER LETTER SMALL TS DIGRAPH + # 02A6 +107AD MODIFIER LETTER SMALL TS DIGRAPH WITH RETROFLEX HOOK + # AB67 +107AE MODIFIER LETTER SMALL TESH DIGRAPH + # 02A7 +107AF MODIFIER LETTER SMALL T WITH RETROFLEX HOOK + # 0288 +107B0 MODIFIER LETTER SMALL V WITH RIGHT HOOK + # 2C71 +107B2 MODIFIER 
LETTER SMALL CAPITAL Y + # 028F +107B3 MODIFIER LETTER GLOTTAL STOP WITH STROKE + # 02A1 +107B4 MODIFIER LETTER REVERSED GLOTTAL STOP WITH STROKE + # 02A2 +107B5 MODIFIER LETTER BILABIAL CLICK + # 0298 +107B6 MODIFIER LETTER DENTAL CLICK + # 01C0 +107B7 MODIFIER LETTER LATERAL CLICK + # 01C1 +107B8 MODIFIER LETTER ALVEOLAR CLICK + # 01C2 +107B9 MODIFIER LETTER RETROFLEX CLICK WITH RETROFLEX HOOK + # 1DF0A +107BA MODIFIER LETTER SMALL S WITH CURL + # 1DF1E @@ 10800 Cypriot Syllabary 1083F @ Syllables 10800 CYPRIOT SYLLABLE A @@ -32120,6 +32754,37 @@ FFFF 10F57 SOGDIAN PUNCTUATION CIRCLE WITH DOT 10F58 SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS 10F59 SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +@@ 10F70 Old Uyghur 10FAF +@ Letters +10F70 OLD UYGHUR LETTER ALEPH +10F71 OLD UYGHUR LETTER BETH +10F72 OLD UYGHUR LETTER GIMEL-HETH +10F73 OLD UYGHUR LETTER WAW +10F74 OLD UYGHUR LETTER ZAYIN +10F75 OLD UYGHUR LETTER FINAL HETH +10F76 OLD UYGHUR LETTER YODH +10F77 OLD UYGHUR LETTER KAPH +10F78 OLD UYGHUR LETTER LAMEDH +10F79 OLD UYGHUR LETTER MEM +10F7A OLD UYGHUR LETTER NUN +10F7B OLD UYGHUR LETTER SAMEKH +10F7C OLD UYGHUR LETTER PE +10F7D OLD UYGHUR LETTER SADHE +10F7E OLD UYGHUR LETTER RESH +10F7F OLD UYGHUR LETTER SHIN +10F80 OLD UYGHUR LETTER TAW +10F81 OLD UYGHUR LETTER LESH + = hooked resh +@ Combining signs +10F82 OLD UYGHUR COMBINING DOT ABOVE +10F83 OLD UYGHUR COMBINING DOT BELOW +10F84 OLD UYGHUR COMBINING TWO DOTS ABOVE +10F85 OLD UYGHUR COMBINING TWO DOTS BELOW +@ Punctuation +10F86 OLD UYGHUR PUNCTUATION BAR +10F87 OLD UYGHUR PUNCTUATION TWO BARS +10F88 OLD UYGHUR PUNCTUATION TWO DOTS +10F89 OLD UYGHUR PUNCTUATION FOUR DOTS @@ 10FB0 Chorasmian 10FDF @+ This script is also known as 'Khwarezmian', from its classical Persian name xvārazm. 
@ Letters @@ -32296,6 +32961,17 @@ FFFF 1106D BRAHMI DIGIT SEVEN 1106E BRAHMI DIGIT EIGHT 1106F BRAHMI DIGIT NINE +@ Virama +@+ The Old Tamil virama and the other Old Tamil characters below are extensions used in Brahmi when writing Old Tamil. +11070 BRAHMI SIGN OLD TAMIL VIRAMA +@ Independent vowels +11071 BRAHMI LETTER OLD TAMIL SHORT E +11072 BRAHMI LETTER OLD TAMIL SHORT O +@ Dependent vowel signs +11073 BRAHMI VOWEL SIGN OLD TAMIL SHORT E +11074 BRAHMI VOWEL SIGN OLD TAMIL SHORT O +@ Consonant +11075 BRAHMI LETTER OLD TAMIL LLA @ Number joiner 1107F BRAHMI NUMBER JOINER * a virama used to form ligatures between Brahmi numbers signifying multiplication @@ -32382,6 +33058,8 @@ FFFF x (khojki double section mark - 1123C) 110C0 KAITHI DANDA 110C1 KAITHI DOUBLE DANDA +@ Vowel sign +110C2 KAITHI VOWEL SIGN VOCALIC R @ Sign 110CD KAITHI NUMBER SIGN ABOVE * used to indicate a number in an itemized list @@ -33544,6 +34222,10 @@ FFFF @ Consonant 116B8 TAKRI LETTER ARCHAIC KHA * used in earlier writings to denote kha +@ Punctuation +116B9 TAKRI ABBREVIATION SIGN + x (gurmukhi abbreviation sign - 0A76) + x (sharada abbreviation sign - 111C7) @ Digits 116C0 TAKRI DIGIT ZERO 116C1 TAKRI DIGIT ONE @@ -33555,7 +34237,7 @@ FFFF 116C7 TAKRI DIGIT SEVEN 116C8 TAKRI DIGIT EIGHT 116C9 TAKRI DIGIT NINE -@@ 11700 Ahom 1173F +@@ 11700 Ahom 1174F @ Consonants 11700 AHOM LETTER KA 11701 AHOM LETTER KHA @@ -33620,6 +34302,14 @@ FFFF 1173D AHOM SIGN SECTION 1173E AHOM SIGN RULAI 1173F AHOM SYMBOL VI +@ Additional consonants +11740 AHOM LETTER CA +11741 AHOM LETTER TTA +11742 AHOM LETTER TTHA +11743 AHOM LETTER DDA +11744 AHOM LETTER DDHA +11745 AHOM LETTER NNA +11746 AHOM LETTER LLA @@ 11800 Dogra 1184F @ Independent vowels 11800 DOGRA LETTER A @@ -34181,6 +34871,29 @@ FFFF 11AA1 SOYOMBO TERMINAL MARK-1 11AA2 SOYOMBO TERMINAL MARK-2 = cintamani, candamani +@@ 11AB0 Unified Canadian Aboriginal Syllabics Extended-A 11ABF +@ Syllables for Nattilik +11AB0 CANADIAN SYLLABICS NATTILIK HI 
+11AB1 CANADIAN SYLLABICS NATTILIK HII +11AB2 CANADIAN SYLLABICS NATTILIK HO + * Nattilik (HU) +11AB3 CANADIAN SYLLABICS NATTILIK HOO + * Nattilik (HUU) +11AB4 CANADIAN SYLLABICS NATTILIK HA +11AB5 CANADIAN SYLLABICS NATTILIK HAA +11AB6 CANADIAN SYLLABICS NATTILIK SHRI +11AB7 CANADIAN SYLLABICS NATTILIK SHRII +11AB8 CANADIAN SYLLABICS NATTILIK SHRO + * Nattilik (SHRU) +11AB9 CANADIAN SYLLABICS NATTILIK SHROO + * Nattilik (SHRUU) +11ABA CANADIAN SYLLABICS NATTILIK SHRA +11ABB CANADIAN SYLLABICS NATTILIK SHRAA +@ Historic syllables for Cree and Ojibway +11ABC CANADIAN SYLLABICS SPE +11ABD CANADIAN SYLLABICS SPI +11ABE CANADIAN SYLLABICS SPO +11ABF CANADIAN SYLLABICS SPA @@ 11AC0 Pau Cin Hau 11AFF @ Consonants 11AC0 PAU CIN HAU LETTER PA @@ -36005,6 +36718,108 @@ FFFF 12541 CUNEIFORM SIGN ZA7 12542 CUNEIFORM SIGN ZU OVER ZU PLUS SAR 12543 CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +@@ 12F90 Cypro-Minoan 12FFF +@ Signs +12F90 CYPRO-MINOAN SIGN CM001 +12F91 CYPRO-MINOAN SIGN CM002 +12F92 CYPRO-MINOAN SIGN CM004 +12F93 CYPRO-MINOAN SIGN CM005 +12F94 CYPRO-MINOAN SIGN CM006 +12F95 CYPRO-MINOAN SIGN CM007 +12F96 CYPRO-MINOAN SIGN CM008 +12F97 CYPRO-MINOAN SIGN CM009 +12F98 CYPRO-MINOAN SIGN CM010 +12F99 CYPRO-MINOAN SIGN CM011 +12F9A CYPRO-MINOAN SIGN CM012 +12F9B CYPRO-MINOAN SIGN CM012B +12F9C CYPRO-MINOAN SIGN CM013 +12F9D CYPRO-MINOAN SIGN CM015 +12F9E CYPRO-MINOAN SIGN CM017 +12F9F CYPRO-MINOAN SIGN CM019 +12FA0 CYPRO-MINOAN SIGN CM021 +12FA1 CYPRO-MINOAN SIGN CM023 +12FA2 CYPRO-MINOAN SIGN CM024 +12FA3 CYPRO-MINOAN SIGN CM025 +12FA4 CYPRO-MINOAN SIGN CM026 +12FA5 CYPRO-MINOAN SIGN CM027 +12FA6 CYPRO-MINOAN SIGN CM028 +12FA7 CYPRO-MINOAN SIGN CM029 +12FA8 CYPRO-MINOAN SIGN CM030 +12FA9 CYPRO-MINOAN SIGN CM033 +12FAA CYPRO-MINOAN SIGN CM034 +12FAB CYPRO-MINOAN SIGN CM035 +12FAC CYPRO-MINOAN SIGN CM036 +12FAD CYPRO-MINOAN SIGN CM037 +12FAE CYPRO-MINOAN SIGN CM038 +12FAF CYPRO-MINOAN SIGN CM039 +12FB0 CYPRO-MINOAN SIGN CM040 +12FB1 CYPRO-MINOAN SIGN CM041 +12FB2 
CYPRO-MINOAN SIGN CM044 +12FB3 CYPRO-MINOAN SIGN CM046 +12FB4 CYPRO-MINOAN SIGN CM047 +12FB5 CYPRO-MINOAN SIGN CM049 +12FB6 CYPRO-MINOAN SIGN CM050 +12FB7 CYPRO-MINOAN SIGN CM051 +12FB8 CYPRO-MINOAN SIGN CM052 +12FB9 CYPRO-MINOAN SIGN CM053 +12FBA CYPRO-MINOAN SIGN CM054 +12FBB CYPRO-MINOAN SIGN CM055 +12FBC CYPRO-MINOAN SIGN CM056 +12FBD CYPRO-MINOAN SIGN CM058 +12FBE CYPRO-MINOAN SIGN CM059 +12FBF CYPRO-MINOAN SIGN CM060 +12FC0 CYPRO-MINOAN SIGN CM061 +12FC1 CYPRO-MINOAN SIGN CM062 +12FC2 CYPRO-MINOAN SIGN CM063 +12FC3 CYPRO-MINOAN SIGN CM064 +12FC4 CYPRO-MINOAN SIGN CM066 +12FC5 CYPRO-MINOAN SIGN CM067 +12FC6 CYPRO-MINOAN SIGN CM068 +12FC7 CYPRO-MINOAN SIGN CM069 +12FC8 CYPRO-MINOAN SIGN CM070 +12FC9 CYPRO-MINOAN SIGN CM071 +12FCA CYPRO-MINOAN SIGN CM072 +12FCB CYPRO-MINOAN SIGN CM073 +12FCC CYPRO-MINOAN SIGN CM074 +12FCD CYPRO-MINOAN SIGN CM075 +12FCE CYPRO-MINOAN SIGN CM075B +12FCF CYPRO-MINOAN SIGN CM076 +12FD0 CYPRO-MINOAN SIGN CM078 +12FD1 CYPRO-MINOAN SIGN CM079 +12FD2 CYPRO-MINOAN SIGN CM080 +12FD3 CYPRO-MINOAN SIGN CM081 +12FD4 CYPRO-MINOAN SIGN CM082 +12FD5 CYPRO-MINOAN SIGN CM083 +12FD6 CYPRO-MINOAN SIGN CM084 +12FD7 CYPRO-MINOAN SIGN CM085 +12FD8 CYPRO-MINOAN SIGN CM086 +12FD9 CYPRO-MINOAN SIGN CM087 +12FDA CYPRO-MINOAN SIGN CM088 +12FDB CYPRO-MINOAN SIGN CM089 +12FDC CYPRO-MINOAN SIGN CM090 +12FDD CYPRO-MINOAN SIGN CM091 +12FDE CYPRO-MINOAN SIGN CM092 +12FDF CYPRO-MINOAN SIGN CM094 +12FE0 CYPRO-MINOAN SIGN CM095 +12FE1 CYPRO-MINOAN SIGN CM096 +12FE2 CYPRO-MINOAN SIGN CM097 +12FE3 CYPRO-MINOAN SIGN CM098 +12FE4 CYPRO-MINOAN SIGN CM099 +12FE5 CYPRO-MINOAN SIGN CM100 +12FE6 CYPRO-MINOAN SIGN CM101 +12FE7 CYPRO-MINOAN SIGN CM102 +12FE8 CYPRO-MINOAN SIGN CM103 +12FE9 CYPRO-MINOAN SIGN CM104 +12FEA CYPRO-MINOAN SIGN CM105 +12FEB CYPRO-MINOAN SIGN CM107 +12FEC CYPRO-MINOAN SIGN CM108 +12FED CYPRO-MINOAN SIGN CM109 +12FEE CYPRO-MINOAN SIGN CM110 +12FEF CYPRO-MINOAN SIGN CM112 +12FF0 CYPRO-MINOAN SIGN CM114 +@ Punctuation +12FF1 CYPRO-MINOAN SIGN CM301 +12FF2 
CYPRO-MINOAN SIGN CM302 @@ 13000 Egyptian Hieroglyphs 1342F @+ The characters in this block are taken primarily from Alan Gardiner's works on Middle Egyptian. @ A. Man and his occupations @@ -36104,7 +36919,9 @@ FFFF 1305B EGYPTIAN HIEROGLYPH C002 1305C EGYPTIAN HIEROGLYPH C002A 1305D EGYPTIAN HIEROGLYPH C002B + * mirrored version of 1305C 1305E EGYPTIAN HIEROGLYPH C002C + * mirrored version of 1305B 1305F EGYPTIAN HIEROGLYPH C003 13060 EGYPTIAN HIEROGLYPH C004 13061 EGYPTIAN HIEROGLYPH C005 @@ -36118,8 +36935,10 @@ FFFF * 1,000,000 13069 EGYPTIAN HIEROGLYPH C012 1306A EGYPTIAN HIEROGLYPH C013 + * mirrored version of 13069 1306B EGYPTIAN HIEROGLYPH C014 1306C EGYPTIAN HIEROGLYPH C015 + * mirrored version of 1306B 1306D EGYPTIAN HIEROGLYPH C016 1306E EGYPTIAN HIEROGLYPH C017 1306F EGYPTIAN HIEROGLYPH C018 @@ -36144,6 +36963,8 @@ FFFF 13081 EGYPTIAN HIEROGLYPH D011 * 1/2 13082 EGYPTIAN HIEROGLYPH D012 + * pupil of the eye + * not to be confused with 131F3 or 133F8 * 1/4 13083 EGYPTIAN HIEROGLYPH D013 * 1/8 @@ -36158,6 +36979,8 @@ FFFF 13089 EGYPTIAN HIEROGLYPH D019 1308A EGYPTIAN HIEROGLYPH D020 1308B EGYPTIAN HIEROGLYPH D021 + * mouth + * not to be confused with 133AB * transliterated as r 1308C EGYPTIAN HIEROGLYPH D022 1308D EGYPTIAN HIEROGLYPH D023 @@ -36197,6 +37020,8 @@ FFFF 130AB EGYPTIAN HIEROGLYPH D048A 130AC EGYPTIAN HIEROGLYPH D049 130AD EGYPTIAN HIEROGLYPH D050 + * classifier 'accurate, finger' + * not to be confused with 130B7 * 10,000 130AE EGYPTIAN HIEROGLYPH D050A * 20,000 @@ -36217,12 +37042,16 @@ FFFF 130B6 EGYPTIAN HIEROGLYPH D050I * 50,000 130B7 EGYPTIAN HIEROGLYPH D051 + * classifier 'measure, nail, scratching, taking' + * not to be confused with 130AD 130B8 EGYPTIAN HIEROGLYPH D052 130B9 EGYPTIAN HIEROGLYPH D052A 130BA EGYPTIAN HIEROGLYPH D053 130BB EGYPTIAN HIEROGLYPH D054 + * (forward) motion 130BC EGYPTIAN HIEROGLYPH D054A 130BD EGYPTIAN HIEROGLYPH D055 + * backward motion 130BE EGYPTIAN HIEROGLYPH D056 130BF EGYPTIAN HIEROGLYPH D057 130C0 
EGYPTIAN HIEROGLYPH D058 @@ -36237,6 +37066,7 @@ FFFF 130C8 EGYPTIAN HIEROGLYPH D066 130C9 EGYPTIAN HIEROGLYPH D067 * 1 heqat measure + * not to be confused with 13212 130CA EGYPTIAN HIEROGLYPH D067A * 2 heqat measures 130CB EGYPTIAN HIEROGLYPH D067B @@ -36255,7 +37085,10 @@ FFFF * 9 heqat measures @ E. Mammals 130D2 EGYPTIAN HIEROGLYPH E001 + * bull, classifier 'cattle' + * not to be confused with 130FD 130D3 EGYPTIAN HIEROGLYPH E002 + * aggressive bull 130D4 EGYPTIAN HIEROGLYPH E003 130D5 EGYPTIAN HIEROGLYPH E004 130D6 EGYPTIAN HIEROGLYPH E005 @@ -36295,9 +37128,12 @@ FFFF 130F8 EGYPTIAN HIEROGLYPH E033 130F9 EGYPTIAN HIEROGLYPH E034 130FA EGYPTIAN HIEROGLYPH E034A + * stylistic variant, use of 130F9 is preferred 130FB EGYPTIAN HIEROGLYPH E036 130FC EGYPTIAN HIEROGLYPH E037 130FD EGYPTIAN HIEROGLYPH E038 + * cow + * not to be confused with 130D2 @ F. Parts of mammals 130FE EGYPTIAN HIEROGLYPH F001 130FF EGYPTIAN HIEROGLYPH F001A @@ -36314,6 +37150,7 @@ FFFF 1310A EGYPTIAN HIEROGLYPH F012 1310B EGYPTIAN HIEROGLYPH F013 1310C EGYPTIAN HIEROGLYPH F013A + * stylistic variant, use of 1310B is preferred 1310D EGYPTIAN HIEROGLYPH F014 1310E EGYPTIAN HIEROGLYPH F015 1310F EGYPTIAN HIEROGLYPH F016 @@ -36323,9 +37160,11 @@ FFFF 13113 EGYPTIAN HIEROGLYPH F020 13114 EGYPTIAN HIEROGLYPH F021 13115 EGYPTIAN HIEROGLYPH F021A + * from hieratic 13116 EGYPTIAN HIEROGLYPH F022 13117 EGYPTIAN HIEROGLYPH F023 13118 EGYPTIAN HIEROGLYPH F024 + * mirrored version of 13117 13119 EGYPTIAN HIEROGLYPH F025 1311A EGYPTIAN HIEROGLYPH F026 1311B EGYPTIAN HIEROGLYPH F027 @@ -36334,6 +37173,7 @@ FFFF 1311E EGYPTIAN HIEROGLYPH F030 1311F EGYPTIAN HIEROGLYPH F031 13120 EGYPTIAN HIEROGLYPH F031A + * cursive variant of 1311F 13121 EGYPTIAN HIEROGLYPH F032 * transliterated as 1E96 13122 EGYPTIAN HIEROGLYPH F033 @@ -36354,25 +37194,35 @@ FFFF 13131 EGYPTIAN HIEROGLYPH F045A 13132 EGYPTIAN HIEROGLYPH F046 13133 EGYPTIAN HIEROGLYPH F046A + * rotated version of 13132 13134 EGYPTIAN HIEROGLYPH F047 + * 
mirrored version of 13132 13135 EGYPTIAN HIEROGLYPH F047A + * mirrored version of 13133 13136 EGYPTIAN HIEROGLYPH F048 13137 EGYPTIAN HIEROGLYPH F049 + * mirrored version of 13136 13138 EGYPTIAN HIEROGLYPH F050 13139 EGYPTIAN HIEROGLYPH F051 1313A EGYPTIAN HIEROGLYPH F051A 1313B EGYPTIAN HIEROGLYPH F051B + * variant of 1313A 1313C EGYPTIAN HIEROGLYPH F051C + * rotated version of 13139 1313D EGYPTIAN HIEROGLYPH F052 1313E EGYPTIAN HIEROGLYPH F053 @ G. Birds 1313F EGYPTIAN HIEROGLYPH G001 + * Egyptian vulture, Egyptological alef + * not to be confused with 13142 * transliterated as A723 x (hebrew letter alef - 05D0) x (arabic letter alef with hamza above - 0623) 13140 EGYPTIAN HIEROGLYPH G002 13141 EGYPTIAN HIEROGLYPH G003 13142 EGYPTIAN HIEROGLYPH G004 + * phonogram 'tw' + * not to be confused with 1313F 13143 EGYPTIAN HIEROGLYPH G005 13144 EGYPTIAN HIEROGLYPH G006 13145 EGYPTIAN HIEROGLYPH G006A @@ -36413,10 +37263,14 @@ FFFF 13167 EGYPTIAN HIEROGLYPH G035 13168 EGYPTIAN HIEROGLYPH G036 13169 EGYPTIAN HIEROGLYPH G036A + * stylistic variant, use of 13168 is preferred 1316A EGYPTIAN HIEROGLYPH G037 1316B EGYPTIAN HIEROGLYPH G037A + * stylistic variant, use of 1316A is preferred 1316C EGYPTIAN HIEROGLYPH G038 + * goose 1316D EGYPTIAN HIEROGLYPH G039 + * duck 1316E EGYPTIAN HIEROGLYPH G040 1316F EGYPTIAN HIEROGLYPH G041 13170 EGYPTIAN HIEROGLYPH G042 @@ -36443,6 +37297,7 @@ FFFF 13183 EGYPTIAN HIEROGLYPH H005 13184 EGYPTIAN HIEROGLYPH H006 13185 EGYPTIAN HIEROGLYPH H006A + * from hieratic 13186 EGYPTIAN HIEROGLYPH H007 13187 EGYPTIAN HIEROGLYPH H008 @ I. Amphibious animals, reptiles, etc. @@ -36477,7 +37332,7 @@ FFFF 131A0 EGYPTIAN HIEROGLYPH K006 131A1 EGYPTIAN HIEROGLYPH K007 131A2 EGYPTIAN HIEROGLYPH K008 -@ L. Invertabrata and lesser animals +@ L. 
Invertebrata and lesser animals 131A3 EGYPTIAN HIEROGLYPH L001 131A4 EGYPTIAN HIEROGLYPH L002 131A5 EGYPTIAN HIEROGLYPH L002A @@ -36486,6 +37341,7 @@ FFFF 131A8 EGYPTIAN HIEROGLYPH L005 131A9 EGYPTIAN HIEROGLYPH L006 131AA EGYPTIAN HIEROGLYPH L006A + * mirrored version of 131A9 131AB EGYPTIAN HIEROGLYPH L007 131AC EGYPTIAN HIEROGLYPH L008 @ M. Trees and plants @@ -36529,18 +37385,21 @@ FFFF 131C9 EGYPTIAN HIEROGLYPH M016 131CA EGYPTIAN HIEROGLYPH M016A 131CB EGYPTIAN HIEROGLYPH M017 - * yod + * egyptological yod + * transliterated as A7BD x (hebrew letter yod - 05D9) x (arabic letter yeh - 064A) 131CC EGYPTIAN HIEROGLYPH M017A - * transliterated as y + * phonogram 'y' x (egyptian hieroglyph z004 - 133ED) 131CD EGYPTIAN HIEROGLYPH M018 131CE EGYPTIAN HIEROGLYPH M019 131CF EGYPTIAN HIEROGLYPH M020 131D0 EGYPTIAN HIEROGLYPH M021 131D1 EGYPTIAN HIEROGLYPH M022 + * classifier 'bud, lotus bud' 131D2 EGYPTIAN HIEROGLYPH M022A + *phonogram 'nn' 131D3 EGYPTIAN HIEROGLYPH M023 131D4 EGYPTIAN HIEROGLYPH M024 131D5 EGYPTIAN HIEROGLYPH M024A @@ -36556,30 +37415,42 @@ FFFF 131DF EGYPTIAN HIEROGLYPH M032 131E0 EGYPTIAN HIEROGLYPH M033 131E1 EGYPTIAN HIEROGLYPH M033A + * variant of 131E0 131E2 EGYPTIAN HIEROGLYPH M033B + * variant of 131E0 131E3 EGYPTIAN HIEROGLYPH M034 131E4 EGYPTIAN HIEROGLYPH M035 131E5 EGYPTIAN HIEROGLYPH M036 131E6 EGYPTIAN HIEROGLYPH M037 + * older variant of 131E5 131E7 EGYPTIAN HIEROGLYPH M038 131E8 EGYPTIAN HIEROGLYPH M039 131E9 EGYPTIAN HIEROGLYPH M040 + * phonogram 'js' + * not to be confused with 132A7 or 1342A 131EA EGYPTIAN HIEROGLYPH M040A 131EB EGYPTIAN HIEROGLYPH M041 131EC EGYPTIAN HIEROGLYPH M042 131ED EGYPTIAN HIEROGLYPH M043 131EE EGYPTIAN HIEROGLYPH M044 + * thorn + * not to be confused with 133DA @ N. 
Sky, earth, water 131EF EGYPTIAN HIEROGLYPH N001 131F0 EGYPTIAN HIEROGLYPH N002 131F1 EGYPTIAN HIEROGLYPH N003 + * older variant of 131F0 131F2 EGYPTIAN HIEROGLYPH N004 131F3 EGYPTIAN HIEROGLYPH N005 + * sun + * not to be confused with 13082 or 133F8 131F4 EGYPTIAN HIEROGLYPH N006 131F5 EGYPTIAN HIEROGLYPH N007 131F6 EGYPTIAN HIEROGLYPH N008 131F7 EGYPTIAN HIEROGLYPH N009 + * variant of 131F8 131F8 EGYPTIAN HIEROGLYPH N010 + * variant of 131F7 131F9 EGYPTIAN HIEROGLYPH N011 131FA EGYPTIAN HIEROGLYPH N012 131FB EGYPTIAN HIEROGLYPH N013 @@ -36587,10 +37458,15 @@ FFFF 131FD EGYPTIAN HIEROGLYPH N015 131FE EGYPTIAN HIEROGLYPH N016 131FF EGYPTIAN HIEROGLYPH N017 + * land + * variant of 131FE 13200 EGYPTIAN HIEROGLYPH N018 + * island + * not to be confused with 132F0, 133D4, or 133F3 13201 EGYPTIAN HIEROGLYPH N018A 13202 EGYPTIAN HIEROGLYPH N018B 13203 EGYPTIAN HIEROGLYPH N019 + * logogram 'akhti' 13204 EGYPTIAN HIEROGLYPH N020 13205 EGYPTIAN HIEROGLYPH N021 13206 EGYPTIAN HIEROGLYPH N022 @@ -36598,10 +37474,13 @@ FFFF 13208 EGYPTIAN HIEROGLYPH N024 13209 EGYPTIAN HIEROGLYPH N025 1320A EGYPTIAN HIEROGLYPH N025A + * stylistic variant, use of 13209 is preferred 1320B EGYPTIAN HIEROGLYPH N026 1320C EGYPTIAN HIEROGLYPH N027 1320D EGYPTIAN HIEROGLYPH N028 1320E EGYPTIAN HIEROGLYPH N029 + * hill + * not to be confused with 133D8 * transliterated as q or as 1E33 x (hebrew letter qof - 05E7) x (arabic letter qaf - 0642) @@ -36609,21 +37488,33 @@ FFFF 13210 EGYPTIAN HIEROGLYPH N031 13211 EGYPTIAN HIEROGLYPH N032 13212 EGYPTIAN HIEROGLYPH N033 + * classifier 'granule, grain' + * not to be confused with 130C9 13213 EGYPTIAN HIEROGLYPH N033A + * classifier 'granules, grains' + * not to be confused with 133E7 13214 EGYPTIAN HIEROGLYPH N034 13215 EGYPTIAN HIEROGLYPH N034A + * stylistic variant, use of 13214 is preferred 13216 EGYPTIAN HIEROGLYPH N035 * transliterated as n 13217 EGYPTIAN HIEROGLYPH N035A + * classifier 'liquid' 13218 EGYPTIAN HIEROGLYPH N036 13219 EGYPTIAN HIEROGLYPH 
N037 + * lake * transliterated as 0161 + * not to be confused with 1328C 1321A EGYPTIAN HIEROGLYPH N037A + * variant of 13219 1321B EGYPTIAN HIEROGLYPH N038 + * variant of 13219 1321C EGYPTIAN HIEROGLYPH N039 + * variant of 13219 1321D EGYPTIAN HIEROGLYPH N040 1321E EGYPTIAN HIEROGLYPH N041 1321F EGYPTIAN HIEROGLYPH N042 + * variant of 1321E @ NL. Nomes of Lower Egypt 13220 EGYPTIAN HIEROGLYPH NL001 13221 EGYPTIAN HIEROGLYPH NL002 @@ -36685,6 +37576,7 @@ FFFF x (arabic letter heh - 0647) 13255 EGYPTIAN HIEROGLYPH O005 13256 EGYPTIAN HIEROGLYPH O005A + * mirrored version of 13255 13257 EGYPTIAN HIEROGLYPH O006 13258 EGYPTIAN HIEROGLYPH O006A * beginning of hwt or serekh enclosure @@ -36730,11 +37622,15 @@ FFFF 1327A EGYPTIAN HIEROGLYPH O028 1327B EGYPTIAN HIEROGLYPH O029 1327C EGYPTIAN HIEROGLYPH O029A + * rotated variant of 1327B 1327D EGYPTIAN HIEROGLYPH O030 + * supporting pole + * not to be confused with 13361 1327E EGYPTIAN HIEROGLYPH O030A 1327F EGYPTIAN HIEROGLYPH O031 13280 EGYPTIAN HIEROGLYPH O032 13281 EGYPTIAN HIEROGLYPH O033 + * classifier 'serekh' 13282 EGYPTIAN HIEROGLYPH O033A * end of serekh enclosure x (egyptian hieroglyph o006a - 13258) @@ -36754,10 +37650,13 @@ FFFF 1328A EGYPTIAN HIEROGLYPH O037 1328B EGYPTIAN HIEROGLYPH O038 1328C EGYPTIAN HIEROGLYPH O039 + * stone, brick + * not to be confused with 13219 1328D EGYPTIAN HIEROGLYPH O040 1328E EGYPTIAN HIEROGLYPH O041 1328F EGYPTIAN HIEROGLYPH O042 13290 EGYPTIAN HIEROGLYPH O043 + * older variant of 1328F 13291 EGYPTIAN HIEROGLYPH O044 13292 EGYPTIAN HIEROGLYPH O045 13293 EGYPTIAN HIEROGLYPH O046 @@ -36767,13 +37666,18 @@ FFFF 13297 EGYPTIAN HIEROGLYPH O050 13298 EGYPTIAN HIEROGLYPH O050A 13299 EGYPTIAN HIEROGLYPH O050B + * mirrored version of 13298 1329A EGYPTIAN HIEROGLYPH O051 @ P. 
Ships and parts of ships 1329B EGYPTIAN HIEROGLYPH P001 + * classifier 'ship, travel' 1329C EGYPTIAN HIEROGLYPH P001A + * classifier 'upset, overturn' 1329D EGYPTIAN HIEROGLYPH P002 1329E EGYPTIAN HIEROGLYPH P003 + * sacred ship 1329F EGYPTIAN HIEROGLYPH P003A + * mirrored variant of 1329E 132A0 EGYPTIAN HIEROGLYPH P004 132A1 EGYPTIAN HIEROGLYPH P005 132A2 EGYPTIAN HIEROGLYPH P006 @@ -36782,6 +37686,8 @@ FFFF 132A5 EGYPTIAN HIEROGLYPH P009 132A6 EGYPTIAN HIEROGLYPH P010 132A7 EGYPTIAN HIEROGLYPH P011 + * mooring post + * not to be confused with 131E9 or 1342A @ Q. Domestic and funerary furniture 132A8 EGYPTIAN HIEROGLYPH Q001 132A9 EGYPTIAN HIEROGLYPH Q002 @@ -36859,6 +37765,8 @@ FFFF 132EE EGYPTIAN HIEROGLYPH S025 132EF EGYPTIAN HIEROGLYPH S026 132F0 EGYPTIAN HIEROGLYPH S026A + * loin-cloth + * not to be confused with 13200, 133D4, or 133F3 132F1 EGYPTIAN HIEROGLYPH S026B 132F2 EGYPTIAN HIEROGLYPH S027 132F3 EGYPTIAN HIEROGLYPH S028 @@ -36872,12 +37780,16 @@ FFFF 132F9 EGYPTIAN HIEROGLYPH S034 132FA EGYPTIAN HIEROGLYPH S035 132FB EGYPTIAN HIEROGLYPH S035A + * variant of 132FA 132FC EGYPTIAN HIEROGLYPH S036 + * older variant of 132FA 132FD EGYPTIAN HIEROGLYPH S037 132FE EGYPTIAN HIEROGLYPH S038 132FF EGYPTIAN HIEROGLYPH S039 13300 EGYPTIAN HIEROGLYPH S040 + * phonogram 'wꜣs' 13301 EGYPTIAN HIEROGLYPH S041 + * phonogram 'ḏꜣm' 13302 EGYPTIAN HIEROGLYPH S042 13303 EGYPTIAN HIEROGLYPH S043 13304 EGYPTIAN HIEROGLYPH S044 @@ -36886,7 +37798,9 @@ FFFF @ T. 
Warfare, hunting, butchery 13307 EGYPTIAN HIEROGLYPH T001 13308 EGYPTIAN HIEROGLYPH T002 + * classifier 'striking, hitting' 13309 EGYPTIAN HIEROGLYPH T003 + * classifier 'mace' 1330A EGYPTIAN HIEROGLYPH T003A 1330B EGYPTIAN HIEROGLYPH T004 1330C EGYPTIAN HIEROGLYPH T005 @@ -36894,9 +37808,11 @@ FFFF 1330E EGYPTIAN HIEROGLYPH T007 1330F EGYPTIAN HIEROGLYPH T007A 13310 EGYPTIAN HIEROGLYPH T008 + * older variant of 13311 13311 EGYPTIAN HIEROGLYPH T008A 13312 EGYPTIAN HIEROGLYPH T009 13313 EGYPTIAN HIEROGLYPH T009A + * older variant of 13312 13314 EGYPTIAN HIEROGLYPH T010 13315 EGYPTIAN HIEROGLYPH T011 13316 EGYPTIAN HIEROGLYPH T011A @@ -36904,41 +37820,55 @@ FFFF 13318 EGYPTIAN HIEROGLYPH T013 13319 EGYPTIAN HIEROGLYPH T014 1331A EGYPTIAN HIEROGLYPH T015 + * older variant of 13319 1331B EGYPTIAN HIEROGLYPH T016 1331C EGYPTIAN HIEROGLYPH T016A 1331D EGYPTIAN HIEROGLYPH T017 1331E EGYPTIAN HIEROGLYPH T018 1331F EGYPTIAN HIEROGLYPH T019 13320 EGYPTIAN HIEROGLYPH T020 + * older variant of 1331F 13321 EGYPTIAN HIEROGLYPH T021 13322 EGYPTIAN HIEROGLYPH T022 13323 EGYPTIAN HIEROGLYPH T023 + * more recent variant of 13322 13324 EGYPTIAN HIEROGLYPH T024 13325 EGYPTIAN HIEROGLYPH T025 13326 EGYPTIAN HIEROGLYPH T026 13327 EGYPTIAN HIEROGLYPH T027 + * older variant of 13326 13328 EGYPTIAN HIEROGLYPH T028 13329 EGYPTIAN HIEROGLYPH T029 1332A EGYPTIAN HIEROGLYPH T030 + * classifier 'knife, cutting' 1332B EGYPTIAN HIEROGLYPH T031 + * phonogram 'sšm' 1332C EGYPTIAN HIEROGLYPH T032 1332D EGYPTIAN HIEROGLYPH T032A 1332E EGYPTIAN HIEROGLYPH T033 + * older variant of 13326 1332F EGYPTIAN HIEROGLYPH T033A 13330 EGYPTIAN HIEROGLYPH T034 13331 EGYPTIAN HIEROGLYPH T035 + * variant of 13330 13332 EGYPTIAN HIEROGLYPH T036 @ U. 
Agriculture, crafts, and professions 13333 EGYPTIAN HIEROGLYPH U001 13334 EGYPTIAN HIEROGLYPH U002 + * stylistic variant of 13333 13335 EGYPTIAN HIEROGLYPH U003 13336 EGYPTIAN HIEROGLYPH U004 13337 EGYPTIAN HIEROGLYPH U005 + * stylistic variant of 13336 13338 EGYPTIAN HIEROGLYPH U006 13339 EGYPTIAN HIEROGLYPH U006A + * stylistic variant of 13338 1333A EGYPTIAN HIEROGLYPH U006B + * mirrored version of 13339 1333B EGYPTIAN HIEROGLYPH U007 + * variant of 13338 1333C EGYPTIAN HIEROGLYPH U008 + * variant of 1333B 1333D EGYPTIAN HIEROGLYPH U009 1333E EGYPTIAN HIEROGLYPH U010 1333F EGYPTIAN HIEROGLYPH U011 @@ -36949,18 +37879,24 @@ FFFF 13344 EGYPTIAN HIEROGLYPH U016 13345 EGYPTIAN HIEROGLYPH U017 13346 EGYPTIAN HIEROGLYPH U018 + * variant of 13345 13347 EGYPTIAN HIEROGLYPH U019 13348 EGYPTIAN HIEROGLYPH U020 + * older variant of 13347 13349 EGYPTIAN HIEROGLYPH U021 1334A EGYPTIAN HIEROGLYPH U022 1334B EGYPTIAN HIEROGLYPH U023 1334C EGYPTIAN HIEROGLYPH U023A + * stylistic variant of 1334B 1334D EGYPTIAN HIEROGLYPH U024 1334E EGYPTIAN HIEROGLYPH U025 + * older variant of 1334D 1334F EGYPTIAN HIEROGLYPH U026 13350 EGYPTIAN HIEROGLYPH U027 + * older variant of 1334F 13351 EGYPTIAN HIEROGLYPH U028 13352 EGYPTIAN HIEROGLYPH U029 + * older variant of 13351 13353 EGYPTIAN HIEROGLYPH U029A 13354 EGYPTIAN HIEROGLYPH U030 13355 EGYPTIAN HIEROGLYPH U031 @@ -36974,11 +37910,16 @@ FFFF 1335D EGYPTIAN HIEROGLYPH U038 1335E EGYPTIAN HIEROGLYPH U039 1335F EGYPTIAN HIEROGLYPH U040 + * cursive variant of 1335E 13360 EGYPTIAN HIEROGLYPH U041 13361 EGYPTIAN HIEROGLYPH U042 + * pitchfork + * not to be confused with 1327D @ V. Rope, fiber, baskets, bags, etc. 
13362 EGYPTIAN HIEROGLYPH V001 * 100 + * classifier 'cord, rope' + * not to be confused with 133F2 13363 EGYPTIAN HIEROGLYPH V001A * 200 13364 EGYPTIAN HIEROGLYPH V001B @@ -37003,13 +37944,17 @@ FFFF 1336F EGYPTIAN HIEROGLYPH V004 13370 EGYPTIAN HIEROGLYPH V005 13371 EGYPTIAN HIEROGLYPH V006 + * phonogram 'šs' 13372 EGYPTIAN HIEROGLYPH V007 + * phonogram 'šn' 13373 EGYPTIAN HIEROGLYPH V007A 13374 EGYPTIAN HIEROGLYPH V007B 13375 EGYPTIAN HIEROGLYPH V008 13376 EGYPTIAN HIEROGLYPH V009 13377 EGYPTIAN HIEROGLYPH V010 + * logogram 'name' 13378 EGYPTIAN HIEROGLYPH V011 + * classifier 'restrain, split' 13379 EGYPTIAN HIEROGLYPH V011A * beginning of cartouche 1337A EGYPTIAN HIEROGLYPH V011B @@ -37022,15 +37967,19 @@ FFFF 1337F EGYPTIAN HIEROGLYPH V013 * transliterated as 1E6F 13380 EGYPTIAN HIEROGLYPH V014 + * variant of 1337F 13381 EGYPTIAN HIEROGLYPH V015 13382 EGYPTIAN HIEROGLYPH V016 13383 EGYPTIAN HIEROGLYPH V017 13384 EGYPTIAN HIEROGLYPH V018 + * older variant of 13383 13385 EGYPTIAN HIEROGLYPH V019 13386 EGYPTIAN HIEROGLYPH V020 * 10 + * not to be confused with 133AD 13387 EGYPTIAN HIEROGLYPH V020A * 20 + * not to be confused with 133AE 13388 EGYPTIAN HIEROGLYPH V020B * 30 13389 EGYPTIAN HIEROGLYPH V020C @@ -37047,20 +37996,27 @@ FFFF * 90 1338F EGYPTIAN HIEROGLYPH V020I * 20 + * variant of 13387 13390 EGYPTIAN HIEROGLYPH V020J * 30 + * variant of 13388 13391 EGYPTIAN HIEROGLYPH V020K * 40 + * variant of 13389 13392 EGYPTIAN HIEROGLYPH V020L * 50 + * variant of 1338A 13393 EGYPTIAN HIEROGLYPH V021 13394 EGYPTIAN HIEROGLYPH V022 13395 EGYPTIAN HIEROGLYPH V023 + * older variant of 13394 13396 EGYPTIAN HIEROGLYPH V023A 13397 EGYPTIAN HIEROGLYPH V024 13398 EGYPTIAN HIEROGLYPH V025 + * more recent variant of 13397 13399 EGYPTIAN HIEROGLYPH V026 1339A EGYPTIAN HIEROGLYPH V027 + * older variant of 13399 1339B EGYPTIAN HIEROGLYPH V028 * transliterated as 1E25 x (arabic letter hah - 062D) @@ -37069,30 +38025,38 @@ FFFF 1339E EGYPTIAN HIEROGLYPH V029A 1339F EGYPTIAN 
HIEROGLYPH V030 133A0 EGYPTIAN HIEROGLYPH V030A + * stylistic variant, use of 1339F is preferred 133A1 EGYPTIAN HIEROGLYPH V031 * transliterated as k x (hebrew letter kaf - 05DB) x (arabic letter kaf - 0643) 133A2 EGYPTIAN HIEROGLYPH V031A + * from hieratic 133A3 EGYPTIAN HIEROGLYPH V032 133A4 EGYPTIAN HIEROGLYPH V033 133A5 EGYPTIAN HIEROGLYPH V033A 133A6 EGYPTIAN HIEROGLYPH V034 + * more recent variant of 133A4 133A7 EGYPTIAN HIEROGLYPH V035 133A8 EGYPTIAN HIEROGLYPH V036 133A9 EGYPTIAN HIEROGLYPH V037 133AA EGYPTIAN HIEROGLYPH V037A 133AB EGYPTIAN HIEROGLYPH V038 + * bandage + * not to be confused with 1308B 133AC EGYPTIAN HIEROGLYPH V039 133AD EGYPTIAN HIEROGLYPH V040 * 10 in dates + * not to be confused with 13386 133AE EGYPTIAN HIEROGLYPH V040A * 20 in dates + * not to be confused with 13387 @ W. Vessels of stone and earthenware 133AF EGYPTIAN HIEROGLYPH W001 133B0 EGYPTIAN HIEROGLYPH W002 133B1 EGYPTIAN HIEROGLYPH W003 133B2 EGYPTIAN HIEROGLYPH W003A + * stylistic variant, use of 133B1 is preferred 133B3 EGYPTIAN HIEROGLYPH W004 133B4 EGYPTIAN HIEROGLYPH W005 133B5 EGYPTIAN HIEROGLYPH W006 @@ -37100,11 +38064,13 @@ FFFF 133B7 EGYPTIAN HIEROGLYPH W008 133B8 EGYPTIAN HIEROGLYPH W009 133B9 EGYPTIAN HIEROGLYPH W009A + * mirrored version of 133B8 133BA EGYPTIAN HIEROGLYPH W010 133BB EGYPTIAN HIEROGLYPH W010A 133BC EGYPTIAN HIEROGLYPH W011 * transliterated as g 133BD EGYPTIAN HIEROGLYPH W012 + * older variant of 133BC 133BE EGYPTIAN HIEROGLYPH W013 133BF EGYPTIAN HIEROGLYPH W014 133C0 EGYPTIAN HIEROGLYPH W014A @@ -37112,81 +38078,122 @@ FFFF 133C2 EGYPTIAN HIEROGLYPH W016 133C3 EGYPTIAN HIEROGLYPH W017 133C4 EGYPTIAN HIEROGLYPH W017A + * cursive variant of 133C3 133C5 EGYPTIAN HIEROGLYPH W018 + * older variant of 133C3 133C6 EGYPTIAN HIEROGLYPH W018A + * cursive variant of 133C5 133C7 EGYPTIAN HIEROGLYPH W019 133C8 EGYPTIAN HIEROGLYPH W020 133C9 EGYPTIAN HIEROGLYPH W021 133CA EGYPTIAN HIEROGLYPH W022 133CB EGYPTIAN HIEROGLYPH W023 133CC EGYPTIAN HIEROGLYPH W024 + * 
phonogramm 'nw' 133CD EGYPTIAN HIEROGLYPH W024A + * monogramm 'nw(n)' or 'nww' 133CE EGYPTIAN HIEROGLYPH W025 @ X. Loaves and cakes 133CF EGYPTIAN HIEROGLYPH X001 * transliterated as t 133D0 EGYPTIAN HIEROGLYPH X002 133D1 EGYPTIAN HIEROGLYPH X003 + * variant of 133D0 133D2 EGYPTIAN HIEROGLYPH X004 133D3 EGYPTIAN HIEROGLYPH X004A + * variant of 133D2 133D4 EGYPTIAN HIEROGLYPH X004B + * cake + * variant of 133D2 + * not to be confused with 13200, 132F0, or 133F3 133D5 EGYPTIAN HIEROGLYPH X005 + * hieratic + * variant of 133D4 133D6 EGYPTIAN HIEROGLYPH X006 133D7 EGYPTIAN HIEROGLYPH X006A 133D8 EGYPTIAN HIEROGLYPH X007 + * classifier 'food' + * not to be confused with 1320E 133D9 EGYPTIAN HIEROGLYPH X008 133DA EGYPTIAN HIEROGLYPH X008A + * bread + * variant of 133D9 + * not to be confused with 131EE @ Y. Writings, games, music 133DB EGYPTIAN HIEROGLYPH Y001 133DC EGYPTIAN HIEROGLYPH Y001A + * rotated variant of 133DB 133DD EGYPTIAN HIEROGLYPH Y002 + * older variant of 133DB 133DE EGYPTIAN HIEROGLYPH Y003 133DF EGYPTIAN HIEROGLYPH Y004 + * mirrored version of 133DE 133E0 EGYPTIAN HIEROGLYPH Y005 133E1 EGYPTIAN HIEROGLYPH Y006 133E2 EGYPTIAN HIEROGLYPH Y007 133E3 EGYPTIAN HIEROGLYPH Y008 @ Z. 
Strokes, signs derived from Hieratic, geometrical figures 133E4 EGYPTIAN HIEROGLYPH Z001 - x (egyptian hieroglyph z015 - 133FA) + * semogram index + * classifier 'single' + * not to be confuse with 133FA 133E5 EGYPTIAN HIEROGLYPH Z002 - * plurality - x (egyptian hieroglyph z015b - 133FC) + * classifier 'plural' + * not to be confused with 133FC 133E6 EGYPTIAN HIEROGLYPH Z002A + * stylistic variant of 133E5 133E7 EGYPTIAN HIEROGLYPH Z002B + * classifier 'plural' + * not to be confused with 13213 133E8 EGYPTIAN HIEROGLYPH Z002C + * variant of 133E6 133E9 EGYPTIAN HIEROGLYPH Z002D + * variant of 133E8 133EA EGYPTIAN HIEROGLYPH Z003 + * variant of 133E5 133EB EGYPTIAN HIEROGLYPH Z003A + * variant of 133EA 133EC EGYPTIAN HIEROGLYPH Z003B - * 3 + * variant of 133E7 133ED EGYPTIAN HIEROGLYPH Z004 - * duality + * classifier 'dual' * transliterated as y x (egyptian hieroglyph m017a - 131CC) 133EE EGYPTIAN HIEROGLYPH Z004A - * duality - x (egyptian hieroglyph z015a - 133FB) + * variant of 133ED + * classifier 'dual' + * transliterated as y + * not to be confused with 133FB 133EF EGYPTIAN HIEROGLYPH Z005 133F0 EGYPTIAN HIEROGLYPH Z005A + * variant of 133EF 133F1 EGYPTIAN HIEROGLYPH Z006 133F2 EGYPTIAN HIEROGLYPH Z007 + * phonogram 'w' + * not to be confused with 13362 133F3 EGYPTIAN HIEROGLYPH Z008 + * oval + * not to be confused with 13200, 132F0, or 133D4 133F4 EGYPTIAN HIEROGLYPH Z009 133F5 EGYPTIAN HIEROGLYPH Z010 + * older variant of 133F4 133F6 EGYPTIAN HIEROGLYPH Z011 133F7 EGYPTIAN HIEROGLYPH Z012 + * hieratic 133F8 EGYPTIAN HIEROGLYPH Z013 + * circle, unmarked round sign + * not to be confused with 13082 or 131F3 133F9 EGYPTIAN HIEROGLYPH Z014 + * hieratic 133FA EGYPTIAN HIEROGLYPH Z015 * 1 - x (egyptian hieroglyph z001 - 133E4) + * not to be confused with 133E4 133FB EGYPTIAN HIEROGLYPH Z015A * 2 - x (egyptian hieroglyph z004a - 133EE) + * not to be confused with 133EE 133FC EGYPTIAN HIEROGLYPH Z015B * 3 - x (egyptian hieroglyph z002 - 133E5) + * not to be confused 
with 133E5 x (egyptian hieroglyph z003 - 133EA) 133FD EGYPTIAN HIEROGLYPH Z015C * 4 @@ -37231,31 +38238,41 @@ FFFF 13412 EGYPTIAN HIEROGLYPH AA006 13413 EGYPTIAN HIEROGLYPH AA007 13414 EGYPTIAN HIEROGLYPH AA007A + * mirrored version of 13413 13415 EGYPTIAN HIEROGLYPH AA007B 13416 EGYPTIAN HIEROGLYPH AA008 13417 EGYPTIAN HIEROGLYPH AA009 13418 EGYPTIAN HIEROGLYPH AA010 13419 EGYPTIAN HIEROGLYPH AA011 1341A EGYPTIAN HIEROGLYPH AA012 + * older variant of 13419 1341B EGYPTIAN HIEROGLYPH AA013 1341C EGYPTIAN HIEROGLYPH AA014 + * older variant of 1341B 1341D EGYPTIAN HIEROGLYPH AA015 1341E EGYPTIAN HIEROGLYPH AA016 + * variant of 1341D 1341F EGYPTIAN HIEROGLYPH AA017 13420 EGYPTIAN HIEROGLYPH AA018 + * more recent variant of 1341F 13421 EGYPTIAN HIEROGLYPH AA019 13422 EGYPTIAN HIEROGLYPH AA020 13423 EGYPTIAN HIEROGLYPH AA021 13424 EGYPTIAN HIEROGLYPH AA022 13425 EGYPTIAN HIEROGLYPH AA023 13426 EGYPTIAN HIEROGLYPH AA024 + * older variant of 13425 13427 EGYPTIAN HIEROGLYPH AA025 13428 EGYPTIAN HIEROGLYPH AA026 13429 EGYPTIAN HIEROGLYPH AA027 1342A EGYPTIAN HIEROGLYPH AA028 + * phonogram 'qd' + * not to be confused with 131E9 and 132A7 1342B EGYPTIAN HIEROGLYPH AA029 + * older variant of 1342A 1342C EGYPTIAN HIEROGLYPH AA030 1342D EGYPTIAN HIEROGLYPH AA031 + * older variant of 1342C 1342E EGYPTIAN HIEROGLYPH AA032 @@ 13430 Egyptian Hieroglyph Format Controls 1343F @+ These format controls are used to render Egyptian hieroglyphic quadrats. 
@@ -38955,6 +39972,99 @@ FFFF @ Punctuation 16A6E MRO DANDA 16A6F MRO DOUBLE DANDA +@@ 16A70 Tangsa 16ACF +@ Vowels +16A70 TANGSA LETTER OZ +16A71 TANGSA LETTER OC +16A72 TANGSA LETTER OQ +16A73 TANGSA LETTER OX +16A74 TANGSA LETTER AZ +16A75 TANGSA LETTER AC +16A76 TANGSA LETTER AQ +16A77 TANGSA LETTER AX +16A78 TANGSA LETTER VZ +16A79 TANGSA LETTER VC +16A7A TANGSA LETTER VQ +16A7B TANGSA LETTER VX +16A7C TANGSA LETTER EZ +16A7D TANGSA LETTER EC +16A7E TANGSA LETTER EQ +16A7F TANGSA LETTER EX +16A80 TANGSA LETTER IZ +16A81 TANGSA LETTER IC +16A82 TANGSA LETTER IQ +16A83 TANGSA LETTER IX +16A84 TANGSA LETTER UZ +16A85 TANGSA LETTER UC +16A86 TANGSA LETTER UQ +16A87 TANGSA LETTER UX +16A88 TANGSA LETTER AWZ +16A89 TANGSA LETTER AWC +16A8A TANGSA LETTER AWQ +16A8B TANGSA LETTER AWX +16A8C TANGSA LETTER UIZ +16A8D TANGSA LETTER UIC +16A8E TANGSA LETTER UIQ +16A8F TANGSA LETTER UIX +16A90 TANGSA LETTER FINAL NG +16A91 TANGSA LETTER LONG UEX +16A92 TANGSA LETTER SHORT UEZ +16A93 TANGSA LETTER SHORT AWX +16A94 TANGSA LETTER UEC +16A95 TANGSA LETTER UEZ +16A96 TANGSA LETTER UEQ +16A97 TANGSA LETTER UEX +16A98 TANGSA LETTER UIUZ +16A99 TANGSA LETTER UIUC +16A9A TANGSA LETTER UIUQ +16A9B TANGSA LETTER UIUX +16A9C TANGSA LETTER MZ +16A9D TANGSA LETTER MC +16A9E TANGSA LETTER MQ +16A9F TANGSA LETTER MX +@ Consonants +16AA0 TANGSA LETTER KA +16AA1 TANGSA LETTER KHA +16AA2 TANGSA LETTER GA +16AA3 TANGSA LETTER NGA +16AA4 TANGSA LETTER SA +16AA5 TANGSA LETTER YA +16AA6 TANGSA LETTER WA +16AA7 TANGSA LETTER PA +16AA8 TANGSA LETTER NYA +16AA9 TANGSA LETTER PHA +16AAA TANGSA LETTER BA +16AAB TANGSA LETTER MA +16AAC TANGSA LETTER NA +16AAD TANGSA LETTER HA +16AAE TANGSA LETTER LA +16AAF TANGSA LETTER HTA +16AB0 TANGSA LETTER TA +16AB1 TANGSA LETTER DA +16AB2 TANGSA LETTER RA +16AB3 TANGSA LETTER NHA +16AB4 TANGSA LETTER SHA +16AB5 TANGSA LETTER CA +16AB6 TANGSA LETTER TSA +16AB7 TANGSA LETTER GHA +16AB8 TANGSA LETTER HTTA +16AB9 TANGSA LETTER THA +16ABA TANGSA LETTER XA +16ABB 
TANGSA LETTER FA +16ABC TANGSA LETTER DHA +16ABD TANGSA LETTER CHA +16ABE TANGSA LETTER ZA +@ Digits +16AC0 TANGSA DIGIT ZERO +16AC1 TANGSA DIGIT ONE +16AC2 TANGSA DIGIT TWO +16AC3 TANGSA DIGIT THREE +16AC4 TANGSA DIGIT FOUR +16AC5 TANGSA DIGIT FIVE +16AC6 TANGSA DIGIT SIX +16AC7 TANGSA DIGIT SEVEN +16AC8 TANGSA DIGIT EIGHT +16AC9 TANGSA DIGIT NINE @@ 16AD0 Bassa Vah 16AFF @ Consonant letters 16AD0 BASSA VAH LETTER ENNI @@ -40862,6 +41972,23 @@ FFFF 18CD4 KHITAN SMALL SCRIPT CHARACTER-18CD4 18CD5 KHITAN SMALL SCRIPT CHARACTER-18CD5 @@ 18D00 Tangut Supplement 18D08 +@@ 1AFF0 Kana Extended-B 1AFFF +@+ This block contains tone marks occasionally used in furigana extensions to annotate Minnan Chinese. +@ Tone marks +1AFF0 KATAKANA LETTER MINNAN TONE-2 +1AFF1 KATAKANA LETTER MINNAN TONE-3 +1AFF2 KATAKANA LETTER MINNAN TONE-4 +1AFF3 KATAKANA LETTER MINNAN TONE-5 +1AFF5 KATAKANA LETTER MINNAN TONE-7 +1AFF6 KATAKANA LETTER MINNAN TONE-8 +@ Nasalized tone marks +1AFF7 KATAKANA LETTER MINNAN NASALIZED TONE-1 +1AFF8 KATAKANA LETTER MINNAN NASALIZED TONE-2 +1AFF9 KATAKANA LETTER MINNAN NASALIZED TONE-3 +1AFFA KATAKANA LETTER MINNAN NASALIZED TONE-4 +1AFFB KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD KATAKANA LETTER MINNAN NASALIZED TONE-7 +1AFFE KATAKANA LETTER MINNAN NASALIZED TONE-8 @@ 1B000 Kana Supplement 1B0FF @ Historic Katakana 1B000 KATAKANA LETTER ARCHAIC E @@ -41442,6 +42569,13 @@ FFFF * derived from 65E0 1B11E HENTAIGANA LETTER N-MU-MO-2 * derived from 65E0 +@ Historic Hiragana +1B11F HIRAGANA LETTER ARCHAIC WU + * derived from 6C59 +@ Historic Katakana +1B120 KATAKANA LETTER ARCHAIC YI +1B121 KATAKANA LETTER ARCHAIC YE +1B122 KATAKANA LETTER ARCHAIC WU @@ 1B130 Small Kana Extension 1B16F @ Historic small hiragana letters 1B150 HIRAGANA LETTER SMALL WI @@ -42357,6 +43491,210 @@ FFFF = Sloan contracted ending oo/o + ZWSP 1BCA3 SHORTHAND FORMAT UP STEP = Sloan contracted ending uh/au/aui + ZWSP +@@ 1CF00 Znamenny Musical Notation 1CFCF +@ Combining red marks +1CF00 
ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT +1CF01 ZNAMENNY COMBINING MARK NIZKO S KRYZHEM ON LEFT +1CF02 ZNAMENNY COMBINING MARK TSATA ON LEFT +1CF03 ZNAMENNY COMBINING MARK GORAZDO NIZKO ON LEFT +1CF04 ZNAMENNY COMBINING MARK NIZKO ON LEFT +1CF05 ZNAMENNY COMBINING MARK SREDNE ON LEFT +1CF06 ZNAMENNY COMBINING MARK MALO POVYSHE ON LEFT +1CF07 ZNAMENNY COMBINING MARK POVYSHE ON LEFT +1CF08 ZNAMENNY COMBINING MARK VYSOKO ON LEFT +1CF09 ZNAMENNY COMBINING MARK MALO POVYSHE S KHOKHLOM ON LEFT +1CF0A ZNAMENNY COMBINING MARK POVYSHE S KHOKHLOM ON LEFT +1CF0B ZNAMENNY COMBINING MARK VYSOKO S KHOKHLOM ON LEFT +1CF0C ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON RIGHT +1CF0D ZNAMENNY COMBINING MARK NIZKO S KRYZHEM ON RIGHT +1CF0E ZNAMENNY COMBINING MARK TSATA ON RIGHT +1CF0F ZNAMENNY COMBINING MARK GORAZDO NIZKO ON RIGHT +1CF10 ZNAMENNY COMBINING MARK NIZKO ON RIGHT +1CF11 ZNAMENNY COMBINING MARK SREDNE ON RIGHT +1CF12 ZNAMENNY COMBINING MARK MALO POVYSHE ON RIGHT +1CF13 ZNAMENNY COMBINING MARK POVYSHE ON RIGHT +1CF14 ZNAMENNY COMBINING MARK VYSOKO ON RIGHT +1CF15 ZNAMENNY COMBINING MARK MALO POVYSHE S KHOKHLOM ON RIGHT +1CF16 ZNAMENNY COMBINING MARK POVYSHE S KHOKHLOM ON RIGHT +1CF17 ZNAMENNY COMBINING MARK VYSOKO S KHOKHLOM ON RIGHT +1CF18 ZNAMENNY COMBINING MARK TSATA S KRYZHEM +1CF19 ZNAMENNY COMBINING MARK MALO POVYSHE S KRYZHEM +1CF1A ZNAMENNY COMBINING MARK STRANNO MALO POVYSHE +1CF1B ZNAMENNY COMBINING MARK POVYSHE S KRYZHEM +1CF1C ZNAMENNY COMBINING MARK POVYSHE STRANNO +1CF1D ZNAMENNY COMBINING MARK VYSOKO S KRYZHEM +1CF1E ZNAMENNY COMBINING MARK MALO POVYSHE STRANNO +1CF1F ZNAMENNY COMBINING MARK GORAZDO VYSOKO +1CF20 ZNAMENNY COMBINING MARK ZELO +1CF21 ZNAMENNY COMBINING MARK ON +1CF22 ZNAMENNY COMBINING MARK RAVNO +1CF23 ZNAMENNY COMBINING MARK TIKHAYA +1CF24 ZNAMENNY COMBINING MARK BORZAYA +1CF25 ZNAMENNY COMBINING MARK UDARKA +1CF26 ZNAMENNY COMBINING MARK PODVERTKA +1CF27 ZNAMENNY COMBINING MARK LOMKA +1CF28 ZNAMENNY COMBINING MARK KUPNAYA 
+1CF29 ZNAMENNY COMBINING MARK KACHKA +1CF2A ZNAMENNY COMBINING MARK ZEVOK +1CF2B ZNAMENNY COMBINING MARK SKOBA +1CF2C ZNAMENNY COMBINING MARK RAZSEKA +1CF2D ZNAMENNY COMBINING MARK KRYZH ON LEFT +@ Combining black marks +1CF30 ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO +1CF31 ZNAMENNY COMBINING TONAL RANGE MARK SVETLO +1CF32 ZNAMENNY COMBINING TONAL RANGE MARK TRESVETLO +1CF33 ZNAMENNY COMBINING MARK ZADERZHKA + = ottyazhka +1CF34 ZNAMENNY COMBINING MARK DEMESTVENNY ZADERZHKA +1CF35 ZNAMENNY COMBINING MARK OTSECHKA +1CF36 ZNAMENNY COMBINING MARK PODCHASHIE +1CF37 ZNAMENNY COMBINING MARK PODCHASHIE WITH VERTICAL STROKE +1CF38 ZNAMENNY COMBINING MARK CHASHKA +1CF39 ZNAMENNY COMBINING MARK CHASHKA POLNAYA +1CF3A ZNAMENNY COMBINING MARK OBLACHKO +1CF3B ZNAMENNY COMBINING MARK SOROCHYA NOZHKA + = sokolik +1CF3C ZNAMENNY COMBINING MARK TOCHKA +1CF3D ZNAMENNY COMBINING MARK DVOETOCHIE +1CF3E ZNAMENNY COMBINING ATTACHING VERTICAL OMET +1CF3F ZNAMENNY COMBINING MARK CURVED OMET +1CF40 ZNAMENNY COMBINING MARK KRYZH +1CF41 ZNAMENNY COMBINING LOWER TONAL RANGE INDICATOR +@ Modifying marks for priznaki +1CF42 ZNAMENNY PRIZNAK MODIFIER LEVEL-2 +1CF43 ZNAMENNY PRIZNAK MODIFIER LEVEL-3 +1CF44 ZNAMENNY PRIZNAK MODIFIER DIRECTION FLIP +1CF45 ZNAMENNY PRIZNAK MODIFIER KRYZH +1CF46 ZNAMENNY PRIZNAK MODIFIER ROG +@ Znamenny neumes +1CF50 ZNAMENNY NEUME KRYUK +1CF51 ZNAMENNY NEUME KRYUK TIKHY +1CF52 ZNAMENNY NEUME PARAKLIT +1CF53 ZNAMENNY NEUME DVA V CHELNU +1CF54 ZNAMENNY NEUME KLYUCH + = kryuk klyuchevoy +1CF55 ZNAMENNY NEUME ZANOZHEK +1CF56 ZNAMENNY NEUME STOPITSA +1CF57 ZNAMENNY NEUME STOPITSA S OCHKOM +1CF58 ZNAMENNY NEUME PEREVODKA +1CF59 ZNAMENNY NEUME PEREVODKA NEPOSTOYANNAYA +1CF5A ZNAMENNY NEUME STOPITSA WITH SOROCHYA NOZHKA + * not a decomposable character +1CF5B ZNAMENNY NEUME CHELYUSTKA +1CF5C ZNAMENNY NEUME PALKA +1CF5D ZNAMENNY NEUME ZAPYATAYA +1CF5E ZNAMENNY NEUME GOLUBCHIK BORZY +1CF5F ZNAMENNY NEUME GOLUBCHIK TIKHY +1CF60 ZNAMENNY NEUME GOLUBCHIK MRACHNY +1CF61 
ZNAMENNY NEUME GOLUBCHIK SVETLY +1CF62 ZNAMENNY NEUME GOLUBCHIK TRESVETLY + = golubchik nepostoyanny +1CF63 ZNAMENNY NEUME VRAKHIYA PROSTAYA +1CF64 ZNAMENNY NEUME VRAKHIYA MRACHNAYA +1CF65 ZNAMENNY NEUME VRAKHIYA SVETLAYA +1CF66 ZNAMENNY NEUME VRAKHIYA TRESVETLAYA + = vrakhia nepostoyannaya +1CF67 ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA PROSTAYA +1CF68 ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA MRACHNAYA +1CF69 ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA SVETLAYA +1CF6A ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA TRESVETLAYA + = vrakhia klyuchevaya nepostoyannaya +1CF6B ZNAMENNY NEUME DOUBLE ZAPYATAYA +1CF6C ZNAMENNY NEUME REVERSED CHELYUSTKA +1CF6D ZNAMENNY NEUME DERBITSA +1CF6E ZNAMENNY NEUME KHAMILO +1CF6F ZNAMENNY NEUME CHASHKA +1CF70 ZNAMENNY NEUME PODCHASHIE +1CF71 ZNAMENNY NEUME SKAMEYTSA MRACHNAYA +1CF72 ZNAMENNY NEUME SKAMEYTSA SVETLAYA +1CF73 ZNAMENNY NEUME SKAMEYTSA TRESVETLAYA +1CF74 ZNAMENNY NEUME SKAMEYTSA TIKHAYA +1CF75 ZNAMENNY NEUME DEMESTVENNY KLYUCH + = skameytsa klyuchevaya +1CF76 ZNAMENNY NEUME SKAMEYTSA KLYUCHEVAYA SVETLAYA +1CF77 ZNAMENNY NEUME SKAMEYTSA KLYUCHENEPOSTOYANNAYA +1CF78 ZNAMENNY NEUME SKAMEYTSA KLYUCHEVAYA TIKHAYA +1CF79 ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA PROSTAYA +1CF7A ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA SVETLAYA +1CF7B ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA NEPOSTOYANNAYA +1CF7C ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA KLYUCHEVAYA +1CF7D ZNAMENNY NEUME SLOZHITIE +1CF7E ZNAMENNY NEUME SLOZHITIE S ZAPYATOY +1CF7F ZNAMENNY NEUME SLOZHITIE ZAKRYTOE +1CF80 ZNAMENNY NEUME SLOZHITIE S KRYZHEM +1CF81 ZNAMENNY NEUME KRYZH +1CF82 ZNAMENNY NEUME ROG +1CF83 ZNAMENNY NEUME FITA +1CF84 ZNAMENNY NEUME KOBYLA +1CF85 ZNAMENNY NEUME ZMEYTSA + = litso +1CF86 ZNAMENNY NEUME STATYA +1CF87 ZNAMENNY NEUME STATYA S ZAPYATOY +1CF88 ZNAMENNY NEUME STATYA S KRYZHEM +1CF89 ZNAMENNY NEUME STATYA S ZAPYATOY I KRYZHEM +1CF8A ZNAMENNY NEUME STATYA S KRYZHEM I ZAPYATOY +1CF8B ZNAMENNY NEUME STATYA ZAKRYTAYA +1CF8C ZNAMENNY NEUME STATYA ZAKRYTAYA S ZAPYATOY +1CF8D ZNAMENNY NEUME STATYA 
S ROGOM +1CF8E ZNAMENNY NEUME STATYA S DVUMYA ZAPYATYMI +1CF8F ZNAMENNY NEUME STATYA S ZAPYATOY I PODCHASHIEM +1CF90 ZNAMENNY NEUME POLKULIZMY + * not a decomposable character +1CF91 ZNAMENNY NEUME STATYA NEPOSTOYANNAYA +1CF92 ZNAMENNY NEUME STRELA PROSTAYA +1CF93 ZNAMENNY NEUME STRELA MRACHNOTIKHAYA +1CF94 ZNAMENNY NEUME STRELA KRYZHEVAYA + = strela polukryzhevaya +1CF95 ZNAMENNY NEUME STRELA POLUPOVODNAYA +1CF96 ZNAMENNY NEUME STRELA POVODNAYA +1CF97 ZNAMENNY NEUME STRELA NEPOSTOYANNAYA +1CF98 ZNAMENNY NEUME STRELA KLYUCHEPOVODNAYA +1CF99 ZNAMENNY NEUME STRELA KLYUCHENEPOSTOYANNAYA +1CF9A ZNAMENNY NEUME STRELA TIKHAYA PUTNAYA +1CF9B ZNAMENNY NEUME STRELA DVOECHELNAYA +1CF9C ZNAMENNY NEUME STRELA DVOECHELNOKRYZHEVAYA +1CF9D ZNAMENNY NEUME STRELA DVOECHELNOPOVODNAYA +1CF9E ZNAMENNY NEUME STRELA DVOECHELNAYA KLYUCHEVAYA +1CF9F ZNAMENNY NEUME STRELA DVOECHELNOPOVODNAYA KLYUCHEVAYA +1CFA0 ZNAMENNY NEUME STRELA GROMNAYA WITH SINGLE ZAPYATAYA +1CFA1 ZNAMENNY NEUME STRELA GROMOPOVODNAYA WITH SINGLE ZAPYATAYA +1CFA2 ZNAMENNY NEUME STRELA GROMNAYA +1CFA3 ZNAMENNY NEUME STRELA GROMOPOVODNAYA +1CFA4 ZNAMENNY NEUME STRELA GROMOPOVODNAYA WITH DOUBLE ZAPYATAYA +1CFA5 ZNAMENNY NEUME STRELA GROMOKRYZHEVAYA +1CFA6 ZNAMENNY NEUME STRELA GROMOKRYZHEVAYA POVODNAYA + = strela gromomrachnaya s kryzhem +1CFA7 ZNAMENNY NEUME MECHIK +1CFA8 ZNAMENNY NEUME MECHIK POVODNY +1CFA9 ZNAMENNY NEUME MECHIK KLYUCHEVOY +1CFAA ZNAMENNY NEUME MECHIK KLYUCHEPOVODNY +1CFAB ZNAMENNY NEUME MECHIK KLYUCHENEPOSTOYANNY +1CFAC ZNAMENNY NEUME STRELA TRYASOGLASNAYA +1CFAD ZNAMENNY NEUME STRELA TRYASOPOVODNAYA +1CFAE ZNAMENNY NEUME STRELA TRYASOSTRELNAYA +1CFAF ZNAMENNY NEUME OSOKA +1CFB0 ZNAMENNY NEUME OSOKA SVETLAYA +1CFB1 ZNAMENNY NEUME OSOKA TRESVETLAYA + = osoka nepostoyannaya +1CFB2 ZNAMENNY NEUME OSOKA KRYUKOVAYA SVETLAYA +1CFB3 ZNAMENNY NEUME OSOKA KLYUCHEVAYA SVETLAYA +1CFB4 ZNAMENNY NEUME OSOKA KLYUCHEVAYA NEPOSTOYANNAYA +1CFB5 ZNAMENNY NEUME STRELA KRYUKOVAYA +1CFB6 ZNAMENNY NEUME STRELA KRYUKOVAYA 
POVODNAYA +1CFB7 ZNAMENNY NEUME STRELA KRYUKOVAYA GROMNAYA WITH SINGLE ZAPYATAYA +1CFB8 ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA WITH SINGLE ZAPYATAYA +1CFB9 ZNAMENNY NEUME STRELA KRYUKOVAYA GROMNAYA +1CFBA ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA +1CFBB ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA WITH DOUBLE ZAPYATAYA +1CFBC ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOKRYZHEVAYA +1CFBD ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOKRYZHEVAYA POVODNAYA + = strela kryukovaya gromomrachnaya s kryzhem +1CFBE ZNAMENNY NEUME STRELA KRYUKOVAYA TRYASKA +1CFBF ZNAMENNY NEUME KUFISMA +1CFC0 ZNAMENNY NEUME OBLAKO +1CFC1 ZNAMENNY NEUME DUDA +1CFC2 ZNAMENNY NEUME NEMKA +1CFC3 ZNAMENNY NEUME PAUK @@ 1D000 Byzantine Musical Symbols 1D0FF @@+ @ Prosodies (Prosodics) @@ -42956,6 +44294,11 @@ FFFF 1D1E7 MUSICAL SYMBOL KIEVAN EIGHTH NOTE STEM UP @ Accidental 1D1E8 MUSICAL SYMBOL KIEVAN FLAT SIGN +@ Iranian notation +@+ The following range is specific to Iranian classical music. +@ Accidentals for quarter tones +1D1E9 MUSICAL SYMBOL SORI +1D1EA MUSICAL SYMBOL KORON @@ 1D200 Ancient Greek Musical Notation 1D24F @ Ancient Greek vocalic notation @+ In a few instances vocalic and instrumental symbols have been unified with each other. In other instances they have been unified with regular Greek letters. @@ -43601,57 +44944,93 @@ FFFF @ Script symbols @+ Script symbols already encoded in the Letterlike Symbols block are omitted here to avoid duplicate encoding. Fonts that use a less elaborate style are also acceptable for many uses, as long as they can be distinguished from serifed and italic styles. 
1D49C MATHEMATICAL SCRIPT CAPITAL A + ~ 1D49C FE00 chancery style + ~ 1D49C FE01 roundhand style # 0041 latin capital letter a 1D49D x (script capital b - 212C) 1D49E MATHEMATICAL SCRIPT CAPITAL C + ~ 1D49E FE00 chancery style + ~ 1D49E FE01 roundhand style # 0043 latin capital letter c 1D49F MATHEMATICAL SCRIPT CAPITAL D + ~ 1D49F FE00 chancery style + ~ 1D49F FE01 roundhand style # 0044 latin capital letter d 1D4A0 x (script capital e - 2130) 1D4A1 x (script capital f - 2131) 1D4A2 MATHEMATICAL SCRIPT CAPITAL G + ~ 1D4A2 FE00 chancery style + ~ 1D4A2 FE01 roundhand style # 0047 latin capital letter g 1D4A3 x (script capital h - 210B) 1D4A4 x (script capital i - 2110) 1D4A5 MATHEMATICAL SCRIPT CAPITAL J + ~ 1D4A5 FE00 chancery style + ~ 1D4A5 FE01 roundhand style # 004A latin capital letter j 1D4A6 MATHEMATICAL SCRIPT CAPITAL K + ~ 1D4A6 FE00 chancery style + ~ 1D4A6 FE01 roundhand style # 004B latin capital letter k 1D4A7 x (script capital l - 2112) 1D4A8 x (script capital m - 2133) 1D4A9 MATHEMATICAL SCRIPT CAPITAL N + ~ 1D4A9 FE00 chancery style + ~ 1D4A9 FE01 roundhand style # 004E latin capital letter n 1D4AA MATHEMATICAL SCRIPT CAPITAL O + ~ 1D4AA FE00 chancery style + ~ 1D4AA FE01 roundhand style # 004F latin capital letter o 1D4AB MATHEMATICAL SCRIPT CAPITAL P = power set + ~ 1D4AB FE00 chancery style + ~ 1D4AB FE01 roundhand style # 0050 latin capital letter p 1D4AC MATHEMATICAL SCRIPT CAPITAL Q + ~ 1D4AC FE00 chancery style + ~ 1D4AC FE01 roundhand style # 0051 latin capital letter q 1D4AD x (script capital r - 211B) 1D4AE MATHEMATICAL SCRIPT CAPITAL S + ~ 1D4AE FE00 chancery style + ~ 1D4AE FE01 roundhand style # 0053 latin capital letter s 1D4AF MATHEMATICAL SCRIPT CAPITAL T + ~ 1D4AF FE00 chancery style + ~ 1D4AF FE01 roundhand style # 0054 latin capital letter t 1D4B0 MATHEMATICAL SCRIPT CAPITAL U + ~ 1D4B0 FE00 chancery style + ~ 1D4B0 FE01 roundhand style # 0055 latin capital letter u 1D4B1 MATHEMATICAL SCRIPT CAPITAL V + ~ 1D4B1 FE00 chancery 
style + ~ 1D4B1 FE01 roundhand style # 0056 latin capital letter v 1D4B2 MATHEMATICAL SCRIPT CAPITAL W + ~ 1D4B2 FE00 chancery style + ~ 1D4B2 FE01 roundhand style # 0057 latin capital letter w 1D4B3 MATHEMATICAL SCRIPT CAPITAL X + ~ 1D4B3 FE00 chancery style + ~ 1D4B3 FE01 roundhand style # 0058 latin capital letter x 1D4B4 MATHEMATICAL SCRIPT CAPITAL Y + ~ 1D4B4 FE00 chancery style + ~ 1D4B4 FE01 roundhand style # 0059 latin capital letter y 1D4B5 MATHEMATICAL SCRIPT CAPITAL Z + ~ 1D4B5 FE00 chancery style + ~ 1D4B5 FE01 roundhand style # 005A latin capital letter z 1D4B6 MATHEMATICAL SCRIPT SMALL A # 0061 latin small letter a @@ -45368,6 +46747,7 @@ FFFF # 0038 digit eight 1D7FF MATHEMATICAL MONOSPACE DIGIT NINE # 0039 digit nine +@~ Standardized Variation Sequences @@ 1D800 Sutton SignWriting 1DAAF @ Hand shapes with index finger 1D800 SIGNWRITING HAND-FIST INDEX @@ -46063,6 +47443,45 @@ FFFF 1DAAD SIGNWRITING ROTATION MODIFIER-14 1DAAE SIGNWRITING ROTATION MODIFIER-15 1DAAF SIGNWRITING ROTATION MODIFIER-16 +@@ 1DF00 Latin Extended-G 1DFFF +@ Extended IPA for disordered speech +1DF00 LATIN SMALL LETTER FENG DIGRAPH WITH TRILL +1DF01 LATIN SMALL LETTER REVERSED SCRIPT G +1DF02 LATIN LETTER SMALL CAPITAL TURNED G +1DF03 LATIN SMALL LETTER REVERSED K +1DF04 LATIN LETTER SMALL CAPITAL L WITH BELT +1DF05 LATIN SMALL LETTER LEZH WITH RETROFLEX HOOK +1DF06 LATIN SMALL LETTER TURNED Y WITH BELT +1DF07 LATIN SMALL LETTER REVERSED ENG +@ IPA extensions +1DF08 LATIN SMALL LETTER TURNED R WITH LONG LEG AND RETROFLEX HOOK +1DF09 LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +@ Clicks +1DF0B LATIN SMALL LETTER ESH WITH DOUBLE BAR +1DF0C LATIN SMALL LETTER ESH WITH DOUBLE BAR AND CURL +1DF0D LATIN SMALL LETTER TURNED T WITH CURL +1DF0E LATIN LETTER INVERTED GLOTTAL STOP WITH CURL +1DF0F LATIN LETTER STRETCHED C WITH CURL +1DF10 LATIN LETTER SMALL CAPITAL TURNED K +@ Lateral +1DF11 LATIN SMALL LETTER L WITH FISHHOOK 
+@ Letters with palatal hooks +1DF12 LATIN SMALL LETTER DEZH DIGRAPH WITH PALATAL HOOK +1DF13 LATIN SMALL LETTER L WITH BELT AND PALATAL HOOK +1DF14 LATIN SMALL LETTER ENG WITH PALATAL HOOK +1DF15 LATIN SMALL LETTER TURNED R WITH PALATAL HOOK +1DF16 LATIN SMALL LETTER R WITH FISHHOOK AND PALATAL HOOK +1DF17 LATIN SMALL LETTER TESH DIGRAPH WITH PALATAL HOOK +1DF18 LATIN SMALL LETTER EZH WITH PALATAL HOOK +@ Letters with retroflex hooks +1DF19 LATIN SMALL LETTER DEZH DIGRAPH WITH RETROFLEX HOOK +1DF1A LATIN SMALL LETTER I WITH STROKE AND RETROFLEX HOOK +1DF1B LATIN SMALL LETTER O WITH RETROFLEX HOOK +1DF1C LATIN SMALL LETTER TESH DIGRAPH WITH RETROFLEX HOOK +1DF1D LATIN SMALL LETTER C WITH RETROFLEX HOOK +@ IPA extension +1DF1E LATIN SMALL LETTER S WITH CURL @@ 1E000 Glagolitic Supplement 1E02F @ Combining letters 1E000 COMBINING GLAGOLITIC LETTER AZU @@ -46220,6 +47639,41 @@ FFFF 1E14F NYIAKENG PUACHUE HMONG CIRCLED CA * used to indicate ownership x (nyiakeng puachue hmong letter ca - 1E108) +@@ 1E290 Toto 1E2BF +@ Basic consonants +1E290 TOTO LETTER PA +1E291 TOTO LETTER BA +1E292 TOTO LETTER TA +1E293 TOTO LETTER DA +1E294 TOTO LETTER KA +1E295 TOTO LETTER GA +1E296 TOTO LETTER MA +1E297 TOTO LETTER NA +1E298 TOTO LETTER NGA +1E299 TOTO LETTER SA +1E29A TOTO LETTER CHA +1E29B TOTO LETTER YA +1E29C TOTO LETTER WA +1E29D TOTO LETTER JA +1E29E TOTO LETTER HA +1E29F TOTO LETTER RA +1E2A0 TOTO LETTER LA +@ Basic vowels +1E2A1 TOTO LETTER I +1E2A2 TOTO LETTER BREATHY I +1E2A3 TOTO LETTER IU +1E2A4 TOTO LETTER BREATHY IU +1E2A5 TOTO LETTER U +1E2A6 TOTO LETTER E +1E2A7 TOTO LETTER BREATHY E +1E2A8 TOTO LETTER EO +1E2A9 TOTO LETTER BREATHY EO +1E2AA TOTO LETTER O +1E2AB TOTO LETTER AE +1E2AC TOTO LETTER BREATHY AE +1E2AD TOTO LETTER A +@ Sign +1E2AE TOTO SIGN RISING TONE @@ 1E2C0 Wancho 1E2FF @ Letters 1E2C0 WANCHO LETTER AA @@ -46286,6 +47740,64 @@ FFFF 1E2FF WANCHO NGUN SIGN = rupee x (indian rupee sign - 20B9) +@@ 1E7E0 Ethiopic Extended-B 1E7FF +@ Syllables for Gurage 
+1E7E0 ETHIOPIC SYLLABLE HHYA + x (ethiopic syllable xya - 2DD0) +1E7E1 ETHIOPIC SYLLABLE HHYU + x (ethiopic syllable xyu - 2DD1) +1E7E2 ETHIOPIC SYLLABLE HHYI + x (ethiopic syllable xyi - 2DD2) +1E7E3 ETHIOPIC SYLLABLE HHYAA + x (ethiopic syllable xyaa - 2DD3) +1E7E4 ETHIOPIC SYLLABLE HHYEE + x (ethiopic syllable xyee - 2DD4) +1E7E5 ETHIOPIC SYLLABLE HHYE + x (ethiopic syllable xye - 2DD5) +1E7E6 ETHIOPIC SYLLABLE HHYO + x (ethiopic syllable xyo - 2DD6) +1E7E8 ETHIOPIC SYLLABLE GURAGE HHWA + x (ethiopic syllable kxwa - 12C0) +1E7E9 ETHIOPIC SYLLABLE HHWI + x (ethiopic syllable kxwi - 12C2) +1E7EA ETHIOPIC SYLLABLE HHWEE + x (ethiopic syllable kxwee - 12C4) +1E7EB ETHIOPIC SYLLABLE HHWE + x (ethiopic syllable kxwe - 12C5) +1E7ED ETHIOPIC SYLLABLE GURAGE MWI + x (ethiopic syllable mwi - 1381) +1E7EE ETHIOPIC SYLLABLE GURAGE MWEE + x (ethiopic syllable mwee - 1382) +1E7F0 ETHIOPIC SYLLABLE GURAGE QWI + x (ethiopic syllable qwi - 124A) +1E7F1 ETHIOPIC SYLLABLE GURAGE QWEE + x (ethiopic syllable qwee - 124C) +1E7F2 ETHIOPIC SYLLABLE GURAGE QWE + x (ethiopic syllable qwe - 124D) +1E7F3 ETHIOPIC SYLLABLE GURAGE BWI + x (ethiopic syllable bwi - 1385) +1E7F4 ETHIOPIC SYLLABLE GURAGE BWEE + x (ethiopic syllable bwee - 1386) +1E7F5 ETHIOPIC SYLLABLE GURAGE KWI + x (ethiopic syllable kwi - 12B2) +1E7F6 ETHIOPIC SYLLABLE GURAGE KWEE + x (ethiopic syllable kwee - 12B4) +1E7F7 ETHIOPIC SYLLABLE GURAGE KWE + x (ethiopic syllable kwe - 12B5) +1E7F8 ETHIOPIC SYLLABLE GURAGE GWI + x (ethiopic syllable gwi - 1312) +1E7F9 ETHIOPIC SYLLABLE GURAGE GWEE + x (ethiopic syllable gwee - 1314) +1E7FA ETHIOPIC SYLLABLE GURAGE GWE + x (ethiopic syllable gwe - 1315) +1E7FB ETHIOPIC SYLLABLE GURAGE FWI + x (ethiopic syllable fwi - 1389) +1E7FC ETHIOPIC SYLLABLE GURAGE FWEE + x (ethiopic syllable fwee - 138A) +1E7FD ETHIOPIC SYLLABLE GURAGE PWI + x (ethiopic syllable pwi - 138D) +1E7FE ETHIOPIC SYLLABLE GURAGE PWEE + x (ethiopic syllable pwee - 138E) @@ 1E800 Mende Kikakui 1E8DF @+ Annotations 
refer to the syllabaries of Amara Mansaray and David Dalby. @ Syllables in k- @@ -48684,9 +50196,11 @@ FFFF 1F448 WHITE LEFT POINTING BACKHAND INDEX x (white left pointing index - 261C) x (black left pointing backhand index - 1F59C) + x (leftwards hand - 1FAF2) 1F449 WHITE RIGHT POINTING BACKHAND INDEX x (white right pointing index - 261E) x (black right pointing backhand index - 1F59D) + x (rightwards hand - 1FAF1) 1F44A FISTED HAND SIGN = punch x (raised fist - 270A) @@ -48758,6 +50272,7 @@ FFFF @ Fairy tale symbols 1F478 PRINCESS x (prince - 1F934) + x (person with crown - 1FAC5) 1F479 JAPANESE OGRE 1F47A JAPANESE GOBLIN 1F47B GHOST @@ -48839,6 +50354,7 @@ FFFF 1F4A7 DROPLET * represents a drop of sweat or drop of water x (black droplet - 1F322) + x (drop of blood - 1FA78) 1F4A8 DASH SYMBOL = running dash, briffits 1F4A9 PILE OF POO @@ -49018,6 +50534,7 @@ FFFF 1F50A SPEAKER WITH THREE SOUND WAVES = sound 1F50B BATTERY + x (low battery - 1FAAB) 1F50C ELECTRIC PLUG 1F50D LEFT-POINTING MAGNIFYING GLASS = search @@ -49435,6 +50952,7 @@ FFFF = rated for sex = kiss x (kiss mark - 1F48B) + x (biting lip - 1FAE6) 1F5E3 SPEAKING HEAD IN SILHOUETTE = rated for strong language @ Sound symbols @@ -49823,6 +51341,9 @@ FFFF 1F6D6 HUT 1F6D7 ELEVATOR @ Miscellaneous symbols +1F6DD PLAYGROUND SLIDE +1F6DE WHEEL +1F6DF RING BUOY 1F6E0 HAMMER AND WRENCH = tools, repair facility x (hammer and pick - 2692) @@ -50267,6 +51788,14 @@ FFFF 1F7E9 LARGE GREEN SQUARE 1F7EA LARGE PURPLE SQUARE 1F7EB LARGE BROWN SQUARE +@ Miscellaneous symbol +1F7F0 HEAVY EQUALS SIGN + * symbol of equality + x (equals sign - 003D) + x (heavy multiplication x - 2716) + x (heavy plus sign - 2795) + x (geta mark - 3013) + x (roman sextans sign - 10190) @@ 1F800 Supplemental Arrows-C 1F8FF @ Arrows with triangle arrowheads 1F800 LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD @@ -50490,9 +52019,12 @@ FFFF 1F919 CALL ME HAND 1F91A RAISED BACK OF HAND 1F91B LEFT-FACING FIST + x (leftwards hand - 1FAF2) 1F91C 
RIGHT-FACING FIST + x (rightwards hand - 1FAF1) 1F91D HANDSHAKE 1F91E HAND WITH INDEX AND MIDDLE FINGERS CROSSED + x (hand with index finger and thumb crossed - 1FAF0) 1F91F I LOVE YOU HAND SIGN * can be abbreviated ILY @ Emoticon faces @@ -50517,6 +52049,7 @@ FFFF 1F92F SHOCKED FACE WITH EXPLODING HEAD @ Portrait and role symbols 1F930 PREGNANT WOMAN + x (pregnant person - 1FAC4) 1F931 BREAST-FEEDING 1F932 PALMS UP TOGETHER * used for prayer in some cultures @@ -50594,6 +52127,7 @@ FFFF = chicken egg 1F95B GLASS OF MILK = milk + x (pouring liquid - 1FAD7) 1F95C PEANUTS 1F95D KIWIFRUIT 1F95E PANCAKES @@ -50635,6 +52169,7 @@ FFFF 1F976 FREEZING FACE 1F977 NINJA 1F978 DISGUISED FACE +1F979 FACE HOLDING BACK TEARS 1F97A FACE WITH PLEADING EYES @ Clothing 1F97B SARI @@ -50737,6 +52272,8 @@ FFFF 1F9C9 MATE DRINK 1F9CA ICE CUBE 1F9CB BUBBLE TEA +@ Fantasy being +1F9CC TROLL @ Portrait and accessibility symbols 1F9CD STANDING PERSON 1F9CE KNEELING PERSON @@ -50981,10 +52518,14 @@ FFFF 1FA72 BRIEFS 1FA73 SHORTS 1FA74 THONG SANDAL + = flip flop @ Medical symbols 1FA78 DROP OF BLOOD + x (droplet - 1F4A7) 1FA79 ADHESIVE BANDAGE 1FA7A STETHOSCOPE +1FA7B X-RAY +1FA7C CRUTCH @ Toys and sport symbols 1FA80 YO-YO 1FA81 KITE @@ -51019,6 +52560,12 @@ FFFF 1FAA6 HEADSTONE 1FAA7 PLACARD 1FAA8 ROCK +1FAA9 MIRROR BALL +1FAAA IDENTIFICATION CARD + = ID +1FAAB LOW BATTERY + x (battery - 1F50B) +1FAAC HAMSA @ Animals and nature 1FAB0 FLY 1FAB1 WORM @@ -51027,11 +52574,20 @@ FFFF 1FAB4 POTTED PLANT 1FAB5 WOOD 1FAB6 FEATHER +1FAB7 LOTUS +1FAB8 CORAL +1FAB9 EMPTY NEST +1FABA NEST WITH EGGS @ Body parts 1FAC0 ANATOMICAL HEART 1FAC1 LUNGS @ People 1FAC2 PEOPLE HUGGING +1FAC3 PREGNANT MAN +1FAC4 PREGNANT PERSON + x (pregnant woman - 1F930) +1FAC5 PERSON WITH CROWN + x (princess - 1F478) @ Food and drink 1FAD0 BLUEBERRIES 1FAD1 BELL PEPPER @@ -51040,6 +52596,30 @@ FFFF 1FAD4 TAMALE 1FAD5 FONDUE 1FAD6 TEAPOT +1FAD7 POURING LIQUID + x (glass of milk - 1F95B) +1FAD8 BEANS +1FAD9 JAR +@ Faces +1FAE0 
MELTING FACE +1FAE1 SALUTING FACE +1FAE2 FACE WITH OPEN EYES AND HAND OVER MOUTH +1FAE3 FACE WITH PEEKING EYE +1FAE4 FACE WITH DIAGONAL MOUTH +1FAE5 DOTTED LINE FACE +@ Emotion +1FAE6 BITING LIP + x (lips - 1F5E2) +1FAE7 BUBBLES +@ Hand symbols +1FAF0 HAND WITH INDEX FINGER AND THUMB CROSSED + x (hand with index and middle fingers crossed - 1F91E) +1FAF1 RIGHTWARDS HAND +1FAF2 LEFTWARDS HAND +1FAF3 PALM DOWN HAND +1FAF4 PALM UP HAND +1FAF5 INDEX POINTING AT THE VIEWER +1FAF6 HEART HANDS @@ 1FB00 Symbols for Legacy Computing 1FBFF @ Block mosaic terminal graphic characters @+ The term "sextant" refers to block mosaics divided into six parts. @@ -51355,8 +52935,8 @@ FFFF @+ These codes are intended for process-internal uses. 1FFFE 1FFFF -@@ 20000 CJK Unified Ideographs Extension B 2A6DD -@@ 2A700 CJK Unified Ideographs Extension C 2B734 +@@ 20000 CJK Unified Ideographs Extension B 2A6DF +@@ 2A700 CJK Unified Ideographs Extension C 2B738 @@ 2B740 CJK Unified Ideographs Extension D 2B81D @@ 2B820 CJK Unified Ideographs Extension E 2CEA1 @@ 2CEB0 CJK Unified Ideographs Extension F 2EBE0 @@ -51453,6 +53033,7 @@ FFFF 2F82B CJK COMPATIBILITY IDEOGRAPH-2F82B : 5317 2F82C CJK COMPATIBILITY IDEOGRAPH-2F82C + x 20984 : 5349 2F82D CJK COMPATIBILITY IDEOGRAPH-2F82D : 5351 @@ -51483,6 +53064,7 @@ FFFF 2F83A CJK COMPATIBILITY IDEOGRAPH-2F83A : 53F1 2F83B CJK COMPATIBILITY IDEOGRAPH-2F83B + x 4DB8 : 5406 2F83C CJK COMPATIBILITY IDEOGRAPH-2F83C : 549E @@ -51559,6 +53141,7 @@ FFFF 2F85F CJK COMPATIBILITY IDEOGRAPH-2F85F : 5962 2F860 CJK COMPATIBILITY IDEOGRAPH-2F860 + x 216A7 : 216A8 2F861 CJK COMPATIBILITY IDEOGRAPH-2F861 : 216EA @@ -51599,6 +53182,7 @@ FFFF 2F873 CJK COMPATIBILITY IDEOGRAPH-2F873 : 5C06 2F874 CJK COMPATIBILITY IDEOGRAPH-2F874 + x 22450 : 5F53 2F875 CJK COMPATIBILITY IDEOGRAPH-2F875 : 5C22 @@ -51607,6 +53191,7 @@ FFFF 2F877 CJK COMPATIBILITY IDEOGRAPH-2F877 : 5C60 2F878 CJK COMPATIBILITY IDEOGRAPH-2F878 + x 4DB9 : 5C6E 2F879 CJK COMPATIBILITY IDEOGRAPH-2F879 : 5CC0 
@@ -51848,6 +53433,7 @@ FFFF 2F8EF CJK COMPATIBILITY IDEOGRAPH-2F8EF : 6B21 2F8F0 CJK COMPATIBILITY IDEOGRAPH-2F8F0 + x 4DBE : 238A7 2F8F1 CJK COMPATIBILITY IDEOGRAPH-2F8F1 : 6B54 @@ -51874,6 +53460,7 @@ FFFF 2F8FC CJK COMPATIBILITY IDEOGRAPH-2F8FC : 6CBF 2F8FD CJK COMPATIBILITY IDEOGRAPH-2F8FD + x 2DC09 : 6CCD 2F8FE CJK COMPATIBILITY IDEOGRAPH-2F8FE : 6C67 @@ -51890,6 +53477,7 @@ FFFF 2F904 CJK COMPATIBILITY IDEOGRAPH-2F904 : 6D78 2F905 CJK COMPATIBILITY IDEOGRAPH-2F905 + x 23D40 : 6D85 2F906 CJK COMPATIBILITY IDEOGRAPH-2F906 : 23D1E @@ -51908,6 +53496,7 @@ FFFF 2F90D CJK COMPATIBILITY IDEOGRAPH-2F90D : 23ED1 2F90E CJK COMPATIBILITY IDEOGRAPH-2F90E + x 23F1C : 6DF9 2F90F CJK COMPATIBILITY IDEOGRAPH-2F90F : 6F6E @@ -51936,6 +53525,7 @@ FFFF 2F91B CJK COMPATIBILITY IDEOGRAPH-2F91B : 20525 2F91C CJK COMPATIBILITY IDEOGRAPH-2F91C + x 242B3 : 7145 2F91D CJK COMPATIBILITY IDEOGRAPH-2F91D : 24263 @@ -51958,6 +53548,7 @@ FFFF 2F926 CJK COMPATIBILITY IDEOGRAPH-2F926 : 24735 2F927 CJK COMPATIBILITY IDEOGRAPH-2F927 + x 2AEC5 : 24814 2F928 CJK COMPATIBILITY IDEOGRAPH-2F928 : 737A @@ -52014,6 +53605,7 @@ FFFF 2F942 CJK COMPATIBILITY IDEOGRAPH-2F942 : 250F2 2F943 CJK COMPATIBILITY IDEOGRAPH-2F943 + x 2511A : 25119 2F944 CJK COMPATIBILITY IDEOGRAPH-2F944 : 25133 @@ -52030,6 +53622,7 @@ FFFF 2F94A CJK COMPATIBILITY IDEOGRAPH-2F94A : 778B 2F94B CJK COMPATIBILITY IDEOGRAPH-2F94B + x 25271 : 4046 2F94C CJK COMPATIBILITY IDEOGRAPH-2F94C : 4096 diff --git a/lib/unicore/NormalizationCorrections.txt b/lib/unicore/NormalizationCorrections.txt index 7144fb8935..a1a34d6bb6 100644 --- a/lib/unicore/NormalizationCorrections.txt +++ b/lib/unicore/NormalizationCorrections.txt @@ -1,6 +1,6 @@ -# NormalizationCorrections-13.0.0.txt -# Date: 2019-09-09, 19:50:00 GMT [KW, LI] -# © 2019 Unicode®, Inc. +# NormalizationCorrections-14.0.0.txt +# Date: 2021-03-16, 22:07:00 GMT [KW, LI] +# © 2021 Unicode®, Inc. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database diff --git a/lib/unicore/PropList.txt b/lib/unicore/PropList.txt index 7d2f44c56f..0a5a934682 100644 --- a/lib/unicore/PropList.txt +++ b/lib/unicore/PropList.txt @@ -1,6 +1,6 @@ -# PropList-13.0.0.txt -# Date: 2019-11-27, 03:13:28 GMT -# © 2019 Unicode®, Inc. +# PropList-14.0.0.txt +# Date: 2021-08-12, 23:13:05 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -54,6 +54,7 @@ 2E1A ; Dash # Pd HYPHEN WITH DIAERESIS 2E3A..2E3B ; Dash # Pd [2] TWO-EM DASH..THREE-EM DASH 2E40 ; Dash # Pd DOUBLE HYPHEN +2E5D ; Dash # Pd OBLIQUE HYPHEN 301C ; Dash # Pd WAVE DASH 3030 ; Dash # Pd WAVY DASH 30A0 ; Dash # Pd KATAKANA-HIRAGANA DOUBLE HYPHEN @@ -63,7 +64,7 @@ FE63 ; Dash # Pd SMALL HYPHEN-MINUS FF0D ; Dash # Pd FULLWIDTH HYPHEN-MINUS 10EAD ; Dash # Pd YEZIDI HYPHENATION MARK -# Total code points: 29 +# Total code points: 30 # ================================================ @@ -126,7 +127,7 @@ FF63 ; Quotation_Mark # Pe HALFWIDTH RIGHT CORNER BRACKET 05C3 ; Terminal_Punctuation # Po HEBREW PUNCTUATION SOF PASUQ 060C ; Terminal_Punctuation # Po ARABIC COMMA 061B ; Terminal_Punctuation # Po ARABIC SEMICOLON -061E..061F ; Terminal_Punctuation # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; Terminal_Punctuation # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 06D4 ; Terminal_Punctuation # Po ARABIC FULL STOP 0700..070A ; Terminal_Punctuation # Po [11] SYRIAC END OF PARAGRAPH..SYRIAC CONTRACTION 070C ; Terminal_Punctuation # Po SYRIAC HARKLEAN METOBELUS @@ -150,6 +151,7 @@ FF63 ; Quotation_Mark # Pe HALFWIDTH RIGHT CORNER BRACKET 1AA8..1AAB ; Terminal_Punctuation # Po [4] TAI THAM SIGN KAAN..TAI THAM SIGN SATKAANKUU 1B5A..1B5B ; Terminal_Punctuation # Po [2] BALINESE PANTI..BALINESE PAMADA 
1B5D..1B5F ; Terminal_Punctuation # Po [3] BALINESE CARIK PAMUNGKAH..BALINESE CARIK PAREREN +1B7D..1B7E ; Terminal_Punctuation # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1C3B..1C3F ; Terminal_Punctuation # Po [5] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION TSHOOK 1C7E..1C7F ; Terminal_Punctuation # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD 203C..203D ; Terminal_Punctuation # Po [2] DOUBLE EXCLAMATION MARK..INTERROBANG @@ -159,6 +161,7 @@ FF63 ; Quotation_Mark # Pe HALFWIDTH RIGHT CORNER BRACKET 2E41 ; Terminal_Punctuation # Po REVERSED COMMA 2E4C ; Terminal_Punctuation # Po MEDIEVAL COMMA 2E4E..2E4F ; Terminal_Punctuation # Po [2] PUNCTUS ELEVATUS MARK..CORNISH VERSE DIVIDER +2E53..2E54 ; Terminal_Punctuation # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK 3001..3002 ; Terminal_Punctuation # Po [2] IDEOGRAPHIC COMMA..IDEOGRAPHIC FULL STOP A4FE..A4FF ; Terminal_Punctuation # Po [2] LISU PUNCTUATION COMMA..LISU PUNCTUATION FULL STOP A60D..A60F ; Terminal_Punctuation # Po [3] VAI COMMA..VAI QUESTION MARK @@ -189,6 +192,7 @@ FF64 ; Terminal_Punctuation # Po HALFWIDTH IDEOGRAPHIC COMMA 10B3A..10B3F ; Terminal_Punctuation # Po [6] TINY TWO DOTS OVER ONE DOT PUNCTUATION..LARGE ONE RING OVER TWO RINGS PUNCTUATION 10B99..10B9C ; Terminal_Punctuation # Po [4] PSALTER PAHLAVI SECTION MARK..PSALTER PAHLAVI FOUR DOTS WITH DOT 10F55..10F59 ; Terminal_Punctuation # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F86..10F89 ; Terminal_Punctuation # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 11047..1104D ; Terminal_Punctuation # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 110BE..110C1 ; Terminal_Punctuation # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA 11141..11143 ; Terminal_Punctuation # Po [3] CHAKMA DANDA..CHAKMA QUESTION MARK @@ -220,7 +224,7 @@ FF64 ; Terminal_Punctuation # Po HALFWIDTH IDEOGRAPHIC COMMA 1BC9F ; Terminal_Punctuation # Po DUPLOYAN 
PUNCTUATION CHINOOK FULL STOP 1DA87..1DA8A ; Terminal_Punctuation # Po [4] SIGNWRITING COMMA..SIGNWRITING COLON -# Total code points: 267 +# Total code points: 276 # ================================================ @@ -600,6 +604,7 @@ FF41..FF46 ; Hex_Digit # L& [6] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH L 1A6D..1A72 ; Other_Alphabetic # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI 1A73..1A74 ; Other_Alphabetic # Mn [2] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN MAI KANG 1ABF..1AC0 ; Other_Alphabetic # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ACC..1ACE ; Other_Alphabetic # Mn [3] COMBINING LATIN SMALL LETTER INSULAR G..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Other_Alphabetic # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; Other_Alphabetic # Mc BALINESE SIGN BISAH 1B35 ; Other_Alphabetic # Mc BALINESE VOWEL SIGN TEDUNG @@ -686,10 +691,12 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA 11001 ; Other_Alphabetic # Mn BRAHMI SIGN ANUSVARA 11002 ; Other_Alphabetic # Mc BRAHMI SIGN VISARGA 11038..11045 ; Other_Alphabetic # Mn [14] BRAHMI VOWEL SIGN AA..BRAHMI VOWEL SIGN AU +11073..11074 ; Other_Alphabetic # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 11082 ; Other_Alphabetic # Mc KAITHI SIGN VISARGA 110B0..110B2 ; Other_Alphabetic # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; Other_Alphabetic # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; Other_Alphabetic # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU +110C2 ; Other_Alphabetic # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; Other_Alphabetic # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Other_Alphabetic # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112C ; Other_Alphabetic # Mc CHAKMA VOWEL SIGN E @@ -815,7 +822,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA 1F150..1F169 ; 
Other_Alphabetic # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Other_Alphabetic # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 1398 +# Total code points: 1404 # ================================================ @@ -824,7 +831,7 @@ FB1E ; Other_Alphabetic # Mn HEBREW POINT JUDEO-SPANISH VARIKA 3021..3029 ; Ideographic # Nl [9] HANGZHOU NUMERAL ONE..HANGZHOU NUMERAL NINE 3038..303A ; Ideographic # Nl [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY 3400..4DBF ; Ideographic # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; Ideographic # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC +4E00..9FFF ; Ideographic # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF F900..FA6D ; Ideographic # Lo [366] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA6D FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9 16FE4 ; Ideographic # Mn KHITAN SMALL SCRIPT FILLER @@ -832,15 +839,15 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM 18800..18CD5 ; Ideographic # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; Ideographic # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 1B170..1B2FB ; Ideographic # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB -20000..2A6DD ; Ideographic # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; Ideographic # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; Ideographic # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; Ideographic # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Ideographic # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Ideographic # Lo 
[5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Ideographic # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; Ideographic # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; Ideographic # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 101652 +# Total code points: 101661 # ================================================ @@ -885,6 +892,9 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM 07EB..07F3 ; Diacritic # Mn [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE 07F4..07F5 ; Diacritic # Lm [2] NKO HIGH TONE APOSTROPHE..NKO LOW TONE APOSTROPHE 0818..0819 ; Diacritic # Mn [2] SAMARITAN MARK OCCLUSION..SAMARITAN MARK DAGESH +0898..089F ; Diacritic # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08C9 ; Diacritic # Lm ARABIC SMALL FARSI YEH +08CA..08D2 ; Diacritic # Mn [9] ARABIC SMALL HIGH FARSI YEH..ARABIC LARGE ROUND DOT INSIDE CIRCLE BELOW 08E3..08FE ; Diacritic # Mn [28] ARABIC TURNED DAMMA BELOW..ARABIC DAMMA WITH DOT 093C ; Diacritic # Mn DEVANAGARI SIGN NUKTA 094D ; Diacritic # Mn DEVANAGARI SIGN VIRAMA @@ -901,6 +911,7 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM 0B4D ; Diacritic # Mn ORIYA SIGN VIRAMA 0B55 ; Diacritic # Mn ORIYA SIGN OVERLINE 0BCD ; Diacritic # Mn TAMIL SIGN VIRAMA +0C3C ; Diacritic # Mn TELUGU SIGN NUKTA 0C4D ; Diacritic # Mn TELUGU SIGN VIRAMA 0CBC ; Diacritic # Mn KANNADA SIGN NUKTA 0CCD ; Diacritic # Mn KANNADA SIGN VIRAMA @@ -928,12 +939,16 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM 108F ; Diacritic # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5 109A..109B ; Diacritic # Mc [2] MYANMAR SIGN KHAMTI TONE-1..MYANMAR SIGN KHAMTI TONE-3 135D..135F ; Diacritic # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK +1714 ; 
Diacritic # Mn TAGALOG SIGN VIRAMA +1715 ; Diacritic # Mc TAGALOG SIGN PAMUDPOD 17C9..17D3 ; Diacritic # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; Diacritic # Mn KHMER SIGN ATTHACAN 1939..193B ; Diacritic # Mn [3] LIMBU SIGN MUKPHRENG..LIMBU SIGN SA-I 1A75..1A7C ; Diacritic # Mn [8] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN-LUE KARAN 1A7F ; Diacritic # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; Diacritic # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW +1ABE ; Diacritic # Me COMBINING PARENTHESES OVERLAY +1AC1..1ACB ; Diacritic # Mn [11] COMBINING LEFT PARENTHESIS ABOVE LEFT..COMBINING TRIPLE ACUTE ACCENT 1B34 ; Diacritic # Mn BALINESE SIGN REREKAN 1B44 ; Diacritic # Mc BALINESE ADEG ADEG 1B6B..1B73 ; Diacritic # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG @@ -952,8 +967,7 @@ FA70..FAD9 ; Ideographic # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COM 1CF8..1CF9 ; Diacritic # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE 1D2C..1D6A ; Diacritic # Lm [63] MODIFIER LETTER CAPITAL A..GREEK SUBSCRIPT SMALL LETTER CHI 1DC4..1DCF ; Diacritic # Mn [12] COMBINING MACRON-ACUTE..COMBINING ZIGZAG BELOW -1DF5..1DF9 ; Diacritic # Mn [5] COMBINING UP TACK ABOVE..COMBINING WIDE INVERTED BRIDGE BELOW -1DFD..1DFF ; Diacritic # Mn [3] COMBINING ALMOST EQUAL TO BELOW..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DF5..1DFF ; Diacritic # Mn [11] COMBINING UP TACK ABOVE..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1FBD ; Diacritic # Sk GREEK KORONIS 1FBF..1FC1 ; Diacritic # Sk [3] GREEK PSILI..GREEK DIALYTIKA AND PERISPOMENI 1FCD..1FCF ; Diacritic # Sk [3] GREEK PSILI AND VARIA..GREEK PSILI AND PERISPOMENI @@ -1008,10 +1022,16 @@ FF70 ; Diacritic # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND FF9E..FF9F ; Diacritic # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK FFE3 ; Diacritic # Sk FULLWIDTH MACRON 102E0 ; Diacritic # 
Mn COPTIC EPACT THOUSANDS MARK +10780..10785 ; Diacritic # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Diacritic # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Diacritic # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10AE5..10AE6 ; Diacritic # Mn [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW 10D22..10D23 ; Diacritic # Lo [2] HANIFI ROHINGYA MARK SAKIN..HANIFI ROHINGYA MARK NA KHONNA 10D24..10D27 ; Diacritic # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10F46..10F50 ; Diacritic # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Diacritic # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +11046 ; Diacritic # Mn BRAHMI VIRAMA +11070 ; Diacritic # Mn BRAHMI SIGN OLD TAMIL VIRAMA 110B9..110BA ; Diacritic # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA 11133..11134 ; Diacritic # Mn [2] CHAKMA VIRAMA..CHAKMA MAAYYAA 11173 ; Diacritic # Mn MAHAJANI SIGN NUKTA @@ -1049,18 +1069,24 @@ FFE3 ; Diacritic # Sk FULLWIDTH MACRON 16F8F..16F92 ; Diacritic # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16F93..16F9F ; Diacritic # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 16FF0..16FF1 ; Diacritic # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY +1AFF0..1AFF3 ; Diacritic # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Diacritic # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Diacritic # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1CF00..1CF2D ; Diacritic # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Diacritic # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 
1D167..1D169 ; Diacritic # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; Diacritic # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 1D17B..1D182 ; Diacritic # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D185..1D18B ; Diacritic # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D1AA..1D1AD ; Diacritic # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO 1E130..1E136 ; Diacritic # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; Diacritic # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; Diacritic # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Diacritic # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E946 ; Diacritic # Mn [3] ADLAM ALIF LENGTHENER..ADLAM GEMINATION MARK 1E948..1E94A ; Diacritic # Mn [3] ADLAM CONSONANT MODIFIER..ADLAM NUKTA -# Total code points: 882 +# Total code points: 1064 # ================================================ @@ -1088,6 +1114,7 @@ AA70 ; Extender # Lm MYANMAR MODIFIER LETTER KHAMTI REDUPLICATION AADD ; Extender # Lm TAI VIET SYMBOL SAM AAF3..AAF4 ; Extender # Lm [2] MEETEI MAYEK SYLLABLE REPETITION MARK..MEETEI MAYEK WORD REPETITION MARK FF70 ; Extender # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK +10781..10782 ; Extender # Lm [2] MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON..MODIFIER LETTER SUPERSCRIPT HALF TRIANGULAR COLON 1135D ; Extender # Lo GRANTHA SIGN PLUTA 115C6..115C8 ; Extender # Po [3] SIDDHAM REPETITION MARK-1..SIDDHAM REPETITION MARK-3 11A98 ; Extender # Mn SOYOMBO GEMINATION MARK @@ -1097,7 +1124,7 @@ FF70 ; Extender # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND 1E13C..1E13D ; Extender # Lm [2] NYIAKENG PUACHUE HMONG SIGN XW XW..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E944..1E946 ; Extender # Mn [3] ADLAM ALIF LENGTHENER..ADLAM GEMINATION MARK -# Total code 
points: 48 +# Total code points: 50 # ================================================ @@ -1121,8 +1148,12 @@ A69C..A69D ; Other_Lowercase # Lm [2] MODIFIER LETTER CYRILLIC HARD SIGN..M A770 ; Other_Lowercase # Lm MODIFIER LETTER US A7F8..A7F9 ; Other_Lowercase # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE AB5C..AB5F ; Other_Lowercase # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK +10780 ; Other_Lowercase # Lm MODIFIER LETTER SMALL CAPITAL AA +10783..10785 ; Other_Lowercase # Lm [3] MODIFIER LETTER SMALL AE..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Other_Lowercase # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Other_Lowercase # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL -# Total code points: 189 +# Total code points: 244 # ================================================ @@ -1211,7 +1242,7 @@ E0020..E007F ; Other_Grapheme_Extend # Cf [96] TAG SPACE..CANCEL TAG # ================================================ 3400..4DBF ; Unified_Ideograph # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; Unified_Ideograph # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC +4E00..9FFF ; Unified_Ideograph # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF FA0E..FA0F ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA0E..CJK COMPATIBILITY IDEOGRAPH-FA0F FA11 ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA11 FA13..FA14 ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA13..CJK COMPATIBILITY IDEOGRAPH-FA14 @@ -1219,14 +1250,14 @@ FA1F ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA1F FA21 ; Unified_Ideograph # Lo CJK COMPATIBILITY IDEOGRAPH-FA21 FA23..FA24 ; Unified_Ideograph # Lo [2] CJK COMPATIBILITY IDEOGRAPH-FA23..CJK COMPATIBILITY IDEOGRAPH-FA24 FA27..FA29 ; Unified_Ideograph # Lo [3] CJK COMPATIBILITY IDEOGRAPH-FA27..CJK 
COMPATIBILITY IDEOGRAPH-FA29 -20000..2A6DD ; Unified_Ideograph # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; Unified_Ideograph # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; Unified_Ideograph # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; Unified_Ideograph # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Unified_Ideograph # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Unified_Ideograph # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Unified_Ideograph # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 30000..3134A ; Unified_Ideograph # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 92856 +# Total code points: 92865 # ================================================ @@ -1291,8 +1322,9 @@ E0001 ; Deprecated # Cf LANGUAGE TAG 1D62A..1D62B ; Soft_Dotted # L& [2] MATHEMATICAL SANS-SERIF ITALIC SMALL I..MATHEMATICAL SANS-SERIF ITALIC SMALL J 1D65E..1D65F ; Soft_Dotted # L& [2] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL I..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL J 1D692..1D693 ; Soft_Dotted # L& [2] MATHEMATICAL MONOSPACE SMALL I..MATHEMATICAL MONOSPACE SMALL J +1DF1A ; Soft_Dotted # L& LATIN SMALL LETTER I WITH STROKE AND RETROFLEX HOOK -# Total code points: 46 +# Total code points: 47 # ================================================ @@ -1330,7 +1362,7 @@ AABB..AABC ; Logical_Order_Exception # Lo [2] TAI VIET VOWEL AUE..TAI VIET 002E ; Sentence_Terminal # Po FULL STOP 003F ; Sentence_Terminal # Po QUESTION MARK 0589 ; Sentence_Terminal # Po ARMENIAN FULL STOP -061E..061F ; Sentence_Terminal # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; Sentence_Terminal # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 06D4 ; Sentence_Terminal # Po ARABIC FULL STOP 
0700..0702 ; Sentence_Terminal # Po [3] SYRIAC END OF PARAGRAPH..SYRIAC SUBLINEAR FULL STOP 07F9 ; Sentence_Terminal # Po NKO EXCLAMATION MARK @@ -1349,12 +1381,14 @@ AABB..AABC ; Logical_Order_Exception # Lo [2] TAI VIET VOWEL AUE..TAI VIET 1AA8..1AAB ; Sentence_Terminal # Po [4] TAI THAM SIGN KAAN..TAI THAM SIGN SATKAANKUU 1B5A..1B5B ; Sentence_Terminal # Po [2] BALINESE PANTI..BALINESE PAMADA 1B5E..1B5F ; Sentence_Terminal # Po [2] BALINESE CARIK SIKI..BALINESE CARIK PAREREN +1B7D..1B7E ; Sentence_Terminal # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1C3B..1C3C ; Sentence_Terminal # Po [2] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION NYET THYOOM TA-ROL 1C7E..1C7F ; Sentence_Terminal # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD 203C..203D ; Sentence_Terminal # Po [2] DOUBLE EXCLAMATION MARK..INTERROBANG 2047..2049 ; Sentence_Terminal # Po [3] DOUBLE QUESTION MARK..EXCLAMATION QUESTION MARK 2E2E ; Sentence_Terminal # Po REVERSED QUESTION MARK 2E3C ; Sentence_Terminal # Po STENOGRAPHIC FULL STOP +2E53..2E54 ; Sentence_Terminal # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK 3002 ; Sentence_Terminal # Po IDEOGRAPHIC FULL STOP A4FF ; Sentence_Terminal # Po LISU PUNCTUATION FULL STOP A60E..A60F ; Sentence_Terminal # Po [2] VAI FULL STOP..VAI QUESTION MARK @@ -1375,6 +1409,7 @@ FF1F ; Sentence_Terminal # Po FULLWIDTH QUESTION MARK FF61 ; Sentence_Terminal # Po HALFWIDTH IDEOGRAPHIC FULL STOP 10A56..10A57 ; Sentence_Terminal # Po [2] KHAROSHTHI PUNCTUATION DANDA..KHAROSHTHI PUNCTUATION DOUBLE DANDA 10F55..10F59 ; Sentence_Terminal # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F86..10F89 ; Sentence_Terminal # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 11047..11048 ; Sentence_Terminal # Po [2] BRAHMI DANDA..BRAHMI DOUBLE DANDA 110BE..110C1 ; Sentence_Terminal # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA 11141..11143 ; Sentence_Terminal # Po [3] 
CHAKMA DANDA..CHAKMA QUESTION MARK @@ -1403,15 +1438,16 @@ FF61 ; Sentence_Terminal # Po HALFWIDTH IDEOGRAPHIC FULL STOP 1BC9F ; Sentence_Terminal # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA88 ; Sentence_Terminal # Po SIGNWRITING FULL STOP -# Total code points: 143 +# Total code points: 152 # ================================================ 180B..180D ; Variation_Selector # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; Variation_Selector # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR FE00..FE0F ; Variation_Selector # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 E0100..E01EF ; Variation_Selector # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 259 +# Total code points: 260 # ================================================ @@ -1644,8 +1680,17 @@ E0100..E01EF ; Variation_Selector # Mn [240] VARIATION SELECTOR-17..VARIATION S 2E42 ; Pattern_Syntax # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; Pattern_Syntax # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; Pattern_Syntax # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; Pattern_Syntax # Po TIRONIAN SIGN CAPITAL ET -2E53..2E7F ; Pattern_Syntax # Cn [45] .. +2E52..2E54 ; Pattern_Syntax # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; Pattern_Syntax # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; Pattern_Syntax # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; Pattern_Syntax # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; Pattern_Syntax # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; Pattern_Syntax # Ps TOP HALF LEFT PARENTHESIS +2E5A ; Pattern_Syntax # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; Pattern_Syntax # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; Pattern_Syntax # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; Pattern_Syntax # Pd OBLIQUE HYPHEN +2E5E..2E7F ; Pattern_Syntax # Cn [34] .. 
3001..3003 ; Pattern_Syntax # Po [3] IDEOGRAPHIC COMMA..DITTO MARK 3008 ; Pattern_Syntax # Ps LEFT ANGLE BRACKET 3009 ; Pattern_Syntax # Pe RIGHT ANGLE BRACKET @@ -1682,11 +1727,12 @@ FE45..FE46 ; Pattern_Syntax # Po [2] SESAME DOT..WHITE SESAME DOT 0600..0605 ; Prepended_Concatenation_Mark # Cf [6] ARABIC NUMBER SIGN..ARABIC NUMBER MARK ABOVE 06DD ; Prepended_Concatenation_Mark # Cf ARABIC END OF AYAH 070F ; Prepended_Concatenation_Mark # Cf SYRIAC ABBREVIATION MARK +0890..0891 ; Prepended_Concatenation_Mark # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Prepended_Concatenation_Mark # Cf ARABIC DISPUTED END OF AYAH 110BD ; Prepended_Concatenation_Mark # Cf KAITHI NUMBER SIGN 110CD ; Prepended_Concatenation_Mark # Cf KAITHI NUMBER SIGN ABOVE -# Total code points: 11 +# Total code points: 13 # ================================================ diff --git a/lib/unicore/PropValueAliases.txt b/lib/unicore/PropValueAliases.txt index 2023baf4d2..f0cb26bdab 100644 --- a/lib/unicore/PropValueAliases.txt +++ b/lib/unicore/PropValueAliases.txt @@ -1,6 +1,6 @@ -# PropertyValueAliases-13.0.0.txt -# Date: 2019-11-13, 21:52:10 GMT -# © 2019 Unicode®, Inc. +# PropertyValueAliases-14.0.0.txt +# Date: 2021-05-10, 21:08:53 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -89,6 +89,7 @@ age; 11.0 ; V11_0 age; 12.0 ; V12_0 age; 12.1 ; V12_1 age; 13.0 ; V13_0 +age; 14.0 ; V14_0 age; NA ; Unassigned # Alphabetic (Alpha) @@ -160,6 +161,7 @@ blk; Ancient_Greek_Numbers ; Ancient_Greek_Numbers blk; Ancient_Symbols ; Ancient_Symbols blk; Arabic ; Arabic blk; Arabic_Ext_A ; Arabic_Extended_A +blk; Arabic_Ext_B ; Arabic_Extended_B blk; Arabic_Math ; Arabic_Mathematical_Alphabetic_Symbols blk; Arabic_PF_A ; Arabic_Presentation_Forms_A ; Arabic_Presentation_Forms-A blk; Arabic_PF_B ; Arabic_Presentation_Forms_B @@ -216,6 +218,7 @@ blk; Cuneiform ; Cuneiform blk; Cuneiform_Numbers ; Cuneiform_Numbers_And_Punctuation blk; Currency_Symbols ; Currency_Symbols blk; Cypriot_Syllabary ; Cypriot_Syllabary +blk; Cypro_Minoan ; Cypro_Minoan blk; Cyrillic ; Cyrillic blk; Cyrillic_Ext_A ; Cyrillic_Extended_A blk; Cyrillic_Ext_B ; Cyrillic_Extended_B @@ -246,6 +249,7 @@ blk; Enclosed_Ideographic_Sup ; Enclosed_Ideographic_Supplement blk; Ethiopic ; Ethiopic blk; Ethiopic_Ext ; Ethiopic_Extended blk; Ethiopic_Ext_A ; Ethiopic_Extended_A +blk; Ethiopic_Ext_B ; Ethiopic_Extended_B blk; Ethiopic_Sup ; Ethiopic_Supplement blk; Geometric_Shapes ; Geometric_Shapes blk; Geometric_Shapes_Ext ; Geometric_Shapes_Extended @@ -285,6 +289,7 @@ blk; Jamo_Ext_B ; Hangul_Jamo_Extended_B blk; Javanese ; Javanese blk; Kaithi ; Kaithi blk; Kana_Ext_A ; Kana_Extended_A +blk; Kana_Ext_B ; Kana_Extended_B blk; Kana_Sup ; Kana_Supplement blk; Kanbun ; Kanbun blk; Kangxi ; Kangxi_Radicals @@ -306,6 +311,8 @@ blk; Latin_Ext_B ; Latin_Extended_B blk; Latin_Ext_C ; Latin_Extended_C blk; Latin_Ext_D ; Latin_Extended_D blk; Latin_Ext_E ; Latin_Extended_E +blk; Latin_Ext_F ; Latin_Extended_F +blk; Latin_Ext_G ; Latin_Extended_G blk; Lepcha ; Lepcha blk; Letterlike_Symbols ; Letterlike_Symbols blk; Limbu ; Limbu @@ -372,6 +379,7 @@ blk; Old_Persian ; Old_Persian blk; Old_Sogdian ; Old_Sogdian blk; Old_South_Arabian ; 
Old_South_Arabian blk; Old_Turkic ; Old_Turkic +blk; Old_Uyghur ; Old_Uyghur blk; Oriya ; Oriya blk; Ornamental_Dingbats ; Ornamental_Dingbats blk; Osage ; Osage @@ -433,6 +441,7 @@ blk; Tai_Xuan_Jing ; Tai_Xuan_Jing_Symbols blk; Takri ; Takri blk; Tamil ; Tamil blk; Tamil_Sup ; Tamil_Supplement +blk; Tangsa ; Tangsa blk; Tangut ; Tangut blk; Tangut_Components ; Tangut_Components blk; Tangut_Sup ; Tangut_Supplement @@ -442,13 +451,16 @@ blk; Thai ; Thai blk; Tibetan ; Tibetan blk; Tifinagh ; Tifinagh blk; Tirhuta ; Tirhuta +blk; Toto ; Toto blk; Transport_And_Map ; Transport_And_Map_Symbols blk; UCAS ; Unified_Canadian_Aboriginal_Syllabics; Canadian_Syllabics blk; UCAS_Ext ; Unified_Canadian_Aboriginal_Syllabics_Extended +blk; UCAS_Ext_A ; Unified_Canadian_Aboriginal_Syllabics_Extended_A blk; Ugaritic ; Ugaritic blk; Vai ; Vai blk; Vedic_Ext ; Vedic_Extensions blk; Vertical_Forms ; Vertical_Forms +blk; Vithkuqi ; Vithkuqi blk; VS ; Variation_Selectors blk; VS_Sup ; Variation_Selectors_Supplement blk; Wancho ; Wancho @@ -458,6 +470,7 @@ blk; Yi_Radicals ; Yi_Radicals blk; Yi_Syllables ; Yi_Syllables blk; Yijing ; Yijing_Hexagram_Symbols blk; Zanabazar_Square ; Zanabazar_Square +blk; Znamenny_Music ; Znamenny_Musical_Notation # Canonical_Combining_Class (ccc) @@ -1032,6 +1045,8 @@ jg ; Taw ; Taw jg ; Teh_Marbuta ; Teh_Marbuta jg ; Teh_Marbuta_Goal ; Hamza_On_Heh_Goal jg ; Teth ; Teth +jg ; Thin_Yeh ; Thin_Yeh +jg ; Vertical_Tail ; Vertical_Tail jg ; Waw ; Waw jg ; Yeh ; Yeh jg ; Yeh_Barree ; Yeh_Barree @@ -1262,6 +1277,7 @@ sc ; Cham ; Cham sc ; Cher ; Cherokee sc ; Chrs ; Chorasmian sc ; Copt ; Coptic ; Qaac +sc ; Cpmn ; Cypro_Minoan sc ; Cprt ; Cypriot sc ; Cyrl ; Cyrillic sc ; Deva ; Devanagari @@ -1341,6 +1357,7 @@ sc ; Orkh ; Old_Turkic sc ; Orya ; Oriya sc ; Osge ; Osage sc ; Osma ; Osmanya +sc ; Ougr ; Old_Uyghur sc ; Palm ; Palmyrene sc ; Pauc ; Pau_Cin_Hau sc ; Perm ; Old_Permic @@ -1383,8 +1400,11 @@ sc ; Thaa ; Thaana sc ; Thai ; Thai sc ; Tibt ; Tibetan 
sc ; Tirh ; Tirhuta +sc ; Tnsa ; Tangsa +sc ; Toto ; Toto sc ; Ugar ; Ugaritic sc ; Vaii ; Vai +sc ; Vith ; Vithkuqi sc ; Wara ; Warang_Citi sc ; Wcho ; Wancho sc ; Xpeo ; Old_Persian diff --git a/lib/unicore/PropertyAliases.txt b/lib/unicore/PropertyAliases.txt index 04644b8a28..3e4b429e45 100644 --- a/lib/unicore/PropertyAliases.txt +++ b/lib/unicore/PropertyAliases.txt @@ -1,6 +1,6 @@ -# PropertyAliases-13.0.0.txt -# Date: 2019-10-23, 03:46:32 GMT -# © 2019 Unicode®, Inc. +# PropertyAliases-14.0.0.txt +# Date: 2021-03-08, 19:35:48 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/ReadMe.txt b/lib/unicore/ReadMe.txt index 390624de3d..e7c080f9f0 100644 --- a/lib/unicore/ReadMe.txt +++ b/lib/unicore/ReadMe.txt @@ -1,6 +1,6 @@ # Unicode Character Database -# Date: 2019-09-11, 16:03:00 GMT [KW] -# © 2019 Unicode®, Inc. +# Date: 2021-09-10, 17:22:00 GMT [KW] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see https://www.unicode.org/terms_of_use.html # @@ -10,7 +10,7 @@ # UAX #44, "Unicode Character Database" # UTS #51, "Unicode Emoji" # -# The UAXes and UTS #51 can be accessed at https://www.unicode.org/versions/Unicode13.0.0/ +# The UAXes and UTS #51 can be accessed at https://www.unicode.org/versions/Unicode14.0.0/ -This directory contains the preliminary data files under development -for the Unicode Character Database, for Version 13.0.0 of the Unicode Standard. +This directory contains the final data files +for the Unicode Character Database, for Version 14.0.0 of the Unicode Standard. 
diff --git a/lib/unicore/ScriptExtensions.txt b/lib/unicore/ScriptExtensions.txt index b561feeb29..3f5cd1c0db 100644 --- a/lib/unicore/ScriptExtensions.txt +++ b/lib/unicore/ScriptExtensions.txt @@ -1,6 +1,6 @@ -# ScriptExtensions-13.0.0.txt -# Date: 2020-01-22, 00:07:43 GMT -# © 2020 Unicode®, Inc. +# ScriptExtensions-14.0.0.txt +# Date: 2021-06-04, 02:19:38 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -11,10 +11,10 @@ # with more than one script, but with a limited number of scripts. # For each code point, there is one or more property values. Each such value is a Script property value. # For more information, see: -# UAX #24, Unicode Script Property: http://www.unicode.org/reports/tr24/ +# UAX #24, Unicode Script Property: https://www.unicode.org/reports/tr24/ # Especially the sections: -# http://www.unicode.org/reports/tr24/#Assignment_Script_Values -# http://www.unicode.org/reports/tr24/#Assignment_ScriptX_Values +# https://www.unicode.org/reports/tr24/#Assignment_Script_Values +# https://www.unicode.org/reports/tr24/#Assignment_ScriptX_Values # # Each Script_Extensions value in this file consists of a set # of one or more abbreviated Script property values. 
The ordering of the @@ -119,6 +119,14 @@ # ================================================ +# Script_Extensions=Syrc + +1DFA ; Syrc # Mn COMBINING DOT BELOW LEFT + +# Total code points: 1 + +# ================================================ + # Script_Extensions=Arab Copt 102E0 ; Arab Copt # Mn COPTIC EPACT THOUSANDS MARK @@ -136,6 +144,15 @@ # ================================================ +# Script_Extensions=Arab Nkoo + +FD3E ; Arab Nkoo # Pe ORNATE LEFT PARENTHESIS +FD3F ; Arab Nkoo # Ps ORNATE RIGHT PARENTHESIS + +# Total code points: 2 + +# ================================================ + # Script_Extensions=Arab Syrc 064B..0655 ; Arab Syrc # Mn [11] ARABIC FATHATAN..ARABIC HAMZA BELOW @@ -186,10 +203,10 @@ A9CF ; Bugi Java # Lm JAVANESE PANGRANGKEP # Script_Extensions=Cprt Linb -10100..10102 ; Cprt Linb # Po [3] AEGEAN WORD SEPARATOR LINE..AEGEAN CHECK MARK +10102 ; Cprt Linb # Po AEGEAN CHECK MARK 10137..1013F ; Cprt Linb # So [9] AEGEAN WEIGHT BASE UNIT..AEGEAN MEASURE THIRD SUBUNIT -# Total code points: 12 +# Total code points: 10 # ================================================ @@ -342,6 +359,14 @@ FF9E..FF9F ; Hira Kana # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFW # ================================================ +# Script_Extensions=Mani Ougr + +10AF2 ; Mani Ougr # Po MANICHAEAN PUNCTUATION DOUBLE DOT WITHIN DOT + +# Total code points: 1 + +# ================================================ + # Script_Extensions=Mong Phag 1802..1803 ; Mong Phag # Po [2] MONGOLIAN COMMA..MONGOLIAN FULL STOP @@ -383,6 +408,14 @@ FF9E..FF9F ; Hira Kana # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFW # ================================================ +# Script_Extensions=Cpmn Cprt Linb + +10100..10101 ; Cpmn Cprt Linb # Po [2] AEGEAN WORD SEPARATOR LINE..AEGEAN WORD SEPARATOR DOT + +# Total code points: 2 + +# ================================================ + # Script_Extensions=Cprt Lina Linb 10107..10133 ; Cprt Lina Linb # No [45] AEGEAN NUMBER 
ONE..AEGEAN NUMBER NINETY THOUSAND @@ -449,16 +482,6 @@ A92E ; Kali Latn Mymr # Po KAYAH LI SIGN CWI # ================================================ -# Script_Extensions=Arab Rohg Syrc Thaa Yezi - -060C ; Arab Rohg Syrc Thaa Yezi # Po ARABIC COMMA -061B ; Arab Rohg Syrc Thaa Yezi # Po ARABIC SEMICOLON -061F ; Arab Rohg Syrc Thaa Yezi # Po ARABIC QUESTION MARK - -# Total code points: 3 - -# ================================================ - # Script_Extensions=Bopo Hang Hani Hira Kana 3003 ; Bopo Hang Hani Hira Kana # Po DITTO MARK @@ -474,6 +497,15 @@ FE45..FE46 ; Bopo Hang Hani Hira Kana # Po [2] SESAME DOT..WHITE SESAME DOT # ================================================ +# Script_Extensions=Arab Nkoo Rohg Syrc Thaa Yezi + +060C ; Arab Nkoo Rohg Syrc Thaa Yezi # Po ARABIC COMMA +061B ; Arab Nkoo Rohg Syrc Thaa Yezi # Po ARABIC SEMICOLON + +# Total code points: 2 + +# ================================================ + # Script_Extensions=Bopo Hang Hani Hira Kana Yiii 3001..3002 ; Bopo Hang Hani Hira Kana Yiii # Po [2] IDEOGRAPHIC COMMA..IDEOGRAPHIC FULL STOP @@ -513,9 +545,9 @@ FF64..FF65 ; Bopo Hang Hani Hira Kana Yiii # Po [2] HALFWIDTH IDEOGRAPHIC C # ================================================ -# Script_Extensions=Adlm Arab Mand Mani Phlp Rohg Sogd Syrc +# Script_Extensions=Adlm Arab Nkoo Rohg Syrc Thaa Yezi -0640 ; Adlm Arab Mand Mani Phlp Rohg Sogd Syrc # Lm ARABIC TATWEEL +061F ; Adlm Arab Nkoo Rohg Syrc Thaa Yezi # Po ARABIC QUESTION MARK # Total code points: 1 @@ -529,6 +561,14 @@ FF64..FF65 ; Bopo Hang Hani Hira Kana Yiii # Po [2] HALFWIDTH IDEOGRAPHIC C # ================================================ +# Script_Extensions=Adlm Arab Mand Mani Ougr Phlp Rohg Sogd Syrc + +0640 ; Adlm Arab Mand Mani Ougr Phlp Rohg Sogd Syrc # Lm ARABIC TATWEEL + +# Total code points: 1 + +# ================================================ + # Script_Extensions=Deva Dogr Gujr Guru Khoj Kthi Mahj Modi Sind Takr Tirh A836..A837 ; Deva Dogr Gujr Guru Khoj Kthi Mahj 
Modi Sind Takr Tirh # So [2] NORTH INDIC QUARTER MARK..NORTH INDIC PLACEHOLDER MARK diff --git a/lib/unicore/Scripts.txt b/lib/unicore/Scripts.txt index e0363f54d1..a138373011 100644 --- a/lib/unicore/Scripts.txt +++ b/lib/unicore/Scripts.txt @@ -1,16 +1,16 @@ -# Scripts-13.0.0.txt -# Date: 2020-01-22, 00:07:43 GMT -# © 2020 Unicode®, Inc. +# Scripts-14.0.0.txt +# Date: 2021-07-10, 00:35:31 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # # Unicode Character Database # For documentation, see http://www.unicode.org/reports/tr44/ # For more information, see: -# UAX #24, Unicode Script Property: http://www.unicode.org/reports/tr24/ +# UAX #24, Unicode Script Property: https://www.unicode.org/reports/tr24/ # Especially the sections: -# http://www.unicode.org/reports/tr24/#Assignment_Script_Values -# http://www.unicode.org/reports/tr24/#Assignment_ScriptX_Values +# https://www.unicode.org/reports/tr24/#Assignment_Script_Values +# https://www.unicode.org/reports/tr24/#Assignment_ScriptX_Values # # ================================================ @@ -154,7 +154,7 @@ 208A..208C ; Common # Sm [3] SUBSCRIPT PLUS SIGN..SUBSCRIPT EQUALS SIGN 208D ; Common # Ps SUBSCRIPT LEFT PARENTHESIS 208E ; Common # Pe SUBSCRIPT RIGHT PARENTHESIS -20A0..20BF ; Common # Sc [32] EURO-CURRENCY SIGN..BITCOIN SIGN +20A0..20C0 ; Common # Sc [33] EURO-CURRENCY SIGN..SOM SIGN 2100..2101 ; Common # So [2] ACCOUNT OF..ADDRESSED TO THE SUBJECT 2102 ; Common # L& DOUBLE-STRUCK CAPITAL C 2103..2106 ; Common # So [4] DEGREE CELSIUS..CADA UNA @@ -347,7 +347,16 @@ 2E42 ; Common # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; Common # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; Common # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; Common # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; Common # Po 
[3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; Common # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; Common # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; Common # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; Common # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; Common # Ps TOP HALF LEFT PARENTHESIS +2E5A ; Common # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; Common # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; Common # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; Common # Pd OBLIQUE HYPHEN 2FF0..2FFB ; Common # So [12] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER OVERLAID 3000 ; Common # Zs IDEOGRAPHIC SPACE 3001..3003 ; Common # Po [3] IDEOGRAPHIC COMMA..DITTO MARK @@ -511,9 +520,8 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR 10190..1019C ; Common # So [13] ROMAN SEXTANS SIGN..ASCIA SYMBOL 101D0..101FC ; Common # So [45] PHAISTOS DISC SIGN PEDESTRIAN..PHAISTOS DISC SIGN WAVY BAND 102E1..102FB ; Common # No [27] COPTIC EPACT DIGIT ONE..COPTIC EPACT NUMBER NINE HUNDRED -16FE2 ; Common # Po OLD CHINESE HOOK MARK -16FE3 ; Common # Lm OLD CHINESE ITERATION MARK 1BCA0..1BCA3 ; Common # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF50..1CFC3 ; Common # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; Common # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; Common # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164 ; Common # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -523,7 +531,7 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR 1D173..1D17A ; Common # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1D183..1D184 ; Common # So [2] MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN 1D18C..1D1A9 ; Common # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 
-1D1AE..1D1E8 ; Common # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA ; Common # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D2E0..1D2F3 ; Common # No [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN 1D300..1D356 ; Common # So [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING 1D360..1D378 ; Common # No [25] COUNTING ROD UNIT DIGIT ONE..TALLY MARK FIVE @@ -593,35 +601,36 @@ FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHAR 1F300..1F3FA ; Common # So [251] CYCLONE..AMPHORA 1F3FB..1F3FF ; Common # Sk [5] EMOJI MODIFIER FITZPATRICK TYPE-1-2..EMOJI MODIFIER FITZPATRICK TYPE-6 1F400..1F6D7 ; Common # So [728] RAT..ELEVATOR -1F6E0..1F6EC ; Common # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6DD..1F6EC ; Common # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6F0..1F6FC ; Common # So [13] SATELLITE..ROLLER SKATE 1F700..1F773 ; Common # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE 1F780..1F7D8 ; Common # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB ; Common # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; Common # So HEAVY EQUALS SIGN 1F800..1F80B ; Common # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; Common # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; Common # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; Common # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW 1F890..1F8AD ; Common # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS 1F8B0..1F8B1 ; Common # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST -1F900..1F978 ; Common # So [121] CIRCLED CROSS FORMEE WITH FOUR DOTS..DISGUISED FACE -1F97A..1F9CB ; Common # So [82] FACE WITH PLEADING 
EYES..BUBBLE TEA -1F9CD..1FA53 ; Common # So [135] STANDING PERSON..BLACK CHESS KNIGHT-BISHOP +1F900..1FA53 ; Common # So [340] CIRCLED CROSS FORMEE WITH FOUR DOTS..BLACK CHESS KNIGHT-BISHOP 1FA60..1FA6D ; Common # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA74 ; Common # So [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A ; Common # So [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C ; Common # So [5] DROP OF BLOOD..CRUTCH 1FA80..1FA86 ; Common # So [7] YO-YO..NESTING DOLLS -1FA90..1FAA8 ; Common # So [25] RINGED PLANET..ROCK -1FAB0..1FAB6 ; Common # So [7] FLY..FEATHER -1FAC0..1FAC2 ; Common # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6 ; Common # So [7] BLUEBERRIES..TEAPOT +1FA90..1FAAC ; Common # So [29] RINGED PLANET..HAMSA +1FAB0..1FABA ; Common # So [11] FLY..NEST WITH EGGS +1FAC0..1FAC5 ; Common # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9 ; Common # So [10] BLUEBERRIES..JAR +1FAE0..1FAE7 ; Common # So [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; Common # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92 ; Common # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; Common # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON 1FBF0..1FBF9 ; Common # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE E0001 ; Common # Cf LANGUAGE TAG E0020..E007F ; Common # Cf [96] TAG SPACE..CANCEL TAG -# Total code points: 8087 +# Total code points: 8252 # ================================================ @@ -664,8 +673,11 @@ A770 ; Latin # Lm MODIFIER LETTER US A771..A787 ; Latin # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR T A78B..A78E ; Latin # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; Latin # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; Latin # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; Latin # L& [9] LATIN CAPITAL LETTER 
ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; Latin # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; Latin # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Latin # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; Latin # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; Latin # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; Latin # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; Latin # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; Latin # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -679,8 +691,14 @@ AB69 ; Latin # Lm MODIFIER LETTER SMALL TURNED W FB00..FB06 ; Latin # L& [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST FF21..FF3A ; Latin # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z FF41..FF5A ; Latin # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z +10780..10785 ; Latin # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Latin # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Latin # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL +1DF00..1DF09 ; Latin # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; Latin # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; Latin # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL -# Total code points: 1374 +# Total code points: 1475 # ================================================ @@ -820,7 +838,7 @@ FB46..FB4F ; Hebrew # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATU 060E..060F ; Arabic # So [2] ARABIC POETIC VERSE SIGN..ARABIC SIGN MISRA 0610..061A ; Arabic # Mn [11] 
ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA 061C ; Arabic # Cf ARABIC LETTER MARK -061E ; Arabic # Po ARABIC TRIPLE DOT PUNCTUATION MARK +061D..061E ; Arabic # Po [2] ARABIC END OF TEXT MARK..ARABIC TRIPLE DOT PUNCTUATION MARK 0620..063F ; Arabic # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0641..064A ; Arabic # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH 0656..065F ; Arabic # Mn [10] ARABIC SUBSCRIPT ALEF..ARABIC WAVY HAMZA BELOW @@ -843,18 +861,25 @@ FB46..FB4F ; Hebrew # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATU 06FD..06FE ; Arabic # So [2] ARABIC SIGN SINDHI AMPERSAND..ARABIC SIGN SINDHI POSTPOSITION MEN 06FF ; Arabic # Lo ARABIC LETTER HEH WITH INVERTED V 0750..077F ; Arabic # Lo [48] ARABIC LETTER BEH WITH THREE DOTS HORIZONTALLY BELOW..ARABIC LETTER KAF WITH TWO DOTS ABOVE -08A0..08B4 ; Arabic # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; Arabic # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1 ; Arabic # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887 ; Arabic # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; Arabic # Sk ARABIC RAISED ROUND DOT +0889..088E ; Arabic # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891 ; Arabic # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F ; Arabic # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8 ; Arabic # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; Arabic # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; Arabic # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..08FF ; Arabic # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA FB50..FBB1 ; Arabic # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE 
FINAL FORM -FBB2..FBC1 ; Arabic # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; Arabic # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D ; Arabic # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM +FD40..FD4F ; Arabic # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F ; Arabic # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7 ; Arabic # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF ; Arabic # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB ; Arabic # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC ; Arabic # Sc RIAL SIGN -FDFD ; Arabic # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF ; Arabic # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE70..FE74 ; Arabic # Lo [5] ARABIC FATHATAN ISOLATED FORM..ARABIC KASRATAN ISOLATED FORM FE76..FEFC ; Arabic # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM 10E60..10E7E ; Arabic # No [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS @@ -893,7 +918,7 @@ FE76..FEFC ; Arabic # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LA 1EEAB..1EEBB ; Arabic # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN 1EEF0..1EEF1 ; Arabic # Sm [2] ARABIC MATHEMATICAL OPERATOR MEEM WITH HAH WITH TATWEEL..ARABIC MATHEMATICAL OPERATOR HAH WITH DAL -# Total code points: 1291 +# Total code points: 1365 # ================================================ @@ -1113,6 +1138,7 @@ A8FF ; Devanagari # Mn DEVANAGARI VOWEL SIGN AY 0C0E..0C10 ; Telugu # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28 ; Telugu # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39 ; Telugu # Lo [16] TELUGU LETTER 
PA..TELUGU LETTER HA +0C3C ; Telugu # Mn TELUGU SIGN NUKTA 0C3D ; Telugu # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40 ; Telugu # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; Telugu # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -1120,6 +1146,7 @@ A8FF ; Devanagari # Mn DEVANAGARI VOWEL SIGN AY 0C4A..0C4D ; Telugu # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; Telugu # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; Telugu # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; Telugu # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; Telugu # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; Telugu # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; Telugu # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -1127,7 +1154,7 @@ A8FF ; Devanagari # Mn DEVANAGARI VOWEL SIGN AY 0C78..0C7E ; Telugu # No [7] TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR..TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR 0C7F ; Telugu # So TELUGU SIGN TUUMU -# Total code points: 98 +# Total code points: 100 # ================================================ @@ -1150,13 +1177,13 @@ A8FF ; Devanagari # Mn DEVANAGARI VOWEL SIGN AY 0CCA..0CCB ; Kannada # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD ; Kannada # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6 ; Kannada # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; Kannada # Lo KANNADA LETTER FA +0CDD..0CDE ; Kannada # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; Kannada # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; Kannada # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; Kannada # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF1..0CF2 ; Kannada # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA -# Total code points: 89 +# Total code points: 90 # ================================================ @@ -1411,8 
+1438,12 @@ AB09..AB0E ; Ethiopic # Lo [6] ETHIOPIC SYLLABLE DDHU..ETHIOPIC SYLLABLE DD AB11..AB16 ; Ethiopic # Lo [6] ETHIOPIC SYLLABLE DZU..ETHIOPIC SYLLABLE DZO AB20..AB26 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE CCHHA..ETHIOPIC SYLLABLE CCHHO AB28..AB2E ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE BBA..ETHIOPIC SYLLABLE BBO +1E7E0..1E7E6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; Ethiopic # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; Ethiopic # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE -# Total code points: 495 +# Total code points: 523 # ================================================ @@ -1430,8 +1461,9 @@ AB70..ABBF ; Cherokee # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETT 166E ; Canadian_Aboriginal # Po CANADIAN SYLLABICS FULL STOP 166F..167F ; Canadian_Aboriginal # Lo [17] CANADIAN SYLLABICS QAI..CANADIAN SYLLABICS BLACKFOOT W 18B0..18F5 ; Canadian_Aboriginal # Lo [70] CANADIAN SYLLABICS OY..CANADIAN SYLLABICS CARRIER DENTAL S +11AB0..11ABF ; Canadian_Aboriginal # Lo [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA -# Total code points: 710 +# Total code points: 726 # ================================================ @@ -1480,6 +1512,7 @@ AB70..ABBF ; Cherokee # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETT 1807..180A ; Mongolian # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU 180B..180D ; Mongolian # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; Mongolian # Cf MONGOLIAN VOWEL SEPARATOR +180F ; Mongolian # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; Mongolian # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; Mongolian # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; Mongolian # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -1491,18 +1524,18 @@ AB70..ABBF 
; Cherokee # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETT 18AA ; Mongolian # Lo MONGOLIAN LETTER MANCHU ALI GALI LHA 11660..1166C ; Mongolian # Po [13] MONGOLIAN BIRGA WITH ORNAMENT..MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT -# Total code points: 167 +# Total code points: 168 # ================================================ 3041..3096 ; Hiragana # Lo [86] HIRAGANA LETTER SMALL A..HIRAGANA LETTER SMALL KE 309D..309E ; Hiragana # Lm [2] HIRAGANA ITERATION MARK..HIRAGANA VOICED ITERATION MARK 309F ; Hiragana # Lo HIRAGANA DIGRAPH YORI -1B001..1B11E ; Hiragana # Lo [286] HIRAGANA LETTER ARCHAIC YE..HENTAIGANA LETTER N-MU-MO-2 +1B001..1B11F ; Hiragana # Lo [287] HIRAGANA LETTER ARCHAIC YE..HIRAGANA LETTER ARCHAIC WU 1B150..1B152 ; Hiragana # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1F200 ; Hiragana # So SQUARE HIRAGANA HOKA -# Total code points: 379 +# Total code points: 380 # ================================================ @@ -1514,10 +1547,14 @@ AB70..ABBF ; Cherokee # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETT 3300..3357 ; Katakana # So [88] SQUARE APAATO..SQUARE WATTO FF66..FF6F ; Katakana # Lo [10] HALFWIDTH KATAKANA LETTER WO..HALFWIDTH KATAKANA LETTER SMALL TU FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAKANA LETTER N +1AFF0..1AFF3 ; Katakana # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Katakana # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Katakana # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1B000 ; Katakana # Lo KATAKANA LETTER ARCHAIC E +1B120..1B122 ; Katakana # Lo [3] KATAKANA LETTER ARCHAIC YI..KATAKANA LETTER ARCHAIC WU 1B164..1B167 ; Katakana # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N -# Total code points: 304 +# Total code points: 320 # ================================================ @@ -1538,19 +1575,21 @@ FF71..FF9D ; Katakana 
# Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 3038..303A ; Han # Nl [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY 303B ; Han # Lm VERTICAL IDEOGRAPHIC ITERATION MARK 3400..4DBF ; Han # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; Han # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC +4E00..9FFF ; Han # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF F900..FA6D ; Han # Lo [366] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA6D FA70..FAD9 ; Han # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9 +16FE2 ; Han # Po OLD CHINESE HOOK MARK +16FE3 ; Han # Lm OLD CHINESE ITERATION MARK 16FF0..16FF1 ; Han # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY -20000..2A6DD ; Han # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; Han # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; Han # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; Han # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Han # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Han # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Han # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; Han # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; Han # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 94204 +# Total code points: 94215 # ================================================ @@ -1593,15 +1632,14 @@ A490..A4C6 ; Yi # So [55] YI RADICAL QOT..YI RADICAL KE 0951..0954 ; Inherited # Mn [4] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI ACUTE ACCENT 1AB0..1ABD ; Inherited # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE 
; Inherited # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; Inherited # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Inherited # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1CD0..1CD2 ; Inherited # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA 1CD4..1CE0 ; Inherited # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA 1CE2..1CE8 ; Inherited # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL 1CED ; Inherited # Mn VEDIC SIGN TIRYAK 1CF4 ; Inherited # Mn VEDIC TONE CANDRA ABOVE 1CF8..1CF9 ; Inherited # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; Inherited # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Inherited # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Inherited # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200C..200D ; Inherited # Cf [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER 20D0..20DC ; Inherited # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; Inherited # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH @@ -1615,26 +1653,30 @@ FE20..FE2D ; Inherited # Mn [14] COMBINING LIGATURE LEFT HALF..COMBINING CON 101FD ; Inherited # Mn PHAISTOS DISC SIGN COMBINING OBLIQUE STROKE 102E0 ; Inherited # Mn COPTIC EPACT THOUSANDS MARK 1133B ; Inherited # Mn COMBINING BINDU BELOW +1CF00..1CF2D ; Inherited # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Inherited # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D167..1D169 ; Inherited # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D17B..1D182 ; Inherited # Mn [8] MUSICAL SYMBOL COMBINING 
ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D185..1D18B ; Inherited # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D1AA..1D1AD ; Inherited # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO E0100..E01EF ; Inherited # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 573 +# Total code points: 657 # ================================================ -1700..170C ; Tagalog # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; Tagalog # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; Tagalog # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714 ; Tagalog # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA +1715 ; Tagalog # Mc TAGALOG SIGN PAMUDPOD +171F ; Tagalog # Lo TAGALOG LETTER ARCHAIC RA -# Total code points: 20 +# Total code points: 23 # ================================================ 1720..1731 ; Hanunoo # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734 ; Hanunoo # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; Hanunoo # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; Hanunoo # Mc HANUNOO SIGN PAMUDPOD # Total code points: 21 @@ -1762,15 +1804,14 @@ E0100..E01EF ; Inherited # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-2 # ================================================ -2C00..2C2E ; Glagolitic # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; Glagolitic # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C00..2C5F ; Glagolitic # L& [96] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 1E000..1E006 ; Glagolitic # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; Glagolitic # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; Glagolitic # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI 1E023..1E024 ; Glagolitic # 
Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Glagolitic # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA -# Total code points: 132 +# Total code points: 134 # ================================================ @@ -1836,14 +1877,15 @@ A82C ; Syloti_Nagri # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA 1B3D..1B41 ; Balinese # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; Balinese # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44 ; Balinese # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; Balinese # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; Balinese # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; Balinese # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60 ; Balinese # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A ; Balinese # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B6B..1B73 ; Balinese # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B74..1B7C ; Balinese # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E ; Balinese # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG -# Total code points: 121 +# Total code points: 124 # ================================================ @@ -2178,9 +2220,10 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI 110BB..110BC ; Kaithi # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD ; Kaithi # Cf KAITHI NUMBER SIGN 110BE..110C1 ; Kaithi # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA +110C2 ; Kaithi # Mn KAITHI VOWEL SIGN VOCALIC R 110CD ; Kaithi # Cf KAITHI NUMBER SIGN ABOVE -# Total code points: 67 +# Total code points: 68 # ================================================ @@ -2207,9 +2250,13 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT 
ZERO..MEETEI MAYEK DI 11047..1104D ; Brahmi # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065 ; Brahmi # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F ; Brahmi # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070 ; Brahmi # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072 ; Brahmi # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; Brahmi # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; Brahmi # Lo BRAHMI LETTER OLD TAMIL LLA 1107F ; Brahmi # Mn BRAHMI NUMBER JOINER -# Total code points: 109 +# Total code points: 115 # ================================================ @@ -2301,9 +2348,10 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI 116B6 ; Takri # Mc TAKRI SIGN VIRAMA 116B7 ; Takri # Mn TAKRI SIGN NUKTA 116B8 ; Takri # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; Takri # Po TAKRI ABBREVIATION SIGN 116C0..116C9 ; Takri # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE -# Total code points: 67 +# Total code points: 68 # ================================================ @@ -2561,8 +2609,9 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI 1173A..1173B ; Ahom # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E ; Ahom # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F ; Ahom # So AHOM SYMBOL VI +11740..11746 ; Ahom # Lo [7] AHOM LETTER CA..AHOM LETTER LLA -# Total code points: 58 +# Total code points: 65 # ================================================ @@ -2897,4 +2946,46 @@ ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DI # Total code points: 47 +# ================================================ + +12F90..12FF0 ; Cypro_Minoan # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; Cypro_Minoan # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 + +# Total code points: 99 + +# ================================================ + +10F70..10F81 ; 
Old_Uyghur # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85 ; Old_Uyghur # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +10F86..10F89 ; Old_Uyghur # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS + +# Total code points: 26 + +# ================================================ + +16A70..16ABE ; Tangsa # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; Tangsa # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE + +# Total code points: 89 + +# ================================================ + +1E290..1E2AD ; Toto # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE ; Toto # Mn TOTO SIGN RISING TONE + +# Total code points: 31 + +# ================================================ + +10570..1057A ; Vithkuqi # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Vithkuqi # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Vithkuqi # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Vithkuqi # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; Vithkuqi # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Vithkuqi # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Vithkuqi # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Vithkuqi # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE + +# Total code points: 70 + # EOF diff --git a/lib/unicore/SpecialCasing.txt b/lib/unicore/SpecialCasing.txt index 2a1a5a1d6b..1c2e968a8c 100644 --- a/lib/unicore/SpecialCasing.txt +++ b/lib/unicore/SpecialCasing.txt @@ -1,6 +1,6 @@ -# SpecialCasing-13.0.0.txt -# Date: 2019-09-08, 23:31:24 GMT -# © 2019 Unicode®, Inc. +# SpecialCasing-14.0.0.txt +# Date: 2021-03-08, 19:35:55 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/StandardizedVariants.txt b/lib/unicore/StandardizedVariants.txt index ee386cd920..5c3c0149ba 100644 --- a/lib/unicore/StandardizedVariants.txt +++ b/lib/unicore/StandardizedVariants.txt @@ -1,7 +1,7 @@ -# StandardizedVariants-13.0.0.txt -# Date: 2019-05-21, 17:56:00 GMT [KW, LI, RP] -# © 2019 Unicode®, Inc. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# StandardizedVariants-14.0.0.txt +# Date: 2021-01-26, 18:20:00 GMT [KW, LI, RP] +# © 2021 Unicode®, Inc. +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Specification of the variation sequences that are defined in the # Unicode Standard. @@ -26,13 +26,13 @@ # # For more information on standardized variation sequences, # see Section 23.4, Variation Selectors, -# in The Unicode Standard, Version 13.0. +# in The Unicode Standard, Version 14.0. # # For more information on the Ideographic Variation Database, -# see http://www.unicode.org/ivd/ +# see https://www.unicode.org/ivd/ # # For more information on emoji variation sequences, -# see http://www.unicode.org/reports/tr51/ +# see https://www.unicode.org/reports/tr51/ # # Format: # Field 0: the variation sequence @@ -77,6 +77,62 @@ 2ACC FE00; with stroke through bottom members; # SUPERSET OF ABOVE NOT EQUAL TO FF10 FE00; short diagonal stroke form; # FULLWIDTH DIGIT ZERO +# Mathematical alphabet script variants + +1D49C FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL A +212C FE00; chancery style; # SCRIPT CAPITAL B +1D49E FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL C +1D49F FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL D +2130 FE00; chancery style; # SCRIPT CAPITAL E +2131 FE00; chancery style; # SCRIPT CAPITAL F +1D4A2 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL G +210B FE00; chancery style; # SCRIPT CAPITAL H +2110 FE00; chancery style; # SCRIPT CAPITAL I +1D4A5 FE00; chancery style; # MATHEMATICAL SCRIPT 
CAPITAL J +1D4A6 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL K +2112 FE00; chancery style; # SCRIPT CAPITAL L +2133 FE00; chancery style; # SCRIPT CAPITAL M +1D4A9 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL N +1D4AA FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL O +1D4AB FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL P +1D4AC FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL Q +211B FE00; chancery style; # SCRIPT CAPITAL R +1D4AE FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL S +1D4AF FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL T +1D4B0 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL U +1D4B1 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL V +1D4B2 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL W +1D4B3 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL X +1D4B4 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL Y +1D4B5 FE00; chancery style; # MATHEMATICAL SCRIPT CAPITAL Z + +1D49C FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL A +212C FE01; roundhand style; # SCRIPT CAPITAL B +1D49E FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL C +1D49F FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL D +2130 FE01; roundhand style; # SCRIPT CAPITAL E +2131 FE01; roundhand style; # SCRIPT CAPITAL F +1D4A2 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL G +210B FE01; roundhand style; # SCRIPT CAPITAL H +2110 FE01; roundhand style; # SCRIPT CAPITAL I +1D4A5 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL J +1D4A6 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL K +2112 FE01; roundhand style; # SCRIPT CAPITAL L +2133 FE01; roundhand style; # SCRIPT CAPITAL M +1D4A9 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL N +1D4AA FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL O +1D4AB FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL P +1D4AC FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL Q +211B FE01; roundhand style; # SCRIPT CAPITAL R +1D4AE FE01; roundhand style; # MATHEMATICAL 
SCRIPT CAPITAL S +1D4AF FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL T +1D4B0 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL U +1D4B1 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL V +1D4B2 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL W +1D4B3 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL X +1D4B4 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL Y +1D4B5 FE01; roundhand style; # MATHEMATICAL SCRIPT CAPITAL Z + # East Asian punctuation positional variants 3001 FE00; corner-justified form; # IDEOGRAPHIC COMMA diff --git a/lib/unicore/UnicodeData.txt b/lib/unicore/UnicodeData.txt index e22f967bba..b5abef7ed4 100644 --- a/lib/unicore/UnicodeData.txt +++ b/lib/unicore/UnicodeData.txt @@ -1525,6 +1525,7 @@ 061A;ARABIC SMALL KASRA;Mn;32;NSM;;;;;N;;;;; 061B;ARABIC SEMICOLON;Po;0;AL;;;;;N;;;;; 061C;ARABIC LETTER MARK;Cf;0;AL;;;;;N;;;;; +061D;ARABIC END OF TEXT MARK;Po;0;AL;;;;;N;;;;; 061E;ARABIC TRIPLE DOT PUNCTUATION MARK;Po;0;AL;;;;;N;;;;; 061F;ARABIC QUESTION MARK;Po;0;AL;;;;;N;;;;; 0620;ARABIC LETTER KASHMIRI YEH;Lo;0;AL;;;;;N;;;;; @@ -2089,6 +2090,47 @@ 0868;SYRIAC LETTER MALAYALAM LLA;Lo;0;AL;;;;;N;;;;; 0869;SYRIAC LETTER MALAYALAM LLLA;Lo;0;AL;;;;;N;;;;; 086A;SYRIAC LETTER MALAYALAM SSA;Lo;0;AL;;;;;N;;;;; +0870;ARABIC LETTER ALEF WITH ATTACHED FATHA;Lo;0;AL;;;;;N;;;;; +0871;ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA;Lo;0;AL;;;;;N;;;;; +0872;ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE;Lo;0;AL;;;;;N;;;;; +0873;ARABIC LETTER ALEF WITH LEFT MIDDLE STROKE;Lo;0;AL;;;;;N;;;;; +0874;ARABIC LETTER ALEF WITH ATTACHED KASRA;Lo;0;AL;;;;;N;;;;; +0875;ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA;Lo;0;AL;;;;;N;;;;; +0876;ARABIC LETTER ALEF WITH ATTACHED ROUND DOT ABOVE;Lo;0;AL;;;;;N;;;;; +0877;ARABIC LETTER ALEF WITH ATTACHED RIGHT ROUND DOT;Lo;0;AL;;;;;N;;;;; +0878;ARABIC LETTER ALEF WITH ATTACHED LEFT ROUND DOT;Lo;0;AL;;;;;N;;;;; +0879;ARABIC LETTER ALEF WITH ATTACHED ROUND DOT BELOW;Lo;0;AL;;;;;N;;;;; +087A;ARABIC LETTER ALEF 
WITH DOT ABOVE;Lo;0;AL;;;;;N;;;;; +087B;ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA AND DOT ABOVE;Lo;0;AL;;;;;N;;;;; +087C;ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE AND DOT ABOVE;Lo;0;AL;;;;;N;;;;; +087D;ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND DOT ABOVE;Lo;0;AL;;;;;N;;;;; +087E;ARABIC LETTER ALEF WITH ATTACHED TOP RIGHT FATHA AND LEFT RING;Lo;0;AL;;;;;N;;;;; +087F;ARABIC LETTER ALEF WITH RIGHT MIDDLE STROKE AND LEFT RING;Lo;0;AL;;;;;N;;;;; +0880;ARABIC LETTER ALEF WITH ATTACHED BOTTOM RIGHT KASRA AND LEFT RING;Lo;0;AL;;;;;N;;;;; +0881;ARABIC LETTER ALEF WITH ATTACHED RIGHT HAMZA;Lo;0;AL;;;;;N;;;;; +0882;ARABIC LETTER ALEF WITH ATTACHED LEFT HAMZA;Lo;0;AL;;;;;N;;;;; +0883;ARABIC TATWEEL WITH OVERSTRUCK HAMZA;Lo;0;AL;;;;;N;;;;; +0884;ARABIC TATWEEL WITH OVERSTRUCK WAW;Lo;0;AL;;;;;N;;;;; +0885;ARABIC TATWEEL WITH TWO DOTS BELOW;Lo;0;AL;;;;;N;;;;; +0886;ARABIC LETTER THIN YEH;Lo;0;AL;;;;;N;;;;; +0887;ARABIC BASELINE ROUND DOT;Lo;0;AL;;;;;N;;;;; +0888;ARABIC RAISED ROUND DOT;Sk;0;AL;;;;;N;;;;; +0889;ARABIC LETTER NOON WITH INVERTED SMALL V;Lo;0;AL;;;;;N;;;;; +088A;ARABIC LETTER HAH WITH INVERTED SMALL V BELOW;Lo;0;AL;;;;;N;;;;; +088B;ARABIC LETTER TAH WITH DOT BELOW;Lo;0;AL;;;;;N;;;;; +088C;ARABIC LETTER TAH WITH THREE DOTS BELOW;Lo;0;AL;;;;;N;;;;; +088D;ARABIC LETTER KEHEH WITH TWO DOTS VERTICALLY BELOW;Lo;0;AL;;;;;N;;;;; +088E;ARABIC VERTICAL TAIL;Lo;0;AL;;;;;N;;;;; +0890;ARABIC POUND MARK ABOVE;Cf;0;AN;;;;;N;;;;; +0891;ARABIC PIASTRE MARK ABOVE;Cf;0;AN;;;;;N;;;;; +0898;ARABIC SMALL HIGH WORD AL-JUZ;Mn;230;NSM;;;;;N;;;;; +0899;ARABIC SMALL LOW WORD ISHMAAM;Mn;220;NSM;;;;;N;;;;; +089A;ARABIC SMALL LOW WORD IMAALA;Mn;220;NSM;;;;;N;;;;; +089B;ARABIC SMALL LOW WORD TASHEEL;Mn;220;NSM;;;;;N;;;;; +089C;ARABIC MADDA WAAJIB;Mn;230;NSM;;;;;N;;;;; +089D;ARABIC SUPERSCRIPT ALEF MOKHASSAS;Mn;230;NSM;;;;;N;;;;; +089E;ARABIC DOUBLED MADDA;Mn;230;NSM;;;;;N;;;;; +089F;ARABIC HALF MADDA OVER MADDA;Mn;230;NSM;;;;;N;;;;; 08A0;ARABIC LETTER BEH WITH SMALL V 
BELOW;Lo;0;AL;;;;;N;;;;; 08A1;ARABIC LETTER BEH WITH HAMZA ABOVE;Lo;0;AL;;;;;N;;;;; 08A2;ARABIC LETTER JEEM WITH TWO DOTS ABOVE;Lo;0;AL;;;;;N;;;;; @@ -2110,6 +2152,7 @@ 08B2;ARABIC LETTER ZAIN WITH INVERTED V ABOVE;Lo;0;AL;;;;;N;;;;; 08B3;ARABIC LETTER AIN WITH THREE DOTS BELOW;Lo;0;AL;;;;;N;;;;; 08B4;ARABIC LETTER KAF WITH DOT BELOW;Lo;0;AL;;;;;N;;;;; +08B5;ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE;Lo;0;AL;;;;;N;;;;; 08B6;ARABIC LETTER BEH WITH SMALL MEEM ABOVE;Lo;0;AL;;;;;N;;;;; 08B7;ARABIC LETTER PEH WITH SMALL MEEM ABOVE;Lo;0;AL;;;;;N;;;;; 08B8;ARABIC LETTER TEH WITH SMALL TEH ABOVE;Lo;0;AL;;;;;N;;;;; @@ -2128,6 +2171,17 @@ 08C5;ARABIC LETTER JEEM WITH THREE DOTS ABOVE;Lo;0;AL;;;;;N;;;;; 08C6;ARABIC LETTER JEEM WITH THREE DOTS BELOW;Lo;0;AL;;;;;N;;;;; 08C7;ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE;Lo;0;AL;;;;;N;;;;; +08C8;ARABIC LETTER GRAF;Lo;0;AL;;;;;N;;;;; +08C9;ARABIC SMALL FARSI YEH;Lm;0;AL;;;;;N;;;;; +08CA;ARABIC SMALL HIGH FARSI YEH;Mn;230;NSM;;;;;N;;;;; +08CB;ARABIC SMALL HIGH YEH BARREE WITH TWO DOTS BELOW;Mn;230;NSM;;;;;N;;;;; +08CC;ARABIC SMALL HIGH WORD SAH;Mn;230;NSM;;;;;N;;;;; +08CD;ARABIC SMALL HIGH ZAH;Mn;230;NSM;;;;;N;;;;; +08CE;ARABIC LARGE ROUND DOT ABOVE;Mn;230;NSM;;;;;N;;;;; +08CF;ARABIC LARGE ROUND DOT BELOW;Mn;220;NSM;;;;;N;;;;; +08D0;ARABIC SUKUN BELOW;Mn;220;NSM;;;;;N;;;;; +08D1;ARABIC LARGE CIRCLE BELOW;Mn;220;NSM;;;;;N;;;;; +08D2;ARABIC LARGE ROUND DOT INSIDE CIRCLE BELOW;Mn;220;NSM;;;;;N;;;;; 08D3;ARABIC SMALL LOW WAW;Mn;220;NSM;;;;;N;;;;; 08D4;ARABIC SMALL HIGH WORD AR-RUB;Mn;230;NSM;;;;;N;;;;; 08D5;ARABIC SMALL HIGH SAD;Mn;230;NSM;;;;;N;;;;; @@ -2786,6 +2840,7 @@ 0C37;TELUGU LETTER SSA;Lo;0;L;;;;;N;;;;; 0C38;TELUGU LETTER SA;Lo;0;L;;;;;N;;;;; 0C39;TELUGU LETTER HA;Lo;0;L;;;;;N;;;;; +0C3C;TELUGU SIGN NUKTA;Mn;7;NSM;;;;;N;;;;; 0C3D;TELUGU SIGN AVAGRAHA;Lo;0;L;;;;;N;;;;; 0C3E;TELUGU VOWEL SIGN AA;Mn;0;NSM;;;;;N;;;;; 0C3F;TELUGU VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;; @@ -2806,6 +2861,7 @@ 0C58;TELUGU LETTER 
TSA;Lo;0;L;;;;;N;;;;; 0C59;TELUGU LETTER DZA;Lo;0;L;;;;;N;;;;; 0C5A;TELUGU LETTER RRRA;Lo;0;L;;;;;N;;;;; +0C5D;TELUGU LETTER NAKAARA POLLU;Lo;0;L;;;;;N;;;;; 0C60;TELUGU LETTER VOCALIC RR;Lo;0;L;;;;;N;;;;; 0C61;TELUGU LETTER VOCALIC LL;Lo;0;L;;;;;N;;;;; 0C62;TELUGU VOWEL SIGN VOCALIC L;Mn;0;NSM;;;;;N;;;;; @@ -2901,6 +2957,7 @@ 0CCD;KANNADA SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;; 0CD5;KANNADA LENGTH MARK;Mc;0;L;;;;;N;;;;; 0CD6;KANNADA AI LENGTH MARK;Mc;0;L;;;;;N;;;;; +0CDD;KANNADA LETTER NAKAARA POLLU;Lo;0;L;;;;;N;;;;; 0CDE;KANNADA LETTER FA;Lo;0;L;;;;;N;;;;; 0CE0;KANNADA LETTER VOCALIC RR;Lo;0;L;;;;;N;;;;; 0CE1;KANNADA LETTER VOCALIC LL;Lo;0;L;;;;;N;;;;; @@ -5258,6 +5315,7 @@ 170A;TAGALOG LETTER BA;Lo;0;L;;;;;N;;;;; 170B;TAGALOG LETTER MA;Lo;0;L;;;;;N;;;;; 170C;TAGALOG LETTER YA;Lo;0;L;;;;;N;;;;; +170D;TAGALOG LETTER RA;Lo;0;L;;;;;N;;;;; 170E;TAGALOG LETTER LA;Lo;0;L;;;;;N;;;;; 170F;TAGALOG LETTER WA;Lo;0;L;;;;;N;;;;; 1710;TAGALOG LETTER SA;Lo;0;L;;;;;N;;;;; @@ -5265,6 +5323,8 @@ 1712;TAGALOG VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;; 1713;TAGALOG VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;; 1714;TAGALOG SIGN VIRAMA;Mn;9;NSM;;;;;N;;;;; +1715;TAGALOG SIGN PAMUDPOD;Mc;9;L;;;;;N;;;;; +171F;TAGALOG LETTER ARCHAIC RA;Lo;0;L;;;;;N;;;;; 1720;HANUNOO LETTER A;Lo;0;L;;;;;N;;;;; 1721;HANUNOO LETTER I;Lo;0;L;;;;;N;;;;; 1722;HANUNOO LETTER U;Lo;0;L;;;;;N;;;;; @@ -5285,7 +5345,7 @@ 1731;HANUNOO LETTER HA;Lo;0;L;;;;;N;;;;; 1732;HANUNOO VOWEL SIGN I;Mn;0;NSM;;;;;N;;;;; 1733;HANUNOO VOWEL SIGN U;Mn;0;NSM;;;;;N;;;;; -1734;HANUNOO SIGN PAMUDPOD;Mn;9;NSM;;;;;N;;;;; +1734;HANUNOO SIGN PAMUDPOD;Mc;9;L;;;;;N;;;;; 1735;PHILIPPINE SINGLE PUNCTUATION;Po;0;L;;;;;N;;;;; 1736;PHILIPPINE DOUBLE PUNCTUATION;Po;0;L;;;;;N;;;;; 1740;BUHID LETTER A;Lo;0;L;;;;;N;;;;; @@ -5455,6 +5515,7 @@ 180C;MONGOLIAN FREE VARIATION SELECTOR TWO;Mn;0;NSM;;;;;N;;;;; 180D;MONGOLIAN FREE VARIATION SELECTOR THREE;Mn;0;NSM;;;;;N;;;;; 180E;MONGOLIAN VOWEL SEPARATOR;Cf;0;BN;;;;;N;;;;; +180F;MONGOLIAN FREE VARIATION SELECTOR FOUR;Mn;0;NSM;;;;;N;;;;; 
1810;MONGOLIAN DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; 1811;MONGOLIAN DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; 1812;MONGOLIAN DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; @@ -6059,6 +6120,20 @@ 1ABE;COMBINING PARENTHESES OVERLAY;Me;0;NSM;;;;;N;;;;; 1ABF;COMBINING LATIN SMALL LETTER W BELOW;Mn;220;NSM;;;;;N;;;;; 1AC0;COMBINING LATIN SMALL LETTER TURNED W BELOW;Mn;220;NSM;;;;;N;;;;; +1AC1;COMBINING LEFT PARENTHESIS ABOVE LEFT;Mn;230;NSM;;;;;N;;;;; +1AC2;COMBINING RIGHT PARENTHESIS ABOVE RIGHT;Mn;230;NSM;;;;;N;;;;; +1AC3;COMBINING LEFT PARENTHESIS BELOW LEFT;Mn;220;NSM;;;;;N;;;;; +1AC4;COMBINING RIGHT PARENTHESIS BELOW RIGHT;Mn;220;NSM;;;;;N;;;;; +1AC5;COMBINING SQUARE BRACKETS ABOVE;Mn;230;NSM;;;;;N;;;;; +1AC6;COMBINING NUMBER SIGN ABOVE;Mn;230;NSM;;;;;N;;;;; +1AC7;COMBINING INVERTED DOUBLE ARCH ABOVE;Mn;230;NSM;;;;;N;;;;; +1AC8;COMBINING PLUS SIGN ABOVE;Mn;230;NSM;;;;;N;;;;; +1AC9;COMBINING DOUBLE PLUS SIGN ABOVE;Mn;230;NSM;;;;;N;;;;; +1ACA;COMBINING DOUBLE PLUS SIGN BELOW;Mn;220;NSM;;;;;N;;;;; +1ACB;COMBINING TRIPLE ACUTE ACCENT;Mn;230;NSM;;;;;N;;;;; +1ACC;COMBINING LATIN SMALL LETTER INSULAR G;Mn;230;NSM;;;;;N;;;;; +1ACD;COMBINING LATIN SMALL LETTER INSULAR R;Mn;230;NSM;;;;;N;;;;; +1ACE;COMBINING LATIN SMALL LETTER INSULAR T;Mn;230;NSM;;;;;N;;;;; 1B00;BALINESE SIGN ULU RICEM;Mn;0;NSM;;;;;N;;;;; 1B01;BALINESE SIGN ULU CANDRA;Mn;0;NSM;;;;;N;;;;; 1B02;BALINESE SIGN CECEK;Mn;0;NSM;;;;;N;;;;; @@ -6135,6 +6210,7 @@ 1B49;BALINESE LETTER VE SASAK;Lo;0;L;;;;;N;;;;; 1B4A;BALINESE LETTER ZAL SASAK;Lo;0;L;;;;;N;;;;; 1B4B;BALINESE LETTER ASYURA SASAK;Lo;0;L;;;;;N;;;;; +1B4C;BALINESE LETTER ARCHAIC JNYA;Lo;0;L;;;;;N;;;;; 1B50;BALINESE DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; 1B51;BALINESE DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; 1B52;BALINESE DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; @@ -6180,6 +6256,8 @@ 1B7A;BALINESE MUSICAL SYMBOL LEFT-HAND CLOSED PLAK;So;0;L;;;;;N;;;;; 1B7B;BALINESE MUSICAL SYMBOL LEFT-HAND CLOSED PLUK;So;0;L;;;;;N;;;;; 1B7C;BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING;So;0;L;;;;;N;;;;; +1B7D;BALINESE PANTI 
LANTANG;Po;0;L;;;;;N;;;;; +1B7E;BALINESE PAMADA LANTANG;Po;0;L;;;;;N;;;;; 1B80;SUNDANESE SIGN PANYECEK;Mn;0;NSM;;;;;N;;;;; 1B81;SUNDANESE SIGN PANGLAYAR;Mn;0;NSM;;;;;N;;;;; 1B82;SUNDANESE SIGN PANGWISAD;Mc;0;L;;;;;N;;;;; @@ -6778,6 +6856,7 @@ 1DF7;COMBINING KAVYKA ABOVE LEFT;Mn;228;NSM;;;;;N;;;;; 1DF8;COMBINING DOT ABOVE LEFT;Mn;228;NSM;;;;;N;;;;; 1DF9;COMBINING WIDE INVERTED BRIDGE BELOW;Mn;220;NSM;;;;;N;;;;; +1DFA;COMBINING DOT BELOW LEFT;Mn;218;NSM;;;;;N;;;;; 1DFB;COMBINING DELETION MARK;Mn;230;NSM;;;;;N;;;;; 1DFC;COMBINING DOUBLE INVERTED BREVE BELOW;Mn;233;NSM;;;;;N;;;;; 1DFD;COMBINING ALMOST EQUAL TO BELOW;Mn;220;NSM;;;;;N;;;;; @@ -7457,6 +7536,7 @@ 20BD;RUBLE SIGN;Sc;0;ET;;;;;N;;;;; 20BE;LARI SIGN;Sc;0;ET;;;;;N;;;;; 20BF;BITCOIN SIGN;Sc;0;ET;;;;;N;;;;; +20C0;SOM SIGN;Sc;0;ET;;;;;N;;;;; 20D0;COMBINING LEFT HARPOON ABOVE;Mn;230;NSM;;;;;N;NON-SPACING LEFT HARPOON ABOVE;;;; 20D1;COMBINING RIGHT HARPOON ABOVE;Mn;230;NSM;;;;;N;NON-SPACING RIGHT HARPOON ABOVE;;;; 20D2;COMBINING LONG VERTICAL LINE OVERLAY;Mn;1;NSM;;;;;N;NON-SPACING LONG VERTICAL BAR OVERLAY;;;; @@ -10300,6 +10380,7 @@ 2C2C;GLAGOLITIC CAPITAL LETTER SHTAPIC;Lu;0;L;;;;;N;;;;2C5C; 2C2D;GLAGOLITIC CAPITAL LETTER TROKUTASTI A;Lu;0;L;;;;;N;;;;2C5D; 2C2E;GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE;Lu;0;L;;;;;N;;;;2C5E; +2C2F;GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI;Lu;0;L;;;;;N;;;;2C5F; 2C30;GLAGOLITIC SMALL LETTER AZU;Ll;0;L;;;;;N;;;2C00;;2C00 2C31;GLAGOLITIC SMALL LETTER BUKY;Ll;0;L;;;;;N;;;2C01;;2C01 2C32;GLAGOLITIC SMALL LETTER VEDE;Ll;0;L;;;;;N;;;2C02;;2C02 @@ -10347,6 +10428,7 @@ 2C5C;GLAGOLITIC SMALL LETTER SHTAPIC;Ll;0;L;;;;;N;;;2C2C;;2C2C 2C5D;GLAGOLITIC SMALL LETTER TROKUTASTI A;Ll;0;L;;;;;N;;;2C2D;;2C2D 2C5E;GLAGOLITIC SMALL LETTER LATINATE MYSLITE;Ll;0;L;;;;;N;;;2C2E;;2C2E +2C5F;GLAGOLITIC SMALL LETTER CAUDATE CHRIVI;Ll;0;L;;;;;N;;;2C2F;;2C2F 2C60;LATIN CAPITAL LETTER L WITH DOUBLE BAR;Lu;0;L;;;;;N;;;;2C61; 2C61;LATIN SMALL LETTER L WITH DOUBLE BAR;Ll;0;L;;;;;N;;;2C60;;2C60 2C62;LATIN CAPITAL 
LETTER L WITH MIDDLE TILDE;Lu;0;L;;;;;N;;;;026B; @@ -10795,6 +10877,17 @@ 2E50;CROSS PATTY WITH RIGHT CROSSBAR;So;0;ON;;;;;N;;;;; 2E51;CROSS PATTY WITH LEFT CROSSBAR;So;0;ON;;;;;N;;;;; 2E52;TIRONIAN SIGN CAPITAL ET;Po;0;ON;;;;;N;;;;; +2E53;MEDIEVAL EXCLAMATION MARK;Po;0;ON;;;;;N;;;;; +2E54;MEDIEVAL QUESTION MARK;Po;0;ON;;;;;N;;;;; +2E55;LEFT SQUARE BRACKET WITH STROKE;Ps;0;ON;;;;;Y;;;;; +2E56;RIGHT SQUARE BRACKET WITH STROKE;Pe;0;ON;;;;;Y;;;;; +2E57;LEFT SQUARE BRACKET WITH DOUBLE STROKE;Ps;0;ON;;;;;Y;;;;; +2E58;RIGHT SQUARE BRACKET WITH DOUBLE STROKE;Pe;0;ON;;;;;Y;;;;; +2E59;TOP HALF LEFT PARENTHESIS;Ps;0;ON;;;;;Y;;;;; +2E5A;TOP HALF RIGHT PARENTHESIS;Pe;0;ON;;;;;Y;;;;; +2E5B;BOTTOM HALF LEFT PARENTHESIS;Ps;0;ON;;;;;Y;;;;; +2E5C;BOTTOM HALF RIGHT PARENTHESIS;Pe;0;ON;;;;;Y;;;;; +2E5D;OBLIQUE HYPHEN;Pd;0;ON;;;;;N;;;;; 2E80;CJK RADICAL REPEAT;So;0;ON;;;;;N;;;;; 2E81;CJK RADICAL CLIFF;So;0;ON;;;;;N;;;;; 2E82;CJK RADICAL SECOND ONE;So;0;ON;;;;;N;;;;; @@ -12204,7 +12297,7 @@ 4DFE;HEXAGRAM FOR AFTER COMPLETION;So;0;ON;;;;;N;;;;; 4DFF;HEXAGRAM FOR BEFORE COMPLETION;So;0;ON;;;;;N;;;;; 4E00;;Lo;0;L;;;;;N;;;;; -9FFC;;Lo;0;L;;;;;N;;;;; +9FFF;;Lo;0;L;;;;;N;;;;; A000;YI SYLLABLE IT;Lo;0;L;;;;;N;;;;; A001;YI SYLLABLE IX;Lo;0;L;;;;;N;;;;; A002;YI SYLLABLE I;Lo;0;L;;;;;N;;;;; @@ -14149,6 +14242,8 @@ A7BC;LATIN CAPITAL LETTER GLOTTAL I;Lu;0;L;;;;;N;;;;A7BD; A7BD;LATIN SMALL LETTER GLOTTAL I;Ll;0;L;;;;;N;;;A7BC;;A7BC A7BE;LATIN CAPITAL LETTER GLOTTAL U;Lu;0;L;;;;;N;;;;A7BF; A7BF;LATIN SMALL LETTER GLOTTAL U;Ll;0;L;;;;;N;;;A7BE;;A7BE +A7C0;LATIN CAPITAL LETTER OLD POLISH O;Lu;0;L;;;;;N;;;;A7C1; +A7C1;LATIN SMALL LETTER OLD POLISH O;Ll;0;L;;;;;N;;;A7C0;;A7C0 A7C2;LATIN CAPITAL LETTER ANGLICANA W;Lu;0;L;;;;;N;;;;A7C3; A7C3;LATIN SMALL LETTER ANGLICANA W;Ll;0;L;;;;;N;;;A7C2;;A7C2 A7C4;LATIN CAPITAL LETTER C WITH PALATAL HOOK;Lu;0;L;;;;;N;;;;A794; @@ -14158,6 +14253,17 @@ A7C7;LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY;Lu;0;L;;;;;N;;;;A7C8; A7C8;LATIN SMALL LETTER D WITH SHORT 
STROKE OVERLAY;Ll;0;L;;;;;N;;;A7C7;;A7C7 A7C9;LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY;Lu;0;L;;;;;N;;;;A7CA; A7CA;LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY;Ll;0;L;;;;;N;;;A7C9;;A7C9 +A7D0;LATIN CAPITAL LETTER CLOSED INSULAR G;Lu;0;L;;;;;N;;;;A7D1; +A7D1;LATIN SMALL LETTER CLOSED INSULAR G;Ll;0;L;;;;;N;;;A7D0;;A7D0 +A7D3;LATIN SMALL LETTER DOUBLE THORN;Ll;0;L;;;;;N;;;;; +A7D5;LATIN SMALL LETTER DOUBLE WYNN;Ll;0;L;;;;;N;;;;; +A7D6;LATIN CAPITAL LETTER MIDDLE SCOTS S;Lu;0;L;;;;;N;;;;A7D7; +A7D7;LATIN SMALL LETTER MIDDLE SCOTS S;Ll;0;L;;;;;N;;;A7D6;;A7D6 +A7D8;LATIN CAPITAL LETTER SIGMOID S;Lu;0;L;;;;;N;;;;A7D9; +A7D9;LATIN SMALL LETTER SIGMOID S;Ll;0;L;;;;;N;;;A7D8;;A7D8 +A7F2;MODIFIER LETTER CAPITAL C;Lm;0;L; 0043;;;;N;;;;; +A7F3;MODIFIER LETTER CAPITAL F;Lm;0;L; 0046;;;;N;;;;; +A7F4;MODIFIER LETTER CAPITAL Q;Lm;0;L; 0051;;;;N;;;;; A7F5;LATIN CAPITAL LETTER REVERSED HALF H;Lu;0;L;;;;;N;;;;A7F6; A7F6;LATIN SMALL LETTER REVERSED HALF H;Ll;0;L;;;;;N;;;A7F5;;A7F5 A7F7;LATIN EPIGRAPHIC LETTER SIDEWAYS I;Lo;0;L;;;;;N;;;;; @@ -15794,6 +15900,7 @@ FBBE;ARABIC SYMBOL TWO DOTS VERTICALLY BELOW;Sk;0;AL;;;;;N;;;;; FBBF;ARABIC SYMBOL RING;Sk;0;AL;;;;;N;;;;; FBC0;ARABIC SYMBOL SMALL TAH ABOVE;Sk;0;AL;;;;;N;;;;; FBC1;ARABIC SYMBOL SMALL TAH BELOW;Sk;0;AL;;;;;N;;;;; +FBC2;ARABIC SYMBOL WASLA ABOVE;Sk;0;AL;;;;;N;;;;; FBD3;ARABIC LETTER NG ISOLATED FORM;Lo;0;AL; 06AD;;;;N;;;;; FBD4;ARABIC LETTER NG FINAL FORM;Lo;0;AL; 06AD;;;;N;;;;; FBD5;ARABIC LETTER NG INITIAL FORM;Lo;0;AL; 06AD;;;;N;;;;; @@ -16159,6 +16266,22 @@ FD3C;ARABIC LIGATURE ALEF WITH FATHATAN FINAL FORM;Lo;0;AL; 0627 064B;;;; FD3D;ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM;Lo;0;AL; 0627 064B;;;;N;;;;; FD3E;ORNATE LEFT PARENTHESIS;Pe;0;ON;;;;;N;;;;; FD3F;ORNATE RIGHT PARENTHESIS;Ps;0;ON;;;;;N;;;;; +FD40;ARABIC LIGATURE RAHIMAHU ALLAAH;So;0;ON;;;;;N;;;;; +FD41;ARABIC LIGATURE RADI ALLAAHU ANH;So;0;ON;;;;;N;;;;; +FD42;ARABIC LIGATURE RADI ALLAAHU ANHAA;So;0;ON;;;;;N;;;;; +FD43;ARABIC LIGATURE RADI ALLAAHU 
ANHUM;So;0;ON;;;;;N;;;;; +FD44;ARABIC LIGATURE RADI ALLAAHU ANHUMAA;So;0;ON;;;;;N;;;;; +FD45;ARABIC LIGATURE RADI ALLAAHU ANHUNNA;So;0;ON;;;;;N;;;;; +FD46;ARABIC LIGATURE SALLALLAAHU ALAYHI WA-AALIH;So;0;ON;;;;;N;;;;; +FD47;ARABIC LIGATURE ALAYHI AS-SALAAM;So;0;ON;;;;;N;;;;; +FD48;ARABIC LIGATURE ALAYHIM AS-SALAAM;So;0;ON;;;;;N;;;;; +FD49;ARABIC LIGATURE ALAYHIMAA AS-SALAAM;So;0;ON;;;;;N;;;;; +FD4A;ARABIC LIGATURE ALAYHI AS-SALAATU WAS-SALAAM;So;0;ON;;;;;N;;;;; +FD4B;ARABIC LIGATURE QUDDISA SIRRAH;So;0;ON;;;;;N;;;;; +FD4C;ARABIC LIGATURE SALLALLAHU ALAYHI WAAALIHEE WA-SALLAM;So;0;ON;;;;;N;;;;; +FD4D;ARABIC LIGATURE ALAYHAA AS-SALAAM;So;0;ON;;;;;N;;;;; +FD4E;ARABIC LIGATURE TABAARAKA WA-TAAALAA;So;0;ON;;;;;N;;;;; +FD4F;ARABIC LIGATURE RAHIMAHUM ALLAAH;So;0;ON;;;;;N;;;;; FD50;ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM;Lo;0;AL; 062A 062C 0645;;;;N;;;;; FD51;ARABIC LIGATURE TEH WITH HAH WITH JEEM FINAL FORM;Lo;0;AL; 062A 062D 062C;;;;N;;;;; FD52;ARABIC LIGATURE TEH WITH HAH WITH JEEM INITIAL FORM;Lo;0;AL; 062A 062D 062C;;;;N;;;;; @@ -16277,6 +16400,7 @@ FDC4;ARABIC LIGATURE AIN WITH JEEM WITH MEEM INITIAL FORM;Lo;0;AL; 0639 FDC5;ARABIC LIGATURE SAD WITH MEEM WITH MEEM INITIAL FORM;Lo;0;AL; 0635 0645 0645;;;;N;;;;; FDC6;ARABIC LIGATURE SEEN WITH KHAH WITH YEH FINAL FORM;Lo;0;AL; 0633 062E 064A;;;;N;;;;; FDC7;ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM;Lo;0;AL; 0646 062C 064A;;;;N;;;;; +FDCF;ARABIC LIGATURE SALAAMUHU ALAYNAA;So;0;ON;;;;;N;;;;; FDF0;ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM;Lo;0;AL; 0635 0644 06D2;;;;N;;;;; FDF1;ARABIC LIGATURE QALA USED AS KORANIC STOP SIGN ISOLATED FORM;Lo;0;AL; 0642 0644 06D2;;;;N;;;;; FDF2;ARABIC LIGATURE ALLAH ISOLATED FORM;Lo;0;AL; 0627 0644 0644 0647;;;;N;;;;; @@ -16291,6 +16415,8 @@ FDFA;ARABIC LIGATURE SALLALLAHOU ALAYHE WASALLAM;Lo;0;AL; 0635 0644 06 FDFB;ARABIC LIGATURE JALLAJALALOUHOU;Lo;0;AL; 062C 0644 0020 062C 0644 0627 0644 0647;;;;N;ARABIC LETTER JALLAJALALOUHOU;;;; FDFC;RIAL 
SIGN;Sc;0;AL; 0631 06CC 0627 0644;;;;N;;;;; FDFD;ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM;So;0;ON;;;;;N;;;;; +FDFE;ARABIC LIGATURE SUBHAANAHU WA TAAALAA;So;0;ON;;;;;N;;;;; +FDFF;ARABIC LIGATURE AZZA WA JALL;So;0;ON;;;;;N;;;;; FE00;VARIATION SELECTOR-1;Mn;0;NSM;;;;;N;;;;; FE01;VARIATION SELECTOR-2;Mn;0;NSM;;;;;N;;;;; FE02;VARIATION SELECTOR-3;Mn;0;NSM;;;;;N;;;;; @@ -17798,6 +17924,76 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 10562;CAUCASIAN ALBANIAN LETTER PIWR;Lo;0;L;;;;;N;;;;; 10563;CAUCASIAN ALBANIAN LETTER KIW;Lo;0;L;;;;;N;;;;; 1056F;CAUCASIAN ALBANIAN CITATION MARK;Po;0;L;;;;;N;;;;; +10570;VITHKUQI CAPITAL LETTER A;Lu;0;L;;;;;N;;;;10597; +10571;VITHKUQI CAPITAL LETTER BBE;Lu;0;L;;;;;N;;;;10598; +10572;VITHKUQI CAPITAL LETTER BE;Lu;0;L;;;;;N;;;;10599; +10573;VITHKUQI CAPITAL LETTER CE;Lu;0;L;;;;;N;;;;1059A; +10574;VITHKUQI CAPITAL LETTER CHE;Lu;0;L;;;;;N;;;;1059B; +10575;VITHKUQI CAPITAL LETTER DE;Lu;0;L;;;;;N;;;;1059C; +10576;VITHKUQI CAPITAL LETTER DHE;Lu;0;L;;;;;N;;;;1059D; +10577;VITHKUQI CAPITAL LETTER EI;Lu;0;L;;;;;N;;;;1059E; +10578;VITHKUQI CAPITAL LETTER E;Lu;0;L;;;;;N;;;;1059F; +10579;VITHKUQI CAPITAL LETTER FE;Lu;0;L;;;;;N;;;;105A0; +1057A;VITHKUQI CAPITAL LETTER GA;Lu;0;L;;;;;N;;;;105A1; +1057C;VITHKUQI CAPITAL LETTER HA;Lu;0;L;;;;;N;;;;105A3; +1057D;VITHKUQI CAPITAL LETTER HHA;Lu;0;L;;;;;N;;;;105A4; +1057E;VITHKUQI CAPITAL LETTER I;Lu;0;L;;;;;N;;;;105A5; +1057F;VITHKUQI CAPITAL LETTER IJE;Lu;0;L;;;;;N;;;;105A6; +10580;VITHKUQI CAPITAL LETTER JE;Lu;0;L;;;;;N;;;;105A7; +10581;VITHKUQI CAPITAL LETTER KA;Lu;0;L;;;;;N;;;;105A8; +10582;VITHKUQI CAPITAL LETTER LA;Lu;0;L;;;;;N;;;;105A9; +10583;VITHKUQI CAPITAL LETTER LLA;Lu;0;L;;;;;N;;;;105AA; +10584;VITHKUQI CAPITAL LETTER ME;Lu;0;L;;;;;N;;;;105AB; +10585;VITHKUQI CAPITAL LETTER NE;Lu;0;L;;;;;N;;;;105AC; +10586;VITHKUQI CAPITAL LETTER NJE;Lu;0;L;;;;;N;;;;105AD; +10587;VITHKUQI CAPITAL LETTER O;Lu;0;L;;;;;N;;;;105AE; +10588;VITHKUQI CAPITAL LETTER PE;Lu;0;L;;;;;N;;;;105AF; +10589;VITHKUQI 
CAPITAL LETTER QA;Lu;0;L;;;;;N;;;;105B0; +1058A;VITHKUQI CAPITAL LETTER RE;Lu;0;L;;;;;N;;;;105B1; +1058C;VITHKUQI CAPITAL LETTER SE;Lu;0;L;;;;;N;;;;105B3; +1058D;VITHKUQI CAPITAL LETTER SHE;Lu;0;L;;;;;N;;;;105B4; +1058E;VITHKUQI CAPITAL LETTER TE;Lu;0;L;;;;;N;;;;105B5; +1058F;VITHKUQI CAPITAL LETTER THE;Lu;0;L;;;;;N;;;;105B6; +10590;VITHKUQI CAPITAL LETTER U;Lu;0;L;;;;;N;;;;105B7; +10591;VITHKUQI CAPITAL LETTER VE;Lu;0;L;;;;;N;;;;105B8; +10592;VITHKUQI CAPITAL LETTER XE;Lu;0;L;;;;;N;;;;105B9; +10594;VITHKUQI CAPITAL LETTER Y;Lu;0;L;;;;;N;;;;105BB; +10595;VITHKUQI CAPITAL LETTER ZE;Lu;0;L;;;;;N;;;;105BC; +10597;VITHKUQI SMALL LETTER A;Ll;0;L;;;;;N;;;10570;;10570 +10598;VITHKUQI SMALL LETTER BBE;Ll;0;L;;;;;N;;;10571;;10571 +10599;VITHKUQI SMALL LETTER BE;Ll;0;L;;;;;N;;;10572;;10572 +1059A;VITHKUQI SMALL LETTER CE;Ll;0;L;;;;;N;;;10573;;10573 +1059B;VITHKUQI SMALL LETTER CHE;Ll;0;L;;;;;N;;;10574;;10574 +1059C;VITHKUQI SMALL LETTER DE;Ll;0;L;;;;;N;;;10575;;10575 +1059D;VITHKUQI SMALL LETTER DHE;Ll;0;L;;;;;N;;;10576;;10576 +1059E;VITHKUQI SMALL LETTER EI;Ll;0;L;;;;;N;;;10577;;10577 +1059F;VITHKUQI SMALL LETTER E;Ll;0;L;;;;;N;;;10578;;10578 +105A0;VITHKUQI SMALL LETTER FE;Ll;0;L;;;;;N;;;10579;;10579 +105A1;VITHKUQI SMALL LETTER GA;Ll;0;L;;;;;N;;;1057A;;1057A +105A3;VITHKUQI SMALL LETTER HA;Ll;0;L;;;;;N;;;1057C;;1057C +105A4;VITHKUQI SMALL LETTER HHA;Ll;0;L;;;;;N;;;1057D;;1057D +105A5;VITHKUQI SMALL LETTER I;Ll;0;L;;;;;N;;;1057E;;1057E +105A6;VITHKUQI SMALL LETTER IJE;Ll;0;L;;;;;N;;;1057F;;1057F +105A7;VITHKUQI SMALL LETTER JE;Ll;0;L;;;;;N;;;10580;;10580 +105A8;VITHKUQI SMALL LETTER KA;Ll;0;L;;;;;N;;;10581;;10581 +105A9;VITHKUQI SMALL LETTER LA;Ll;0;L;;;;;N;;;10582;;10582 +105AA;VITHKUQI SMALL LETTER LLA;Ll;0;L;;;;;N;;;10583;;10583 +105AB;VITHKUQI SMALL LETTER ME;Ll;0;L;;;;;N;;;10584;;10584 +105AC;VITHKUQI SMALL LETTER NE;Ll;0;L;;;;;N;;;10585;;10585 +105AD;VITHKUQI SMALL LETTER NJE;Ll;0;L;;;;;N;;;10586;;10586 +105AE;VITHKUQI SMALL LETTER O;Ll;0;L;;;;;N;;;10587;;10587 
+105AF;VITHKUQI SMALL LETTER PE;Ll;0;L;;;;;N;;;10588;;10588 +105B0;VITHKUQI SMALL LETTER QA;Ll;0;L;;;;;N;;;10589;;10589 +105B1;VITHKUQI SMALL LETTER RE;Ll;0;L;;;;;N;;;1058A;;1058A +105B3;VITHKUQI SMALL LETTER SE;Ll;0;L;;;;;N;;;1058C;;1058C +105B4;VITHKUQI SMALL LETTER SHE;Ll;0;L;;;;;N;;;1058D;;1058D +105B5;VITHKUQI SMALL LETTER TE;Ll;0;L;;;;;N;;;1058E;;1058E +105B6;VITHKUQI SMALL LETTER THE;Ll;0;L;;;;;N;;;1058F;;1058F +105B7;VITHKUQI SMALL LETTER U;Ll;0;L;;;;;N;;;10590;;10590 +105B8;VITHKUQI SMALL LETTER VE;Ll;0;L;;;;;N;;;10591;;10591 +105B9;VITHKUQI SMALL LETTER XE;Ll;0;L;;;;;N;;;10592;;10592 +105BB;VITHKUQI SMALL LETTER Y;Ll;0;L;;;;;N;;;10594;;10594 +105BC;VITHKUQI SMALL LETTER ZE;Ll;0;L;;;;;N;;;10595;;10595 10600;LINEAR A SIGN AB001;Lo;0;L;;;;;N;;;;; 10601;LINEAR A SIGN AB002;Lo;0;L;;;;;N;;;;; 10602;LINEAR A SIGN AB003;Lo;0;L;;;;;N;;;;; @@ -18139,6 +18335,63 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 10765;LINEAR A SIGN A805;Lo;0;L;;;;;N;;;;; 10766;LINEAR A SIGN A806;Lo;0;L;;;;;N;;;;; 10767;LINEAR A SIGN A807;Lo;0;L;;;;;N;;;;; +10780;MODIFIER LETTER SMALL CAPITAL AA;Lm;0;L;;;;;N;;;;; +10781;MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON;Lm;0;L; 02D0;;;;N;;;;; +10782;MODIFIER LETTER SUPERSCRIPT HALF TRIANGULAR COLON;Lm;0;L; 02D1;;;;N;;;;; +10783;MODIFIER LETTER SMALL AE;Lm;0;L; 00E6;;;;N;;;;; +10784;MODIFIER LETTER SMALL CAPITAL B;Lm;0;L; 0299;;;;N;;;;; +10785;MODIFIER LETTER SMALL B WITH HOOK;Lm;0;L; 0253;;;;N;;;;; +10787;MODIFIER LETTER SMALL DZ DIGRAPH;Lm;0;L; 02A3;;;;N;;;;; +10788;MODIFIER LETTER SMALL DZ DIGRAPH WITH RETROFLEX HOOK;Lm;0;L; AB66;;;;N;;;;; +10789;MODIFIER LETTER SMALL DZ DIGRAPH WITH CURL;Lm;0;L; 02A5;;;;N;;;;; +1078A;MODIFIER LETTER SMALL DEZH DIGRAPH;Lm;0;L; 02A4;;;;N;;;;; +1078B;MODIFIER LETTER SMALL D WITH TAIL;Lm;0;L; 0256;;;;N;;;;; +1078C;MODIFIER LETTER SMALL D WITH HOOK;Lm;0;L; 0257;;;;N;;;;; +1078D;MODIFIER LETTER SMALL D WITH HOOK AND TAIL;Lm;0;L; 1D91;;;;N;;;;; +1078E;MODIFIER LETTER SMALL REVERSED E;Lm;0;L; 0258;;;;N;;;;; 
+1078F;MODIFIER LETTER SMALL CLOSED REVERSED OPEN E;Lm;0;L; 025E;;;;N;;;;; +10790;MODIFIER LETTER SMALL FENG DIGRAPH;Lm;0;L; 02A9;;;;N;;;;; +10791;MODIFIER LETTER SMALL RAMS HORN;Lm;0;L; 0264;;;;N;;;;; +10792;MODIFIER LETTER SMALL CAPITAL G;Lm;0;L; 0262;;;;N;;;;; +10793;MODIFIER LETTER SMALL G WITH HOOK;Lm;0;L; 0260;;;;N;;;;; +10794;MODIFIER LETTER SMALL CAPITAL G WITH HOOK;Lm;0;L; 029B;;;;N;;;;; +10795;MODIFIER LETTER SMALL H WITH STROKE;Lm;0;L; 0127;;;;N;;;;; +10796;MODIFIER LETTER SMALL CAPITAL H;Lm;0;L; 029C;;;;N;;;;; +10797;MODIFIER LETTER SMALL HENG WITH HOOK;Lm;0;L; 0267;;;;N;;;;; +10798;MODIFIER LETTER SMALL DOTLESS J WITH STROKE AND HOOK;Lm;0;L; 0284;;;;N;;;;; +10799;MODIFIER LETTER SMALL LS DIGRAPH;Lm;0;L; 02AA;;;;N;;;;; +1079A;MODIFIER LETTER SMALL LZ DIGRAPH;Lm;0;L; 02AB;;;;N;;;;; +1079B;MODIFIER LETTER SMALL L WITH BELT;Lm;0;L; 026C;;;;N;;;;; +1079C;MODIFIER LETTER SMALL CAPITAL L WITH BELT;Lm;0;L; 1DF04;;;;N;;;;; +1079D;MODIFIER LETTER SMALL L WITH RETROFLEX HOOK AND BELT;Lm;0;L; A78E;;;;N;;;;; +1079E;MODIFIER LETTER SMALL LEZH;Lm;0;L; 026E;;;;N;;;;; +1079F;MODIFIER LETTER SMALL LEZH WITH RETROFLEX HOOK;Lm;0;L; 1DF05;;;;N;;;;; +107A0;MODIFIER LETTER SMALL TURNED Y;Lm;0;L; 028E;;;;N;;;;; +107A1;MODIFIER LETTER SMALL TURNED Y WITH BELT;Lm;0;L; 1DF06;;;;N;;;;; +107A2;MODIFIER LETTER SMALL O WITH STROKE;Lm;0;L; 00F8;;;;N;;;;; +107A3;MODIFIER LETTER SMALL CAPITAL OE;Lm;0;L; 0276;;;;N;;;;; +107A4;MODIFIER LETTER SMALL CLOSED OMEGA;Lm;0;L; 0277;;;;N;;;;; +107A5;MODIFIER LETTER SMALL Q;Lm;0;L; 0071;;;;N;;;;; +107A6;MODIFIER LETTER SMALL TURNED R WITH LONG LEG;Lm;0;L; 027A;;;;N;;;;; +107A7;MODIFIER LETTER SMALL TURNED R WITH LONG LEG AND RETROFLEX HOOK;Lm;0;L; 1DF08;;;;N;;;;; +107A8;MODIFIER LETTER SMALL R WITH TAIL;Lm;0;L; 027D;;;;N;;;;; +107A9;MODIFIER LETTER SMALL R WITH FISHHOOK;Lm;0;L; 027E;;;;N;;;;; +107AA;MODIFIER LETTER SMALL CAPITAL R;Lm;0;L; 0280;;;;N;;;;; +107AB;MODIFIER LETTER SMALL TC DIGRAPH WITH CURL;Lm;0;L; 02A8;;;;N;;;;; +107AC;MODIFIER LETTER 
SMALL TS DIGRAPH;Lm;0;L; 02A6;;;;N;;;;; +107AD;MODIFIER LETTER SMALL TS DIGRAPH WITH RETROFLEX HOOK;Lm;0;L; AB67;;;;N;;;;; +107AE;MODIFIER LETTER SMALL TESH DIGRAPH;Lm;0;L; 02A7;;;;N;;;;; +107AF;MODIFIER LETTER SMALL T WITH RETROFLEX HOOK;Lm;0;L; 0288;;;;N;;;;; +107B0;MODIFIER LETTER SMALL V WITH RIGHT HOOK;Lm;0;L; 2C71;;;;N;;;;; +107B2;MODIFIER LETTER SMALL CAPITAL Y;Lm;0;L; 028F;;;;N;;;;; +107B3;MODIFIER LETTER GLOTTAL STOP WITH STROKE;Lm;0;L; 02A1;;;;N;;;;; +107B4;MODIFIER LETTER REVERSED GLOTTAL STOP WITH STROKE;Lm;0;L; 02A2;;;;N;;;;; +107B5;MODIFIER LETTER BILABIAL CLICK;Lm;0;L; 0298;;;;N;;;;; +107B6;MODIFIER LETTER DENTAL CLICK;Lm;0;L; 01C0;;;;N;;;;; +107B7;MODIFIER LETTER LATERAL CLICK;Lm;0;L; 01C1;;;;N;;;;; +107B8;MODIFIER LETTER ALVEOLAR CLICK;Lm;0;L; 01C2;;;;N;;;;; +107B9;MODIFIER LETTER RETROFLEX CLICK WITH RETROFLEX HOOK;Lm;0;L; 1DF0A;;;;N;;;;; +107BA;MODIFIER LETTER SMALL S WITH CURL;Lm;0;L; 1DF1E;;;;N;;;;; 10800;CYPRIOT SYLLABLE A;Lo;0;R;;;;;N;;;;; 10801;CYPRIOT SYLLABLE E;Lo;0;R;;;;;N;;;;; 10802;CYPRIOT SYLLABLE I;Lo;0;R;;;;;N;;;;; @@ -19222,6 +19475,32 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 10F57;SOGDIAN PUNCTUATION CIRCLE WITH DOT;Po;0;AL;;;;;N;;;;; 10F58;SOGDIAN PUNCTUATION TWO CIRCLES WITH DOTS;Po;0;AL;;;;;N;;;;; 10F59;SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT;Po;0;AL;;;;;N;;;;; +10F70;OLD UYGHUR LETTER ALEPH;Lo;0;R;;;;;N;;;;; +10F71;OLD UYGHUR LETTER BETH;Lo;0;R;;;;;N;;;;; +10F72;OLD UYGHUR LETTER GIMEL-HETH;Lo;0;R;;;;;N;;;;; +10F73;OLD UYGHUR LETTER WAW;Lo;0;R;;;;;N;;;;; +10F74;OLD UYGHUR LETTER ZAYIN;Lo;0;R;;;;;N;;;;; +10F75;OLD UYGHUR LETTER FINAL HETH;Lo;0;R;;;;;N;;;;; +10F76;OLD UYGHUR LETTER YODH;Lo;0;R;;;;;N;;;;; +10F77;OLD UYGHUR LETTER KAPH;Lo;0;R;;;;;N;;;;; +10F78;OLD UYGHUR LETTER LAMEDH;Lo;0;R;;;;;N;;;;; +10F79;OLD UYGHUR LETTER MEM;Lo;0;R;;;;;N;;;;; +10F7A;OLD UYGHUR LETTER NUN;Lo;0;R;;;;;N;;;;; +10F7B;OLD UYGHUR LETTER SAMEKH;Lo;0;R;;;;;N;;;;; +10F7C;OLD UYGHUR LETTER PE;Lo;0;R;;;;;N;;;;; +10F7D;OLD UYGHUR LETTER 
SADHE;Lo;0;R;;;;;N;;;;; +10F7E;OLD UYGHUR LETTER RESH;Lo;0;R;;;;;N;;;;; +10F7F;OLD UYGHUR LETTER SHIN;Lo;0;R;;;;;N;;;;; +10F80;OLD UYGHUR LETTER TAW;Lo;0;R;;;;;N;;;;; +10F81;OLD UYGHUR LETTER LESH;Lo;0;R;;;;;N;;;;; +10F82;OLD UYGHUR COMBINING DOT ABOVE;Mn;230;NSM;;;;;N;;;;; +10F83;OLD UYGHUR COMBINING DOT BELOW;Mn;220;NSM;;;;;N;;;;; +10F84;OLD UYGHUR COMBINING TWO DOTS ABOVE;Mn;230;NSM;;;;;N;;;;; +10F85;OLD UYGHUR COMBINING TWO DOTS BELOW;Mn;220;NSM;;;;;N;;;;; +10F86;OLD UYGHUR PUNCTUATION BAR;Po;0;R;;;;;N;;;;; +10F87;OLD UYGHUR PUNCTUATION TWO BARS;Po;0;R;;;;;N;;;;; +10F88;OLD UYGHUR PUNCTUATION TWO DOTS;Po;0;R;;;;;N;;;;; +10F89;OLD UYGHUR PUNCTUATION FOUR DOTS;Po;0;R;;;;;N;;;;; 10FB0;CHORASMIAN LETTER ALEPH;Lo;0;R;;;;;N;;;;; 10FB1;CHORASMIAN LETTER SMALL ALEPH;Lo;0;R;;;;;N;;;;; 10FB2;CHORASMIAN LETTER BETH;Lo;0;R;;;;;N;;;;; @@ -19381,6 +19660,12 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1106D;BRAHMI DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; 1106E;BRAHMI DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; 1106F;BRAHMI DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; +11070;BRAHMI SIGN OLD TAMIL VIRAMA;Mn;9;NSM;;;;;N;;;;; +11071;BRAHMI LETTER OLD TAMIL SHORT E;Lo;0;L;;;;;N;;;;; +11072;BRAHMI LETTER OLD TAMIL SHORT O;Lo;0;L;;;;;N;;;;; +11073;BRAHMI VOWEL SIGN OLD TAMIL SHORT E;Mn;0;NSM;;;;;N;;;;; +11074;BRAHMI VOWEL SIGN OLD TAMIL SHORT O;Mn;0;NSM;;;;;N;;;;; +11075;BRAHMI LETTER OLD TAMIL LLA;Lo;0;L;;;;;N;;;;; 1107F;BRAHMI NUMBER JOINER;Mn;9;NSM;;;;;N;;;;; 11080;KAITHI SIGN CANDRABINDU;Mn;0;NSM;;;;;N;;;;; 11081;KAITHI SIGN ANUSVARA;Mn;0;NSM;;;;;N;;;;; @@ -19448,6 +19733,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 110BF;KAITHI DOUBLE SECTION MARK;Po;0;L;;;;;N;;;;; 110C0;KAITHI DANDA;Po;0;L;;;;;N;;;;; 110C1;KAITHI DOUBLE DANDA;Po;0;L;;;;;N;;;;; +110C2;KAITHI VOWEL SIGN VOCALIC R;Mn;0;NSM;;;;;N;;;;; 110CD;KAITHI NUMBER SIGN ABOVE;Cf;0;L;;;;;N;;;;; 110D0;SORA SOMPENG LETTER SAH;Lo;0;L;;;;;N;;;;; 110D1;SORA SOMPENG LETTER TAH;Lo;0;L;;;;;N;;;;; @@ -20385,6 +20671,7 @@ FFFD;REPLACEMENT 
CHARACTER;So;0;ON;;;;;N;;;;; 116B6;TAKRI SIGN VIRAMA;Mc;9;L;;;;;N;;;;; 116B7;TAKRI SIGN NUKTA;Mn;7;NSM;;;;;N;;;;; 116B8;TAKRI LETTER ARCHAIC KHA;Lo;0;L;;;;;N;;;;; +116B9;TAKRI ABBREVIATION SIGN;Po;0;L;;;;;N;;;;; 116C0;TAKRI DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; 116C1;TAKRI DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; 116C2;TAKRI DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; @@ -20453,6 +20740,13 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1173D;AHOM SIGN SECTION;Po;0;L;;;;;N;;;;; 1173E;AHOM SIGN RULAI;Po;0;L;;;;;N;;;;; 1173F;AHOM SYMBOL VI;So;0;L;;;;;N;;;;; +11740;AHOM LETTER CA;Lo;0;L;;;;;N;;;;; +11741;AHOM LETTER TTA;Lo;0;L;;;;;N;;;;; +11742;AHOM LETTER TTHA;Lo;0;L;;;;;N;;;;; +11743;AHOM LETTER DDA;Lo;0;L;;;;;N;;;;; +11744;AHOM LETTER DDHA;Lo;0;L;;;;;N;;;;; +11745;AHOM LETTER NNA;Lo;0;L;;;;;N;;;;; +11746;AHOM LETTER LLA;Lo;0;L;;;;;N;;;;; 11800;DOGRA LETTER A;Lo;0;L;;;;;N;;;;; 11801;DOGRA LETTER AA;Lo;0;L;;;;;N;;;;; 11802;DOGRA LETTER I;Lo;0;L;;;;;N;;;;; @@ -20889,6 +21183,22 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 11AA0;SOYOMBO HEAD MARK WITH MOON AND SUN;Po;0;L;;;;;N;;;;; 11AA1;SOYOMBO TERMINAL MARK-1;Po;0;L;;;;;N;;;;; 11AA2;SOYOMBO TERMINAL MARK-2;Po;0;L;;;;;N;;;;; +11AB0;CANADIAN SYLLABICS NATTILIK HI;Lo;0;L;;;;;N;;;;; +11AB1;CANADIAN SYLLABICS NATTILIK HII;Lo;0;L;;;;;N;;;;; +11AB2;CANADIAN SYLLABICS NATTILIK HO;Lo;0;L;;;;;N;;;;; +11AB3;CANADIAN SYLLABICS NATTILIK HOO;Lo;0;L;;;;;N;;;;; +11AB4;CANADIAN SYLLABICS NATTILIK HA;Lo;0;L;;;;;N;;;;; +11AB5;CANADIAN SYLLABICS NATTILIK HAA;Lo;0;L;;;;;N;;;;; +11AB6;CANADIAN SYLLABICS NATTILIK SHRI;Lo;0;L;;;;;N;;;;; +11AB7;CANADIAN SYLLABICS NATTILIK SHRII;Lo;0;L;;;;;N;;;;; +11AB8;CANADIAN SYLLABICS NATTILIK SHRO;Lo;0;L;;;;;N;;;;; +11AB9;CANADIAN SYLLABICS NATTILIK SHROO;Lo;0;L;;;;;N;;;;; +11ABA;CANADIAN SYLLABICS NATTILIK SHRA;Lo;0;L;;;;;N;;;;; +11ABB;CANADIAN SYLLABICS NATTILIK SHRAA;Lo;0;L;;;;;N;;;;; +11ABC;CANADIAN SYLLABICS SPE;Lo;0;L;;;;;N;;;;; +11ABD;CANADIAN SYLLABICS SPI;Lo;0;L;;;;;N;;;;; +11ABE;CANADIAN SYLLABICS 
SPO;Lo;0;L;;;;;N;;;;; +11ABF;CANADIAN SYLLABICS SPA;Lo;0;L;;;;;N;;;;; 11AC0;PAU CIN HAU LETTER PA;Lo;0;L;;;;;N;;;;; 11AC1;PAU CIN HAU LETTER KA;Lo;0;L;;;;;N;;;;; 11AC2;PAU CIN HAU LETTER LA;Lo;0;L;;;;;N;;;;; @@ -22560,6 +22870,105 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 12541;CUNEIFORM SIGN ZA7;Lo;0;L;;;;;N;;;;; 12542;CUNEIFORM SIGN ZU OVER ZU PLUS SAR;Lo;0;L;;;;;N;;;;; 12543;CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU;Lo;0;L;;;;;N;;;;; +12F90;CYPRO-MINOAN SIGN CM001;Lo;0;L;;;;;N;;;;; +12F91;CYPRO-MINOAN SIGN CM002;Lo;0;L;;;;;N;;;;; +12F92;CYPRO-MINOAN SIGN CM004;Lo;0;L;;;;;N;;;;; +12F93;CYPRO-MINOAN SIGN CM005;Lo;0;L;;;;;N;;;;; +12F94;CYPRO-MINOAN SIGN CM006;Lo;0;L;;;;;N;;;;; +12F95;CYPRO-MINOAN SIGN CM007;Lo;0;L;;;;;N;;;;; +12F96;CYPRO-MINOAN SIGN CM008;Lo;0;L;;;;;N;;;;; +12F97;CYPRO-MINOAN SIGN CM009;Lo;0;L;;;;;N;;;;; +12F98;CYPRO-MINOAN SIGN CM010;Lo;0;L;;;;;N;;;;; +12F99;CYPRO-MINOAN SIGN CM011;Lo;0;L;;;;;N;;;;; +12F9A;CYPRO-MINOAN SIGN CM012;Lo;0;L;;;;;N;;;;; +12F9B;CYPRO-MINOAN SIGN CM012B;Lo;0;L;;;;;N;;;;; +12F9C;CYPRO-MINOAN SIGN CM013;Lo;0;L;;;;;N;;;;; +12F9D;CYPRO-MINOAN SIGN CM015;Lo;0;L;;;;;N;;;;; +12F9E;CYPRO-MINOAN SIGN CM017;Lo;0;L;;;;;N;;;;; +12F9F;CYPRO-MINOAN SIGN CM019;Lo;0;L;;;;;N;;;;; +12FA0;CYPRO-MINOAN SIGN CM021;Lo;0;L;;;;;N;;;;; +12FA1;CYPRO-MINOAN SIGN CM023;Lo;0;L;;;;;N;;;;; +12FA2;CYPRO-MINOAN SIGN CM024;Lo;0;L;;;;;N;;;;; +12FA3;CYPRO-MINOAN SIGN CM025;Lo;0;L;;;;;N;;;;; +12FA4;CYPRO-MINOAN SIGN CM026;Lo;0;L;;;;;N;;;;; +12FA5;CYPRO-MINOAN SIGN CM027;Lo;0;L;;;;;N;;;;; +12FA6;CYPRO-MINOAN SIGN CM028;Lo;0;L;;;;;N;;;;; +12FA7;CYPRO-MINOAN SIGN CM029;Lo;0;L;;;;;N;;;;; +12FA8;CYPRO-MINOAN SIGN CM030;Lo;0;L;;;;;N;;;;; +12FA9;CYPRO-MINOAN SIGN CM033;Lo;0;L;;;;;N;;;;; +12FAA;CYPRO-MINOAN SIGN CM034;Lo;0;L;;;;;N;;;;; +12FAB;CYPRO-MINOAN SIGN CM035;Lo;0;L;;;;;N;;;;; +12FAC;CYPRO-MINOAN SIGN CM036;Lo;0;L;;;;;N;;;;; +12FAD;CYPRO-MINOAN SIGN CM037;Lo;0;L;;;;;N;;;;; +12FAE;CYPRO-MINOAN SIGN CM038;Lo;0;L;;;;;N;;;;; +12FAF;CYPRO-MINOAN SIGN 
CM039;Lo;0;L;;;;;N;;;;; +12FB0;CYPRO-MINOAN SIGN CM040;Lo;0;L;;;;;N;;;;; +12FB1;CYPRO-MINOAN SIGN CM041;Lo;0;L;;;;;N;;;;; +12FB2;CYPRO-MINOAN SIGN CM044;Lo;0;L;;;;;N;;;;; +12FB3;CYPRO-MINOAN SIGN CM046;Lo;0;L;;;;;N;;;;; +12FB4;CYPRO-MINOAN SIGN CM047;Lo;0;L;;;;;N;;;;; +12FB5;CYPRO-MINOAN SIGN CM049;Lo;0;L;;;;;N;;;;; +12FB6;CYPRO-MINOAN SIGN CM050;Lo;0;L;;;;;N;;;;; +12FB7;CYPRO-MINOAN SIGN CM051;Lo;0;L;;;;;N;;;;; +12FB8;CYPRO-MINOAN SIGN CM052;Lo;0;L;;;;;N;;;;; +12FB9;CYPRO-MINOAN SIGN CM053;Lo;0;L;;;;;N;;;;; +12FBA;CYPRO-MINOAN SIGN CM054;Lo;0;L;;;;;N;;;;; +12FBB;CYPRO-MINOAN SIGN CM055;Lo;0;L;;;;;N;;;;; +12FBC;CYPRO-MINOAN SIGN CM056;Lo;0;L;;;;;N;;;;; +12FBD;CYPRO-MINOAN SIGN CM058;Lo;0;L;;;;;N;;;;; +12FBE;CYPRO-MINOAN SIGN CM059;Lo;0;L;;;;;N;;;;; +12FBF;CYPRO-MINOAN SIGN CM060;Lo;0;L;;;;;N;;;;; +12FC0;CYPRO-MINOAN SIGN CM061;Lo;0;L;;;;;N;;;;; +12FC1;CYPRO-MINOAN SIGN CM062;Lo;0;L;;;;;N;;;;; +12FC2;CYPRO-MINOAN SIGN CM063;Lo;0;L;;;;;N;;;;; +12FC3;CYPRO-MINOAN SIGN CM064;Lo;0;L;;;;;N;;;;; +12FC4;CYPRO-MINOAN SIGN CM066;Lo;0;L;;;;;N;;;;; +12FC5;CYPRO-MINOAN SIGN CM067;Lo;0;L;;;;;N;;;;; +12FC6;CYPRO-MINOAN SIGN CM068;Lo;0;L;;;;;N;;;;; +12FC7;CYPRO-MINOAN SIGN CM069;Lo;0;L;;;;;N;;;;; +12FC8;CYPRO-MINOAN SIGN CM070;Lo;0;L;;;;;N;;;;; +12FC9;CYPRO-MINOAN SIGN CM071;Lo;0;L;;;;;N;;;;; +12FCA;CYPRO-MINOAN SIGN CM072;Lo;0;L;;;;;N;;;;; +12FCB;CYPRO-MINOAN SIGN CM073;Lo;0;L;;;;;N;;;;; +12FCC;CYPRO-MINOAN SIGN CM074;Lo;0;L;;;;;N;;;;; +12FCD;CYPRO-MINOAN SIGN CM075;Lo;0;L;;;;;N;;;;; +12FCE;CYPRO-MINOAN SIGN CM075B;Lo;0;L;;;;;N;;;;; +12FCF;CYPRO-MINOAN SIGN CM076;Lo;0;L;;;;;N;;;;; +12FD0;CYPRO-MINOAN SIGN CM078;Lo;0;L;;;;;N;;;;; +12FD1;CYPRO-MINOAN SIGN CM079;Lo;0;L;;;;;N;;;;; +12FD2;CYPRO-MINOAN SIGN CM080;Lo;0;L;;;;;N;;;;; +12FD3;CYPRO-MINOAN SIGN CM081;Lo;0;L;;;;;N;;;;; +12FD4;CYPRO-MINOAN SIGN CM082;Lo;0;L;;;;;N;;;;; +12FD5;CYPRO-MINOAN SIGN CM083;Lo;0;L;;;;;N;;;;; +12FD6;CYPRO-MINOAN SIGN CM084;Lo;0;L;;;;;N;;;;; +12FD7;CYPRO-MINOAN SIGN CM085;Lo;0;L;;;;;N;;;;; 
+12FD8;CYPRO-MINOAN SIGN CM086;Lo;0;L;;;;;N;;;;; +12FD9;CYPRO-MINOAN SIGN CM087;Lo;0;L;;;;;N;;;;; +12FDA;CYPRO-MINOAN SIGN CM088;Lo;0;L;;;;;N;;;;; +12FDB;CYPRO-MINOAN SIGN CM089;Lo;0;L;;;;;N;;;;; +12FDC;CYPRO-MINOAN SIGN CM090;Lo;0;L;;;;;N;;;;; +12FDD;CYPRO-MINOAN SIGN CM091;Lo;0;L;;;;;N;;;;; +12FDE;CYPRO-MINOAN SIGN CM092;Lo;0;L;;;;;N;;;;; +12FDF;CYPRO-MINOAN SIGN CM094;Lo;0;L;;;;;N;;;;; +12FE0;CYPRO-MINOAN SIGN CM095;Lo;0;L;;;;;N;;;;; +12FE1;CYPRO-MINOAN SIGN CM096;Lo;0;L;;;;;N;;;;; +12FE2;CYPRO-MINOAN SIGN CM097;Lo;0;L;;;;;N;;;;; +12FE3;CYPRO-MINOAN SIGN CM098;Lo;0;L;;;;;N;;;;; +12FE4;CYPRO-MINOAN SIGN CM099;Lo;0;L;;;;;N;;;;; +12FE5;CYPRO-MINOAN SIGN CM100;Lo;0;L;;;;;N;;;;; +12FE6;CYPRO-MINOAN SIGN CM101;Lo;0;L;;;;;N;;;;; +12FE7;CYPRO-MINOAN SIGN CM102;Lo;0;L;;;;;N;;;;; +12FE8;CYPRO-MINOAN SIGN CM103;Lo;0;L;;;;;N;;;;; +12FE9;CYPRO-MINOAN SIGN CM104;Lo;0;L;;;;;N;;;;; +12FEA;CYPRO-MINOAN SIGN CM105;Lo;0;L;;;;;N;;;;; +12FEB;CYPRO-MINOAN SIGN CM107;Lo;0;L;;;;;N;;;;; +12FEC;CYPRO-MINOAN SIGN CM108;Lo;0;L;;;;;N;;;;; +12FED;CYPRO-MINOAN SIGN CM109;Lo;0;L;;;;;N;;;;; +12FEE;CYPRO-MINOAN SIGN CM110;Lo;0;L;;;;;N;;;;; +12FEF;CYPRO-MINOAN SIGN CM112;Lo;0;L;;;;;N;;;;; +12FF0;CYPRO-MINOAN SIGN CM114;Lo;0;L;;;;;N;;;;; +12FF1;CYPRO-MINOAN SIGN CM301;Po;0;L;;;;;N;;;;; +12FF2;CYPRO-MINOAN SIGN CM302;Po;0;L;;;;;N;;;;; 13000;EGYPTIAN HIEROGLYPH A001;Lo;0;L;;;;;N;;;;; 13001;EGYPTIAN HIEROGLYPH A002;Lo;0;L;;;;;N;;;;; 13002;EGYPTIAN HIEROGLYPH A003;Lo;0;L;;;;;N;;;;; @@ -24835,6 +25244,95 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 16A69;MRO DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 16A6E;MRO DANDA;Po;0;L;;;;;N;;;;; 16A6F;MRO DOUBLE DANDA;Po;0;L;;;;;N;;;;; +16A70;TANGSA LETTER OZ;Lo;0;L;;;;;N;;;;; +16A71;TANGSA LETTER OC;Lo;0;L;;;;;N;;;;; +16A72;TANGSA LETTER OQ;Lo;0;L;;;;;N;;;;; +16A73;TANGSA LETTER OX;Lo;0;L;;;;;N;;;;; +16A74;TANGSA LETTER AZ;Lo;0;L;;;;;N;;;;; +16A75;TANGSA LETTER AC;Lo;0;L;;;;;N;;;;; +16A76;TANGSA LETTER AQ;Lo;0;L;;;;;N;;;;; +16A77;TANGSA LETTER AX;Lo;0;L;;;;;N;;;;; 
+16A78;TANGSA LETTER VZ;Lo;0;L;;;;;N;;;;; +16A79;TANGSA LETTER VC;Lo;0;L;;;;;N;;;;; +16A7A;TANGSA LETTER VQ;Lo;0;L;;;;;N;;;;; +16A7B;TANGSA LETTER VX;Lo;0;L;;;;;N;;;;; +16A7C;TANGSA LETTER EZ;Lo;0;L;;;;;N;;;;; +16A7D;TANGSA LETTER EC;Lo;0;L;;;;;N;;;;; +16A7E;TANGSA LETTER EQ;Lo;0;L;;;;;N;;;;; +16A7F;TANGSA LETTER EX;Lo;0;L;;;;;N;;;;; +16A80;TANGSA LETTER IZ;Lo;0;L;;;;;N;;;;; +16A81;TANGSA LETTER IC;Lo;0;L;;;;;N;;;;; +16A82;TANGSA LETTER IQ;Lo;0;L;;;;;N;;;;; +16A83;TANGSA LETTER IX;Lo;0;L;;;;;N;;;;; +16A84;TANGSA LETTER UZ;Lo;0;L;;;;;N;;;;; +16A85;TANGSA LETTER UC;Lo;0;L;;;;;N;;;;; +16A86;TANGSA LETTER UQ;Lo;0;L;;;;;N;;;;; +16A87;TANGSA LETTER UX;Lo;0;L;;;;;N;;;;; +16A88;TANGSA LETTER AWZ;Lo;0;L;;;;;N;;;;; +16A89;TANGSA LETTER AWC;Lo;0;L;;;;;N;;;;; +16A8A;TANGSA LETTER AWQ;Lo;0;L;;;;;N;;;;; +16A8B;TANGSA LETTER AWX;Lo;0;L;;;;;N;;;;; +16A8C;TANGSA LETTER UIZ;Lo;0;L;;;;;N;;;;; +16A8D;TANGSA LETTER UIC;Lo;0;L;;;;;N;;;;; +16A8E;TANGSA LETTER UIQ;Lo;0;L;;;;;N;;;;; +16A8F;TANGSA LETTER UIX;Lo;0;L;;;;;N;;;;; +16A90;TANGSA LETTER FINAL NG;Lo;0;L;;;;;N;;;;; +16A91;TANGSA LETTER LONG UEX;Lo;0;L;;;;;N;;;;; +16A92;TANGSA LETTER SHORT UEZ;Lo;0;L;;;;;N;;;;; +16A93;TANGSA LETTER SHORT AWX;Lo;0;L;;;;;N;;;;; +16A94;TANGSA LETTER UEC;Lo;0;L;;;;;N;;;;; +16A95;TANGSA LETTER UEZ;Lo;0;L;;;;;N;;;;; +16A96;TANGSA LETTER UEQ;Lo;0;L;;;;;N;;;;; +16A97;TANGSA LETTER UEX;Lo;0;L;;;;;N;;;;; +16A98;TANGSA LETTER UIUZ;Lo;0;L;;;;;N;;;;; +16A99;TANGSA LETTER UIUC;Lo;0;L;;;;;N;;;;; +16A9A;TANGSA LETTER UIUQ;Lo;0;L;;;;;N;;;;; +16A9B;TANGSA LETTER UIUX;Lo;0;L;;;;;N;;;;; +16A9C;TANGSA LETTER MZ;Lo;0;L;;;;;N;;;;; +16A9D;TANGSA LETTER MC;Lo;0;L;;;;;N;;;;; +16A9E;TANGSA LETTER MQ;Lo;0;L;;;;;N;;;;; +16A9F;TANGSA LETTER MX;Lo;0;L;;;;;N;;;;; +16AA0;TANGSA LETTER KA;Lo;0;L;;;;;N;;;;; +16AA1;TANGSA LETTER KHA;Lo;0;L;;;;;N;;;;; +16AA2;TANGSA LETTER GA;Lo;0;L;;;;;N;;;;; +16AA3;TANGSA LETTER NGA;Lo;0;L;;;;;N;;;;; +16AA4;TANGSA LETTER SA;Lo;0;L;;;;;N;;;;; +16AA5;TANGSA LETTER YA;Lo;0;L;;;;;N;;;;; +16AA6;TANGSA 
LETTER WA;Lo;0;L;;;;;N;;;;; +16AA7;TANGSA LETTER PA;Lo;0;L;;;;;N;;;;; +16AA8;TANGSA LETTER NYA;Lo;0;L;;;;;N;;;;; +16AA9;TANGSA LETTER PHA;Lo;0;L;;;;;N;;;;; +16AAA;TANGSA LETTER BA;Lo;0;L;;;;;N;;;;; +16AAB;TANGSA LETTER MA;Lo;0;L;;;;;N;;;;; +16AAC;TANGSA LETTER NA;Lo;0;L;;;;;N;;;;; +16AAD;TANGSA LETTER HA;Lo;0;L;;;;;N;;;;; +16AAE;TANGSA LETTER LA;Lo;0;L;;;;;N;;;;; +16AAF;TANGSA LETTER HTA;Lo;0;L;;;;;N;;;;; +16AB0;TANGSA LETTER TA;Lo;0;L;;;;;N;;;;; +16AB1;TANGSA LETTER DA;Lo;0;L;;;;;N;;;;; +16AB2;TANGSA LETTER RA;Lo;0;L;;;;;N;;;;; +16AB3;TANGSA LETTER NHA;Lo;0;L;;;;;N;;;;; +16AB4;TANGSA LETTER SHA;Lo;0;L;;;;;N;;;;; +16AB5;TANGSA LETTER CA;Lo;0;L;;;;;N;;;;; +16AB6;TANGSA LETTER TSA;Lo;0;L;;;;;N;;;;; +16AB7;TANGSA LETTER GHA;Lo;0;L;;;;;N;;;;; +16AB8;TANGSA LETTER HTTA;Lo;0;L;;;;;N;;;;; +16AB9;TANGSA LETTER THA;Lo;0;L;;;;;N;;;;; +16ABA;TANGSA LETTER XA;Lo;0;L;;;;;N;;;;; +16ABB;TANGSA LETTER FA;Lo;0;L;;;;;N;;;;; +16ABC;TANGSA LETTER DHA;Lo;0;L;;;;;N;;;;; +16ABD;TANGSA LETTER CHA;Lo;0;L;;;;;N;;;;; +16ABE;TANGSA LETTER ZA;Lo;0;L;;;;;N;;;;; +16AC0;TANGSA DIGIT ZERO;Nd;0;L;;0;0;0;N;;;;; +16AC1;TANGSA DIGIT ONE;Nd;0;L;;1;1;1;N;;;;; +16AC2;TANGSA DIGIT TWO;Nd;0;L;;2;2;2;N;;;;; +16AC3;TANGSA DIGIT THREE;Nd;0;L;;3;3;3;N;;;;; +16AC4;TANGSA DIGIT FOUR;Nd;0;L;;4;4;4;N;;;;; +16AC5;TANGSA DIGIT FIVE;Nd;0;L;;5;5;5;N;;;;; +16AC6;TANGSA DIGIT SIX;Nd;0;L;;6;6;6;N;;;;; +16AC7;TANGSA DIGIT SEVEN;Nd;0;L;;7;7;7;N;;;;; +16AC8;TANGSA DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; +16AC9;TANGSA DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 16AD0;BASSA VAH LETTER ENNI;Lo;0;L;;;;;N;;;;; 16AD1;BASSA VAH LETTER KA;Lo;0;L;;;;;N;;;;; 16AD2;BASSA VAH LETTER SE;Lo;0;L;;;;;N;;;;; @@ -26487,6 +26985,19 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 18CD5;KHITAN SMALL SCRIPT CHARACTER-18CD5;Lo;0;L;;;;;N;;;;; 18D00;;Lo;0;L;;;;;N;;;;; 18D08;;Lo;0;L;;;;;N;;;;; +1AFF0;KATAKANA LETTER MINNAN TONE-2;Lm;0;L;;;;;N;;;;; +1AFF1;KATAKANA LETTER MINNAN TONE-3;Lm;0;L;;;;;N;;;;; +1AFF2;KATAKANA LETTER MINNAN TONE-4;Lm;0;L;;;;;N;;;;; 
+1AFF3;KATAKANA LETTER MINNAN TONE-5;Lm;0;L;;;;;N;;;;; +1AFF5;KATAKANA LETTER MINNAN TONE-7;Lm;0;L;;;;;N;;;;; +1AFF6;KATAKANA LETTER MINNAN TONE-8;Lm;0;L;;;;;N;;;;; +1AFF7;KATAKANA LETTER MINNAN NASALIZED TONE-1;Lm;0;L;;;;;N;;;;; +1AFF8;KATAKANA LETTER MINNAN NASALIZED TONE-2;Lm;0;L;;;;;N;;;;; +1AFF9;KATAKANA LETTER MINNAN NASALIZED TONE-3;Lm;0;L;;;;;N;;;;; +1AFFA;KATAKANA LETTER MINNAN NASALIZED TONE-4;Lm;0;L;;;;;N;;;;; +1AFFB;KATAKANA LETTER MINNAN NASALIZED TONE-5;Lm;0;L;;;;;N;;;;; +1AFFD;KATAKANA LETTER MINNAN NASALIZED TONE-7;Lm;0;L;;;;;N;;;;; +1AFFE;KATAKANA LETTER MINNAN NASALIZED TONE-8;Lm;0;L;;;;;N;;;;; 1B000;KATAKANA LETTER ARCHAIC E;Lo;0;L;;;;;N;;;;; 1B001;HIRAGANA LETTER ARCHAIC YE;Lo;0;L;;;;;N;;;;; 1B002;HENTAIGANA LETTER A-1;Lo;0;L;;;;;N;;;;; @@ -26774,6 +27285,10 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1B11C;HENTAIGANA LETTER WO-7;Lo;0;L;;;;;N;;;;; 1B11D;HENTAIGANA LETTER N-MU-MO-1;Lo;0;L;;;;;N;;;;; 1B11E;HENTAIGANA LETTER N-MU-MO-2;Lo;0;L;;;;;N;;;;; +1B11F;HIRAGANA LETTER ARCHAIC WU;Lo;0;L;;;;;N;;;;; +1B120;KATAKANA LETTER ARCHAIC YI;Lo;0;L;;;;;N;;;;; +1B121;KATAKANA LETTER ARCHAIC YE;Lo;0;L;;;;;N;;;;; +1B122;KATAKANA LETTER ARCHAIC WU;Lo;0;L;;;;;N;;;;; 1B150;HIRAGANA LETTER SMALL WI;Lo;0;L;;;;;N;;;;; 1B151;HIRAGANA LETTER SMALL WE;Lo;0;L;;;;;N;;;;; 1B152;HIRAGANA LETTER SMALL WO;Lo;0;L;;;;;N;;;;; @@ -27324,6 +27839,191 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1BCA1;SHORTHAND FORMAT CONTINUING OVERLAP;Cf;0;BN;;;;;N;;;;; 1BCA2;SHORTHAND FORMAT DOWN STEP;Cf;0;BN;;;;;N;;;;; 1BCA3;SHORTHAND FORMAT UP STEP;Cf;0;BN;;;;;N;;;;; +1CF00;ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF01;ZNAMENNY COMBINING MARK NIZKO S KRYZHEM ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF02;ZNAMENNY COMBINING MARK TSATA ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF03;ZNAMENNY COMBINING MARK GORAZDO NIZKO ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF04;ZNAMENNY COMBINING MARK NIZKO ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF05;ZNAMENNY COMBINING MARK SREDNE ON 
LEFT;Mn;0;NSM;;;;;N;;;;; +1CF06;ZNAMENNY COMBINING MARK MALO POVYSHE ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF07;ZNAMENNY COMBINING MARK POVYSHE ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF08;ZNAMENNY COMBINING MARK VYSOKO ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF09;ZNAMENNY COMBINING MARK MALO POVYSHE S KHOKHLOM ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF0A;ZNAMENNY COMBINING MARK POVYSHE S KHOKHLOM ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF0B;ZNAMENNY COMBINING MARK VYSOKO S KHOKHLOM ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF0C;ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF0D;ZNAMENNY COMBINING MARK NIZKO S KRYZHEM ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF0E;ZNAMENNY COMBINING MARK TSATA ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF0F;ZNAMENNY COMBINING MARK GORAZDO NIZKO ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF10;ZNAMENNY COMBINING MARK NIZKO ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF11;ZNAMENNY COMBINING MARK SREDNE ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF12;ZNAMENNY COMBINING MARK MALO POVYSHE ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF13;ZNAMENNY COMBINING MARK POVYSHE ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF14;ZNAMENNY COMBINING MARK VYSOKO ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF15;ZNAMENNY COMBINING MARK MALO POVYSHE S KHOKHLOM ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF16;ZNAMENNY COMBINING MARK POVYSHE S KHOKHLOM ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF17;ZNAMENNY COMBINING MARK VYSOKO S KHOKHLOM ON RIGHT;Mn;0;NSM;;;;;N;;;;; +1CF18;ZNAMENNY COMBINING MARK TSATA S KRYZHEM;Mn;0;NSM;;;;;N;;;;; +1CF19;ZNAMENNY COMBINING MARK MALO POVYSHE S KRYZHEM;Mn;0;NSM;;;;;N;;;;; +1CF1A;ZNAMENNY COMBINING MARK STRANNO MALO POVYSHE;Mn;0;NSM;;;;;N;;;;; +1CF1B;ZNAMENNY COMBINING MARK POVYSHE S KRYZHEM;Mn;0;NSM;;;;;N;;;;; +1CF1C;ZNAMENNY COMBINING MARK POVYSHE STRANNO;Mn;0;NSM;;;;;N;;;;; +1CF1D;ZNAMENNY COMBINING MARK VYSOKO S KRYZHEM;Mn;0;NSM;;;;;N;;;;; +1CF1E;ZNAMENNY COMBINING MARK MALO POVYSHE STRANNO;Mn;0;NSM;;;;;N;;;;; +1CF1F;ZNAMENNY COMBINING MARK GORAZDO VYSOKO;Mn;0;NSM;;;;;N;;;;; +1CF20;ZNAMENNY COMBINING MARK ZELO;Mn;0;NSM;;;;;N;;;;; +1CF21;ZNAMENNY COMBINING MARK 
ON;Mn;0;NSM;;;;;N;;;;; +1CF22;ZNAMENNY COMBINING MARK RAVNO;Mn;0;NSM;;;;;N;;;;; +1CF23;ZNAMENNY COMBINING MARK TIKHAYA;Mn;0;NSM;;;;;N;;;;; +1CF24;ZNAMENNY COMBINING MARK BORZAYA;Mn;0;NSM;;;;;N;;;;; +1CF25;ZNAMENNY COMBINING MARK UDARKA;Mn;0;NSM;;;;;N;;;;; +1CF26;ZNAMENNY COMBINING MARK PODVERTKA;Mn;0;NSM;;;;;N;;;;; +1CF27;ZNAMENNY COMBINING MARK LOMKA;Mn;0;NSM;;;;;N;;;;; +1CF28;ZNAMENNY COMBINING MARK KUPNAYA;Mn;0;NSM;;;;;N;;;;; +1CF29;ZNAMENNY COMBINING MARK KACHKA;Mn;0;NSM;;;;;N;;;;; +1CF2A;ZNAMENNY COMBINING MARK ZEVOK;Mn;0;NSM;;;;;N;;;;; +1CF2B;ZNAMENNY COMBINING MARK SKOBA;Mn;0;NSM;;;;;N;;;;; +1CF2C;ZNAMENNY COMBINING MARK RAZSEKA;Mn;0;NSM;;;;;N;;;;; +1CF2D;ZNAMENNY COMBINING MARK KRYZH ON LEFT;Mn;0;NSM;;;;;N;;;;; +1CF30;ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO;Mn;0;NSM;;;;;N;;;;; +1CF31;ZNAMENNY COMBINING TONAL RANGE MARK SVETLO;Mn;0;NSM;;;;;N;;;;; +1CF32;ZNAMENNY COMBINING TONAL RANGE MARK TRESVETLO;Mn;0;NSM;;;;;N;;;;; +1CF33;ZNAMENNY COMBINING MARK ZADERZHKA;Mn;0;NSM;;;;;N;;;;; +1CF34;ZNAMENNY COMBINING MARK DEMESTVENNY ZADERZHKA;Mn;0;NSM;;;;;N;;;;; +1CF35;ZNAMENNY COMBINING MARK OTSECHKA;Mn;0;NSM;;;;;N;;;;; +1CF36;ZNAMENNY COMBINING MARK PODCHASHIE;Mn;0;NSM;;;;;N;;;;; +1CF37;ZNAMENNY COMBINING MARK PODCHASHIE WITH VERTICAL STROKE;Mn;0;NSM;;;;;N;;;;; +1CF38;ZNAMENNY COMBINING MARK CHASHKA;Mn;0;NSM;;;;;N;;;;; +1CF39;ZNAMENNY COMBINING MARK CHASHKA POLNAYA;Mn;0;NSM;;;;;N;;;;; +1CF3A;ZNAMENNY COMBINING MARK OBLACHKO;Mn;0;NSM;;;;;N;;;;; +1CF3B;ZNAMENNY COMBINING MARK SOROCHYA NOZHKA;Mn;0;NSM;;;;;N;;;;; +1CF3C;ZNAMENNY COMBINING MARK TOCHKA;Mn;0;NSM;;;;;N;;;;; +1CF3D;ZNAMENNY COMBINING MARK DVOETOCHIE;Mn;0;NSM;;;;;N;;;;; +1CF3E;ZNAMENNY COMBINING ATTACHING VERTICAL OMET;Mn;0;NSM;;;;;N;;;;; +1CF3F;ZNAMENNY COMBINING MARK CURVED OMET;Mn;0;NSM;;;;;N;;;;; +1CF40;ZNAMENNY COMBINING MARK KRYZH;Mn;0;NSM;;;;;N;;;;; +1CF41;ZNAMENNY COMBINING LOWER TONAL RANGE INDICATOR;Mn;0;NSM;;;;;N;;;;; +1CF42;ZNAMENNY PRIZNAK MODIFIER LEVEL-2;Mn;0;NSM;;;;;N;;;;; +1CF43;ZNAMENNY 
PRIZNAK MODIFIER LEVEL-3;Mn;0;NSM;;;;;N;;;;; +1CF44;ZNAMENNY PRIZNAK MODIFIER DIRECTION FLIP;Mn;0;NSM;;;;;N;;;;; +1CF45;ZNAMENNY PRIZNAK MODIFIER KRYZH;Mn;0;NSM;;;;;N;;;;; +1CF46;ZNAMENNY PRIZNAK MODIFIER ROG;Mn;0;NSM;;;;;N;;;;; +1CF50;ZNAMENNY NEUME KRYUK;So;0;L;;;;;N;;;;; +1CF51;ZNAMENNY NEUME KRYUK TIKHY;So;0;L;;;;;N;;;;; +1CF52;ZNAMENNY NEUME PARAKLIT;So;0;L;;;;;N;;;;; +1CF53;ZNAMENNY NEUME DVA V CHELNU;So;0;L;;;;;N;;;;; +1CF54;ZNAMENNY NEUME KLYUCH;So;0;L;;;;;N;;;;; +1CF55;ZNAMENNY NEUME ZANOZHEK;So;0;L;;;;;N;;;;; +1CF56;ZNAMENNY NEUME STOPITSA;So;0;L;;;;;N;;;;; +1CF57;ZNAMENNY NEUME STOPITSA S OCHKOM;So;0;L;;;;;N;;;;; +1CF58;ZNAMENNY NEUME PEREVODKA;So;0;L;;;;;N;;;;; +1CF59;ZNAMENNY NEUME PEREVODKA NEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF5A;ZNAMENNY NEUME STOPITSA WITH SOROCHYA NOZHKA;So;0;L;;;;;N;;;;; +1CF5B;ZNAMENNY NEUME CHELYUSTKA;So;0;L;;;;;N;;;;; +1CF5C;ZNAMENNY NEUME PALKA;So;0;L;;;;;N;;;;; +1CF5D;ZNAMENNY NEUME ZAPYATAYA;So;0;L;;;;;N;;;;; +1CF5E;ZNAMENNY NEUME GOLUBCHIK BORZY;So;0;L;;;;;N;;;;; +1CF5F;ZNAMENNY NEUME GOLUBCHIK TIKHY;So;0;L;;;;;N;;;;; +1CF60;ZNAMENNY NEUME GOLUBCHIK MRACHNY;So;0;L;;;;;N;;;;; +1CF61;ZNAMENNY NEUME GOLUBCHIK SVETLY;So;0;L;;;;;N;;;;; +1CF62;ZNAMENNY NEUME GOLUBCHIK TRESVETLY;So;0;L;;;;;N;;;;; +1CF63;ZNAMENNY NEUME VRAKHIYA PROSTAYA;So;0;L;;;;;N;;;;; +1CF64;ZNAMENNY NEUME VRAKHIYA MRACHNAYA;So;0;L;;;;;N;;;;; +1CF65;ZNAMENNY NEUME VRAKHIYA SVETLAYA;So;0;L;;;;;N;;;;; +1CF66;ZNAMENNY NEUME VRAKHIYA TRESVETLAYA;So;0;L;;;;;N;;;;; +1CF67;ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA PROSTAYA;So;0;L;;;;;N;;;;; +1CF68;ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA MRACHNAYA;So;0;L;;;;;N;;;;; +1CF69;ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA SVETLAYA;So;0;L;;;;;N;;;;; +1CF6A;ZNAMENNY NEUME VRAKHIYA KLYUCHEVAYA TRESVETLAYA;So;0;L;;;;;N;;;;; +1CF6B;ZNAMENNY NEUME DOUBLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CF6C;ZNAMENNY NEUME REVERSED CHELYUSTKA;So;0;L;;;;;N;;;;; +1CF6D;ZNAMENNY NEUME DERBITSA;So;0;L;;;;;N;;;;; +1CF6E;ZNAMENNY NEUME KHAMILO;So;0;L;;;;;N;;;;; 
+1CF6F;ZNAMENNY NEUME CHASHKA;So;0;L;;;;;N;;;;; +1CF70;ZNAMENNY NEUME PODCHASHIE;So;0;L;;;;;N;;;;; +1CF71;ZNAMENNY NEUME SKAMEYTSA MRACHNAYA;So;0;L;;;;;N;;;;; +1CF72;ZNAMENNY NEUME SKAMEYTSA SVETLAYA;So;0;L;;;;;N;;;;; +1CF73;ZNAMENNY NEUME SKAMEYTSA TRESVETLAYA;So;0;L;;;;;N;;;;; +1CF74;ZNAMENNY NEUME SKAMEYTSA TIKHAYA;So;0;L;;;;;N;;;;; +1CF75;ZNAMENNY NEUME DEMESTVENNY KLYUCH;So;0;L;;;;;N;;;;; +1CF76;ZNAMENNY NEUME SKAMEYTSA KLYUCHEVAYA SVETLAYA;So;0;L;;;;;N;;;;; +1CF77;ZNAMENNY NEUME SKAMEYTSA KLYUCHENEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF78;ZNAMENNY NEUME SKAMEYTSA KLYUCHEVAYA TIKHAYA;So;0;L;;;;;N;;;;; +1CF79;ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA PROSTAYA;So;0;L;;;;;N;;;;; +1CF7A;ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA SVETLAYA;So;0;L;;;;;N;;;;; +1CF7B;ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA NEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF7C;ZNAMENNY NEUME SKAMEYTSA DVOECHELNAYA KLYUCHEVAYA;So;0;L;;;;;N;;;;; +1CF7D;ZNAMENNY NEUME SLOZHITIE;So;0;L;;;;;N;;;;; +1CF7E;ZNAMENNY NEUME SLOZHITIE S ZAPYATOY;So;0;L;;;;;N;;;;; +1CF7F;ZNAMENNY NEUME SLOZHITIE ZAKRYTOE;So;0;L;;;;;N;;;;; +1CF80;ZNAMENNY NEUME SLOZHITIE S KRYZHEM;So;0;L;;;;;N;;;;; +1CF81;ZNAMENNY NEUME KRYZH;So;0;L;;;;;N;;;;; +1CF82;ZNAMENNY NEUME ROG;So;0;L;;;;;N;;;;; +1CF83;ZNAMENNY NEUME FITA;So;0;L;;;;;N;;;;; +1CF84;ZNAMENNY NEUME KOBYLA;So;0;L;;;;;N;;;;; +1CF85;ZNAMENNY NEUME ZMEYTSA;So;0;L;;;;;N;;;;; +1CF86;ZNAMENNY NEUME STATYA;So;0;L;;;;;N;;;;; +1CF87;ZNAMENNY NEUME STATYA S ZAPYATOY;So;0;L;;;;;N;;;;; +1CF88;ZNAMENNY NEUME STATYA S KRYZHEM;So;0;L;;;;;N;;;;; +1CF89;ZNAMENNY NEUME STATYA S ZAPYATOY I KRYZHEM;So;0;L;;;;;N;;;;; +1CF8A;ZNAMENNY NEUME STATYA S KRYZHEM I ZAPYATOY;So;0;L;;;;;N;;;;; +1CF8B;ZNAMENNY NEUME STATYA ZAKRYTAYA;So;0;L;;;;;N;;;;; +1CF8C;ZNAMENNY NEUME STATYA ZAKRYTAYA S ZAPYATOY;So;0;L;;;;;N;;;;; +1CF8D;ZNAMENNY NEUME STATYA S ROGOM;So;0;L;;;;;N;;;;; +1CF8E;ZNAMENNY NEUME STATYA S DVUMYA ZAPYATYMI;So;0;L;;;;;N;;;;; +1CF8F;ZNAMENNY NEUME STATYA S ZAPYATOY I PODCHASHIEM;So;0;L;;;;;N;;;;; +1CF90;ZNAMENNY 
NEUME POLKULIZMY;So;0;L;;;;;N;;;;; +1CF91;ZNAMENNY NEUME STATYA NEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF92;ZNAMENNY NEUME STRELA PROSTAYA;So;0;L;;;;;N;;;;; +1CF93;ZNAMENNY NEUME STRELA MRACHNOTIKHAYA;So;0;L;;;;;N;;;;; +1CF94;ZNAMENNY NEUME STRELA KRYZHEVAYA;So;0;L;;;;;N;;;;; +1CF95;ZNAMENNY NEUME STRELA POLUPOVODNAYA;So;0;L;;;;;N;;;;; +1CF96;ZNAMENNY NEUME STRELA POVODNAYA;So;0;L;;;;;N;;;;; +1CF97;ZNAMENNY NEUME STRELA NEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF98;ZNAMENNY NEUME STRELA KLYUCHEPOVODNAYA;So;0;L;;;;;N;;;;; +1CF99;ZNAMENNY NEUME STRELA KLYUCHENEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CF9A;ZNAMENNY NEUME STRELA TIKHAYA PUTNAYA;So;0;L;;;;;N;;;;; +1CF9B;ZNAMENNY NEUME STRELA DVOECHELNAYA;So;0;L;;;;;N;;;;; +1CF9C;ZNAMENNY NEUME STRELA DVOECHELNOKRYZHEVAYA;So;0;L;;;;;N;;;;; +1CF9D;ZNAMENNY NEUME STRELA DVOECHELNOPOVODNAYA;So;0;L;;;;;N;;;;; +1CF9E;ZNAMENNY NEUME STRELA DVOECHELNAYA KLYUCHEVAYA;So;0;L;;;;;N;;;;; +1CF9F;ZNAMENNY NEUME STRELA DVOECHELNOPOVODNAYA KLYUCHEVAYA;So;0;L;;;;;N;;;;; +1CFA0;ZNAMENNY NEUME STRELA GROMNAYA WITH SINGLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFA1;ZNAMENNY NEUME STRELA GROMOPOVODNAYA WITH SINGLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFA2;ZNAMENNY NEUME STRELA GROMNAYA;So;0;L;;;;;N;;;;; +1CFA3;ZNAMENNY NEUME STRELA GROMOPOVODNAYA;So;0;L;;;;;N;;;;; +1CFA4;ZNAMENNY NEUME STRELA GROMOPOVODNAYA WITH DOUBLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFA5;ZNAMENNY NEUME STRELA GROMOKRYZHEVAYA;So;0;L;;;;;N;;;;; +1CFA6;ZNAMENNY NEUME STRELA GROMOKRYZHEVAYA POVODNAYA;So;0;L;;;;;N;;;;; +1CFA7;ZNAMENNY NEUME MECHIK;So;0;L;;;;;N;;;;; +1CFA8;ZNAMENNY NEUME MECHIK POVODNY;So;0;L;;;;;N;;;;; +1CFA9;ZNAMENNY NEUME MECHIK KLYUCHEVOY;So;0;L;;;;;N;;;;; +1CFAA;ZNAMENNY NEUME MECHIK KLYUCHEPOVODNY;So;0;L;;;;;N;;;;; +1CFAB;ZNAMENNY NEUME MECHIK KLYUCHENEPOSTOYANNY;So;0;L;;;;;N;;;;; +1CFAC;ZNAMENNY NEUME STRELA TRYASOGLASNAYA;So;0;L;;;;;N;;;;; +1CFAD;ZNAMENNY NEUME STRELA TRYASOPOVODNAYA;So;0;L;;;;;N;;;;; +1CFAE;ZNAMENNY NEUME STRELA TRYASOSTRELNAYA;So;0;L;;;;;N;;;;; +1CFAF;ZNAMENNY NEUME 
OSOKA;So;0;L;;;;;N;;;;; +1CFB0;ZNAMENNY NEUME OSOKA SVETLAYA;So;0;L;;;;;N;;;;; +1CFB1;ZNAMENNY NEUME OSOKA TRESVETLAYA;So;0;L;;;;;N;;;;; +1CFB2;ZNAMENNY NEUME OSOKA KRYUKOVAYA SVETLAYA;So;0;L;;;;;N;;;;; +1CFB3;ZNAMENNY NEUME OSOKA KLYUCHEVAYA SVETLAYA;So;0;L;;;;;N;;;;; +1CFB4;ZNAMENNY NEUME OSOKA KLYUCHEVAYA NEPOSTOYANNAYA;So;0;L;;;;;N;;;;; +1CFB5;ZNAMENNY NEUME STRELA KRYUKOVAYA;So;0;L;;;;;N;;;;; +1CFB6;ZNAMENNY NEUME STRELA KRYUKOVAYA POVODNAYA;So;0;L;;;;;N;;;;; +1CFB7;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMNAYA WITH SINGLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFB8;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA WITH SINGLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFB9;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMNAYA;So;0;L;;;;;N;;;;; +1CFBA;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA;So;0;L;;;;;N;;;;; +1CFBB;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOPOVODNAYA WITH DOUBLE ZAPYATAYA;So;0;L;;;;;N;;;;; +1CFBC;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOKRYZHEVAYA;So;0;L;;;;;N;;;;; +1CFBD;ZNAMENNY NEUME STRELA KRYUKOVAYA GROMOKRYZHEVAYA POVODNAYA;So;0;L;;;;;N;;;;; +1CFBE;ZNAMENNY NEUME STRELA KRYUKOVAYA TRYASKA;So;0;L;;;;;N;;;;; +1CFBF;ZNAMENNY NEUME KUFISMA;So;0;L;;;;;N;;;;; +1CFC0;ZNAMENNY NEUME OBLAKO;So;0;L;;;;;N;;;;; +1CFC1;ZNAMENNY NEUME DUDA;So;0;L;;;;;N;;;;; +1CFC2;ZNAMENNY NEUME NEMKA;So;0;L;;;;;N;;;;; +1CFC3;ZNAMENNY NEUME PAUK;So;0;L;;;;;N;;;;; 1D000;BYZANTINE MUSICAL SYMBOL PSILI;So;0;L;;;;;N;;;;; 1D001;BYZANTINE MUSICAL SYMBOL DASEIA;So;0;L;;;;;N;;;;; 1D002;BYZANTINE MUSICAL SYMBOL PERISPOMENI;So;0;L;;;;;N;;;;; @@ -27801,6 +28501,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1D1E6;MUSICAL SYMBOL KIEVAN EIGHTH NOTE STEM DOWN;So;0;L;;;;;N;;;;; 1D1E7;MUSICAL SYMBOL KIEVAN EIGHTH NOTE STEM UP;So;0;L;;;;;N;;;;; 1D1E8;MUSICAL SYMBOL KIEVAN FLAT SIGN;So;0;L;;;;;N;;;;; +1D1E9;MUSICAL SYMBOL SORI;So;0;ON;;;;;N;;;;; +1D1EA;MUSICAL SYMBOL KORON;So;0;ON;;;;;N;;;;; 1D200;GREEK VOCAL NOTATION SYMBOL-1;So;0;ON;;;;;N;;;;; 1D201;GREEK VOCAL NOTATION SYMBOL-2;So;0;ON;;;;;N;;;;; 1D202;GREEK VOCAL 
NOTATION SYMBOL-3;So;0;ON;;;;;N;;;;; @@ -29671,6 +30373,37 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1DAAD;SIGNWRITING ROTATION MODIFIER-14;Mn;0;NSM;;;;;N;;;;; 1DAAE;SIGNWRITING ROTATION MODIFIER-15;Mn;0;NSM;;;;;N;;;;; 1DAAF;SIGNWRITING ROTATION MODIFIER-16;Mn;0;NSM;;;;;N;;;;; +1DF00;LATIN SMALL LETTER FENG DIGRAPH WITH TRILL;Ll;0;L;;;;;N;;;;; +1DF01;LATIN SMALL LETTER REVERSED SCRIPT G;Ll;0;L;;;;;N;;;;; +1DF02;LATIN LETTER SMALL CAPITAL TURNED G;Ll;0;L;;;;;N;;;;; +1DF03;LATIN SMALL LETTER REVERSED K;Ll;0;L;;;;;N;;;;; +1DF04;LATIN LETTER SMALL CAPITAL L WITH BELT;Ll;0;L;;;;;N;;;;; +1DF05;LATIN SMALL LETTER LEZH WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF06;LATIN SMALL LETTER TURNED Y WITH BELT;Ll;0;L;;;;;N;;;;; +1DF07;LATIN SMALL LETTER REVERSED ENG;Ll;0;L;;;;;N;;;;; +1DF08;LATIN SMALL LETTER TURNED R WITH LONG LEG AND RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF09;LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF0A;LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK;Lo;0;L;;;;;N;;;;; +1DF0B;LATIN SMALL LETTER ESH WITH DOUBLE BAR;Ll;0;L;;;;;N;;;;; +1DF0C;LATIN SMALL LETTER ESH WITH DOUBLE BAR AND CURL;Ll;0;L;;;;;N;;;;; +1DF0D;LATIN SMALL LETTER TURNED T WITH CURL;Ll;0;L;;;;;N;;;;; +1DF0E;LATIN LETTER INVERTED GLOTTAL STOP WITH CURL;Ll;0;L;;;;;N;;;;; +1DF0F;LATIN LETTER STRETCHED C WITH CURL;Ll;0;L;;;;;N;;;;; +1DF10;LATIN LETTER SMALL CAPITAL TURNED K;Ll;0;L;;;;;N;;;;; +1DF11;LATIN SMALL LETTER L WITH FISHHOOK;Ll;0;L;;;;;N;;;;; +1DF12;LATIN SMALL LETTER DEZH DIGRAPH WITH PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF13;LATIN SMALL LETTER L WITH BELT AND PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF14;LATIN SMALL LETTER ENG WITH PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF15;LATIN SMALL LETTER TURNED R WITH PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF16;LATIN SMALL LETTER R WITH FISHHOOK AND PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF17;LATIN SMALL LETTER TESH DIGRAPH WITH PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF18;LATIN SMALL LETTER EZH WITH PALATAL HOOK;Ll;0;L;;;;;N;;;;; +1DF19;LATIN SMALL LETTER 
DEZH DIGRAPH WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF1A;LATIN SMALL LETTER I WITH STROKE AND RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF1B;LATIN SMALL LETTER O WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF1C;LATIN SMALL LETTER TESH DIGRAPH WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF1D;LATIN SMALL LETTER C WITH RETROFLEX HOOK;Ll;0;L;;;;;N;;;;; +1DF1E;LATIN SMALL LETTER S WITH CURL;Ll;0;L;;;;;N;;;;; 1E000;COMBINING GLAGOLITIC LETTER AZU;Mn;230;NSM;;;;;N;;;;; 1E001;COMBINING GLAGOLITIC LETTER BUKY;Mn;230;NSM;;;;;N;;;;; 1E002;COMBINING GLAGOLITIC LETTER VEDE;Mn;230;NSM;;;;;N;;;;; @@ -29780,6 +30513,37 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1E149;NYIAKENG PUACHUE HMONG DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 1E14E;NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ;Lo;0;L;;;;;N;;;;; 1E14F;NYIAKENG PUACHUE HMONG CIRCLED CA;So;0;L;;;;;N;;;;; +1E290;TOTO LETTER PA;Lo;0;L;;;;;N;;;;; +1E291;TOTO LETTER BA;Lo;0;L;;;;;N;;;;; +1E292;TOTO LETTER TA;Lo;0;L;;;;;N;;;;; +1E293;TOTO LETTER DA;Lo;0;L;;;;;N;;;;; +1E294;TOTO LETTER KA;Lo;0;L;;;;;N;;;;; +1E295;TOTO LETTER GA;Lo;0;L;;;;;N;;;;; +1E296;TOTO LETTER MA;Lo;0;L;;;;;N;;;;; +1E297;TOTO LETTER NA;Lo;0;L;;;;;N;;;;; +1E298;TOTO LETTER NGA;Lo;0;L;;;;;N;;;;; +1E299;TOTO LETTER SA;Lo;0;L;;;;;N;;;;; +1E29A;TOTO LETTER CHA;Lo;0;L;;;;;N;;;;; +1E29B;TOTO LETTER YA;Lo;0;L;;;;;N;;;;; +1E29C;TOTO LETTER WA;Lo;0;L;;;;;N;;;;; +1E29D;TOTO LETTER JA;Lo;0;L;;;;;N;;;;; +1E29E;TOTO LETTER HA;Lo;0;L;;;;;N;;;;; +1E29F;TOTO LETTER RA;Lo;0;L;;;;;N;;;;; +1E2A0;TOTO LETTER LA;Lo;0;L;;;;;N;;;;; +1E2A1;TOTO LETTER I;Lo;0;L;;;;;N;;;;; +1E2A2;TOTO LETTER BREATHY I;Lo;0;L;;;;;N;;;;; +1E2A3;TOTO LETTER IU;Lo;0;L;;;;;N;;;;; +1E2A4;TOTO LETTER BREATHY IU;Lo;0;L;;;;;N;;;;; +1E2A5;TOTO LETTER U;Lo;0;L;;;;;N;;;;; +1E2A6;TOTO LETTER E;Lo;0;L;;;;;N;;;;; +1E2A7;TOTO LETTER BREATHY E;Lo;0;L;;;;;N;;;;; +1E2A8;TOTO LETTER EO;Lo;0;L;;;;;N;;;;; +1E2A9;TOTO LETTER BREATHY EO;Lo;0;L;;;;;N;;;;; +1E2AA;TOTO LETTER O;Lo;0;L;;;;;N;;;;; +1E2AB;TOTO LETTER AE;Lo;0;L;;;;;N;;;;; +1E2AC;TOTO LETTER 
BREATHY AE;Lo;0;L;;;;;N;;;;; +1E2AD;TOTO LETTER A;Lo;0;L;;;;;N;;;;; +1E2AE;TOTO SIGN RISING TONE;Mn;230;NSM;;;;;N;;;;; 1E2C0;WANCHO LETTER AA;Lo;0;L;;;;;N;;;;; 1E2C1;WANCHO LETTER A;Lo;0;L;;;;;N;;;;; 1E2C2;WANCHO LETTER BA;Lo;0;L;;;;;N;;;;; @@ -29839,6 +30603,34 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1E2F8;WANCHO DIGIT EIGHT;Nd;0;L;;8;8;8;N;;;;; 1E2F9;WANCHO DIGIT NINE;Nd;0;L;;9;9;9;N;;;;; 1E2FF;WANCHO NGUN SIGN;Sc;0;ET;;;;;N;;;;; +1E7E0;ETHIOPIC SYLLABLE HHYA;Lo;0;L;;;;;N;;;;; +1E7E1;ETHIOPIC SYLLABLE HHYU;Lo;0;L;;;;;N;;;;; +1E7E2;ETHIOPIC SYLLABLE HHYI;Lo;0;L;;;;;N;;;;; +1E7E3;ETHIOPIC SYLLABLE HHYAA;Lo;0;L;;;;;N;;;;; +1E7E4;ETHIOPIC SYLLABLE HHYEE;Lo;0;L;;;;;N;;;;; +1E7E5;ETHIOPIC SYLLABLE HHYE;Lo;0;L;;;;;N;;;;; +1E7E6;ETHIOPIC SYLLABLE HHYO;Lo;0;L;;;;;N;;;;; +1E7E8;ETHIOPIC SYLLABLE GURAGE HHWA;Lo;0;L;;;;;N;;;;; +1E7E9;ETHIOPIC SYLLABLE HHWI;Lo;0;L;;;;;N;;;;; +1E7EA;ETHIOPIC SYLLABLE HHWEE;Lo;0;L;;;;;N;;;;; +1E7EB;ETHIOPIC SYLLABLE HHWE;Lo;0;L;;;;;N;;;;; +1E7ED;ETHIOPIC SYLLABLE GURAGE MWI;Lo;0;L;;;;;N;;;;; +1E7EE;ETHIOPIC SYLLABLE GURAGE MWEE;Lo;0;L;;;;;N;;;;; +1E7F0;ETHIOPIC SYLLABLE GURAGE QWI;Lo;0;L;;;;;N;;;;; +1E7F1;ETHIOPIC SYLLABLE GURAGE QWEE;Lo;0;L;;;;;N;;;;; +1E7F2;ETHIOPIC SYLLABLE GURAGE QWE;Lo;0;L;;;;;N;;;;; +1E7F3;ETHIOPIC SYLLABLE GURAGE BWI;Lo;0;L;;;;;N;;;;; +1E7F4;ETHIOPIC SYLLABLE GURAGE BWEE;Lo;0;L;;;;;N;;;;; +1E7F5;ETHIOPIC SYLLABLE GURAGE KWI;Lo;0;L;;;;;N;;;;; +1E7F6;ETHIOPIC SYLLABLE GURAGE KWEE;Lo;0;L;;;;;N;;;;; +1E7F7;ETHIOPIC SYLLABLE GURAGE KWE;Lo;0;L;;;;;N;;;;; +1E7F8;ETHIOPIC SYLLABLE GURAGE GWI;Lo;0;L;;;;;N;;;;; +1E7F9;ETHIOPIC SYLLABLE GURAGE GWEE;Lo;0;L;;;;;N;;;;; +1E7FA;ETHIOPIC SYLLABLE GURAGE GWE;Lo;0;L;;;;;N;;;;; +1E7FB;ETHIOPIC SYLLABLE GURAGE FWI;Lo;0;L;;;;;N;;;;; +1E7FC;ETHIOPIC SYLLABLE GURAGE FWEE;Lo;0;L;;;;;N;;;;; +1E7FD;ETHIOPIC SYLLABLE GURAGE PWI;Lo;0;L;;;;;N;;;;; +1E7FE;ETHIOPIC SYLLABLE GURAGE PWEE;Lo;0;L;;;;;N;;;;; 1E800;MENDE KIKAKUI SYLLABLE M001 KI;Lo;0;R;;;;;N;;;;; 1E801;MENDE KIKAKUI SYLLABLE M002 
KA;Lo;0;R;;;;;N;;;;; 1E802;MENDE KIKAKUI SYLLABLE M003 KU;Lo;0;R;;;;;N;;;;; @@ -31886,6 +32678,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F6D5;HINDU TEMPLE;So;0;ON;;;;;N;;;;; 1F6D6;HUT;So;0;ON;;;;;N;;;;; 1F6D7;ELEVATOR;So;0;ON;;;;;N;;;;; +1F6DD;PLAYGROUND SLIDE;So;0;ON;;;;;N;;;;; +1F6DE;WHEEL;So;0;ON;;;;;N;;;;; +1F6DF;RING BUOY;So;0;ON;;;;;N;;;;; 1F6E0;HAMMER AND WRENCH;So;0;ON;;;;;N;;;;; 1F6E1;SHIELD;So;0;ON;;;;;N;;;;; 1F6E2;OIL DRUM;So;0;ON;;;;;N;;;;; @@ -32129,6 +32924,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F7E9;LARGE GREEN SQUARE;So;0;ON;;;;;N;;;;; 1F7EA;LARGE PURPLE SQUARE;So;0;ON;;;;;N;;;;; 1F7EB;LARGE BROWN SQUARE;So;0;ON;;;;;N;;;;; +1F7F0;HEAVY EQUALS SIGN;So;0;ON;;;;;N;;;;; 1F800;LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD;So;0;ON;;;;;N;;;;; 1F801;UPWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD;So;0;ON;;;;;N;;;;; 1F802;RIGHTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD;So;0;ON;;;;;N;;;;; @@ -32400,6 +33196,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F976;FREEZING FACE;So;0;ON;;;;;N;;;;; 1F977;NINJA;So;0;ON;;;;;N;;;;; 1F978;DISGUISED FACE;So;0;ON;;;;;N;;;;; +1F979;FACE HOLDING BACK TEARS;So;0;ON;;;;;N;;;;; 1F97A;FACE WITH PLEADING EYES;So;0;ON;;;;;N;;;;; 1F97B;SARI;So;0;ON;;;;;N;;;;; 1F97C;LAB COAT;So;0;ON;;;;;N;;;;; @@ -32482,6 +33279,7 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1F9C9;MATE DRINK;So;0;ON;;;;;N;;;;; 1F9CA;ICE CUBE;So;0;ON;;;;;N;;;;; 1F9CB;BUBBLE TEA;So;0;ON;;;;;N;;;;; +1F9CC;TROLL;So;0;ON;;;;;N;;;;; 1F9CD;STANDING PERSON;So;0;ON;;;;;N;;;;; 1F9CE;KNEELING PERSON;So;0;ON;;;;;N;;;;; 1F9CF;DEAF PERSON;So;0;ON;;;;;N;;;;; @@ -32639,6 +33437,8 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FA78;DROP OF BLOOD;So;0;ON;;;;;N;;;;; 1FA79;ADHESIVE BANDAGE;So;0;ON;;;;;N;;;;; 1FA7A;STETHOSCOPE;So;0;ON;;;;;N;;;;; +1FA7B;X-RAY;So;0;ON;;;;;N;;;;; +1FA7C;CRUTCH;So;0;ON;;;;;N;;;;; 1FA80;YO-YO;So;0;ON;;;;;N;;;;; 1FA81;KITE;So;0;ON;;;;;N;;;;; 1FA82;PARACHUTE;So;0;ON;;;;;N;;;;; @@ -32671,6 +33471,10 @@ FFFD;REPLACEMENT 
CHARACTER;So;0;ON;;;;;N;;;;; 1FAA6;HEADSTONE;So;0;ON;;;;;N;;;;; 1FAA7;PLACARD;So;0;ON;;;;;N;;;;; 1FAA8;ROCK;So;0;ON;;;;;N;;;;; +1FAA9;MIRROR BALL;So;0;ON;;;;;N;;;;; +1FAAA;IDENTIFICATION CARD;So;0;ON;;;;;N;;;;; +1FAAB;LOW BATTERY;So;0;ON;;;;;N;;;;; +1FAAC;HAMSA;So;0;ON;;;;;N;;;;; 1FAB0;FLY;So;0;ON;;;;;N;;;;; 1FAB1;WORM;So;0;ON;;;;;N;;;;; 1FAB2;BEETLE;So;0;ON;;;;;N;;;;; @@ -32678,9 +33482,16 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAB4;POTTED PLANT;So;0;ON;;;;;N;;;;; 1FAB5;WOOD;So;0;ON;;;;;N;;;;; 1FAB6;FEATHER;So;0;ON;;;;;N;;;;; +1FAB7;LOTUS;So;0;ON;;;;;N;;;;; +1FAB8;CORAL;So;0;ON;;;;;N;;;;; +1FAB9;EMPTY NEST;So;0;ON;;;;;N;;;;; +1FABA;NEST WITH EGGS;So;0;ON;;;;;N;;;;; 1FAC0;ANATOMICAL HEART;So;0;ON;;;;;N;;;;; 1FAC1;LUNGS;So;0;ON;;;;;N;;;;; 1FAC2;PEOPLE HUGGING;So;0;ON;;;;;N;;;;; +1FAC3;PREGNANT MAN;So;0;ON;;;;;N;;;;; +1FAC4;PREGNANT PERSON;So;0;ON;;;;;N;;;;; +1FAC5;PERSON WITH CROWN;So;0;ON;;;;;N;;;;; 1FAD0;BLUEBERRIES;So;0;ON;;;;;N;;;;; 1FAD1;BELL PEPPER;So;0;ON;;;;;N;;;;; 1FAD2;OLIVE;So;0;ON;;;;;N;;;;; @@ -32688,6 +33499,24 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FAD4;TAMALE;So;0;ON;;;;;N;;;;; 1FAD5;FONDUE;So;0;ON;;;;;N;;;;; 1FAD6;TEAPOT;So;0;ON;;;;;N;;;;; +1FAD7;POURING LIQUID;So;0;ON;;;;;N;;;;; +1FAD8;BEANS;So;0;ON;;;;;N;;;;; +1FAD9;JAR;So;0;ON;;;;;N;;;;; +1FAE0;MELTING FACE;So;0;ON;;;;;N;;;;; +1FAE1;SALUTING FACE;So;0;ON;;;;;N;;;;; +1FAE2;FACE WITH OPEN EYES AND HAND OVER MOUTH;So;0;ON;;;;;N;;;;; +1FAE3;FACE WITH PEEKING EYE;So;0;ON;;;;;N;;;;; +1FAE4;FACE WITH DIAGONAL MOUTH;So;0;ON;;;;;N;;;;; +1FAE5;DOTTED LINE FACE;So;0;ON;;;;;N;;;;; +1FAE6;BITING LIP;So;0;ON;;;;;N;;;;; +1FAE7;BUBBLES;So;0;ON;;;;;N;;;;; +1FAF0;HAND WITH INDEX FINGER AND THUMB CROSSED;So;0;ON;;;;;N;;;;; +1FAF1;RIGHTWARDS HAND;So;0;ON;;;;;N;;;;; +1FAF2;LEFTWARDS HAND;So;0;ON;;;;;N;;;;; +1FAF3;PALM DOWN HAND;So;0;ON;;;;;N;;;;; +1FAF4;PALM UP HAND;So;0;ON;;;;;N;;;;; +1FAF5;INDEX POINTING AT THE VIEWER;So;0;ON;;;;;N;;;;; +1FAF6;HEART HANDS;So;0;ON;;;;;N;;;;; 1FB00;BLOCK 
SEXTANT-1;So;0;ON;;;;;N;;;;; 1FB01;BLOCK SEXTANT-2;So;0;ON;;;;;N;;;;; 1FB02;BLOCK SEXTANT-12;So;0;ON;;;;;N;;;;; @@ -32901,9 +33730,9 @@ FFFD;REPLACEMENT CHARACTER;So;0;ON;;;;;N;;;;; 1FBF8;SEGMENTED DIGIT EIGHT;Nd;0;EN; 0038;8;8;8;N;;;;; 1FBF9;SEGMENTED DIGIT NINE;Nd;0;EN; 0039;9;9;9;N;;;;; 20000;;Lo;0;L;;;;;N;;;;; -2A6DD;;Lo;0;L;;;;;N;;;;; +2A6DF;;Lo;0;L;;;;;N;;;;; 2A700;;Lo;0;L;;;;;N;;;;; -2B734;;Lo;0;L;;;;;N;;;;; +2B738;;Lo;0;L;;;;;N;;;;; 2B740;;Lo;0;L;;;;;N;;;;; 2B81D;;Lo;0;L;;;;;N;;;;; 2B820;;Lo;0;L;;;;;N;;;;; diff --git a/lib/unicore/VerticalOrientation.txt b/lib/unicore/VerticalOrientation.txt index 1cc92e31f9..35caa05bf1 100644 --- a/lib/unicore/VerticalOrientation.txt +++ b/lib/unicore/VerticalOrientation.txt @@ -1,16 +1,16 @@ -# VerticalOrientation-13.0.0.txt -# Date: 2019-10-07, 05:27:01 GMT [EM, KI, LI] -# © 2019 Unicode®, Inc. +# VerticalOrientation-14.0.0.txt +# Date: 2021-07-06, 09:58:53 GMT [EM, KI, LI, KW, MS] +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. -# For terms of use, see http://www.unicode.org/terms_of_use.html +# For terms of use, see https://www.unicode.org/terms_of_use.html # # Unicode Character Database -# For documentation, see http://www.unicode.org/reports/tr44/ +# For documentation, see https://www.unicode.org/reports/tr44/ # # Vertical_Orientation (vo) Property # # This file defines the Vertical_Orientation property. See UAX #50: -# Unicode Vertical Text Layout, at http://www.unicode.org/reports/tr50/ +# Unicode Vertical Text Layout, at https://www.unicode.org/reports/tr50/ # # The format of the file is two fields separated by a semicolon. 
# Field 0: Unicode code point value or range of code point values in @@ -45,9 +45,11 @@ # Egyptian Hieroglyphs & Controls: U+13000..U+1343F # Anatolian Hieroglyphs: U+14400..U+1467F # Ideographic Symbols & Tangut: U+16FE0..U+18AFF -# Khitan Small Script & Tangut Sup: U+18B00..U+18D8F +# Khitan Small Script & Tangut Sup: U+18B00..U+18D7F +# Kana Extended-B: U+1AFF0..U+1AFFF # Kana Extended-A & Small Kana Ext: U+1B100..U+1B16F # Nushu: U+1B170..U+1B2FF +# Musical Symbols: U+1CF00..U+1CFCF # Musical Symbols: U+1D000..U+1D1FF # Mayan Numerals: U+1D2E0..U+1D2FF # Symbols & Rods: U+1D300..U+1D37F @@ -205,7 +207,7 @@ 0610..061A ; R # Mn [11] ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA 061B ; R # Po ARABIC SEMICOLON 061C ; R # Cf ARABIC LETTER MARK -061E..061F ; R # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; R # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F ; R # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640 ; R # Lm ARABIC TATWEEL 0641..064A ; R # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -263,9 +265,14 @@ 0859..085B ; R # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 085E ; R # Po MANDAIC PUNCTUATION 0860..086A ; R # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; R # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; R # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1 ; R # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887 ; R # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; R # Sk ARABIC RAISED ROUND DOT +0889..088E ; R # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891 ; R # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F ; R # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA 
+08A0..08C8 ; R # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; R # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; R # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E2 ; R # Cf ARABIC DISPUTED END OF AYAH 08E3..08FF ; R # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA 0900..0902 ; R # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA @@ -422,6 +429,7 @@ 0C0E..0C10 ; R # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28 ; R # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39 ; R # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA +0C3C ; R # Mn TELUGU SIGN NUKTA 0C3D ; R # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40 ; R # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; R # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -429,6 +437,7 @@ 0C4A..0C4D ; R # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; R # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; R # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; R # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; R # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; R # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; R # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -454,7 +463,7 @@ 0CCA..0CCB ; R # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD ; R # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6 ; R # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; R # Lo KANNADA LETTER FA +0CDD..0CDE ; R # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; R # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; R # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; R # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -640,11 +649,13 @@ 16EB..16ED ; R # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0 ; R # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC 
BELGTHOR SYMBOL 16F1..16F8 ; R # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; R # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; R # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; R # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714 ; R # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA +1715 ; R # Mc TAGALOG SIGN PAMUDPOD +171F ; R # Lo TAGALOG LETTER ARCHAIC RA 1720..1731 ; R # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734 ; R # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; R # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; R # Mc HANUNOO SIGN PAMUDPOD 1735..1736 ; R # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 1740..1751 ; R # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753 ; R # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U @@ -672,6 +683,7 @@ 1807..180A ; R # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU 180B..180D ; R # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; R # Cf MONGOLIAN VOWEL SEPARATOR +180F ; R # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; R # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; R # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; R # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -728,7 +740,7 @@ 1AA8..1AAD ; R # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1AB0..1ABD ; R # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; R # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; R # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; R # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; R # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; R # Mc BALINESE SIGN BISAH 1B05..1B33 ; R # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -740,12 +752,13 @@ 1B3D..1B41 ; R # Mc [5] BALINESE 
VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; R # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44 ; R # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; R # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; R # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; R # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60 ; R # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A ; R # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B6B..1B73 ; R # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B74..1B7C ; R # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E ; R # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B80..1B81 ; R # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82 ; R # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0 ; R # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -804,8 +817,7 @@ 1D79..1D7F ; R # Ll [7] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER UPSILON WITH STROKE 1D80..1D9A ; R # Ll [27] LATIN SMALL LETTER B WITH PALATAL HOOK..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF ; R # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9 ; R # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; R # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; R # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1EFF ; R # L& [256] LATIN CAPITAL LETTER A WITH RING BELOW..LATIN SMALL LETTER Y WITH LOOP 1F00..1F15 ; R # L& [22] GREEK SMALL LETTER ALPHA WITH PSILI..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D ; R # Lu [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA @@ -886,7 +898,7 @@ 208D ; R # Ps 
SUBSCRIPT LEFT PARENTHESIS 208E ; R # Pe SUBSCRIPT RIGHT PARENTHESIS 2090..209C ; R # Lm [13] LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER T -20A0..20BF ; R # Sc [32] EURO-CURRENCY SIGN..BITCOIN SIGN +20A0..20C0 ; R # Sc [33] EURO-CURRENCY SIGN..SOM SIGN 20D0..20DC ; R # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; U # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E1 ; R # Mn COMBINING LEFT RIGHT ARROW ABOVE @@ -1087,8 +1099,7 @@ 2BD3..2BEB ; U # So [25] PLUTO FORM TWO..STAR WITH RIGHT HALF BLACK 2BEC..2BEF ; R # So [4] LEFTWARDS TWO-HEADED ARROW WITH TRIANGLE ARROWHEADS..DOWNWARDS TWO-HEADED ARROW WITH TRIANGLE ARROWHEADS 2BF0..2BFF ; U # So [16] ERIS FORM ONE..HELLSCHREIBER PAUSE SYMBOL -2C00..2C2E ; R # Lu [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; R # Ll [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C00..2C5F ; R # L& [96] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C60..2C7B ; R # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; R # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2C7F ; R # Lu [2] LATIN CAPITAL LETTER S WITH SWASH TAIL..LATIN CAPITAL LETTER Z WITH SWASH TAIL @@ -1156,7 +1167,16 @@ 2E42 ; R # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; R # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; U # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; R # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; R # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; R # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; R # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; R # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; R # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; R # Ps TOP HALF LEFT PARENTHESIS +2E5A ; R # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; R # Ps 
BOTTOM HALF LEFT PARENTHESIS +2E5C ; R # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; R # Pd OBLIQUE HYPHEN 2E80..2E99 ; U # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9A ; U # Cn 2E9B..2EF3 ; U # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE @@ -1294,8 +1314,7 @@ 3380..33FF ; U # So [128] SQUARE PA AMPS..SQUARE GAL 3400..4DBF ; U # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF 4DC0..4DFF ; U # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION -4E00..9FFC ; U # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -9FFD..9FFF ; U # Cn [3] .. +4E00..9FFF ; U # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF A000..A014 ; U # Lo [21] YI SYLLABLE IT..YI SYLLABLE E A015 ; U # Lm YI SYLLABLE WU A016..A48C ; U # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR @@ -1336,8 +1355,11 @@ A788 ; R # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; R # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; R # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; R # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; R # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; R # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; R # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; R # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; R # Ll LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; R # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; R # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; R # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; R # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; R # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL 
LIGATURE OE @@ -1495,15 +1517,17 @@ FB40..FB41 ; R # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SA FB43..FB44 ; R # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH FB46..FB4F ; R # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE ALEF LAMED FB50..FBB1 ; R # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1 ; R # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; R # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D ; R # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM FD3E ; R # Pe ORNATE LEFT PARENTHESIS FD3F ; R # Ps ORNATE RIGHT PARENTHESIS +FD40..FD4F ; R # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F ; R # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7 ; R # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF ; R # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB ; R # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC ; R # Sc RIAL SIGN -FDFD ; R # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF ; R # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE00..FE0F ; R # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 FE10..FE16 ; U # Po [7] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL QUESTION MARK FE17 ; U # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET @@ -1660,9 +1684,20 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 10500..10527 ; R # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; R # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F ; R # Po CAUCASIAN ALBANIAN CITATION MARK 
+10570..1057A ; R # Lu [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; R # Lu [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; R # Lu [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; R # Lu [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; R # Ll [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; R # Ll [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; R # Ll [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; R # Ll [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; R # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; R # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; R # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; R # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; R # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; R # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; R # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; R # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; R # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1741,6 +1776,9 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 10F46..10F50 ; R # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 10F51..10F54 ; R # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59 ; R # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81 ; R # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85 ; R # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +10F86..10F89 ; R # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4 ; R # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 
10FC5..10FCB ; R # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6 ; R # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH @@ -1752,6 +1790,10 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 11047..1104D ; R # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065 ; R # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F ; R # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070 ; R # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072 ; R # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; R # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; R # Lo BRAHMI LETTER OLD TAMIL LLA 1107F ; R # Mn BRAHMI NUMBER JOINER 11080..11081 ; R # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA 11082 ; R # Mc KAITHI SIGN VISARGA @@ -1763,6 +1805,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 110BB..110BC ; R # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD ; R # Cf KAITHI NUMBER SIGN 110BE..110C1 ; R # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA +110C2 ; R # Mn KAITHI VOWEL SIGN VOCALIC R 110CD ; R # Cf KAITHI NUMBER SIGN ABOVE 110D0..110E8 ; R # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; R # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE @@ -1899,6 +1942,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 116B6 ; R # Mc TAKRI SIGN VIRAMA 116B7 ; R # Mn TAKRI SIGN NUKTA 116B8 ; R # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; R # Po TAKRI ABBREVIATION SIGN 116C0..116C9 ; R # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A ; R # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 1171D..1171F ; R # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA @@ -1910,6 +1954,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1173A..1173B ; R # No [2] AHOM NUMBER TEN..AHOM NUMBER 
TWENTY 1173C..1173E ; R # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F ; R # So AHOM SYMBOL VI +11740..11746 ; R # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; R # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; R # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; R # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -1970,6 +2015,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 11A9D ; U # Lo SOYOMBO MARK PLUTA 11A9E..11AA2 ; U # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO TERMINAL MARK-2 11AA3..11AAF ; U # Cn [13] .. +11AB0..11ABF ; U # Lo [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA 11AC0..11AF8 ; R # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; R # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; R # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA @@ -2026,6 +2072,8 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 12400..1246E ; R # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474 ; R # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543 ; R # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; R # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; R # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..1342E ; U # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 1342F ; U # Cn 13430..13438 ; U # Cf [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT @@ -2036,6 +2084,8 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 16A40..16A5E ; R # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; R # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F ; R # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE ; R # Lo [79] TANGSA LETTER 
OZ..TANGSA LETTER ZA +16AC0..16AC9 ; R # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; R # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4 ; R # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16AF5 ; R # Po BASSA VAH FULL STOP @@ -2062,7 +2112,7 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 16FE0..16FE1 ; U # Lm [2] TANGUT ITERATION MARK..NUSHU ITERATION MARK 16FE2 ; U # Po OLD CHINESE HOOK MARK 16FE3 ; U # Lm OLD CHINESE ITERATION MARK -16FE4 ; U # Lo KHITAN SMALL SCRIPT FILLER +16FE4 ; U # Mn KHITAN SMALL SCRIPT FILLER 16FE5..16FEF ; U # Cn [11] .. 16FF0..16FF1 ; U # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 16FF2..16FFF ; U # Cn [14] .. @@ -2072,10 +2122,16 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 18B00..18CD5 ; U # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 18CD6..18CFF ; U # Cn [42] .. 18D00..18D08 ; U # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -18D09..18D8F ; U # Cn [135] .. +18D09..18D7F ; U # Cn [119] .. +1AFF0..1AFF3 ; U # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF4 ; U # Cn +1AFF5..1AFFB ; U # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFC ; U # Cn +1AFFD..1AFFE ; U # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1AFFF ; U # Cn 1B000..1B0FF ; U # Lo [256] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER RE-2 -1B100..1B11E ; U # Lo [31] HENTAIGANA LETTER RE-3..HENTAIGANA LETTER N-MU-MO-2 -1B11F..1B12F ; U # Cn [17] .. +1B100..1B122 ; U # Lo [35] HENTAIGANA LETTER RE-3..KATAKANA LETTER ARCHAIC WU +1B123..1B12F ; U # Cn [13] .. 1B130..1B14F ; U # Cn [32] .. 1B150..1B152 ; U # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B153..1B163 ; U # Cn [17] .. 
@@ -2091,6 +2147,12 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1BC9D..1BC9E ; R # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BC9F ; R # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1BCA0..1BCA3 ; R # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; U # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF2E..1CF2F ; U # Cn [2] .. +1CF30..1CF46 ; U # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF47..1CF4F ; U # Cn [9] .. +1CF50..1CFC3 ; U # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK +1CFC4..1CFCF ; U # Cn [12] .. 1D000..1D0F5 ; U # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D0F6..1D0FF ; U # Cn [10] .. 1D100..1D126 ; U # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 @@ -2106,8 +2168,8 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1D185..1D18B ; U # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D18C..1D1A9 ; U # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 1D1AA..1D1AD ; U # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -1D1AE..1D1E8 ; U # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN -1D1E9..1D1FF ; U # Cn [23] .. +1D1AE..1D1EA ; U # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON +1D1EB..1D1FF ; U # Cn [21] .. 
1D200..1D241 ; R # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D242..1D244 ; R # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME 1D245 ; R # So GREEK MUSICAL LEIMMA @@ -2172,6 +2234,9 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1DA9B..1DA9F ; U # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA0 ; U # Cn 1DAA1..1DAAF ; U # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09 ; R # Ll [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; R # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; R # Ll [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006 ; R # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; R # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; R # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -2183,10 +2248,16 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1E140..1E149 ; R # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; R # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F ; R # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD ; R # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE ; R # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB ; R # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF ; R # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9 ; R # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1E2FF ; R # Sc WANCHO NGUN SIGN +1E7E0..1E7E6 ; R # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; R # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; R # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; R # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC 
SYLLABLE GURAGE PWEE 1E800..1E8C4 ; R # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF ; R # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E8D0..1E8D6 ; R # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS @@ -2270,8 +2341,8 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1F600..1F64F ; U # So [80] GRINNING FACE..PERSON WITH FOLDED HANDS 1F650..1F67F ; U # So [48] NORTH WEST POINTING LEAF..REVERSE CHECKER BOARD 1F680..1F6D7 ; U # So [88] ROCKET..ELEVATOR -1F6D8..1F6DF ; U # Cn [8] .. -1F6E0..1F6EC ; U # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6D8..1F6DC ; U # Cn [5] .. +1F6DD..1F6EC ; U # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6ED..1F6EF ; U # Cn [3] .. 1F6F0..1F6FC ; U # So [13] SATELLITE..ROLLER SKATE 1F6FD..1F6FF ; U # Cn [3] .. @@ -2280,43 +2351,45 @@ FFFC..FFFD ; U # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARA 1F780..1F7D8 ; U # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7D9..1F7DF ; U # Cn [7] .. 1F7E0..1F7EB ; U # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE -1F7EC..1F7FF ; U # Cn [20] .. +1F7EC..1F7EF ; U # Cn [4] .. +1F7F0 ; U # So HEAVY EQUALS SIGN +1F7F1..1F7FF ; U # Cn [15] .. 
1F800..1F80B ; R # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; R # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; R # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; R # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW 1F890..1F8AD ; R # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS 1F8B0..1F8B1 ; R # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST -1F900..1F978 ; U # So [121] CIRCLED CROSS FORMEE WITH FOUR DOTS..DISGUISED FACE -1F979 ; U # Cn -1F97A..1F9CB ; U # So [82] FACE WITH PLEADING EYES..BUBBLE TEA -1F9CC ; U # Cn -1F9CD..1F9FF ; U # So [51] STANDING PERSON..NAZAR AMULET +1F900..1F9FF ; U # So [256] CIRCLED CROSS FORMEE WITH FOUR DOTS..NAZAR AMULET 1FA00..1FA53 ; U # So [84] NEUTRAL CHESS KING..BLACK CHESS KNIGHT-BISHOP 1FA54..1FA5F ; U # Cn [12] .. 1FA60..1FA6D ; U # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA6E..1FA6F ; U # Cn [2] .. 1FA70..1FA74 ; U # So [5] BALLET SHOES..THONG SANDAL 1FA75..1FA77 ; U # Cn [3] .. -1FA78..1FA7A ; U # So [3] DROP OF BLOOD..STETHOSCOPE -1FA7B..1FA7F ; U # Cn [5] .. +1FA78..1FA7C ; U # So [5] DROP OF BLOOD..CRUTCH +1FA7D..1FA7F ; U # Cn [3] .. 1FA80..1FA86 ; U # So [7] YO-YO..NESTING DOLLS 1FA87..1FA8F ; U # Cn [9] .. -1FA90..1FAA8 ; U # So [25] RINGED PLANET..ROCK -1FAA9..1FAAF ; U # Cn [7] .. -1FAB0..1FAB6 ; U # So [7] FLY..FEATHER -1FAB7..1FABF ; U # Cn [9] .. -1FAC0..1FAC2 ; U # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAC3..1FACF ; U # Cn [13] .. -1FAD0..1FAD6 ; U # So [7] BLUEBERRIES..TEAPOT -1FAD7..1FAFF ; U # Cn [41] .. +1FA90..1FAAC ; U # So [29] RINGED PLANET..HAMSA +1FAAD..1FAAF ; U # Cn [3] .. +1FAB0..1FABA ; U # So [11] FLY..NEST WITH EGGS +1FABB..1FABF ; U # Cn [5] .. 
+1FAC0..1FAC5 ; U # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAC6..1FACF ; U # Cn [10] .. +1FAD0..1FAD9 ; U # So [10] BLUEBERRIES..JAR +1FADA..1FADF ; U # Cn [6] .. +1FAE0..1FAE7 ; U # So [8] MELTING FACE..BUBBLES +1FAE8..1FAEF ; U # Cn [8] .. +1FAF0..1FAF6 ; U # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS +1FAF7..1FAFF ; U # Cn [9] .. 1FB00..1FB92 ; R # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; R # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON 1FBF0..1FBF9 ; R # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -20000..2A6DD ; U # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A6DE..2A6FF ; U # Cn [34] .. -2A700..2B734 ; U # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 -2B735..2B73F ; U # Cn [11] .. +20000..2A6DF ; U # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A6E0..2A6FF ; U # Cn [32] .. +2A700..2B738 ; U # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 +2B739..2B73F ; U # Cn [7] .. 2B740..2B81D ; U # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F ; U # Cn [2] .. 2B820..2CEA1 ; U # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 diff --git a/lib/unicore/auxiliary/GCBTest.txt b/lib/unicore/auxiliary/GCBTest.txt index 5baf292a07..eff2fd33b0 100644 --- a/lib/unicore/auxiliary/GCBTest.txt +++ b/lib/unicore/auxiliary/GCBTest.txt @@ -1,6 +1,6 @@ -# GraphemeBreakTest-13.0.0.txt -# Date: 2019-11-15, 19:49:10 GMT -# © 2019 Unicode®, Inc. +# GraphemeBreakTest-14.0.0.txt +# Date: 2021-03-08, 06:22:32 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/auxiliary/GraphemeBreakProperty.txt b/lib/unicore/auxiliary/GraphemeBreakProperty.txt index 6ee92f6eec..dd2569064a 100644 --- a/lib/unicore/auxiliary/GraphemeBreakProperty.txt +++ b/lib/unicore/auxiliary/GraphemeBreakProperty.txt @@ -1,6 +1,6 @@ -# GraphemeBreakProperty-13.0.0.txt -# Date: 2019-10-21, 14:30:35 GMT -# © 2019 Unicode®, Inc. +# GraphemeBreakProperty-14.0.0.txt +# Date: 2021-08-12, 23:13:02 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -21,6 +21,7 @@ 0600..0605 ; Prepend # Cf [6] ARABIC NUMBER SIGN..ARABIC NUMBER MARK ABOVE 06DD ; Prepend # Cf ARABIC END OF AYAH 070F ; Prepend # Cf SYRIAC ABBREVIATION MARK +0890..0891 ; Prepend # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Prepend # Cf ARABIC DISPUTED END OF AYAH 0D4E ; Prepend # Lo MALAYALAM LETTER DOT REPH 110BD ; Prepend # Cf KAITHI NUMBER SIGN @@ -32,7 +33,7 @@ 11A84..11A89 ; Prepend # Lo [6] SOYOMBO SIGN JIHVAMULIYA..SOYOMBO CLUSTER-INITIAL LETTER SA 11D46 ; Prepend # Lo MASARAM GONDI REPHA -# Total code points: 24 +# Total code points: 26 # ================================================ @@ -104,7 +105,8 @@ E01F0..E0FFF ; Control # Cn [3600] .. 
0825..0827 ; Extend # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; Extend # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; Extend # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; Extend # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; Extend # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; Extend # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; Extend # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 093A ; Extend # Mn DEVANAGARI VOWEL SIGN OE 093C ; Extend # Mn DEVANAGARI SIGN NUKTA @@ -151,6 +153,7 @@ E01F0..E0FFF ; Control # Cn [3600] .. 0BD7 ; Extend # Mc TAMIL AU LENGTH MARK 0C00 ; Extend # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C04 ; Extend # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; Extend # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; Extend # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C46..0C48 ; Extend # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; Extend # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA @@ -206,7 +209,7 @@ E01F0..E0FFF ; Control # Cn [3600] .. 109D ; Extend # Mn MYANMAR VOWEL SIGN AITON AI 135D..135F ; Extend # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; Extend # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; Extend # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; Extend # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1752..1753 ; Extend # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; Extend # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; Extend # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -215,6 +218,7 @@ E01F0..E0FFF ; Control # Cn [3600] .. 
17C9..17D3 ; Extend # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; Extend # Mn KHMER SIGN ATTHACAN 180B..180D ; Extend # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; Extend # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; Extend # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; Extend # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; Extend # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -232,7 +236,7 @@ E01F0..E0FFF ; Control # Cn [3600] .. 1A7F ; Extend # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; Extend # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; Extend # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; Extend # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Extend # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Extend # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B34 ; Extend # Mn BALINESE SIGN REREKAN 1B35 ; Extend # Mc BALINESE VOWEL SIGN TEDUNG @@ -256,8 +260,7 @@ E01F0..E0FFF ; Control # Cn [3600] .. 
1CED ; Extend # Mn VEDIC SIGN TIRYAK 1CF4 ; Extend # Mn VEDIC TONE CANDRA ABOVE 1CF8..1CF9 ; Extend # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; Extend # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Extend # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Extend # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200C ; Extend # Cf ZERO WIDTH NON-JOINER 20D0..20DC ; Extend # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; Extend # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH @@ -322,11 +325,15 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 10D24..10D27 ; Extend # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; Extend # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; Extend # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Extend # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11001 ; Extend # Mn BRAHMI SIGN ANUSVARA 11038..11046 ; Extend # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; Extend # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Extend # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; Extend # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 110B3..110B6 ; Extend # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B9..110BA ; Extend # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Extend # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; Extend # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Extend # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112D..11134 ; Extend # Mn [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA @@ -412,6 +419,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND 
MARK..HALFWIDT 16F8F..16F92 ; Extend # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; Extend # Mn KHITAN SMALL SCRIPT FILLER 1BC9D..1BC9E ; Extend # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; Extend # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Extend # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165 ; Extend # Mc MUSICAL SYMBOL COMBINING STEM 1D167..1D169 ; Extend # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16E..1D172 ; Extend # Mc [5] MUSICAL SYMBOL COMBINING FLAG-1..MUSICAL SYMBOL COMBINING FLAG-5 @@ -431,6 +440,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1E023..1E024 ; Extend # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Extend # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; Extend # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; Extend # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; Extend # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Extend # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; Extend # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA @@ -438,7 +448,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 1984 +# Total code points: 2095 # ================================================ @@ -495,6 +505,8 @@ E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 103B..103C ; SpacingMark # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA 1056..1057 ; SpacingMark # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR 1084 ; 
SpacingMark # Mc MYANMAR VOWEL SIGN SHAN E +1715 ; SpacingMark # Mc TAGALOG SIGN PAMUDPOD +1734 ; SpacingMark # Mc HANUNOO SIGN PAMUDPOD 17B6 ; SpacingMark # Mc KHMER VOWEL SIGN AA 17BE..17C5 ; SpacingMark # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU 17C7..17C8 ; SpacingMark # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU @@ -579,7 +591,6 @@ ABEC ; SpacingMark # Mc MEETEI MAYEK LUM IYEK 116AC ; SpacingMark # Mc TAKRI SIGN VISARGA 116AE..116AF ; SpacingMark # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II 116B6 ; SpacingMark # Mc TAKRI SIGN VIRAMA -11720..11721 ; SpacingMark # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA 11726 ; SpacingMark # Mc AHOM VOWEL SIGN E 1182C..1182E ; SpacingMark # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 11838 ; SpacingMark # Mc DOGRA SIGN VISARGA diff --git a/lib/unicore/auxiliary/LBTest.txt b/lib/unicore/auxiliary/LBTest.txt index d8666c458f..8d1cef0f78 100644 --- a/lib/unicore/auxiliary/LBTest.txt +++ b/lib/unicore/auxiliary/LBTest.txt @@ -1,6 +1,6 @@ -# LineBreakTest-13.0.0.txt -# Date: 2019-11-21, 16:13:36 GMT -# © 2019 Unicode®, Inc. +# LineBreakTest-14.0.0.txt +# Date: 2021-08-20, 21:08:45 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -1846,9 +1846,9 @@ × AC00 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × AC00 × 0308 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × AC00 × 0308 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] -× AC00 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× AC00 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × AC00 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] -× AC00 × 0308 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× AC00 × 0308 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × AC00 × 0308 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] × AC00 ÷ 0024 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) ÷ [999.0] DOLLAR SIGN (PR) ÷ [0.3] × AC00 × 0020 ÷ 0024 ÷ # × [0.3] HANGUL SYLLABLE GA (H2) × [7.01] SPACE (SP) ÷ [18.0] DOLLAR SIGN (PR) ÷ [0.3] @@ -2018,9 +2018,9 @@ × AC01 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × AC01 × 0308 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × AC01 × 0308 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] -× AC01 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× AC01 × 
0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × AC01 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] -× AC01 × 0308 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× AC01 × 0308 × 0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × AC01 × 0308 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] × AC01 ÷ 0024 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) ÷ [999.0] DOLLAR SIGN (PR) ÷ [0.3] × AC01 × 0020 ÷ 0024 ÷ # × [0.3] HANGUL SYLLABLE GAG (H3) × [7.01] SPACE (SP) ÷ [18.0] DOLLAR SIGN (PR) ÷ [0.3] @@ -3050,9 +3050,9 @@ × 1100 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 1100 × 0308 ÷ 2329 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 1100 × 0308 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] -× 1100 × 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 1100 × 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 1100 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] -× 1100 × 0308 × 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 1100 × 0308 × 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 1100 × 0308 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] PERCENT 
SIGN (PO) ÷ [0.3] × 1100 ÷ 0024 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) ÷ [999.0] DOLLAR SIGN (PR) ÷ [0.3] × 1100 × 0020 ÷ 0024 ÷ # × [0.3] HANGUL CHOSEONG KIYEOK (JL) × [7.01] SPACE (SP) ÷ [18.0] DOLLAR SIGN (PR) ÷ [0.3] @@ -3222,9 +3222,9 @@ × 11A8 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 11A8 × 0308 ÷ 2329 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 11A8 × 0308 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] -× 11A8 × 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 11A8 × 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 11A8 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] -× 11A8 × 0308 × 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 11A8 × 0308 × 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 11A8 × 0308 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] × 11A8 ÷ 0024 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) ÷ [999.0] DOLLAR SIGN (PR) ÷ [0.3] × 11A8 × 0020 ÷ 0024 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [7.01] SPACE (SP) ÷ [18.0] DOLLAR SIGN (PR) ÷ [0.3] @@ -3394,9 +3394,9 @@ × 1160 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 1160 × 0308 ÷ 2329 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] × 1160 × 0308 × 0020 ÷ 2329 ÷ # × [0.3] HANGUL 
JUNGSEONG FILLER (JV) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] LEFT-POINTING ANGLE BRACKET (OP) ÷ [0.3] -× 1160 × 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 1160 × 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 1160 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] -× 1160 × 0308 × 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] PERCENT SIGN (PO) ÷ [0.3] +× 1160 × 0308 × 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.01] PERCENT SIGN (PO) ÷ [0.3] × 1160 × 0308 × 0020 ÷ 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] PERCENT SIGN (PO) ÷ [0.3] × 1160 ÷ 0024 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) ÷ [999.0] DOLLAR SIGN (PR) ÷ [0.3] × 1160 × 0020 ÷ 0024 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [7.01] SPACE (SP) ÷ [18.0] DOLLAR SIGN (PR) ÷ [0.3] @@ -4538,13 +4538,13 @@ × 0024 × 0020 ÷ 00A0 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] NO-BREAK SPACE (GL) ÷ [0.3] × 0024 × 0308 × 00A0 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [12.2] NO-BREAK SPACE (GL) ÷ [0.3] × 0024 × 0308 × 0020 ÷ 00A0 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] NO-BREAK SPACE (GL) ÷ [0.3] -× 0024 × AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL SYLLABLE GA (H2) ÷ [0.3] +× 0024 × AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL SYLLABLE GA (H2) ÷ [0.3] × 0024 × 0020 ÷ AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HANGUL SYLLABLE GA (H2) ÷ [0.3] -× 0024 × 0308 × AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.03] HANGUL SYLLABLE GA (H2) ÷ [0.3] +× 0024 × 0308 × AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] HANGUL 
SYLLABLE GA (H2) ÷ [0.3] × 0024 × 0308 × 0020 ÷ AC00 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] HANGUL SYLLABLE GA (H2) ÷ [0.3] -× 0024 × AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL SYLLABLE GAG (H3) ÷ [0.3] +× 0024 × AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL SYLLABLE GAG (H3) ÷ [0.3] × 0024 × 0020 ÷ AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HANGUL SYLLABLE GAG (H3) ÷ [0.3] -× 0024 × 0308 × AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.03] HANGUL SYLLABLE GAG (H3) ÷ [0.3] +× 0024 × 0308 × AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] HANGUL SYLLABLE GAG (H3) ÷ [0.3] × 0024 × 0308 × 0020 ÷ AC01 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] HANGUL SYLLABLE GAG (H3) ÷ [0.3] × 0024 × 05D0 ÷ # × [0.3] DOLLAR SIGN (PR) × [24.02] HEBREW LETTER ALEF (HL) ÷ [0.3] × 0024 × 0020 ÷ 05D0 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HEBREW LETTER ALEF (HL) ÷ [0.3] @@ -4566,17 +4566,17 @@ × 0024 × 0020 × 002C ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) × [13.02] COMMA (IS) ÷ [0.3] × 0024 × 0308 × 002C ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [13.03] COMMA (IS) ÷ [0.3] × 0024 × 0308 × 0020 × 002C ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) × [13.02] COMMA (IS) ÷ [0.3] -× 0024 × 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL CHOSEONG KIYEOK (JL) ÷ [0.3] +× 0024 × 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL CHOSEONG KIYEOK (JL) ÷ [0.3] × 0024 × 0020 ÷ 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HANGUL CHOSEONG KIYEOK (JL) ÷ [0.3] -× 0024 × 0308 × 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.03] HANGUL CHOSEONG KIYEOK (JL) ÷ [0.3] +× 0024 × 0308 × 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] HANGUL 
CHOSEONG KIYEOK (JL) ÷ [0.3] × 0024 × 0308 × 0020 ÷ 1100 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] HANGUL CHOSEONG KIYEOK (JL) ÷ [0.3] -× 0024 × 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] +× 0024 × 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] × 0024 × 0020 ÷ 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] -× 0024 × 0308 × 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.03] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] +× 0024 × 0308 × 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] × 0024 × 0308 × 0020 ÷ 11A8 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] -× 0024 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] +× 0024 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] × 0024 × 0020 ÷ 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) ÷ [18.0] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] -× 0024 × 0308 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.03] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] +× 0024 × 0308 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [27.02] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] × 0024 × 0308 × 0020 ÷ 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] × 0024 × 000A ÷ # × [0.3] DOLLAR SIGN (PR) × [6.0] (LF) ÷ [0.3] × 0024 × 0020 × 000A ÷ # × [0.3] DOLLAR SIGN (PR) × [7.01] SPACE (SP) × [6.0] (LF) ÷ [0.3] @@ -5838,9 +5838,9 @@ × 261D × 0020 ÷ 261D ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [7.01] SPACE (SP) ÷ [18.0] WHITE UP POINTING INDEX (EB) ÷ [0.3] × 261D × 0308 ÷ 261D ÷ # × [0.3] WHITE UP POINTING 
INDEX (EB) × [9.0] COMBINING DIAERESIS (CM1_CM) ÷ [999.0] WHITE UP POINTING INDEX (EB) ÷ [0.3] × 261D × 0308 × 0020 ÷ 261D ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] WHITE UP POINTING INDEX (EB) ÷ [0.3] -× 261D × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [30.2] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] +× 261D × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [30.21] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] × 261D × 0020 ÷ 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [7.01] SPACE (SP) ÷ [18.0] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] -× 261D × 0308 × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [9.0] COMBINING DIAERESIS (CM1_CM) × [30.2] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] +× 261D × 0308 × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [9.0] COMBINING DIAERESIS (CM1_CM) × [30.21] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] × 261D × 0308 × 0020 ÷ 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [9.0] COMBINING DIAERESIS (CM1_CM) × [7.01] SPACE (SP) ÷ [18.0] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] × 261D × 0029 ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [13.02] RIGHT PARENTHESIS (CP_CP30) ÷ [0.3] × 261D × 0020 × 0029 ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [7.01] SPACE (SP) × [13.02] RIGHT PARENTHESIS (CP_CP30) ÷ [0.3] @@ -7452,9 +7452,9 @@ × 1160 × 1160 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [26.02] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] × 11A8 × 11A8 ÷ # × [0.3] HANGUL JONGSEONG KIYEOK (JT) × [26.03] HANGUL JONGSEONG KIYEOK (JT) ÷ [0.3] × 1160 × 2024 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [22.0] ONE DOT LEADER (IN) ÷ [0.3] -× 1160 × 0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [27.02] PERCENT SIGN (PO) ÷ [0.3] -× 0024 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.03] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] -× 261D × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [30.2] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] +× 1160 × 
0025 ÷ # × [0.3] HANGUL JUNGSEONG FILLER (JV) × [27.01] PERCENT SIGN (PO) ÷ [0.3] +× 0024 × 1160 ÷ # × [0.3] DOLLAR SIGN (PR) × [27.02] HANGUL JUNGSEONG FILLER (JV) ÷ [0.3] +× 261D × 1F3FB ÷ # × [0.3] WHITE UP POINTING INDEX (EB) × [30.21] EMOJI MODIFIER FITZPATRICK TYPE-1-2 (EM) ÷ [0.3] × 0066 × 0069 × 006E × 0061 × 006C ÷ # × [0.3] LATIN SMALL LETTER F (AL) × [28.0] LATIN SMALL LETTER I (AL) × [28.0] LATIN SMALL LETTER N (AL) × [28.0] LATIN SMALL LETTER A (AL) × [28.0] LATIN SMALL LETTER L (AL) ÷ [0.3] × 0063 × 0061 × 006E × 0027 × 0074 ÷ # × [0.3] LATIN SMALL LETTER C (AL) × [28.0] LATIN SMALL LETTER A (AL) × [28.0] LATIN SMALL LETTER N (AL) × [19.01] APOSTROPHE (QU) × [19.02] LATIN SMALL LETTER T (AL) ÷ [0.3] × 0063 × 0061 × 006E × 2019 × 0074 ÷ # × [0.3] LATIN SMALL LETTER C (AL) × [28.0] LATIN SMALL LETTER A (AL) × [28.0] LATIN SMALL LETTER N (AL) × [19.01] RIGHT SINGLE QUOTATION MARK (QU) × [19.02] LATIN SMALL LETTER T (AL) ÷ [0.3] @@ -7678,7 +7678,9 @@ × 1F1F7 × 1F1FA ÷ 1F1F8 × 1F1EA ÷ # × [0.3] REGIONAL INDICATOR SYMBOL LETTER R (RI) × [30.11] REGIONAL INDICATOR SYMBOL LETTER U (RI) ÷ [30.13] REGIONAL INDICATOR SYMBOL LETTER S (RI) × [30.11] REGIONAL INDICATOR SYMBOL LETTER E (RI) ÷ [0.3] × 1F1F7 × 1F1FA × 200B ÷ 1F1F8 × 1F1EA ÷ # × [0.3] REGIONAL INDICATOR SYMBOL LETTER R (RI) × [30.11] REGIONAL INDICATOR SYMBOL LETTER U (RI) × [7.02] ZERO WIDTH SPACE (ZW) ÷ [8.0] REGIONAL INDICATOR SYMBOL LETTER S (RI) × [30.12] REGIONAL INDICATOR SYMBOL LETTER E (RI) ÷ [0.3] × 05D0 × 002D × 05D0 ÷ # × [0.3] HEBREW LETTER ALEF (HL) × [21.02] HYPHEN-MINUS (HY) × [21.1] HEBREW LETTER ALEF (HL) ÷ [0.3] +× 1F02C × 1F3FF ÷ # × [0.3] (Other) × [30.22] EMOJI MODIFIER FITZPATRICK TYPE-6 (EM) ÷ [0.3] +× 00A9 ÷ 1F3FF ÷ # × [0.3] COPYRIGHT SIGN (AL) ÷ [999.0] EMOJI MODIFIER FITZPATRICK TYPE-6 (EM) ÷ [0.3] # -# Lines: 7652 +# Lines: 7654 # # EOF diff --git a/lib/unicore/auxiliary/SBTest.txt b/lib/unicore/auxiliary/SBTest.txt index 5ae1f88110..61ea42cf1a 100644 --- 
a/lib/unicore/auxiliary/SBTest.txt +++ b/lib/unicore/auxiliary/SBTest.txt @@ -1,6 +1,6 @@ -# SentenceBreakTest-13.0.0.txt -# Date: 2019-11-20, 22:27:22 GMT -# © 2019 Unicode®, Inc. +# SentenceBreakTest-14.0.0.txt +# Date: 2021-03-08, 06:22:40 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/auxiliary/SentenceBreakProperty.txt b/lib/unicore/auxiliary/SentenceBreakProperty.txt index 432385b269..4b12b85492 100644 --- a/lib/unicore/auxiliary/SentenceBreakProperty.txt +++ b/lib/unicore/auxiliary/SentenceBreakProperty.txt @@ -1,6 +1,6 @@ -# SentenceBreakProperty-13.0.0.txt -# Date: 2019-11-27, 03:13:39 GMT -# © 2019 Unicode®, Inc. +# SentenceBreakProperty-14.0.0.txt +# Date: 2021-08-12, 23:13:21 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -55,7 +55,8 @@ 0825..0827 ; Extend # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; Extend # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; Extend # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; Extend # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; Extend # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; Extend # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; Extend # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; Extend # Mc DEVANAGARI SIGN VISARGA 093A ; Extend # Mn DEVANAGARI VOWEL SIGN OE @@ -124,6 +125,7 @@ 0C00 ; Extend # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C01..0C03 ; Extend # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA 0C04 ; Extend # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; Extend # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; Extend # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; Extend # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR 0C46..0C48 ; Extend # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI @@ -202,7 +204,9 @@ 109D ; Extend # Mn MYANMAR VOWEL SIGN AITON AI 135D..135F ; Extend # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; Extend # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; Extend # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; Extend # Mc TAGALOG SIGN PAMUDPOD +1732..1733 ; Extend # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; Extend # Mc HANUNOO SIGN PAMUDPOD 1752..1753 ; Extend # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; Extend # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; Extend # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -214,6 +218,7 @@ 17C9..17D3 ; Extend # Mn [11] KHMER SIGN 
MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; Extend # Mn KHMER SIGN ATTHACAN 180B..180D ; Extend # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; Extend # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; Extend # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; Extend # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; Extend # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -241,7 +246,7 @@ 1A7F ; Extend # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; Extend # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; Extend # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; Extend # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Extend # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Extend # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; Extend # Mc BALINESE SIGN BISAH 1B34 ; Extend # Mn BALINESE SIGN REREKAN @@ -281,8 +286,7 @@ 1CF4 ; Extend # Mn VEDIC TONE CANDRA ABOVE 1CF7 ; Extend # Mc VEDIC SIGN ATIKRAMA 1CF8..1CF9 ; Extend # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; Extend # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Extend # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Extend # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200C..200D ; Extend # Cf [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER 20D0..20DC ; Extend # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; Extend # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH @@ -368,16 +372,20 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 10D24..10D27 ; Extend # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 
10EAB..10EAC ; Extend # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; Extend # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Extend # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11000 ; Extend # Mc BRAHMI SIGN CANDRABINDU 11001 ; Extend # Mn BRAHMI SIGN ANUSVARA 11002 ; Extend # Mc BRAHMI SIGN VISARGA 11038..11046 ; Extend # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; Extend # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Extend # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; Extend # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 11082 ; Extend # Mc KAITHI SIGN VISARGA 110B0..110B2 ; Extend # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; Extend # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; Extend # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU 110B9..110BA ; Extend # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Extend # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; Extend # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Extend # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112C ; Extend # Mc CHAKMA VOWEL SIGN E @@ -516,6 +524,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 16FE4 ; Extend # Mn KHITAN SMALL SCRIPT FILLER 16FF0..16FF1 ; Extend # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 1BC9D..1BC9E ; Extend # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; Extend # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Extend # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D166 ; Extend # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D167..1D169 ; Extend # Mn [3] MUSICAL SYMBOL 
COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; Extend # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 @@ -535,13 +545,14 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1E023..1E024 ; Extend # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Extend # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; Extend # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; Extend # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; Extend # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Extend # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; Extend # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2395 +# Total code points: 2508 # ================================================ @@ -558,6 +569,7 @@ E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 061C ; Format # Cf ARABIC LETTER MARK 06DD ; Format # Cf ARABIC END OF AYAH 070F ; Format # Cf SYRIAC ABBREVIATION MARK +0890..0891 ; Format # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Format # Cf ARABIC DISPUTED END OF AYAH 180E ; Format # Cf MONGOLIAN VOWEL SEPARATOR 200B ; Format # Cf ZERO WIDTH SPACE @@ -574,7 +586,7 @@ FFF9..FFFB ; Format # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANN 1D173..1D17A ; Format # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE E0001 ; Format # Cf LANGUAGE TAG -# Total code points: 63 +# Total code points: 65 # ================================================ @@ -1035,7 +1047,7 @@ E0001 ; Format # Cf LANGUAGE TAG 2170..217F ; Lower # Nl [16] SMALL ROMAN NUMERAL ONE..SMALL ROMAN NUMERAL ONE THOUSAND 2184 ; Lower # L& LATIN SMALL LETTER 
REVERSED C 24D0..24E9 ; Lower # So [26] CIRCLED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C30..2C5E ; Lower # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C30..2C5F ; Lower # L& [48] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C61 ; Lower # L& LATIN SMALL LETTER L WITH DOUBLE BAR 2C65..2C66 ; Lower # L& [2] LATIN SMALL LETTER A WITH STROKE..LATIN SMALL LETTER T WITH DIAGONAL STROKE 2C68 ; Lower # L& LATIN SMALL LETTER H WITH DESCENDER @@ -1207,9 +1219,15 @@ A7B9 ; Lower # L& LATIN SMALL LETTER U WITH STROKE A7BB ; Lower # L& LATIN SMALL LETTER GLOTTAL A A7BD ; Lower # L& LATIN SMALL LETTER GLOTTAL I A7BF ; Lower # L& LATIN SMALL LETTER GLOTTAL U +A7C1 ; Lower # L& LATIN SMALL LETTER OLD POLISH O A7C3 ; Lower # L& LATIN SMALL LETTER ANGLICANA W A7C8 ; Lower # L& LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY A7CA ; Lower # L& LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D1 ; Lower # L& LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Lower # L& LATIN SMALL LETTER DOUBLE THORN +A7D5 ; Lower # L& LATIN SMALL LETTER DOUBLE WYNN +A7D7 ; Lower # L& LATIN SMALL LETTER MIDDLE SCOTS S +A7D9 ; Lower # L& LATIN SMALL LETTER SIGMOID S A7F6 ; Lower # L& LATIN SMALL LETTER REVERSED HALF H A7F8..A7F9 ; Lower # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE A7FA ; Lower # L& LATIN LETTER SMALL CAPITAL TURNED M @@ -1222,6 +1240,14 @@ FB13..FB17 ; Lower # L& [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN SMALL FF41..FF5A ; Lower # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z 10428..1044F ; Lower # L& [40] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER EW 104D8..104FB ; Lower # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10597..105A1 ; Lower # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Lower # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Lower # L& [7] VITHKUQI SMALL LETTER 
SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Lower # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE +10780 ; Lower # Lm MODIFIER LETTER SMALL CAPITAL AA +10783..10785 ; Lower # Lm [3] MODIFIER LETTER SMALL AE..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Lower # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Lower # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10CC0..10CF2 ; Lower # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118C0..118DF ; Lower # L& [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Lower # L& [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y @@ -1253,9 +1279,11 @@ FF41..FF5A ; Lower # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 1D7AA..1D7C2 ; Lower # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7C9 ; Lower # L& [6] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC PI SYMBOL 1D7CB ; Lower # L& MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; Lower # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0B..1DF1E ; Lower # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E922..1E943 ; Lower # L& [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2297 +# Total code points: 2424 # ================================================ @@ -1693,7 +1721,7 @@ FF41..FF5A ; Lower # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN 2160..216F ; Upper # Nl [16] ROMAN NUMERAL ONE..ROMAN NUMERAL ONE THOUSAND 2183 ; Upper # L& ROMAN NUMERAL REVERSED ONE HUNDRED 24B6..24CF ; Upper # So [26] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN CAPITAL LETTER Z -2C00..2C2E ; Upper # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C00..2C2F ; Upper # L& [48] 
GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; Upper # L& LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62..2C64 ; Upper # L& [3] LATIN CAPITAL LETTER L WITH MIDDLE TILDE..LATIN CAPITAL LETTER R WITH TAIL 2C67 ; Upper # L& LATIN CAPITAL LETTER H WITH DESCENDER @@ -1858,13 +1886,21 @@ A7B8 ; Upper # L& LATIN CAPITAL LETTER U WITH STROKE A7BA ; Upper # L& LATIN CAPITAL LETTER GLOTTAL A A7BC ; Upper # L& LATIN CAPITAL LETTER GLOTTAL I A7BE ; Upper # L& LATIN CAPITAL LETTER GLOTTAL U +A7C0 ; Upper # L& LATIN CAPITAL LETTER OLD POLISH O A7C2 ; Upper # L& LATIN CAPITAL LETTER ANGLICANA W A7C4..A7C7 ; Upper # L& [4] LATIN CAPITAL LETTER C WITH PALATAL HOOK..LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; Upper # L& LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; Upper # L& LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; Upper # L& LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; Upper # L& LATIN CAPITAL LETTER SIGMOID S A7F5 ; Upper # L& LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Upper # L& [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; Upper # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Upper # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Upper # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Upper # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Upper # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 10C80..10CB2 ; Upper # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Upper # L& [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Upper # L& [32] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y @@ -1904,7 +1940,7 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER 
A..FULLWIDTH LAT 1F150..1F169 ; Upper # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; Upper # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 1896 +# Total code points: 1936 # ================================================ @@ -1943,8 +1979,10 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 0828 ; OLetter # Lm SAMARITAN MODIFIER LETTER I 0840..0858 ; OLetter # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; OLetter # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; OLetter # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; OLetter # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; OLetter # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; OLetter # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +08A0..08C8 ; OLetter # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; OLetter # Lm ARABIC SMALL FARSI YEH 0904..0939 ; OLetter # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; OLetter # Lo DEVANAGARI SIGN AVAGRAHA 0950 ; OLetter # Lo DEVANAGARI OM @@ -2010,6 +2048,7 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 0C2A..0C39 ; OLetter # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; OLetter # Lo TELUGU SIGN AVAGRAHA 0C58..0C5A ; OLetter # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; OLetter # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; OLetter # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C80 ; OLetter # Lo KANNADA SIGN SPACING CANDRABINDU 0C85..0C8C ; OLetter # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L @@ -2018,7 +2057,7 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 
0CAA..0CB3 ; OLetter # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; OLetter # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; OLetter # Lo KANNADA SIGN AVAGRAHA -0CDE ; OLetter # Lo KANNADA LETTER FA +0CDD..0CDE ; OLetter # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; OLetter # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; OLetter # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; OLetter # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -2088,9 +2127,8 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 16A0..16EA ; OLetter # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; OLetter # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; OLetter # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; OLetter # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; OLetter # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; OLetter # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; OLetter # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; OLetter # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; OLetter # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; OLetter # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; OLetter # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -2113,7 +2151,7 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 1A20..1A54 ; OLetter # Lo [53] TAI THAM LETTER HIGH KA..TAI THAM LETTER GREAT SA 1AA7 ; OLetter # Lm TAI THAM SIGN MAI YAMOK 1B05..1B33 ; OLetter # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; OLetter # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; OLetter # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B83..1BA0 ; OLetter # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BAE..1BAF ; OLetter # Lo [2] 
SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBA..1BE5 ; OLetter # Lo [44] SUNDANESE AVAGRAHA..BATAK LETTER U @@ -2161,8 +2199,7 @@ FF21..FF3A ; Upper # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LAT 31A0..31BF ; OLetter # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; OLetter # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; OLetter # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; OLetter # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; OLetter # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; OLetter # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; OLetter # Lm YI SYLLABLE WU A016..A48C ; OLetter # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; OLetter # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -2178,6 +2215,7 @@ A6E6..A6EF ; OLetter # Nl [10] BAMUM LETTER MO..BAMUM LETTER KOGHOM A717..A71F ; OLetter # Lm [9] MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOW INVERTED EXCLAMATION MARK A788 ; OLetter # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A78F ; OLetter # Lo LATIN LETTER SINOLOGICAL DOT +A7F2..A7F4 ; OLetter # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F7 ; OLetter # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7FB..A801 ; OLetter # Lo [7] LATIN EPIGRAPHIC LETTER REVERSED F..SYLOTI NAGRI LETTER I A803..A805 ; OLetter # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O @@ -2275,6 +2313,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 10600..10736 ; OLetter # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; OLetter # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; OLetter # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10781..10782 ; OLetter # Lm [2] MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON..MODIFIER LETTER SUPERSCRIPT HALF TRIANGULAR COLON 10800..10805 ; OLetter # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; OLetter # Lo CYPRIOT 
SYLLABLE JO 1080A..10835 ; OLetter # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -2308,9 +2347,12 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 10F00..10F1C ; OLetter # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; OLetter # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; OLetter # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; OLetter # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; OLetter # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; OLetter # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; OLetter # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA +11071..11072 ; OLetter # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; OLetter # Lo BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; OLetter # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110D0..110E8 ; OLetter # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11103..11126 ; OLetter # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -2352,6 +2394,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 11680..116AA ; OLetter # Lo [43] TAKRI LETTER A..TAKRI LETTER RRA 116B8 ; OLetter # Lo TAKRI LETTER ARCHAIC KHA 11700..1171A ; OLetter # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; OLetter # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; OLetter # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 118FF..11906 ; OLetter # Lo [8] WARANG CITI OM..DIVES AKURU LETTER E 11909 ; OLetter # Lo DIVES AKURU LETTER O @@ -2370,7 +2413,7 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 11A50 ; OLetter # Lo SOYOMBO LETTER A 11A5C..11A89 ; OLetter # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; OLetter # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; OLetter # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL 
+11AB0..11AF8 ; OLetter # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; OLetter # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; OLetter # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; OLetter # Lo BHAIKSUKI SIGN AVAGRAHA @@ -2388,10 +2431,12 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 12000..12399 ; OLetter # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; OLetter # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; OLetter # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; OLetter # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; OLetter # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; OLetter # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; OLetter # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; OLetter # Lo [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; OLetter # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; OLetter # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; OLetter # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B40..16B43 ; OLetter # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM @@ -2405,7 +2450,10 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 17000..187F7 ; OLetter # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; OLetter # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; OLetter # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; OLetter # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; OLetter # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; OLetter # Lm [7] KATAKANA LETTER 
MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; OLetter # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; OLetter # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; OLetter # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; OLetter # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; OLetter # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -2413,10 +2461,16 @@ FFDA..FFDC ; OLetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1BC70..1BC7C ; OLetter # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK 1BC80..1BC88 ; OLetter # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; OLetter # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW +1DF0A ; OLetter # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1E100..1E12C ; OLetter # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; OLetter # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; OLetter # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; OLetter # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; OLetter # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; OLetter # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; OLetter # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; OLetter # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; OLetter # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; OLetter # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E94B ; OLetter # Lm ADLAM NASALIZATION MARK 1EE00..1EE03 ; OLetter # Lo [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL @@ -2452,15 +2506,15 @@ FFDA..FFDC ; OLetter # Lo [3] 
HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1EEA1..1EEA3 ; OLetter # Lo [3] ARABIC MATHEMATICAL DOUBLE-STRUCK BEH..ARABIC MATHEMATICAL DOUBLE-STRUCK DAL 1EEA5..1EEA9 ; OLetter # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 1EEAB..1EEBB ; OLetter # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN -20000..2A6DD ; OLetter # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; OLetter # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; OLetter # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; OLetter # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; OLetter # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; OLetter # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; OLetter # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; OLetter # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; OLetter # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code points: 127413 +# Total code points: 127761 # ================================================ @@ -2520,6 +2574,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 11D50..11D59 ; Numeric # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11DA0..11DA9 ; Numeric # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE 16A60..16A69 ; Numeric # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16AC0..16AC9 ; Numeric # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Numeric # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 1D7CE..1D7FF ; Numeric # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Numeric # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG 
DIGIT NINE @@ -2527,7 +2582,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Numeric # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Numeric # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 652 +# Total code points: 662 # ================================================ @@ -2543,7 +2598,7 @@ FF0E ; ATerm # Po FULLWIDTH FULL STOP 0021 ; STerm # Po EXCLAMATION MARK 003F ; STerm # Po QUESTION MARK 0589 ; STerm # Po ARMENIAN FULL STOP -061E..061F ; STerm # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; STerm # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 06D4 ; STerm # Po ARABIC FULL STOP 0700..0702 ; STerm # Po [3] SYRIAC END OF PARAGRAPH..SYRIAC SUBLINEAR FULL STOP 07F9 ; STerm # Po NKO EXCLAMATION MARK @@ -2562,12 +2617,14 @@ FF0E ; ATerm # Po FULLWIDTH FULL STOP 1AA8..1AAB ; STerm # Po [4] TAI THAM SIGN KAAN..TAI THAM SIGN SATKAANKUU 1B5A..1B5B ; STerm # Po [2] BALINESE PANTI..BALINESE PAMADA 1B5E..1B5F ; STerm # Po [2] BALINESE CARIK SIKI..BALINESE CARIK PAREREN +1B7D..1B7E ; STerm # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1C3B..1C3C ; STerm # Po [2] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION NYET THYOOM TA-ROL 1C7E..1C7F ; STerm # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD 203C..203D ; STerm # Po [2] DOUBLE EXCLAMATION MARK..INTERROBANG 2047..2049 ; STerm # Po [3] DOUBLE QUESTION MARK..EXCLAMATION QUESTION MARK 2E2E ; STerm # Po REVERSED QUESTION MARK 2E3C ; STerm # Po STENOGRAPHIC FULL STOP +2E53..2E54 ; STerm # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK 3002 ; STerm # Po IDEOGRAPHIC FULL STOP A4FF ; STerm # Po LISU PUNCTUATION FULL STOP A60E..A60F ; STerm # Po [2] VAI FULL STOP..VAI QUESTION MARK @@ -2586,6 +2643,7 @@ FF1F ; STerm # Po FULLWIDTH QUESTION MARK FF61 ; STerm # Po HALFWIDTH IDEOGRAPHIC FULL STOP 10A56..10A57 ; STerm # Po [2] KHAROSHTHI PUNCTUATION DANDA..KHAROSHTHI 
PUNCTUATION DOUBLE DANDA 10F55..10F59 ; STerm # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F86..10F89 ; STerm # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 11047..11048 ; STerm # Po [2] BRAHMI DANDA..BRAHMI DOUBLE DANDA 110BE..110C1 ; STerm # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA 11141..11143 ; STerm # Po [3] CHAKMA DANDA..CHAKMA QUESTION MARK @@ -2614,7 +2672,7 @@ FF61 ; STerm # Po HALFWIDTH IDEOGRAPHIC FULL STOP 1BC9F ; STerm # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA88 ; STerm # Po SIGNWRITING FULL STOP -# Total code points: 140 +# Total code points: 149 # ================================================ @@ -2734,6 +2792,14 @@ FF61 ; STerm # Po HALFWIDTH IDEOGRAPHIC FULL STOP 2E28 ; Close # Ps LEFT DOUBLE PARENTHESIS 2E29 ; Close # Pe RIGHT DOUBLE PARENTHESIS 2E42 ; Close # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK +2E55 ; Close # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; Close # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; Close # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; Close # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; Close # Ps TOP HALF LEFT PARENTHESIS +2E5A ; Close # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; Close # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; Close # Pe BOTTOM HALF RIGHT PARENTHESIS 3008 ; Close # Ps LEFT ANGLE BRACKET 3009 ; Close # Pe RIGHT ANGLE BRACKET 300A ; Close # Ps LEFT DOUBLE ANGLE BRACKET @@ -2794,7 +2860,7 @@ FF62 ; Close # Ps HALFWIDTH LEFT CORNER BRACKET FF63 ; Close # Pe HALFWIDTH RIGHT CORNER BRACKET 1F676..1F678 ; Close # So [3] SANS-SERIF HEAVY DOUBLE TURNED COMMA QUOTATION MARK ORNAMENT..SANS-SERIF HEAVY LOW DOUBLE COMMA QUOTATION MARK ORNAMENT -# Total code points: 187 +# Total code points: 195 # ================================================ diff --git a/lib/unicore/auxiliary/WBTest.txt b/lib/unicore/auxiliary/WBTest.txt index 3e85759b85..1d1435bfc7 100644 --- a/lib/unicore/auxiliary/WBTest.txt +++ 
b/lib/unicore/auxiliary/WBTest.txt @@ -1,6 +1,6 @@ -# WordBreakTest-13.0.0.txt -# Date: 2019-11-20, 22:27:23 GMT -# © 2019 Unicode®, Inc. +# WordBreakTest-14.0.0.txt +# Date: 2021-03-08, 06:22:40 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # diff --git a/lib/unicore/auxiliary/WordBreakProperty.txt b/lib/unicore/auxiliary/WordBreakProperty.txt index 36d1438c26..73cd069dcb 100644 --- a/lib/unicore/auxiliary/WordBreakProperty.txt +++ b/lib/unicore/auxiliary/WordBreakProperty.txt @@ -1,6 +1,6 @@ -# WordBreakProperty-13.0.0.txt -# Date: 2020-01-22, 00:07:44 GMT -# © 2020 Unicode®, Inc. +# WordBreakProperty-14.0.0.txt +# Date: 2021-07-10, 00:35:32 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -91,7 +91,8 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 0825..0827 ; Extend # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; Extend # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; Extend # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; Extend # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; Extend # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; Extend # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; Extend # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; Extend # Mc DEVANAGARI SIGN VISARGA 093A ; Extend # Mn DEVANAGARI VOWEL SIGN OE @@ -160,6 +161,7 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 0C00 ; Extend # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C01..0C03 ; Extend # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN 
VISARGA 0C04 ; Extend # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; Extend # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; Extend # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; Extend # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR 0C46..0C48 ; Extend # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI @@ -238,7 +240,9 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 109D ; Extend # Mn MYANMAR VOWEL SIGN AITON AI 135D..135F ; Extend # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; Extend # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; Extend # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; Extend # Mc TAGALOG SIGN PAMUDPOD +1732..1733 ; Extend # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; Extend # Mc HANUNOO SIGN PAMUDPOD 1752..1753 ; Extend # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; Extend # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; Extend # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -250,6 +254,7 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 17C9..17D3 ; Extend # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; Extend # Mn KHMER SIGN ATTHACAN 180B..180D ; Extend # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; Extend # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; Extend # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; Extend # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; Extend # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -277,7 +282,7 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 1A7F ; Extend # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; Extend # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; Extend # Me COMBINING PARENTHESES 
OVERLAY -1ABF..1AC0 ; Extend # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Extend # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Extend # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; Extend # Mc BALINESE SIGN BISAH 1B34 ; Extend # Mn BALINESE SIGN REREKAN @@ -317,8 +322,7 @@ FB46..FB4F ; Hebrew_Letter # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW 1CF4 ; Extend # Mn VEDIC TONE CANDRA ABOVE 1CF7 ; Extend # Mc VEDIC SIGN ATIKRAMA 1CF8..1CF9 ; Extend # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; Extend # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Extend # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Extend # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200C ; Extend # Cf ZERO WIDTH NON-JOINER 20D0..20DC ; Extend # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; Extend # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH @@ -404,16 +408,20 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 10D24..10D27 ; Extend # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; Extend # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; Extend # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Extend # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11000 ; Extend # Mc BRAHMI SIGN CANDRABINDU 11001 ; Extend # Mn BRAHMI SIGN ANUSVARA 11002 ; Extend # Mc BRAHMI SIGN VISARGA 11038..11046 ; Extend # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; Extend # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Extend # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 
1107F..11081 ; Extend # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 11082 ; Extend # Mc KAITHI SIGN VISARGA 110B0..110B2 ; Extend # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; Extend # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; Extend # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU 110B9..110BA ; Extend # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Extend # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; Extend # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Extend # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112C ; Extend # Mc CHAKMA VOWEL SIGN E @@ -552,6 +560,8 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 16FE4 ; Extend # Mn KHITAN SMALL SCRIPT FILLER 16FF0..16FF1 ; Extend # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 1BC9D..1BC9E ; Extend # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; Extend # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Extend # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D166 ; Extend # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D167..1D169 ; Extend # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; Extend # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 @@ -571,6 +581,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT 1E023..1E024 ; Extend # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Extend # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; Extend # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; Extend # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; Extend # Mn [4] WANCHO TONE 
TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Extend # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; Extend # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA @@ -578,7 +589,7 @@ FF9E..FF9F ; Extend # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDT E0020..E007F ; Extend # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2399 +# Total code points: 2512 # ================================================ @@ -593,6 +604,7 @@ E0100..E01EF ; Extend # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 061C ; Format # Cf ARABIC LETTER MARK 06DD ; Format # Cf ARABIC END OF AYAH 070F ; Format # Cf SYRIAC ABBREVIATION MARK +0890..0891 ; Format # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Format # Cf ARABIC DISPUTED END OF AYAH 180E ; Format # Cf MONGOLIAN VOWEL SEPARATOR 200E..200F ; Format # Cf [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK @@ -608,7 +620,7 @@ FFF9..FFFB ; Format # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANN 1D173..1D17A ; Format # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE E0001 ; Format # Cf LANGUAGE TAG -# Total code points: 62 +# Total code points: 64 # ================================================ @@ -624,10 +636,14 @@ E0001 ; Format # Cf LANGUAGE TAG FF66..FF6F ; Katakana # Lo [10] HALFWIDTH KATAKANA LETTER WO..HALFWIDTH KATAKANA LETTER SMALL TU FF70 ; Katakana # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAKANA LETTER N +1AFF0..1AFF3 ; Katakana # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Katakana # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Katakana # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1B000 ; Katakana # Lo KATAKANA LETTER ARCHAIC E +1B120..1B122 ; 
Katakana # Lo [3] KATAKANA LETTER ARCHAIC YI..KATAKANA LETTER ARCHAIC WU 1B164..1B167 ; Katakana # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N -# Total code points: 314 +# Total code points: 330 # ================================================ @@ -699,8 +715,10 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 0828 ; ALetter # Lm SAMARITAN MODIFIER LETTER I 0840..0858 ; ALetter # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; ALetter # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; ALetter # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; ALetter # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; ALetter # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; ALetter # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +08A0..08C8 ; ALetter # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; ALetter # Lm ARABIC SMALL FARSI YEH 0904..0939 ; ALetter # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; ALetter # Lo DEVANAGARI SIGN AVAGRAHA 0950 ; ALetter # Lo DEVANAGARI OM @@ -766,6 +784,7 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 0C2A..0C39 ; ALetter # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; ALetter # Lo TELUGU SIGN AVAGRAHA 0C58..0C5A ; ALetter # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; ALetter # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; ALetter # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C80 ; ALetter # Lo KANNADA SIGN SPACING CANDRABINDU 0C85..0C8C ; ALetter # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L @@ -774,7 +793,7 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 0CAA..0CB3 ; ALetter # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; ALetter # Lo 
[5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; ALetter # Lo KANNADA SIGN AVAGRAHA -0CDE ; ALetter # Lo KANNADA LETTER FA +0CDD..0CDE ; ALetter # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; ALetter # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; ALetter # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; ALetter # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -825,9 +844,8 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 16A0..16EA ; ALetter # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; ALetter # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; ALetter # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; ALetter # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; ALetter # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; ALetter # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; ALetter # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; ALetter # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; ALetter # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; ALetter # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; ALetter # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -841,7 +859,7 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 1900..191E ; ALetter # Lo [31] LIMBU VOWEL-CARRIER LETTER..LIMBU LETTER TRA 1A00..1A16 ; ALetter # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA 1B05..1B33 ; ALetter # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; ALetter # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; ALetter # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B83..1BA0 ; ALetter # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BAE..1BAF ; ALetter # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBA..1BE5 ; ALetter # Lo [44] 
SUNDANESE AVAGRAHA..BATAK LETTER U @@ -903,9 +921,7 @@ FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAK 2183..2184 ; ALetter # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C 2185..2188 ; ALetter # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND 24B6..24E9 ; ALetter # So [52] CIRCLED LATIN CAPITAL LETTER A..CIRCLED LATIN SMALL LETTER Z -2C00..2C2E ; ALetter # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; ALetter # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; ALetter # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; ALetter # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; ALetter # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; ALetter # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; ALetter # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -957,8 +973,11 @@ A788 ; ALetter # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; ALetter # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; ALetter # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; ALetter # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; ALetter # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; ALetter # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; ALetter # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; ALetter # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; ALetter # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; ALetter # L& [5] LATIN SMALL LETTER DOUBLE 
WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; ALetter # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; ALetter # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; ALetter # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; ALetter # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -1040,9 +1059,20 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 104D8..104FB ; ALetter # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA 10500..10527 ; ALetter # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; ALetter # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW +10570..1057A ; ALetter # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; ALetter # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; ALetter # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; ALetter # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; ALetter # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; ALetter # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; ALetter # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; ALetter # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; ALetter # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; ALetter # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; ALetter # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; ALetter # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; ALetter # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; ALetter # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; ALetter # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT 
SYLLABLE JA 10808 ; ALetter # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; ALetter # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1078,9 +1108,12 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 10F00..10F1C ; ALetter # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; ALetter # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; ALetter # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; ALetter # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; ALetter # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; ALetter # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; ALetter # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA +11071..11072 ; ALetter # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; ALetter # Lo BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; ALetter # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110D0..110E8 ; ALetter # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11103..11126 ; ALetter # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -1140,7 +1173,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 11A50 ; ALetter # Lo SOYOMBO LETTER A 11A5C..11A89 ; ALetter # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; ALetter # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; ALetter # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; ALetter # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; ALetter # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; ALetter # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; ALetter # Lo BHAIKSUKI SIGN AVAGRAHA @@ -1158,10 +1191,12 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 12000..12399 ; ALetter # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; ALetter 
# Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; ALetter # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; ALetter # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; ALetter # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; ALetter # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; ALetter # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; ALetter # Lo [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; ALetter # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; ALetter # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; ALetter # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B40..16B43 ; ALetter # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM @@ -1207,10 +1242,18 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1D78A..1D7A8 ; ALetter # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA 1D7AA..1D7C2 ; ALetter # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7CB ; ALetter # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; ALetter # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; ALetter # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; ALetter # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; ALetter # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; ALetter # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; ALetter # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; ALetter # Lo 
[30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; ALetter # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; ALetter # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; ALetter # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; ALetter # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; ALetter # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; ALetter # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E900..1E943 ; ALetter # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA 1E94B ; ALetter # Lm ADLAM NASALIZATION MARK @@ -1251,7 +1294,7 @@ FFDA..FFDC ; ALetter # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL 1F150..1F169 ; ALetter # So [26] NEGATIVE CIRCLED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F189 ; ALetter # So [26] NEGATIVE SQUARED LATIN CAPITAL LETTER A..NEGATIVE SQUARED LATIN CAPITAL LETTER Z -# Total code points: 28854 +# Total code points: 29336 # ================================================ @@ -1356,6 +1399,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 11D50..11D59 ; Numeric # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11DA0..11DA9 ; Numeric # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE 16A60..16A69 ; Numeric # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16AC0..16AC9 ; Numeric # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Numeric # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 1D7CE..1D7FF ; Numeric # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Numeric # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -1363,7 +1407,7 @@ FF10..FF19 ; Numeric # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Numeric # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Numeric # Nd [10] 
SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 651 +# Total code points: 661 # ================================================ diff --git a/lib/unicore/emoji/emoji.txt b/lib/unicore/emoji/emoji.txt index 5d7dc1b156..7806c7ab53 100644 --- a/lib/unicore/emoji/emoji.txt +++ b/lib/unicore/emoji/emoji.txt @@ -1,11 +1,11 @@ -# emoji-data.txt -# Date: 2020-01-28, 20:52:38 GMT -# © 2020 Unicode®, Inc. +# emoji-data-14.0.0.txt +# Date: 2021-08-26, 17:22:22 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # # Emoji Data for UTS #51 -# Version: 13.0 +# Used with Emoji Version 14.0 and subsequent minor revisions (if any) # # For documentation and usage, see http://www.unicode.org/reports/tr51 # @@ -22,7 +22,7 @@ # All omitted code points have Emoji=No # @missing: 0000..10FFFF ; Emoji ; No -0023 ; Emoji # E0.0 [1] (#️) number sign +0023 ; Emoji # E0.0 [1] (#️) hash sign 002A ; Emoji # E0.0 [1] (*️) asterisk 0030..0039 ; Emoji # E0.0 [10] (0️..9️) digit zero..digit nine 00A9 ; Emoji # E0.6 [1] (©️) copyright @@ -119,8 +119,8 @@ 2747 ; Emoji # E0.6 [1] (❇️) sparkle 274C ; Emoji # E0.6 [1] (❌) cross mark 274E ; Emoji # E0.6 [1] (❎) cross mark button -2753..2755 ; Emoji # E0.6 [3] (❓..❕) question mark..white exclamation mark -2757 ; Emoji # E0.6 [1] (❗) exclamation mark +2753..2755 ; Emoji # E0.6 [3] (❓..❕) red question mark..white exclamation mark +2757 ; Emoji # E0.6 [1] (❗) red exclamation mark 2763 ; Emoji # E1.0 [1] (❣️) heart exclamation 2764 ; Emoji # E0.6 [1] (❤️) red heart 2795..2797 ; Emoji # E0.6 [3] (➕..➗) plus..divide @@ -239,7 +239,7 @@ 1F509 ; Emoji # E1.0 [1] (🔉) speaker medium volume 1F50A..1F514 ; Emoji # E0.6 [11] (🔊..🔔) speaker high volume..bell 1F515 ; Emoji # E1.0 [1] (🔕) bell with slash -1F516..1F52B ; Emoji # E0.6 [22] (🔖..🔫) bookmark..pistol +1F516..1F52B ; Emoji # E0.6 [22] (🔖..🔫) 
bookmark..water pistol 1F52C..1F52D ; Emoji # E1.0 [2] (🔬..🔭) microscope..telescope 1F52E..1F53D ; Emoji # E0.6 [16] (🔮..🔽) crystal ball..downwards button 1F549..1F54A ; Emoji # E0.7 [2] (🕉️..🕊️) om..dove @@ -294,7 +294,7 @@ 1F62E..1F62F ; Emoji # E1.0 [2] (😮..😯) face with open mouth..hushed face 1F630..1F633 ; Emoji # E0.6 [4] (😰..😳) anxious face with sweat..flushed face 1F634 ; Emoji # E1.0 [1] (😴) sleeping face -1F635 ; Emoji # E0.6 [1] (😵) dizzy face +1F635 ; Emoji # E0.6 [1] (😵) face with crossed-out eyes 1F636 ; Emoji # E1.0 [1] (😶) face without mouth 1F637..1F640 ; Emoji # E0.6 [10] (😷..🙀) face with medical mask..weary cat 1F641..1F644 ; Emoji # E1.0 [4] (🙁..🙄) slightly frowning face..face with rolling eyes @@ -341,6 +341,7 @@ 1F6D1..1F6D2 ; Emoji # E3.0 [2] (🛑..🛒) stop sign..shopping cart 1F6D5 ; Emoji # E12.0 [1] (🛕) hindu temple 1F6D6..1F6D7 ; Emoji # E13.0 [2] (🛖..🛗) hut..elevator +1F6DD..1F6DF ; Emoji # E14.0 [3] (🛝..🛟) playground slide..ring buoy 1F6E0..1F6E5 ; Emoji # E0.7 [6] (🛠️..🛥️) hammer and wrench..motor boat 1F6E9 ; Emoji # E0.7 [1] (🛩️) small airplane 1F6EB..1F6EC ; Emoji # E1.0 [2] (🛫..🛬) airplane departure..airplane arrival @@ -352,6 +353,7 @@ 1F6FA ; Emoji # E12.0 [1] (🛺) auto rickshaw 1F6FB..1F6FC ; Emoji # E13.0 [2] (🛻..🛼) pickup truck..roller skate 1F7E0..1F7EB ; Emoji # E12.0 [12] (🟠..🟫) orange circle..brown square +1F7F0 ; Emoji # E14.0 [1] (🟰) heavy equals sign 1F90C ; Emoji # E13.0 [1] (🤌) pinched fingers 1F90D..1F90F ; Emoji # E12.0 [3] (🤍..🤏) white heart..pinching hand 1F910..1F918 ; Emoji # E1.0 [9] (🤐..🤘) zipper-mouth face..sign of the horns @@ -375,6 +377,7 @@ 1F972 ; Emoji # E13.0 [1] (🥲) smiling face with tear 1F973..1F976 ; Emoji # E11.0 [4] (🥳..🥶) partying face..cold face 1F977..1F978 ; Emoji # E13.0 [2] (🥷..🥸) ninja..disguised face +1F979 ; Emoji # E14.0 [1] (🥹) face holding back tears 1F97A ; Emoji # E11.0 [1] (🥺) pleading face 1F97B ; Emoji # E12.0 [1] (🥻) sari 1F97C..1F97F ; Emoji # E11.0 [4] (🥼..🥿) lab coat..flat shoe 
@@ -392,21 +395,29 @@ 1F9C1..1F9C2 ; Emoji # E11.0 [2] (🧁..🧂) cupcake..salt 1F9C3..1F9CA ; Emoji # E12.0 [8] (🧃..🧊) beverage box..ice 1F9CB ; Emoji # E13.0 [1] (🧋) bubble tea +1F9CC ; Emoji # E14.0 [1] (🧌) troll 1F9CD..1F9CF ; Emoji # E12.0 [3] (🧍..🧏) person standing..deaf person 1F9D0..1F9E6 ; Emoji # E5.0 [23] (🧐..🧦) face with monocle..socks 1F9E7..1F9FF ; Emoji # E11.0 [25] (🧧..🧿) red envelope..nazar amulet 1FA70..1FA73 ; Emoji # E12.0 [4] (🩰..🩳) ballet shoes..shorts 1FA74 ; Emoji # E13.0 [1] (🩴) thong sandal 1FA78..1FA7A ; Emoji # E12.0 [3] (🩸..🩺) drop of blood..stethoscope +1FA7B..1FA7C ; Emoji # E14.0 [2] (🩻..🩼) x-ray..crutch 1FA80..1FA82 ; Emoji # E12.0 [3] (🪀..🪂) yo-yo..parachute 1FA83..1FA86 ; Emoji # E13.0 [4] (🪃..🪆) boomerang..nesting dolls 1FA90..1FA95 ; Emoji # E12.0 [6] (🪐..🪕) ringed planet..banjo 1FA96..1FAA8 ; Emoji # E13.0 [19] (🪖..🪨) military helmet..rock +1FAA9..1FAAC ; Emoji # E14.0 [4] (🪩..🪬) mirror ball..hamsa 1FAB0..1FAB6 ; Emoji # E13.0 [7] (🪰..🪶) fly..feather +1FAB7..1FABA ; Emoji # E14.0 [4] (🪷..🪺) lotus..nest with eggs 1FAC0..1FAC2 ; Emoji # E13.0 [3] (🫀..🫂) anatomical heart..people hugging +1FAC3..1FAC5 ; Emoji # E14.0 [3] (🫃..🫅) pregnant man..person with crown 1FAD0..1FAD6 ; Emoji # E13.0 [7] (🫐..🫖) blueberries..teapot +1FAD7..1FAD9 ; Emoji # E14.0 [3] (🫗..🫙) pouring liquid..jar +1FAE0..1FAE7 ; Emoji # E14.0 [8] (🫠..🫧) melting face..bubbles +1FAF0..1FAF6 ; Emoji # E14.0 [7] (🫰..🫶) hand with index finger and thumb crossed..heart hands -# Total elements: 1367 +# Total elements: 1404 # ================================================ @@ -438,8 +449,8 @@ 2728 ; Emoji_Presentation # E0.6 [1] (✨) sparkles 274C ; Emoji_Presentation # E0.6 [1] (❌) cross mark 274E ; Emoji_Presentation # E0.6 [1] (❎) cross mark button -2753..2755 ; Emoji_Presentation # E0.6 [3] (❓..❕) question mark..white exclamation mark -2757 ; Emoji_Presentation # E0.6 [1] (❗) exclamation mark +2753..2755 ; Emoji_Presentation # E0.6 [3] (❓..❕) red question mark..white 
exclamation mark +2757 ; Emoji_Presentation # E0.6 [1] (❗) red exclamation mark 2795..2797 ; Emoji_Presentation # E0.6 [3] (➕..➗) plus..divide 27B0 ; Emoji_Presentation # E0.6 [1] (➰) curly loop 27BF ; Emoji_Presentation # E1.0 [1] (➿) double curly loop @@ -533,7 +544,7 @@ 1F509 ; Emoji_Presentation # E1.0 [1] (🔉) speaker medium volume 1F50A..1F514 ; Emoji_Presentation # E0.6 [11] (🔊..🔔) speaker high volume..bell 1F515 ; Emoji_Presentation # E1.0 [1] (🔕) bell with slash -1F516..1F52B ; Emoji_Presentation # E0.6 [22] (🔖..🔫) bookmark..pistol +1F516..1F52B ; Emoji_Presentation # E0.6 [22] (🔖..🔫) bookmark..water pistol 1F52C..1F52D ; Emoji_Presentation # E1.0 [2] (🔬..🔭) microscope..telescope 1F52E..1F53D ; Emoji_Presentation # E0.6 [16] (🔮..🔽) crystal ball..downwards button 1F54B..1F54E ; Emoji_Presentation # E1.0 [4] (🕋..🕎) kaaba..menorah @@ -569,7 +580,7 @@ 1F62E..1F62F ; Emoji_Presentation # E1.0 [2] (😮..😯) face with open mouth..hushed face 1F630..1F633 ; Emoji_Presentation # E0.6 [4] (😰..😳) anxious face with sweat..flushed face 1F634 ; Emoji_Presentation # E1.0 [1] (😴) sleeping face -1F635 ; Emoji_Presentation # E0.6 [1] (😵) dizzy face +1F635 ; Emoji_Presentation # E0.6 [1] (😵) face with crossed-out eyes 1F636 ; Emoji_Presentation # E1.0 [1] (😶) face without mouth 1F637..1F640 ; Emoji_Presentation # E0.6 [10] (😷..🙀) face with medical mask..weary cat 1F641..1F644 ; Emoji_Presentation # E1.0 [4] (🙁..🙄) slightly frowning face..face with rolling eyes @@ -614,6 +625,7 @@ 1F6D1..1F6D2 ; Emoji_Presentation # E3.0 [2] (🛑..🛒) stop sign..shopping cart 1F6D5 ; Emoji_Presentation # E12.0 [1] (🛕) hindu temple 1F6D6..1F6D7 ; Emoji_Presentation # E13.0 [2] (🛖..🛗) hut..elevator +1F6DD..1F6DF ; Emoji_Presentation # E14.0 [3] (🛝..🛟) playground slide..ring buoy 1F6EB..1F6EC ; Emoji_Presentation # E1.0 [2] (🛫..🛬) airplane departure..airplane arrival 1F6F4..1F6F6 ; Emoji_Presentation # E3.0 [3] (🛴..🛶) kick scooter..canoe 1F6F7..1F6F8 ; Emoji_Presentation # E5.0 [2] (🛷..🛸) sled..flying 
saucer @@ -621,6 +633,7 @@ 1F6FA ; Emoji_Presentation # E12.0 [1] (🛺) auto rickshaw 1F6FB..1F6FC ; Emoji_Presentation # E13.0 [2] (🛻..🛼) pickup truck..roller skate 1F7E0..1F7EB ; Emoji_Presentation # E12.0 [12] (🟠..🟫) orange circle..brown square +1F7F0 ; Emoji_Presentation # E14.0 [1] (🟰) heavy equals sign 1F90C ; Emoji_Presentation # E13.0 [1] (🤌) pinched fingers 1F90D..1F90F ; Emoji_Presentation # E12.0 [3] (🤍..🤏) white heart..pinching hand 1F910..1F918 ; Emoji_Presentation # E1.0 [9] (🤐..🤘) zipper-mouth face..sign of the horns @@ -644,6 +657,7 @@ 1F972 ; Emoji_Presentation # E13.0 [1] (🥲) smiling face with tear 1F973..1F976 ; Emoji_Presentation # E11.0 [4] (🥳..🥶) partying face..cold face 1F977..1F978 ; Emoji_Presentation # E13.0 [2] (🥷..🥸) ninja..disguised face +1F979 ; Emoji_Presentation # E14.0 [1] (🥹) face holding back tears 1F97A ; Emoji_Presentation # E11.0 [1] (🥺) pleading face 1F97B ; Emoji_Presentation # E12.0 [1] (🥻) sari 1F97C..1F97F ; Emoji_Presentation # E11.0 [4] (🥼..🥿) lab coat..flat shoe @@ -661,21 +675,29 @@ 1F9C1..1F9C2 ; Emoji_Presentation # E11.0 [2] (🧁..🧂) cupcake..salt 1F9C3..1F9CA ; Emoji_Presentation # E12.0 [8] (🧃..🧊) beverage box..ice 1F9CB ; Emoji_Presentation # E13.0 [1] (🧋) bubble tea +1F9CC ; Emoji_Presentation # E14.0 [1] (🧌) troll 1F9CD..1F9CF ; Emoji_Presentation # E12.0 [3] (🧍..🧏) person standing..deaf person 1F9D0..1F9E6 ; Emoji_Presentation # E5.0 [23] (🧐..🧦) face with monocle..socks 1F9E7..1F9FF ; Emoji_Presentation # E11.0 [25] (🧧..🧿) red envelope..nazar amulet 1FA70..1FA73 ; Emoji_Presentation # E12.0 [4] (🩰..🩳) ballet shoes..shorts 1FA74 ; Emoji_Presentation # E13.0 [1] (🩴) thong sandal 1FA78..1FA7A ; Emoji_Presentation # E12.0 [3] (🩸..🩺) drop of blood..stethoscope +1FA7B..1FA7C ; Emoji_Presentation # E14.0 [2] (🩻..🩼) x-ray..crutch 1FA80..1FA82 ; Emoji_Presentation # E12.0 [3] (🪀..🪂) yo-yo..parachute 1FA83..1FA86 ; Emoji_Presentation # E13.0 [4] (🪃..🪆) boomerang..nesting dolls 1FA90..1FA95 ; Emoji_Presentation # E12.0 [6] 
(🪐..🪕) ringed planet..banjo 1FA96..1FAA8 ; Emoji_Presentation # E13.0 [19] (🪖..🪨) military helmet..rock +1FAA9..1FAAC ; Emoji_Presentation # E14.0 [4] (🪩..🪬) mirror ball..hamsa 1FAB0..1FAB6 ; Emoji_Presentation # E13.0 [7] (🪰..🪶) fly..feather +1FAB7..1FABA ; Emoji_Presentation # E14.0 [4] (🪷..🪺) lotus..nest with eggs 1FAC0..1FAC2 ; Emoji_Presentation # E13.0 [3] (🫀..🫂) anatomical heart..people hugging +1FAC3..1FAC5 ; Emoji_Presentation # E14.0 [3] (🫃..🫅) pregnant man..person with crown 1FAD0..1FAD6 ; Emoji_Presentation # E13.0 [7] (🫐..🫖) blueberries..teapot +1FAD7..1FAD9 ; Emoji_Presentation # E14.0 [3] (🫗..🫙) pouring liquid..jar +1FAE0..1FAE7 ; Emoji_Presentation # E14.0 [8] (🫠..🫧) melting face..bubbles +1FAF0..1FAF6 ; Emoji_Presentation # E14.0 [7] (🫰..🫶) hand with index finger and thumb crossed..heart hands -# Total elements: 1148 +# Total elements: 1185 # ================================================ @@ -738,15 +760,17 @@ 1F9BB ; Emoji_Modifier_Base # E12.0 [1] (🦻) ear with hearing aid 1F9CD..1F9CF ; Emoji_Modifier_Base # E12.0 [3] (🧍..🧏) person standing..deaf person 1F9D1..1F9DD ; Emoji_Modifier_Base # E5.0 [13] (🧑..🧝) person..elf +1FAC3..1FAC5 ; Emoji_Modifier_Base # E14.0 [3] (🫃..🫅) pregnant man..person with crown +1FAF0..1FAF6 ; Emoji_Modifier_Base # E14.0 [7] (🫰..🫶) hand with index finger and thumb crossed..heart hands -# Total elements: 122 +# Total elements: 132 # ================================================ # All omitted code points have Emoji_Component=No # @missing: 0000..10FFFF ; Emoji_Component ; No -0023 ; Emoji_Component # E0.0 [1] (#️) number sign +0023 ; Emoji_Component # E0.0 [1] (#️) hash sign 002A ; Emoji_Component # E0.0 [1] (*️) asterisk 0030..0039 ; Emoji_Component # E0.0 [10] (0️..9️) digit zero..digit nine 200D ; Emoji_Component # E0.0 [1] (‍) zero width joiner @@ -902,8 +926,8 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 2747 ; Extended_Pictographic# E0.6 [1] (❇️) sparkle 274C ; Extended_Pictographic# E0.6 
[1] (❌) cross mark 274E ; Extended_Pictographic# E0.6 [1] (❎) cross mark button -2753..2755 ; Extended_Pictographic# E0.6 [3] (❓..❕) question mark..white exclamation mark -2757 ; Extended_Pictographic# E0.6 [1] (❗) exclamation mark +2753..2755 ; Extended_Pictographic# E0.6 [3] (❓..❕) red question mark..white exclamation mark +2757 ; Extended_Pictographic# E0.6 [1] (❗) red exclamation mark 2763 ; Extended_Pictographic# E1.0 [1] (❣️) heart exclamation 2764 ; Extended_Pictographic# E0.6 [1] (❤️) red heart 2765..2767 ; Extended_Pictographic# E0.0 [3] (❥..❧) ROTATED HEAVY BLACK HEART BULLET..ROTATED FLORAL HEART BULLET @@ -1041,7 +1065,7 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F509 ; Extended_Pictographic# E1.0 [1] (🔉) speaker medium volume 1F50A..1F514 ; Extended_Pictographic# E0.6 [11] (🔊..🔔) speaker high volume..bell 1F515 ; Extended_Pictographic# E1.0 [1] (🔕) bell with slash -1F516..1F52B ; Extended_Pictographic# E0.6 [22] (🔖..🔫) bookmark..pistol +1F516..1F52B ; Extended_Pictographic# E0.6 [22] (🔖..🔫) bookmark..water pistol 1F52C..1F52D ; Extended_Pictographic# E1.0 [2] (🔬..🔭) microscope..telescope 1F52E..1F53D ; Extended_Pictographic# E0.6 [16] (🔮..🔽) crystal ball..downwards button 1F546..1F548 ; Extended_Pictographic# E0.0 [3] (🕆..🕈) WHITE LATIN CROSS..CELTIC CROSS @@ -1117,7 +1141,7 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F62E..1F62F ; Extended_Pictographic# E1.0 [2] (😮..😯) face with open mouth..hushed face 1F630..1F633 ; Extended_Pictographic# E0.6 [4] (😰..😳) anxious face with sweat..flushed face 1F634 ; Extended_Pictographic# E1.0 [1] (😴) sleeping face -1F635 ; Extended_Pictographic# E0.6 [1] (😵) dizzy face +1F635 ; Extended_Pictographic# E0.6 [1] (😵) face with crossed-out eyes 1F636 ; Extended_Pictographic# E1.0 [1] (😶) face without mouth 1F637..1F640 ; Extended_Pictographic# E0.6 [10] (😷..🙀) face with medical mask..weary cat 1F641..1F644 ; Extended_Pictographic# E1.0 [4] (🙁..🙄) slightly frowning face..face 
with rolling eyes @@ -1166,7 +1190,8 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F6D3..1F6D4 ; Extended_Pictographic# E0.0 [2] (🛓..🛔) STUPA..PAGODA 1F6D5 ; Extended_Pictographic# E12.0 [1] (🛕) hindu temple 1F6D6..1F6D7 ; Extended_Pictographic# E13.0 [2] (🛖..🛗) hut..elevator -1F6D8..1F6DF ; Extended_Pictographic# E0.0 [8] (🛘..🛟) .. +1F6D8..1F6DC ; Extended_Pictographic# E0.0 [5] (🛘..🛜) .. +1F6DD..1F6DF ; Extended_Pictographic# E14.0 [3] (🛝..🛟) playground slide..ring buoy 1F6E0..1F6E5 ; Extended_Pictographic# E0.7 [6] (🛠️..🛥️) hammer and wrench..motor boat 1F6E6..1F6E8 ; Extended_Pictographic# E0.0 [3] (🛦..🛨) UP-POINTING MILITARY AIRPLANE..UP-POINTING SMALL AIRPLANE 1F6E9 ; Extended_Pictographic# E0.7 [1] (🛩️) small airplane @@ -1185,7 +1210,9 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F774..1F77F ; Extended_Pictographic# E0.0 [12] (🝴..🝿) .. 1F7D5..1F7DF ; Extended_Pictographic# E0.0 [11] (🟕..🟟) CIRCLED TRIANGLE.. 1F7E0..1F7EB ; Extended_Pictographic# E12.0 [12] (🟠..🟫) orange circle..brown square -1F7EC..1F7FF ; Extended_Pictographic# E0.0 [20] (🟬..🟿) .. +1F7EC..1F7EF ; Extended_Pictographic# E0.0 [4] (🟬..🟯) .. +1F7F0 ; Extended_Pictographic# E14.0 [1] (🟰) heavy equals sign +1F7F1..1F7FF ; Extended_Pictographic# E0.0 [15] (🟱..🟿) .. 1F80C..1F80F ; Extended_Pictographic# E0.0 [4] (🠌..🠏) .. 1F848..1F84F ; Extended_Pictographic# E0.0 [8] (🡈..🡏) .. 1F85A..1F85F ; Extended_Pictographic# E0.0 [6] (🡚..🡟) .. 
@@ -1214,7 +1241,7 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F972 ; Extended_Pictographic# E13.0 [1] (🥲) smiling face with tear 1F973..1F976 ; Extended_Pictographic# E11.0 [4] (🥳..🥶) partying face..cold face 1F977..1F978 ; Extended_Pictographic# E13.0 [2] (🥷..🥸) ninja..disguised face -1F979 ; Extended_Pictographic# E0.0 [1] (🥹) +1F979 ; Extended_Pictographic# E14.0 [1] (🥹) face holding back tears 1F97A ; Extended_Pictographic# E11.0 [1] (🥺) pleading face 1F97B ; Extended_Pictographic# E12.0 [1] (🥻) sari 1F97C..1F97F ; Extended_Pictographic# E11.0 [4] (🥼..🥿) lab coat..flat shoe @@ -1232,7 +1259,7 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1F9C1..1F9C2 ; Extended_Pictographic# E11.0 [2] (🧁..🧂) cupcake..salt 1F9C3..1F9CA ; Extended_Pictographic# E12.0 [8] (🧃..🧊) beverage box..ice 1F9CB ; Extended_Pictographic# E13.0 [1] (🧋) bubble tea -1F9CC ; Extended_Pictographic# E0.0 [1] (🧌) +1F9CC ; Extended_Pictographic# E14.0 [1] (🧌) troll 1F9CD..1F9CF ; Extended_Pictographic# E12.0 [3] (🧍..🧏) person standing..deaf person 1F9D0..1F9E6 ; Extended_Pictographic# E5.0 [23] (🧐..🧦) face with monocle..socks 1F9E7..1F9FF ; Extended_Pictographic# E11.0 [25] (🧧..🧿) red envelope..nazar amulet @@ -1241,19 +1268,28 @@ E0020..E007F ; Emoji_Component # E0.0 [96] (󠀠..󠁿) tag space..c 1FA74 ; Extended_Pictographic# E13.0 [1] (🩴) thong sandal 1FA75..1FA77 ; Extended_Pictographic# E0.0 [3] (🩵..🩷) .. 1FA78..1FA7A ; Extended_Pictographic# E12.0 [3] (🩸..🩺) drop of blood..stethoscope -1FA7B..1FA7F ; Extended_Pictographic# E0.0 [5] (🩻..🩿) .. +1FA7B..1FA7C ; Extended_Pictographic# E14.0 [2] (🩻..🩼) x-ray..crutch +1FA7D..1FA7F ; Extended_Pictographic# E0.0 [3] (🩽..🩿) .. 1FA80..1FA82 ; Extended_Pictographic# E12.0 [3] (🪀..🪂) yo-yo..parachute 1FA83..1FA86 ; Extended_Pictographic# E13.0 [4] (🪃..🪆) boomerang..nesting dolls 1FA87..1FA8F ; Extended_Pictographic# E0.0 [9] (🪇..🪏) .. 
1FA90..1FA95 ; Extended_Pictographic# E12.0 [6] (🪐..🪕) ringed planet..banjo 1FA96..1FAA8 ; Extended_Pictographic# E13.0 [19] (🪖..🪨) military helmet..rock -1FAA9..1FAAF ; Extended_Pictographic# E0.0 [7] (🪩..🪯) .. +1FAA9..1FAAC ; Extended_Pictographic# E14.0 [4] (🪩..🪬) mirror ball..hamsa +1FAAD..1FAAF ; Extended_Pictographic# E0.0 [3] (🪭..🪯) .. 1FAB0..1FAB6 ; Extended_Pictographic# E13.0 [7] (🪰..🪶) fly..feather -1FAB7..1FABF ; Extended_Pictographic# E0.0 [9] (🪷..🪿) .. +1FAB7..1FABA ; Extended_Pictographic# E14.0 [4] (🪷..🪺) lotus..nest with eggs +1FABB..1FABF ; Extended_Pictographic# E0.0 [5] (🪻..🪿) .. 1FAC0..1FAC2 ; Extended_Pictographic# E13.0 [3] (🫀..🫂) anatomical heart..people hugging -1FAC3..1FACF ; Extended_Pictographic# E0.0 [13] (🫃..🫏) .. +1FAC3..1FAC5 ; Extended_Pictographic# E14.0 [3] (🫃..🫅) pregnant man..person with crown +1FAC6..1FACF ; Extended_Pictographic# E0.0 [10] (🫆..🫏) .. 1FAD0..1FAD6 ; Extended_Pictographic# E13.0 [7] (🫐..🫖) blueberries..teapot -1FAD7..1FAFF ; Extended_Pictographic# E0.0 [41] (🫗..🫿) .. +1FAD7..1FAD9 ; Extended_Pictographic# E14.0 [3] (🫗..🫙) pouring liquid..jar +1FADA..1FADF ; Extended_Pictographic# E0.0 [6] (🫚..🫟) .. +1FAE0..1FAE7 ; Extended_Pictographic# E14.0 [8] (🫠..🫧) melting face..bubbles +1FAE8..1FAEF ; Extended_Pictographic# E0.0 [8] (🫨..🫯) .. +1FAF0..1FAF6 ; Extended_Pictographic# E14.0 [7] (🫰..🫶) hand with index finger and thumb crossed..heart hands +1FAF7..1FAFF ; Extended_Pictographic# E0.0 [9] (🫷..🫿) .. 1FC00..1FFFD ; Extended_Pictographic# E0.0[1022] (🰀..🿽) .. # Total elements: 3537 diff --git a/lib/unicore/extracted/DBidiClass.txt b/lib/unicore/extracted/DBidiClass.txt index 2454abd480..4012dc25da 100644 --- a/lib/unicore/extracted/DBidiClass.txt +++ b/lib/unicore/extracted/DBidiClass.txt @@ -1,6 +1,6 @@ -# DerivedBidiClass-13.0.0.txt -# Date: 2019-10-21, 14:30:28 GMT -# © 2019 Unicode®, Inc. +# DerivedBidiClass-14.0.0.txt +# Date: 2021-07-10, 00:35:02 GMT +# © 2021 Unicode®, Inc. 
# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -9,19 +9,19 @@ # ================================================ -# Bidi Class (listing UnicodeData.txt, field 4: see UAX #44: http://www.unicode.org/reports/tr44/) +# Bidi Class (listing UnicodeData.txt, field 4: see UAX #44: https://www.unicode.org/reports/tr44/) # Unlike other properties, unassigned code points in blocks # reserved for right-to-left scripts are given either types R or AL. # # The unassigned code points that default to AL are in the ranges: -# [\u0600-\u07BF \u0860-\u086F \u08A0-\u08FF \uFB50-\uFDCF \uFDF0-\uFDFF \uFE70-\uFEFF +# [\u0600-\u07BF \u0860-\u08FF \uFB50-\uFDCF \uFDF0-\uFDFF \uFE70-\uFEFF # \U00010D00-\U00010D3F \U00010F30-\U00010F6F # \U0001EC70-\U0001ECBF \U0001ED00-\U0001ED4F \U0001EE00-\U0001EEFF] # # This includes code points in the Arabic, Syriac, and Thaana blocks, among others. 
# # The unassigned code points that default to R are in the ranges: -# [\u0590-\u05FF \u07C0-\u085F \u0870-\u089F \uFB1D-\uFB4F +# [\u0590-\u05FF \u07C0-\u085F \uFB1D-\uFB4F # \U00010800-\U00010CFF \U00010D40-\U00010F2F \U00010F70-\U00010FFF # \U0001E800-\U0001EC6F \U0001ECC0-\U0001ECFF \U0001ED50-\U0001EDFF \U0001EF00-\U0001EFFF] # @@ -194,6 +194,7 @@ 0C3D ; L # Lo TELUGU SIGN AVAGRAHA 0C41..0C44 ; L # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR 0C58..0C5A ; L # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; L # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; L # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C66..0C6F ; L # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE 0C77 ; L # Po TELUGU SIGN SIDDHAM @@ -214,7 +215,7 @@ 0CC7..0CC8 ; L # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI 0CCA..0CCB ; L # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CD5..0CD6 ; L # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; L # Lo KANNADA LETTER FA +0CDD..0CDE ; L # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; L # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE6..0CEF ; L # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE 0CF1..0CF2 ; L # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA @@ -351,9 +352,10 @@ 16EB..16ED ; L # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0 ; L # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; L # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; L # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; L # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; L # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; L # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +1715 ; L # Mc TAGALOG SIGN PAMUDPOD +171F..1731 ; L # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA +1734 ; L # Mc HANUNOO SIGN PAMUDPOD 1735..1736 ; L # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 
1740..1751 ; L # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; L # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA @@ -407,11 +409,12 @@ 1B3B ; L # Mc BALINESE VOWEL SIGN RA REPA TEDUNG 1B3D..1B41 ; L # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B43..1B44 ; L # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; L # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; L # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; L # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60 ; L # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A ; L # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B74..1B7C ; L # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E ; L # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B82 ; L # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0 ; L # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BA1 ; L # Mc SUNDANESE CONSONANT SIGN PAMINGKAL @@ -499,9 +502,7 @@ 249C..24E9 ; L # So [78] PARENTHESIZED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z 26AC ; L # So MEDIUM SMALL WHITE CIRCLE 2800..28FF ; L # So [256] BRAILLE PATTERN BLANK..BRAILLE PATTERN DOTS-12345678 -2C00..2C2E ; L # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; L # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; L # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; L # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; L # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; L # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CEB..2CEE ; L # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA @@ -556,8 +557,7 @@ 
337B..33DD ; L # So [99] SQUARE ERA NAME HEISEI..SQUARE WB 33E0..33FE ; L # So [31] IDEOGRAPHIC TELEGRAPH SYMBOL FOR DAY ONE..IDEOGRAPHIC TELEGRAPH SYMBOL FOR DAY THIRTY-ONE 3400..4DBF ; L # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; L # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; L # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; L # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; L # Lm YI SYLLABLE WU A016..A48C ; L # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; L # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -581,8 +581,11 @@ A771..A787 ; L # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR A789..A78A ; L # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; L # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; L # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; L # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; L # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; L # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; L # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; L # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; L # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; L # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; L # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; L # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; L # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -731,14 +734,27 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 10500..10527 ; L # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; L # Lo [52] 
CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F ; L # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A ; L # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; L # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; L # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; L # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; L # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; L # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; L # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; L # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; L # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; L # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; L # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; L # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; L # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; L # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 11000 ; L # Mc BRAHMI SIGN CANDRABINDU 11002 ; L # Mc BRAHMI SIGN VISARGA 11003..11037 ; L # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA 11047..1104D ; L # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11066..1106F ; L # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11071..11072 ; L # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; L # Lo BRAHMI LETTER OLD TAMIL LLA 11082 ; L # Mc KAITHI SIGN VISARGA 11083..110AF ; L # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110B0..110B2 ; L # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II @@ -841,6 +857,7 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 116AE..116AF ; L # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II 116B6 ; 
L # Mc TAKRI SIGN VIRAMA 116B8 ; L # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; L # Po TAKRI ABBREVIATION SIGN 116C0..116C9 ; L # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A ; L # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 11720..11721 ; L # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA @@ -849,6 +866,7 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 1173A..1173B ; L # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E ; L # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F ; L # So AHOM SYMBOL VI +11740..11746 ; L # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; L # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; L # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 11838 ; L # Mc DOGRA SIGN VISARGA @@ -891,7 +909,7 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 11A9A..11A9C ; L # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD 11A9D ; L # Lo SOYOMBO MARK PLUTA 11A9E..11AA2 ; L # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO TERMINAL MARK-2 -11AC0..11AF8 ; L # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; L # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; L # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; L # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; L # Mc BHAIKSUKI VOWEL SIGN AA @@ -929,6 +947,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 12400..1246E ; L # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474 ; L # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543 ; L # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; L # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; L # Po [2] CYPRO-MINOAN SIGN 
CM301..CYPRO-MINOAN SIGN CM302 13000..1342E ; L # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 13430..13438 ; L # Cf [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT 14400..14646 ; L # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 @@ -936,6 +956,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 16A40..16A5E ; L # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; L # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F ; L # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE ; L # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; L # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; L # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF5 ; L # Po BASSA VAH FULL STOP 16B00..16B2F ; L # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU @@ -961,7 +983,10 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 17000..187F7 ; L # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; L # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; L # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; L # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; L # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; L # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; L # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; L # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; L # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; L # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; L # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -971,6 +996,7 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 1BC90..1BC99 ; L # 
Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1BC9C ; L # So DUPLOYAN SIGN O WITH CROSS 1BC9F ; L # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP +1CF50..1CFC3 ; L # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; L # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; L # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164 ; L # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -1023,13 +1049,21 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 1DA76..1DA83 ; L # So [14] SIGNWRITING LIMB COMBINATION..SIGNWRITING LOCATION DEPTH 1DA85..1DA86 ; L # So [2] SIGNWRITING LOCATION TORSO..SIGNWRITING LOCATION LIMBS DIGITS 1DA87..1DA8B ; L # Po [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS +1DF00..1DF09 ; L # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; L # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; L # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; L # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; L # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E140..1E149 ; L # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; L # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F ; L # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD ; L # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; L # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2F0..1E2F9 ; L # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE +1E7E0..1E7E6 ; L # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; L # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; L # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; L # Lo 
[15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1F110..1F12E ; L # So [31] PARENTHESIZED LATIN CAPITAL LETTER A..CIRCLED WZ 1F130..1F169 ; L # So [58] SQUARED LATIN CAPITAL LETTER A..NEGATIVE CIRCLED LATIN CAPITAL LETTER Z 1F170..1F1AC ; L # So [61] NEGATIVE SQUARED LATIN CAPITAL LETTER A..SQUARED VOD @@ -1037,8 +1071,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER 1F210..1F23B ; L # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D 1F240..1F248 ; L # So [9] TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C..TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-6557 1F250..1F251 ; L # So [2] CIRCLED IDEOGRAPH ADVANTAGE..CIRCLED IDEOGRAPH ACCEPT -20000..2A6DD ; L # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; L # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; L # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; L # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; L # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; L # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; L # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 @@ -1047,8 +1081,8 @@ FFDA..FFDC ; L # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER F0000..FFFFD ; L # Co [65534] .. 100000..10FFFD; L # Co [65534] .. -# The above property value applies to 826312 code points not listed here. -# Total code points: 1096473 +# The above property value applies to 825575 code points not listed here. +# Total code points: 1096333 # ================================================ @@ -1082,7 +1116,6 @@ F0000..FFFFD ; L # Co [65534] .. 085C..085D ; R # Cn [2] .. 085E ; R # Po MANDAIC PUNCTUATION 085F ; R # Cn -0870..089F ; R # Cn [48] .. 
200F ; R # Cf RIGHT-TO-LEFT MARK FB1D ; R # Lo HEBREW LETTER YOD WITH HIRIQ FB1F..FB28 ; R # Lo [10] HEBREW LIGATURE YIDDISH YOD YOD PATAH..HEBREW LETTER WIDE TAV @@ -1197,7 +1230,9 @@ FB46..FB4F ; R # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE AL 10F1D..10F26 ; R # No [10] OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF 10F27 ; R # Lo OLD SOGDIAN LIGATURE AYIN-DALETH 10F28..10F2F ; R # Cn [8] .. -10F70..10FAF ; R # Cn [64] .. +10F70..10F81 ; R # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F86..10F89 ; R # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS +10F8A..10FAF ; R # Cn [38] .. 10FB0..10FC4 ; R # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB ; R # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FCC..10FDF ; R # Cn [20] .. @@ -1218,7 +1253,7 @@ FB46..FB4F ; R # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE AL 1ED50..1EDFF ; R # Cn [176] .. 1EF00..1EFFF ; R # Cn [256] .. -# Total code points: 3763 +# Total code points: 3711 # ================================================ @@ -1277,8 +1312,8 @@ FF0D ; ES # Pd FULLWIDTH HYPHEN-MINUS 0E3F ; ET # Sc THAI CURRENCY SYMBOL BAHT 17DB ; ET # Sc KHMER CURRENCY SYMBOL RIEL 2030..2034 ; ET # Po [5] PER MILLE SIGN..TRIPLE PRIME -20A0..20BF ; ET # Sc [32] EURO-CURRENCY SIGN..BITCOIN SIGN -20C0..20CF ; ET # Cn [16] .. +20A0..20C0 ; ET # Sc [33] EURO-CURRENCY SIGN..SOM SIGN +20C1..20CF ; ET # Cn [15] .. 
212E ; ET # So ESTIMATED SYMBOL 2213 ; ET # Sm MINUS-OR-PLUS SIGN A838 ; ET # Sc NORTH INDIC RUPEE MARK @@ -1304,11 +1339,12 @@ FFE5..FFE6 ; ET # Sc [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN 0660..0669 ; AN # Nd [10] ARABIC-INDIC DIGIT ZERO..ARABIC-INDIC DIGIT NINE 066B..066C ; AN # Po [2] ARABIC DECIMAL SEPARATOR..ARABIC THOUSANDS SEPARATOR 06DD ; AN # Cf ARABIC END OF AYAH +0890..0891 ; AN # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; AN # Cf ARABIC DISPUTED END OF AYAH 10D30..10D39 ; AN # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE 10E60..10E7E ; AN # No [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS -# Total code points: 61 +# Total code points: 63 # ================================================ @@ -1663,7 +1699,16 @@ FF1A ; CS # Po FULLWIDTH COLON 2E42 ; ON # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; ON # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; ON # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; ON # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; ON # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; ON # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; ON # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; ON # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; ON # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; ON # Ps TOP HALF LEFT PARENTHESIS +2E5A ; ON # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; ON # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; ON # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; ON # Pd OBLIQUE HYPHEN 2E80..2E99 ; ON # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; ON # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; ON # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1725,7 +1770,9 @@ A874..A877 ; ON # Po [4] PHAGS-PA SINGLE HEAD MARK..PHAGS-PA MARK DOUBLE SH AB6A..AB6B ; ON # Sk [2] MODIFIER LETTER LEFT TACK..MODIFIER LETTER RIGHT TACK FD3E ; ON # Pe ORNATE LEFT PARENTHESIS FD3F ; ON # Ps ORNATE RIGHT 
PARENTHESIS -FDFD ; ON # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FD40..FD4F ; ON # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH +FDCF ; ON # So ARABIC LIGATURE SALAAMUHU ALAYNAA +FDFD..FDFF ; ON # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE10..FE16 ; ON # Po [7] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL QUESTION MARK FE17 ; ON # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET FE18 ; ON # Pe PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET @@ -1815,6 +1862,7 @@ FFFC..FFFD ; ON # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTE 11FD5..11FDC ; ON # So [8] TAMIL SIGN NEL..TAMIL SIGN MUKKURUNI 11FE1..11FF1 ; ON # So [17] TAMIL SIGN PAARAM..TAMIL SIGN VAKAIYARAA 16FE2 ; ON # Po OLD CHINESE HOOK MARK +1D1E9..1D1EA ; ON # So [2] MUSICAL SYMBOL SORI..MUSICAL SYMBOL KORON 1D200..1D241 ; ON # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D245 ; ON # So GREEK MUSICAL LEIMMA 1D300..1D356 ; ON # So [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING @@ -1839,32 +1887,33 @@ FFFC..FFFD ; ON # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTE 1F300..1F3FA ; ON # So [251] CYCLONE..AMPHORA 1F3FB..1F3FF ; ON # Sk [5] EMOJI MODIFIER FITZPATRICK TYPE-1-2..EMOJI MODIFIER FITZPATRICK TYPE-6 1F400..1F6D7 ; ON # So [728] RAT..ELEVATOR -1F6E0..1F6EC ; ON # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6DD..1F6EC ; ON # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6F0..1F6FC ; ON # So [13] SATELLITE..ROLLER SKATE 1F700..1F773 ; ON # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE 1F780..1F7D8 ; ON # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB ; ON # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; ON # So HEAVY EQUALS SIGN 1F800..1F80B ; ON # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE 
TRIANGLE ARROWHEAD 1F810..1F847 ; ON # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; ON # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; ON # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW 1F890..1F8AD ; ON # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS 1F8B0..1F8B1 ; ON # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST -1F900..1F978 ; ON # So [121] CIRCLED CROSS FORMEE WITH FOUR DOTS..DISGUISED FACE -1F97A..1F9CB ; ON # So [82] FACE WITH PLEADING EYES..BUBBLE TEA -1F9CD..1FA53 ; ON # So [135] STANDING PERSON..BLACK CHESS KNIGHT-BISHOP +1F900..1FA53 ; ON # So [340] CIRCLED CROSS FORMEE WITH FOUR DOTS..BLACK CHESS KNIGHT-BISHOP 1FA60..1FA6D ; ON # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA74 ; ON # So [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A ; ON # So [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C ; ON # So [5] DROP OF BLOOD..CRUTCH 1FA80..1FA86 ; ON # So [7] YO-YO..NESTING DOLLS -1FA90..1FAA8 ; ON # So [25] RINGED PLANET..ROCK -1FAB0..1FAB6 ; ON # So [7] FLY..FEATHER -1FAC0..1FAC2 ; ON # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6 ; ON # So [7] BLUEBERRIES..TEAPOT +1FA90..1FAAC ; ON # So [29] RINGED PLANET..HAMSA +1FAB0..1FABA ; ON # So [11] FLY..NEST WITH EGGS +1FAC0..1FAC5 ; ON # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9 ; ON # So [10] BLUEBERRIES..JAR +1FAE0..1FAE7 ; ON # So [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; ON # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92 ; ON # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; ON # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON -# Total code points: 5931 +# Total code points: 6000 # ================================================ @@ -1939,7 +1988,8 @@ FFFFE..FFFFF 
; BN # Cn [2] .. 0825..0827 ; NSM # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; NSM # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; NSM # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; NSM # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; NSM # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; NSM # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; NSM # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 093A ; NSM # Mn DEVANAGARI VOWEL SIGN OE 093C ; NSM # Mn DEVANAGARI SIGN NUKTA @@ -1980,6 +2030,7 @@ FFFFE..FFFFF ; BN # Cn [2] .. 0BCD ; NSM # Mn TAMIL SIGN VIRAMA 0C00 ; NSM # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C04 ; NSM # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; NSM # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; NSM # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C46..0C48 ; NSM # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; NSM # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA @@ -2027,7 +2078,7 @@ FFFFE..FFFFF ; BN # Cn [2] .. 109D ; NSM # Mn MYANMAR VOWEL SIGN AITON AI 135D..135F ; NSM # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; NSM # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; NSM # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; NSM # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1752..1753 ; NSM # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; NSM # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; NSM # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -2036,6 +2087,7 @@ FFFFE..FFFFF ; BN # Cn [2] .. 
17C9..17D3 ; NSM # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; NSM # Mn KHMER SIGN ATTHACAN 180B..180D ; NSM # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; NSM # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; NSM # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; NSM # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; NSM # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -2053,7 +2105,7 @@ FFFFE..FFFFF ; BN # Cn [2] .. 1A7F ; NSM # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; NSM # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; NSM # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; NSM # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; NSM # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; NSM # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B34 ; NSM # Mn BALINESE SIGN REREKAN 1B36..1B3A ; NSM # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA @@ -2076,8 +2128,7 @@ FFFFE..FFFFF ; BN # Cn [2] .. 
1CED ; NSM # Mn VEDIC SIGN TIRYAK 1CF4 ; NSM # Mn VEDIC TONE CANDRA ABOVE 1CF8..1CF9 ; NSM # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; NSM # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; NSM # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; NSM # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 20D0..20DC ; NSM # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; NSM # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E1 ; NSM # Mn COMBINING LEFT RIGHT ARROW ABOVE @@ -2139,11 +2190,15 @@ FE20..FE2F ; NSM # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC 10D24..10D27 ; NSM # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; NSM # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; NSM # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; NSM # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11001 ; NSM # Mn BRAHMI SIGN ANUSVARA 11038..11046 ; NSM # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; NSM # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; NSM # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; NSM # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 110B3..110B6 ; NSM # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B9..110BA ; NSM # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; NSM # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; NSM # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; NSM # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112D..11134 ; NSM # Mn [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA @@ -2223,6 +2278,8 @@ FE20..FE2F ; NSM # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC 16F8F..16F92 ; NSM # Mn [4] MIAO TONE 
RIGHT..MIAO TONE BELOW 16FE4 ; NSM # Mn KHITAN SMALL SCRIPT FILLER 1BC9D..1BC9E ; NSM # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; NSM # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; NSM # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D167..1D169 ; NSM # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D17B..1D182 ; NSM # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D185..1D18B ; NSM # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE @@ -2240,12 +2297,13 @@ FE20..FE2F ; NSM # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC 1E023..1E024 ; NSM # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; NSM # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; NSM # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; NSM # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; NSM # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; NSM # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; NSM # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA E0100..E01EF ; NSM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 1847 +# Total code points: 1958 # ================================================ @@ -2256,8 +2314,7 @@ E0100..E01EF ; NSM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 060D ; AL # Po ARABIC DATE SEPARATOR 061B ; AL # Po ARABIC SEMICOLON 061C ; AL # Cf ARABIC LETTER MARK -061D ; AL # Cn -061E..061F ; AL # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; AL # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F ; AL # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640 ; AL # Lm ARABIC 
TATWEEL 0641..064A ; AL # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -2282,22 +2339,23 @@ E0100..E01EF ; NSM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 07B2..07BF ; AL # Cn [14] .. 0860..086A ; AL # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA 086B..086F ; AL # Cn [5] .. -08A0..08B4 ; AL # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B5 ; AL # Cn -08B6..08C7 ; AL # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08C8..08D2 ; AL # Cn [11] .. +0870..0887 ; AL # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; AL # Sk ARABIC RAISED ROUND DOT +0889..088E ; AL # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +088F ; AL # Cn +0892..0897 ; AL # Cn [6] .. +08A0..08C8 ; AL # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; AL # Lm ARABIC SMALL FARSI YEH FB50..FBB1 ; AL # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1 ; AL # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW -FBC2..FBD2 ; AL # Cn [17] .. +FBB2..FBC2 ; AL # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE +FBC3..FBD2 ; AL # Cn [16] .. FBD3..FD3D ; AL # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM -FD40..FD4F ; AL # Cn [16] .. FD50..FD8F ; AL # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD90..FD91 ; AL # Cn [2] .. FD92..FDC7 ; AL # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM -FDC8..FDCF ; AL # Cn [8] .. +FDC8..FDCE ; AL # Cn [7] .. FDF0..FDFB ; AL # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC ; AL # Sc RIAL SIGN -FDFE..FDFF ; AL # Cn [2] .. 
FE70..FE74 ; AL # Lo [5] ARABIC FATHATAN ISOLATED FORM..ARABIC KASRATAN ISOLATED FORM FE75 ; AL # Cn FE76..FEFC ; AL # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM @@ -2389,7 +2447,7 @@ FEFD..FEFE ; AL # Cn [2] .. 1EEBC..1EEEF ; AL # Cn [52] .. 1EEF2..1EEFF ; AL # Cn [14] .. -# Total code points: 1698 +# Total code points: 1708 # ================================================ diff --git a/lib/unicore/extracted/DBinaryProperties.txt b/lib/unicore/extracted/DBinaryProperties.txt index 4c31bac119..60409c05ba 100644 --- a/lib/unicore/extracted/DBinaryProperties.txt +++ b/lib/unicore/extracted/DBinaryProperties.txt @@ -1,6 +1,6 @@ -# DerivedBinaryProperties-13.0.0.txt -# Date: 2019-09-08, 23:31:04 GMT -# © 2019 Unicode®, Inc. +# DerivedBinaryProperties-14.0.0.txt +# Date: 2021-06-04, 02:19:15 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -9,7 +9,7 @@ # ================================================ -# Bidi_Mirrored (listing UnicodeData.txt, field 9: see UAX #44: http://www.unicode.org/reports/tr44/) +# Bidi_Mirrored (listing UnicodeData.txt, field 9: see UAX #44: https://www.unicode.org/reports/tr44/) 0028 ; Bidi_Mirrored # Ps LEFT PARENTHESIS 0029 ; Bidi_Mirrored # Pe RIGHT PARENTHESIS @@ -185,6 +185,14 @@ 2E27 ; Bidi_Mirrored # Pe RIGHT SIDEWAYS U BRACKET 2E28 ; Bidi_Mirrored # Ps LEFT DOUBLE PARENTHESIS 2E29 ; Bidi_Mirrored # Pe RIGHT DOUBLE PARENTHESIS +2E55 ; Bidi_Mirrored # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; Bidi_Mirrored # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; Bidi_Mirrored # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; Bidi_Mirrored # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; Bidi_Mirrored # Ps TOP HALF LEFT PARENTHESIS +2E5A ; Bidi_Mirrored # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; Bidi_Mirrored # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; 
Bidi_Mirrored # Pe BOTTOM HALF RIGHT PARENTHESIS 3008 ; Bidi_Mirrored # Ps LEFT ANGLE BRACKET 3009 ; Bidi_Mirrored # Pe RIGHT ANGLE BRACKET 300A ; Bidi_Mirrored # Ps LEFT DOUBLE ANGLE BRACKET @@ -228,6 +236,6 @@ FF63 ; Bidi_Mirrored # Pe HALFWIDTH RIGHT CORNER BRACKET 1D789 ; Bidi_Mirrored # Sm MATHEMATICAL SANS-SERIF BOLD PARTIAL DIFFERENTIAL 1D7C3 ; Bidi_Mirrored # Sm MATHEMATICAL SANS-SERIF BOLD ITALIC PARTIAL DIFFERENTIAL -# Total code points: 545 +# Total code points: 553 # EOF diff --git a/lib/unicore/extracted/DCombiningClass.txt b/lib/unicore/extracted/DCombiningClass.txt index b4c75cd459..4ad8205790 100644 --- a/lib/unicore/extracted/DCombiningClass.txt +++ b/lib/unicore/extracted/DCombiningClass.txt @@ -1,6 +1,6 @@ -# DerivedCombiningClass-13.0.0.txt -# Date: 2019-11-13, 21:51:57 GMT -# © 2019 Unicode®, Inc. +# DerivedCombiningClass-14.0.0.txt +# Date: 2021-07-10, 00:35:05 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -9,7 +9,7 @@ # ================================================ -# Combining Class (listing UnicodeData.txt, field 3: see UAX #44: http://www.unicode.org/reports/tr44/) +# Combining Class (listing UnicodeData.txt, field 3: see UAX #44: https://www.unicode.org/reports/tr44/) # All code points not explicitly listed for Canonical_Combining_Class # have the value Not_Reordered (0). 
@@ -139,7 +139,7 @@ 060E..060F ; 0 # So [2] ARABIC POETIC VERSE SIGN..ARABIC SIGN MISRA 061B ; 0 # Po ARABIC SEMICOLON 061C ; 0 # Cf ARABIC LETTER MARK -061E..061F ; 0 # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; 0 # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F ; 0 # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640 ; 0 # Lm ARABIC TATWEEL 0641..064A ; 0 # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -180,8 +180,12 @@ 0840..0858 ; 0 # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 085E ; 0 # Po MANDAIC PUNCTUATION 0860..086A ; 0 # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; 0 # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; 0 # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; 0 # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; 0 # Sk ARABIC RAISED ROUND DOT +0889..088E ; 0 # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891 ; 0 # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +08A0..08C8 ; 0 # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; 0 # Lm ARABIC SMALL FARSI YEH 08E2 ; 0 # Cf ARABIC DISPUTED END OF AYAH 0900..0902 ; 0 # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA 0903 ; 0 # Mc DEVANAGARI SIGN VISARGA @@ -331,6 +335,7 @@ 0C46..0C48 ; 0 # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4C ; 0 # Mn [3] TELUGU VOWEL SIGN O..TELUGU VOWEL SIGN AU 0C58..0C5A ; 0 # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; 0 # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; 0 # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; 0 # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; 0 # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -355,7 +360,7 @@ 
0CCA..0CCB ; 0 # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC ; 0 # Mn KANNADA VOWEL SIGN AU 0CD5..0CD6 ; 0 # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; 0 # Lo KANNADA LETTER FA +0CDD..0CDE ; 0 # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; 0 # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; 0 # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; 0 # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -532,10 +537,9 @@ 16EB..16ED ; 0 # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0 ; 0 # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; 0 # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; 0 # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; 0 # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; 0 # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1713 ; 0 # Mn [2] TAGALOG VOWEL SIGN I..TAGALOG VOWEL SIGN U -1720..1731 ; 0 # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +171F..1731 ; 0 # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1732..1733 ; 0 # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1735..1736 ; 0 # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 1740..1751 ; 0 # Lo [18] BUHID LETTER A..BUHID LETTER HA @@ -564,6 +568,7 @@ 1807..180A ; 0 # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU 180B..180D ; 0 # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; 0 # Cf MONGOLIAN VOWEL SEPARATOR +180F ; 0 # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; 0 # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; 0 # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; 0 # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -622,11 +627,12 @@ 1B3D..1B41 ; 0 # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; 0 # Mn BALINESE VOWEL SIGN PEPET 1B43 ; 0 # Mc 
BALINESE VOWEL SIGN PEPET TEDUNG -1B45..1B4B ; 0 # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; 0 # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; 0 # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60 ; 0 # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A ; 0 # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B74..1B7C ; 0 # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E ; 0 # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B80..1B81 ; 0 # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82 ; 0 # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0 ; 0 # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -744,7 +750,7 @@ 208D ; 0 # Ps SUBSCRIPT LEFT PARENTHESIS 208E ; 0 # Pe SUBSCRIPT RIGHT PARENTHESIS 2090..209C ; 0 # Lm [13] LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER T -20A0..20BF ; 0 # Sc [32] EURO-CURRENCY SIGN..BITCOIN SIGN +20A0..20C0 ; 0 # Sc [33] EURO-CURRENCY SIGN..SOM SIGN 20DD..20E0 ; 0 # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E2..20E4 ; 0 # Me [3] COMBINING ENCLOSING SCREEN..COMBINING ENCLOSING UPWARD POINTING TRIANGLE 2100..2101 ; 0 # So [2] ACCOUNT OF..ADDRESSED TO THE SUBJECT @@ -905,9 +911,7 @@ 2B4D..2B73 ; 0 # So [39] DOWNWARDS TRIANGLE-HEADED ZIGZAG ARROW..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR 2B76..2B95 ; 0 # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW 2B97..2BFF ; 0 # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL -2C00..2C2E ; 0 # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; 0 # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; 0 # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; 0 # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL 
CAPITAL TURNED E 2C7C..2C7D ; 0 # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; 0 # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CE5..2CEA ; 0 # So [6] COPTIC SYMBOL MI RO..COPTIC SYMBOL SHIMA SIMA @@ -970,7 +974,16 @@ 2E42 ; 0 # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; 0 # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; 0 # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; 0 # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; 0 # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; 0 # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; 0 # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; 0 # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; 0 # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; 0 # Ps TOP HALF LEFT PARENTHESIS +2E5A ; 0 # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; 0 # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; 0 # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; 0 # Pd OBLIQUE HYPHEN 2E80..2E99 ; 0 # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP 2E9B..2EF3 ; 0 # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE 2F00..2FD5 ; 0 # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE @@ -1043,8 +1056,7 @@ 32C0..33FF ; 0 # So [320] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..SQUARE GAL 3400..4DBF ; 0 # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF 4DC0..4DFF ; 0 # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION -4E00..9FFC ; 0 # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; 0 # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; 0 # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; 0 # Lm YI SYLLABLE WU A016..A48C ; 0 # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A490..A4C6 ; 0 # So [55] YI RADICAL QOT..YI RADICAL KE @@ -1078,8 +1090,11 @@ A788 ; 0 # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; 0 # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN 
A78B..A78E ; 0 # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; 0 # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; 0 # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; 0 # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; 0 # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; 0 # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; 0 # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; 0 # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; 0 # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; 0 # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; 0 # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; 0 # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -1215,15 +1230,17 @@ FB3E ; 0 # Lo HEBREW LETTER MEM WITH DAGESH FB40..FB41 ; 0 # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAMEKH WITH DAGESH FB43..FB44 ; 0 # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH FB46..FBB1 ; 0 # Lo [108] HEBREW LETTER TSADI WITH DAGESH..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1 ; 0 # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; 0 # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D ; 0 # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM FD3E ; 0 # Pe ORNATE LEFT PARENTHESIS FD3F ; 0 # Ps ORNATE RIGHT PARENTHESIS +FD40..FD4F ; 0 # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F ; 0 # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7 ; 0 # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH 
KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF ; 0 # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB ; 0 # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC ; 0 # Sc RIAL SIGN -FDFD ; 0 # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF ; 0 # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE00..FE0F ; 0 # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16 FE10..FE16 ; 0 # Po [7] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL QUESTION MARK FE17 ; 0 # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET @@ -1365,9 +1382,20 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 10500..10527 ; 0 # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; 0 # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F ; 0 # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A ; 0 # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; 0 # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; 0 # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; 0 # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; 0 # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; 0 # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; 0 # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; 0 # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; 0 # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; 0 # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; 0 # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; 0 # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; 0 # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V 
WITH RIGHT HOOK +107B2..107BA ; 0 # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; 0 # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; 0 # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; 0 # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1439,6 +1467,8 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 10F30..10F45 ; 0 # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 10F51..10F54 ; 0 # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59 ; 0 # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81 ; 0 # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F86..10F89 ; 0 # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4 ; 0 # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB ; 0 # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6 ; 0 # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH @@ -1450,6 +1480,9 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 11047..1104D ; 0 # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065 ; 0 # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F ; 0 # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11071..11072 ; 0 # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; 0 # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; 0 # Lo BRAHMI LETTER OLD TAMIL LLA 11080..11081 ; 0 # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA 11082 ; 0 # Mc KAITHI SIGN VISARGA 11083..110AF ; 0 # Lo [45] KAITHI LETTER A..KAITHI LETTER HA @@ -1459,6 +1492,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 110BB..110BC ; 0 # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD ; 0 # Cf KAITHI NUMBER SIGN 110BE..110C1 ; 0 # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE 
DANDA +110C2 ; 0 # Mn KAITHI VOWEL SIGN VOCALIC R 110CD ; 0 # Cf KAITHI NUMBER SIGN ABOVE 110D0..110E8 ; 0 # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; 0 # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE @@ -1582,6 +1616,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 116AE..116AF ; 0 # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II 116B0..116B5 ; 0 # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU 116B8 ; 0 # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; 0 # Po TAKRI ABBREVIATION SIGN 116C0..116C9 ; 0 # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A ; 0 # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 1171D..1171F ; 0 # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA @@ -1593,6 +1628,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1173A..1173B ; 0 # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E ; 0 # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F ; 0 # So AHOM SYMBOL VI +11740..11746 ; 0 # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; 0 # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; 0 # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; 0 # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -1645,7 +1681,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 11A9A..11A9C ; 0 # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD 11A9D ; 0 # Lo SOYOMBO MARK PLUTA 11A9E..11AA2 ; 0 # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO TERMINAL MARK-2 -11AC0..11AF8 ; 0 # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; 0 # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; 0 # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; 0 # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; 0 # Mc BHAIKSUKI VOWEL SIGN AA @@ -1700,6 +1736,8 @@ FFFC..FFFD ; 0 # So [2] OBJECT 
REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 12400..1246E ; 0 # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474 ; 0 # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543 ; 0 # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; 0 # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; 0 # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..1342E ; 0 # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 13430..13438 ; 0 # Cf [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT 14400..14646 ; 0 # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 @@ -1707,6 +1745,8 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 16A40..16A5E ; 0 # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; 0 # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F ; 0 # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE ; 0 # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; 0 # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; 0 # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF5 ; 0 # Po BASSA VAH FULL STOP 16B00..16B2F ; 0 # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU @@ -1735,7 +1775,10 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 17000..187F7 ; 0 # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; 0 # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; 0 # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; 0 # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; 0 # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; 0 # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; 0 # Lm [2] 
KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; 0 # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; 0 # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; 0 # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; 0 # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -1747,6 +1790,9 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1BC9D ; 0 # Mn DUPLOYAN THICK LETTER SELECTOR 1BC9F ; 0 # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1BCA0..1BCA3 ; 0 # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; 0 # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; 0 # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF50..1CFC3 ; 0 # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; 0 # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; 0 # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164 ; 0 # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -1754,7 +1800,7 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1D173..1D17A ; 0 # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1D183..1D184 ; 0 # So [2] MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN 1D18C..1D1A9 ; 0 # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH -1D1AE..1D1E8 ; 0 # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA ; 0 # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241 ; 0 # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D245 ; 0 # So GREEK MUSICAL LEIMMA 1D2E0..1D2F3 ; 0 # No [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN @@ -1813,14 +1859,22 
@@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1DA87..1DA8B ; 0 # Po [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS 1DA9B..1DA9F ; 0 # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA1..1DAAF ; 0 # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09 ; 0 # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; 0 # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; 0 # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; 0 # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; 0 # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E140..1E149 ; 0 # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; 0 # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F ; 0 # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD ; 0 # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; 0 # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH 1E2F0..1E2F9 ; 0 # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1E2FF ; 0 # Sc WANCHO NGUN SIGN +1E7E0..1E7E6 ; 0 # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; 0 # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; 0 # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; 0 # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; 0 # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF ; 0 # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E900..1E943 ; 0 # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA @@ -1885,33 +1939,34 @@ FFFC..FFFD ; 0 # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1F300..1F3FA ; 0 # So [251] CYCLONE..AMPHORA 1F3FB..1F3FF ; 0 # Sk [5] EMOJI MODIFIER FITZPATRICK 
TYPE-1-2..EMOJI MODIFIER FITZPATRICK TYPE-6 1F400..1F6D7 ; 0 # So [728] RAT..ELEVATOR -1F6E0..1F6EC ; 0 # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6DD..1F6EC ; 0 # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6F0..1F6FC ; 0 # So [13] SATELLITE..ROLLER SKATE 1F700..1F773 ; 0 # So [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE 1F780..1F7D8 ; 0 # So [89] BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB ; 0 # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; 0 # So HEAVY EQUALS SIGN 1F800..1F80B ; 0 # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; 0 # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; 0 # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; 0 # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW 1F890..1F8AD ; 0 # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS 1F8B0..1F8B1 ; 0 # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST -1F900..1F978 ; 0 # So [121] CIRCLED CROSS FORMEE WITH FOUR DOTS..DISGUISED FACE -1F97A..1F9CB ; 0 # So [82] FACE WITH PLEADING EYES..BUBBLE TEA -1F9CD..1FA53 ; 0 # So [135] STANDING PERSON..BLACK CHESS KNIGHT-BISHOP +1F900..1FA53 ; 0 # So [340] CIRCLED CROSS FORMEE WITH FOUR DOTS..BLACK CHESS KNIGHT-BISHOP 1FA60..1FA6D ; 0 # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA74 ; 0 # So [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A ; 0 # So [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C ; 0 # So [5] DROP OF BLOOD..CRUTCH 1FA80..1FA86 ; 0 # So [7] YO-YO..NESTING DOLLS -1FA90..1FAA8 ; 0 # So [25] RINGED PLANET..ROCK -1FAB0..1FAB6 ; 0 # So [7] FLY..FEATHER -1FAC0..1FAC2 ; 0 # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6 ; 0 # So [7] BLUEBERRIES..TEAPOT +1FA90..1FAAC ; 0 # So [29] RINGED 
PLANET..HAMSA +1FAB0..1FABA ; 0 # So [11] FLY..NEST WITH EGGS +1FAC0..1FAC5 ; 0 # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9 ; 0 # So [10] BLUEBERRIES..JAR +1FAE0..1FAE7 ; 0 # So [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; 0 # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92 ; 0 # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; 0 # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON 1FBF0..1FBF9 ; 0 # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -20000..2A6DD ; 0 # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; 0 # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; 0 # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; 0 # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; 0 # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; 0 # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; 0 # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 @@ -1923,8 +1978,8 @@ E0100..E01EF ; 0 # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 F0000..FFFFD ; 0 # Co [65534] .. 100000..10FFFD; 0 # Co [65534] .. -# The above property value applies to 832720 code points not listed here. -# Total code points: 1113240 +# The above property value applies to 831882 code points not listed here. +# Total code points: 1113200 # ================================================ @@ -1961,6 +2016,7 @@ F0000..FFFFD ; 0 # Co [65534] .. 
0A3C ; 7 # Mn GURMUKHI SIGN NUKTA 0ABC ; 7 # Mn GUJARATI SIGN NUKTA 0B3C ; 7 # Mn ORIYA SIGN NUKTA +0C3C ; 7 # Mn TELUGU SIGN NUKTA 0CBC ; 7 # Mn KANNADA SIGN NUKTA 1037 ; 7 # Mn MYANMAR SIGN DOT BELOW 1B34 ; 7 # Mn BALINESE SIGN REREKAN @@ -1982,7 +2038,7 @@ A9B3 ; 7 # Mn JAVANESE SIGN CECAK TELU 11D42 ; 7 # Mn MASARAM GONDI SIGN NUKTA 1E94A ; 7 # Mn ADLAM NUKTA -# Total code points: 26 +# Total code points: 27 # ================================================ @@ -2012,7 +2068,8 @@ A9B3 ; 7 # Mn JAVANESE SIGN CECAK TELU 0F84 ; 9 # Mn TIBETAN MARK HALANTA 1039..103A ; 9 # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT 1714 ; 9 # Mn TAGALOG SIGN VIRAMA -1734 ; 9 # Mn HANUNOO SIGN PAMUDPOD +1715 ; 9 # Mc TAGALOG SIGN PAMUDPOD +1734 ; 9 # Mc HANUNOO SIGN PAMUDPOD 17D2 ; 9 # Mn KHMER SIGN COENG 1A60 ; 9 # Mn TAI THAM SIGN SAKOT 1B44 ; 9 # Mc BALINESE ADEG ADEG @@ -2029,6 +2086,7 @@ AAF6 ; 9 # Mn MEETEI MAYEK VIRAMA ABED ; 9 # Mn MEETEI MAYEK APUN IYEK 10A3F ; 9 # Mn KHAROSHTHI VIRAMA 11046 ; 9 # Mn BRAHMI VIRAMA +11070 ; 9 # Mn BRAHMI SIGN OLD TAMIL VIRAMA 1107F ; 9 # Mn BRAHMI NUMBER JOINER 110B9 ; 9 # Mn KAITHI SIGN VIRAMA 11133..11134 ; 9 # Mn [2] CHAKMA VIRAMA..CHAKMA MAAYYAA @@ -2053,7 +2111,7 @@ ABED ; 9 # Mn MEETEI MAYEK APUN IYEK 11D44..11D45 ; 9 # Mn [2] MASARAM GONDI SIGN HALANTA..MASARAM GONDI VIRAMA 11D97 ; 9 # Mn GUNJALA GONDI VIRAMA -# Total code points: 61 +# Total code points: 63 # ================================================ @@ -2385,9 +2443,10 @@ FB1E ; 26 # Mn HEBREW POINT JUDEO-SPANISH VARIKA # Canonical_Combining_Class=Below_Left +1DFA ; 218 # Mn COMBINING DOT BELOW LEFT 302A ; 218 # Mn IDEOGRAPHIC LEVEL TONE MARK -# Total code points: 1 +# Total code points: 2 # ================================================ @@ -2426,7 +2485,8 @@ FB1E ; 26 # Mn HEBREW POINT JUDEO-SPANISH VARIKA 07F2 ; 220 # Mn NKO COMBINING NASALIZATION MARK 07FD ; 220 # Mn NKO DANTAYALAN 0859..085B ; 220 # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3 ; 220 
# Mn ARABIC SMALL LOW WAW +0899..089B ; 220 # Mn [3] ARABIC SMALL LOW WORD ISHMAAM..ARABIC SMALL LOW WORD TASHEEL +08CF..08D3 ; 220 # Mn [5] ARABIC LARGE ROUND DOT BELOW..ARABIC SMALL LOW WAW 08E3 ; 220 # Mn ARABIC TURNED DAMMA BELOW 08E6 ; 220 # Mn ARABIC CURLY KASRA 08E9 ; 220 # Mn ARABIC CURLY KASRATAN @@ -2445,6 +2505,8 @@ FB1E ; 26 # Mn HEBREW POINT JUDEO-SPANISH VARIKA 1AB5..1ABA ; 220 # Mn [6] COMBINING X-X BELOW..COMBINING STRONG CENTRALIZATION STROKE BELOW 1ABD ; 220 # Mn COMBINING PARENTHESES BELOW 1ABF..1AC0 ; 220 # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1AC3..1AC4 ; 220 # Mn [2] COMBINING LEFT PARENTHESIS BELOW LEFT..COMBINING RIGHT PARENTHESIS BELOW RIGHT +1ACA ; 220 # Mn COMBINING DOUBLE PLUS SIGN BELOW 1B6C ; 220 # Mn BALINESE MUSICAL SYMBOL COMBINING ENDEP 1CD5..1CD9 ; 220 # Mn [5] VEDIC TONE YAJURVEDIC AGGRAVATED INDEPENDENT SVARITA..VEDIC TONE YAJURVEDIC KATHAKA INDEPENDENT SVARITA SCHROEDER 1CDC..1CDF ; 220 # Mn [4] VEDIC TONE KATHAKA ANUDATTA..VEDIC TONE THREE DOTS BELOW @@ -2468,11 +2530,13 @@ FE27..FE2D ; 220 # Mn [7] COMBINING LIGATURE LEFT HALF BELOW..COMBINING CON 10F46..10F47 ; 220 # Mn [2] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING TWO DOTS BELOW 10F4B ; 220 # Mn SOGDIAN COMBINING CURVE BELOW 10F4D..10F50 ; 220 # Mn [4] SOGDIAN COMBINING HOOK BELOW..SOGDIAN COMBINING STROKE BELOW +10F83 ; 220 # Mn OLD UYGHUR COMBINING DOT BELOW +10F85 ; 220 # Mn OLD UYGHUR COMBINING TWO DOTS BELOW 1D17B..1D182 ; 220 # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D18A..1D18B ; 220 # Mn [2] MUSICAL SYMBOL COMBINING DOUBLE TONGUE..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1E8D0..1E8D6 ; 220 # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS -# Total code points: 165 +# Total code points: 177 # ================================================ @@ -2557,6 +2621,9 @@ FE27..FE2D ; 220 # Mn [7] COMBINING LIGATURE LEFT HALF BELOW..COMBINING CON 
081B..0823 ; 230 # Mn [9] SAMARITAN MARK EPENTHETIC YUT..SAMARITAN VOWEL SIGN A 0825..0827 ; 230 # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; 230 # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA +0898 ; 230 # Mn ARABIC SMALL HIGH WORD AL-JUZ +089C..089F ; 230 # Mn [4] ARABIC MADDA WAAJIB..ARABIC HALF MADDA OVER MADDA +08CA..08CE ; 230 # Mn [5] ARABIC SMALL HIGH FARSI YEH..ARABIC LARGE ROUND DOT ABOVE 08D4..08E1 ; 230 # Mn [14] ARABIC SMALL HIGH WORD AR-RUB..ARABIC SMALL HIGH SIGN SAFHA 08E4..08E5 ; 230 # Mn [2] ARABIC CURLY FATHA..ARABIC CURLY DAMMA 08E7..08E8 ; 230 # Mn [2] ARABIC CURLY FATHATAN..ARABIC CURLY DAMMATAN @@ -2576,6 +2643,9 @@ FE27..FE2D ; 220 # Mn [7] COMBINING LIGATURE LEFT HALF BELOW..COMBINING CON 1A75..1A7C ; 230 # Mn [8] TAI THAM SIGN TONE-1..TAI THAM SIGN KHUEN-LUE KARAN 1AB0..1AB4 ; 230 # Mn [5] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING TRIPLE DOT 1ABB..1ABC ; 230 # Mn [2] COMBINING PARENTHESES ABOVE..COMBINING DOUBLE PARENTHESES ABOVE +1AC1..1AC2 ; 230 # Mn [2] COMBINING LEFT PARENTHESIS ABOVE LEFT..COMBINING RIGHT PARENTHESIS ABOVE RIGHT +1AC5..1AC9 ; 230 # Mn [5] COMBINING SQUARE BRACKETS ABOVE..COMBINING DOUBLE PLUS SIGN ABOVE +1ACB..1ACE ; 230 # Mn [4] COMBINING TRIPLE ACUTE ACCENT..COMBINING LATIN SMALL LETTER INSULAR T 1B6B ; 230 # Mn BALINESE MUSICAL SYMBOL COMBINING TEGEH 1B6D..1B73 ; 230 # Mn [7] BALINESE MUSICAL SYMBOL COMBINING KEMPUL..BALINESE MUSICAL SYMBOL COMBINING GONG 1CD0..1CD2 ; 230 # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA @@ -2618,6 +2688,8 @@ FE2E..FE2F ; 230 # Mn [2] COMBINING CYRILLIC TITLO LEFT HALF..COMBINING CYR 10EAB..10EAC ; 230 # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F48..10F4A ; 230 # Mn [3] SOGDIAN COMBINING DOT ABOVE..SOGDIAN COMBINING CURVE ABOVE 10F4C ; 230 # Mn SOGDIAN COMBINING HOOK ABOVE +10F82 ; 230 # Mn OLD UYGHUR COMBINING DOT ABOVE +10F84 ; 230 # Mn OLD UYGHUR COMBINING TWO DOTS ABOVE 11100..11102 ; 230 # Mn [3] CHAKMA 
SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11366..1136C ; 230 # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX 11370..11374 ; 230 # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA @@ -2632,10 +2704,11 @@ FE2E..FE2F ; 230 # Mn [2] COMBINING CYRILLIC TITLO LEFT HALF..COMBINING CYR 1E023..1E024 ; 230 # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; 230 # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; 230 # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; 230 # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; 230 # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E944..1E949 ; 230 # Mn [6] ADLAM ALIF LENGTHENER..ADLAM GEMINATE CONSONANT MODIFIER -# Total code points: 484 +# Total code points: 508 # ================================================ diff --git a/lib/unicore/extracted/DDecompositionType.txt b/lib/unicore/extracted/DDecompositionType.txt index a0bc563643..5af556b0d4 100644 --- a/lib/unicore/extracted/DDecompositionType.txt +++ b/lib/unicore/extracted/DDecompositionType.txt @@ -1,6 +1,6 @@ -# DerivedDecompositionType-13.0.0.txt -# Date: 2019-09-08, 23:31:06 GMT -# © 2019 Unicode®, Inc. +# DerivedDecompositionType-14.0.0.txt +# Date: 2021-06-04, 02:19:17 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -9,7 +9,7 @@ # ================================================ -# Decomposition_Type (from UnicodeData.txt, field 5: see UAX #44: http://www.unicode.org/reports/tr44/) +# Decomposition_Type (from UnicodeData.txt, field 5: see UAX #44: https://www.unicode.org/reports/tr44/) # All code points not explicitly listed for Decomposition_Type # have the value None. 
@@ -861,12 +861,16 @@ FEFB ; Isolated # Lo ARABIC LIGATURE LAM WITH ALEF ISOLATED FORM 3196..319F ; Super # So [10] IDEOGRAPHIC ANNOTATION TOP MARK..IDEOGRAPHIC ANNOTATION MAN MARK A69C..A69D ; Super # Lm [2] MODIFIER LETTER CYRILLIC HARD SIGN..MODIFIER LETTER CYRILLIC SOFT SIGN A770 ; Super # Lm MODIFIER LETTER US +A7F2..A7F4 ; Super # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F8..A7F9 ; Super # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE AB5C..AB5F ; Super # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK AB69 ; Super # Lm MODIFIER LETTER SMALL TURNED W +10781..10785 ; Super # Lm [5] MODIFIER LETTER SUPERSCRIPT TRIANGULAR COLON..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Super # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Super # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 1F16A..1F16C ; Super # So [3] RAISED MC SIGN..RAISED MR SIGN -# Total code points: 154 +# Total code points: 213 # ================================================ diff --git a/lib/unicore/extracted/DEastAsianWidth.txt b/lib/unicore/extracted/DEastAsianWidth.txt index 79fe3ebec5..6bc84ff98d 100644 --- a/lib/unicore/extracted/DEastAsianWidth.txt +++ b/lib/unicore/extracted/DEastAsianWidth.txt @@ -1,6 +1,6 @@ -# DerivedEastAsianWidth-13.0.0.txt -# Date: 2019-10-21, 14:30:31 GMT -# © 2019 Unicode®, Inc. +# DerivedEastAsianWidth-14.0.0.txt +# Date: 2021-07-10, 00:35:07 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -143,7 +143,7 @@ 0610..061A ; N # Mn [11] ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA 061B ; N # Po ARABIC SEMICOLON 061C ; N # Cf ARABIC LETTER MARK -061E..061F ; N # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; N # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 0620..063F ; N # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE 0640 ; N # Lm ARABIC TATWEEL 0641..064A ; N # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH @@ -199,9 +199,14 @@ 0859..085B ; N # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK 085E ; N # Po MANDAIC PUNCTUATION 0860..086A ; N # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; N # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; N # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE -08D3..08E1 ; N # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0870..0887 ; N # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; N # Sk ARABIC RAISED ROUND DOT +0889..088E ; N # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891 ; N # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +0898..089F ; N # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08A0..08C8 ; N # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; N # Lm ARABIC SMALL FARSI YEH +08CA..08E1 ; N # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E2 ; N # Cf ARABIC DISPUTED END OF AYAH 08E3..0902 ; N # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; N # Mc DEVANAGARI SIGN VISARGA @@ -356,6 +361,7 @@ 0C0E..0C10 ; N # Lo [3] TELUGU LETTER E..TELUGU LETTER AI 0C12..0C28 ; N # Lo [23] TELUGU LETTER O..TELUGU LETTER NA 0C2A..0C39 ; N # Lo [16] TELUGU 
LETTER PA..TELUGU LETTER HA +0C3C ; N # Mn TELUGU SIGN NUKTA 0C3D ; N # Lo TELUGU SIGN AVAGRAHA 0C3E..0C40 ; N # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; N # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR @@ -363,6 +369,7 @@ 0C4A..0C4D ; N # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA 0C55..0C56 ; N # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK 0C58..0C5A ; N # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; N # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; N # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C62..0C63 ; N # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL 0C66..0C6F ; N # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE @@ -388,7 +395,7 @@ 0CCA..0CCB ; N # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO 0CCC..0CCD ; N # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA 0CD5..0CD6 ; N # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK -0CDE ; N # Lo KANNADA LETTER FA +0CDD..0CDE ; N # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; N # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CE2..0CE3 ; N # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL 0CE6..0CEF ; N # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE @@ -573,11 +580,12 @@ 16EB..16ED ; N # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION 16EE..16F0 ; N # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; N # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; N # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; N # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA +1700..1711 ; N # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA 1712..1714 ; N # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1720..1731 ; N # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA -1732..1734 ; N # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; N # Mc TAGALOG SIGN PAMUDPOD +171F..1731 ; N # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 
+1732..1733 ; N # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; N # Mc HANUNOO SIGN PAMUDPOD 1735..1736 ; N # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION 1740..1751 ; N # Lo [18] BUHID LETTER A..BUHID LETTER HA 1752..1753 ; N # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U @@ -605,6 +613,7 @@ 1807..180A ; N # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU 180B..180D ; N # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE 180E ; N # Cf MONGOLIAN VOWEL SEPARATOR +180F ; N # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1810..1819 ; N # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE 1820..1842 ; N # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; N # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -659,7 +668,7 @@ 1AA8..1AAD ; N # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1AB0..1ABD ; N # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; N # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; N # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; N # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; N # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; N # Mc BALINESE SIGN BISAH 1B05..1B33 ; N # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA @@ -671,12 +680,13 @@ 1B3D..1B41 ; N # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG 1B42 ; N # Mn BALINESE VOWEL SIGN PEPET 1B43..1B44 ; N # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG -1B45..1B4B ; N # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; N # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B50..1B59 ; N # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE 1B5A..1B60 ; N # Po [7] BALINESE PANTI..BALINESE PAMENENG 1B61..1B6A ; N # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL 
DANG GEDE 1B6B..1B73 ; N # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG 1B74..1B7C ; N # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING +1B7D..1B7E ; N # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1B80..1B81 ; N # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR 1B82 ; N # Mc SUNDANESE SIGN PANGWISAD 1B83..1BA0 ; N # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA @@ -733,8 +743,7 @@ 1D78 ; N # Lm MODIFIER LETTER CYRILLIC EN 1D79..1D9A ; N # L& [34] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK 1D9B..1DBF ; N # Lm [37] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL THETA -1DC0..1DF9 ; N # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; N # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; N # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 1E00..1F15 ; N # L& [278] LATIN CAPITAL LETTER A WITH RING BELOW..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA 1F18..1F1D ; N # L& [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA 1F20..1F45 ; N # L& [38] GREEK SMALL LETTER ETA WITH PSILI..GREEK SMALL LETTER OMICRON WITH DASIA AND OXIA @@ -806,7 +815,7 @@ 2090..209C ; N # Lm [13] LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER T 20A0..20A8 ; N # Sc [9] EURO-CURRENCY SIGN..RUPEE SIGN 20AA..20AB ; N # Sc [2] NEW SHEQEL SIGN..DONG SIGN -20AD..20BF ; N # Sc [19] KIP SIGN..BITCOIN SIGN +20AD..20C0 ; N # Sc [20] KIP SIGN..SOM SIGN 20D0..20DC ; N # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20DD..20E0 ; N # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH 20E1 ; N # Mn COMBINING LEFT RIGHT ARROW ABOVE @@ -1036,9 +1045,7 @@ 2B5A..2B73 ; N # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED 
ARROW TO BAR 2B76..2B95 ; N # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW 2B97..2BFF ; N # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL -2C00..2C2E ; N # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; N # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; N # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; N # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; N # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; N # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CE5..2CEA ; N # So [6] COPTIC SYMBOL MI RO..COPTIC SYMBOL SHIMA SIMA @@ -1104,7 +1111,16 @@ 2E42 ; N # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK 2E43..2E4F ; N # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER 2E50..2E51 ; N # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR -2E52 ; N # Po TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; N # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK +2E55 ; N # Ps LEFT SQUARE BRACKET WITH STROKE +2E56 ; N # Pe RIGHT SQUARE BRACKET WITH STROKE +2E57 ; N # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E58 ; N # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; N # Ps TOP HALF LEFT PARENTHESIS +2E5A ; N # Pe TOP HALF RIGHT PARENTHESIS +2E5B ; N # Ps BOTTOM HALF LEFT PARENTHESIS +2E5C ; N # Pe BOTTOM HALF RIGHT PARENTHESIS +2E5D ; N # Pd OBLIQUE HYPHEN 303F ; N # So IDEOGRAPHIC HALF FILL SPACE 4DC0..4DFF ; N # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION A4D0..A4F7 ; N # Lo [40] LISU LETTER BA..LISU LETTER OE @@ -1141,8 +1157,11 @@ A788 ; N # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; N # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; N # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH 
RETROFLEX HOOK AND BELT A78F ; N # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; N # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; N # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; N # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; N # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; N # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; N # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; N # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; N # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; N # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; N # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -1285,15 +1304,17 @@ FB3E ; N # Lo HEBREW LETTER MEM WITH DAGESH FB40..FB41 ; N # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAMEKH WITH DAGESH FB43..FB44 ; N # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH FB46..FBB1 ; N # Lo [108] HEBREW LETTER TSADI WITH DAGESH..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1 ; N # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; N # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D ; N # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM FD3E ; N # Pe ORNATE LEFT PARENTHESIS FD3F ; N # Ps ORNATE RIGHT PARENTHESIS +FD40..FD4F ; N # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F ; N # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7 ; N # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF ; N # 
So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB ; N # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU FDFC ; N # Sc RIAL SIGN -FDFD ; N # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF ; N # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE20..FE2F ; N # Mn [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITLO RIGHT HALF FE70..FE74 ; N # Lo [5] ARABIC FATHATAN ISOLATED FORM..ARABIC KASRATAN ISOLATED FORM FE76..FEFC ; N # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM @@ -1345,9 +1366,20 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 10500..10527 ; N # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; N # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F ; N # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A ; N # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; N # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; N # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; N # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE +10597..105A1 ; N # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; N # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; N # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; N # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; N # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; N # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; N # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; N # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; N # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; N # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER 
SMALL S WITH CURL 10800..10805 ; N # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; N # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; N # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1424,6 +1456,9 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 10F46..10F50 ; N # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW 10F51..10F54 ; N # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59 ; N # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81 ; N # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F82..10F85 ; N # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW +10F86..10F89 ; N # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4 ; N # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB ; N # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6 ; N # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH @@ -1435,6 +1470,10 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 11047..1104D ; N # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 11052..11065 ; N # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND 11066..1106F ; N # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE +11070 ; N # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11071..11072 ; N # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11073..11074 ; N # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O +11075 ; N # Lo BRAHMI LETTER OLD TAMIL LLA 1107F..11081 ; N # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 11082 ; N # Mc KAITHI SIGN VISARGA 11083..110AF ; N # Lo [45] KAITHI LETTER A..KAITHI LETTER HA @@ -1445,6 +1484,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 110BB..110BC ; N # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD ; N # Cf KAITHI NUMBER SIGN 110BE..110C1 ; N # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA +110C2 ; N # Mn KAITHI VOWEL SIGN 
VOCALIC R 110CD ; N # Cf KAITHI NUMBER SIGN ABOVE 110D0..110E8 ; N # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 110F0..110F9 ; N # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE @@ -1579,6 +1619,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 116B6 ; N # Mc TAKRI SIGN VIRAMA 116B7 ; N # Mn TAKRI SIGN NUKTA 116B8 ; N # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; N # Po TAKRI ABBREVIATION SIGN 116C0..116C9 ; N # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE 11700..1171A ; N # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA 1171D..1171F ; N # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA @@ -1590,6 +1631,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1173A..1173B ; N # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173C..1173E ; N # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1173F ; N # So AHOM SYMBOL VI +11740..11746 ; N # Lo [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; N # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1182C..1182E ; N # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II 1182F..11837 ; N # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA @@ -1647,7 +1689,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 11A9A..11A9C ; N # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD 11A9D ; N # Lo SOYOMBO MARK PLUTA 11A9E..11AA2 ; N # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO TERMINAL MARK-2 -11AC0..11AF8 ; N # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; N # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; N # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; N # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C2F ; N # Mc BHAIKSUKI VOWEL SIGN AA @@ -1703,6 +1745,8 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 12400..1246E ; N # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12470..12474 ; N # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM 
PUNCTUATION SIGN DIAGONAL QUADCOLON 12480..12543 ; N # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; N # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; N # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..1342E ; N # Lo [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 13430..13438 ; N # Cf [9] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END SEGMENT 14400..14646 ; N # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 @@ -1710,6 +1754,8 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 16A40..16A5E ; N # Lo [31] MRO LETTER TA..MRO LETTER TEK 16A60..16A69 ; N # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE 16A6E..16A6F ; N # Po [2] MRO DANDA..MRO DOUBLE DANDA +16A70..16ABE ; N # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA +16AC0..16AC9 ; N # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16AD0..16AED ; N # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16AF0..16AF4 ; N # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE 16AF5 ; N # Po BASSA VAH FULL STOP @@ -1741,6 +1787,9 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1BC9D..1BC9E ; N # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BC9F ; N # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1BCA0..1BCA3 ; N # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; N # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; N # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG +1CF50..1CFC3 ; N # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; N # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; N # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164 ; N # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE @@ -1754,7 
+1803,7 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1D185..1D18B ; N # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE 1D18C..1D1A9 ; N # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH 1D1AA..1D1AD ; N # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO -1D1AE..1D1E8 ; N # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA ; N # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241 ; N # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D242..1D244 ; N # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME 1D245 ; N # So GREEK MUSICAL LEIMMA @@ -1814,6 +1863,9 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1DA87..1DA8B ; N # Po [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS 1DA9B..1DA9F ; N # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6 1DAA1..1DAAF ; N # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16 +1DF00..1DF09 ; N # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; N # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; N # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E000..1E006 ; N # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE 1E008..1E018 ; N # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU 1E01B..1E021 ; N # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI @@ -1825,10 +1877,16 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER 1E140..1E149 ; N # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE 1E14E ; N # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F ; N # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD ; N # Lo [30] TOTO LETTER PA..TOTO LETTER A +1E2AE ; N # Mn TOTO SIGN RISING TONE 1E2C0..1E2EB ; N # Lo [44] WANCHO 
LETTER AA..WANCHO LETTER YIH 1E2EC..1E2EF ; N # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E2F0..1E2F9 ; N # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE 1E2FF ; N # Sc WANCHO NGUN SIGN +1E7E0..1E7E6 ; N # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; N # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; N # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; N # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; N # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF ; N # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E8D0..1E8D6 ; N # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS @@ -1934,8 +1992,8 @@ FFFC ; N # So OBJECT REPLACEMENT CHARACTER E0001 ; N # Cf LANGUAGE TAG E0020..E007F ; N # Cf [96] TAG SPACE..CANCEL TAG -# The above property value applies to 767414 code points not listed here. -# Total code points: 792699 +# The above property value applies to 766585 code points not listed here. +# Total code points: 792645 # ================================================ @@ -2278,9 +2336,7 @@ FFED..FFEE ; H # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 32B1..32BF ; W # No [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY 32C0..33FF ; W # So [320] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..SQUARE GAL 3400..4DBF ; W # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; W # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -9FFD..9FFF ; W # Cn [3] .. 
-A000..A014 ; W # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; W # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A015 ; W # Lm YI SYLLABLE WU A016..A48C ; W # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A490..A4C6 ; W # So [55] YI RADICAL QOT..YI RADICAL KE @@ -2342,7 +2398,10 @@ FE6A..FE6B ; W # Po [2] SMALL PERCENT SIGN..SMALL COMMERCIAL AT 17000..187F7 ; W # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; W # Lo [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; W # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; W # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1AFF0..1AFF3 ; W # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; W # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; W # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 +1B000..1B122 ; W # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; W # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; W # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; W # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -2379,25 +2438,27 @@ FE6A..FE6B ; W # Po [2] SMALL PERCENT SIGN..SMALL COMMERCIAL AT 1F6CC ; W # So SLEEPING ACCOMMODATION 1F6D0..1F6D2 ; W # So [3] PLACE OF WORSHIP..SHOPPING TROLLEY 1F6D5..1F6D7 ; W # So [3] HINDU TEMPLE..ELEVATOR +1F6DD..1F6DF ; W # So [3] PLAYGROUND SLIDE..RING BUOY 1F6EB..1F6EC ; W # So [2] AIRPLANE DEPARTURE..AIRPLANE ARRIVING 1F6F4..1F6FC ; W # So [9] SCOOTER..ROLLER SKATE 1F7E0..1F7EB ; W # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; W # So HEAVY EQUALS SIGN 1F90C..1F93A ; W # So [47] PINCHED FINGERS..FENCER 1F93C..1F945 ; W # So [10] WRESTLERS..GOAL NET -1F947..1F978 ; W # So [50] FIRST PLACE MEDAL..DISGUISED FACE -1F97A..1F9CB ; W # So [82] FACE WITH PLEADING 
EYES..BUBBLE TEA -1F9CD..1F9FF ; W # So [51] STANDING PERSON..NAZAR AMULET +1F947..1F9FF ; W # So [185] FIRST PLACE MEDAL..NAZAR AMULET 1FA70..1FA74 ; W # So [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A ; W # So [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C ; W # So [5] DROP OF BLOOD..CRUTCH 1FA80..1FA86 ; W # So [7] YO-YO..NESTING DOLLS -1FA90..1FAA8 ; W # So [25] RINGED PLANET..ROCK -1FAB0..1FAB6 ; W # So [7] FLY..FEATHER -1FAC0..1FAC2 ; W # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6 ; W # So [7] BLUEBERRIES..TEAPOT -20000..2A6DD ; W # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A6DE..2A6FF ; W # Cn [34] .. -2A700..2B734 ; W # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 -2B735..2B73F ; W # Cn [11] .. +1FA90..1FAAC ; W # So [29] RINGED PLANET..HAMSA +1FAB0..1FABA ; W # So [11] FLY..NEST WITH EGGS +1FAC0..1FAC5 ; W # So [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9 ; W # So [10] BLUEBERRIES..JAR +1FAE0..1FAE7 ; W # So [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; W # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS +20000..2A6DF ; W # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A6E0..2A6FF ; W # Cn [32] .. +2A700..2B738 ; W # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 +2B739..2B73F ; W # Cn [7] .. 2B740..2B81D ; W # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F ; W # Cn [2] .. 2B820..2CEA1 ; W # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 @@ -2409,7 +2470,7 @@ FE6A..FE6B ; W # Po [2] SMALL PERCENT SIGN..SMALL COMMERCIAL AT 30000..3134A ; W # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 3134B..3FFFD ; W # Cn [60595] .. 
-# Total code points: 182336 +# Total code points: 182390 # ================================================ diff --git a/lib/unicore/extracted/DGeneralCategory.txt b/lib/unicore/extracted/DGeneralCategory.txt index 3e82c7fc53..a36d42a3e8 100644 --- a/lib/unicore/extracted/DGeneralCategory.txt +++ b/lib/unicore/extracted/DGeneralCategory.txt @@ -1,6 +1,6 @@ -# DerivedGeneralCategory-13.0.0.txt -# Date: 2019-10-21, 14:30:32 GMT -# © 2019 Unicode®, Inc. +# DerivedGeneralCategory-14.0.0.txt +# Date: 2021-07-10, 00:35:08 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -27,7 +27,6 @@ 05C8..05CF ; Cn # [8] .. 05EB..05EE ; Cn # [4] .. 05F5..05FF ; Cn # [11] .. -061D ; Cn # 070E ; Cn # 074B..074C ; Cn # [2] .. 07B2..07BF ; Cn # [14] .. @@ -36,9 +35,9 @@ 083F ; Cn # 085C..085D ; Cn # [2] .. 085F ; Cn # -086B..089F ; Cn # [53] .. -08B5 ; Cn # -08C8..08D2 ; Cn # [11] .. +086B..086F ; Cn # [5] .. +088F ; Cn # +0892..0897 ; Cn # [6] .. 0984 ; Cn # 098D..098E ; Cn # [2] .. 0991..0992 ; Cn # [2] .. @@ -116,12 +115,13 @@ 0C0D ; Cn # 0C11 ; Cn # 0C29 ; Cn # -0C3A..0C3C ; Cn # [3] .. +0C3A..0C3B ; Cn # [2] .. 0C45 ; Cn # 0C49 ; Cn # 0C4E..0C54 ; Cn # [7] .. 0C57 ; Cn # -0C5B..0C5F ; Cn # [5] .. +0C5B..0C5C ; Cn # [2] .. +0C5E..0C5F ; Cn # [2] .. 0C64..0C65 ; Cn # [2] .. 0C70..0C76 ; Cn # [7] .. 0C8D ; Cn # @@ -132,7 +132,7 @@ 0CC5 ; Cn # 0CC9 ; Cn # 0CCE..0CD4 ; Cn # [7] .. -0CD7..0CDD ; Cn # [7] .. +0CD7..0CDC ; Cn # [6] .. 0CDF ; Cn # 0CE4..0CE5 ; Cn # [2] .. 0CF0 ; Cn # @@ -200,8 +200,7 @@ 13FE..13FF ; Cn # [2] .. 169D..169F ; Cn # [3] .. 16F9..16FF ; Cn # [7] .. -170D ; Cn # -1715..171F ; Cn # [11] .. +1716..171E ; Cn # [9] .. 1737..173F ; Cn # [9] .. 1754..175F ; Cn # [12] .. 176D ; Cn # @@ -210,7 +209,6 @@ 17DE..17DF ; Cn # [2] .. 17EA..17EF ; Cn # [6] .. 17FA..17FF ; Cn # [6] .. -180F ; Cn # 181A..181F ; Cn # [6] .. 
1879..187F ; Cn # [7] .. 18AB..18AF ; Cn # [5] .. @@ -230,9 +228,9 @@ 1A8A..1A8F ; Cn # [6] .. 1A9A..1A9F ; Cn # [6] .. 1AAE..1AAF ; Cn # [2] .. -1AC1..1AFF ; Cn # [63] .. -1B4C..1B4F ; Cn # [4] .. -1B7D..1B7F ; Cn # [3] .. +1ACF..1AFF ; Cn # [49] .. +1B4D..1B4F ; Cn # [3] .. +1B7F ; Cn # 1BF4..1BFB ; Cn # [8] .. 1C38..1C3A ; Cn # [3] .. 1C4A..1C4C ; Cn # [3] .. @@ -240,7 +238,6 @@ 1CBB..1CBC ; Cn # [2] .. 1CC8..1CCF ; Cn # [8] .. 1CFB..1CFF ; Cn # [5] .. -1DFA ; Cn # 1F16..1F17 ; Cn # [2] .. 1F1E..1F1F ; Cn # [2] .. 1F46..1F47 ; Cn # [2] .. @@ -261,15 +258,13 @@ 2072..2073 ; Cn # [2] .. 208F ; Cn # 209D..209F ; Cn # [3] .. -20C0..20CF ; Cn # [16] .. +20C1..20CF ; Cn # [15] .. 20F1..20FF ; Cn # [15] .. 218C..218F ; Cn # [4] .. 2427..243F ; Cn # [25] .. 244B..245F ; Cn # [21] .. 2B74..2B75 ; Cn # [2] .. 2B96 ; Cn # -2C2F ; Cn # -2C5F ; Cn # 2CF4..2CF8 ; Cn # [5] .. 2D26 ; Cn # 2D28..2D2C ; Cn # [5] .. @@ -285,7 +280,7 @@ 2DCF ; Cn # 2DD7 ; Cn # 2DDF ; Cn # -2E53..2E7F ; Cn # [45] .. +2E5E..2E7F ; Cn # [34] .. 2E9A ; Cn # 2EF4..2EFF ; Cn # [12] .. 2FD6..2FEF ; Cn # [26] .. @@ -297,13 +292,14 @@ 318F ; Cn # 31E4..31EF ; Cn # [12] .. 321F ; Cn # -9FFD..9FFF ; Cn # [3] .. A48D..A48F ; Cn # [3] .. A4C7..A4CF ; Cn # [9] .. A62C..A63F ; Cn # [20] .. A6F8..A6FF ; Cn # [8] .. -A7C0..A7C1 ; Cn # [2] .. -A7CB..A7F4 ; Cn # [42] .. +A7CB..A7CF ; Cn # [5] .. +A7D2 ; Cn # +A7D4 ; Cn # +A7DA..A7F1 ; Cn # [24] .. A82D..A82F ; Cn # [3] .. A83A..A83F ; Cn # [6] .. A878..A87F ; Cn # [8] .. @@ -339,11 +335,10 @@ FB3D ; Cn # FB3F ; Cn # FB42 ; Cn # FB45 ; Cn # -FBC2..FBD2 ; Cn # [17] .. -FD40..FD4F ; Cn # [16] .. +FBC3..FBD2 ; Cn # [16] .. FD90..FD91 ; Cn # [2] .. -FDC8..FDEF ; Cn # [40] .. -FDFE..FDFF ; Cn # [2] .. +FDC8..FDCE ; Cn # [7] .. +FDD0..FDEF ; Cn # [32] .. FE1A..FE1F ; Cn # [6] .. FE53 ; Cn # FE67 ; Cn # @@ -387,10 +382,20 @@ FFFE..FFFF ; Cn # [2] .. 104FC..104FF ; Cn # [4] .. 10528..1052F ; Cn # [8] .. 10564..1056E ; Cn # [11] .. -10570..105FF ; Cn # [144] .. 
+1057B ; Cn # +1058B ; Cn # +10593 ; Cn # +10596 ; Cn # +105A2 ; Cn # +105B2 ; Cn # +105BA ; Cn # +105BD..105FF ; Cn # [67] .. 10737..1073F ; Cn # [9] .. 10756..1075F ; Cn # [10] .. -10768..107FF ; Cn # [152] .. +10768..1077F ; Cn # [24] .. +10786 ; Cn # +107B1 ; Cn # +107BB..107FF ; Cn # [69] .. 10806..10807 ; Cn # [2] .. 10809 ; Cn # 10836 ; Cn # @@ -433,12 +438,13 @@ FFFE..FFFF ; Cn # [2] .. 10EAE..10EAF ; Cn # [2] .. 10EB2..10EFF ; Cn # [78] .. 10F28..10F2F ; Cn # [8] .. -10F5A..10FAF ; Cn # [86] .. +10F5A..10F6F ; Cn # [22] .. +10F8A..10FAF ; Cn # [38] .. 10FCC..10FDF ; Cn # [20] .. 10FF7..10FFF ; Cn # [9] .. 1104E..11051 ; Cn # [4] .. -11070..1107E ; Cn # [15] .. -110C2..110CC ; Cn # [11] .. +11076..1107E ; Cn # [9] .. +110C3..110CC ; Cn # [10] .. 110CE..110CF ; Cn # [2] .. 110E9..110EF ; Cn # [7] .. 110FA..110FF ; Cn # [6] .. @@ -480,11 +486,11 @@ FFFE..FFFF ; Cn # [2] .. 11645..1164F ; Cn # [11] .. 1165A..1165F ; Cn # [6] .. 1166D..1167F ; Cn # [19] .. -116B9..116BF ; Cn # [7] .. +116BA..116BF ; Cn # [6] .. 116CA..116FF ; Cn # [54] .. 1171B..1171C ; Cn # [2] .. 1172C..1172F ; Cn # [4] .. -11740..117FF ; Cn # [192] .. +11747..117FF ; Cn # [185] .. 1183C..1189F ; Cn # [100] .. 118F3..118FE ; Cn # [12] .. 11907..11908 ; Cn # [2] .. @@ -499,7 +505,7 @@ FFFE..FFFF ; Cn # [2] .. 119D8..119D9 ; Cn # [2] .. 119E5..119FF ; Cn # [27] .. 11A48..11A4F ; Cn # [8] .. -11AA3..11ABF ; Cn # [29] .. +11AA3..11AAF ; Cn # [13] .. 11AF9..11BFF ; Cn # [263] .. 11C09 ; Cn # 11C37 ; Cn # @@ -527,14 +533,16 @@ FFFE..FFFF ; Cn # [2] .. 1239A..123FF ; Cn # [102] .. 1246F ; Cn # 12475..1247F ; Cn # [11] .. -12544..12FFF ; Cn # [2748] .. +12544..12F8F ; Cn # [2636] .. +12FF3..12FFF ; Cn # [13] .. 1342F ; Cn # 13439..143FF ; Cn # [4039] .. 14647..167FF ; Cn # [8633] .. 16A39..16A3F ; Cn # [7] .. 16A5F ; Cn # 16A6A..16A6D ; Cn # [4] .. -16A70..16ACF ; Cn # [96] .. +16ABF ; Cn # +16ACA..16ACF ; Cn # [6] .. 16AEE..16AEF ; Cn # [2] .. 16AF6..16AFF ; Cn # [10] .. 16B46..16B4F ; Cn # [10] .. 
@@ -550,8 +558,11 @@ FFFE..FFFF ; Cn # [2] .. 16FF2..16FFF ; Cn # [14] .. 187F8..187FF ; Cn # [8] .. 18CD6..18CFF ; Cn # [42] .. -18D09..1AFFF ; Cn # [8951] .. -1B11F..1B14F ; Cn # [49] .. +18D09..1AFEF ; Cn # [8935] .. +1AFF4 ; Cn # +1AFFC ; Cn # +1AFFF ; Cn # +1B123..1B14F ; Cn # [45] .. 1B153..1B163 ; Cn # [17] .. 1B168..1B16F ; Cn # [8] .. 1B2FC..1BBFF ; Cn # [2308] .. @@ -559,10 +570,13 @@ FFFE..FFFF ; Cn # [2] .. 1BC7D..1BC7F ; Cn # [3] .. 1BC89..1BC8F ; Cn # [7] .. 1BC9A..1BC9B ; Cn # [2] .. -1BCA4..1CFFF ; Cn # [4956] .. +1BCA4..1CEFF ; Cn # [4700] .. +1CF2E..1CF2F ; Cn # [2] .. +1CF47..1CF4F ; Cn # [9] .. +1CFC4..1CFFF ; Cn # [60] .. 1D0F6..1D0FF ; Cn # [10] .. 1D127..1D128 ; Cn # [2] .. -1D1E9..1D1FF ; Cn # [23] .. +1D1EB..1D1FF ; Cn # [21] .. 1D246..1D2DF ; Cn # [154] .. 1D2F4..1D2FF ; Cn # [12] .. 1D357..1D35F ; Cn # [9] .. @@ -589,7 +603,8 @@ FFFE..FFFF ; Cn # [2] .. 1D7CC..1D7CD ; Cn # [2] .. 1DA8C..1DA9A ; Cn # [15] .. 1DAA0 ; Cn # -1DAB0..1DFFF ; Cn # [1360] .. +1DAB0..1DEFF ; Cn # [1104] .. +1DF1F..1DFFF ; Cn # [225] .. 1E007 ; Cn # 1E019..1E01A ; Cn # [2] .. 1E022 ; Cn # @@ -598,9 +613,14 @@ FFFE..FFFF ; Cn # [2] .. 1E12D..1E12F ; Cn # [3] .. 1E13E..1E13F ; Cn # [2] .. 1E14A..1E14D ; Cn # [4] .. -1E150..1E2BF ; Cn # [368] .. +1E150..1E28F ; Cn # [320] .. +1E2AF..1E2BF ; Cn # [17] .. 1E2FA..1E2FE ; Cn # [5] .. -1E300..1E7FF ; Cn # [1280] .. +1E300..1E7DF ; Cn # [1248] .. +1E7E7 ; Cn # +1E7EC ; Cn # +1E7EF ; Cn # +1E7FF ; Cn # 1E8C5..1E8C6 ; Cn # [2] .. 1E8D7..1E8FF ; Cn # [41] .. 1E94C..1E94F ; Cn # [4] .. @@ -654,34 +674,35 @@ FFFE..FFFF ; Cn # [2] .. 1F249..1F24F ; Cn # [7] .. 1F252..1F25F ; Cn # [14] .. 1F266..1F2FF ; Cn # [154] .. -1F6D8..1F6DF ; Cn # [8] .. +1F6D8..1F6DC ; Cn # [5] .. 1F6ED..1F6EF ; Cn # [3] .. 1F6FD..1F6FF ; Cn # [3] .. 1F774..1F77F ; Cn # [12] .. 1F7D9..1F7DF ; Cn # [7] .. -1F7EC..1F7FF ; Cn # [20] .. +1F7EC..1F7EF ; Cn # [4] .. +1F7F1..1F7FF ; Cn # [15] .. 1F80C..1F80F ; Cn # [4] .. 1F848..1F84F ; Cn # [8] .. 
1F85A..1F85F ; Cn # [6] .. 1F888..1F88F ; Cn # [8] .. 1F8AE..1F8AF ; Cn # [2] .. 1F8B2..1F8FF ; Cn # [78] .. -1F979 ; Cn # -1F9CC ; Cn # 1FA54..1FA5F ; Cn # [12] .. 1FA6E..1FA6F ; Cn # [2] .. 1FA75..1FA77 ; Cn # [3] .. -1FA7B..1FA7F ; Cn # [5] .. +1FA7D..1FA7F ; Cn # [3] .. 1FA87..1FA8F ; Cn # [9] .. -1FAA9..1FAAF ; Cn # [7] .. -1FAB7..1FABF ; Cn # [9] .. -1FAC3..1FACF ; Cn # [13] .. -1FAD7..1FAFF ; Cn # [41] .. +1FAAD..1FAAF ; Cn # [3] .. +1FABB..1FABF ; Cn # [5] .. +1FAC6..1FACF ; Cn # [10] .. +1FADA..1FADF ; Cn # [6] .. +1FAE8..1FAEF ; Cn # [8] .. +1FAF7..1FAFF ; Cn # [9] .. 1FB93 ; Cn # 1FBCB..1FBEF ; Cn # [37] .. 1FBFA..1FFFF ; Cn # [1030] .. -2A6DE..2A6FF ; Cn # [34] .. -2B735..2B73F ; Cn # [11] .. +2A6E0..2A6FF ; Cn # [32] .. +2B739..2B73F ; Cn # [7] .. 2B81E..2B81F ; Cn # [2] .. 2CEA2..2CEAF ; Cn # [14] .. 2EBE1..2F7FF ; Cn # [3103] .. @@ -693,7 +714,7 @@ E01F0..EFFFF ; Cn # [65040] .. FFFFE..FFFFF ; Cn # [2] .. 10FFFE..10FFFF; Cn # [2] .. -# Total code points: 830672 +# Total code points: 829834 # ================================================ @@ -1130,7 +1151,7 @@ FFFFE..FFFFF ; Cn # [2] .. 
213E..213F ; Lu # [2] DOUBLE-STRUCK CAPITAL GAMMA..DOUBLE-STRUCK CAPITAL PI 2145 ; Lu # DOUBLE-STRUCK ITALIC CAPITAL D 2183 ; Lu # ROMAN NUMERAL REVERSED ONE HUNDRED -2C00..2C2E ; Lu # [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE +2C00..2C2F ; Lu # [48] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER CAUDATE CHRIVI 2C60 ; Lu # LATIN CAPITAL LETTER L WITH DOUBLE BAR 2C62..2C64 ; Lu # [3] LATIN CAPITAL LETTER L WITH MIDDLE TILDE..LATIN CAPITAL LETTER R WITH TAIL 2C67 ; Lu # LATIN CAPITAL LETTER H WITH DESCENDER @@ -1295,13 +1316,21 @@ A7B8 ; Lu # LATIN CAPITAL LETTER U WITH STROKE A7BA ; Lu # LATIN CAPITAL LETTER GLOTTAL A A7BC ; Lu # LATIN CAPITAL LETTER GLOTTAL I A7BE ; Lu # LATIN CAPITAL LETTER GLOTTAL U +A7C0 ; Lu # LATIN CAPITAL LETTER OLD POLISH O A7C2 ; Lu # LATIN CAPITAL LETTER ANGLICANA W A7C4..A7C7 ; Lu # [4] LATIN CAPITAL LETTER C WITH PALATAL HOOK..LATIN CAPITAL LETTER D WITH SHORT STROKE OVERLAY A7C9 ; Lu # LATIN CAPITAL LETTER S WITH SHORT STROKE OVERLAY +A7D0 ; Lu # LATIN CAPITAL LETTER CLOSED INSULAR G +A7D6 ; Lu # LATIN CAPITAL LETTER MIDDLE SCOTS S +A7D8 ; Lu # LATIN CAPITAL LETTER SIGMOID S A7F5 ; Lu # LATIN CAPITAL LETTER REVERSED HALF H FF21..FF3A ; Lu # [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z 10400..10427 ; Lu # [40] DESERET CAPITAL LETTER LONG I..DESERET CAPITAL LETTER EW 104B0..104D3 ; Lu # [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA +10570..1057A ; Lu # [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; Lu # [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; Lu # [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; Lu # [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE 10C80..10CB2 ; Lu # [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US 118A0..118BF ; Lu # [32] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI CAPITAL LETTER VIYO 16E40..16E5F ; Lu # [32] MEDEFAIDRIN 
CAPITAL LETTER M..MEDEFAIDRIN CAPITAL LETTER Y @@ -1338,7 +1367,7 @@ FF21..FF3A ; Lu # [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAP 1D7CA ; Lu # MATHEMATICAL BOLD CAPITAL DIGAMMA 1E900..1E921 ; Lu # [34] ADLAM CAPITAL LETTER ALIF..ADLAM CAPITAL LETTER SHA -# Total code points: 1791 +# Total code points: 1831 # ================================================ @@ -1775,7 +1804,7 @@ FF21..FF3A ; Lu # [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAP 2146..2149 ; Ll # [4] DOUBLE-STRUCK ITALIC SMALL D..DOUBLE-STRUCK ITALIC SMALL J 214E ; Ll # TURNED SMALL F 2184 ; Ll # LATIN SMALL LETTER REVERSED C -2C30..2C5E ; Ll # [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE +2C30..2C5F ; Ll # [48] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI 2C61 ; Ll # LATIN SMALL LETTER L WITH DOUBLE BAR 2C65..2C66 ; Ll # [2] LATIN SMALL LETTER A WITH STROKE..LATIN SMALL LETTER T WITH DIAGONAL STROKE 2C68 ; Ll # LATIN SMALL LETTER H WITH DESCENDER @@ -1944,9 +1973,15 @@ A7B9 ; Ll # LATIN SMALL LETTER U WITH STROKE A7BB ; Ll # LATIN SMALL LETTER GLOTTAL A A7BD ; Ll # LATIN SMALL LETTER GLOTTAL I A7BF ; Ll # LATIN SMALL LETTER GLOTTAL U +A7C1 ; Ll # LATIN SMALL LETTER OLD POLISH O A7C3 ; Ll # LATIN SMALL LETTER ANGLICANA W A7C8 ; Ll # LATIN SMALL LETTER D WITH SHORT STROKE OVERLAY A7CA ; Ll # LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D1 ; Ll # LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; Ll # LATIN SMALL LETTER DOUBLE THORN +A7D5 ; Ll # LATIN SMALL LETTER DOUBLE WYNN +A7D7 ; Ll # LATIN SMALL LETTER MIDDLE SCOTS S +A7D9 ; Ll # LATIN SMALL LETTER SIGMOID S A7F6 ; Ll # LATIN SMALL LETTER REVERSED HALF H A7FA ; Ll # LATIN LETTER SMALL CAPITAL TURNED M AB30..AB5A ; Ll # [43] LATIN SMALL LETTER BARRED ALPHA..LATIN SMALL LETTER Y WITH SHORT RIGHT LEG @@ -1957,6 +1992,10 @@ FB13..FB17 ; Ll # [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN SMALL LIGAT FF41..FF5A ; Ll # [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL 
LETTER Z 10428..1044F ; Ll # [40] DESERET SMALL LETTER LONG I..DESERET SMALL LETTER EW 104D8..104FB ; Ll # [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA +10597..105A1 ; Ll # [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; Ll # [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; Ll # [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; Ll # [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10CC0..10CF2 ; Ll # [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US 118C0..118DF ; Ll # [32] WARANG CITI SMALL LETTER NGAA..WARANG CITI SMALL LETTER VIYO 16E60..16E7F ; Ll # [32] MEDEFAIDRIN SMALL LETTER M..MEDEFAIDRIN SMALL LETTER Y @@ -1988,9 +2027,11 @@ FF41..FF5A ; Ll # [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL 1D7AA..1D7C2 ; Ll # [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA 1D7C4..1D7C9 ; Ll # [6] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC PI SYMBOL 1D7CB ; Ll # MATHEMATICAL BOLD SMALL DIGAMMA +1DF00..1DF09 ; Ll # [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0B..1DF1E ; Ll # [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E922..1E943 ; Ll # [34] ADLAM SMALL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 2155 +# Total code points: 2227 # ================================================ @@ -2028,6 +2069,7 @@ FF41..FF5A ; Ll # [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL 081A ; Lm # SAMARITAN MODIFIER LETTER EPENTHETIC YUT 0824 ; Lm # SAMARITAN MODIFIER LETTER SHORT A 0828 ; Lm # SAMARITAN MODIFIER LETTER I +08C9 ; Lm # ARABIC SMALL FARSI YEH 0971 ; Lm # DEVANAGARI SIGN HIGH SPACING DOT 0E46 ; Lm # THAI CHARACTER MAIYAMOK 0EC6 ; Lm # LAO KO LA @@ -2058,6 +2100,7 @@ A69C..A69D ; Lm # [2] MODIFIER LETTER CYRILLIC HARD SIGN..MODIFIER LETTER C A717..A71F ; Lm # [9] 
MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOW INVERTED EXCLAMATION MARK A770 ; Lm # MODIFIER LETTER US A788 ; Lm # MODIFIER LETTER LOW CIRCUMFLEX ACCENT +A7F2..A7F4 ; Lm # [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F8..A7F9 ; Lm # [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE A9CF ; Lm # JAVANESE PANGRANGKEP A9E6 ; Lm # MYANMAR MODIFIER LETTER SHAN REDUPLICATION @@ -2068,14 +2111,20 @@ AB5C..AB5F ; Lm # [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U W AB69 ; Lm # MODIFIER LETTER SMALL TURNED W FF70 ; Lm # HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK +10780..10785 ; Lm # [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; Lm # [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; Lm # [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 16B40..16B43 ; Lm # [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM 16F93..16F9F ; Lm # [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 16FE0..16FE1 ; Lm # [2] TANGUT ITERATION MARK..NUSHU ITERATION MARK 16FE3 ; Lm # OLD CHINESE ITERATION MARK +1AFF0..1AFF3 ; Lm # [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; Lm # [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; Lm # [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1E137..1E13D ; Lm # [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E94B ; Lm # ADLAM NASALIZATION MARK -# Total code points: 260 +# Total code points: 334 # ================================================ @@ -2104,8 +2153,9 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 0800..0815 ; Lo # [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF 0840..0858 ; Lo # [25] 
MANDAIC LETTER HALQA..MANDAIC LETTER AIN 0860..086A ; Lo # [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; Lo # [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; Lo # [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; Lo # [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0889..088E ; Lo # [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +08A0..08C8 ; Lo # [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF 0904..0939 ; Lo # [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; Lo # DEVANAGARI SIGN AVAGRAHA 0950 ; Lo # DEVANAGARI OM @@ -2170,6 +2220,7 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 0C2A..0C39 ; Lo # [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; Lo # TELUGU SIGN AVAGRAHA 0C58..0C5A ; Lo # [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; Lo # TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; Lo # [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C80 ; Lo # KANNADA SIGN SPACING CANDRABINDU 0C85..0C8C ; Lo # [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L @@ -2178,7 +2229,7 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 0CAA..0CB3 ; Lo # [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; Lo # [5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; Lo # KANNADA SIGN AVAGRAHA -0CDE ; Lo # KANNADA LETTER FA +0CDD..0CDE ; Lo # [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; Lo # [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; Lo # [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; Lo # [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -2242,9 +2293,8 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 1681..169A ; Lo # [26] OGHAM LETTER BEITH..OGHAM LETTER PEITH 16A0..16EA ; Lo # [75] RUNIC LETTER FEHU FEOH FE F..RUNIC 
LETTER X 16F1..16F8 ; Lo # [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; Lo # [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; Lo # [4] TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; Lo # [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; Lo # [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; Lo # [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; Lo # [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; Lo # [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; Lo # [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -2264,7 +2314,7 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 1A00..1A16 ; Lo # [23] BUGINESE LETTER KA..BUGINESE LETTER HA 1A20..1A54 ; Lo # [53] TAI THAM LETTER HIGH KA..TAI THAM LETTER GREAT SA 1B05..1B33 ; Lo # [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; Lo # [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; Lo # [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B83..1BA0 ; Lo # [30] SUNDANESE LETTER A..SUNDANESE LETTER HA 1BAE..1BAF ; Lo # [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA 1BBA..1BE5 ; Lo # [44] SUNDANESE AVAGRAHA..BATAK LETTER U @@ -2297,8 +2347,7 @@ FF9E..FF9F ; Lm # [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAK 31A0..31BF ; Lo # [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH 31F0..31FF ; Lo # [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO 3400..4DBF ; Lo # [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; Lo # [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -A000..A014 ; Lo # [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; Lo # [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A016..A48C ; Lo # [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A4D0..A4F7 ; Lo # [40] LISU LETTER BA..LISU LETTER OE A500..A60B ; Lo # [268] VAI SYLLABLE EE..VAI SYLLABLE NG @@ -2426,9 +2475,12 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 
10F00..10F1C ; Lo # [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL 10F27 ; Lo # OLD SOGDIAN LIGATURE AYIN-DALETH 10F30..10F45 ; Lo # [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN +10F70..10F81 ; Lo # [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH 10FB0..10FC4 ; Lo # [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FE0..10FF6 ; Lo # [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; Lo # [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA +11071..11072 ; Lo # [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; Lo # BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; Lo # [45] KAITHI LETTER A..KAITHI LETTER HA 110D0..110E8 ; Lo # [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE 11103..11126 ; Lo # [36] CHAKMA LETTER AA..CHAKMA LETTER HAA @@ -2470,6 +2522,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 11680..116AA ; Lo # [43] TAKRI LETTER A..TAKRI LETTER RRA 116B8 ; Lo # TAKRI LETTER ARCHAIC KHA 11700..1171A ; Lo # [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA +11740..11746 ; Lo # [7] AHOM LETTER CA..AHOM LETTER LLA 11800..1182B ; Lo # [44] DOGRA LETTER A..DOGRA LETTER RRA 118FF..11906 ; Lo # [8] WARANG CITI OM..DIVES AKURU LETTER E 11909 ; Lo # DIVES AKURU LETTER O @@ -2488,7 +2541,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 11A50 ; Lo # SOYOMBO LETTER A 11A5C..11A89 ; Lo # [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; Lo # SOYOMBO MARK PLUTA -11AC0..11AF8 ; Lo # [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; Lo # [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; Lo # [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; Lo # [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; Lo # BHAIKSUKI SIGN AVAGRAHA @@ -2505,10 +2558,12 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 11FB0 
; Lo # LISU LETTER YHA 12000..12399 ; Lo # [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12480..12543 ; Lo # [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; Lo # [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 13000..1342E ; Lo # [1071] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH AA032 14400..14646 ; Lo # [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; Lo # [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; Lo # [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; Lo # [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; Lo # [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; Lo # [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B63..16B77 ; Lo # [21] PAHAWH HMONG SIGN VOS LUB..PAHAWH HMONG SIGN CIM NRES TOS @@ -2518,7 +2573,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 17000..187F7 ; Lo # [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18CD5 ; Lo # [1238] TANGUT COMPONENT-001..KHITAN SMALL SCRIPT CHARACTER-18CD5 18D00..18D08 ; Lo # [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; Lo # [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1B000..1B122 ; Lo # [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B150..1B152 ; Lo # [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO 1B164..1B167 ; Lo # [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N 1B170..1B2FB ; Lo # [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB @@ -2526,9 +2581,15 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 1BC70..1BC7C ; Lo # [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK 1BC80..1BC88 ; Lo # [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; Lo # [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW +1DF0A ; Lo # LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK 1E100..1E12C ; Lo # 
[45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E14E ; Lo # NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ +1E290..1E2AD ; Lo # [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; Lo # [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; Lo # [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; Lo # [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; Lo # [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; Lo # [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; Lo # [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1EE00..1EE03 ; Lo # [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL 1EE05..1EE1F ; Lo # [27] ARABIC MATHEMATICAL WAW..ARABIC MATHEMATICAL DOTLESS QAF @@ -2563,15 +2624,15 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 1EEA1..1EEA3 ; Lo # [3] ARABIC MATHEMATICAL DOUBLE-STRUCK BEH..ARABIC MATHEMATICAL DOUBLE-STRUCK DAL 1EEA5..1EEA9 ; Lo # [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH 1EEAB..1EEBB ; Lo # [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN -20000..2A6DD ; Lo # [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A700..2B734 ; Lo # [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 +20000..2A6DF ; Lo # [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A700..2B738 ; Lo # [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 2B740..2B81D ; Lo # [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B820..2CEA1 ; Lo # [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 2CEB0..2EBE0 ; Lo # [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0 2F800..2FA1D ; Lo # [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D 30000..3134A ; Lo # [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A -# Total code 
points: 127004 +# Total code points: 127333 # ================================================ @@ -2601,7 +2662,8 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 0825..0827 ; Mn # [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; Mn # [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; Mn # [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; Mn # [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; Mn # [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; Mn # [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; Mn # [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 093A ; Mn # DEVANAGARI VOWEL SIGN OE 093C ; Mn # DEVANAGARI SIGN NUKTA @@ -2642,6 +2704,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 0BCD ; Mn # TAMIL SIGN VIRAMA 0C00 ; Mn # TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C04 ; Mn # TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; Mn # TELUGU SIGN NUKTA 0C3E..0C40 ; Mn # [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C46..0C48 ; Mn # [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; Mn # [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA @@ -2691,7 +2754,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 109D ; Mn # MYANMAR VOWEL SIGN AITON AI 135D..135F ; Mn # [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; Mn # [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; Mn # [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; Mn # [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U 1752..1753 ; Mn # [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; Mn # [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; Mn # [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -2700,6 +2763,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 
17C9..17D3 ; Mn # [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; Mn # KHMER SIGN ATTHACAN 180B..180D ; Mn # [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; Mn # MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; Mn # [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; Mn # MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; Mn # [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -2716,7 +2780,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 1A73..1A7C ; Mn # [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN 1A7F ; Mn # TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; Mn # [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW -1ABF..1AC0 ; Mn # [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; Mn # [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; Mn # [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B34 ; Mn # BALINESE SIGN REREKAN 1B36..1B3A ; Mn # [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA @@ -2739,8 +2803,7 @@ FFDA..FFDC ; Lo # [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I 1CED ; Mn # VEDIC SIGN TIRYAK 1CF4 ; Mn # VEDIC TONE CANDRA ABOVE 1CF8..1CF9 ; Mn # [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; Mn # [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; Mn # [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; Mn # [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 20D0..20DC ; Mn # [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE 20E1 ; Mn # COMBINING LEFT RIGHT ARROW ABOVE 20E5..20F0 ; Mn # [12] COMBINING REVERSE SOLIDUS OVERLAY..COMBINING ASTERISK ABOVE @@ -2799,11 +2862,15 @@ FE20..FE2F ; Mn # [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITL 
10D24..10D27 ; Mn # [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; Mn # [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; Mn # [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; Mn # [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11001 ; Mn # BRAHMI SIGN ANUSVARA 11038..11046 ; Mn # [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; Mn # BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; Mn # [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; Mn # [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 110B3..110B6 ; Mn # [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B9..110BA ; Mn # [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; Mn # KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; Mn # [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; Mn # [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112D..11134 ; Mn # [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA @@ -2883,6 +2950,8 @@ FE20..FE2F ; Mn # [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITL 16F8F..16F92 ; Mn # [4] MIAO TONE RIGHT..MIAO TONE BELOW 16FE4 ; Mn # KHITAN SMALL SCRIPT FILLER 1BC9D..1BC9E ; Mn # [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK +1CF00..1CF2D ; Mn # [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; Mn # [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D167..1D169 ; Mn # [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D17B..1D182 ; Mn # [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE 1D185..1D18B ; Mn # [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE @@ -2900,12 +2969,13 @@ FE20..FE2F ; Mn # [16] COMBINING LIGATURE LEFT HALF..COMBINING CYRILLIC TITL 1E023..1E024 ; Mn # [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; Mn # 
[5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; Mn # [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; Mn # TOTO SIGN RISING TONE 1E2EC..1E2EF ; Mn # [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; Mn # [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; Mn # [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA E0100..E01EF ; Mn # [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 1839 +# Total code points: 1950 # ================================================ @@ -2980,6 +3050,8 @@ A670..A672 ; Me # [3] COMBINING CYRILLIC TEN MILLIONS SIGN..COMBINING CYRIL 1087..108C ; Mc # [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3 108F ; Mc # MYANMAR SIGN RUMAI PALAUNG TONE-5 109A..109C ; Mc # [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A +1715 ; Mc # TAGALOG SIGN PAMUDPOD +1734 ; Mc # HANUNOO SIGN PAMUDPOD 17B6 ; Mc # KHMER VOWEL SIGN AA 17BE..17C5 ; Mc # [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU 17C7..17C8 ; Mc # [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU @@ -3099,7 +3171,7 @@ ABEC ; Mc # MEETEI MAYEK LUM IYEK 1D165..1D166 ; Mc # [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D16D..1D172 ; Mc # [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 -# Total code points: 443 +# Total code points: 445 # ================================================ @@ -3160,6 +3232,7 @@ FF10..FF19 ; Nd # [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 11D50..11D59 ; Nd # [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11DA0..11DA9 ; Nd # [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE 16A60..16A69 ; Nd # [10] MRO DIGIT ZERO..MRO DIGIT NINE +16AC0..16AC9 ; Nd # [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Nd # [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 1D7CE..1D7FF ; Nd # [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 
1E140..1E149 ; Nd # [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -3167,7 +3240,7 @@ FF10..FF19 ; Nd # [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Nd # [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Nd # [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 650 +# Total code points: 660 # ================================================ @@ -3314,6 +3387,7 @@ A830..A835 ; No # [6] NORTH INDIC FRACTION ONE QUARTER..NORTH INDIC FRACTIO 061C ; Cf # ARABIC LETTER MARK 06DD ; Cf # ARABIC END OF AYAH 070F ; Cf # SYRIAC ABBREVIATION MARK +0890..0891 ; Cf # [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE 08E2 ; Cf # ARABIC DISPUTED END OF AYAH 180E ; Cf # MONGOLIAN VOWEL SEPARATOR 200B..200F ; Cf # [5] ZERO WIDTH SPACE..RIGHT-TO-LEFT MARK @@ -3330,7 +3404,7 @@ FFF9..FFFB ; Cf # [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATION E0001 ; Cf # LANGUAGE TAG E0020..E007F ; Cf # [96] TAG SPACE..CANCEL TAG -# Total code points: 161 +# Total code points: 163 # ================================================ @@ -3364,6 +3438,7 @@ D800..DFFF ; Cs # [2048] .. 
2E1A ; Pd # HYPHEN WITH DIAERESIS 2E3A..2E3B ; Pd # [2] TWO-EM DASH..THREE-EM DASH 2E40 ; Pd # DOUBLE HYPHEN +2E5D ; Pd # OBLIQUE HYPHEN 301C ; Pd # WAVE DASH 3030 ; Pd # WAVY DASH 30A0 ; Pd # KATAKANA-HIRAGANA DOUBLE HYPHEN @@ -3373,7 +3448,7 @@ FE63 ; Pd # SMALL HYPHEN-MINUS FF0D ; Pd # FULLWIDTH HYPHEN-MINUS 10EAD ; Pd # YEZIDI HYPHENATION MARK -# Total code points: 25 +# Total code points: 26 # ================================================ @@ -3425,6 +3500,10 @@ FF0D ; Pd # FULLWIDTH HYPHEN-MINUS 2E26 ; Ps # LEFT SIDEWAYS U BRACKET 2E28 ; Ps # LEFT DOUBLE PARENTHESIS 2E42 ; Ps # DOUBLE LOW-REVERSED-9 QUOTATION MARK +2E55 ; Ps # LEFT SQUARE BRACKET WITH STROKE +2E57 ; Ps # LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; Ps # TOP HALF LEFT PARENTHESIS +2E5B ; Ps # BOTTOM HALF LEFT PARENTHESIS 3008 ; Ps # LEFT ANGLE BRACKET 300A ; Ps # LEFT DOUBLE ANGLE BRACKET 300C ; Ps # LEFT CORNER BRACKET @@ -3455,7 +3534,7 @@ FF5B ; Ps # FULLWIDTH LEFT CURLY BRACKET FF5F ; Ps # FULLWIDTH LEFT WHITE PARENTHESIS FF62 ; Ps # HALFWIDTH LEFT CORNER BRACKET -# Total code points: 75 +# Total code points: 79 # ================================================ @@ -3504,6 +3583,10 @@ FF62 ; Ps # HALFWIDTH LEFT CORNER BRACKET 2E25 ; Pe # BOTTOM RIGHT HALF BRACKET 2E27 ; Pe # RIGHT SIDEWAYS U BRACKET 2E29 ; Pe # RIGHT DOUBLE PARENTHESIS +2E56 ; Pe # RIGHT SQUARE BRACKET WITH STROKE +2E58 ; Pe # RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E5A ; Pe # TOP HALF RIGHT PARENTHESIS +2E5C ; Pe # BOTTOM HALF RIGHT PARENTHESIS 3009 ; Pe # RIGHT ANGLE BRACKET 300B ; Pe # RIGHT DOUBLE ANGLE BRACKET 300D ; Pe # RIGHT CORNER BRACKET @@ -3534,7 +3617,7 @@ FF5D ; Pe # FULLWIDTH RIGHT CURLY BRACKET FF60 ; Pe # FULLWIDTH RIGHT WHITE PARENTHESIS FF63 ; Pe # HALFWIDTH RIGHT CORNER BRACKET -# Total code points: 73 +# Total code points: 77 # ================================================ @@ -3576,7 +3659,7 @@ FF3F ; Pc # FULLWIDTH LOW LINE 0609..060A ; Po # [2] ARABIC-INDIC PER MILLE SIGN..ARABIC-INDIC PER 
TEN THOUSAND SIGN 060C..060D ; Po # [2] ARABIC COMMA..ARABIC DATE SEPARATOR 061B ; Po # ARABIC SEMICOLON -061E..061F ; Po # [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; Po # [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 066A..066D ; Po # [4] ARABIC PERCENT SIGN..ARABIC FIVE POINTED STAR 06D4 ; Po # ARABIC FULL STOP 0700..070D ; Po # [14] SYRIAC END OF PARAGRAPH..SYRIAC HARKLEAN ASTERISCUS @@ -3613,6 +3696,7 @@ FF3F ; Pc # FULLWIDTH LOW LINE 1AA0..1AA6 ; Po # [7] TAI THAM SIGN WIANG..TAI THAM SIGN REVERSED ROTATED RANA 1AA8..1AAD ; Po # [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG 1B5A..1B60 ; Po # [7] BALINESE PANTI..BALINESE PAMENENG +1B7D..1B7E ; Po # [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG 1BFC..1BFF ; Po # [4] BATAK SYMBOL BINDU NA METEK..BATAK SYMBOL BINDU PANGOLAT 1C3B..1C3F ; Po # [5] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION TSHOOK 1C7E..1C7F ; Po # [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD @@ -3641,7 +3725,7 @@ FF3F ; Pc # FULLWIDTH LOW LINE 2E3C..2E3F ; Po # [4] STENOGRAPHIC FULL STOP..CAPITULUM 2E41 ; Po # REVERSED COMMA 2E43..2E4F ; Po # [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER -2E52 ; Po # TIRONIAN SIGN CAPITAL ET +2E52..2E54 ; Po # [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK 3001..3003 ; Po # [3] IDEOGRAPHIC COMMA..DITTO MARK 303D ; Po # PART ALTERNATION MARK 30FB ; Po # KATAKANA MIDDLE DOT @@ -3695,6 +3779,7 @@ FF64..FF65 ; Po # [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDL 10B39..10B3F ; Po # [7] AVESTAN ABBREVIATION MARK..LARGE ONE RING OVER TWO RINGS PUNCTUATION 10B99..10B9C ; Po # [4] PSALTER PAHLAVI SECTION MARK..PSALTER PAHLAVI FOUR DOTS WITH DOT 10F55..10F59 ; Po # [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F86..10F89 ; Po # [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 11047..1104D ; Po # [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS 110BB..110BC ; Po # [2] KAITHI ABBREVIATION 
SIGN..KAITHI ENUMERATION SIGN 110BE..110C1 ; Po # [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA @@ -3713,6 +3798,7 @@ FF64..FF65 ; Po # [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDL 115C1..115D7 ; Po # [23] SIDDHAM SIGN SIDDHAM..SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES 11641..11643 ; Po # [3] MODI DANDA..MODI ABBREVIATION SIGN 11660..1166C ; Po # [13] MONGOLIAN BIRGA WITH ORNAMENT..MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT +116B9 ; Po # TAKRI ABBREVIATION SIGN 1173C..1173E ; Po # [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI 1183B ; Po # DOGRA ABBREVIATION SIGN 11944..11946 ; Po # [3] DIVES AKURU DOUBLE DANDA..DIVES AKURU END OF TEXT MARK @@ -3725,6 +3811,7 @@ FF64..FF65 ; Po # [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDL 11EF7..11EF8 ; Po # [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION 11FFF ; Po # TAMIL PUNCTUATION END OF TEXT 12470..12474 ; Po # [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON +12FF1..12FF2 ; Po # [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 16A6E..16A6F ; Po # [2] MRO DANDA..MRO DOUBLE DANDA 16AF5 ; Po # BASSA VAH FULL STOP 16B37..16B3B ; Po # [5] PAHAWH HMONG SIGN VOS THOM..PAHAWH HMONG SIGN VOS FEEM @@ -3735,7 +3822,7 @@ FF64..FF65 ; Po # [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDL 1DA87..1DA8B ; Po # [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS 1E95E..1E95F ; Po # [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK -# Total code points: 593 +# Total code points: 605 # ================================================ @@ -3823,7 +3910,7 @@ FFE9..FFEC ; Sm # [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS ARROW 0BF9 ; Sc # TAMIL RUPEE SIGN 0E3F ; Sc # THAI CURRENCY SYMBOL BAHT 17DB ; Sc # KHMER CURRENCY SYMBOL RIEL -20A0..20BF ; Sc # [32] EURO-CURRENCY SIGN..BITCOIN SIGN +20A0..20C0 ; Sc # [33] EURO-CURRENCY SIGN..SOM SIGN A838 ; Sc # NORTH INDIC RUPEE MARK FDFC ; Sc # RIAL SIGN FE69 ; Sc # SMALL DOLLAR SIGN 
@@ -3834,7 +3921,7 @@ FFE5..FFE6 ; Sc # [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN 1E2FF ; Sc # WANCHO NGUN SIGN 1ECB0 ; Sc # INDIC SIYAQ RUPEE MARK -# Total code points: 62 +# Total code points: 63 # ================================================ @@ -3853,6 +3940,7 @@ FFE5..FFE6 ; Sc # [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN 02EF..02FF ; Sk # [17] MODIFIER LETTER LOW DOWN ARROWHEAD..MODIFIER LETTER LOW LEFT ARROW 0375 ; Sk # GREEK LOWER NUMERAL SIGN 0384..0385 ; Sk # [2] GREEK TONOS..GREEK DIALYTIKA TONOS +0888 ; Sk # ARABIC RAISED ROUND DOT 1FBD ; Sk # GREEK KORONIS 1FBF..1FC1 ; Sk # [3] GREEK PSILI..GREEK DIALYTIKA AND PERISPOMENI 1FCD..1FCF ; Sk # [3] GREEK PSILI AND VARIA..GREEK PSILI AND PERISPOMENI @@ -3865,13 +3953,13 @@ A720..A721 ; Sk # [2] MODIFIER LETTER STRESS AND HIGH TONE..MODIFIER LETTER A789..A78A ; Sk # [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN AB5B ; Sk # MODIFIER BREVE WITH INVERTED BREVE AB6A..AB6B ; Sk # [2] MODIFIER LETTER LEFT TACK..MODIFIER LETTER RIGHT TACK -FBB2..FBC1 ; Sk # [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; Sk # [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FF3E ; Sk # FULLWIDTH CIRCUMFLEX ACCENT FF40 ; Sk # FULLWIDTH GRAVE ACCENT FFE3 ; Sk # FULLWIDTH MACRON 1F3FB..1F3FF ; Sk # [5] EMOJI MODIFIER FITZPATRICK TYPE-1-2..EMOJI MODIFIER FITZPATRICK TYPE-6 -# Total code points: 123 +# Total code points: 125 # ================================================ @@ -3984,7 +4072,9 @@ A828..A82B ; So # [4] SYLOTI NAGRI POETRY MARK-1..SYLOTI NAGRI POETRY MARK- A836..A837 ; So # [2] NORTH INDIC QUARTER MARK..NORTH INDIC PLACEHOLDER MARK A839 ; So # NORTH INDIC QUANTITY MARK AA77..AA79 ; So # [3] MYANMAR SYMBOL AITON EXCLAMATION..MYANMAR SYMBOL AITON TWO -FDFD ; So # ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FD40..FD4F ; So # [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH +FDCF ; So # ARABIC LIGATURE SALAAMUHU ALAYNAA +FDFD..FDFF ; So # [3] ARABIC 
LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FFE4 ; So # FULLWIDTH BROKEN BAR FFE8 ; So # HALFWIDTH FORMS LIGHT VERTICAL FFED..FFEE ; So # [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE @@ -4003,13 +4093,14 @@ FFFC..FFFD ; So # [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 16B3C..16B3F ; So # [4] PAHAWH HMONG SIGN XYEEM NTXIV..PAHAWH HMONG SIGN XYEEM FAIB 16B45 ; So # PAHAWH HMONG SIGN CIM TSOV ROG 1BC9C ; So # DUPLOYAN SIGN O WITH CROSS +1CF50..1CFC3 ; So # [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; So # [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; So # [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 1D129..1D164 ; So # [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE 1D16A..1D16C ; So # [3] MUSICAL SYMBOL FINGERED TREMOLO-1..MUSICAL SYMBOL FINGERED TREMOLO-3 1D183..1D184 ; So # [2] MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN 1D18C..1D1A9 ; So # [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH -1D1AE..1D1E8 ; So # [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA ; So # [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241 ; So # [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D245 ; So # GREEK MUSICAL LEIMMA 1D300..1D356 ; So # [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING @@ -4035,32 +4126,33 @@ FFFC..FFFD ; So # [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER 1F260..1F265 ; So # [6] ROUNDED SYMBOL FOR FU..ROUNDED SYMBOL FOR CAI 1F300..1F3FA ; So # [251] CYCLONE..AMPHORA 1F400..1F6D7 ; So # [728] RAT..ELEVATOR -1F6E0..1F6EC ; So # [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6DD..1F6EC ; So # [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6F0..1F6FC ; So # [13] SATELLITE..ROLLER SKATE 1F700..1F773 ; So # [116] ALCHEMICAL SYMBOL FOR QUINTESSENCE..ALCHEMICAL SYMBOL FOR HALF OUNCE 1F780..1F7D8 ; So # [89] 
BLACK LEFT-POINTING ISOSCELES RIGHT TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7E0..1F7EB ; So # [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE +1F7F0 ; So # HEAVY EQUALS SIGN 1F800..1F80B ; So # [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD 1F810..1F847 ; So # [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW 1F850..1F859 ; So # [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW 1F860..1F887 ; So # [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW 1F890..1F8AD ; So # [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS 1F8B0..1F8B1 ; So # [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST -1F900..1F978 ; So # [121] CIRCLED CROSS FORMEE WITH FOUR DOTS..DISGUISED FACE -1F97A..1F9CB ; So # [82] FACE WITH PLEADING EYES..BUBBLE TEA -1F9CD..1FA53 ; So # [135] STANDING PERSON..BLACK CHESS KNIGHT-BISHOP +1F900..1FA53 ; So # [340] CIRCLED CROSS FORMEE WITH FOUR DOTS..BLACK CHESS KNIGHT-BISHOP 1FA60..1FA6D ; So # [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER 1FA70..1FA74 ; So # [5] BALLET SHOES..THONG SANDAL -1FA78..1FA7A ; So # [3] DROP OF BLOOD..STETHOSCOPE +1FA78..1FA7C ; So # [5] DROP OF BLOOD..CRUTCH 1FA80..1FA86 ; So # [7] YO-YO..NESTING DOLLS -1FA90..1FAA8 ; So # [25] RINGED PLANET..ROCK -1FAB0..1FAB6 ; So # [7] FLY..FEATHER -1FAC0..1FAC2 ; So # [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAD0..1FAD6 ; So # [7] BLUEBERRIES..TEAPOT +1FA90..1FAAC ; So # [29] RINGED PLANET..HAMSA +1FAB0..1FABA ; So # [11] FLY..NEST WITH EGGS +1FAC0..1FAC5 ; So # [6] ANATOMICAL HEART..PERSON WITH CROWN +1FAD0..1FAD9 ; So # [10] BLUEBERRIES..JAR +1FAE0..1FAE7 ; So # [8] MELTING FACE..BUBBLES +1FAF0..1FAF6 ; So # [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS 1FB00..1FB92 ; So # [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; So # [55] LEFT HALF INVERSE MEDIUM SHADE 
AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON -# Total code points: 6431 +# Total code points: 6605 # ================================================ diff --git a/lib/unicore/extracted/DJoinGroup.txt b/lib/unicore/extracted/DJoinGroup.txt index 0888bf0181..da46dd0a42 100644 --- a/lib/unicore/extracted/DJoinGroup.txt +++ b/lib/unicore/extracted/DJoinGroup.txt @@ -1,6 +1,6 @@ -# DerivedJoiningGroup-13.0.0.txt -# Date: 2019-09-08, 23:31:07 GMT -# © 2019 Unicode®, Inc. +# DerivedJoiningGroup-14.0.0.txt +# Date: 2021-05-11, 21:19:35 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -41,8 +41,9 @@ 0671..0673 ; Alef # Lo [3] ARABIC LETTER ALEF WASLA..ARABIC LETTER ALEF WITH WAVY HAMZA BELOW 0675 ; Alef # Lo ARABIC LETTER HIGH HAMZA ALEF 0773..0774 ; Alef # Lo [2] ARABIC LETTER ALEF WITH EXTENDED ARABIC-INDIC DIGIT TWO ABOVE..ARABIC LETTER ALEF WITH EXTENDED ARABIC-INDIC DIGIT THREE ABOVE +0870..0882 ; Alef # Lo [19] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC LETTER ALEF WITH ATTACHED LEFT HAMZA -# Total code points: 10 +# Total code points: 29 # ================================================ @@ -110,10 +111,12 @@ 06AB ; Gaf # Lo ARABIC LETTER KAF WITH RING 06AF..06B4 ; Gaf # Lo [6] ARABIC LETTER GAF..ARABIC LETTER GAF WITH THREE DOTS ABOVE 0762..0764 ; Gaf # Lo [3] ARABIC LETTER KEHEH WITH DOT ABOVE..ARABIC LETTER KEHEH WITH THREE DOTS POINTING UPWARDS BELOW +088D ; Gaf # Lo ARABIC LETTER KEHEH WITH TWO DOTS VERTICALLY BELOW 08B0 ; Gaf # Lo ARABIC LETTER GAF WITH INVERTED STROKE 08C2 ; Gaf # Lo ARABIC LETTER KEHEH WITH SMALL V +08C8 ; Gaf # Lo ARABIC LETTER GRAF -# Total code points: 15 +# Total code points: 17 # ================================================ @@ -131,11 +134,12 @@ 076E..076F ; Hah # Lo [2] ARABIC LETTER HAH WITH SMALL ARABIC LETTER TAH BELOW..ARABIC LETTER HAH WITH SMALL ARABIC LETTER TAH 
AND TWO DOTS 0772 ; Hah # Lo ARABIC LETTER HAH WITH SMALL ARABIC LETTER TAH ABOVE 077C ; Hah # Lo ARABIC LETTER HAH WITH EXTENDED ARABIC-INDIC DIGIT FOUR BELOW +088A ; Hah # Lo ARABIC LETTER HAH WITH INVERTED SMALL V BELOW 08A2 ; Hah # Lo ARABIC LETTER JEEM WITH TWO DOTS ABOVE 08C1 ; Hah # Lo ARABIC LETTER TCHEH WITH SMALL V 08C5..08C6 ; Hah # Lo [2] ARABIC LETTER JEEM WITH THREE DOTS ABOVE..ARABIC LETTER JEEM WITH THREE DOTS BELOW -# Total code points: 21 +# Total code points: 22 # ================================================ @@ -224,8 +228,9 @@ 0646 ; Noon # Lo ARABIC LETTER NOON 06B9..06BC ; Noon # Lo [4] ARABIC LETTER NOON WITH DOT BELOW..ARABIC LETTER NOON WITH RING 0767..0769 ; Noon # Lo [3] ARABIC LETTER NOON WITH TWO DOTS BELOW..ARABIC LETTER NOON WITH SMALL V +0889 ; Noon # Lo ARABIC LETTER NOON WITH INVERTED SMALL V -# Total code points: 8 +# Total code points: 9 # ================================================ @@ -245,8 +250,9 @@ 066F ; Qaf # Lo ARABIC LETTER DOTLESS QAF 06A7..06A8 ; Qaf # Lo [2] ARABIC LETTER QAF WITH DOT ABOVE..ARABIC LETTER QAF WITH THREE DOTS ABOVE 08A5 ; Qaf # Lo ARABIC LETTER QAF WITH DOT BELOW +08B5 ; Qaf # Lo ARABIC LETTER QAF WITH DOT BELOW AND NO DOTS ABOVE -# Total code points: 5 +# Total code points: 6 # ================================================ @@ -323,9 +329,10 @@ 0637..0638 ; Tah # Lo [2] ARABIC LETTER TAH..ARABIC LETTER ZAH 069F ; Tah # Lo ARABIC LETTER TAH WITH THREE DOTS ABOVE +088B..088C ; Tah # Lo [2] ARABIC LETTER TAH WITH DOT BELOW..ARABIC LETTER TAH WITH THREE DOTS BELOW 08A3 ; Tah # Lo ARABIC LETTER TAH WITH TWO DOTS ABOVE -# Total code points: 4 +# Total code points: 6 # ================================================ @@ -723,4 +730,16 @@ # Total code points: 4 +# ================================================ + +0886 ; Thin_Yeh # Lo ARABIC LETTER THIN YEH + +# Total code points: 1 + +# ================================================ + +088E ; Vertical_Tail # Lo ARABIC VERTICAL TAIL + +# Total 
code points: 1 + # EOF diff --git a/lib/unicore/extracted/DJoinType.txt b/lib/unicore/extracted/DJoinType.txt index 57229cc736..7c36d028a3 100644 --- a/lib/unicore/extracted/DJoinType.txt +++ b/lib/unicore/extracted/DJoinType.txt @@ -1,6 +1,6 @@ -# DerivedJoiningType-13.0.0.txt -# Date: 2020-01-21, 07:36:28 GMT -# © 2020 Unicode®, Inc. +# DerivedJoiningType-14.0.0.txt +# Date: 2021-05-28, 21:49:06 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -22,10 +22,11 @@ 0640 ; C # Lm ARABIC TATWEEL 07FA ; C # Lm NKO LAJANYALAN +0883..0885 ; C # Lo [3] ARABIC TATWEEL WITH OVERSTRUCK HAMZA..ARABIC TATWEEL WITH TWO DOTS BELOW 180A ; C # Po MONGOLIAN NIRUGU 200D ; C # Cf ZERO WIDTH JOINER -# Total code points: 4 +# Total code points: 7 # ================================================ @@ -67,11 +68,12 @@ 0860 ; D # Lo SYRIAC LETTER MALAYALAM NGA 0862..0865 ; D # Lo [4] SYRIAC LETTER MALAYALAM NYA..SYRIAC LETTER MALAYALAM NNNA 0868 ; D # Lo SYRIAC LETTER MALAYALAM LLA +0886 ; D # Lo ARABIC LETTER THIN YEH +0889..088D ; D # Lo [5] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC LETTER KEHEH WITH TWO DOTS VERTICALLY BELOW 08A0..08A9 ; D # Lo [10] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER YEH WITH TWO DOTS BELOW AND DOT ABOVE 08AF..08B0 ; D # Lo [2] ARABIC LETTER SAD WITH THREE DOTS BELOW..ARABIC LETTER GAF WITH INVERTED STROKE -08B3..08B4 ; D # Lo [2] ARABIC LETTER AIN WITH THREE DOTS BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08B8 ; D # Lo [3] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER TEH WITH SMALL TEH ABOVE -08BA..08C7 ; D # Lo [14] ARABIC LETTER YEH WITH TWO DOTS BELOW AND SMALL NOON ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +08B3..08B8 ; D # Lo [6] ARABIC LETTER AIN WITH THREE DOTS BELOW..ARABIC LETTER TEH WITH SMALL TEH ABOVE +08BA..08C8 ; D # Lo [15] ARABIC LETTER YEH WITH 
TWO DOTS BELOW AND SMALL NOON ABOVE..ARABIC LETTER GRAF 1807 ; D # Po MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER 1820..1842 ; D # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI 1843 ; D # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN @@ -96,6 +98,8 @@ A840..A871 ; D # Lo [50] PHAGS-PA LETTER KA..PHAGS-PA SUBJOINED LETTER RA 10F30..10F32 ; D # Lo [3] SOGDIAN LETTER ALEPH..SOGDIAN LETTER GIMEL 10F34..10F44 ; D # Lo [17] SOGDIAN LETTER WAW..SOGDIAN LETTER LESH 10F51..10F53 ; D # No [3] SOGDIAN NUMBER ONE..SOGDIAN NUMBER TWENTY +10F70..10F73 ; D # Lo [4] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER WAW +10F76..10F81 ; D # Lo [12] OLD UYGHUR LETTER YODH..OLD UYGHUR LETTER LESH 10FB0 ; D # Lo CHORASMIAN LETTER ALEPH 10FB2..10FB3 ; D # Lo [2] CHORASMIAN LETTER BETH..CHORASMIAN LETTER GIMEL 10FB8 ; D # Lo CHORASMIAN LETTER ZAYIN @@ -106,7 +110,7 @@ A840..A871 ; D # Lo [50] PHAGS-PA LETTER KA..PHAGS-PA SUBJOINED LETTER RA 10FCA ; D # No CHORASMIAN NUMBER TWENTY 1E900..1E943 ; D # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA -# Total code points: 586 +# Total code points: 610 # ================================================ @@ -147,6 +151,8 @@ A840..A871 ; D # Lo [50] PHAGS-PA LETTER KA..PHAGS-PA SUBJOINED LETTER RA 0856..0858 ; R # Lo [3] MANDAIC LETTER DUSHENNA..MANDAIC LETTER AIN 0867 ; R # Lo SYRIAC LETTER MALAYALAM RA 0869..086A ; R # Lo [2] SYRIAC LETTER MALAYALAM LLLA..SYRIAC LETTER MALAYALAM SSA +0870..0882 ; R # Lo [19] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC LETTER ALEF WITH ATTACHED LEFT HAMZA +088E ; R # Lo ARABIC VERTICAL TAIL 08AA..08AC ; R # Lo [3] ARABIC LETTER REH WITH LOOP..ARABIC LETTER ROHINGYA YEH 08AE ; R # Lo ARABIC LETTER DAL WITH THREE DOTS BELOW 08B1..08B2 ; R # Lo [2] ARABIC LETTER STRAIGHT WAW..ARABIC LETTER ZAIN WITH INVERTED V ABOVE @@ -169,13 +175,14 @@ A840..A871 ; D # Lo [50] PHAGS-PA LETTER KA..PHAGS-PA SUBJOINED LETTER RA 10D22 ; R # Lo HANIFI ROHINGYA MARK SAKIN 10F33 ; R # Lo SOGDIAN LETTER HE 10F54 ; R # No SOGDIAN NUMBER 
ONE HUNDRED +10F74..10F75 ; R # Lo [2] OLD UYGHUR LETTER ZAYIN..OLD UYGHUR LETTER FINAL HETH 10FB4..10FB6 ; R # Lo [3] CHORASMIAN LETTER DALETH..CHORASMIAN LETTER WAW 10FB9..10FBA ; R # Lo [2] CHORASMIAN LETTER HETH..CHORASMIAN LETTER YODH 10FBD ; R # Lo CHORASMIAN LETTER MEM 10FC2..10FC3 ; R # Lo [2] CHORASMIAN LETTER RESH..CHORASMIAN LETTER SHIN 10FC9 ; R # No CHORASMIAN NUMBER TEN -# Total code points: 130 +# Total code points: 152 # ================================================ @@ -221,7 +228,8 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 0825..0827 ; T # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; T # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; T # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; T # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; T # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; T # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; T # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 093A ; T # Mn DEVANAGARI VOWEL SIGN OE 093C ; T # Mn DEVANAGARI SIGN NUKTA @@ -262,6 +270,7 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 0BCD ; T # Mn TAMIL SIGN VIRAMA 0C00 ; T # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C04 ; T # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; T # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; T # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C46..0C48 ; T # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI 0C4A..0C4D ; T # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA @@ -311,7 +320,7 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 109D ; T # Mn MYANMAR VOWEL SIGN AITON AI 135D..135F ; T # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; T # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; T # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1732..1733 ; T # Mn [2] HANUNOO 
VOWEL SIGN I..HANUNOO VOWEL SIGN U 1752..1753 ; T # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; T # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 17B4..17B5 ; T # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA @@ -320,6 +329,7 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 17C9..17D3 ; T # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT 17DD ; T # Mn KHMER SIGN ATTHACAN 180B..180D ; T # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; T # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; T # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; T # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; T # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -337,7 +347,7 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 1A7F ; T # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; T # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; T # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; T # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; T # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; T # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B34 ; T # Mn BALINESE SIGN REREKAN 1B36..1B3A ; T # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA @@ -360,8 +370,7 @@ A872 ; L # Lo PHAGS-PA SUPERFIXED LETTER RA 1CED ; T # Mn VEDIC SIGN TIRYAK 1CF4 ; T # Mn VEDIC TONE CANDRA ABOVE 1CF8..1CF9 ; T # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE -1DC0..1DF9 ; T # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; T # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; T # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200B ; T # Cf ZERO WIDTH SPACE 200E..200F ; T # Cf [2] LEFT-TO-RIGHT 
MARK..RIGHT-TO-LEFT MARK 202A..202E ; T # Cf [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE @@ -430,11 +439,15 @@ FFF9..FFFB ; T # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATI 10D24..10D27 ; T # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; T # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; T # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; T # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11001 ; T # Mn BRAHMI SIGN ANUSVARA 11038..11046 ; T # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; T # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; T # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; T # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 110B3..110B6 ; T # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B9..110BA ; T # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; T # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; T # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; T # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112D..11134 ; T # Mn [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA @@ -516,6 +529,8 @@ FFF9..FFFB ; T # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATI 16FE4 ; T # Mn KHITAN SMALL SCRIPT FILLER 1BC9D..1BC9E ; T # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BCA0..1BCA3 ; T # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; T # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; T # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D167..1D169 ; T # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D173..1D17A ; T # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE 1D17B..1D182 ; T # Mn [8] MUSICAL SYMBOL COMBINING 
ACCENT..MUSICAL SYMBOL COMBINING LOURE @@ -534,6 +549,7 @@ FFF9..FFFB ; T # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATI 1E023..1E024 ; T # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; T # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; T # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; T # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; T # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; T # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; T # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA @@ -542,6 +558,6 @@ E0001 ; T # Cf LANGUAGE TAG E0020..E007F ; T # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; T # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 1997 +# Total code points: 2108 # EOF diff --git a/lib/unicore/extracted/DLineBreak.txt b/lib/unicore/extracted/DLineBreak.txt index 0f326def56..2504c3f7e1 100644 --- a/lib/unicore/extracted/DLineBreak.txt +++ b/lib/unicore/extracted/DLineBreak.txt @@ -1,6 +1,6 @@ -# DerivedLineBreak-13.0.0.txt -# Date: 2020-02-17, 18:43:18 GMT -# © 2020 Unicode®, Inc. +# DerivedLineBreak-14.0.0.txt +# Date: 2021-07-10, 00:35:09 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -24,8 +24,8 @@ E000..F8FF ; XX # Co [6400] .. F0000..FFFFD ; XX # Co [65534] .. 100000..10FFFD; XX # Co [65534] .. -# The above property value applies to 763788 code points not listed here. -# Total code points: 901256 +# The above property value applies to 762997 code points not listed here. +# Total code points: 900465 # ================================================ @@ -80,6 +80,10 @@ F0000..FFFFD ; XX # Co [65534] .. 
2E26 ; OP # Ps LEFT SIDEWAYS U BRACKET 2E28 ; OP # Ps LEFT DOUBLE PARENTHESIS 2E42 ; OP # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK +2E55 ; OP # Ps LEFT SQUARE BRACKET WITH STROKE +2E57 ; OP # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE +2E59 ; OP # Ps TOP HALF LEFT PARENTHESIS +2E5B ; OP # Ps BOTTOM HALF LEFT PARENTHESIS 3008 ; OP # Ps LEFT ANGLE BRACKET 300A ; OP # Ps LEFT DOUBLE ANGLE BRACKET 300C ; OP # Ps LEFT CORNER BRACKET @@ -117,7 +121,7 @@ FF62 ; OP # Ps HALFWIDTH LEFT CORNER BRACKET 145CE ; OP # Lo ANATOLIAN HIEROGLYPH A410 BEGIN LOGOGRAM MARK 1E95E..1E95F ; OP # Po [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK -# Total code points: 88 +# Total code points: 92 # ================================================ @@ -164,6 +168,10 @@ FF62 ; OP # Ps HALFWIDTH LEFT CORNER BRACKET 2E25 ; CL # Pe BOTTOM RIGHT HALF BRACKET 2E27 ; CL # Pe RIGHT SIDEWAYS U BRACKET 2E29 ; CL # Pe RIGHT DOUBLE PARENTHESIS +2E56 ; CL # Pe RIGHT SQUARE BRACKET WITH STROKE +2E58 ; CL # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE +2E5A ; CL # Pe TOP HALF RIGHT PARENTHESIS +2E5C ; CL # Pe BOTTOM HALF RIGHT PARENTHESIS 3001..3002 ; CL # Po [2] IDEOGRAPHIC COMMA..IDEOGRAPHIC FULL STOP 3009 ; CL # Pe RIGHT ANGLE BRACKET 300B ; CL # Pe RIGHT DOUBLE ANGLE BRACKET @@ -209,7 +217,7 @@ FF64 ; CL # Po HALFWIDTH IDEOGRAPHIC COMMA 13438 ; CL # Cf EGYPTIAN HIEROGLYPH END SEGMENT 145CF ; CL # Lo ANATOLIAN HIEROGLYPH A410A END LOGOGRAM MARK -# Total code points: 91 +# Total code points: 95 # ================================================ @@ -302,7 +310,7 @@ FF9E..FF9F ; NS # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KA 003F ; EX # Po QUESTION MARK 05C6 ; EX # Po HEBREW PUNCTUATION NUN HAFUKHA 061B ; EX # Po ARABIC SEMICOLON -061E..061F ; EX # Po [2] ARABIC TRIPLE DOT PUNCTUATION MARK..ARABIC QUESTION MARK +061D..061F ; EX # Po [3] ARABIC END OF TEXT MARK..ARABIC QUESTION MARK 06D4 ; EX # Po ARABIC FULL STOP 07F9 ; EX # Po NKO EXCLAMATION MARK 0F0D..0F11 ; EX # Po [5] 
TIBETAN MARK SHAD..TIBETAN MARK RIN CHEN SPUNGS SHAD @@ -314,6 +322,7 @@ FF9E..FF9F ; NS # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KA 2CF9 ; EX # Po COPTIC OLD NUBIAN FULL STOP 2CFE ; EX # Po COPTIC FULL STOP 2E2E ; EX # Po REVERSED QUESTION MARK +2E53..2E54 ; EX # Po [2] MEDIEVAL EXCLAMATION MARK..MEDIEVAL QUESTION MARK A60E ; EX # Po VAI FULL STOP A876..A877 ; EX # Po [2] PHAGS-PA MARK SHAD..PHAGS-PA MARK DOUBLE SHAD FE15..FE16 ; EX # Po [2] PRESENTATION FORM FOR VERTICAL EXCLAMATION MARK..PRESENTATION FORM FOR VERTICAL QUESTION MARK @@ -323,7 +332,7 @@ FF1F ; EX # Po FULLWIDTH QUESTION MARK 115C4..115C5 ; EX # Po [2] SIDDHAM SEPARATOR DOT..SIDDHAM SEPARATOR BAR 11C71 ; EX # Po MARCHEN MARK SHAD -# Total code points: 37 +# Total code points: 40 # ================================================ @@ -371,7 +380,7 @@ FE13..FE14 ; IS # Po [2] PRESENTATION FORM FOR VERTICAL COLON..PRESENTATION 20B7..20BA ; PR # Sc [4] SPESMILO SIGN..TURKISH LIRA SIGN 20BC..20BD ; PR # Sc [2] MANAT SIGN..RUBLE SIGN 20BF ; PR # Sc BITCOIN SIGN -20C0..20CF ; PR # Cn [16] .. +20C1..20CF ; PR # Cn [15] .. 
2116 ; PR # So NUMERO SIGN 2212..2213 ; PR # Sm [2] MINUS SIGN..MINUS-OR-PLUS SIGN FE69 ; PR # Sc SMALL DOLLAR SIGN @@ -380,7 +389,7 @@ FFE1 ; PR # Sc FULLWIDTH POUND SIGN FFE5..FFE6 ; PR # Sc [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN 1E2FF ; PR # Sc WANCHO NGUN SIGN -# Total code points: 68 +# Total code points: 67 # ================================================ @@ -400,6 +409,7 @@ FFE5..FFE6 ; PR # Sc [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN 20B6 ; PO # Sc LIVRE TOURNOIS SIGN 20BB ; PO # Sc NORDIC MARK SIGN 20BE ; PO # Sc LARI SIGN +20C0 ; PO # Sc SOM SIGN 2103 ; PO # So DEGREE CELSIUS 2109 ; PO # So DEGREE FAHRENHEIT A838 ; PO # Sc NORTH INDIC RUPEE MARK @@ -411,7 +421,7 @@ FFE0 ; PO # Sc FULLWIDTH CENT SIGN 1ECAC ; PO # So INDIC SIYAQ PLACEHOLDER 1ECB0 ; PO # Sc INDIC SIYAQ RUPEE MARK -# Total code points: 36 +# Total code points: 37 # ================================================ @@ -472,6 +482,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 11D50..11D59 ; NU # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11DA0..11DA9 ; NU # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE 16A60..16A69 ; NU # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16AC0..16AC9 ; NU # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; NU # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 1D7CE..1D7FF ; NU # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; NU # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -479,7 +490,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 1E950..1E959 ; NU # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; NU # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 642 +# Total code points: 652 # ================================================ @@ -588,8 +599,12 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 0840..0858 ; AL # Lo 
[25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN 085E ; AL # Po MANDAIC PUNCTUATION 0860..086A ; AL # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA -08A0..08B4 ; AL # Lo [21] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER KAF WITH DOT BELOW -08B6..08C7 ; AL # Lo [18] ARABIC LETTER BEH WITH SMALL MEEM ABOVE..ARABIC LETTER LAM WITH SMALL ARABIC LETTER TAH ABOVE +0870..0887 ; AL # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT +0888 ; AL # Sk ARABIC RAISED ROUND DOT +0889..088E ; AL # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL +0890..0891 ; AL # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE +08A0..08C8 ; AL # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF +08C9 ; AL # Lm ARABIC SMALL FARSI YEH 08E2 ; AL # Cf ARABIC DISPUTED END OF AYAH 0904..0939 ; AL # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA 093D ; AL # Lo DEVANAGARI SIGN AVAGRAHA @@ -667,6 +682,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 0C2A..0C39 ; AL # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA 0C3D ; AL # Lo TELUGU SIGN AVAGRAHA 0C58..0C5A ; AL # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA +0C5D ; AL # Lo TELUGU LETTER NAKAARA POLLU 0C60..0C61 ; AL # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL 0C78..0C7E ; AL # No [7] TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR..TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR 0C7F ; AL # So TELUGU SIGN TUUMU @@ -677,7 +693,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 0CAA..0CB3 ; AL # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA 0CB5..0CB9 ; AL # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA 0CBD ; AL # Lo KANNADA SIGN AVAGRAHA -0CDE ; AL # Lo KANNADA LETTER FA +0CDD..0CDE ; AL # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA 0CE0..0CE1 ; AL # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL 0CF1..0CF2 ; AL # Lo [2] KANNADA SIGN 
JIHVAMULIYA..KANNADA SIGN UPADHMANIYA 0D04..0D0C ; AL # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L @@ -753,9 +769,8 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 16A0..16EA ; AL # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X 16EE..16F0 ; AL # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL 16F1..16F8 ; AL # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC -1700..170C ; AL # Lo [13] TAGALOG LETTER A..TAGALOG LETTER YA -170E..1711 ; AL # Lo [4] TAGALOG LETTER LA..TAGALOG LETTER HA -1720..1731 ; AL # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA +1700..1711 ; AL # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA +171F..1731 ; AL # Lo [19] TAGALOG LETTER ARCHAIC RA..HANUNOO LETTER HA 1740..1751 ; AL # Lo [18] BUHID LETTER A..BUHID LETTER HA 1760..176C ; AL # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA 176E..1770 ; AL # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA @@ -777,7 +792,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 1A00..1A16 ; AL # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA 1A1E..1A1F ; AL # Po [2] BUGINESE PALLAWA..BUGINESE END OF SECTION 1B05..1B33 ; AL # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA -1B45..1B4B ; AL # Lo [7] BALINESE LETTER KAF SASAK..BALINESE LETTER ASYURA SASAK +1B45..1B4C ; AL # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA 1B5C ; AL # Po BALINESE WINDU 1B61..1B6A ; AL # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE 1B74..1B7C ; AL # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING @@ -1012,9 +1027,7 @@ ABF0..ABF9 ; NU # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE 2B5A..2B73 ; AL # So [26] SLANTED NORTH ARROW WITH HOOKED HEAD..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR 2B76..2B95 ; AL # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW 2B97..2BFF ; AL # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE 
SYMBOL -2C00..2C2E ; AL # L& [47] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC CAPITAL LETTER LATINATE MYSLITE -2C30..2C5E ; AL # L& [47] GLAGOLITIC SMALL LETTER AZU..GLAGOLITIC SMALL LETTER LATINATE MYSLITE -2C60..2C7B ; AL # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E +2C00..2C7B ; AL # L& [124] GLAGOLITIC CAPITAL LETTER AZU..LATIN LETTER SMALL CAPITAL TURNED E 2C7C..2C7D ; AL # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V 2C7E..2CE4 ; AL # L& [103] LATIN CAPITAL LETTER S WITH SWASH TAIL..COPTIC SYMBOL KAI 2CE5..2CEA ; AL # So [6] COPTIC SYMBOL MI RO..COPTIC SYMBOL SHIMA SIMA @@ -1074,8 +1087,11 @@ A788 ; AL # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT A789..A78A ; AL # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN A78B..A78E ; AL # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT A78F ; AL # Lo LATIN LETTER SINOLOGICAL DOT -A790..A7BF ; AL # L& [48] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER GLOTTAL U -A7C2..A7CA ; AL # L& [9] LATIN CAPITAL LETTER ANGLICANA W..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A790..A7CA ; AL # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY +A7D0..A7D1 ; AL # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G +A7D3 ; AL # L& LATIN SMALL LETTER DOUBLE THORN +A7D5..A7D9 ; AL # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S +A7F2..A7F4 ; AL # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q A7F5..A7F6 ; AL # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H A7F7 ; AL # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I A7F8..A7F9 ; AL # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE @@ -1126,12 +1142,14 @@ FB00..FB06 ; AL # L& [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST FB13..FB17 ; AL # L& [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN SMALL 
LIGATURE MEN XEH FB29 ; AL # Sm HEBREW LETTER ALTERNATIVE PLUS SIGN FB50..FBB1 ; AL # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM -FBB2..FBC1 ; AL # Sk [16] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL SMALL TAH BELOW +FBB2..FBC2 ; AL # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE FBD3..FD3D ; AL # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM +FD40..FD4F ; AL # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH FD50..FD8F ; AL # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM FD92..FDC7 ; AL # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM +FDCF ; AL # So ARABIC LIGATURE SALAAMUHU ALAYNAA FDF0..FDFB ; AL # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU -FDFD ; AL # So ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM +FDFD..FDFF ; AL # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL FE70..FE74 ; AL # Lo [5] ARABIC FATHATAN ISOLATED FORM..ARABIC KASRATAN ISOLATED FORM FE76..FEFC ; AL # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM FFE8 ; AL # So HALFWIDTH FORMS LIGHT VERTICAL @@ -1175,9 +1193,20 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 10500..10527 ; AL # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE 10530..10563 ; AL # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW 1056F ; AL # Po CAUCASIAN ALBANIAN CITATION MARK +10570..1057A ; AL # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA +1057C..1058A ; AL # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE +1058C..10592 ; AL # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE +10594..10595 ; AL # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL 
LETTER ZE +10597..105A1 ; AL # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA +105A3..105B1 ; AL # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE +105B3..105B9 ; AL # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE +105BB..105BC ; AL # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE 10600..10736 ; AL # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664 10740..10755 ; AL # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE 10760..10767 ; AL # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807 +10780..10785 ; AL # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK +10787..107B0 ; AL # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK +107B2..107BA ; AL # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL 10800..10805 ; AL # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA 10808 ; AL # Lo CYPRIOT SYLLABLE JO 1080A..10835 ; AL # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO @@ -1239,12 +1268,16 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 10F30..10F45 ; AL # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN 10F51..10F54 ; AL # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED 10F55..10F59 ; AL # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT +10F70..10F81 ; AL # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH +10F86..10F89 ; AL # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS 10FB0..10FC4 ; AL # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW 10FC5..10FCB ; AL # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED 10FE0..10FF6 ; AL # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH 11003..11037 ; AL # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA 11049..1104D ; AL # Po [5] BRAHMI PUNCTUATION DOT..BRAHMI PUNCTUATION LOTUS 11052..11065 ; AL # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND +11071..11072 ; 
AL # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O +11075 ; AL # Lo BRAHMI LETTER OLD TAMIL LLA 11083..110AF ; AL # Lo [45] KAITHI LETTER A..KAITHI LETTER HA 110BB..110BC ; AL # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN 110BD ; AL # Cf KAITHI NUMBER SIGN @@ -1299,6 +1332,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 11644 ; AL # Lo MODI SIGN HUVA 11680..116AA ; AL # Lo [43] TAKRI LETTER A..TAKRI LETTER RRA 116B8 ; AL # Lo TAKRI LETTER ARCHAIC KHA +116B9 ; AL # Po TAKRI ABBREVIATION SIGN 11800..1182B ; AL # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA 1183B ; AL # Po DOGRA ABBREVIATION SIGN 118A0..118DF ; AL # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO @@ -1322,7 +1356,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 11A50 ; AL # Lo SOYOMBO LETTER A 11A5C..11A89 ; AL # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA 11A9D ; AL # Lo SOYOMBO MARK PLUTA -11AC0..11AF8 ; AL # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL +11AB0..11AF8 ; AL # Lo [73] CANADIAN SYLLABICS NATTILIK HI..PAU CIN HAU GLOTTAL STOP FINAL 11C00..11C08 ; AL # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L 11C0A..11C2E ; AL # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA 11C40 ; AL # Lo BHAIKSUKI SIGN AVAGRAHA @@ -1345,6 +1379,8 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 12000..12399 ; AL # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U 12400..1246E ; AL # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 12480..12543 ; AL # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU +12F90..12FF0 ; AL # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114 +12FF1..12FF2 ; AL # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302 13000..13257 ; AL # Lo [600] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH O006 1325E..13281 ; AL # Lo [36] EGYPTIAN 
HIEROGLYPH O007..EGYPTIAN HIEROGLYPH O033 13283..13285 ; AL # Lo [3] EGYPTIAN HIEROGLYPH O034..EGYPTIAN HIEROGLYPH O036 @@ -1354,6 +1390,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 145D0..14646 ; AL # Lo [119] ANATOLIAN HIEROGLYPH A411..ANATOLIAN HIEROGLYPH A530 16800..16A38 ; AL # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ 16A40..16A5E ; AL # Lo [31] MRO LETTER TA..MRO LETTER TEK +16A70..16ABE ; AL # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA 16AD0..16AED ; AL # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I 16B00..16B2F ; AL # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU 16B3A..16B3B ; AL # Po [2] PAHAWH HMONG SIGN VOS THIAB..PAHAWH HMONG SIGN VOS FEEM @@ -1370,18 +1407,22 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 16F50 ; AL # Lo MIAO LETTER NASALIZATION 16F93..16F9F ; AL # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8 18B00..18CD5 ; AL # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5 +1AFF0..1AFF3 ; AL # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5 +1AFF5..1AFFB ; AL # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5 +1AFFD..1AFFE ; AL # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8 1BC00..1BC6A ; AL # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M 1BC70..1BC7C ; AL # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK 1BC80..1BC88 ; AL # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL 1BC90..1BC99 ; AL # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW 1BC9C ; AL # So DUPLOYAN SIGN O WITH CROSS +1CF50..1CFC3 ; AL # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK 1D000..1D0F5 ; AL # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO 1D100..1D126 ; AL # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2 
1D129..1D164 ; AL # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE 1D16A..1D16C ; AL # So [3] MUSICAL SYMBOL FINGERED TREMOLO-1..MUSICAL SYMBOL FINGERED TREMOLO-3 1D183..1D184 ; AL # So [2] MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN 1D18C..1D1A9 ; AL # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH -1D1AE..1D1E8 ; AL # So [59] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KIEVAN FLAT SIGN +1D1AE..1D1EA ; AL # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON 1D200..1D241 ; AL # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54 1D245 ; AL # So GREEK MUSICAL LEIMMA 1D2E0..1D2F3 ; AL # No [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN @@ -1433,11 +1474,19 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 1DA76..1DA83 ; AL # So [14] SIGNWRITING LIMB COMBINATION..SIGNWRITING LOCATION DEPTH 1DA85..1DA86 ; AL # So [2] SIGNWRITING LOCATION TORSO..SIGNWRITING LOCATION LIMBS DIGITS 1DA8B ; AL # Po SIGNWRITING PARENTHESIS +1DF00..1DF09 ; AL # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK +1DF0A ; AL # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK +1DF0B..1DF1E ; AL # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL 1E100..1E12C ; AL # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W 1E137..1E13D ; AL # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER 1E14E ; AL # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ 1E14F ; AL # So NYIAKENG PUACHUE HMONG CIRCLED CA +1E290..1E2AD ; AL # Lo [30] TOTO LETTER PA..TOTO LETTER A 1E2C0..1E2EB ; AL # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH +1E7E0..1E7E6 ; AL # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO +1E7E8..1E7EB ; AL # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE +1E7ED..1E7EE ; AL # Lo [2] ETHIOPIC SYLLABLE GURAGE 
MWI..ETHIOPIC SYLLABLE GURAGE MWEE +1E7F0..1E7FE ; AL # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE 1E800..1E8C4 ; AL # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON 1E8C7..1E8CF ; AL # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE 1E900..1E943 ; AL # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA @@ -1511,7 +1560,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 1FB00..1FB92 ; AL # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK 1FB94..1FBCA ; AL # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON -# Total code points: 21400 +# Total code points: 22043 # ================================================ @@ -1599,9 +1648,7 @@ FFED..FFEE ; AL # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE 32B1..32BF ; ID # No [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY 32C0..33FF ; ID # So [320] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..SQUARE GAL 3400..4DBF ; ID # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF -4E00..9FFC ; ID # Lo [20989] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFC -9FFD..9FFF ; ID # Cn [3] .. 
-A000..A014 ; ID # Lo [21] YI SYLLABLE IT..YI SYLLABLE E +4E00..A014 ; ID # Lo [21013] CJK UNIFIED IDEOGRAPH-4E00..YI SYLLABLE E A016..A48C ; ID # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR A490..A4C6 ; ID # So [55] YI RADICAL QOT..YI RADICAL KE F900..FA6D ; ID # Lo [366] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA6D @@ -1652,7 +1699,7 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 17000..187F7 ; ID # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7 18800..18AFF ; ID # Lo [768] TANGUT COMPONENT-001..TANGUT COMPONENT-768 18D00..18D08 ; ID # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08 -1B000..1B11E ; ID # Lo [287] KATAKANA LETTER ARCHAIC E..HENTAIGANA LETTER N-MU-MO-2 +1B000..1B122 ; ID # Lo [291] KATAKANA LETTER ARCHAIC E..KATAKANA LETTER ARCHAIC WU 1B170..1B2FB ; ID # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB 1F000..1F02B ; ID # So [44] MAHJONG TILE EAST WIND..MAHJONG TILE BACK 1F02C..1F02F ; ID # Cn [4] .. @@ -1718,8 +1765,8 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 1F6B7..1F6BF ; ID # So [9] NO PEDESTRIANS..SHOWER 1F6C1..1F6CB ; ID # So [11] BATHTUB..COUCH AND LAMP 1F6CD..1F6D7 ; ID # So [11] SHOPPING BAGS..ELEVATOR -1F6D8..1F6DF ; ID # Cn [8] .. -1F6E0..1F6EC ; ID # So [13] HAMMER AND WRENCH..AIRPLANE ARRIVING +1F6D8..1F6DC ; ID # Cn [5] .. +1F6DD..1F6EC ; ID # So [16] PLAYGROUND SLIDE..AIRPLANE ARRIVING 1F6ED..1F6EF ; ID # Cn [3] .. 1F6F0..1F6FC ; ID # So [13] SATELLITE..ROLLER SKATE 1F6FD..1F6FF ; ID # Cn [3] .. @@ -1727,7 +1774,9 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 1F7D5..1F7D8 ; ID # So [4] CIRCLED TRIANGLE..NEGATIVE CIRCLED SQUARE 1F7D9..1F7DF ; ID # Cn [7] .. 1F7E0..1F7EB ; ID # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE -1F7EC..1F7FF ; ID # Cn [20] .. +1F7EC..1F7EF ; ID # Cn [4] .. +1F7F0 ; ID # So HEAVY EQUALS SIGN +1F7F1..1F7FF ; ID # Cn [15] .. 1F80C..1F80F ; ID # Cn [4] .. 1F848..1F84F ; ID # Cn [8] .. 1F85A..1F85F ; ID # Cn [6] .. 
@@ -1741,13 +1790,10 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 1F927..1F92F ; ID # So [9] SNEEZING FACE..SHOCKED FACE WITH EXPLODING HEAD 1F93A..1F93B ; ID # So [2] FENCER..MODERN PENTATHLON 1F93F..1F976 ; ID # So [56] DIVING MASK..FREEZING FACE -1F978 ; ID # So DISGUISED FACE -1F979 ; ID # Cn -1F97A..1F9B4 ; ID # So [59] FACE WITH PLEADING EYES..BONE +1F978..1F9B4 ; ID # So [61] DISGUISED FACE..BONE 1F9B7 ; ID # So TOOTH 1F9BA ; ID # So SAFETY VEST -1F9BC..1F9CB ; ID # So [16] MOTORIZED WHEELCHAIR..BUBBLE TEA -1F9CC ; ID # Cn +1F9BC..1F9CC ; ID # So [17] MOTORIZED WHEELCHAIR..TROLL 1F9D0 ; ID # So FACE WITH MONOCLE 1F9DE..1F9FF ; ID # So [34] GENIE..NAZAR AMULET 1FA54..1FA5F ; ID # Cn [12] .. @@ -1755,23 +1801,26 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 1FA6E..1FA6F ; ID # Cn [2] .. 1FA70..1FA74 ; ID # So [5] BALLET SHOES..THONG SANDAL 1FA75..1FA77 ; ID # Cn [3] .. -1FA78..1FA7A ; ID # So [3] DROP OF BLOOD..STETHOSCOPE -1FA7B..1FA7F ; ID # Cn [5] .. +1FA78..1FA7C ; ID # So [5] DROP OF BLOOD..CRUTCH +1FA7D..1FA7F ; ID # Cn [3] .. 1FA80..1FA86 ; ID # So [7] YO-YO..NESTING DOLLS 1FA87..1FA8F ; ID # Cn [9] .. -1FA90..1FAA8 ; ID # So [25] RINGED PLANET..ROCK -1FAA9..1FAAF ; ID # Cn [7] .. -1FAB0..1FAB6 ; ID # So [7] FLY..FEATHER -1FAB7..1FABF ; ID # Cn [9] .. +1FA90..1FAAC ; ID # So [29] RINGED PLANET..HAMSA +1FAAD..1FAAF ; ID # Cn [3] .. +1FAB0..1FABA ; ID # So [11] FLY..NEST WITH EGGS +1FABB..1FABF ; ID # Cn [5] .. 1FAC0..1FAC2 ; ID # So [3] ANATOMICAL HEART..PEOPLE HUGGING -1FAC3..1FACF ; ID # Cn [13] .. -1FAD0..1FAD6 ; ID # So [7] BLUEBERRIES..TEAPOT -1FAD7..1FAFF ; ID # Cn [41] .. +1FAC6..1FACF ; ID # Cn [10] .. +1FAD0..1FAD9 ; ID # So [10] BLUEBERRIES..JAR +1FADA..1FADF ; ID # Cn [6] .. +1FAE0..1FAE7 ; ID # So [8] MELTING FACE..BUBBLES +1FAE8..1FAEF ; ID # Cn [8] .. +1FAF7..1FAFF ; ID # Cn [9] .. 1FC00..1FFFD ; ID # Cn [1022] .. -20000..2A6DD ; ID # Lo [42718] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DD -2A6DE..2A6FF ; ID # Cn [34] .. 
-2A700..2B734 ; ID # Lo [4149] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B734 -2B735..2B73F ; ID # Cn [11] .. +20000..2A6DF ; ID # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF +2A6E0..2A6FF ; ID # Cn [32] .. +2A700..2B738 ; ID # Lo [4153] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B738 +2B739..2B73F ; ID # Cn [7] .. 2B740..2B81D ; ID # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D 2B81E..2B81F ; ID # Cn [2] .. 2B820..2CEA1 ; ID # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1 @@ -1783,7 +1832,7 @@ FFE4 ; ID # So FULLWIDTH BROKEN BAR 30000..3134A ; ID # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A 3134B..3FFFD ; ID # Cn [60595] .. -# Total code points: 172462 +# Total code points: 172456 # ================================================ @@ -1840,7 +1889,8 @@ FE19 ; IN # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS 0825..0827 ; CM # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U 0829..082D ; CM # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA 0859..085B ; CM # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK -08D3..08E1 ; CM # Mn [15] ARABIC SMALL LOW WAW..ARABIC SMALL HIGH SIGN SAFHA +0898..089F ; CM # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA +08CA..08E1 ; CM # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA 08E3..0902 ; CM # Mn [32] ARABIC TURNED DAMMA BELOW..DEVANAGARI SIGN ANUSVARA 0903 ; CM # Mc DEVANAGARI SIGN VISARGA 093A ; CM # Mn DEVANAGARI VOWEL SIGN OE @@ -1909,6 +1959,7 @@ FE19 ; IN # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS 0C00 ; CM # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE 0C01..0C03 ; CM # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA 0C04 ; CM # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE +0C3C ; CM # Mn TELUGU SIGN NUKTA 0C3E..0C40 ; CM # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II 0C41..0C44 ; CM # Mc [4] TELUGU VOWEL SIGN U..TELUGU 
VOWEL SIGN VOCALIC RR 0C46..0C48 ; CM # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI @@ -1958,10 +2009,13 @@ FE19 ; IN # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS 0FC6 ; CM # Mn TIBETAN SYMBOL PADMA GDAN 135D..135F ; CM # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK 1712..1714 ; CM # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA -1732..1734 ; CM # Mn [3] HANUNOO VOWEL SIGN I..HANUNOO SIGN PAMUDPOD +1715 ; CM # Mc TAGALOG SIGN PAMUDPOD +1732..1733 ; CM # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U +1734 ; CM # Mc HANUNOO SIGN PAMUDPOD 1752..1753 ; CM # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U 1772..1773 ; CM # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U 180B..180D ; CM # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE +180F ; CM # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR 1885..1886 ; CM # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA 18A9 ; CM # Mn MONGOLIAN LETTER ALI GALI DAGALGA 1920..1922 ; CM # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U @@ -1978,7 +2032,7 @@ FE19 ; IN # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS 1A7F ; CM # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT 1AB0..1ABD ; CM # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW 1ABE ; CM # Me COMBINING PARENTHESES OVERLAY -1ABF..1AC0 ; CM # Mn [2] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER TURNED W BELOW +1ABF..1ACE ; CM # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T 1B00..1B03 ; CM # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG 1B04 ; CM # Mc BALINESE SIGN BISAH 1B34 ; CM # Mn BALINESE SIGN REREKAN @@ -2018,8 +2072,7 @@ FE19 ; IN # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS 1CF4 ; CM # Mn VEDIC TONE CANDRA ABOVE 1CF7 ; CM # Mc VEDIC SIGN ATIKRAMA 1CF8..1CF9 ; CM # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE 
-1DC0..1DF9 ; CM # Mn [58] COMBINING DOTTED GRAVE ACCENT..COMBINING WIDE INVERTED BRIDGE BELOW -1DFB..1DFF ; CM # Mn [5] COMBINING DELETION MARK..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW +1DC0..1DFF ; CM # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW 200C ; CM # Cf ZERO WIDTH NON-JOINER 200E..200F ; CM # Cf [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK 202A..202E ; CM # Cf [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE @@ -2100,16 +2153,20 @@ FFF9..FFFB ; CM # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTAT 10D24..10D27 ; CM # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI 10EAB..10EAC ; CM # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK 10F46..10F50 ; CM # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW +10F82..10F85 ; CM # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW 11000 ; CM # Mc BRAHMI SIGN CANDRABINDU 11001 ; CM # Mn BRAHMI SIGN ANUSVARA 11002 ; CM # Mc BRAHMI SIGN VISARGA 11038..11046 ; CM # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA +11070 ; CM # Mn BRAHMI SIGN OLD TAMIL VIRAMA +11073..11074 ; CM # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O 1107F..11081 ; CM # Mn [3] BRAHMI NUMBER JOINER..KAITHI SIGN ANUSVARA 11082 ; CM # Mc KAITHI SIGN VISARGA 110B0..110B2 ; CM # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II 110B3..110B6 ; CM # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI 110B7..110B8 ; CM # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU 110B9..110BA ; CM # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA +110C2 ; CM # Mn KAITHI VOWEL SIGN VOCALIC R 11100..11102 ; CM # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA 11127..1112B ; CM # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU 1112C ; CM # Mc CHAKMA VOWEL SIGN E @@ -2243,6 +2300,8 @@ FFF9..FFFB ; CM # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTAT 16FF0..16FF1 ; CM # Mc [2] VIETNAMESE 
ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY 1BC9D..1BC9E ; CM # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK 1BCA0..1BCA3 ; CM # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP +1CF00..1CF2D ; CM # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT +1CF30..1CF46 ; CM # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG 1D165..1D166 ; CM # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM 1D167..1D169 ; CM # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3 1D16D..1D172 ; CM # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5 @@ -2263,6 +2322,7 @@ FFF9..FFFB ; CM # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTAT 1E023..1E024 ; CM # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS 1E026..1E02A ; CM # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA 1E130..1E136 ; CM # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D +1E2AE ; CM # Mn TOTO SIGN RISING TONE 1E2EC..1E2EF ; CM # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI 1E8D0..1E8D6 ; CM # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS 1E944..1E94A ; CM # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA @@ -2270,7 +2330,7 @@ E0001 ; CM # Cf LANGUAGE TAG E0020..E007F ; CM # Cf [96] TAG SPACE..CANCEL TAG E0100..E01EF ; CM # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256 -# Total code points: 2286 +# Total code points: 2399 # ================================================ @@ -2333,6 +2393,7 @@ A8FC ; BB # Po DEVANAGARI SIGN SIDDHAM 1804..1805 ; BA # Po [2] MONGOLIAN COLON..MONGOLIAN FOUR DOTS 1B5A..1B5B ; BA # Po [2] BALINESE PANTI..BALINESE PAMADA 1B5D..1B60 ; BA # Po [4] BALINESE CARIK PAMUNGKAH..BALINESE PAMENENG +1B7D..1B7E ; BA # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA 
LANTANG 1C3B..1C3F ; BA # Po [5] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION TSHOOK 1C7E..1C7F ; BA # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD 2000..2006 ; BA # Zs [7] EN QUAD..SIX-PER-EM SPACE @@ -2359,6 +2420,7 @@ A8FC ; BB # Po DEVANAGARI SIGN SIDDHAM 2E43..2E4A ; BA # Po [8] DASH WITH LEFT UPTURN..DOTTED SOLIDUS 2E4C ; BA # Po MEDIEVAL COMMA 2E4E..2E4F ; BA # Po [2] PUNCTUS ELEVATUS MARK..CORNISH VERSE DIVIDER +2E5D ; BA # Pd OBLIQUE HYPHEN 3000 ; BA # Zs IDEOGRAPHIC SPACE A4FE..A4FF ; BA # Po [2] LISU PUNCTUATION COMMA..LISU PUNCTUATION FULL STOP A60D ; BA # Po VAI COMMA @@ -2409,7 +2471,7 @@ ABEB ; BA # Po MEETEI MAYEK CHEIKHEI 1BC9F ; BA # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP 1DA87..1DA8A ; BA # Po [4] SIGNWRITING COMMA..SIGNWRITING COLON -# Total code points: 244 +# Total code points: 247 # ================================================ @@ -2577,8 +2639,9 @@ AADE..AADF ; SA # Po [2] TAI VIET SYMBOL HO HOI..TAI VIET SYMBOL KOI KOI 11727..1172B ; SA # Mn [5] AHOM VOWEL SIGN AW..AHOM SIGN KILLER 1173A..1173B ; SA # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY 1173F ; SA # So AHOM SYMBOL VI +11740..11746 ; SA # Lo [7] AHOM LETTER CA..AHOM LETTER LLA -# Total code points: 750 +# Total code points: 757 # ================================================ @@ -3698,8 +3761,10 @@ FF70 ; CJ # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK 1F9BB ; EB # So EAR WITH HEARING AID 1F9CD..1F9CF ; EB # So [3] STANDING PERSON..DEAF PERSON 1F9D1..1F9DD ; EB # So [13] ADULT..ELF +1FAC3..1FAC5 ; EB # So [3] PREGNANT MAN..PERSON WITH CROWN +1FAF0..1FAF6 ; EB # So [7] HAND WITH INDEX FINGER AND THUMB CROSSED..HEART HANDS -# Total code points: 122 +# Total code points: 132 # ================================================ diff --git a/lib/unicore/extracted/DNumType.txt b/lib/unicore/extracted/DNumType.txt index 984afe2f17..6d819ea990 100644 --- a/lib/unicore/extracted/DNumType.txt +++ b/lib/unicore/extracted/DNumType.txt @@ -1,6 +1,6 @@ -# 
DerivedNumericType-13.0.0.txt -# Date: 2019-09-08, 23:31:09 GMT -# © 2019 Unicode®, Inc. +# DerivedNumericType-14.0.0.txt +# Date: 2021-03-08, 06:22:31 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. # For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -265,6 +265,7 @@ FF10..FF19 ; Decimal # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 11D50..11D59 ; Decimal # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE 11DA0..11DA9 ; Decimal # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE 16A60..16A69 ; Decimal # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE +16AC0..16AC9 ; Decimal # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE 16B50..16B59 ; Decimal # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE 1D7CE..1D7FF ; Decimal # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE 1E140..1E149 ; Decimal # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE @@ -272,6 +273,6 @@ FF10..FF19 ; Decimal # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE 1E950..1E959 ; Decimal # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE 1FBF0..1FBF9 ; Decimal # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE -# Total code points: 650 +# Total code points: 660 # EOF diff --git a/lib/unicore/extracted/DNumValues.txt b/lib/unicore/extracted/DNumValues.txt index f70662acc9..84cb90749a 100644 --- a/lib/unicore/extracted/DNumValues.txt +++ b/lib/unicore/extracted/DNumValues.txt @@ -1,6 +1,6 @@ -# DerivedNumericValues-13.0.0.txt -# Date: 2019-09-08, 23:31:10 GMT -# © 2019 Unicode®, Inc. +# DerivedNumericValues-14.0.0.txt +# Date: 2021-03-08, 06:22:32 GMT +# © 2021 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. 
# For terms of use, see http://www.unicode.org/terms_of_use.html # @@ -106,6 +106,7 @@ FF10 ; 0.0 ; ; 0 # Nd FULLWIDTH DIGIT ZERO 11D50 ; 0.0 ; ; 0 # Nd MASARAM GONDI DIGIT ZERO 11DA0 ; 0.0 ; ; 0 # Nd GUNJALA GONDI DIGIT ZERO 16A60 ; 0.0 ; ; 0 # Nd MRO DIGIT ZERO +16AC0 ; 0.0 ; ; 0 # Nd TANGSA DIGIT ZERO 16B50 ; 0.0 ; ; 0 # Nd PAHAWH HMONG DIGIT ZERO 16E80 ; 0.0 ; ; 0 # No MEDEFAIDRIN DIGIT ZERO 1D2E0 ; 0.0 ; ; 0 # No MAYAN NUMERAL ZERO @@ -121,7 +122,7 @@ FF10 ; 0.0 ; ; 0 # Nd FULLWIDTH DIGIT ZERO 1F10B..1F10C ; 0.0 ; ; 0 # No [2] DINGBAT CIRCLED SANS-SERIF DIGIT ZERO..DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ZERO 1FBF0 ; 0.0 ; ; 0 # Nd SEGMENTED DIGIT ZERO -# Total code points: 83 +# Total code points: 84 # ================================================ @@ -520,6 +521,7 @@ FF11 ; 1.0 ; ; 1 # Nd FULLWIDTH DIGIT ONE 1244F ; 1.0 ; ; 1 # Nl CUNEIFORM NUMERIC SIGN ONE BAN2 12458 ; 1.0 ; ; 1 # Nl CUNEIFORM NUMERIC SIGN ONE ESHE3 16A61 ; 1.0 ; ; 1 # Nd MRO DIGIT ONE +16AC1 ; 1.0 ; ; 1 # Nd TANGSA DIGIT ONE 16B51 ; 1.0 ; ; 1 # Nd PAHAWH HMONG DIGIT ONE 16E81 ; 1.0 ; ; 1 # No MEDEFAIDRIN DIGIT ONE 16E94 ; 1.0 ; ; 1 # No MEDEFAIDRIN DIGIT ONE ALTERNATE FORM @@ -544,7 +546,7 @@ FF11 ; 1.0 ; ; 1 # Nd FULLWIDTH DIGIT ONE 1FBF1 ; 1.0 ; ; 1 # Nd SEGMENTED DIGIT ONE 2092A ; 1.0 ; ; 1 # Lo CJK UNIFIED IDEOGRAPH-2092A -# Total code points: 140 +# Total code points: 141 # ================================================ @@ -667,6 +669,7 @@ FF12 ; 2.0 ; ; 2 # Nd FULLWIDTH DIGIT TWO 12456 ; 2.0 ; ; 2 # Nl CUNEIFORM NUMERIC SIGN NIGIDAMIN 12459 ; 2.0 ; ; 2 # Nl CUNEIFORM NUMERIC SIGN TWO ESHE3 16A62 ; 2.0 ; ; 2 # Nd MRO DIGIT TWO +16AC2 ; 2.0 ; ; 2 # Nd TANGSA DIGIT TWO 16B52 ; 2.0 ; ; 2 # Nd PAHAWH HMONG DIGIT TWO 16E82 ; 2.0 ; ; 2 # No MEDEFAIDRIN DIGIT TWO 16E95 ; 2.0 ; ; 2 # No MEDEFAIDRIN DIGIT TWO ALTERNATE FORM @@ -691,7 +694,7 @@ FF12 ; 2.0 ; ; 2 # Nd FULLWIDTH DIGIT TWO 1FBF2 ; 2.0 ; ; 2 # Nd SEGMENTED DIGIT TWO 22390 ; 2.0 ; ; 2 # Lo CJK UNIFIED IDEOGRAPH-22390 -# Total 
code points: 139 +# Total code points: 140 # ================================================ @@ -809,6 +812,7 @@ FF13 ; 3.0 ; ; 3 # Nd FULLWIDTH DIGIT THREE 12451 ; 3.0 ; ; 3 # Nl CUNEIFORM NUMERIC SIGN THREE BAN2 12457 ; 3.0 ; ; 3 # Nl CUNEIFORM NUMERIC SIGN NIGIDAESH 16A63 ; 3.0 ; ; 3 # Nd MRO DIGIT THREE +16AC3 ; 3.0 ; ; 3 # Nd TANGSA DIGIT THREE 16B53 ; 3.0 ; ; 3 # Nd PAHAWH HMONG DIGIT THREE 16E83 ; 3.0 ; ; 3 # No MEDEFAIDRIN DIGIT THREE 16E96 ; 3.0 ; ; 3 # No MEDEFAIDRIN DIGIT THREE ALTERNATE FORM @@ -835,7 +839,7 @@ FF13 ; 3.0 ; ; 3 # Nd FULLWIDTH DIGIT THREE 22998 ; 3.0 ; ; 3 # Lo CJK UNIFIED IDEOGRAPH-22998 23B1B ; 3.0 ; ; 3 # Lo CJK UNIFIED IDEOGRAPH-23B1B -# Total code points: 140 +# Total code points: 141 # ================================================ @@ -948,6 +952,7 @@ FF14 ; 4.0 ; ; 4 # Nd FULLWIDTH DIGIT FOUR 12452..12453 ; 4.0 ; ; 4 # Nl [2] CUNEIFORM NUMERIC SIGN FOUR BAN2..CUNEIFORM NUMERIC SIGN FOUR BAN2 VARIANT FORM 12469 ; 4.0 ; ; 4 # Nl CUNEIFORM NUMERIC SIGN FOUR U VARIANT FORM 16A64 ; 4.0 ; ; 4 # Nd MRO DIGIT FOUR +16AC4 ; 4.0 ; ; 4 # Nd TANGSA DIGIT FOUR 16B54 ; 4.0 ; ; 4 # Nd PAHAWH HMONG DIGIT FOUR 16E84 ; 4.0 ; ; 4 # No MEDEFAIDRIN DIGIT FOUR 1D2E4 ; 4.0 ; ; 4 # No MAYAN NUMERAL FOUR @@ -972,7 +977,7 @@ FF14 ; 4.0 ; ; 4 # Nd FULLWIDTH DIGIT FOUR 200E2 ; 4.0 ; ; 4 # Lo CJK UNIFIED IDEOGRAPH-200E2 2626D ; 4.0 ; ; 4 # Lo CJK UNIFIED IDEOGRAPH-2626D -# Total code points: 131 +# Total code points: 132 # ================================================ @@ -1088,6 +1093,7 @@ FF15 ; 5.0 ; ; 5 # Nd FULLWIDTH DIGIT FIVE 12454..12455 ; 5.0 ; ; 5 # Nl [2] CUNEIFORM NUMERIC SIGN FIVE BAN2..CUNEIFORM NUMERIC SIGN FIVE BAN2 VARIANT FORM 1246A ; 5.0 ; ; 5 # Nl CUNEIFORM NUMERIC SIGN FIVE U VARIANT FORM 16A65 ; 5.0 ; ; 5 # Nd MRO DIGIT FIVE +16AC5 ; 5.0 ; ; 5 # Nd TANGSA DIGIT FIVE 16B55 ; 5.0 ; ; 5 # Nd PAHAWH HMONG DIGIT FIVE 16E85 ; 5.0 ; ; 5 # No MEDEFAIDRIN DIGIT FIVE 1D2E5 ; 5.0 ; ; 5 # No MAYAN NUMERAL FIVE @@ -1111,7 +1117,7 @@ FF15 ; 5.0 ; 
; 5 # Nd FULLWIDTH DIGIT FIVE 1FBF5 ; 5.0 ; ; 5 # Nd SEGMENTED DIGIT FIVE 20121 ; 5.0 ; ; 5 # Lo CJK UNIFIED IDEOGRAPH-20121 -# Total code points: 129 +# Total code points: 130 # ================================================ @@ -1214,6 +1220,7 @@ FF16 ; 6.0 ; ; 6 # Nd FULLWIDTH DIGIT SIX 1244E ; 6.0 ; ; 6 # Nl CUNEIFORM NUMERIC SIGN SIX ASH TENU 1246B ; 6.0 ; ; 6 # Nl CUNEIFORM NUMERIC SIGN SIX U VARIANT FORM 16A66 ; 6.0 ; ; 6 # Nd MRO DIGIT SIX +16AC6 ; 6.0 ; ; 6 # Nd TANGSA DIGIT SIX 16B56 ; 6.0 ; ; 6 # Nd PAHAWH HMONG DIGIT SIX 16E86 ; 6.0 ; ; 6 # No MEDEFAIDRIN DIGIT SIX 1D2E6 ; 6.0 ; ; 6 # No MAYAN NUMERAL SIX @@ -1235,7 +1242,7 @@ FF16 ; 6.0 ; ; 6 # Nd FULLWIDTH DIGIT SIX 1FBF6 ; 6.0 ; ; 6 # Nd SEGMENTED DIGIT SIX 20AEA ; 6.0 ; ; 6 # Lo CJK UNIFIED IDEOGRAPH-20AEA -# Total code points: 113 +# Total code points: 114 # ================================================ @@ -1335,6 +1342,7 @@ FF17 ; 7.0 ; ; 7 # Nd FULLWIDTH DIGIT SEVEN 12441..12443 ; 7.0 ; ; 7 # Nl [3] CUNEIFORM NUMERIC SIGN SEVEN VARIANT FORM IMIN3..CUNEIFORM NUMERIC SIGN SEVEN VARIANT FORM IMIN B 1246C ; 7.0 ; ; 7 # Nl CUNEIFORM NUMERIC SIGN SEVEN U VARIANT FORM 16A67 ; 7.0 ; ; 7 # Nd MRO DIGIT SEVEN +16AC7 ; 7.0 ; ; 7 # Nd TANGSA DIGIT SEVEN 16B57 ; 7.0 ; ; 7 # Nd PAHAWH HMONG DIGIT SEVEN 16E87 ; 7.0 ; ; 7 # No MEDEFAIDRIN DIGIT SEVEN 1D2E7 ; 7.0 ; ; 7 # No MAYAN NUMERAL SEVEN @@ -1356,7 +1364,7 @@ FF17 ; 7.0 ; ; 7 # Nd FULLWIDTH DIGIT SEVEN 1FBF7 ; 7.0 ; ; 7 # Nd SEGMENTED DIGIT SEVEN 20001 ; 7.0 ; ; 7 # Lo CJK UNIFIED IDEOGRAPH-20001 -# Total code points: 112 +# Total code points: 113 # ================================================ @@ -1454,6 +1462,7 @@ FF18 ; 8.0 ; ; 8 # Nd FULLWIDTH DIGIT EIGHT 12444..12445 ; 8.0 ; ; 8 # Nl [2] CUNEIFORM NUMERIC SIGN EIGHT VARIANT FORM USSU..CUNEIFORM NUMERIC SIGN EIGHT VARIANT FORM USSU3 1246D ; 8.0 ; ; 8 # Nl CUNEIFORM NUMERIC SIGN EIGHT U VARIANT FORM 16A68 ; 8.0 ; ; 8 # Nd MRO DIGIT EIGHT +16AC8 ; 8.0 ; ; 8 # Nd TANGSA DIGIT EIGHT 16B58 ; 8.0 ; ; 8 
# Nd PAHAWH HMONG DIGIT EIGHT 16E88 ; 8.0 ; ; 8 # No MEDEFAIDRIN DIGIT EIGHT 1D2E8 ; 8.0 ; ; 8 # No MAYAN NUMERAL EIGHT @@ -1474,7 +1483,7 @@ FF18 ; 8.0 ; ; 8 # Nd FULLWIDTH DIGIT EIGHT 1F109 ; 8.0 ; ; 8 # No DIGIT EIGHT COMMA 1FBF8 ; 8.0 ; ; 8 # Nd SEGMENTED DIGIT EIGHT -# Total code points: 108 +# Total code points: 109 # ================================================ @@ -1573,6 +1582,7 @@ FF19 ; 9.0 ; ; 9 # Nd FULLWIDTH DIGIT NINE 12446..12449 ; 9.0 ; ; 9 # Nl [4] CUNEIFORM NUMERIC SIGN NINE VARIANT FORM ILIMMU..CUNEIFORM NUMERIC SIGN NINE VARIANT FORM ILIMMU A 1246E ; 9.0 ; ; 9 # Nl CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM 16A69 ; 9.0 ; ; 9 # Nd MRO DIGIT NINE +16AC9 ; 9.0 ; ; 9 # Nd TANGSA DIGIT NINE 16B59 ; 9.0 ; ; 9 # Nd PAHAWH HMONG DIGIT NINE 16E89 ; 9.0 ; ; 9 # No MEDEFAIDRIN DIGIT NINE 1D2E9 ; 9.0 ; ; 9 # No MAYAN NUMERAL NINE @@ -1594,7 +1604,7 @@ FF19 ; 9.0 ; ; 9 # Nd FULLWIDTH DIGIT NINE 1FBF9 ; 9.0 ; ; 9 # Nd SEGMENTED DIGIT NINE 2F890 ; 9.0 ; ; 9 # Lo CJK COMPATIBILITY IDEOGRAPH-2F890 -# Total code points: 112 +# Total code points: 113 # ================================================ diff --git a/lib/unicore/mktables b/lib/unicore/mktables index 89a2e15ef5..187915bc8b 100644 --- a/lib/unicore/mktables +++ b/lib/unicore/mktables @@ -48,7 +48,7 @@ sub NON_ASCII_PLATFORM { ord("A") != 65 } # expected, a warning will be generated. If an older version is being # compiled, any bounds tests that fail in the generated test file (-maketest # option) will be marked as TODO. -my $version_of_mk_invlist_bounds = v13.0.0; +my $version_of_mk_invlist_bounds = v14.0.0; ########################################################################## # diff --git a/lib/unicore/uni_keywords.pl b/lib/unicore/uni_keywords.pl index b08ab3b738..1cb7904a9f 100644 --- a/lib/unicore/uni_keywords.pl +++ b/lib/unicore/uni_keywords.pl @@ -4,19 +4,19 @@ # Any changes made here will be lost! 
%Unicode::UCD::uni_prop_ptrs_indices = ( - '_perl_any_folds' => 1187, - '_perl_charname_begin' => 1188, - '_perl_charname_continue' => 1189, - '_perl_folds_to_multi_char' => 1190, - '_perl_idcont' => 1191, - '_perl_idstart' => 1192, - '_perl_is_in_multi_char_fold' => 1193, - '_perl_nchar' => 1194, - '_perl_patws' => 1195, - '_perl_problematic_locale_foldeds_start' => 1196, - '_perl_problematic_locale_folds' => 1197, - '_perl_quotemeta' => 1198, - '_perl_surrogate' => 1199, + '_perl_any_folds' => 1211, + '_perl_charname_begin' => 1212, + '_perl_charname_continue' => 1213, + '_perl_folds_to_multi_char' => 1214, + '_perl_idcont' => 1215, + '_perl_idstart' => 1216, + '_perl_is_in_multi_char_fold' => 1217, + '_perl_nchar' => 1218, + '_perl_patws' => 1219, + '_perl_problematic_locale_foldeds_start' => 1220, + '_perl_problematic_locale_folds' => 1221, + '_perl_quotemeta' => 1222, + '_perl_surrogate' => 1223, 'adlm' => 1, 'aegeannumbers' => 2, 'age=10' => 3, @@ -24,1280 +24,1304 @@ 'age=12' => 5, 'age=12.1' => 6, 'age=13' => 7, - 'age=2' => 8, - 'age=2.1' => 9, - 'age=3' => 10, - 'age=3.1' => 11, - 'age=3.2' => 12, - 'age=4' => 13, - 'age=4.1' => 14, - 'age=5' => 15, - 'age=5.1' => 16, - 'age=5.2' => 17, - 'age=6' => 18, - 'age=6.1' => 19, - 'age=6.2' => 20, - 'age=6.3' => 21, - 'age=7' => 22, - 'age=8' => 23, - 'age=9' => 24, - 'age=na' => 25, - 'aghb' => 26, - 'ahex' => 970, - 'ahom' => 27, - 'alchemical' => 28, - 'all' => 29, - 'alnum' => 1161, - 'alpha' => 1162, - 'alphabetic' => 1162, - 'alphabeticpf' => 30, - 'ancientgreekmusic' => 31, - 'ancientgreeknumbers' => 32, - 'ancientsymbols' => 33, - 'any' => 34, - 'arab' => 35, - 'arabicexta' => 36, - 'arabicmath' => 37, - 'arabicpfa' => 38, - 'arabicpfb' => 39, - 'arabicsup' => 40, - 'armi' => 41, - 'armn' => 42, - 'arrows' => 43, - 'ascii' => 44, - 'asciihexdigit' => 970, - 'assigned' => 45, - 'avst' => 46, - 'bali' => 47, - 'bamu' => 48, - 'bamumsup' => 49, - 'basiclatin' => 44, - 'bass' => 50, - 'batk' => 51, - 'bc=al' 
=> 52, - 'bc=an' => 53, - 'bc=b' => 54, - 'bc=bn' => 55, - 'bc=cs' => 56, - 'bc=en' => 57, - 'bc=es' => 58, - 'bc=et' => 59, - 'bc=fsi' => 60, - 'bc=l' => 61, - 'bc=lre' => 62, - 'bc=lri' => 63, - 'bc=lro' => 64, - 'bc=nsm' => 65, - 'bc=on' => 66, - 'bc=pdf' => 67, - 'bc=pdi' => 68, - 'bc=r' => 69, - 'bc=rle' => 70, - 'bc=rli' => 71, - 'bc=rlo' => 72, - 'bc=s' => 73, - 'bc=ws' => 74, - 'beng' => 75, - 'bhks' => 76, - 'bidic' => 77, - 'bidim' => 78, - 'blank' => 1163, - 'blockelements' => 79, - 'bopo' => 80, - 'bopomofoext' => 81, - 'boxdrawing' => 82, - 'bpt=c' => 83, - 'bpt=n' => 84, - 'bpt=o' => 85, - 'brah' => 86, - 'brai' => 87, - 'bugi' => 88, - 'buhd' => 89, - 'byzantinemusic' => 90, - 'c' => 91, - 'cakm' => 92, - 'cans' => 93, - 'cari' => 94, - 'cased' => 95, - 'casedletter' => 96, - 'cc' => 1164, - 'ccc=0' => 97, - 'ccc=1' => 98, - 'ccc=10' => 99, - 'ccc=103' => 100, - 'ccc=107' => 101, - 'ccc=11' => 102, - 'ccc=118' => 103, - 'ccc=12' => 104, - 'ccc=122' => 105, - 'ccc=129' => 106, - 'ccc=13' => 107, - 'ccc=130' => 108, - 'ccc=132' => 109, - 'ccc=14' => 110, - 'ccc=15' => 111, - 'ccc=16' => 112, - 'ccc=17' => 113, - 'ccc=18' => 114, - 'ccc=19' => 115, - 'ccc=20' => 116, - 'ccc=202' => 117, - 'ccc=21' => 118, - 'ccc=214' => 119, - 'ccc=216' => 120, - 'ccc=22' => 121, - 'ccc=23' => 122, - 'ccc=24' => 123, - 'ccc=25' => 124, - 'ccc=26' => 125, - 'ccc=27' => 126, - 'ccc=28' => 127, - 'ccc=29' => 128, - 'ccc=30' => 129, - 'ccc=31' => 130, - 'ccc=32' => 131, - 'ccc=33' => 132, - 'ccc=34' => 133, - 'ccc=35' => 134, - 'ccc=36' => 135, - 'ccc=6' => 136, - 'ccc=7' => 137, - 'ccc=8' => 138, - 'ccc=84' => 139, - 'ccc=9' => 140, - 'ccc=91' => 141, - 'ccc=a' => 142, - 'ccc=al' => 143, - 'ccc=ar' => 144, - 'ccc=b' => 145, - 'ccc=bl' => 146, - 'ccc=br' => 147, - 'ccc=da' => 148, - 'ccc=db' => 149, - 'ccc=is' => 150, - 'ccc=l' => 151, - 'ccc=r' => 152, - 'ce' => 153, - 'cf' => 154, - 'cham' => 155, - 'cher' => 156, - 'cherokeesup' => 157, - 'chesssymbols' => 158, - 'chrs' 
=> 159, - 'ci' => 160, - 'cjk' => 161, - 'cjkcompat' => 162, - 'cjkcompatforms' => 163, - 'cjkcompatideographs' => 164, - 'cjkcompatideographssup' => 165, - 'cjkexta' => 166, - 'cjkextb' => 167, - 'cjkextc' => 168, - 'cjkextd' => 169, - 'cjkexte' => 170, - 'cjkextf' => 171, - 'cjkextg' => 172, - 'cjkradicalssup' => 173, - 'cjkstrokes' => 174, - 'cjksymbols' => 175, - 'cn' => 176, - 'cntrl' => 1164, - 'co' => 177, - 'compatjamo' => 178, - 'compex' => 179, - 'control' => 1164, - 'controlpictures' => 180, - 'copt' => 181, - 'copticepactnumbers' => 182, - 'countingrod' => 183, - 'cprt' => 184, - 'cuneiformnumbers' => 185, - 'currencysymbols' => 186, - 'cwcf' => 187, - 'cwcm' => 188, - 'cwkcf' => 189, - 'cwl' => 190, - 'cwt' => 191, - 'cwu' => 192, - 'cypriotsyllabary' => 193, - 'cyrillicexta' => 194, - 'cyrillicextb' => 195, - 'cyrillicextc' => 196, - 'cyrillicsup' => 197, - 'cyrl' => 198, - 'dash' => 199, - 'decimalnumber' => 1165, - 'dep' => 200, - 'deva' => 201, - 'devanagariext' => 202, - 'di' => 203, - 'dia' => 204, - 'diacriticals' => 205, - 'diacriticalsext' => 206, - 'diacriticalsforsymbols' => 207, - 'diacriticalssup' => 208, - 'diak' => 209, - 'digit' => 1165, - 'dingbats' => 210, - 'dogr' => 211, - 'domino' => 212, - 'dsrt' => 213, - 'dt=can' => 214, - 'dt=com' => 215, - 'dt=enc' => 216, - 'dt=fin' => 217, - 'dt=font' => 218, - 'dt=fra' => 219, - 'dt=init' => 220, - 'dt=iso' => 221, - 'dt=med' => 222, - 'dt=nar' => 223, - 'dt=nb' => 224, - 'dt=noncanon' => 225, - 'dt=none' => 226, - 'dt=sml' => 227, - 'dt=sqr' => 228, - 'dt=sub' => 229, - 'dt=sup' => 230, - 'dt=vert' => 231, - 'dupl' => 232, - 'ea=a' => 234, - 'ea=f' => 235, - 'ea=h' => 236, - 'ea=n' => 237, - 'ea=na' => 238, - 'ea=w' => 239, - 'earlydynasticcuneiform' => 233, - 'ebase' => 240, - 'ecomp' => 241, - 'egyp' => 242, - 'egyptianhieroglyphformatcontrols' => 243, - 'elba' => 244, - 'elym' => 245, - 'emod' => 246, - 'emoji' => 247, - 'emoticons' => 248, - 'enclosedalphanum' => 249, - 
'enclosedalphanumsup' => 250, - 'enclosedcjk' => 251, - 'enclosedideographicsup' => 252, - 'epres' => 253, - 'ethi' => 254, - 'ethiopicext' => 255, - 'ethiopicexta' => 256, - 'ethiopicsup' => 257, - 'ext' => 258, - 'extpict' => 259, - 'gcb=cn' => 260, - 'gcb=ex' => 261, - 'gcb=l' => 262, - 'gcb=pp' => 263, - 'gcb=sm' => 264, - 'gcb=t' => 265, - 'gcb=v' => 266, - 'gcb=xx' => 267, - 'geometricshapes' => 268, - 'geometricshapesext' => 269, - 'geor' => 270, - 'georgianext' => 271, - 'georgiansup' => 272, - 'glag' => 273, - 'glagoliticsup' => 274, - 'gong' => 275, - 'gonm' => 276, - 'goth' => 277, - 'gran' => 278, - 'graph' => 1166, - 'grbase' => 279, - 'greekext' => 280, - 'grek' => 281, - 'grext' => 282, - 'gujr' => 283, - 'guru' => 284, - 'halfandfullforms' => 285, - 'halfmarks' => 286, - 'han' => 287, - 'hang' => 288, - 'hano' => 289, - 'hatr' => 290, - 'hebr' => 291, - 'hex' => 1173, - 'hexdigit' => 1173, - 'highpusurrogates' => 292, - 'highsurrogates' => 293, - 'hira' => 294, - 'hluw' => 295, - 'hmng' => 296, - 'hmnp' => 297, - 'horizspace' => 1163, - 'hst=na' => 298, - 'hung' => 299, - 'hyphen_perl_aux' => 300, - 'idc' => 301, - 'identifierstatus=allowed' => 302, - 'identifierstatus=restricted' => 303, - 'identifiertype=defaultignorable' => 304, - 'identifiertype=exclusion' => 305, - 'identifiertype=inclusion' => 306, - 'identifiertype=limiteduse' => 307, - 'identifiertype=notcharacter' => 308, - 'identifiertype=notnfkc' => 309, - 'identifiertype=notxid' => 310, - 'identifiertype=obsolete' => 311, - 'identifiertype=recommended' => 312, - 'identifiertype=technical' => 313, - 'identifiertype=uncommonuse' => 314, - 'ideo' => 315, - 'ideographicsymbols' => 316, - 'ids' => 317, - 'idsb' => 318, - 'idst' => 319, - 'in=1.1' => 517, - 'in=10' => 512, - 'in=11' => 513, - 'in=12' => 514, - 'in=12.1' => 515, - 'in=13' => 516, - 'in=2' => 518, - 'in=2.1' => 519, - 'in=3' => 520, - 'in=3.1' => 521, - 'in=3.2' => 522, - 'in=4' => 523, - 'in=4.1' => 524, - 'in=5' => 525, - 
'in=5.1' => 526, - 'in=5.2' => 527, - 'in=6' => 528, - 'in=6.1' => 529, - 'in=6.2' => 530, - 'in=6.3' => 531, - 'in=7' => 532, - 'in=8' => 533, - 'in=9' => 534, - 'inadlam' => 320, - 'inahom' => 321, - 'inanatolianhieroglyphs' => 322, - 'inarabic' => 323, - 'inarmenian' => 324, - 'inavestan' => 325, - 'inbalinese' => 326, - 'inbamum' => 327, - 'inbassavah' => 328, - 'inbatak' => 329, - 'inbengali' => 330, - 'inbhaiksuki' => 331, - 'inbopomofo' => 332, - 'inbrahmi' => 333, - 'inbuginese' => 334, - 'inbuhid' => 335, - 'incarian' => 336, - 'incaucasianalbanian' => 337, - 'inchakma' => 338, - 'incham' => 339, - 'incherokee' => 340, - 'inchorasmian' => 341, - 'incoptic' => 342, - 'incuneiform' => 343, - 'incyrillic' => 344, - 'indevanagari' => 345, - 'indicnumberforms' => 346, - 'indicsiyaqnumbers' => 347, - 'indivesakuru' => 348, - 'indogra' => 349, - 'induployan' => 350, - 'inegyptianhieroglyphs' => 351, - 'inelbasan' => 352, - 'inelymaic' => 353, - 'inethiopic' => 354, - 'ingeorgian' => 355, - 'inglagolitic' => 356, - 'ingothic' => 357, - 'ingrantha' => 358, - 'ingreek' => 359, - 'ingujarati' => 360, - 'ingunjalagondi' => 361, - 'ingurmukhi' => 362, - 'inhangul' => 363, - 'inhanifirohingya' => 364, - 'inhanunoo' => 365, - 'inhatran' => 366, - 'inhebrew' => 367, - 'inhiragana' => 368, - 'inidc' => 369, - 'inimperialaramaic' => 370, - 'ininscriptionalpahlavi' => 371, - 'ininscriptionalparthian' => 372, - 'injavanese' => 373, - 'inkaithi' => 374, - 'inkannada' => 375, - 'inkatakana' => 376, - 'inkharoshthi' => 377, - 'inkhitansmallscript' => 378, - 'inkhmer' => 379, - 'inkhojki' => 380, - 'inkhudawadi' => 381, - 'inlao' => 382, - 'inlepcha' => 383, - 'inlimbu' => 384, - 'inlineara' => 385, - 'inlisu' => 386, - 'inlycian' => 387, - 'inlydian' => 388, - 'inmahajani' => 389, - 'inmakasar' => 390, - 'inmalayalam' => 391, - 'inmandaic' => 392, - 'inmanichaean' => 393, - 'inmarchen' => 394, - 'inmasaramgondi' => 395, - 'inmedefaidrin' => 396, - 'inmeeteimayek' => 397, - 
'inmendekikakui' => 398, - 'inmeroiticcursive' => 399, - 'inmiao' => 400, - 'inmodi' => 401, - 'inmongolian' => 402, - 'inmro' => 403, - 'inmultani' => 404, - 'inmyanmar' => 405, - 'innabataean' => 406, - 'innandinagari' => 407, - 'innewa' => 408, - 'innewtailue' => 409, - 'innko' => 410, - 'innushu' => 411, - 'innyiakengpuachuehmong' => 412, - 'inogham' => 413, - 'inoldhungarian' => 414, - 'inolditalic' => 415, - 'inoldpermic' => 416, - 'inoldpersian' => 417, - 'inoldsogdian' => 418, - 'inoldturkic' => 419, - 'inoriya' => 420, - 'inosage' => 421, - 'inosmanya' => 422, - 'inpahawhhmong' => 423, - 'inpaucinhau' => 424, - 'inpc=bottom' => 425, - 'inpc=bottomandleft' => 426, - 'inpc=bottomandright' => 427, - 'inpc=left' => 428, - 'inpc=leftandright' => 429, - 'inpc=na' => 430, - 'inpc=overstruck' => 431, - 'inpc=right' => 432, - 'inpc=top' => 433, - 'inpc=topandbottom' => 434, - 'inpc=topandbottomandleft' => 435, - 'inpc=topandbottomandright' => 436, - 'inpc=topandleft' => 437, - 'inpc=topandleftandright' => 438, - 'inpc=topandright' => 439, - 'inphagspa' => 440, - 'inphoenician' => 441, - 'inpsalterpahlavi' => 442, - 'inpunctuation' => 443, - 'inrejang' => 444, - 'inrunic' => 445, - 'insamaritan' => 446, - 'insaurashtra' => 447, - 'insc=avagraha' => 448, - 'insc=bindu' => 449, - 'insc=brahmijoiningnumber' => 450, - 'insc=cantillationmark' => 451, - 'insc=consonant' => 452, - 'insc=consonantdead' => 453, - 'insc=consonantfinal' => 454, - 'insc=consonantheadletter' => 455, - 'insc=consonantinitialpostfixed' => 456, - 'insc=consonantkiller' => 457, - 'insc=consonantmedial' => 458, - 'insc=consonantplaceholder' => 459, - 'insc=consonantprecedingrepha' => 460, - 'insc=consonantprefixed' => 461, - 'insc=consonantsubjoined' => 462, - 'insc=consonantsucceedingrepha' => 463, - 'insc=consonantwithstacker' => 464, - 'insc=geminationmark' => 465, - 'insc=invisiblestacker' => 466, - 'insc=modifyingletter' => 467, - 'insc=nonjoiner' => 468, - 'insc=nukta' => 469, - 'insc=number' 
=> 470, - 'insc=numberjoiner' => 471, - 'insc=other' => 472, - 'insc=purekiller' => 473, - 'insc=registershifter' => 474, - 'insc=syllablemodifier' => 475, - 'insc=toneletter' => 476, - 'insc=tonemark' => 477, - 'insc=virama' => 478, - 'insc=visarga' => 479, - 'insc=vowel' => 480, - 'insc=voweldependent' => 481, - 'insc=vowelindependent' => 482, - 'insiddham' => 483, - 'insinhala' => 484, - 'insogdian' => 485, - 'insorasompeng' => 486, - 'insoyombo' => 487, - 'insundanese' => 488, - 'insylotinagri' => 489, - 'insyriac' => 490, - 'intagalog' => 491, - 'intagbanwa' => 492, - 'intaile' => 493, - 'intaitham' => 494, - 'intaiviet' => 495, - 'intakri' => 496, - 'intamil' => 497, - 'intangut' => 498, - 'intelugu' => 499, - 'inthaana' => 500, - 'inthai' => 501, - 'intibetan' => 502, - 'intifinagh' => 503, - 'intirhuta' => 504, - 'inugaritic' => 505, - 'invai' => 506, - 'invs' => 507, - 'inwancho' => 508, - 'inwarangciti' => 509, - 'inyezidi' => 510, - 'inzanabazarsquare' => 511, - 'ipaext' => 535, - 'ital' => 536, - 'jamo' => 537, - 'jamoexta' => 538, - 'jamoextb' => 539, - 'java' => 540, - 'jg=africanfeh' => 541, - 'jg=africannoon' => 542, - 'jg=africanqaf' => 543, - 'jg=ain' => 544, - 'jg=alaph' => 545, - 'jg=alef' => 546, - 'jg=beh' => 547, - 'jg=beth' => 548, - 'jg=burushaskiyehbarree' => 549, - 'jg=dal' => 550, - 'jg=dalathrish' => 551, - 'jg=e' => 552, - 'jg=farsiyeh' => 553, - 'jg=fe' => 554, - 'jg=feh' => 555, - 'jg=finalsemkath' => 556, - 'jg=gaf' => 557, - 'jg=gamal' => 558, - 'jg=hah' => 559, - 'jg=hamzaonhehgoal' => 560, - 'jg=hanifirohingyakinnaya' => 561, - 'jg=hanifirohingyapa' => 562, - 'jg=he' => 563, - 'jg=heh' => 564, - 'jg=hehgoal' => 565, - 'jg=heth' => 566, - 'jg=kaf' => 567, - 'jg=kaph' => 568, - 'jg=khaph' => 569, - 'jg=knottedheh' => 570, - 'jg=lam' => 571, - 'jg=lamadh' => 572, - 'jg=malayalambha' => 573, - 'jg=malayalamja' => 574, - 'jg=malayalamlla' => 575, - 'jg=malayalamllla' => 576, - 'jg=malayalamnga' => 577, - 'jg=malayalamnna' => 578, - 
'jg=malayalamnnna' => 579, - 'jg=malayalamnya' => 580, - 'jg=malayalamra' => 581, - 'jg=malayalamssa' => 582, - 'jg=malayalamtta' => 583, - 'jg=manichaeanaleph' => 584, - 'jg=manichaeanayin' => 585, - 'jg=manichaeanbeth' => 586, - 'jg=manichaeandaleth' => 587, - 'jg=manichaeandhamedh' => 588, - 'jg=manichaeanfive' => 589, - 'jg=manichaeangimel' => 590, - 'jg=manichaeanheth' => 591, - 'jg=manichaeanhundred' => 592, - 'jg=manichaeankaph' => 593, - 'jg=manichaeanlamedh' => 594, - 'jg=manichaeanmem' => 595, - 'jg=manichaeannun' => 596, - 'jg=manichaeanone' => 597, - 'jg=manichaeanpe' => 598, - 'jg=manichaeanqoph' => 599, - 'jg=manichaeanresh' => 600, - 'jg=manichaeansadhe' => 601, - 'jg=manichaeansamekh' => 602, - 'jg=manichaeantaw' => 603, - 'jg=manichaeanten' => 604, - 'jg=manichaeanteth' => 605, - 'jg=manichaeanthamedh' => 606, - 'jg=manichaeantwenty' => 607, - 'jg=manichaeanwaw' => 608, - 'jg=manichaeanyodh' => 609, - 'jg=manichaeanzayin' => 610, - 'jg=meem' => 611, - 'jg=mim' => 612, - 'jg=nojoininggroup' => 613, - 'jg=noon' => 614, - 'jg=nun' => 615, - 'jg=nya' => 616, - 'jg=pe' => 617, - 'jg=qaf' => 618, - 'jg=qaph' => 619, - 'jg=reh' => 620, - 'jg=reversedpe' => 621, - 'jg=rohingyayeh' => 622, - 'jg=sad' => 623, - 'jg=sadhe' => 624, - 'jg=seen' => 625, - 'jg=semkath' => 626, - 'jg=shin' => 627, - 'jg=straightwaw' => 628, - 'jg=swashkaf' => 629, - 'jg=syriacwaw' => 630, - 'jg=tah' => 631, - 'jg=taw' => 632, - 'jg=tehmarbuta' => 633, - 'jg=teth' => 634, - 'jg=waw' => 635, - 'jg=yeh' => 636, - 'jg=yehbarree' => 637, - 'jg=yehwithtail' => 638, - 'jg=yudh' => 639, - 'jg=yudhhe' => 640, - 'jg=zain' => 641, - 'jg=zhain' => 642, - 'joinc' => 643, - 'jt=c' => 644, - 'jt=d' => 645, - 'jt=l' => 646, - 'jt=r' => 647, - 'jt=t' => 648, - 'jt=u' => 649, - 'kali' => 650, - 'kana' => 651, - 'kanaexta' => 652, - 'kanasup' => 653, - 'kanbun' => 654, - 'kangxi' => 655, - 'katakanaext' => 656, - 'khar' => 657, - 'khmersymbols' => 658, - 'khmr' => 659, - 'khoj' => 660, - 'kits' => 
661, - 'knda' => 662, - 'kthi' => 663, - 'l' => 664, - 'l_' => 96, - 'l_amp_' => 96, - 'lana' => 665, - 'lao' => 666, - 'latin1' => 667, - 'latinexta' => 668, - 'latinextadditional' => 669, - 'latinextb' => 670, - 'latinextc' => 671, - 'latinextd' => 672, - 'latinexte' => 673, - 'latn' => 674, - 'lb=ai' => 675, - 'lb=al' => 676, - 'lb=b2' => 677, - 'lb=ba' => 678, - 'lb=bb' => 679, - 'lb=bk' => 680, - 'lb=cb' => 681, - 'lb=cj' => 682, - 'lb=cl' => 683, - 'lb=cm' => 684, - 'lb=cp' => 685, - 'lb=cr' => 686, - 'lb=ex' => 687, - 'lb=gl' => 688, - 'lb=h2' => 689, - 'lb=h3' => 690, - 'lb=hl' => 691, - 'lb=hy' => 692, - 'lb=id' => 693, - 'lb=in' => 694, - 'lb=is' => 695, - 'lb=lf' => 696, - 'lb=nl' => 697, - 'lb=ns' => 698, - 'lb=nu' => 699, - 'lb=op' => 700, - 'lb=po' => 701, - 'lb=pr' => 702, - 'lb=qu' => 703, - 'lb=sa' => 704, - 'lb=sg_perl_aux' => 705, - 'lb=sp' => 706, - 'lb=sy' => 707, - 'lb=wj' => 708, - 'lb=xx' => 709, - 'lb=zw' => 710, - 'lb=zwj' => 711, - 'lc' => 96, - 'lepc' => 712, - 'letterlikesymbols' => 713, - 'limb' => 714, - 'lina' => 715, - 'linb' => 716, - 'linearbideograms' => 717, - 'linearbsyllabary' => 718, - 'lisu' => 719, - 'lisusup' => 720, - 'll' => 724, - 'lm' => 721, - 'lo' => 722, - 'loe' => 723, - 'lower' => 1167, - 'lowercase' => 1167, - 'lowercaseletter' => 724, - 'lowsurrogates' => 725, - 'lt' => 1124, - 'lu' => 1130, - 'lyci' => 726, - 'lydi' => 727, - 'm' => 728, - 'mahj' => 729, - 'mahjong' => 730, - 'maka' => 731, - 'mand' => 732, - 'mani' => 733, - 'marc' => 734, - 'math' => 735, - 'mathalphanum' => 736, - 'mathoperators' => 737, - 'mayannumerals' => 738, - 'mc' => 739, - 'me' => 740, - 'medf' => 741, - 'meeteimayekext' => 742, - 'mend' => 743, - 'merc' => 744, - 'mero' => 745, - 'miao' => 746, - 'miscarrows' => 747, - 'miscmathsymbolsa' => 748, - 'miscmathsymbolsb' => 749, - 'miscpictographs' => 750, - 'miscsymbols' => 751, - 'misctechnical' => 752, - 'mlym' => 753, - 'mn' => 754, - 'modi' => 755, - 'modifierletters' => 756, - 
'modifiertoneletters' => 757, - 'mong' => 758, - 'mongoliansup' => 759, - 'mro' => 760, - 'mtei' => 761, - 'mult' => 762, - 'music' => 763, - 'myanmarexta' => 764, - 'myanmarextb' => 765, - 'mymr' => 766, - 'n' => 767, - 'nand' => 768, - 'narb' => 769, - 'nb' => 770, - 'nbat' => 771, - 'nd' => 1165, - 'newa' => 772, - 'nfcqc=m' => 773, - 'nfcqc=y' => 774, - 'nfdqc=y' => 775, - 'nfkcqc=n' => 776, - 'nfkcqc=y' => 777, - 'nfkdqc=n' => 778, - 'nko' => 779, - 'nl' => 780, - 'no' => 781, - 'nshu' => 782, - 'nt=di' => 783, - 'nt=nu' => 784, - 'numberforms' => 785, - 'nv=0' => 786, - 'nv=1' => 787, - 'nv=1/10' => 812, - 'nv=1/12' => 813, - 'nv=1/16' => 814, - 'nv=1/160' => 815, - 'nv=1/2' => 816, - 'nv=1/20' => 817, - 'nv=1/3' => 818, - 'nv=1/32' => 819, - 'nv=1/320' => 820, - 'nv=1/4' => 821, - 'nv=1/40' => 822, - 'nv=1/5' => 823, - 'nv=1/6' => 824, - 'nv=1/64' => 825, - 'nv=1/7' => 826, - 'nv=1/8' => 827, - 'nv=1/80' => 828, - 'nv=1/9' => 829, - 'nv=10' => 788, - 'nv=100' => 789, - 'nv=1000' => 790, - 'nv=10000' => 791, - 'nv=100000' => 792, - 'nv=1000000' => 793, - 'nv=10000000' => 794, - 'nv=100000000' => 795, - 'nv=10000000000' => 796, - 'nv=1000000000000' => 797, - 'nv=11' => 798, - 'nv=11/12' => 799, - 'nv=11/2' => 800, - 'nv=12' => 801, - 'nv=13' => 802, - 'nv=13/2' => 803, - 'nv=14' => 804, - 'nv=15' => 805, - 'nv=15/2' => 806, - 'nv=16' => 807, - 'nv=17' => 808, - 'nv=17/2' => 809, - 'nv=18' => 810, - 'nv=19' => 811, - 'nv=2' => 830, - 'nv=2/3' => 847, - 'nv=2/5' => 848, - 'nv=20' => 831, - 'nv=200' => 832, - 'nv=2000' => 833, - 'nv=20000' => 834, - 'nv=200000' => 835, - 'nv=20000000' => 836, - 'nv=21' => 837, - 'nv=216000' => 838, - 'nv=22' => 839, - 'nv=23' => 840, - 'nv=24' => 841, - 'nv=25' => 842, - 'nv=26' => 843, - 'nv=27' => 844, - 'nv=28' => 845, - 'nv=29' => 846, - 'nv=3' => 849, - 'nv=3/16' => 864, - 'nv=3/2' => 865, - 'nv=3/20' => 866, - 'nv=3/4' => 867, - 'nv=3/5' => 868, - 'nv=3/64' => 869, - 'nv=3/8' => 870, - 'nv=3/80' => 871, - 'nv=30' => 850, - 
'nv=300' => 851, - 'nv=3000' => 852, - 'nv=30000' => 853, - 'nv=300000' => 854, - 'nv=31' => 855, - 'nv=32' => 856, - 'nv=33' => 857, - 'nv=34' => 858, - 'nv=35' => 859, - 'nv=36' => 860, - 'nv=37' => 861, - 'nv=38' => 862, - 'nv=39' => 863, - 'nv=4' => 872, - 'nv=4/5' => 888, - 'nv=40' => 873, - 'nv=400' => 874, - 'nv=4000' => 875, - 'nv=40000' => 876, - 'nv=400000' => 877, - 'nv=41' => 878, - 'nv=42' => 879, - 'nv=43' => 880, - 'nv=432000' => 881, - 'nv=44' => 882, - 'nv=45' => 883, - 'nv=46' => 884, - 'nv=47' => 885, - 'nv=48' => 886, - 'nv=49' => 887, - 'nv=5' => 889, - 'nv=5/12' => 895, - 'nv=5/2' => 896, - 'nv=5/6' => 897, - 'nv=5/8' => 898, - 'nv=50' => 890, - 'nv=500' => 891, - 'nv=5000' => 892, - 'nv=50000' => 893, - 'nv=500000' => 894, - 'nv=6' => 899, - 'nv=60' => 900, - 'nv=600' => 901, - 'nv=6000' => 902, - 'nv=60000' => 903, - 'nv=600000' => 904, - 'nv=7' => 905, - 'nv=7/12' => 911, - 'nv=7/2' => 912, - 'nv=7/8' => 913, - 'nv=70' => 906, - 'nv=700' => 907, - 'nv=7000' => 908, - 'nv=70000' => 909, - 'nv=700000' => 910, - 'nv=8' => 914, - 'nv=80' => 915, - 'nv=800' => 916, - 'nv=8000' => 917, - 'nv=80000' => 918, - 'nv=800000' => 919, - 'nv=9' => 920, - 'nv=9/2' => 926, - 'nv=90' => 921, - 'nv=900' => 922, - 'nv=9000' => 923, - 'nv=90000' => 924, - 'nv=900000' => 925, - 'nv=_minus_1/2' => 928, - 'nv=nan' => 927, - 'ocr' => 929, - 'ogam' => 930, - 'olck' => 931, - 'orkh' => 932, - 'ornamentaldingbats' => 933, - 'orya' => 934, - 'osge' => 935, - 'osma' => 936, - 'ottomansiyaqnumbers' => 937, - 'p' => 938, - 'palm' => 939, - 'patsyn' => 940, - 'pauc' => 941, - 'pc' => 942, - 'pcm' => 943, - 'pd' => 944, - 'pe' => 945, - 'perlspace' => 967, - 'perlword' => 969, - 'perm' => 946, - 'pf' => 947, - 'phag' => 948, - 'phaistos' => 949, - 'phli' => 950, - 'phlp' => 951, - 'phnx' => 952, - 'phoneticext' => 953, - 'phoneticextsup' => 954, - 'pi' => 955, - 'playingcards' => 956, - 'po' => 957, - 'posixalnum' => 958, - 'posixalpha' => 959, - 'posixblank' => 960, - 
'posixcntrl' => 961, - 'posixdigit' => 962, - 'posixgraph' => 963, - 'posixlower' => 964, - 'posixprint' => 965, - 'posixpunct' => 966, - 'posixspace' => 967, - 'posixupper' => 968, - 'posixword' => 969, - 'posixxdigit' => 970, - 'print' => 1168, - 'prti' => 971, - 'ps' => 972, - 'pua' => 973, - 'qaai' => 974, - 'qmark' => 975, - 'radical' => 976, - 'ri' => 977, - 'rjng' => 978, - 'rohg' => 979, - 'rumi' => 980, - 'runr' => 981, - 's' => 982, - 'samr' => 983, - 'sarb' => 984, - 'saur' => 985, - 'sb=at' => 986, - 'sb=cl' => 987, - 'sb=ex' => 988, - 'sb=fo' => 989, - 'sb=le' => 990, - 'sb=lo' => 991, - 'sb=nu' => 992, - 'sb=sc' => 993, - 'sb=se' => 994, - 'sb=sp' => 995, - 'sb=st' => 996, - 'sb=up' => 997, - 'sb=xx' => 998, - 'sc' => 999, - 'sc=adlm' => 1000, - 'sc=arab' => 1001, - 'sc=beng' => 1002, - 'sc=bopo' => 1003, - 'sc=bugi' => 1004, - 'sc=buhd' => 1005, - 'sc=cakm' => 1006, - 'sc=copt' => 1007, - 'sc=cprt' => 1008, - 'sc=cyrl' => 1009, - 'sc=deva' => 1010, - 'sc=dogr' => 1011, - 'sc=dupl' => 1012, - 'sc=geor' => 1013, - 'sc=glag' => 1014, - 'sc=gong' => 1015, - 'sc=gonm' => 1016, - 'sc=gran' => 1017, - 'sc=grek' => 1018, - 'sc=gujr' => 1019, - 'sc=guru' => 1020, - 'sc=han' => 1021, - 'sc=hang' => 1022, - 'sc=hano' => 1023, - 'sc=hira' => 1024, - 'sc=java' => 1025, - 'sc=kali' => 1026, - 'sc=kana' => 1027, - 'sc=khoj' => 1028, - 'sc=knda' => 1029, - 'sc=kthi' => 1030, - 'sc=latn' => 1031, - 'sc=limb' => 1032, - 'sc=lina' => 1033, - 'sc=linb' => 1034, - 'sc=mahj' => 1035, - 'sc=mand' => 1036, - 'sc=mani' => 1037, - 'sc=mlym' => 1038, - 'sc=modi' => 1039, - 'sc=mong' => 1040, - 'sc=mult' => 1041, - 'sc=mymr' => 1042, - 'sc=nand' => 1043, - 'sc=orya' => 1044, - 'sc=perm' => 1045, - 'sc=phag' => 1046, - 'sc=phlp' => 1047, - 'sc=qaai' => 1048, - 'sc=rohg' => 1049, - 'sc=shrd' => 1050, - 'sc=sind' => 1051, - 'sc=sinh' => 1052, - 'sc=sogd' => 1053, - 'sc=sylo' => 1054, - 'sc=syrc' => 1055, - 'sc=tagb' => 1056, - 'sc=takr' => 1057, - 'sc=tale' => 1058, - 'sc=taml' => 
1059, - 'sc=telu' => 1060, - 'sc=tglg' => 1061, - 'sc=thaa' => 1062, - 'sc=tirh' => 1063, - 'sc=yezi' => 1064, - 'sc=yi' => 1065, - 'sc=zyyy' => 1066, - 'sd' => 1067, - 'sgnw' => 1068, - 'shaw' => 1069, - 'shorthandformatcontrols' => 1070, - 'shrd' => 1071, - 'sidd' => 1072, - 'sind' => 1073, - 'sinh' => 1074, - 'sinhalaarchaicnumbers' => 1075, - 'sk' => 1076, - 'sm' => 1077, - 'smallforms' => 1078, - 'smallkanaext' => 1079, - 'so' => 1080, - 'sogd' => 1081, - 'sogo' => 1082, - 'sora' => 1083, - 'soyo' => 1084, - 'space' => 1170, - 'spaceperl' => 1170, - 'specials' => 1085, - 'sterm' => 1086, - 'sund' => 1087, - 'sundanesesup' => 1088, - 'suparrowsa' => 1089, - 'suparrowsb' => 1090, - 'suparrowsc' => 1091, - 'superandsub' => 1092, - 'supmathoperators' => 1093, - 'suppuaa' => 1094, - 'suppuab' => 1095, - 'suppunctuation' => 1096, - 'supsymbolsandpictographs' => 1097, - 'suttonsignwriting' => 1098, - 'sylo' => 1099, - 'symbolsandpictographsexta' => 1100, - 'symbolsforlegacycomputing' => 1101, - 'syrc' => 1102, - 'syriacsup' => 1103, - 'tagb' => 1104, - 'tags' => 1105, - 'taixuanjing' => 1106, - 'takr' => 1107, - 'tale' => 1108, - 'talu' => 1109, - 'tamilsup' => 1110, - 'taml' => 1111, - 'tang' => 1112, - 'tangutcomponents' => 1113, - 'tangutsup' => 1114, - 'tavt' => 1115, - 'telu' => 1116, - 'term' => 1117, - 'tfng' => 1118, - 'tglg' => 1119, - 'thaa' => 1120, - 'thai' => 1121, - 'tibt' => 1122, - 'tirh' => 1123, - 'title' => 1124, - 'titlecase' => 1124, - 'titlecaseletter' => 1124, - 'transportandmap' => 1125, - 'ucas' => 1126, - 'ucasext' => 1127, - 'ugar' => 1128, - 'uideo' => 1129, - 'upper' => 1171, - 'uppercase' => 1171, - 'uppercaseletter' => 1130, - 'vai' => 1131, - 'vedicext' => 1132, - 'verticalforms' => 1133, - 'vertspace' => 1134, - 'vo=r' => 1135, - 'vo=tr' => 1136, - 'vo=tu' => 1137, - 'vo=u' => 1138, - 'vs' => 1139, - 'vssup' => 1140, - 'wara' => 1141, - 'wb=dq' => 1142, - 'wb=eb' => 1143, - 'wb=ex' => 1144, - 'wb=extend' => 1145, - 'wb=fo' => 1146, - 
'wb=ka' => 1147, - 'wb=le' => 1148, - 'wb=mb' => 1149, - 'wb=ml' => 1150, - 'wb=mn' => 1151, - 'wb=nl' => 1152, - 'wb=nu' => 1153, - 'wb=sq' => 1154, - 'wb=wsegspace' => 1155, - 'wb=xx' => 1156, - 'wcho' => 1157, - 'whitespace' => 1170, - 'word' => 1172, - 'wspace' => 1170, - 'xdigit' => 1173, - 'xidc' => 1158, - 'xids' => 1159, - 'xpeo' => 1160, - 'xperlspace' => 1170, - 'xposixalnum' => 1161, - 'xposixalpha' => 1162, - 'xposixblank' => 1163, - 'xposixcntrl' => 1164, - 'xposixdigit' => 1165, - 'xposixgraph' => 1166, - 'xposixlower' => 1167, - 'xposixprint' => 1168, - 'xposixpunct' => 1169, - 'xposixspace' => 1170, - 'xposixupper' => 1171, - 'xposixword' => 1172, - 'xposixxdigit' => 1173, - 'xsux' => 1174, - 'yezi' => 1175, - 'yi' => 1176, - 'yijing' => 1177, - 'yiradicals' => 1178, - 'yisyllables' => 1179, - 'z' => 1180, - 'zanb' => 1181, - 'zl' => 1182, - 'zp' => 1183, - 'zs' => 1184, - 'zyyy' => 1185, - 'zzzz' => 1186, + 'age=14' => 8, + 'age=2' => 9, + 'age=2.1' => 10, + 'age=3' => 11, + 'age=3.1' => 12, + 'age=3.2' => 13, + 'age=4' => 14, + 'age=4.1' => 15, + 'age=5' => 16, + 'age=5.1' => 17, + 'age=5.2' => 18, + 'age=6' => 19, + 'age=6.1' => 20, + 'age=6.2' => 21, + 'age=6.3' => 22, + 'age=7' => 23, + 'age=8' => 24, + 'age=9' => 25, + 'age=na' => 26, + 'aghb' => 27, + 'ahex' => 986, + 'ahom' => 28, + 'alchemical' => 29, + 'all' => 30, + 'alnum' => 1184, + 'alpha' => 1185, + 'alphabetic' => 1185, + 'alphabeticpf' => 31, + 'ancientgreekmusic' => 32, + 'ancientgreeknumbers' => 33, + 'ancientsymbols' => 34, + 'any' => 35, + 'arab' => 36, + 'arabicexta' => 37, + 'arabicextb' => 38, + 'arabicmath' => 39, + 'arabicpfa' => 40, + 'arabicpfb' => 41, + 'arabicsup' => 42, + 'armi' => 43, + 'armn' => 44, + 'arrows' => 45, + 'ascii' => 46, + 'asciihexdigit' => 986, + 'assigned' => 47, + 'avst' => 48, + 'bali' => 49, + 'bamu' => 50, + 'bamumsup' => 51, + 'basiclatin' => 46, + 'bass' => 52, + 'batk' => 53, + 'bc=al' => 54, + 'bc=an' => 55, + 'bc=b' => 56, + 'bc=bn' => 57, + 
'bc=cs' => 58, + 'bc=en' => 59, + 'bc=es' => 60, + 'bc=et' => 61, + 'bc=fsi' => 62, + 'bc=l' => 63, + 'bc=lre' => 64, + 'bc=lri' => 65, + 'bc=lro' => 66, + 'bc=nsm' => 67, + 'bc=on' => 68, + 'bc=pdf' => 69, + 'bc=pdi' => 70, + 'bc=r' => 71, + 'bc=rle' => 72, + 'bc=rli' => 73, + 'bc=rlo' => 74, + 'bc=s' => 75, + 'bc=ws' => 76, + 'beng' => 77, + 'bhks' => 78, + 'bidic' => 79, + 'bidim' => 80, + 'blank' => 1186, + 'blockelements' => 81, + 'bopo' => 82, + 'bopomofoext' => 83, + 'boxdrawing' => 84, + 'bpt=c' => 85, + 'bpt=n' => 86, + 'bpt=o' => 87, + 'brah' => 88, + 'brai' => 89, + 'bugi' => 90, + 'buhd' => 91, + 'byzantinemusic' => 92, + 'c' => 93, + 'cakm' => 94, + 'cans' => 95, + 'cari' => 96, + 'cased' => 97, + 'casedletter' => 98, + 'cc' => 1187, + 'ccc=0' => 99, + 'ccc=1' => 100, + 'ccc=10' => 101, + 'ccc=103' => 102, + 'ccc=107' => 103, + 'ccc=11' => 104, + 'ccc=118' => 105, + 'ccc=12' => 106, + 'ccc=122' => 107, + 'ccc=129' => 108, + 'ccc=13' => 109, + 'ccc=130' => 110, + 'ccc=132' => 111, + 'ccc=14' => 112, + 'ccc=15' => 113, + 'ccc=16' => 114, + 'ccc=17' => 115, + 'ccc=18' => 116, + 'ccc=19' => 117, + 'ccc=20' => 118, + 'ccc=202' => 119, + 'ccc=21' => 120, + 'ccc=214' => 121, + 'ccc=216' => 122, + 'ccc=22' => 123, + 'ccc=23' => 124, + 'ccc=24' => 125, + 'ccc=25' => 126, + 'ccc=26' => 127, + 'ccc=27' => 128, + 'ccc=28' => 129, + 'ccc=29' => 130, + 'ccc=30' => 131, + 'ccc=31' => 132, + 'ccc=32' => 133, + 'ccc=33' => 134, + 'ccc=34' => 135, + 'ccc=35' => 136, + 'ccc=36' => 137, + 'ccc=6' => 138, + 'ccc=7' => 139, + 'ccc=8' => 140, + 'ccc=84' => 141, + 'ccc=9' => 142, + 'ccc=91' => 143, + 'ccc=a' => 144, + 'ccc=al' => 145, + 'ccc=ar' => 146, + 'ccc=b' => 147, + 'ccc=bl' => 148, + 'ccc=br' => 149, + 'ccc=da' => 150, + 'ccc=db' => 151, + 'ccc=is' => 152, + 'ccc=l' => 153, + 'ccc=r' => 154, + 'ce' => 155, + 'cf' => 156, + 'cham' => 157, + 'cher' => 158, + 'cherokeesup' => 159, + 'chesssymbols' => 160, + 'chrs' => 161, + 'ci' => 162, + 'cjk' => 163, + 'cjkcompat' => 
164, + 'cjkcompatforms' => 165, + 'cjkcompatideographs' => 166, + 'cjkcompatideographssup' => 167, + 'cjkexta' => 168, + 'cjkextb' => 169, + 'cjkextc' => 170, + 'cjkextd' => 171, + 'cjkexte' => 172, + 'cjkextf' => 173, + 'cjkextg' => 174, + 'cjkradicalssup' => 175, + 'cjkstrokes' => 176, + 'cjksymbols' => 177, + 'cn' => 178, + 'cntrl' => 1187, + 'co' => 179, + 'compatjamo' => 180, + 'compex' => 181, + 'control' => 1187, + 'controlpictures' => 182, + 'copt' => 183, + 'copticepactnumbers' => 184, + 'countingrod' => 185, + 'cpmn' => 186, + 'cprt' => 187, + 'cuneiformnumbers' => 188, + 'currencysymbols' => 189, + 'cwcf' => 190, + 'cwcm' => 191, + 'cwkcf' => 192, + 'cwl' => 193, + 'cwt' => 194, + 'cwu' => 195, + 'cypriotsyllabary' => 196, + 'cyrillicexta' => 197, + 'cyrillicextb' => 198, + 'cyrillicextc' => 199, + 'cyrillicsup' => 200, + 'cyrl' => 201, + 'dash' => 202, + 'decimalnumber' => 1188, + 'dep' => 203, + 'deva' => 204, + 'devanagariext' => 205, + 'di' => 206, + 'dia' => 207, + 'diacriticals' => 208, + 'diacriticalsext' => 209, + 'diacriticalsforsymbols' => 210, + 'diacriticalssup' => 211, + 'diak' => 212, + 'digit' => 1188, + 'dingbats' => 213, + 'dogr' => 214, + 'domino' => 215, + 'dsrt' => 216, + 'dt=can' => 217, + 'dt=com' => 218, + 'dt=enc' => 219, + 'dt=fin' => 220, + 'dt=font' => 221, + 'dt=fra' => 222, + 'dt=init' => 223, + 'dt=iso' => 224, + 'dt=med' => 225, + 'dt=nar' => 226, + 'dt=nb' => 227, + 'dt=noncanon' => 228, + 'dt=none' => 229, + 'dt=sml' => 230, + 'dt=sqr' => 231, + 'dt=sub' => 232, + 'dt=sup' => 233, + 'dt=vert' => 234, + 'dupl' => 235, + 'ea=a' => 237, + 'ea=f' => 238, + 'ea=h' => 239, + 'ea=n' => 240, + 'ea=na' => 241, + 'ea=w' => 242, + 'earlydynasticcuneiform' => 236, + 'ebase' => 243, + 'ecomp' => 244, + 'egyp' => 245, + 'egyptianhieroglyphformatcontrols' => 246, + 'elba' => 247, + 'elym' => 248, + 'emod' => 249, + 'emoji' => 250, + 'emoticons' => 251, + 'enclosedalphanum' => 252, + 'enclosedalphanumsup' => 253, + 'enclosedcjk' => 254, 
+ 'enclosedideographicsup' => 255, + 'epres' => 256, + 'ethi' => 257, + 'ethiopicext' => 258, + 'ethiopicexta' => 259, + 'ethiopicextb' => 260, + 'ethiopicsup' => 261, + 'ext' => 262, + 'extpict' => 263, + 'gcb=cn' => 264, + 'gcb=ex' => 265, + 'gcb=l' => 266, + 'gcb=pp' => 267, + 'gcb=sm' => 268, + 'gcb=t' => 269, + 'gcb=v' => 270, + 'gcb=xx' => 271, + 'geometricshapes' => 272, + 'geometricshapesext' => 273, + 'geor' => 274, + 'georgianext' => 275, + 'georgiansup' => 276, + 'glag' => 277, + 'glagoliticsup' => 278, + 'gong' => 279, + 'gonm' => 280, + 'goth' => 281, + 'gran' => 282, + 'graph' => 1189, + 'grbase' => 283, + 'greekext' => 284, + 'grek' => 285, + 'grext' => 286, + 'gujr' => 287, + 'guru' => 288, + 'halfandfullforms' => 289, + 'halfmarks' => 290, + 'han' => 291, + 'hang' => 292, + 'hano' => 293, + 'hatr' => 294, + 'hebr' => 295, + 'hex' => 1196, + 'hexdigit' => 1196, + 'highpusurrogates' => 296, + 'highsurrogates' => 297, + 'hira' => 298, + 'hluw' => 299, + 'hmng' => 300, + 'hmnp' => 301, + 'horizspace' => 1186, + 'hst=na' => 302, + 'hung' => 303, + 'hyphen_perl_aux' => 304, + 'idc' => 305, + 'identifierstatus=allowed' => 306, + 'identifierstatus=restricted' => 307, + 'identifiertype=defaultignorable' => 308, + 'identifiertype=exclusion' => 309, + 'identifiertype=inclusion' => 310, + 'identifiertype=limiteduse' => 311, + 'identifiertype=notcharacter' => 312, + 'identifiertype=notnfkc' => 313, + 'identifiertype=notxid' => 314, + 'identifiertype=obsolete' => 315, + 'identifiertype=recommended' => 316, + 'identifiertype=technical' => 317, + 'identifiertype=uncommonuse' => 318, + 'ideo' => 319, + 'ideographicsymbols' => 320, + 'ids' => 321, + 'idsb' => 322, + 'idst' => 323, + 'in=1.1' => 527, + 'in=10' => 521, + 'in=11' => 522, + 'in=12' => 523, + 'in=12.1' => 524, + 'in=13' => 525, + 'in=14' => 526, + 'in=2' => 528, + 'in=2.1' => 529, + 'in=3' => 530, + 'in=3.1' => 531, + 'in=3.2' => 532, + 'in=4' => 533, + 'in=4.1' => 534, + 'in=5' => 535, + 'in=5.1' => 
536, + 'in=5.2' => 537, + 'in=6' => 538, + 'in=6.1' => 539, + 'in=6.2' => 540, + 'in=6.3' => 541, + 'in=7' => 542, + 'in=8' => 543, + 'in=9' => 544, + 'inadlam' => 324, + 'inahom' => 325, + 'inanatolianhieroglyphs' => 326, + 'inarabic' => 327, + 'inarmenian' => 328, + 'inavestan' => 329, + 'inbalinese' => 330, + 'inbamum' => 331, + 'inbassavah' => 332, + 'inbatak' => 333, + 'inbengali' => 334, + 'inbhaiksuki' => 335, + 'inbopomofo' => 336, + 'inbrahmi' => 337, + 'inbuginese' => 338, + 'inbuhid' => 339, + 'incarian' => 340, + 'incaucasianalbanian' => 341, + 'inchakma' => 342, + 'incham' => 343, + 'incherokee' => 344, + 'inchorasmian' => 345, + 'incoptic' => 346, + 'incuneiform' => 347, + 'incyprominoan' => 348, + 'incyrillic' => 349, + 'indevanagari' => 350, + 'indicnumberforms' => 351, + 'indicsiyaqnumbers' => 352, + 'indivesakuru' => 353, + 'indogra' => 354, + 'induployan' => 355, + 'inegyptianhieroglyphs' => 356, + 'inelbasan' => 357, + 'inelymaic' => 358, + 'inethiopic' => 359, + 'ingeorgian' => 360, + 'inglagolitic' => 361, + 'ingothic' => 362, + 'ingrantha' => 363, + 'ingreek' => 364, + 'ingujarati' => 365, + 'ingunjalagondi' => 366, + 'ingurmukhi' => 367, + 'inhangul' => 368, + 'inhanifirohingya' => 369, + 'inhanunoo' => 370, + 'inhatran' => 371, + 'inhebrew' => 372, + 'inhiragana' => 373, + 'inidc' => 374, + 'inimperialaramaic' => 375, + 'ininscriptionalpahlavi' => 376, + 'ininscriptionalparthian' => 377, + 'injavanese' => 378, + 'inkaithi' => 379, + 'inkannada' => 380, + 'inkatakana' => 381, + 'inkharoshthi' => 382, + 'inkhitansmallscript' => 383, + 'inkhmer' => 384, + 'inkhojki' => 385, + 'inkhudawadi' => 386, + 'inlao' => 387, + 'inlepcha' => 388, + 'inlimbu' => 389, + 'inlineara' => 390, + 'inlisu' => 391, + 'inlycian' => 392, + 'inlydian' => 393, + 'inmahajani' => 394, + 'inmakasar' => 395, + 'inmalayalam' => 396, + 'inmandaic' => 397, + 'inmanichaean' => 398, + 'inmarchen' => 399, + 'inmasaramgondi' => 400, + 'inmedefaidrin' => 401, + 'inmeeteimayek' 
=> 402, + 'inmendekikakui' => 403, + 'inmeroiticcursive' => 404, + 'inmiao' => 405, + 'inmodi' => 406, + 'inmongolian' => 407, + 'inmro' => 408, + 'inmultani' => 409, + 'inmyanmar' => 410, + 'innabataean' => 411, + 'innandinagari' => 412, + 'innewa' => 413, + 'innewtailue' => 414, + 'innko' => 415, + 'innushu' => 416, + 'innyiakengpuachuehmong' => 417, + 'inogham' => 418, + 'inoldhungarian' => 419, + 'inolditalic' => 420, + 'inoldpermic' => 421, + 'inoldpersian' => 422, + 'inoldsogdian' => 423, + 'inoldturkic' => 424, + 'inolduyghur' => 425, + 'inoriya' => 426, + 'inosage' => 427, + 'inosmanya' => 428, + 'inpahawhhmong' => 429, + 'inpaucinhau' => 430, + 'inpc=bottom' => 431, + 'inpc=bottomandleft' => 432, + 'inpc=bottomandright' => 433, + 'inpc=left' => 434, + 'inpc=leftandright' => 435, + 'inpc=na' => 436, + 'inpc=overstruck' => 437, + 'inpc=right' => 438, + 'inpc=top' => 439, + 'inpc=topandbottom' => 440, + 'inpc=topandbottomandleft' => 441, + 'inpc=topandbottomandright' => 442, + 'inpc=topandleft' => 443, + 'inpc=topandleftandright' => 444, + 'inpc=topandright' => 445, + 'inphagspa' => 446, + 'inphoenician' => 447, + 'inpsalterpahlavi' => 448, + 'inpunctuation' => 449, + 'inrejang' => 450, + 'inrunic' => 451, + 'insamaritan' => 452, + 'insaurashtra' => 453, + 'insc=avagraha' => 454, + 'insc=bindu' => 455, + 'insc=brahmijoiningnumber' => 456, + 'insc=cantillationmark' => 457, + 'insc=consonant' => 458, + 'insc=consonantdead' => 459, + 'insc=consonantfinal' => 460, + 'insc=consonantheadletter' => 461, + 'insc=consonantinitialpostfixed' => 462, + 'insc=consonantkiller' => 463, + 'insc=consonantmedial' => 464, + 'insc=consonantplaceholder' => 465, + 'insc=consonantprecedingrepha' => 466, + 'insc=consonantprefixed' => 467, + 'insc=consonantsubjoined' => 468, + 'insc=consonantsucceedingrepha' => 469, + 'insc=consonantwithstacker' => 470, + 'insc=geminationmark' => 471, + 'insc=invisiblestacker' => 472, + 'insc=modifyingletter' => 473, + 'insc=nonjoiner' => 474, + 
'insc=nukta' => 475, + 'insc=number' => 476, + 'insc=numberjoiner' => 477, + 'insc=other' => 478, + 'insc=purekiller' => 479, + 'insc=registershifter' => 480, + 'insc=syllablemodifier' => 481, + 'insc=toneletter' => 482, + 'insc=tonemark' => 483, + 'insc=virama' => 484, + 'insc=visarga' => 485, + 'insc=vowel' => 486, + 'insc=voweldependent' => 487, + 'insc=vowelindependent' => 488, + 'insiddham' => 489, + 'insinhala' => 490, + 'insogdian' => 491, + 'insorasompeng' => 492, + 'insoyombo' => 493, + 'insundanese' => 494, + 'insylotinagri' => 495, + 'insyriac' => 496, + 'intagalog' => 497, + 'intagbanwa' => 498, + 'intaile' => 499, + 'intaitham' => 500, + 'intaiviet' => 501, + 'intakri' => 502, + 'intamil' => 503, + 'intangsa' => 504, + 'intangut' => 505, + 'intelugu' => 506, + 'inthaana' => 507, + 'inthai' => 508, + 'intibetan' => 509, + 'intifinagh' => 510, + 'intirhuta' => 511, + 'intoto' => 512, + 'inugaritic' => 513, + 'invai' => 514, + 'invithkuqi' => 515, + 'invs' => 516, + 'inwancho' => 517, + 'inwarangciti' => 518, + 'inyezidi' => 519, + 'inzanabazarsquare' => 520, + 'ipaext' => 545, + 'ital' => 546, + 'jamo' => 547, + 'jamoexta' => 548, + 'jamoextb' => 549, + 'java' => 550, + 'jg=africanfeh' => 551, + 'jg=africannoon' => 552, + 'jg=africanqaf' => 553, + 'jg=ain' => 554, + 'jg=alaph' => 555, + 'jg=alef' => 556, + 'jg=beh' => 557, + 'jg=beth' => 558, + 'jg=burushaskiyehbarree' => 559, + 'jg=dal' => 560, + 'jg=dalathrish' => 561, + 'jg=e' => 562, + 'jg=farsiyeh' => 563, + 'jg=fe' => 564, + 'jg=feh' => 565, + 'jg=finalsemkath' => 566, + 'jg=gaf' => 567, + 'jg=gamal' => 568, + 'jg=hah' => 569, + 'jg=hamzaonhehgoal' => 570, + 'jg=hanifirohingyakinnaya' => 571, + 'jg=hanifirohingyapa' => 572, + 'jg=he' => 573, + 'jg=heh' => 574, + 'jg=hehgoal' => 575, + 'jg=heth' => 576, + 'jg=kaf' => 577, + 'jg=kaph' => 578, + 'jg=khaph' => 579, + 'jg=knottedheh' => 580, + 'jg=lam' => 581, + 'jg=lamadh' => 582, + 'jg=malayalambha' => 583, + 'jg=malayalamja' => 584, + 
'jg=malayalamlla' => 585, + 'jg=malayalamllla' => 586, + 'jg=malayalamnga' => 587, + 'jg=malayalamnna' => 588, + 'jg=malayalamnnna' => 589, + 'jg=malayalamnya' => 590, + 'jg=malayalamra' => 591, + 'jg=malayalamssa' => 592, + 'jg=malayalamtta' => 593, + 'jg=manichaeanaleph' => 594, + 'jg=manichaeanayin' => 595, + 'jg=manichaeanbeth' => 596, + 'jg=manichaeandaleth' => 597, + 'jg=manichaeandhamedh' => 598, + 'jg=manichaeanfive' => 599, + 'jg=manichaeangimel' => 600, + 'jg=manichaeanheth' => 601, + 'jg=manichaeanhundred' => 602, + 'jg=manichaeankaph' => 603, + 'jg=manichaeanlamedh' => 604, + 'jg=manichaeanmem' => 605, + 'jg=manichaeannun' => 606, + 'jg=manichaeanone' => 607, + 'jg=manichaeanpe' => 608, + 'jg=manichaeanqoph' => 609, + 'jg=manichaeanresh' => 610, + 'jg=manichaeansadhe' => 611, + 'jg=manichaeansamekh' => 612, + 'jg=manichaeantaw' => 613, + 'jg=manichaeanten' => 614, + 'jg=manichaeanteth' => 615, + 'jg=manichaeanthamedh' => 616, + 'jg=manichaeantwenty' => 617, + 'jg=manichaeanwaw' => 618, + 'jg=manichaeanyodh' => 619, + 'jg=manichaeanzayin' => 620, + 'jg=meem' => 621, + 'jg=mim' => 622, + 'jg=nojoininggroup' => 623, + 'jg=noon' => 624, + 'jg=nun' => 625, + 'jg=nya' => 626, + 'jg=pe' => 627, + 'jg=qaf' => 628, + 'jg=qaph' => 629, + 'jg=reh' => 630, + 'jg=reversedpe' => 631, + 'jg=rohingyayeh' => 632, + 'jg=sad' => 633, + 'jg=sadhe' => 634, + 'jg=seen' => 635, + 'jg=semkath' => 636, + 'jg=shin' => 637, + 'jg=straightwaw' => 638, + 'jg=swashkaf' => 639, + 'jg=syriacwaw' => 640, + 'jg=tah' => 641, + 'jg=taw' => 642, + 'jg=tehmarbuta' => 643, + 'jg=teth' => 644, + 'jg=thinyeh' => 645, + 'jg=verticaltail' => 646, + 'jg=waw' => 647, + 'jg=yeh' => 648, + 'jg=yehbarree' => 649, + 'jg=yehwithtail' => 650, + 'jg=yudh' => 651, + 'jg=yudhhe' => 652, + 'jg=zain' => 653, + 'jg=zhain' => 654, + 'joinc' => 655, + 'jt=c' => 656, + 'jt=d' => 657, + 'jt=l' => 658, + 'jt=r' => 659, + 'jt=t' => 660, + 'jt=u' => 661, + 'kali' => 662, + 'kana' => 663, + 'kanaexta' => 664, + 
'kanaextb' => 665, + 'kanasup' => 666, + 'kanbun' => 667, + 'kangxi' => 668, + 'katakanaext' => 669, + 'khar' => 670, + 'khmersymbols' => 671, + 'khmr' => 672, + 'khoj' => 673, + 'kits' => 674, + 'knda' => 675, + 'kthi' => 676, + 'l' => 677, + 'l_' => 98, + 'l_amp_' => 98, + 'lana' => 678, + 'lao' => 679, + 'latin1' => 680, + 'latinexta' => 681, + 'latinextadditional' => 682, + 'latinextb' => 683, + 'latinextc' => 684, + 'latinextd' => 685, + 'latinexte' => 686, + 'latinextf' => 687, + 'latinextg' => 688, + 'latn' => 689, + 'lb=ai' => 690, + 'lb=al' => 691, + 'lb=b2' => 692, + 'lb=ba' => 693, + 'lb=bb' => 694, + 'lb=bk' => 695, + 'lb=cb' => 696, + 'lb=cj' => 697, + 'lb=cl' => 698, + 'lb=cm' => 699, + 'lb=cp' => 700, + 'lb=cr' => 701, + 'lb=ex' => 702, + 'lb=gl' => 703, + 'lb=h2' => 704, + 'lb=h3' => 705, + 'lb=hl' => 706, + 'lb=hy' => 707, + 'lb=id' => 708, + 'lb=in' => 709, + 'lb=is' => 710, + 'lb=lf' => 711, + 'lb=nl' => 712, + 'lb=ns' => 713, + 'lb=nu' => 714, + 'lb=op' => 715, + 'lb=po' => 716, + 'lb=pr' => 717, + 'lb=qu' => 718, + 'lb=sa' => 719, + 'lb=sg_perl_aux' => 720, + 'lb=sp' => 721, + 'lb=sy' => 722, + 'lb=wj' => 723, + 'lb=xx' => 724, + 'lb=zw' => 725, + 'lb=zwj' => 726, + 'lc' => 98, + 'lepc' => 727, + 'letterlikesymbols' => 728, + 'limb' => 729, + 'lina' => 730, + 'linb' => 731, + 'linearbideograms' => 732, + 'linearbsyllabary' => 733, + 'lisu' => 734, + 'lisusup' => 735, + 'll' => 739, + 'lm' => 736, + 'lo' => 737, + 'loe' => 738, + 'lower' => 1190, + 'lowercase' => 1190, + 'lowercaseletter' => 739, + 'lowsurrogates' => 740, + 'lt' => 1143, + 'lu' => 1152, + 'lyci' => 741, + 'lydi' => 742, + 'm' => 743, + 'mahj' => 744, + 'mahjong' => 745, + 'maka' => 746, + 'mand' => 747, + 'mani' => 748, + 'marc' => 749, + 'math' => 750, + 'mathalphanum' => 751, + 'mathoperators' => 752, + 'mayannumerals' => 753, + 'mc' => 754, + 'me' => 755, + 'medf' => 756, + 'meeteimayekext' => 757, + 'mend' => 758, + 'merc' => 759, + 'mero' => 760, + 'miao' => 761, + 
'miscarrows' => 762, + 'miscmathsymbolsa' => 763, + 'miscmathsymbolsb' => 764, + 'miscpictographs' => 765, + 'miscsymbols' => 766, + 'misctechnical' => 767, + 'mlym' => 768, + 'mn' => 769, + 'modi' => 770, + 'modifierletters' => 771, + 'modifiertoneletters' => 772, + 'mong' => 773, + 'mongoliansup' => 774, + 'mro' => 775, + 'mtei' => 776, + 'mult' => 777, + 'music' => 778, + 'myanmarexta' => 779, + 'myanmarextb' => 780, + 'mymr' => 781, + 'n' => 782, + 'nand' => 783, + 'narb' => 784, + 'nb' => 785, + 'nbat' => 786, + 'nd' => 1188, + 'newa' => 787, + 'nfcqc=m' => 788, + 'nfcqc=y' => 789, + 'nfdqc=y' => 790, + 'nfkcqc=n' => 791, + 'nfkcqc=y' => 792, + 'nfkdqc=n' => 793, + 'nko' => 794, + 'nl' => 795, + 'no' => 796, + 'nshu' => 797, + 'nt=di' => 798, + 'nt=nu' => 799, + 'numberforms' => 800, + 'nv=0' => 801, + 'nv=1' => 802, + 'nv=1/10' => 827, + 'nv=1/12' => 828, + 'nv=1/16' => 829, + 'nv=1/160' => 830, + 'nv=1/2' => 831, + 'nv=1/20' => 832, + 'nv=1/3' => 833, + 'nv=1/32' => 834, + 'nv=1/320' => 835, + 'nv=1/4' => 836, + 'nv=1/40' => 837, + 'nv=1/5' => 838, + 'nv=1/6' => 839, + 'nv=1/64' => 840, + 'nv=1/7' => 841, + 'nv=1/8' => 842, + 'nv=1/80' => 843, + 'nv=1/9' => 844, + 'nv=10' => 803, + 'nv=100' => 804, + 'nv=1000' => 805, + 'nv=10000' => 806, + 'nv=100000' => 807, + 'nv=1000000' => 808, + 'nv=10000000' => 809, + 'nv=100000000' => 810, + 'nv=10000000000' => 811, + 'nv=1000000000000' => 812, + 'nv=11' => 813, + 'nv=11/12' => 814, + 'nv=11/2' => 815, + 'nv=12' => 816, + 'nv=13' => 817, + 'nv=13/2' => 818, + 'nv=14' => 819, + 'nv=15' => 820, + 'nv=15/2' => 821, + 'nv=16' => 822, + 'nv=17' => 823, + 'nv=17/2' => 824, + 'nv=18' => 825, + 'nv=19' => 826, + 'nv=2' => 845, + 'nv=2/3' => 862, + 'nv=2/5' => 863, + 'nv=20' => 846, + 'nv=200' => 847, + 'nv=2000' => 848, + 'nv=20000' => 849, + 'nv=200000' => 850, + 'nv=20000000' => 851, + 'nv=21' => 852, + 'nv=216000' => 853, + 'nv=22' => 854, + 'nv=23' => 855, + 'nv=24' => 856, + 'nv=25' => 857, + 'nv=26' => 858, + 'nv=27' 
=> 859, + 'nv=28' => 860, + 'nv=29' => 861, + 'nv=3' => 864, + 'nv=3/16' => 879, + 'nv=3/2' => 880, + 'nv=3/20' => 881, + 'nv=3/4' => 882, + 'nv=3/5' => 883, + 'nv=3/64' => 884, + 'nv=3/8' => 885, + 'nv=3/80' => 886, + 'nv=30' => 865, + 'nv=300' => 866, + 'nv=3000' => 867, + 'nv=30000' => 868, + 'nv=300000' => 869, + 'nv=31' => 870, + 'nv=32' => 871, + 'nv=33' => 872, + 'nv=34' => 873, + 'nv=35' => 874, + 'nv=36' => 875, + 'nv=37' => 876, + 'nv=38' => 877, + 'nv=39' => 878, + 'nv=4' => 887, + 'nv=4/5' => 903, + 'nv=40' => 888, + 'nv=400' => 889, + 'nv=4000' => 890, + 'nv=40000' => 891, + 'nv=400000' => 892, + 'nv=41' => 893, + 'nv=42' => 894, + 'nv=43' => 895, + 'nv=432000' => 896, + 'nv=44' => 897, + 'nv=45' => 898, + 'nv=46' => 899, + 'nv=47' => 900, + 'nv=48' => 901, + 'nv=49' => 902, + 'nv=5' => 904, + 'nv=5/12' => 910, + 'nv=5/2' => 911, + 'nv=5/6' => 912, + 'nv=5/8' => 913, + 'nv=50' => 905, + 'nv=500' => 906, + 'nv=5000' => 907, + 'nv=50000' => 908, + 'nv=500000' => 909, + 'nv=6' => 914, + 'nv=60' => 915, + 'nv=600' => 916, + 'nv=6000' => 917, + 'nv=60000' => 918, + 'nv=600000' => 919, + 'nv=7' => 920, + 'nv=7/12' => 926, + 'nv=7/2' => 927, + 'nv=7/8' => 928, + 'nv=70' => 921, + 'nv=700' => 922, + 'nv=7000' => 923, + 'nv=70000' => 924, + 'nv=700000' => 925, + 'nv=8' => 929, + 'nv=80' => 930, + 'nv=800' => 931, + 'nv=8000' => 932, + 'nv=80000' => 933, + 'nv=800000' => 934, + 'nv=9' => 935, + 'nv=9/2' => 941, + 'nv=90' => 936, + 'nv=900' => 937, + 'nv=9000' => 938, + 'nv=90000' => 939, + 'nv=900000' => 940, + 'nv=_minus_1/2' => 943, + 'nv=nan' => 942, + 'ocr' => 944, + 'ogam' => 945, + 'olck' => 946, + 'orkh' => 947, + 'ornamentaldingbats' => 948, + 'orya' => 949, + 'osge' => 950, + 'osma' => 951, + 'ottomansiyaqnumbers' => 952, + 'ougr' => 953, + 'p' => 954, + 'palm' => 955, + 'patsyn' => 956, + 'pauc' => 957, + 'pc' => 958, + 'pcm' => 959, + 'pd' => 960, + 'pe' => 961, + 'perlspace' => 983, + 'perlword' => 985, + 'perm' => 962, + 'pf' => 963, + 'phag' => 
964, + 'phaistos' => 965, + 'phli' => 966, + 'phlp' => 967, + 'phnx' => 968, + 'phoneticext' => 969, + 'phoneticextsup' => 970, + 'pi' => 971, + 'playingcards' => 972, + 'po' => 973, + 'posixalnum' => 974, + 'posixalpha' => 975, + 'posixblank' => 976, + 'posixcntrl' => 977, + 'posixdigit' => 978, + 'posixgraph' => 979, + 'posixlower' => 980, + 'posixprint' => 981, + 'posixpunct' => 982, + 'posixspace' => 983, + 'posixupper' => 984, + 'posixword' => 985, + 'posixxdigit' => 986, + 'print' => 1191, + 'prti' => 987, + 'ps' => 988, + 'pua' => 989, + 'qaai' => 990, + 'qmark' => 991, + 'radical' => 992, + 'ri' => 993, + 'rjng' => 994, + 'rohg' => 995, + 'rumi' => 996, + 'runr' => 997, + 's' => 998, + 'samr' => 999, + 'sarb' => 1000, + 'saur' => 1001, + 'sb=at' => 1002, + 'sb=cl' => 1003, + 'sb=ex' => 1004, + 'sb=fo' => 1005, + 'sb=le' => 1006, + 'sb=lo' => 1007, + 'sb=nu' => 1008, + 'sb=sc' => 1009, + 'sb=se' => 1010, + 'sb=sp' => 1011, + 'sb=st' => 1012, + 'sb=up' => 1013, + 'sb=xx' => 1014, + 'sc' => 1015, + 'sc=adlm' => 1016, + 'sc=arab' => 1017, + 'sc=beng' => 1018, + 'sc=bopo' => 1019, + 'sc=bugi' => 1020, + 'sc=buhd' => 1021, + 'sc=cakm' => 1022, + 'sc=copt' => 1023, + 'sc=cpmn' => 1024, + 'sc=cprt' => 1025, + 'sc=cyrl' => 1026, + 'sc=deva' => 1027, + 'sc=dogr' => 1028, + 'sc=dupl' => 1029, + 'sc=geor' => 1030, + 'sc=glag' => 1031, + 'sc=gong' => 1032, + 'sc=gonm' => 1033, + 'sc=gran' => 1034, + 'sc=grek' => 1035, + 'sc=gujr' => 1036, + 'sc=guru' => 1037, + 'sc=han' => 1038, + 'sc=hang' => 1039, + 'sc=hano' => 1040, + 'sc=hira' => 1041, + 'sc=java' => 1042, + 'sc=kali' => 1043, + 'sc=kana' => 1044, + 'sc=khoj' => 1045, + 'sc=knda' => 1046, + 'sc=kthi' => 1047, + 'sc=latn' => 1048, + 'sc=limb' => 1049, + 'sc=lina' => 1050, + 'sc=linb' => 1051, + 'sc=mahj' => 1052, + 'sc=mand' => 1053, + 'sc=mani' => 1054, + 'sc=mlym' => 1055, + 'sc=modi' => 1056, + 'sc=mong' => 1057, + 'sc=mult' => 1058, + 'sc=mymr' => 1059, + 'sc=nand' => 1060, + 'sc=nko' => 1061, + 'sc=orya' => 
1062, + 'sc=ougr' => 1063, + 'sc=perm' => 1064, + 'sc=phag' => 1065, + 'sc=phlp' => 1066, + 'sc=qaai' => 1067, + 'sc=rohg' => 1068, + 'sc=shrd' => 1069, + 'sc=sind' => 1070, + 'sc=sinh' => 1071, + 'sc=sogd' => 1072, + 'sc=sylo' => 1073, + 'sc=syrc' => 1074, + 'sc=tagb' => 1075, + 'sc=takr' => 1076, + 'sc=tale' => 1077, + 'sc=taml' => 1078, + 'sc=telu' => 1079, + 'sc=tglg' => 1080, + 'sc=thaa' => 1081, + 'sc=tirh' => 1082, + 'sc=yezi' => 1083, + 'sc=yi' => 1084, + 'sc=zyyy' => 1085, + 'sd' => 1086, + 'sgnw' => 1087, + 'shaw' => 1088, + 'shorthandformatcontrols' => 1089, + 'shrd' => 1090, + 'sidd' => 1091, + 'sind' => 1092, + 'sinh' => 1093, + 'sinhalaarchaicnumbers' => 1094, + 'sk' => 1095, + 'sm' => 1096, + 'smallforms' => 1097, + 'smallkanaext' => 1098, + 'so' => 1099, + 'sogd' => 1100, + 'sogo' => 1101, + 'sora' => 1102, + 'soyo' => 1103, + 'space' => 1193, + 'spaceperl' => 1193, + 'specials' => 1104, + 'sterm' => 1105, + 'sund' => 1106, + 'sundanesesup' => 1107, + 'suparrowsa' => 1108, + 'suparrowsb' => 1109, + 'suparrowsc' => 1110, + 'superandsub' => 1111, + 'supmathoperators' => 1112, + 'suppuaa' => 1113, + 'suppuab' => 1114, + 'suppunctuation' => 1115, + 'supsymbolsandpictographs' => 1116, + 'suttonsignwriting' => 1117, + 'sylo' => 1118, + 'symbolsandpictographsexta' => 1119, + 'symbolsforlegacycomputing' => 1120, + 'syrc' => 1121, + 'syriacsup' => 1122, + 'tagb' => 1123, + 'tags' => 1124, + 'taixuanjing' => 1125, + 'takr' => 1126, + 'tale' => 1127, + 'talu' => 1128, + 'tamilsup' => 1129, + 'taml' => 1130, + 'tang' => 1131, + 'tangutcomponents' => 1132, + 'tangutsup' => 1133, + 'tavt' => 1134, + 'telu' => 1135, + 'term' => 1136, + 'tfng' => 1137, + 'tglg' => 1138, + 'thaa' => 1139, + 'thai' => 1140, + 'tibt' => 1141, + 'tirh' => 1142, + 'title' => 1143, + 'titlecase' => 1143, + 'titlecaseletter' => 1143, + 'tnsa' => 1144, + 'toto' => 1145, + 'transportandmap' => 1146, + 'ucas' => 1147, + 'ucasext' => 1148, + 'ucasexta' => 1149, + 'ugar' => 1150, + 'uideo' => 
1151, + 'upper' => 1194, + 'uppercase' => 1194, + 'uppercaseletter' => 1152, + 'vai' => 1153, + 'vedicext' => 1154, + 'verticalforms' => 1155, + 'vertspace' => 1156, + 'vith' => 1157, + 'vo=r' => 1158, + 'vo=tr' => 1159, + 'vo=tu' => 1160, + 'vo=u' => 1161, + 'vs' => 1162, + 'vssup' => 1163, + 'wara' => 1164, + 'wb=dq' => 1165, + 'wb=eb' => 1166, + 'wb=ex' => 1167, + 'wb=extend' => 1168, + 'wb=fo' => 1169, + 'wb=ka' => 1170, + 'wb=le' => 1171, + 'wb=mb' => 1172, + 'wb=ml' => 1173, + 'wb=mn' => 1174, + 'wb=nl' => 1175, + 'wb=nu' => 1176, + 'wb=sq' => 1177, + 'wb=wsegspace' => 1178, + 'wb=xx' => 1179, + 'wcho' => 1180, + 'whitespace' => 1193, + 'word' => 1195, + 'wspace' => 1193, + 'xdigit' => 1196, + 'xidc' => 1181, + 'xids' => 1182, + 'xpeo' => 1183, + 'xperlspace' => 1193, + 'xposixalnum' => 1184, + 'xposixalpha' => 1185, + 'xposixblank' => 1186, + 'xposixcntrl' => 1187, + 'xposixdigit' => 1188, + 'xposixgraph' => 1189, + 'xposixlower' => 1190, + 'xposixprint' => 1191, + 'xposixpunct' => 1192, + 'xposixspace' => 1193, + 'xposixupper' => 1194, + 'xposixword' => 1195, + 'xposixxdigit' => 1196, + 'xsux' => 1197, + 'yezi' => 1198, + 'yi' => 1199, + 'yijing' => 1200, + 'yiradicals' => 1201, + 'yisyllables' => 1202, + 'z' => 1203, + 'zanb' => 1204, + 'zl' => 1205, + 'znamennymusic' => 1206, + 'zp' => 1207, + 'zs' => 1208, + 'zyyy' => 1209, + 'zzzz' => 1210, ); 1; # Generated from: # 688d673ec947f7ccf898b4eae9848139d4d33676b688dee54f449f8bf9d3bbd2 lib/Unicode/UCD.pm -# ce96627d4fc91b4fd886c409caeb9b76cf7bd345e12f05c6701add7f233f6437 lib/unicore/ArabicShaping.txt -# 0e69eef3da722cc104522d8372e86d5b86bb7afcc761b0c991e39e832294946d lib/unicore/BidiBrackets.txt -# a00d9d21585106a52113fb7b1d3d0373a5835be72e76862fb559ebddd474d70e lib/unicore/BidiMirroring.txt -# 81a82b6a9fcf1a9c12f588d7a1decd73a9afdc4cac95b0eb7e576e7942d6c19f lib/unicore/Blocks.txt -# 99d231d7c91688bbe8ca8ccebcc2f46b5b222f844babe4827295bae11e2abe5f lib/unicore/CaseFolding.txt -# 
38badafd818d8405324fe298c0676be0c95186368c84b5368375fd871a645144 lib/unicore/CompositionExclusions.txt -# e779a443d3aa2a3166a15becaa2b737c922480e32c0453d5956093633555078f lib/unicore/DAge.txt -# a5d45f59b39deaab3c72ce8c1a2e212a5e086dff11b1f9d5bb0e352642e82248 lib/unicore/DCoreProperties.txt -# 3ac44e11c84bdaf6b207d2c2c20eed857ae17052393fc7f71b0fe951186ba906 lib/unicore/DNormalizationProps.txt -# 4f822ec7a9ebbb3138ad29bade8b9688d25b39c7a3c0b7431f01e7229e4fcb6e lib/unicore/EastAsianWidth.txt -# fc535aa1047a70105ab9a22c2b4c3f363a2ff02fe48ebbc5eeb9873b2752ff0b lib/unicore/EquivalentUnifiedIdeograph.txt -# b9c5158ce944d2fec57e0e4ecb716bdabfc3bdde73525f1772fe03f61a30d473 lib/unicore/HangulSyllableType.txt -# 36c1b2a626ff1fb23b8b21e6ea8712698f8ce668dded1cb48b8ddf6a6a1b04e9 lib/unicore/IdStatus.txt -# 4857c4ffa3898e6128b2d46b0a02e499a663fb91464a69ef3611096f01293acc lib/unicore/IdType.txt -# 69197b019fa5f2fb0d8c6ed1ed8acb9f2e8b5b8f45a947953ffa652f3bf54983 lib/unicore/IndicPositionalCategory.txt -# 6604e2f0fde7428675364aa0006bc686b79488dcc60ae8cb29800af2be3352e8 lib/unicore/IndicSyllabicCategory.txt -# 84ead63924aaa74b988b2eaf254a8733276ed108633ce2ef77a9ee1de7818162 lib/unicore/Jamo.txt -# d5abcd8f54c8a2aa912924c485ccf7f968ad98feaa303d8e9a29ad89172f1faf lib/unicore/LineBreak.txt -# 985128e8c8b2540233331d9b27d897d2c23bd5bcf1d05da960befce6efc59542 lib/unicore/NameAliases.txt -# 27282b8aa01d4d0c44aef436cb74195ae8639ffa187aeee4e6247af76febea76 lib/unicore/NamedSequences.txt -# 485b5a3ed25dbf1f94dfa5a9b69d8b4550ffd0c33045ccc55ccfd7c80b2a40cf lib/unicore/PropList.txt -# 6b3902e9268cd843fe65cbdea992108c9528343ec0679f800b96f356bb553e5a lib/unicore/PropValueAliases.txt -# 2bd5777847e3d6add3c7e5c0d1393ddcab89e5a0ac3ff498cb0c53041f0b86e4 lib/unicore/PropertyAliases.txt -# 03a61dc89422e44cc2b73e8e893321007880ab69e2a4d281c0f1bc29c602b9d0 lib/unicore/ScriptExtensions.txt -# 9a5ed1ec9b5f0d7147e9371ad792ab39203611af7637cff2aa4a5c663b172cde lib/unicore/Scripts.txt -# 
6424312f1dc39b22e0ff9c0ffb13dfad424d9b03e6a6dc6bca941f6bf5ef1ffd lib/unicore/SpecialCasing.txt -# bdbffbbfc8ad4d3a6d01b5891510458f3d36f7170422af4ea2bed3211a73e8bb lib/unicore/UnicodeData.txt -# 160f41816234addb511901d5f21febd69574578dd93de6ef8153e35693325575 lib/unicore/VerticalOrientation.txt -# 32dfb37d21db530529a6ec3dc13d96f21f8e7c7faf7ff3db8a9760cd76cec81d lib/unicore/auxiliary/GCBTest.txt -# 2bd3c5e2d62701ff81fb3ec318e179a4618cabb1493b1e0dd2b4e7e56c5437c4 lib/unicore/auxiliary/GraphemeBreakProperty.txt -# c51fbebfa82a0f36473b44bfd71d5ef6cb6a1f81fb313375dc9a1910d79bb2b6 lib/unicore/auxiliary/LBTest.txt -# 80b0107750818d8f370bd120b6fe56b6855b60581f72affe8b60409a469b4b65 lib/unicore/auxiliary/SBTest.txt -# 09e3166ebab166ac630a227f77f4e794ebd433271abd5588f5a67e7f199c71ee lib/unicore/auxiliary/SentenceBreakProperty.txt -# bf5373ce28a5df06796c93dc159dd15a997bb2950c92704b40ae8190cfc3716d lib/unicore/auxiliary/WBTest.txt -# a2b7373cf2fe3fa3b26dbb53405ca849985f771ff47f1c61743978003ff80499 lib/unicore/auxiliary/WordBreakProperty.txt -# d2686f400a638c80775d7c662556fb8fa8dd3bbe4aa548d9d31624264c6e1bb1 lib/unicore/emoji/emoji.txt -# b827ae5da8c2b08947cc9a120a7b7fd2f1676fb160b508df78075381635b127c lib/unicore/extracted/DBidiClass.txt -# 6fdc5b5ef40444a8f0c772e6b67c00498d4216fe0c0fdf76744ce338f2ad3810 lib/unicore/extracted/DBinaryProperties.txt -# e14928a5bf6ad5958a80332bd42e96e14420080a95c660e5da29384e496755d0 lib/unicore/extracted/DCombiningClass.txt -# 579a03281fbe87b78d5d9a8523de4d255edd7e4ca6eab0e4c7729de97e9b89b1 lib/unicore/extracted/DDecompositionType.txt -# ad83c59b257e9d480ffd3001d4ac240c5fed7cb1919453e1c4e8877035256bcd lib/unicore/extracted/DEastAsianWidth.txt -# 4502f0969e4e6558c4b4c6ca4c23dad70b863d61dd3d5eed1a62a6c3c99fd570 lib/unicore/extracted/DGeneralCategory.txt -# 00bb88b89e2adb646f3177f9444e2d3192386b81a5de9556104b338274b253e1 lib/unicore/extracted/DJoinGroup.txt -# ac835b6e11a60c9820d3cf2d1cb0558dd68efb8f53f404a51632e4726690a6d7 
lib/unicore/extracted/DJoinType.txt -# baba9dfc133e3cb770a89aaf0973b1341fa61c2da6c176baf6428898b3b568d8 lib/unicore/extracted/DLineBreak.txt -# 6d4a8c945dd7db83ed617cbb7d937de7f4ecf016ff22970d846e996a7c9a2a5d lib/unicore/extracted/DNumType.txt -# 5b7c14380d5cceeaffcfbc18db1ed936391d2af2d51f5a41f1a17b692c77e59b lib/unicore/extracted/DNumValues.txt -# 4e169849b96b76987a8fc443ef421b44d2dcebbd981bb457f6a13e8af77cdbe2 lib/unicore/mktables -# 50b85a67451145545a65cea370dab8d3444fbfe07e9c34cef560c5b7da9d3eef lib/unicore/version +# c7698811e9adb6cc98fb996a7de4be2b6532f2ac67e76055cc8afdbf6ee18af3 lib/unicore/ArabicShaping.txt +# 24a74555f918bbe99f5b3f1b83cf36fc0e205bb8a600a6a3aa539c710a3dcf27 lib/unicore/BidiBrackets.txt +# 7a5c74cedc1616a9af0a9d22e108ae592d86fe93649c144ae6ba49f193a44122 lib/unicore/BidiMirroring.txt +# 598870dddef7b34b5a972916528c456aff2765b79cd4f9647fb58ceb767e7f17 lib/unicore/Blocks.txt +# a566cd48687b2cd897e02501118b2413c14ae86d318f9abbbba97feb84189f0f lib/unicore/CaseFolding.txt +# 3360762fc3295cea54ab251c31df621d05ba4b94d46c60eaac29aa16d70ad1e0 lib/unicore/CompositionExclusions.txt +# 7e058dec02147098bc9c28d86209f0f251bba0538f3b5a705ad02ea3bb709fe0 lib/unicore/DAge.txt +# e3eddd7d469cd1b0feed7528defad1a1cc7c6a9ceb0ae4446a6d10921ed2e7bc lib/unicore/DCoreProperties.txt +# b2c444c20730b097787fdf50bd7d6dd3fc5256ab8084f5b35b11c8776eca674c lib/unicore/DNormalizationProps.txt +# f901ac011aa32a09224d6555da71e2532c59c1d3381322829de0e3b880507250 lib/unicore/EastAsianWidth.txt +# 5995522f01633073911dad1edb74d13aa832f42862c0392a79627b85d52f2391 lib/unicore/EquivalentUnifiedIdeograph.txt +# cd1c9367cba438afa965fcb5edc6ed3ec6e685fd5dd21c0cc20c026f04beb0e5 lib/unicore/HangulSyllableType.txt +# 3f3f368fccdb37f350ecedc20b37fa71ab31c04e847884c77780d34283539f73 lib/unicore/IdStatus.txt +# 45a150c23961b58d7784704af6c4daccd6517d97b6489e53d13bbdbf9e4f065f lib/unicore/IdType.txt +# d8704c8725568813a947ff2ef38bcf1f05e2a6fbea6876ba384890f187a8bf61 
lib/unicore/IndicPositionalCategory.txt +# c7b969b653dc278fb66ab4136223d320e30ad19367eb791ae60dcc6d92071b16 lib/unicore/IndicSyllabicCategory.txt +# 39ff89e0a329e1ccce6d54fad8cf82e90926901928c0ca9b9a2ad5681f330dd9 lib/unicore/Jamo.txt +# 9e06e9f35c6959fb91dcc7993f90d58523c3079bc62c6b25f828b4cdebc5d70c lib/unicore/LineBreak.txt +# 14b3b677d33f95c51423dce6eef4a6a28b4b160451ecedee4b91edb6745cf4a3 lib/unicore/NameAliases.txt +# db5745688affcdc0c3927a1ee0667018a96a7b24513f866d5235e98fef6c2436 lib/unicore/NamedSequences.txt +# 6bddfdb850417a5bee6deff19290fd1b138589909afb50f5a049f343bf2c6722 lib/unicore/PropList.txt +# eb755757e20b72b330b2948df3cf2ff7adb0e31bb060140dc09dafb132ace2cd lib/unicore/PropValueAliases.txt +# 859d7225f2d2a460b3ccb1d61a7945f8cc219acdf5aa53b66b7a1e4bf6ebfc87 lib/unicore/PropertyAliases.txt +# d37eedf63ff9c48bac863d5f76862373d6cf5269fd21253d499e2430d638c01d lib/unicore/ScriptExtensions.txt +# 52db475c4ec445e73b0b16915448c357614946ad7062843c563e00d7535c6510 lib/unicore/Scripts.txt +# c667b45908fd269af25fd55d2fc5bbc157fb1b77675936e25c513ce32e080334 lib/unicore/SpecialCasing.txt +# 36018e68657fdcb3485f636630ffe8c8532e01c977703d2803f5b89d6c5feafb lib/unicore/UnicodeData.txt +# 869ff43dd012f924d03c89fc268c88f0e7eea72f0228b91ca30455afdb84f8fd lib/unicore/VerticalOrientation.txt +# ddc7d4d1f3838573b94fc5d83ff7217e63c47b22ae1cd40c5fe1a54efc15589b lib/unicore/auxiliary/GCBTest.txt +# 97e79f1f8d9cd76d120f2420381a01abc00a7c78a2aa583fa3f9627264a99742 lib/unicore/auxiliary/GraphemeBreakProperty.txt +# 488dbb6a7e1d0070d4aa7c175352c818ff6425172850d1b40c6177726658cb05 lib/unicore/auxiliary/LBTest.txt +# 7e42dd749dbb94aa44b13faf9df6319d9a16ce2ea09a3a094fcfbb5962168040 lib/unicore/auxiliary/SBTest.txt +# 7092ca4117cec891c25c7724132efc519e1dece01ae9fd6068035a9db04d526e lib/unicore/auxiliary/SentenceBreakProperty.txt +# 8094b544ec1580c7e41ac0187805cc1aeb330a90301ec7505563e1a59318284e lib/unicore/auxiliary/WBTest.txt +# 
7716752aad296d4ab23ff4ed0a2746fc5328750ff84e9e7d6f3828ee9eaef742 lib/unicore/auxiliary/WordBreakProperty.txt +# b597836124298b8f7fa076273802840cfc3271a25f5c397a082e120954b82c3c lib/unicore/emoji/emoji.txt +# e5fe51acc74e3e83b4fb4c7b25f3c34491d6eb8095c9955d0712dafbca7b3c2b lib/unicore/extracted/DBidiClass.txt +# cd0a14176d93bf440b77a582a0d678190fc0688b15442d4cfb250bf2e27956af lib/unicore/extracted/DBinaryProperties.txt +# 12b0c3af9b600b49488d66545a3e7844ea980809627201bf9afeebe1c9f16f4e lib/unicore/extracted/DCombiningClass.txt +# f76064b298cfbd715ba542e7894f7a507d32da2f011070d1d01df95cad9817d6 lib/unicore/extracted/DDecompositionType.txt +# f9bef074cc916db57fece99d54a4505f8e7c7b17481619e3f0005211f7717d4b lib/unicore/extracted/DEastAsianWidth.txt +# cde679c8461976ed40d7edf61ae98cbb947540831f06f5bc7da7decbf91a1420 lib/unicore/extracted/DGeneralCategory.txt +# 9bb891831328713603a486a4a03df7f7987c3e1e8144a6d1ac71fd061ef3f732 lib/unicore/extracted/DJoinGroup.txt +# e97c65bbea0a69d2fae6ec4182b09e519e13232e20bd804b3004edc0f36bb0d4 lib/unicore/extracted/DJoinType.txt +# 43f6df50e4878f501b417e366b0ee097ae5ccb2d4ce942026bed3d62d78e7887 lib/unicore/extracted/DLineBreak.txt +# a04502ebb36a45d83cbe48a7d8132ea8143edb7b3d34d0aa6afe4a9685049741 lib/unicore/extracted/DNumType.txt +# 11075771b112e8e7ccf6ffa637c4c91eadc3ef3db0517b24e605df8fd3624239 lib/unicore/extracted/DNumValues.txt +# 24b7b7bda1a2ab4684ba53355d82ad227c1624b337b37c3b96f2e4b902eea1f2 lib/unicore/mktables +# c72bbdeda99714db1c8024d3311da4aef3c0db3b9b9f11455a7cfe10d5e9aba3 lib/unicore/version # 0a6b5ab33bb1026531f816efe81aea1a8ffcd34a27cbea37dd6a70a63d73c844 regen/charset_translations.pl # 5f8520d3a17ade6317fc0c423f5091470924b1ef425bca0c41ce8e4a9f8460fe regen/mk_PL_charclass.pl -# 04a5294218c412e5ee2e0d9f8d22af1d95bbfd2cafae3935cbb6b5871e9f9704 regen/mk_invlists.pl +# 6defb8383a69034f8279fea4ff66e09bf58049c4cbecf2331b9b245c45d4f2d5 regen/mk_invlists.pl # ex: set ro: diff --git a/lib/unicore/version 
b/lib/unicore/version index 02161ca86e..4b964e9654 100644 --- a/lib/unicore/version +++ b/lib/unicore/version @@ -1 +1 @@ -13.0.0 +14.0.0 diff --git a/pod/perldelta.pod b/pod/perldelta.pod index 7ea95874f6..c61c46a504 100644 --- a/pod/perldelta.pod +++ b/pod/perldelta.pod @@ -35,6 +35,10 @@ at a later time, during scope exit. For more information, see L. +=head2 Unicode 14.0 is supported + +See L for details. + =head2 SIGFPE no longer deferred Floating-point exceptions are now delivered immediately, in the same way diff --git a/regcharclass.h b/regcharclass.h index 0500d572bd..c4d2f9db69 100644 --- a/regcharclass.h +++ b/regcharclass.h @@ -245,7 +245,7 @@ ( ( 0x80 == ((const U8*)s)[2] ) ? 3 : 0 ) \ : ( 0x9E == ((const U8*)s)[1] ) ? \ ( ( inRANGE_helper_(U8, ((const U8*)s)[2], 0xB4, 0xB5) ) ? 3 : 0 ) \ - : ( ( 0xA0 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x8B, 0x8E) ) ) ? 3 : 0 )\ + : ( ( 0xA0 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x8B, 0x8F) ) ) ? 3 : 0 )\ : ( 0xE2 == ((const U8*)s)[0] ) ? \ ( ( 0x80 == ((const U8*)s)[1] ) ? \ ( ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x80, 0xBE) ) ? 3 : 0 ) \ @@ -1482,7 +1482,7 @@ ( ( 0x41 == ((const U8*)s)[2] ) ? 3 : 0 ) \ : ( ( 0x71 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x63, 0x64) ) ) ? 3 : 0 )\ : ( 0xBE == ((const U8*)s)[0] ) ? \ - ( ( ( 0x41 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x52, 0x55) ) ) ? 3 : 0 )\ + ( ( ( 0x41 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x52, 0x56) ) ) ? 3 : 0 )\ : ( 0xCA == ((const U8*)s)[0] ) ? \ ( ( 0x41 == ((const U8*)s)[1] || inRANGE_helper_(U8, NATIVE_UTF8_TO_I8(((const U8*)s)[1]), 0xAD, 0xBF) ) ?\ 3 \ @@ -2711,7 +2711,7 @@ ( ( 0x41 == ((const U8*)s)[2] ) ? 3 : 0 ) \ : ( ( 0x70 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x62, 0x63) ) ) ? 3 : 0 )\ : ( 0xBE == ((const U8*)s)[0] ) ? 
\ - ( ( ( 0x41 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x52, 0x55) ) ) ? 3 : 0 )\ + ( ( ( 0x41 == ((const U8*)s)[1] ) && ( inRANGE_helper_(U8, ((const U8*)s)[2], 0x52, 0x56) ) ) ? 3 : 0 )\ : ( 0xCA == ((const U8*)s)[0] ) ? \ ( ( 0x41 == ((const U8*)s)[1] || inRANGE_helper_(U8, NATIVE_UTF8_TO_I8(((const U8*)s)[1]), 0xAD, 0xBF) ) ?\ 3 \ @@ -3715,55 +3715,55 @@ /* Generated from: * 688d673ec947f7ccf898b4eae9848139d4d33676b688dee54f449f8bf9d3bbd2 lib/Unicode/UCD.pm - * ce96627d4fc91b4fd886c409caeb9b76cf7bd345e12f05c6701add7f233f6437 lib/unicore/ArabicShaping.txt - * 0e69eef3da722cc104522d8372e86d5b86bb7afcc761b0c991e39e832294946d lib/unicore/BidiBrackets.txt - * a00d9d21585106a52113fb7b1d3d0373a5835be72e76862fb559ebddd474d70e lib/unicore/BidiMirroring.txt - * 81a82b6a9fcf1a9c12f588d7a1decd73a9afdc4cac95b0eb7e576e7942d6c19f lib/unicore/Blocks.txt - * 99d231d7c91688bbe8ca8ccebcc2f46b5b222f844babe4827295bae11e2abe5f lib/unicore/CaseFolding.txt - * 38badafd818d8405324fe298c0676be0c95186368c84b5368375fd871a645144 lib/unicore/CompositionExclusions.txt - * e779a443d3aa2a3166a15becaa2b737c922480e32c0453d5956093633555078f lib/unicore/DAge.txt - * a5d45f59b39deaab3c72ce8c1a2e212a5e086dff11b1f9d5bb0e352642e82248 lib/unicore/DCoreProperties.txt - * 3ac44e11c84bdaf6b207d2c2c20eed857ae17052393fc7f71b0fe951186ba906 lib/unicore/DNormalizationProps.txt - * 4f822ec7a9ebbb3138ad29bade8b9688d25b39c7a3c0b7431f01e7229e4fcb6e lib/unicore/EastAsianWidth.txt - * fc535aa1047a70105ab9a22c2b4c3f363a2ff02fe48ebbc5eeb9873b2752ff0b lib/unicore/EquivalentUnifiedIdeograph.txt - * b9c5158ce944d2fec57e0e4ecb716bdabfc3bdde73525f1772fe03f61a30d473 lib/unicore/HangulSyllableType.txt - * 36c1b2a626ff1fb23b8b21e6ea8712698f8ce668dded1cb48b8ddf6a6a1b04e9 lib/unicore/IdStatus.txt - * 4857c4ffa3898e6128b2d46b0a02e499a663fb91464a69ef3611096f01293acc lib/unicore/IdType.txt - * 69197b019fa5f2fb0d8c6ed1ed8acb9f2e8b5b8f45a947953ffa652f3bf54983 lib/unicore/IndicPositionalCategory.txt - * 
6604e2f0fde7428675364aa0006bc686b79488dcc60ae8cb29800af2be3352e8 lib/unicore/IndicSyllabicCategory.txt - * 84ead63924aaa74b988b2eaf254a8733276ed108633ce2ef77a9ee1de7818162 lib/unicore/Jamo.txt - * d5abcd8f54c8a2aa912924c485ccf7f968ad98feaa303d8e9a29ad89172f1faf lib/unicore/LineBreak.txt - * 985128e8c8b2540233331d9b27d897d2c23bd5bcf1d05da960befce6efc59542 lib/unicore/NameAliases.txt - * 27282b8aa01d4d0c44aef436cb74195ae8639ffa187aeee4e6247af76febea76 lib/unicore/NamedSequences.txt - * 485b5a3ed25dbf1f94dfa5a9b69d8b4550ffd0c33045ccc55ccfd7c80b2a40cf lib/unicore/PropList.txt - * 6b3902e9268cd843fe65cbdea992108c9528343ec0679f800b96f356bb553e5a lib/unicore/PropValueAliases.txt - * 2bd5777847e3d6add3c7e5c0d1393ddcab89e5a0ac3ff498cb0c53041f0b86e4 lib/unicore/PropertyAliases.txt - * 03a61dc89422e44cc2b73e8e893321007880ab69e2a4d281c0f1bc29c602b9d0 lib/unicore/ScriptExtensions.txt - * 9a5ed1ec9b5f0d7147e9371ad792ab39203611af7637cff2aa4a5c663b172cde lib/unicore/Scripts.txt - * 6424312f1dc39b22e0ff9c0ffb13dfad424d9b03e6a6dc6bca941f6bf5ef1ffd lib/unicore/SpecialCasing.txt - * bdbffbbfc8ad4d3a6d01b5891510458f3d36f7170422af4ea2bed3211a73e8bb lib/unicore/UnicodeData.txt - * 160f41816234addb511901d5f21febd69574578dd93de6ef8153e35693325575 lib/unicore/VerticalOrientation.txt - * 32dfb37d21db530529a6ec3dc13d96f21f8e7c7faf7ff3db8a9760cd76cec81d lib/unicore/auxiliary/GCBTest.txt - * 2bd3c5e2d62701ff81fb3ec318e179a4618cabb1493b1e0dd2b4e7e56c5437c4 lib/unicore/auxiliary/GraphemeBreakProperty.txt - * c51fbebfa82a0f36473b44bfd71d5ef6cb6a1f81fb313375dc9a1910d79bb2b6 lib/unicore/auxiliary/LBTest.txt - * 80b0107750818d8f370bd120b6fe56b6855b60581f72affe8b60409a469b4b65 lib/unicore/auxiliary/SBTest.txt - * 09e3166ebab166ac630a227f77f4e794ebd433271abd5588f5a67e7f199c71ee lib/unicore/auxiliary/SentenceBreakProperty.txt - * bf5373ce28a5df06796c93dc159dd15a997bb2950c92704b40ae8190cfc3716d lib/unicore/auxiliary/WBTest.txt - * a2b7373cf2fe3fa3b26dbb53405ca849985f771ff47f1c61743978003ff80499 
lib/unicore/auxiliary/WordBreakProperty.txt - * d2686f400a638c80775d7c662556fb8fa8dd3bbe4aa548d9d31624264c6e1bb1 lib/unicore/emoji/emoji.txt - * b827ae5da8c2b08947cc9a120a7b7fd2f1676fb160b508df78075381635b127c lib/unicore/extracted/DBidiClass.txt - * 6fdc5b5ef40444a8f0c772e6b67c00498d4216fe0c0fdf76744ce338f2ad3810 lib/unicore/extracted/DBinaryProperties.txt - * e14928a5bf6ad5958a80332bd42e96e14420080a95c660e5da29384e496755d0 lib/unicore/extracted/DCombiningClass.txt - * 579a03281fbe87b78d5d9a8523de4d255edd7e4ca6eab0e4c7729de97e9b89b1 lib/unicore/extracted/DDecompositionType.txt - * ad83c59b257e9d480ffd3001d4ac240c5fed7cb1919453e1c4e8877035256bcd lib/unicore/extracted/DEastAsianWidth.txt - * 4502f0969e4e6558c4b4c6ca4c23dad70b863d61dd3d5eed1a62a6c3c99fd570 lib/unicore/extracted/DGeneralCategory.txt - * 00bb88b89e2adb646f3177f9444e2d3192386b81a5de9556104b338274b253e1 lib/unicore/extracted/DJoinGroup.txt - * ac835b6e11a60c9820d3cf2d1cb0558dd68efb8f53f404a51632e4726690a6d7 lib/unicore/extracted/DJoinType.txt - * baba9dfc133e3cb770a89aaf0973b1341fa61c2da6c176baf6428898b3b568d8 lib/unicore/extracted/DLineBreak.txt - * 6d4a8c945dd7db83ed617cbb7d937de7f4ecf016ff22970d846e996a7c9a2a5d lib/unicore/extracted/DNumType.txt - * 5b7c14380d5cceeaffcfbc18db1ed936391d2af2d51f5a41f1a17b692c77e59b lib/unicore/extracted/DNumValues.txt - * 4e169849b96b76987a8fc443ef421b44d2dcebbd981bb457f6a13e8af77cdbe2 lib/unicore/mktables - * 50b85a67451145545a65cea370dab8d3444fbfe07e9c34cef560c5b7da9d3eef lib/unicore/version + * c7698811e9adb6cc98fb996a7de4be2b6532f2ac67e76055cc8afdbf6ee18af3 lib/unicore/ArabicShaping.txt + * 24a74555f918bbe99f5b3f1b83cf36fc0e205bb8a600a6a3aa539c710a3dcf27 lib/unicore/BidiBrackets.txt + * 7a5c74cedc1616a9af0a9d22e108ae592d86fe93649c144ae6ba49f193a44122 lib/unicore/BidiMirroring.txt + * 598870dddef7b34b5a972916528c456aff2765b79cd4f9647fb58ceb767e7f17 lib/unicore/Blocks.txt + * a566cd48687b2cd897e02501118b2413c14ae86d318f9abbbba97feb84189f0f lib/unicore/CaseFolding.txt 
+ * 3360762fc3295cea54ab251c31df621d05ba4b94d46c60eaac29aa16d70ad1e0 lib/unicore/CompositionExclusions.txt + * 7e058dec02147098bc9c28d86209f0f251bba0538f3b5a705ad02ea3bb709fe0 lib/unicore/DAge.txt + * e3eddd7d469cd1b0feed7528defad1a1cc7c6a9ceb0ae4446a6d10921ed2e7bc lib/unicore/DCoreProperties.txt + * b2c444c20730b097787fdf50bd7d6dd3fc5256ab8084f5b35b11c8776eca674c lib/unicore/DNormalizationProps.txt + * f901ac011aa32a09224d6555da71e2532c59c1d3381322829de0e3b880507250 lib/unicore/EastAsianWidth.txt + * 5995522f01633073911dad1edb74d13aa832f42862c0392a79627b85d52f2391 lib/unicore/EquivalentUnifiedIdeograph.txt + * cd1c9367cba438afa965fcb5edc6ed3ec6e685fd5dd21c0cc20c026f04beb0e5 lib/unicore/HangulSyllableType.txt + * 3f3f368fccdb37f350ecedc20b37fa71ab31c04e847884c77780d34283539f73 lib/unicore/IdStatus.txt + * 45a150c23961b58d7784704af6c4daccd6517d97b6489e53d13bbdbf9e4f065f lib/unicore/IdType.txt + * d8704c8725568813a947ff2ef38bcf1f05e2a6fbea6876ba384890f187a8bf61 lib/unicore/IndicPositionalCategory.txt + * c7b969b653dc278fb66ab4136223d320e30ad19367eb791ae60dcc6d92071b16 lib/unicore/IndicSyllabicCategory.txt + * 39ff89e0a329e1ccce6d54fad8cf82e90926901928c0ca9b9a2ad5681f330dd9 lib/unicore/Jamo.txt + * 9e06e9f35c6959fb91dcc7993f90d58523c3079bc62c6b25f828b4cdebc5d70c lib/unicore/LineBreak.txt + * 14b3b677d33f95c51423dce6eef4a6a28b4b160451ecedee4b91edb6745cf4a3 lib/unicore/NameAliases.txt + * db5745688affcdc0c3927a1ee0667018a96a7b24513f866d5235e98fef6c2436 lib/unicore/NamedSequences.txt + * 6bddfdb850417a5bee6deff19290fd1b138589909afb50f5a049f343bf2c6722 lib/unicore/PropList.txt + * eb755757e20b72b330b2948df3cf2ff7adb0e31bb060140dc09dafb132ace2cd lib/unicore/PropValueAliases.txt + * 859d7225f2d2a460b3ccb1d61a7945f8cc219acdf5aa53b66b7a1e4bf6ebfc87 lib/unicore/PropertyAliases.txt + * d37eedf63ff9c48bac863d5f76862373d6cf5269fd21253d499e2430d638c01d lib/unicore/ScriptExtensions.txt + * 52db475c4ec445e73b0b16915448c357614946ad7062843c563e00d7535c6510 lib/unicore/Scripts.txt + * 
c667b45908fd269af25fd55d2fc5bbc157fb1b77675936e25c513ce32e080334 lib/unicore/SpecialCasing.txt + * 36018e68657fdcb3485f636630ffe8c8532e01c977703d2803f5b89d6c5feafb lib/unicore/UnicodeData.txt + * 869ff43dd012f924d03c89fc268c88f0e7eea72f0228b91ca30455afdb84f8fd lib/unicore/VerticalOrientation.txt + * ddc7d4d1f3838573b94fc5d83ff7217e63c47b22ae1cd40c5fe1a54efc15589b lib/unicore/auxiliary/GCBTest.txt + * 97e79f1f8d9cd76d120f2420381a01abc00a7c78a2aa583fa3f9627264a99742 lib/unicore/auxiliary/GraphemeBreakProperty.txt + * 488dbb6a7e1d0070d4aa7c175352c818ff6425172850d1b40c6177726658cb05 lib/unicore/auxiliary/LBTest.txt + * 7e42dd749dbb94aa44b13faf9df6319d9a16ce2ea09a3a094fcfbb5962168040 lib/unicore/auxiliary/SBTest.txt + * 7092ca4117cec891c25c7724132efc519e1dece01ae9fd6068035a9db04d526e lib/unicore/auxiliary/SentenceBreakProperty.txt + * 8094b544ec1580c7e41ac0187805cc1aeb330a90301ec7505563e1a59318284e lib/unicore/auxiliary/WBTest.txt + * 7716752aad296d4ab23ff4ed0a2746fc5328750ff84e9e7d6f3828ee9eaef742 lib/unicore/auxiliary/WordBreakProperty.txt + * b597836124298b8f7fa076273802840cfc3271a25f5c397a082e120954b82c3c lib/unicore/emoji/emoji.txt + * e5fe51acc74e3e83b4fb4c7b25f3c34491d6eb8095c9955d0712dafbca7b3c2b lib/unicore/extracted/DBidiClass.txt + * cd0a14176d93bf440b77a582a0d678190fc0688b15442d4cfb250bf2e27956af lib/unicore/extracted/DBinaryProperties.txt + * 12b0c3af9b600b49488d66545a3e7844ea980809627201bf9afeebe1c9f16f4e lib/unicore/extracted/DCombiningClass.txt + * f76064b298cfbd715ba542e7894f7a507d32da2f011070d1d01df95cad9817d6 lib/unicore/extracted/DDecompositionType.txt + * f9bef074cc916db57fece99d54a4505f8e7c7b17481619e3f0005211f7717d4b lib/unicore/extracted/DEastAsianWidth.txt + * cde679c8461976ed40d7edf61ae98cbb947540831f06f5bc7da7decbf91a1420 lib/unicore/extracted/DGeneralCategory.txt + * 9bb891831328713603a486a4a03df7f7987c3e1e8144a6d1ac71fd061ef3f732 lib/unicore/extracted/DJoinGroup.txt + * e97c65bbea0a69d2fae6ec4182b09e519e13232e20bd804b3004edc0f36bb0d4 
lib/unicore/extracted/DJoinType.txt + * 43f6df50e4878f501b417e366b0ee097ae5ccb2d4ce942026bed3d62d78e7887 lib/unicore/extracted/DLineBreak.txt + * a04502ebb36a45d83cbe48a7d8132ea8143edb7b3d34d0aa6afe4a9685049741 lib/unicore/extracted/DNumType.txt + * 11075771b112e8e7ccf6ffa637c4c91eadc3ef3db0517b24e605df8fd3624239 lib/unicore/extracted/DNumValues.txt + * 24b7b7bda1a2ab4684ba53355d82ad227c1624b337b37c3b96f2e4b902eea1f2 lib/unicore/mktables + * c72bbdeda99714db1c8024d3311da4aef3c0db3b9b9f11455a7cfe10d5e9aba3 lib/unicore/version * 0a6b5ab33bb1026531f816efe81aea1a8ffcd34a27cbea37dd6a70a63d73c844 regen/charset_translations.pl * 1aa94679c695efd507b7e4491629dba1021b74c21a5324dfd3a582a5d654bd32 regen/regcharclass.pl * b2f896452d2b30da3e04800f478c60c1fd0b03d6b668689b020f1e3cf1f1cdd9 regen/regcharclass_multi_char_folds.pl diff --git a/regen/mk_invlists.pl b/regen/mk_invlists.pl index 8ea6254b57..7ed83dd5e6 100644 --- a/regen/mk_invlists.pl +++ b/regen/mk_invlists.pl @@ -1543,10 +1543,15 @@ sub output_LB_table() { } } - # LB30b Do not break between an emoji base and an emoji modifier. + # LB30b Do not break between an emoji base (or potential emoji) and an + # emoji modifier. + # EB × EM + # [\p{Extended_Pictographic}&\p{Cn}] × EM $lb_table[$lb_enums{'E_Base'}][$lb_enums{'E_Modifier'}] = $lb_actions{'LB_NOBREAK'}; + $lb_table[$lb_enums{'Unassigned_Extended_Pictographic_Ideographic'}] + [$lb_enums{'E_Modifier'}] = $lb_actions{'LB_NOBREAK'}; # LB30a Break between two regional indicator symbols if and only if there # are an even number of regional indicators preceding the position of the @@ -1597,18 +1602,6 @@ sub output_LB_table() { = $lb_actions{'LB_NOBREAK'}; # LB27 Treat a Korean Syllable Block the same as ID. 
- # (JL | JV | JT | H2 | H3) × IN - $lb_table[$lb_enums{'JL'}][$lb_enums{'Inseparable'}] - = $lb_actions{'LB_NOBREAK'}; - $lb_table[$lb_enums{'JV'}][$lb_enums{'Inseparable'}] - = $lb_actions{'LB_NOBREAK'}; - $lb_table[$lb_enums{'JT'}][$lb_enums{'Inseparable'}] - = $lb_actions{'LB_NOBREAK'}; - $lb_table[$lb_enums{'H2'}][$lb_enums{'Inseparable'}] - = $lb_actions{'LB_NOBREAK'}; - $lb_table[$lb_enums{'H3'}][$lb_enums{'Inseparable'}] - = $lb_actions{'LB_NOBREAK'}; - # (JL | JV | JT | H2 | H3) × PO $lb_table[$lb_enums{'JL'}][$lb_enums{'Postfix_Numeric'}] = $lb_actions{'LB_NOBREAK'}; diff --git a/uni_keywords.h b/uni_keywords.h index 51c9fc134b..e3af0bb890 100644 --- a/uni_keywords.h +++ b/uni_keywords.h @@ -10,176 +10,179 @@ #define MPH_VALt I16 /* -rows: 7264 -seed: 1348825708 -full length of keys: 101931 -blob length: 10351 -ref length: 58112 -data size: 68463 (%67.17) +rows: 7416 +seed: 1348825710 +full length of keys: 104113 +blob length: 10571 +ref length: 59328 +data size: 69899 (%67.14) */ STATIC const unsigned char mph_blob[] = - "unifiedcanadianaboriginalsyllabicsextendedcjkcompatibilityideogra" - "phssupplementarabicmathematicalalphabeticsymbolscombiningdiacriti" - "calmarksforsymbolscombiningdiacriticalmarkssupplementmiscellaneou" - "ssymbolsandpictographscombiningdiacriticalmarksextendedmiscellane" - "ousmathematicalsymbolsamiscellaneousmathematicalsymbolsbsupplemen" - "talmathematicaloperatorssupplementalsymbolsandpictographsegyptian" - "hieroglyphformatcontrolsideographicdescriptioncharactersideograph" - "icsymbolsandpunctuationmathematicalalphanumericsymbolscjkunifiedi" - "deographsextensionacjkunifiedideographsextensionbcjkunifiedideogr" - "aphsextensionccjkunifiedideographsextensiondcjkunifiedideographse" - "xtensionecjkunifiedideographsextensionfcjkunifiedideographsextens" - "iongcuneiformnumbersandpunctuationenclosedalphanumericsupplements" - "ymbolsandpictographsextendedaenclosedideographicsupplementmiscell" - 
"aneoussymbolsandarrowsphoneticextensionssupplementsupplementarypr" - "ivateuseareaasupplementaryprivateuseareabvariationselectorssupple" - "mentalphabeticpresentationformsancientgreekmusicalnotationenclose" - "dcjklettersandmonthsopticalcharacterrecognitionprependedconcatena" - "tionmark=changeswhennfkccasefolded=conditionaljapanesestarterdefa" - "ultignorablecodepoint=halfwidthandfullwidthformskatakanaphonetice" - "xtensionsconsonantinitialpostfixedfullcompositionexclusion=supers" - "criptsandsubscriptssymbolsandpictographsextasymbolsforlegacycompu" - "tingarabicpresentationformsaarabicpresentationformsbcanonicalcomb" - "iningclass=cjksymbolsandpunctuationcombiningmarksforsymbolsconson" - "antsucceedingrephahighprivateusesurrogatesindicpositionalcategory" - "=supsymbolsandpictographsbyzantinemusicalsymbolsconsonantprecedin" - "grephageometricshapesextendedhangulcompatibilityjamolatinextended" - "additionalshorthandformatcontrolssupplementalpunctuationbidipaire" - "dbrackettype=changeswhencasefolded=changeswhencasemapped=changesw" - "henlowercased=changeswhentitlecased=changeswhenuppercased=cjkcomp" - "atideographssupcommonindicnumberformsdiacriticalsforsymbolsearlyd" - "ynasticcuneiformindicsyllabiccategory=logicalorderexception=misce" - "llaneoustechnicalnoncharactercodepoint=spacingmodifierletterstran" - "sportandmapsymbolscjkcompatibilityformscjkradicalssupplementcyril" - "licsupplementaryextendedpictographic=graphemeclusterbreak=hanifir" - "ohingyakinnayainscriptionalparthianmeeteimayekextensionspopdirect" - "ionalisolatesinhalaarchaicnumbersyijinghexagramsymbolsanatolianhi" - "eroglyphsconnectorpunctuationconsonantplaceholderconsonantwithsta" - "ckerglagoliticsupplementinscriptionalpahlavilefttorightembeddingn" - "yiakengpuachuehmongpopdirectionalformatrighttoleftembeddingtermin" - "alpunctuation=topandbottomandrightverticalorientation=ancientgree" - "knumbersbrahmijoiningnumberburushaskiyehbarreeconsonantheadletter" - 
"countingrodnumeralsegyptianhieroglyphsenclosedalphanumsuphangulja" - "moextendedahanguljamoextendedbhangulsyllabletype=idstrinaryoperat" - "or=lefttorightoverridemeroitichieroglyphsmodifiertonelettersmongo" - "liansupplementottomansiyaqnumbersrighttoleftoverridesundanesesupp" - "lementsupplementalarrowsasupplementalarrowsbsupplementalarrowscto" - "pandbottomandleftattachedaboverightcherokeesupplementcombininghal" - "fmarksconsonantsubjoinedcopticepactnumbersdecompositiontype=devan" - "agariextendedemojimodifierbase=emojipresentation=ethiopicsuppleme" - "nteuropeanterminatorfirststrongisolategeneralpunctuationgeorgians" - "upplementidsbinaryoperator=initialpunctuationlatinextadditionalle" - "fttorightisolateornamentaldingbatsparagraphseparatorpatternwhites" - "pace=regionalindicator=righttoleftisolateruminumeralsymbolssmallk" - "anaextensiontaixuanjingsymbolstopandleftandrighttransformedrotate" - "dtransformeduprightvariationselector=alchemicalsymbolsattachedbel" - "owleftcanadiansyllabicscaucasianalbanianconsonantprefixedcyrillic" - "extendedacyrillicextendedbcyrillicextendedcethiopicextendedaeurop" - "eanseparatoridentifierstatus=indicsiyaqnumberskhitansmallscriptle" - "tterlikesymbolsmanichaeandhamedhmanichaeanhundredmanichaeanthamed" - "hscriptextensions=sentenceterminal=smallformvariantssuttonsignwri" - "tingunifiedideograph=arabicsupplementbopomofoextendedcantillation" - "markcloseparenthesisclosepunctuationcypriotsyllabaryfinalpunctuat" - "iongeneralcategory=georgianextendedhalfandfullformshanifirohingya" - "pahighpusurrogatesinvisiblestackerlatin1supplementlinearbideogram" - "slinearbsyllabarymanichaeandalethmanichaeanlamedhmanichaeansamekh" - "manichaeantwentymiscmathsymbolsamiscmathsymbolsbmyanmarextendedam" - "yanmarextendedbotherpunctuationsegmentseparatorsupmathoperatorssy" - "llablemodifiersyriacsupplementtangutcomponentstangutsupplementvow" - "elindependentarabicextendedabamumsupplementboundaryneutralbraille" - 
"patternscommonseparatorconsonantkillerconsonantmedialcontingentbr" - "eakcontrolpicturescurrencysymbolsdashpunctuationdiacriticalsextdi" - "acriticalssupeastasianwidth=emojicomponent=graphemeextend=hanguls" - "yllablesidentifiertype=imperialaramaiclowercaselettermanichaeanal" - "ephmanichaeangimelmanichaeansadhemanichaeanzayinmeroiticcursivemi" - "scpictographsmodifyingletternfkcquickcheck=nfkdquickcheck=oldnort" - "harabianoldsoutharabianopenpunctuationregistershiftertamilsupplem" - "enttitlecaseletteruppercaselettervedicextensionsvisualorderleftza" - "nabazarsquareancientsymbolsasciihexdigit=carriagereturncaseignora" - "ble=cjkcompatformscomplexcontextconsonantfinalemojimodifier=europ" - "eannumbergeminationmarkgreekandcoptichamzaonhehgoalhighsurrogates" - "kanasupplementkangxiradicalslatinextendedblatinextendedclatinexte" - "ndeddlatinextendedelisusupplementmandatorybreakmanichaeanayinmani" - "chaeanbethmanichaeanfivemanichaeanhethmanichaeankaphmanichaeanqop" - "hmanichaeanreshmanichaeantethmanichaeanyodhmodifiersymbolnfcquick" - "check=nfdquickcheck=nojoininggroupnonspacingmarkpatternsyntax=pho" - "neticextsuppostfixnumericpsalterpahlaviquotationmark=sentencebrea" - "k=spaceseparatorsuppunctuationtehmarbutagoalvoweldependent1000000" - "000000aegeannumbersbidimirrored=blockelementsconsonantdeaddecimal" - "numberenclosingmarkgraphemebase=greekextendediotasubscriptipaexte" - "nsionsjoininggroup=kanaextendedalineseparatorlowsurrogatesmalayal" - "amlllamalayalamnnnamanichaeanmemmanichaeannunmanichaeanonemanicha" - "eantawmanichaeantenmanichaeanwawmayannumeralsmisctechnicalnotappl" - "icablenumericvalue=prefixnumericverticalformsalphabeticpfarabicle" - "tterarabicnumberbidicontrol=breaksymbolschesssymbolscyrillicextac" - "yrillicextbcyrillicextcethiopicextaextendnumletfinalsemkathglueaf" - "terzwjgunjalagondihebrewletterideographic=infixnumericjoincontrol" - "=joiningtype=khmersymbolsletternumbermahjongtilesmalayalambhamala" - 
"yalamllamalayalamngamalayalamnnamalayalamnyamalayalamssamalayalam" - "ttamanichaeanpemasaramgondimathalphanummendekikakuinoncanonicalno" - "tcharacternotreorderednumberjoinernumerictype=oldhungarianotherne" - "utralphaistosdiscplayingcardsrightjoiningtrailingjamoxidcontinue=" - "africannoonalphabetic=breakbeforecasedletterdeprecated=dominotile" - "sdoubleabovedoublebelowdoublequotedualjoiningexclamationinseparab" - "leinseperablejoincausingkanavoicingkatakanaextleadingjamoleftjoin" - "inglvtsyllablemalayalamjamalayalamramedefaidrinmiscsymbolsmyanmar" - "extamyanmarextbnandinagariotherletterothernumberothersymbolpahawh" - "hmongrecommendedrohingyayehsinglequotesoftdotted=sorasompengstrai" - "ghtwawsuperandsubsylotinagritopandrighttransparentuncommonuseyehw" - "ithtailyisyllablesafricanfehafricanqafarabicextabasiclatinbelowri" - "ghtbidiclass=boxdrawingbreakafterchorasmiancjkstrokescompatjamoda" - "lathrishdiacritic=divesakuruhanreadingkharoshthiknottedhehlimited" - "uselinebreak=lowercase=lvsyllablemiscarrowsnonjoiningnonstarterol" - "dpersianoldsogdianoverstruckphoenicianpresentin=purekillerrestric" - "tedreversedpesaurashtrasmallformssuparrowsasuparrowsbsuparrowscun" - "assigneduppercase=warangcitiwordbreak=wordjoineryiradicals-5.00e-" - "01aboveleftambiguousarabicpfaarabicpfbbhaiksukibreakbothemoticons" - "extender=inclusioninheritedkhudawadilatinextblatinextclatinextdmi" - "dlettermidnumletnabataeannewtailuenonjoinerolditalicoldpermicoldt" - "urkicpalmyrenepaucinhausamaritanscontinuesyriacwawvoweljamowsegsp" - "acexidstart=1.00e-011.11e-011.25e-011.25e-021.43e-011.50e+001.50e" - "-011.56e-021.67e-011.88e-012.00e-012.50e+002.50e-012.50e-02200000" - "003.12e-023.13e-023.13e-033.33e-013.50e+003.75e-013.75e-024.00e-0" - "14.17e-014.50e+004.69e-025.00e-025.50e+005.83e-016.00e-016.25e-01" - "6.25e-026.25e-036.50e+006.67e-017.50e+007.50e-018.00e-018.33e-018" - ".33e-028.50e+008.75e-019.17e-01armenianavagrahabalinesebassavahbu" - 
"gineseduployanebasegazextpict=farsiyehfractiongujaratigurmukhihir" - "aganaisolatedjamoextajamoextbjavanesekanaextalinefeedmahajaninext" - "lineobsoleteradical=specialsswashkaftagbanwatifinaghtonemarkugari" - "ticaletterallowedavestanbengalicjkextacjkextbcjkextccjkextdcjkext" - "ecjkextfcjkextgcompex=deseretelbasanelymaicgranthagrbase=hanunooh" - "yphen=kannadakayahlilinearamakasarmandaicmarchenmultaninewlinenfk" - "cqc=nfkdqc=noblocknobreaknotnfkcolchikioletterosmanyaoverlaypatsy" - "n=phagspascript=sharadashaviansiddhamsoyombosuppuaasuppuabtagalog" - "taithamtaiviettibetantirhutaucasextunknownvisargawspace=zwspace21" - "6000300000400000432000500000600000700000800000900000alpha=bidic=b" - "idim=block=carianccc103ccc107ccc118ccc122ccc129ccc130ccc132ccc133" - "chakmacirclecwkcf=ecomp=emoji=epres=gothicgrext=hatranjoinc=kaith" - "ikanbunkhojkilamadhlepchalower=lycianlydiannarrownchar=nfcqc=nfdq" - "c=notxidpatws=qmark=rejangsterm=teluguthaanauideo=upper=viramawan" - "choyezidiyudhhe1/1601/32011/12adlamahex=alaphatermbatakbindubuhid" - "ccc14ccc15ccc16ccc17ccc18ccc19ccc20ccc21ccc22ccc23ccc24ccc25ccc26" - "ccc27ccc28ccc29ccc30ccc31ccc32ccc33ccc34ccc35ccc36ccc84ccc91cntrl" - "cwcf=cwcm=dash=dograemod=falseidsb=idst=inpc=insc=khaphlimbumath=" - "maybenuktanushuoghamoriyaosagerunictailetakrivssupxidc=xids=zhain" - "-1/21/101/201/401/641/8010.011.011/212.113.013/215/217/23/163/203" - "/643/805/127/12adlmage=aghbahomalefarmiarmnataratblavstbatkbhksbl" - "k=bpt=buhdcakmcansccc=chrscprtcwl=cwt=cwu=cyrldep=dia=diakdsrtfon" - "tgcb=gonggonmgrekgujrguruhanohluwhmnghmnphst=kalikhmrkitskndakthi" - "lanalaoolatnlinalinbloe=medfmeemmercmiaomlymmroomteimymrnarbnbatn" - "ewankoonshuogamolckorkhoryaosgepcm=phlpphnxplrdprtiqaacqaaiqaphrj" - "ngrohgrunrsamrsarbscx=seensgnwshawshinshrdsogosyrctagstaletalutam" - "ltavttfngtglgthaitibttruev100v110v120v121v130vaiiwchowidexpeoxsux" - "yiiizainzanbzinhzyyyzzzz1/51/71/92/32/520221421822222422622823023" - 
"22332342403.23/43/54/55.15.25/65/86.16.37.07/89.09/2bc=behci=di=d" - "t=ea=ebgfsigafgc=jg=jt=lb=lrelrilromimnv=ocrpdfrehri=sd=smlsqrtah" - "v20v21v30v31v32v40v41v50v51v52v60v61v62v63v70v80v90vo=vs=wb=yes38" - "39444546474849b2bkh2h3jljvkvl&l_vrxxzlzpzs_perl_problematic_local" - "e_foldeds_is_in_multi_char_fold_perl_folds_to_perl_charname_begin" - "any_foldsquotemetaisxposixisposixblankprintishorizisxperlisperlis" - "spaceisvertisuni"; -/* mph_blob length: 10351 */ + "unifiedcanadianaboriginalsyllabicsextendedacjkcompatibilityideogr" + "aphssupplementarabicmathematicalalphabeticsymbolscombiningdiacrit" + "icalmarksforsymbolscombiningdiacriticalmarkssupplementmiscellaneo" + "ussymbolsandpictographscombiningdiacriticalmarksextendedmiscellan" + "eousmathematicalsymbolsamiscellaneousmathematicalsymbolsbsuppleme" + "ntalmathematicaloperatorssupplementalsymbolsandpictographsegyptia" + "nhieroglyphformatcontrolsideographicdescriptioncharactersideograp" + "hicsymbolsandpunctuationmathematicalalphanumericsymbolscjkunified" + "ideographsextensionacjkunifiedideographsextensionbcjkunifiedideog" + "raphsextensionccjkunifiedideographsextensiondcjkunifiedideographs" + "extensionecjkunifiedideographsextensionfcjkunifiedideographsexten" + "siongcuneiformnumbersandpunctuationenclosedalphanumericsupplement" + "symbolsandpictographsextendedaenclosedideographicsupplementmiscel" + "laneoussymbolsandarrowsphoneticextensionssupplementsupplementaryp" + "rivateuseareaasupplementaryprivateuseareabvariationselectorssuppl" + "ementalphabeticpresentationformsancientgreekmusicalnotationenclos" + "edcjklettersandmonthsopticalcharacterrecognitionprependedconcaten" + "ationmark=changeswhennfkccasefolded=conditionaljapanesestarterdef" + "aultignorablecodepoint=halfwidthandfullwidthformskatakanaphonetic" + "extensionsconsonantinitialpostfixedfullcompositionexclusion=super" + "scriptsandsubscriptssymbolsandpictographsextasymbolsforlegacycomp" + 
"utingarabicpresentationformsaarabicpresentationformsbcanonicalcom" + "biningclass=cjksymbolsandpunctuationcombiningmarksforsymbolsconso" + "nantsucceedingrephahighprivateusesurrogatesindicpositionalcategor" + "y=supsymbolsandpictographsbyzantinemusicalsymbolsconsonantprecedi" + "ngrephageometricshapesextendedhangulcompatibilityjamolatinextende" + "dadditionalshorthandformatcontrolssupplementalpunctuationznamenny" + "musicalnotationbidipairedbrackettype=changeswhencasefolded=change" + "swhencasemapped=changeswhenlowercased=changeswhentitlecased=chang" + "eswhenuppercased=cjkcompatideographssupcommonindicnumberformsdiac" + "riticalsforsymbolsearlydynasticcuneiformindicsyllabiccategory=log" + "icalorderexception=miscellaneoustechnicalnoncharactercodepoint=sp" + "acingmodifierletterstransportandmapsymbolscjkcompatibilityformscj" + "kradicalssupplementcyrillicsupplementaryextendedpictographic=grap" + "hemeclusterbreak=hanifirohingyakinnayainscriptionalparthianmeetei" + "mayekextensionspopdirectionalisolatesinhalaarchaicnumbersyijinghe" + "xagramsymbolsanatolianhieroglyphsconnectorpunctuationconsonantpla" + "ceholderconsonantwithstackerglagoliticsupplementinscriptionalpahl" + "avilefttorightembeddingnyiakengpuachuehmongpopdirectionalformatri" + "ghttoleftembeddingterminalpunctuation=topandbottomandrightvertica" + "lorientation=ancientgreeknumbersbrahmijoiningnumberburushaskiyehb" + "arreeconsonantheadlettercountingrodnumeralsegyptianhieroglyphsenc" + "losedalphanumsuphanguljamoextendedahanguljamoextendedbhangulsylla" + "bletype=idstrinaryoperator=lefttorightoverridemeroitichieroglyphs" + "modifiertonelettersmongoliansupplementottomansiyaqnumbersrighttol" + "eftoverridesundanesesupplementsupplementalarrowsasupplementalarro" + "wsbsupplementalarrowsctopandbottomandleftattachedaboverightcherok" + "eesupplementcombininghalfmarksconsonantsubjoinedcopticepactnumber" + "sdecompositiontype=devanagariextendedemojimodifierbase=emojiprese" + 
"ntation=ethiopicsupplementeuropeanterminatorfirststrongisolategen" + "eralpunctuationgeorgiansupplementidsbinaryoperator=initialpunctua" + "tionlatinextadditionallefttorightisolateornamentaldingbatsparagra" + "phseparatorpatternwhitespace=regionalindicator=righttoleftisolate" + "ruminumeralsymbolssmallkanaextensiontaixuanjingsymbolstopandlefta" + "ndrighttransformedrotatedtransformeduprightvariationselector=alch" + "emicalsymbolsattachedbelowleftcanadiansyllabicscaucasianalbanianc" + "onsonantprefixedcyrillicextendedacyrillicextendedbcyrillicextende" + "dcethiopicextendedaethiopicextendedbeuropeanseparatoridentifierst" + "atus=indicsiyaqnumberskhitansmallscriptletterlikesymbolsmanichaea" + "ndhamedhmanichaeanhundredmanichaeanthamedhscriptextensions=senten" + "ceterminal=smallformvariantssuttonsignwritingunifiedideograph=ara" + "bicsupplementbopomofoextendedcantillationmarkcloseparenthesisclos" + "epunctuationcypriotsyllabaryfinalpunctuationgeneralcategory=georg" + "ianextendedhalfandfullformshanifirohingyapahighpusurrogatesinvisi" + "blestackerlatin1supplementlinearbideogramslinearbsyllabarymanicha" + "eandalethmanichaeanlamedhmanichaeansamekhmanichaeantwentymiscmath" + "symbolsamiscmathsymbolsbmyanmarextendedamyanmarextendedbotherpunc" + "tuationsegmentseparatorsupmathoperatorssyllablemodifiersyriacsupp" + "lementtangutcomponentstangutsupplementvowelindependentarabicexten" + "dedaarabicextendedbbamumsupplementboundaryneutralbraillepatternsc" + "ommonseparatorconsonantkillerconsonantmedialcontingentbreakcontro" + "lpicturescurrencysymbolsdashpunctuationdiacriticalsextdiacritical" + "ssupeastasianwidth=emojicomponent=graphemeextend=hangulsyllablesi" + "dentifiertype=imperialaramaiclowercaselettermanichaeanalephmanich" + "aeangimelmanichaeansadhemanichaeanzayinmeroiticcursivemiscpictogr" + "aphsmodifyingletternfkcquickcheck=nfkdquickcheck=oldnortharabiano" + "ldsoutharabianopenpunctuationregistershiftertamilsupplementtitlec" + 
"aseletteruppercaselettervedicextensionsvisualorderleftzanabazarsq" + "uareancientsymbolsasciihexdigit=carriagereturncaseignorable=cjkco" + "mpatformscomplexcontextconsonantfinalemojimodifier=europeannumber" + "geminationmarkgreekandcoptichamzaonhehgoalhighsurrogateskanasuppl" + "ementkangxiradicalslatinextendedblatinextendedclatinextendeddlati" + "nextendedelatinextendedflatinextendedglisusupplementmandatorybrea" + "kmanichaeanayinmanichaeanbethmanichaeanfivemanichaeanhethmanichae" + "ankaphmanichaeanqophmanichaeanreshmanichaeantethmanichaeanyodhmod" + "ifiersymbolnfcquickcheck=nfdquickcheck=nojoininggroupnonspacingma" + "rkpatternsyntax=phoneticextsuppostfixnumericpsalterpahlaviquotati" + "onmark=sentencebreak=spaceseparatorsuppunctuationtehmarbutagoalvo" + "weldependent1000000000000aegeannumbersbidimirrored=blockelementsc" + "onsonantdeaddecimalnumberenclosingmarkgraphemebase=greekextendedi" + "otasubscriptipaextensionsjoininggroup=kanaextendedakanaextendedbl" + "ineseparatorlowsurrogatesmalayalamlllamalayalamnnnamanichaeanmemm" + "anichaeannunmanichaeanonemanichaeantawmanichaeantenmanichaeanwawm" + "ayannumeralsmisctechnicalnotapplicablenumericvalue=prefixnumericv" + "erticalformsalphabeticpfarabicletterarabicnumberbidicontrol=break" + "symbolschesssymbolscyrillicextacyrillicextbcyrillicextcethiopicex" + "taethiopicextbextendnumletfinalsemkathglueafterzwjgunjalagondiheb" + "rewletterideographic=infixnumericjoincontrol=joiningtype=khmersym" + "bolsletternumbermahjongtilesmalayalambhamalayalamllamalayalamngam" + "alayalamnnamalayalamnyamalayalamssamalayalamttamanichaeanpemasara" + "mgondimathalphanummendekikakuinoncanonicalnotcharacternotreordere" + "dnumberjoinernumerictype=oldhungarianotherneutralphaistosdiscplay" + "ingcardsrightjoiningtrailingjamoverticaltailxidcontinue=africanno" + "onalphabetic=breakbeforecasedlettercyprominoandeprecated=dominoti" + "lesdoubleabovedoublebelowdoublequotedualjoiningexclamationinsepar" + 
"ableinseperablejoincausingkanavoicingkatakanaextleadingjamoleftjo" + "ininglvtsyllablemalayalamjamalayalamramedefaidrinmiscsymbolsmyanm" + "arextamyanmarextbnandinagariotherletterothernumberothersymbolpaha" + "whhmongrecommendedrohingyayehsinglequotesoftdotted=sorasompengstr" + "aightwawsuperandsubsylotinagritopandrighttransparentuncommonuseye" + "hwithtailyisyllablesafricanfehafricanqafarabicextaarabicextbbasic" + "latinbelowrightbidiclass=boxdrawingbreakafterchorasmiancjkstrokes" + "compatjamodalathrishdiacritic=divesakuruhanreadingkharoshthiknott" + "edhehlimiteduselinebreak=lowercase=lvsyllablemiscarrowsnonjoining" + "nonstarteroldpersianoldsogdianoverstruckphoenicianpresentin=purek" + "illerrestrictedreversedpesaurashtrasmallformssuparrowsasuparrowsb" + "suparrowscunassigneduppercase=warangcitiwordbreak=wordjoineryirad" + "icals-5.00e-01aboveleftambiguousarabicpfaarabicpfbbhaiksukibreakb" + "othemoticonsextender=inclusioninheritedkhudawadilatinextblatinext" + "clatinextdlatinextflatinextgmidlettermidnumletnabataeannewtailuen" + "onjoinerolditalicoldpermicoldturkicolduyghurpalmyrenepaucinhausam" + "aritanscontinuesyriacwawvoweljamowsegspacexidstart=1.00e-011.11e-" + "011.25e-011.25e-021.43e-011.50e+001.50e-011.56e-021.67e-011.88e-0" + "12.00e-012.50e+002.50e-012.50e-02200000003.12e-023.13e-023.13e-03" + "3.33e-013.50e+003.75e-013.75e-024.00e-014.17e-014.50e+004.69e-025" + ".00e-025.50e+005.83e-016.00e-016.25e-016.25e-026.25e-036.50e+006." 
+ "67e-017.50e+007.50e-018.00e-018.33e-018.33e-028.50e+008.75e-019.1" + "7e-01armenianavagrahabalinesebassavahbugineseduployanebasegazextp" + "ict=farsiyehfractiongujaratigurmukhihiraganaisolatedjamoextajamoe" + "xtbjavanesekanaextakanaextblinefeedmahajaninextlineobsoleteradica" + "l=specialsswashkaftagbanwatifinaghtonemarkucasextaugariticvithkuq" + "ialetterallowedavestanbengalicjkextacjkextbcjkextccjkextdcjkextec" + "jkextfcjkextgcompex=deseretelbasanelymaicgranthagrbase=hanunoohyp" + "hen=kannadakayahlilinearamakasarmandaicmarchenmultaninewlinenfkcq" + "c=nfkdqc=noblocknobreaknotnfkcolchikioletterosmanyaoverlaypatsyn=" + "phagspascript=sharadashaviansiddhamsoyombosuppuaasuppuabtagalogta" + "ithamtaivietthinyehtibetantirhutaunknownvisargawspace=zwspace2160" + "00300000400000432000500000600000700000800000900000alpha=bidic=bid" + "im=block=carianccc103ccc107ccc118ccc122ccc129ccc130ccc132ccc133ch" + "akmacirclecwkcf=ecomp=emoji=epres=gothicgrext=hatranjoinc=kaithik" + "anbunkhojkilamadhlepchalower=lycianlydiannarrownchar=nfcqc=nfdqc=" + "notxidpatws=qmark=rejangsterm=tangsateluguthaanauideo=upper=viram" + "awanchoyezidiyudhhe1/1601/32011/12adlamahex=alaphatermbatakbindub" + "uhidccc14ccc15ccc16ccc17ccc18ccc19ccc20ccc21ccc22ccc23ccc24ccc25c" + "cc26ccc27ccc28ccc29ccc30ccc31ccc32ccc33ccc34ccc35ccc36ccc84ccc91c" + "ntrlcwcf=cwcm=dash=dograemod=falseidsb=idst=inpc=insc=khaphlimbum" + "ath=maybenuktanushuoghamoriyaosagerunictailetakrivssupxidc=xids=z" + "hain-1/21/101/201/401/641/8010.011.011/212.113.013/214.015/217/23" + "/163/203/643/805/127/12adlmage=aghbahomalefarmiarmnataratblavstba" + "tkbhksblk=bpt=buhdcakmcansccc=chrscpmncprtcwl=cwt=cwu=cyrldep=dia" + "=diakdsrtfontgcb=gonggonmgrekgujrguruhanohluwhmnghmnphst=kalikhmr" + "kitskndakthilanalaoolatnlinalinbloe=medfmeemmercmiaomlymmroomteim" + "ymrnarbnbatnewankoonshuogamolckorkhoryaosgeougrpcm=phlpphnxplrdpr" + "tiqaacqaaiqaphrjngrohgrunrsamrsarbscx=seensgnwshawshinshrdsogosyr" + 
"ctagstaletalutamltavttfngtglgthaitibttnsatototruev100v110v120v121" + "v130v140vaiiwchowidexpeoxsuxyiiizainzanbzinhzyyyzzzz1/51/71/92/32" + "/52022182222242262282302322332342403.23/43/54/55.15.25/65/86.16.3" + "7.07/89.09/2bc=behci=di=dt=ea=ebgfsigafgc=jg=jt=lb=lrelrilromimnv" + "=ocrpdfrehri=sd=smlsqrtahv20v21v30v31v32v40v41v50v51v52v60v61v62v" + "63v70v80v90vo=vs=wb=yes3839444546474849b2bkh2h3jljvkvl&l_vrxxzlzp" + "zs_perl_problematic_locale_foldeds_is_in_multi_char_fold_perl_fol" + "ds_to_perl_charname_beginany_foldsquotemetaisxposixisposixblankpr" + "intishorizisxperlisperlisspaceisvertisuni"; +/* mph_blob length: 10571 */ struct mph_struct { U16 seed2; @@ -191,7277 +194,7429 @@ struct mph_struct { }; #define MPH_RSHIFT 8 -#define MPH_BUCKETS 7264 +#define MPH_BUCKETS 7416 -STATIC const U32 MPH_SEED1 = 0x5065726c; +STATIC const U32 MPH_SEED1 = 0x5065726e; STATIC const U32 MPH_FNV_CONST = 0x01000193; /* The comments give the input key for the row it is in */ STATIC const struct mph_struct mph_table[MPH_BUCKETS] = { - { 2, 9768, 9632, 4, 4, UNI_LINA } /* scx=lina */, - { 2, 5791, 6572, 13, 4, UNI_JG__NOON } /* joininggroup=noon */, - { 1, 7325, 9384, 3, 4, UNI_IN__10 } /* in=10.0 */, - { 2, 9488, 7188, 4, 10, UNI_INKHAROSHTHI } /* blk=kharoshthi */, - { 1, 1417, 23, 24, 2, UNI_CCC__AL } /* canonicalcombiningclass=al */, - { 0, 184, 2666, 3, 10, UNI_COUNTINGROD } /* iscountingrod */, - { 0, 1654, 0, 23, 0, UNI_COMPATJAMO } /* hangulcompatibilityjamo */, - { 8, 7158, 9836, 10, 4, UNI_DIA } /* diacritic=true */, - { 2, 8780, 8373, 7, 6, UNI_CJKEXTD } /* block=cjkextd */, - { 1, 5986, 9973, 13, 3, UNI_NV__5_SLASH_6 } /* numericvalue=5/6 */, - { 1, 10027, 6323, 3, 5, UNI_JG__GAMAL } /* jg=gamal */, - { 0, 8900, 0, 6, 0, UNI_KTHI } /* kaithi */, - { 6, 1537, 2455, 24, 5, UNI_INPC__RIGHT } /* indicpositionalcategory=right */, - { 0, 7398, 0, 10, 0, UNI_SUPARROWSC } /* suparrowsc */, - { 1, 9002, 0, 6, 0, UNI_TELU } /* telugu */, - { 4, 10024, 9503, 3, 2, UNI_MC } /* 
gc=mc */, - { 0, 7218, 18, 10, 2, UNI_RI } /* linebreak=ri */, - { 0, 1856, 0, 21, 0, UNI_CWU } /* changeswhenuppercased */, - { 1, 2779, 0, 3, 0, UNI_IDS } /* ids */, - { 8, 10048, 9061, 3, 4, UNI_NV__1_SLASH_12 } /* nv=1/12 */, - { 0, 10006, 10135, 3, 3, UNI_DI } /* di=yes */, - { 0, 8780, 5947, 6, 13, UNI_MAYANNUMERALS } /* block=mayannumerals */, - { 1, 9444, 10108, 4, 3, UNI_AGE__6_DOT_1 } /* age=v61 */, - { 0, 5186, 0, 14, 0, UNI_HIGHSURROGATES } /* highsurrogates */, - { 0, 10333, 1528, 3, 8, UNI__PERL_SURROGATE } /* issurrogate */, - { 1, 7739, 3, 8, 1, -UNI_IDS } /* idstart=f */, - { 0, 184, 6840, 2, 11, UNI_NAND } /* isnandinagari */, - { 0, 446, 0, 32, 0, UNI_IDEOGRAPHICSYMBOLS } /* ideographicsymbolsandpunctuation */, - { 4, 9448, 0, 4, 0, UNI_AGHB } /* aghb */, - { 3, 3836, 9712, 17, 4, UNI_OSGE } /* scriptextensions=osge */, - { 0, 9270, 7685, 3, 8, UNI_INPAUCINHAU } /* inpaucinhau */, - { 0, 10048, 9055, 3, 3, UNI_NV__1_SLASH_3 } /* nv=1/3 */, - { 7, 1834, 10135, 22, 3, UNI_CWT } /* changeswhentitlecased=yes */, - { 1, 9768, 8414, 4, 7, UNI_ELBA } /* scx=elbasan */, - { 4, 8780, 1673, 6, 4, UNI_JAMO } /* block=jamo */, - { 0, 8688, 5662, 3, 12, UNI_AEGEANNUMBERS } /* isaegeannumbers */, - { 0, 1552, 5040, 9, 5, UNI_XPOSIXDIGIT } /* category=digit */, - { 4, 10296, 25, 3, 1, UNI_PS } /* isps */, - { 0, 1536, 0, 4, 0, UNI_SIND } /* sind */, - { 0, 1417, 8807, 24, 3, UNI_CCC__118 } /* canonicalcombiningclass=118 */, - { 5, 8774, 9836, 6, 4, UNI_BIDIM } /* bidim=true */, - { 2, 9488, 283, 4, 33, UNI_MISCMATHSYMBOLSB } /* blk=miscellaneousmathematicalsymbolsb */, - { 0, 1823, 0, 9, 0, UNI_XPOSIXLOWER } /* lowercase */, - { 1, 184, 8924, 2, 4, UNI_LEPC } /* islepc */, - { 0, 9277, 8243, 3, 8, UNI_SC__MAHJ } /* sc=mahajani */, - { 1, 9277, 9315, 3, 5, UNI_SC__ORYA } /* sc=oriya */, - { 3, 9768, 8936, 4, 6, UNI_LYCI } /* scx=lycian */, - { 1, 5270, 0, 14, 0, UNI_LATINEXTE } /* latinextendede */, - { 1, 3836, 4448, 17, 4, UNI_BAMU } /* scriptextensions=bamu 
*/, - { 0, 8267, 26, 8, 1, UNI_RADICAL } /* radical=y */, - { 0, 32, 0, 2, 0, UNI__PERL_SURROGATE } /* cs */, - { 16, 1417, 3564, 24, 13, UNI_CCC__202 } /* canonicalcombiningclass=attachedbelow */, - { 0, 10024, 4943, 3, 15, UNI_TITLE } /* gc=titlecaseletter */, - { 0, 2182, 406, 21, 7, UNI_GCB__CN } /* graphemeclusterbreak=control */, - { 1, 6241, 24, 12, 1, UNI_JT__L } /* joiningtype=l */, - { 0, 10048, 9973, 3, 3, UNI_NV__5_SLASH_6 } /* nv=5/6 */, - { 1, 21, 7585, 2, 9, UNI_LATINEXTC } /* inlatinextc */, - { 0, 3836, 9864, 17, 4, UNI_WCHO } /* scriptextensions=wcho */, - { 1, 3367, 26, 18, 1, UNI__PERL_PATWS } /* patternwhitespace=y */, - { 0, 8780, 2469, 6, 20, UNI_INNYIAKENGPUACHUEHMONG } /* block=nyiakengpuachuehmong */, - { 1, 8780, 749, 6, 21, UNI_ENCLOSEDALPHANUM } /* block=enclosedalphanumerics */, - { 2, 184, 9576, 2, 4, UNI_GURU } /* isguru */, - { 0, 10333, 9793, 3, 3, UNI_SOGO } /* issogo */, - { 0, 10048, 7771, 3, 8, UNI_NV__1_SLASH_80 } /* nv=1.25e-02 */, - { 1, 9444, 9991, 4, 3, UNI_AGE__9 } /* age=9.0 */, - { 0, 9488, 567, 4, 2, UNI_NB } /* blk=nb */, - { 0, 9488, 1922, 4, 12, UNI_DIACRITICALS } /* blk=diacriticals */, - { 13, 1537, 2555, 24, 6, UNI_INPC__BOTTOM } /* indicpositionalcategory=bottom */, - { 1, 10024, 5497, 3, 11, UNI_MC } /* gc=spacingmark */, - { 3, 2784, 80, 4, 8, UNI_ARABICMATH } /* inarabicmath */, - { 0, 5791, 5620, 13, 14, UNI_JG__HAMZAONHEHGOAL } /* joininggroup=tehmarbutagoal */, - { 32, 4791, 1595, 3, 13, UNI_MUSIC } /* inmusicalsymbols */, - { 0, 8589, 2329, 7, 20, UNI_HLUW } /* script=anatolianhieroglyphs */, - { 0, 7088, 3374, 10, 10, UNI_BC__WS } /* bidiclass=whitespace */, - { 0, 184, 7168, 2, 10, UNI_DIAK } /* isdivesakuru */, - { 0, 184, 9636, 2, 4, UNI_LINB } /* islinb */, - { 0, 9488, 7684, 4, 9, UNI_INPAUCINHAU } /* blk=paucinhau */, - { 0, 6939, 0, 11, 0, UNI_SORA } /* sorasompeng */, - { 3, 9768, 8131, 4, 8, UNI_DUPL } /* scx=duployan */, - { 1, 9488, 629, 4, 30, UNI_CJKEXTE } /* 
blk=cjkunifiedideographsextensione */, - { 8, 9488, 2098, 4, 21, UNI_CJKCOMPATFORMS } /* blk=cjkcompatibilityforms */, - { 1, 10290, 96, 6, 5, UNI_XPOSIXALPHA } /* xposixalpha */, - { 1, 9732, 0, 4, 0, UNI_PRTI } /* prti */, - { 0, 8589, 3241, 7, 8, UNI_SC__GEOR } /* script=georgian */, - { 1, 5032, 0, 14, 0, UNI_ahex_values_index } /* asciihexdigit= */, - { 1, 3529, 36, 18, 1, UNI_VS } /* variationselector=t */, - { 0, 2569, 409, 20, 2, UNI_VO__TR } /* verticalorientation=tr */, - { 3, 2182, 6763, 21, 3, UNI_LB__H3 } /* graphemeclusterbreak=lvt */, - { 1, 9768, 8299, 4, 8, UNI_TFNG } /* scx=tifinagh */, - { 0, 6553, 0, 11, 0, UNI_XIDC } /* xidcontinue */, - { 0, 3836, 4793, 17, 15, UNI_MERC } /* scriptextensions=meroiticcursive */, - { 10, 341, 0, 2, 0, UNI_PE } /* pe */, - { 1, 3097, 8846, 18, 6, UNI_DT__ENC } /* decompositiontype=circle */, - { 2, 4688, 6609, 15, 10, UNI_DEP } /* identifiertype=deprecated */, - { 0, 184, 9231, 3, 3, UNI_CWCF } /* iscwcf */, - { 2, 8780, 6829, 6, 11, UNI_MYANMAREXTB } /* block=myanmarextb */, - { 0, 5986, 7781, 13, 1, UNI_NV__4 } /* numericvalue=4 */, - { 1, 0, 0, 34, 0, UNI_UCAS } /* unifiedcanadianaboriginalsyllabics */, - { 1, 1417, 3007, 24, 18, UNI_CCC__216 } /* canonicalcombiningclass=attachedaboveright */, - { 1, 1966, 9090, 22, 5, UNI_INSC__BINDU } /* indicsyllabiccategory=bindu */, - { 0, 6229, 1025, 12, 2, -UNI_JOINC } /* joincontrol=no */, - { 2, 9997, 2893, 3, 19, UNI_BC__RLO } /* bc=righttoleftoverride */, - { 5, 8780, 149, 7, 34, UNI_DIACRITICALSSUP } /* block=combiningdiacriticalmarkssupplement */, - { 1, 9528, 0, 4, 0, UNI_cwu_values_index } /* cwu= */, - { 0, 9277, 9440, 3, 4, UNI_SC__ADLM } /* sc=adlm */, - { 1, 9488, 9032, 4, 6, UNI_INWANCHO } /* blk=wancho */, - { 7, 10048, 8756, 3, 2, UNI_NV__90 } /* nv=90 */, - { 0, 9277, 9812, 3, 4, UNI_SC__TAML } /* sc=taml */, - { 8, 5986, 8720, 13, 6, UNI_NV__400000 } /* numericvalue=400000 */, - { 1, 10009, 1253, 3, 4, UNI_DT__INIT } /* dt=init */, - { 0, 7218, 866, 10, 
2, UNI_LB__SP } /* linebreak=sp */, - { 3, 9997, 2449, 3, 11, UNI_BC__L } /* bc=lefttoright */, - { 2, 3115, 0, 13, 0, UNI_DEVANAGARIEXT } /* devanagariext */, - { 1, 5791, 3785, 13, 17, UNI_JG__MANICHAEANDHAMEDH } /* joininggroup=manichaeandhamedh */, - { 1, 9508, 7178, 4, 10, UNI_CCC__6 } /* ccc=hanreading */, - { 4, 5986, 8750, 13, 3, UNI_NV__800 } /* numericvalue=800 */, - { 5, 5060, 9255, 14, 5, -UNI_CI } /* caseignorable=false */, - { 2, 184, 6818, 2, 11, UNI_MYANMAREXTA } /* ismyanmarexta */, - { 0, 5037, 1, 9, 1, -UNI_XPOSIXXDIGIT } /* hexdigit=n */, - { 0, 21, 5662, 3, 12, UNI_AEGEANNUMBERS } /* inaegeannumbers */, - { 1, 4898, 0, 15, 0, UNI_PS } /* openpunctuation */, - { 8, 5986, 8714, 13, 4, UNI_NV__3000 } /* numericvalue=3000 */, - { 0, 8589, 9736, 7, 4, UNI_SC__COPT } /* script=qaac */, - { 0, 7088, 10036, 10, 3, UNI_BC__LRE } /* bidiclass=lre */, - { 2, 5564, 9836, 14, 4, UNI_QMARK } /* quotationmark=true */, - { 1, 9277, 9864, 3, 4, UNI_WCHO } /* sc=wcho */, - { 3, 9508, 7978, 4, 2, UNI_CCC__16 } /* ccc=16 */, - { 2, 5564, 26, 14, 1, UNI_QMARK } /* quotationmark=y */, - { 0, 6231, 2120, 3, 20, UNI_CJKRADICALSSUP } /* incjkradicalssupplement */, - { 7, 10048, 8732, 3, 6, UNI_NV__500000 } /* nv=500000 */, - { 1, 3836, 9660, 17, 4, UNI_MLYM } /* scriptextensions=mlym */, - { 0, 1552, 1899, 9, 2, UNI_PC } /* category=pc */, - { 0, 9768, 78, 4, 4, UNI_ARAB } /* scx=arab */, - { 21, 10296, 7676, 3, 8, UNI_PALM } /* ispalmyrene */, - { 0, 27, 0, 2, 0, UNI_LOWERCASELETTER } /* ll */, - { 1, 1823, 0, 5, 0, UNI_XPOSIXLOWER } /* lower */, - { 0, 10027, 6349, 3, 12, UNI_JG__MALAYALAMSSA } /* jg=malayalamssa */, - { 3, 8780, 2203, 6, 14, UNI_INHANIFIROHINGYA } /* block=hanifirohingya */, - { 2, 184, 8219, 2, 4, UNI_JAVA } /* isjava */, - { 0, 9488, 4568, 4, 15, UNI_CURRENCYSYMBOLS } /* blk=currencysymbols */, - { 1, 6420, 1061, 3, 26, UNI_OCR } /* inopticalcharacterrecognition */, - { 2, 5791, 3802, 13, 17, UNI_JG__MANICHAEANHUNDRED } /* 
joininggroup=manichaeanhundred */, - { 16, 1188, 8646, 3, 6, UNI_INTAITHAM } /* intaitham */, - { 9, 1018, 0, 5, 0, UNI_MUSIC } /* music */, - { 0, 9488, 7495, 4, 9, UNI_ARABICPFA } /* blk=arabicpfa */, - { 1, 9260, 0, 5, 0, UNI_idsb_values_index } /* idsb= */, - { 0, 8589, 9700, 7, 4, UNI_OLCK } /* script=olck */, - { 0, 1417, 1756, 24, 2, UNI_CCC__BR } /* canonicalcombiningclass=br */, - { 4, 9270, 472, 3, 2, UNI_PUA } /* inpua */, - { 0, 184, 9652, 2, 4, UNI_MERC } /* ismerc */, - { 4, 1189, 0, 3, 0, UNI_nt_values_index } /* nt= */, - { 8, 9275, 4353, 5, 16, UNI_INSC__SYLLABLEMODIFIER } /* insc=syllablemodifier */, - { 3, 10288, 2779, 3, 3, UNI_XIDS } /* isxids */, - { 1, 184, 0, 4, 0, UNI_CE } /* isce */, - { 3, 8688, 5019, 3, 13, UNI_ANCIENTSYMBOLS } /* isancientsymbols */, - { 1, 9508, 8823, 5, 4, UNI_CCC__13 } /* ccc=ccc13 */, - { 1, 9768, 8219, 4, 8, UNI_JAVA } /* scx=javanese */, - { 2, 8400, 26, 7, 1, UNI_COMPEX } /* compex=y */, - { 1, 10027, 7016, 3, 11, UNI_JG__YEHWITHTAIL } /* jg=yehwithtail */, - { 1, 7155, 34, 3, 2, UNI_XPOSIXXDIGIT } /* ishex */, - { 0, 5986, 7915, 13, 8, UNI_NV__3_SLASH_80 } /* numericvalue=3.75e-02 */, - { 17, 9997, 1, 4, 1, UNI_BC__BN } /* bc=bn */, - { 6, 1188, 2077, 3, 21, UNI_TRANSPORTANDMAP } /* intransportandmapsymbols */, - { 0, 184, 10176, 2, 2, UNI_ZL } /* iszl */, - { 2, 6469, 11, 12, 2, UNI_NT__DI } /* numerictype=di */, - { 8, 10033, 7512, 3, 2, UNI_LB__BB } /* lb=bb */, - { 0, 7325, 9985, 3, 3, UNI_IN__7 } /* in=7.0 */, - { 0, 2224, 0, 21, 0, UNI_PRTI } /* inscriptionalparthian */, - { 7, 9768, 9636, 4, 4, UNI_LINB } /* scx=linb */, - { 1, 8936, 0, 6, 0, UNI_LYCI } /* lycian */, - { 0, 9997, 3313, 3, 18, UNI_BC__LRI } /* bc=lefttorightisolate */, - { 2, 8589, 8421, 7, 4, UNI_ELYM } /* script=elym */, - { 2, 2182, 4305, 21, 5, UNI_GCB__XX } /* graphemeclusterbreak=other */, - { 1, 8780, 8394, 7, 6, UNI_CJKEXTG } /* block=cjkextg */, - { 5, 9864, 0, 4, 0, UNI_WCHO } /* wcho */, - { 0, 9768, 9335, 4, 4, UNI_TAKR } /* 
scx=takr */, - { 0, 1828, 0, 6, 0, UNI_cased_values_index } /* cased= */, - { 2, 184, 4569, 3, 13, UNI_SC } /* iscurrencysymbol */, - { 2, 8780, 2061, 6, 4, UNI_INMODI } /* block=modi */, - { 2, 184, 3241, 2, 4, UNI_GEOR } /* isgeor */, - { 8, 3836, 7651, 17, 4, UNI_ITAL } /* scriptextensions=ital */, - { 0, 184, 62, 2, 5, UNI_XPOSIXGRAPH } /* isgraph */, - { 0, 8589, 1628, 7, 4, UNI_SC__PHAG } /* script=phag */, - { 0, 9014, 1025, 6, 2, -UNI_UIDEO } /* uideo=no */, - { 2, 979, 0, 27, 0, UNI_ALPHABETICPF } /* alphabeticpresentationforms */, - { 0, 8589, 2288, 8, 3, UNI_SC__SINH } /* script=sinh */, - { 2, 8589, 5003, 7, 15, UNI_ZANB } /* script=zanabazarsquare */, - { 4, 9277, 9704, 3, 4, UNI_ORKH } /* sc=orkh */, - { 0, 5986, 7899, 13, 8, UNI_NV__7_SLASH_2 } /* numericvalue=3.50e+00 */, - { 6, 9488, 8673, 4, 7, UNI_UCASEXT } /* blk=ucasext */, - { 0, 8477, 0, 4, 0, UNI_MAKA } /* maka */, - { 5, 1417, 8793, 25, 4, UNI_CCC__10 } /* canonicalcombiningclass=ccc10 */, - { 0, 2245, 0, 14, 0, UNI_MEETEIMAYEKEXT } /* meeteimayekext */, - { 0, 9277, 8876, 3, 4, UNI_GOTH } /* sc=goth */, - { 0, 112, 0, 2, 0, UNI_SC } /* sc */, - { 2, 3836, 9820, 17, 4, UNI_TFNG } /* scriptextensions=tfng */, - { 1, 10048, 9361, 3, 3, UNI_NV__1_SLASH_2 } /* nv=1/2 */, - { 11, 8509, 751, 4, 19, UNI_ENCLOSEDALPHANUM } /* inenclosedalphanumerics */, - { 0, 8780, 3600, 8, 15, UNI_INCAUCASIANALBANIAN } /* block=caucasianalbanian */, - { 0, 9488, 8171, 4, 8, UNI_INGUJARATI } /* blk=gujarati */, - { 1, 8780, 2855, 6, 9, UNI_INMONGOLIAN } /* block=mongolian */, - { 1, 21, 8203, 2, 8, UNI_JAMOEXTA } /* injamoexta */, - { 5, 4916, 8653, 3, 6, UNI_TAVT } /* istaiviet */, - { 0, 9488, 250, 4, 33, UNI_MISCMATHSYMBOLSA } /* blk=miscellaneousmathematicalsymbolsa */, - { 0, 8688, 2469, 3, 2, UNI_ANY } /* isany */, - { 0, 6241, 7, 12, 1, UNI_JT__C } /* joiningtype=c */, - { 9, 8786, 0, 6, 0, UNI_CARI } /* carian */, - { 8, 5256, 0, 14, 0, UNI_LATINEXTD } /* latinextendedd */, - { 3, 5791, 5179, 13, 3, 
UNI_JG__HEH } /* joininggroup=heh */, - { 0, 7218, 414, 10, 11, UNI_LB__ID } /* linebreak=ideographic */, - { 0, 9277, 8107, 3, 8, UNI_BALI } /* sc=balinese */, - { 3, 10048, 7835, 3, 8, UNI_NV__5_SLASH_2 } /* nv=2.50e+00 */, - { 1, 8780, 4273, 6, 16, UNI_MYANMAREXTA } /* block=myanmarextendeda */, - { 0, 9277, 8888, 3, 4, UNI_HATR } /* sc=hatr */, - { 1, 7558, 6195, 4, 4, UNI_INHEBREW } /* inhebrew */, - { 7, 8589, 8187, 7, 8, UNI_SC__HIRA } /* script=hiragana */, - { 2, 10027, 5410, 3, 14, UNI_JG__MANICHAEANTETH } /* jg=manichaeanteth */, - { 0, 1417, 10166, 24, 2, UNI_CCC__8 } /* canonicalcombiningclass=kv */, - { 2, 184, 9640, 2, 3, UNI_LOE } /* isloe */, - { 0, 8870, 1, 6, 1, -UNI_EPRES } /* epres=n */, - { 4, 9524, 0, 4, 0, UNI_cwt_values_index } /* cwt= */, - { 0, 1166, 9255, 26, 5, -UNI_DI } /* defaultignorablecodepoint=false */, - { 1, 8780, 1922, 6, 12, UNI_DIACRITICALS } /* block=diacriticals */, - { 13, 3836, 2684, 17, 19, UNI_EGYP } /* scriptextensions=egyptianhieroglyphs */, - { 2, 8780, 8673, 6, 7, UNI_UCASEXT } /* block=ucasext */, - { 0, 8780, 8645, 6, 7, UNI_INTAITHAM } /* block=taitham */, - { 5, 5986, 7843, 13, 8, UNI_NV__1_SLASH_4 } /* numericvalue=2.50e-01 */, - { 2, 217, 0, 33, 0, UNI_DIACRITICALSEXT } /* combiningdiacriticalmarksextended */, - { 5, 10024, 6851, 3, 11, UNI_LO } /* gc=otherletter */, - { 2, 9997, 23, 3, 2, UNI_BC__AL } /* bc=al */, - { 6, 8780, 2912, 6, 12, UNI_SUNDANESESUP } /* block=sundanesesup */, - { 1, 3836, 8659, 17, 7, UNI_TIBT } /* scriptextensions=tibetan */, - { 0, 8645, 0, 7, 0, UNI_LANA } /* taitham */, - { 2, 9277, 8786, 3, 6, UNI_CARI } /* sc=carian */, - { 0, 7418, 26, 10, 1, UNI_XPOSIXUPPER } /* uppercase=y */, - { 20, 7318, 10114, 10, 3, UNI_IN__6_DOT_3 } /* presentin=v63 */, - { 5, 1188, 3458, 3, 10, UNI_TAIXUANJING } /* intaixuanjing */, - { 3, 184, 9632, 2, 4, UNI_LINA } /* islina */, - { 2, 9997, 2489, 3, 20, UNI_BC__PDF } /* bc=popdirectionalformat */, - { 4, 8780, 8547, 6, 7, UNI_OLCK } /* block=olchiki 
*/, - { 0, 8942, 0, 4, 0, UNI_LYDI } /* lydi */, - { 0, 6035, 0, 2, 0, UNI_PF } /* pf */, - { 7, 9265, 10135, 5, 3, UNI_IDST } /* idst=yes */, - { 0, 184, 2061, 2, 14, UNI_LM } /* ismodifierletter */, - { 1, 184, 2287, 2, 21, UNI_SINHALAARCHAICNUMBERS } /* issinhalaarchaicnumbers */, - { 3, 2569, 471, 20, 2, UNI_VO__TU } /* verticalorientation=tu */, - { 2, 184, 1631, 2, 18, UNI_GEOMETRICSHAPESEXT } /* isgeometricshapesext */, - { 4, 10048, 9924, 3, 2, UNI_NV__42 } /* nv=42 */, - { 2, 184, 339, 2, 2, UNI_LO } /* islo */, - { 1, 9768, 9330, 4, 5, UNI_TALE } /* scx=taile */, - { 0, 9277, 6193, 3, 6, UNI_HEBR } /* sc=hebrew */, - { 1, 184, 8491, 2, 4, UNI_MARC } /* ismarc */, - { 0, 8780, 467, 6, 11, UNI_INPUNCTUATION } /* block=punctuation */, - { 16, 9071, 1, 4, 1, -UNI_XPOSIXXDIGIT } /* hex=n */, - { 1, 9270, 7309, 3, 9, UNI_INPHOENICIAN } /* inphoenician */, - { 16, 3836, 8414, 17, 7, UNI_ELBA } /* scriptextensions=elbasan */, - { 0, 3836, 8463, 17, 7, UNI_KALI } /* scriptextensions=kayahli */, - { 0, 9768, 7188, 4, 4, UNI_KHAR } /* scx=khar */, - { 0, 10296, 1629, 3, 3, UNI_PHAG } /* isphag */, - { 2, 5746, 26, 6, 1, UNI_EBASE } /* ebase=y */, - { 1, 8780, 8315, 6, 8, UNI_INUGARITIC } /* block=ugaritic */, - { 0, 9277, 9632, 3, 4, UNI_SC__LINA } /* sc=lina */, - { 5, 8884, 9255, 4, 5, -UNI_EXT } /* ext=false */, - { 0, 10129, 3, 3, 1, -UNI_VS } /* vs=f */, - { 3, 9528, 26, 4, 1, UNI_CWU } /* cwu=y */, - { 1, 6229, 1, 12, 1, -UNI_JOINC } /* joincontrol=n */, - { 5, 184, 9544, 2, 4, UNI_DIAK } /* isdiak */, - { 5, 9704, 0, 4, 0, UNI_ORKH } /* orkh */, - { 0, 9768, 7657, 4, 9, UNI_PERM } /* scx=oldpermic */, - { 0, 9277, 8291, 3, 8, UNI_SC__TAGB } /* sc=tagbanwa */, - { 1, 8780, 7531, 6, 9, UNI_EMOTICONS } /* block=emoticons */, - { 1, 9488, 7504, 4, 9, UNI_ARABICPFB } /* blk=arabicpfb */, - { 1, 8870, 9836, 6, 4, UNI_EPRES } /* epres=true */, - { 1, 9270, 0, 5, 0, UNI_inpc_values_index } /* inpc= */, - { 1, 8694, 9255, 7, 5, -UNI_XPOSIXSPACE } /* wspace=false */, - 
{ 16, 4791, 2837, 3, 18, UNI_MODIFIERTONELETTERS } /* inmodifiertoneletters */, - { 1, 9277, 8414, 3, 4, UNI_ELBA } /* sc=elba */, - { 1, 9768, 9516, 4, 4, UNI_CPRT } /* scx=cprt */, - { 6, 7318, 10117, 10, 3, UNI_IN__7 } /* presentin=v70 */, - { 1, 9640, 1025, 4, 2, -UNI_LOE } /* loe=no */, - { 0, 184, 1587, 2, 1, UNI_Z } /* isz */, - { 4, 7218, 9557, 10, 2, UNI_LB__CB } /* linebreak=cb */, - { 16, 9275, 8307, 5, 8, UNI_INSC__TONEMARK } /* insc=tonemark */, - { 0, 9277, 8936, 3, 6, UNI_LYCI } /* sc=lycian */, - { 1, 2722, 0, 19, 0, UNI_JAMOEXTA } /* hanguljamoextendeda */, - { 0, 8512, 17, 8, 1, UNI_NFKCQC__N } /* nfkcqc=no */, - { 2, 9270, 909, 3, 13, UNI_PUA } /* inprivateusearea */, - { 0, 9275, 5700, 5, 13, UNI_INSC__CONSONANTDEAD } /* insc=consonantdead */, - { 2, 9484, 0, 4, 0, UNI_BHKS } /* bhks */, - { 7, 9768, 4448, 4, 5, UNI_BAMU } /* scx=bamum */, - { 1, 8589, 3115, 7, 10, UNI_SC__DEVA } /* script=devanagari */, - { 0, 8852, 0, 6, 0, UNI_cwkcf_values_index } /* cwkcf= */, - { 2, 6805, 2014, 6, 18, UNI_MISCTECHNICAL } /* inmiscellaneoustechnical */, - { 4, 8589, 4001, 7, 7, UNI_SC__CPRT } /* script=cypriot */, - { 4, 9488, 1192, 4, 26, UNI_HALFANDFULLFORMS } /* blk=halfwidthandfullwidthforms */, - { 2, 8780, 5550, 6, 14, UNI_INPSALTERPAHLAVI } /* block=psalterpahlavi */, - { 3, 132, 0, 2, 0, UNI_LM } /* lm */, - { 16, 5986, 7851, 13, 8, UNI_NV__1_SLASH_40 } /* numericvalue=2.50e-02 */, - { 2, 8780, 8442, 6, 7, UNI_INHANUNOO } /* block=hanunoo */, - { 1, 9275, 8687, 5, 7, UNI_INSC__VISARGA } /* insc=visarga */, - { 4, 10033, 8449, 3, 2, UNI_LB__HY } /* lb=hy */, - { 0, 6805, 861, 6, 6, UNI_MISCARROWS } /* inmiscarrows */, - { 0, 9488, 599, 4, 30, UNI_CJKEXTD } /* blk=cjkunifiedideographsextensiond */, - { 0, 9277, 4478, 3, 7, UNI_BRAI } /* sc=braille */, - { 0, 10033, 25, 3, 2, UNI_LB__SY } /* lb=sy */, - { 0, 7325, 0, 3, 0, UNI_in_values_index } /* in= */, - { 2, 7249, 533, 4, 2, UNI_CANS } /* iscans */, - { 0, 4542, 1633, 4, 16, UNI_GEOMETRICSHAPESEXT } 
/* ingeometricshapesext */, - { 3, 9488, 3598, 4, 17, UNI_INCAUCASIANALBANIAN } /* blk=caucasianalbanian */, - { 1, 3836, 3241, 17, 4, UNI_GEOR } /* scriptextensions=geor */, - { 0, 4033, 7408, 16, 10, UNI_CN } /* generalcategory=unassigned */, - { 1, 2224, 3871, 3, 16, UNI_SMALLFORMS } /* insmallformvariants */, - { 0, 3836, 4145, 17, 7, UNI_LINB } /* scriptextensions=linearb */, - { 2, 9768, 2140, 4, 8, UNI_CYRL } /* scx=cyrillic */, - { 0, 9070, 10135, 5, 3, UNI_POSIXXDIGIT } /* ahex=yes */, - { 10, 8589, 6409, 7, 4, UNI_MEND } /* script=mend */, - { 1, 6609, 0, 11, 0, UNI_dep_values_index } /* deprecated= */, - { 0, 9277, 8491, 3, 7, UNI_MARC } /* sc=marchen */, - { 2, 9508, 9101, 5, 4, UNI_CCC__14 } /* ccc=ccc14 */, - { 5, 184, 3887, 2, 17, UNI_SUTTONSIGNWRITING } /* issuttonsignwriting */, - { 1, 21, 9325, 2, 5, UNI_INRUNIC } /* inrunic */, - { 2, 10024, 8855, 3, 2, UNI_CF } /* gc=cf */, - { 8, 1417, 8823, 25, 4, UNI_CCC__13 } /* canonicalcombiningclass=ccc13 */, - { 5, 4113, 25, 3, 1, UNI_INVS } /* invs */, - { 2, 5986, 8011, 13, 8, UNI_NV__13_SLASH_2 } /* numericvalue=6.50e+00 */, - { 2, 4853, 1, 15, 1, UNI_NFKDQC__N } /* nfkdquickcheck=n */, - { 0, 10027, 4209, 3, 16, UNI_JG__MANICHAEANSAMEKH } /* jg=manichaeansamekh */, - { 1, 569, 0, 30, 0, UNI_CJKEXTC } /* cjkunifiedideographsextensionc */, - { 2, 9345, 9255, 5, 5, -UNI_XIDC } /* xidc=false */, - { 1, 9488, 8936, 4, 6, UNI_INLYCIAN } /* blk=lycian */, - { 0, 184, 3151, 2, 17, UNI_EPRES } /* isemojipresentation */, - { 1, 8978, 1025, 6, 2, -UNI__PERL_PATWS } /* patws=no */, - { 1, 10033, 7522, 3, 9, UNI_LB__B2 } /* lb=breakboth */, - { 2, 1417, 2809, 24, 2, UNI_CCC__1 } /* canonicalcombiningclass=ov */, - { 1, 8780, 8387, 7, 6, UNI_CJKEXTF } /* block=cjkextf */, - { 3, 9015, 26, 5, 1, UNI_IDEO } /* ideo=y */, - { 0, 1552, 6598, 9, 11, UNI_CASEDLETTER } /* category=casedletter */, - { 1, 9540, 1025, 4, 2, -UNI_DIA } /* dia=no */, - { 0, 21, 5830, 2, 13, UNI_LOWSURROGATES } /* inlowsurrogates */, - { 0, 
3259, 26, 18, 1, UNI_IDSB } /* idsbinaryoperator=y */, - { 0, 57, 0, 2, 0, UNI_YI } /* yi */, - { 1, 184, 2817, 2, 19, UNI_MERO } /* ismeroitichieroglyphs */, - { 1, 8589, 9804, 7, 4, UNI_SC__TALE } /* script=tale */, - { 2, 6609, 1, 11, 1, -UNI_DEP } /* deprecated=n */, - { 2, 5986, 9055, 13, 4, UNI_NV__1_SLASH_32 } /* numericvalue=1/32 */, - { 0, 9262, 400, 3, 6, UNI_SB__FO } /* sb=format */, - { 8, 8780, 8414, 6, 7, UNI_INELBASAN } /* block=elbasan */, - { 0, 7088, 6049, 10, 12, UNI_BC__AN } /* bidiclass=arabicnumber */, - { 1, 10048, 9364, 3, 4, UNI_NV__1_SLASH_10 } /* nv=1/10 */, - { 0, 8780, 6961, 6, 11, UNI_SUPERANDSUB } /* block=superandsub */, - { 3, 184, 5284, 2, 14, UNI_LISUSUP } /* islisusupplement */, - { 7, 9492, 7, 4, 1, UNI_BPT__C } /* bpt=c */, - { 8, 9768, 8414, 4, 4, UNI_ELBA } /* scx=elba */, - { 5, 10024, 467, 3, 5, UNI_P } /* gc=punct */, - { 0, 1966, 8099, 22, 8, UNI_INSC__AVAGRAHA } /* indicsyllabiccategory=avagraha */, - { 3, 9275, 4523, 5, 15, UNI_INSC__CONSONANTMEDIAL } /* insc=consonantmedial */, - { 1, 8589, 9680, 7, 4, UNI_NBAT } /* script=nbat */, - { 1, 10048, 7747, 3, 8, UNI_NV__1_SLASH_10 } /* nv=1.00e-01 */, - { 1, 9488, 4065, 4, 16, UNI_HALFANDFULLFORMS } /* blk=halfandfullforms */, - { 11, 7438, 8139, 10, 8, UNI_WB__EB } /* wordbreak=ebasegaz */, - { 0, 2224, 2970, 3, 18, UNI_SUPARROWSC } /* insupplementalarrowsc */, - { 0, 9524, 26, 4, 1, UNI_CWT } /* cwt=y */, - { 1, 9277, 9572, 3, 4, UNI_SC__GUJR } /* sc=gujr */, - { 4, 1552, 107, 10, 5, UNI_S } /* category=symbol */, - { 0, 10048, 5648, 3, 4, UNI_NV__1000 } /* nv=1000 */, - { 0, 10009, 8163, 3, 3, UNI_DT__FRA } /* dt=fra */, - { 0, 7558, 0, 9, 0, UNI_QAAI } /* inherited */, - { 3, 1768, 26, 22, 1, UNI_CWCF } /* changeswhencasefolded=y */, - { 0, 3836, 2913, 18, 8, UNI_SUND } /* scriptextensions=sundanese */, - { 10, 9277, 8547, 3, 7, UNI_OLCK } /* sc=olchiki */, - { 0, 9488, 42, 4, 16, UNI_CJKCOMPAT } /* blk=cjkcompatibility */, - { 2, 3836, 8315, 17, 4, UNI_UGAR } /* 
scriptextensions=ugar */, - { 0, 8996, 0, 7, 0, UNI_STERM } /* sterm=t */, - { 0, 9488, 4928, 4, 15, UNI_TAMILSUP } /* blk=tamilsupplement */, - { 0, 3836, 7558, 17, 9, UNI_QAAI } /* scriptextensions=inherited */, - { 0, 1552, 17, 10, 1, UNI_SO } /* category=so */, - { 0, 9277, 7675, 3, 4, UNI_PALM } /* sc=palm */, - { 0, 8780, 7513, 6, 9, UNI_INBHAIKSUKI } /* block=bhaiksuki */, - { 1, 9250, 0, 5, 0, UNI_emod_values_index } /* emod= */, - { 4, 8589, 719, 7, 9, UNI_XSUX } /* script=cuneiform */, - { 0, 9240, 1025, 5, 2, -UNI_DASH } /* dash=no */, - { 3, 8780, 6807, 6, 11, UNI_MISCSYMBOLS } /* block=miscsymbols */, - { 1, 10048, 9055, 3, 5, UNI_NV__1_SLASH_320 } /* nv=1/320 */, - { 1, 4628, 9, 15, 2, UNI_EA__NA } /* eastasianwidth=na */, - { 0, 184, 1673, 2, 4, UNI_JAMO } /* isjamo */, - { 3, 7155, 4098, 3, 15, UNI_HIGHPUSURROGATES } /* ishighpusurrogates */, - { 3, 2779, 36, 19, 1, UNI_IDST } /* idstrinaryoperator=t */, - { 2, 10027, 7348, 3, 10, UNI_JG__REVERSEDPE } /* jg=reversedpe */, - { 6, 9488, 2224, 4, 21, UNI_ININSCRIPTIONALPARTHIAN } /* blk=inscriptionalparthian */, - { 1, 7088, 0, 10, 0, UNI_bc_values_index } /* bidiclass= */, - { 0, 8589, 8291, 7, 8, UNI_SC__TAGB } /* script=tagbanwa */, - { 0, 4033, 10180, 16, 2, UNI_ZS } /* generalcategory=zs */, - { 0, 8780, 1631, 6, 18, UNI_GEOMETRICSHAPESEXT } /* block=geometricshapesext */, - { 0, 7318, 10111, 10, 3, UNI_IN__6_DOT_2 } /* presentin=v62 */, - { 0, 8894, 1025, 6, 2, -UNI_JOINC } /* joinc=no */, - { 2, 3836, 1115, 17, 4, UNI_HANG } /* scriptextensions=hang */, - { 2, 9596, 9, 4, 2, UNI_HST__NA } /* hst=na */, - { 1, 8780, 250, 6, 33, UNI_MISCMATHSYMBOLSA } /* block=miscellaneousmathematicalsymbolsa */, - { 3, 10009, 2280, 3, 3, UNI_DT__ISO } /* dt=iso */, - { 4, 9488, 5752, 4, 13, UNI_GREEKEXT } /* blk=greekextended */, - { 17, 7378, 0, 10, 0, UNI_SUPARROWSA } /* suparrowsa */, - { 2, 9520, 0, 3, 0, UNI_CWL } /* cwl */, - { 2, 9556, 10174, 4, 2, UNI_GCB__XX } /* gcb=xx */, - { 1, 10048, 7781, 3, 2, 
UNI_NV__43 } /* nv=43 */, - { 1, 8780, 3115, 6, 13, UNI_DEVANAGARIEXT } /* block=devanagariext */, - { 4, 3836, 6253, 17, 5, UNI_KHMR } /* scriptextensions=khmer */, - { 8, 3836, 2288, 18, 6, UNI_SINH } /* scriptextensions=sinhala */, - { 0, 10048, 10144, 3, 2, UNI_NV__45 } /* nv=45 */, - { 42, 9488, 569, 4, 30, UNI_CJKEXTC } /* blk=cjkunifiedideographsextensionc */, - { 9, 9536, 26, 4, 1, UNI_DEP } /* dep=y */, - { 0, 1790, 26, 22, 1, UNI_CWCM } /* changeswhencasemapped=y */, - { 2, 10048, 8710, 3, 4, UNI_NV__6000 } /* nv=6000 */, - { 10, 9262, 1159, 3, 2, UNI_SB__ST } /* sb=st */, - { 0, 21, 4129, 2, 16, UNI_LATIN1 } /* inlatin1supplement */, - { 1, 3836, 7288, 17, 10, UNI_SOGO } /* scriptextensions=oldsogdian */, - { 0, 21, 3295, 2, 9, UNI_LATINEXTA } /* inlatinexta */, - { 1, 184, 9600, 2, 4, UNI_KALI } /* iskali */, - { 3, 1552, 3359, 10, 8, UNI_Z } /* category=separator */, - { 12, 5986, 5648, 13, 13, UNI_NV__1000000000000 } /* numericvalue=1000000000000 */, - { 2, 3382, 26, 3, 1, UNI_CE } /* ce=y */, - { 1, 5214, 0, 14, 0, UNI_KANGXI } /* kangxiradicals */, - { 4, 9716, 9836, 4, 4, UNI_PCM } /* pcm=true */, - { 0, 10132, 10174, 3, 2, UNI_WB__XX } /* wb=xx */, - { 3, 8780, 6840, 6, 11, UNI_INNANDINAGARI } /* block=nandinagari */, - { 0, 8589, 2608, 7, 6, UNI_BRAH } /* script=brahmi */, - { 2, 9277, 9636, 3, 4, UNI_SC__LINB } /* sc=linb */, - { 0, 3169, 0, 18, 0, UNI_ETHIOPICSUP } /* ethiopicsupplement */, - { 2, 2224, 2913, 3, 11, UNI_SUNDANESESUP } /* insundanesesup */, - { 2, 9275, 5102, 5, 14, UNI_INSC__CONSONANTFINAL } /* insc=consonantfinal */, - { 0, 8780, 1906, 6, 16, UNI_INDICNUMBERFORMS } /* block=indicnumberforms */, - { 5, 8780, 3547, 6, 10, UNI_ALCHEMICAL } /* block=alchemical */, - { 0, 8780, 316, 6, 33, UNI_SUPMATHOPERATORS } /* block=supplementalmathematicaloperators */, - { 3, 21, 8942, 2, 6, UNI_INLYDIAN } /* inlydian */, - { 2, 9277, 2140, 3, 8, UNI_SC__CYRL } /* sc=cyrillic */, - { 0, 1867, 0, 9, 0, UNI_XPOSIXUPPER } /* uppercase */, - { 6, 
7088, 865, 10, 2, UNI_BC__WS } /* bidiclass=ws */, - { 1, 4033, 1287, 16, 2, UNI_UPPERCASELETTER } /* generalcategory=lu */, - { 6, 7218, 6675, 10, 11, UNI_LB__EX } /* linebreak=exclamation */, - { 0, 8589, 1900, 7, 6, UNI_SC__ZYYY } /* script=common */, - { 1, 9768, 8428, 4, 4, UNI_GRAN } /* scx=gran */, - { 0, 8596, 0, 7, 0, UNI_SHRD } /* sharada */, - { 3, 1537, 3475, 24, 18, UNI_INPC__TOPANDLEFTANDRIGHT } /* indicpositionalcategory=topandleftandright */, - { 1, 9488, 8942, 4, 6, UNI_INLYDIAN } /* blk=lydian */, - { 0, 1552, 4305, 9, 5, UNI_C } /* category=other */, - { 0, 9277, 8876, 3, 6, UNI_GOTH } /* sc=gothic */, - { 0, 184, 7531, 2, 9, UNI_EMOTICONS } /* isemoticons */, - { 0, 1966, 4508, 22, 15, UNI_INSC__CONSONANTKILLER } /* indicsyllabiccategory=consonantkiller */, - { 1, 9556, 5746, 4, 5, UNI_WB__EB } /* gcb=ebase */, - { 3, 9277, 6481, 3, 12, UNI_HUNG } /* sc=oldhungarian */, - { 0, 4643, 0, 14, 0, UNI_ECOMP } /* emojicomponent */, - { 3, 2224, 8618, 3, 6, UNI_INSOYOMBO } /* insoyombo */, - { 5, 8780, 2817, 6, 19, UNI_MERO } /* block=meroitichieroglyphs */, - { 3, 8435, 1, 7, 1, -UNI_GRBASE } /* grbase=n */, - { 7, 8512, 0, 8, 0, UNI_NFKCQC__N } /* nfkcqc=n */, - { 0, 48, 0, 1, 0, UNI_P } /* p */, - { 1, 1812, 1025, 22, 2, -UNI_CWL } /* changeswhenlowercased=no */, - { 0, 7155, 2204, 3, 3, UNI_HAN } /* ishani */, - { 1, 9270, 2994, 5, 13, UNI_INPC__BOTTOMANDLEFT } /* inpc=bottomandleft */, - { 0, 184, 8456, 2, 7, UNI_KNDA } /* iskannada */, - { 0, 8762, 36, 6, 1, UNI_XPOSIXALPHA } /* alpha=t */, - { 2, 3937, 0, 11, 0, UNI_BOPOMOFOEXT } /* bopomofoext */, - { 7, 10024, 1066, 3, 2, UNI_CASEDLETTER } /* gc=lc */, - { 2, 8477, 0, 7, 0, UNI_MAKA } /* makasar */, - { 0, 9488, 2140, 4, 21, UNI_CYRILLICSUP } /* blk=cyrillicsupplementary */, - { 0, 8780, 446, 6, 18, UNI_IDEOGRAPHICSYMBOLS } /* block=ideographicsymbols */, - { 0, 9488, 9285, 4, 5, UNI_INLIMBU } /* blk=limbu */, - { 1, 5986, 7795, 13, 8, UNI_NV__3_SLASH_20 } /* numericvalue=1.50e-01 */, - { 0, 
1417, 7477, 24, 9, UNI_CCC__AL } /* canonicalcombiningclass=aboveleft */, - { 0, 9997, 3700, 3, 17, UNI_BC__ES } /* bc=europeanseparator */, - { 2, 184, 6972, 2, 11, UNI_SYLO } /* issylotinagri */, - { 0, 5032, 9255, 14, 5, -UNI_POSIXXDIGIT } /* asciihexdigit=false */, - { 3, 8688, 3923, 4, 7, UNI_ARABICSUP } /* isarabicsup */, - { 0, 8780, 2931, 6, 19, UNI_SUPARROWSA } /* block=supplementalarrowsa */, - { 2, 9488, 2308, 4, 21, UNI_YIJING } /* blk=yijinghexagramsymbols */, - { 0, 5661, 0, 13, 0, UNI_AEGEANNUMBERS } /* aegeannumbers */, - { 5, 7076, 4479, 3, 6, UNI_BRAI } /* inbraille */, - { 0, 184, 4245, 2, 10, UNI_SM } /* ismathsymbol */, - { 13, 8780, 1585, 6, 14, UNI_BYZANTINEMUSIC } /* block=byzantinemusic */, - { 0, 9508, 9106, 5, 4, UNI_CCC__15 } /* ccc=ccc15 */, - { 2, 9768, 4385, 4, 6, UNI_TANG } /* scx=tangut */, - { 3, 1537, 3343, 4, 6, UNI_DINGBATS } /* indingbats */, - { 8, 9488, 2054, 4, 22, UNI_MODIFIERLETTERS } /* blk=spacingmodifierletters */, - { 4, 539, 0, 30, 0, UNI_CJKEXTB } /* cjkunifiedideographsextensionb */, - { 1, 184, 3439, 2, 12, UNI_SMALLKANAEXT } /* issmallkanaext */, - { 0, 1269, 3, 25, 1, -UNI_COMPEX } /* fullcompositionexclusion=f */, - { 26, 9275, 2646, 5, 19, UNI_INSC__CONSONANTHEADLETTER } /* insc=consonantheadletter */, - { 1, 5986, 9428, 13, 4, UNI_NV__3_SLASH_80 } /* numericvalue=3/80 */, - { 0, 8780, 8352, 7, 6, UNI_CJKEXTA } /* block=cjkexta */, - { 1, 8884, 26, 4, 1, UNI_EXT } /* ext=y */, - { 0, 9997, 8, 3, 2, UNI_BC__AN } /* bc=an */, - { 6, 9736, 0, 4, 0, UNI_COPT } /* qaac */, - { 0, 3097, 5012, 18, 6, UNI_DT__SQR } /* decompositiontype=square */, - { 1, 2119, 0, 21, 0, UNI_CJKRADICALSSUP } /* cjkradicalssupplement */, - { 0, 10048, 5648, 3, 6, UNI_NV__100000 } /* nv=100000 */, - { 9, 9270, 3481, 5, 12, UNI_INPC__LEFTANDRIGHT } /* inpc=leftandright */, - { 0, 8589, 2469, 7, 20, UNI_HMNP } /* script=nyiakengpuachuehmong */, - { 4, 9488, 6277, 4, 7, UNI_MAHJONG } /* blk=mahjong */, - { 6, 1552, 341, 9, 2, UNI_PE } /* 
category=pe */, - { 0, 3097, 8533, 18, 7, UNI_DT__NB } /* decompositiontype=nobreak */, - { 0, 3836, 6940, 18, 10, UNI_SORA } /* scriptextensions=sorasompeng */, - { 0, 4033, 467, 16, 5, UNI_P } /* generalcategory=punct */, - { 0, 8780, 3870, 6, 17, UNI_SMALLFORMS } /* block=smallformvariants */, - { 3, 10333, 2913, 3, 3, UNI_SUND } /* issund */, - { 2, 10024, 727, 3, 2, UNI_MN } /* gc=mn */, - { 2, 6231, 43, 3, 8, UNI_CJKCOMPAT } /* incjkcompat */, - { 17, 8589, 9797, 8, 3, UNI_SC__SYRC } /* script=syrc */, - { 1, 1417, 8811, 25, 4, UNI_CCC__12 } /* canonicalcombiningclass=ccc12 */, - { 1, 3379, 36, 6, 1, UNI_XPOSIXSPACE } /* space=t */, - { 1, 10296, 1867, 7, 5, UNI_POSIXUPPER } /* isposixupper */, - { 1, 3259, 3, 18, 1, -UNI_IDSB } /* idsbinaryoperator=f */, - { 3, 1417, 3007, 24, 13, UNI_CCC__214 } /* canonicalcombiningclass=attachedabove */, - { 1, 7028, 9039, 3, 5, UNI_YEZI } /* isyezidi */, - { 4, 7218, 4360, 10, 9, UNI_EMOD } /* linebreak=emodifier */, - { 1, 1417, 2455, 24, 5, UNI_CCC__R } /* canonicalcombiningclass=right */, - { 0, 1273, 10135, 21, 3, UNI_CE } /* compositionexclusion=yes */, - { 1, 8780, 8603, 6, 7, UNI_SHAW } /* block=shavian */, - { 3, 9768, 8876, 4, 4, UNI_GOTH } /* scx=goth */, - { 4, 2182, 0, 21, 0, UNI_gcb_values_index } /* graphemeclusterbreak= */, - { 0, 8780, 8652, 6, 7, UNI_INTAIVIET } /* block=taiviet */, - { 8, 9886, 5006, 5, 12, UNI_INZANABAZARSQUARE } /* inzanabazarsquare */, - { 0, 8589, 8638, 7, 7, UNI_SC__TGLG } /* script=tagalog */, - { 16, 1768, 1025, 22, 2, -UNI_CWCF } /* changeswhencasefolded=no */, - { 1, 2224, 2951, 3, 18, UNI_SUPARROWSB } /* insupplementalarrowsb */, - { 0, 6553, 36, 12, 1, UNI_XIDC } /* xidcontinue=t */, - { 1, 9564, 0, 4, 0, UNI_GONM } /* gonm */, - { 7, 8780, 8131, 6, 8, UNI_INDUPLOYAN } /* block=duployan */, - { 1, 9768, 8786, 4, 4, UNI_CARI } /* scx=cari */, - { 3, 9277, 1654, 3, 6, UNI_SC__HANG } /* sc=hangul */, - { 0, 184, 3421, 2, 4, UNI_RUMI } /* isrumi */, - { 3, 9768, 2817, 4, 4, 
UNI_MERO } /* scx=mero */, - { 0, 184, 3785, 2, 4, UNI_MANI } /* ismani */, - { 11, 9488, 5606, 4, 14, UNI_SUPPUNCTUATION } /* blk=suppunctuation */, - { 1, 10250, 6556, 15, 8, UNI__PERL_CHARNAME_CONTINUE } /* _perl_charname_continue */, - { 0, 8780, 8561, 6, 7, UNI_INOSMANYA } /* block=osmanya */, - { 1, 10027, 9044, 3, 6, UNI_JG__YUDHHE } /* jg=yudhhe */, - { 0, 9768, 8652, 4, 7, UNI_TAVT } /* scx=taiviet */, - { 0, 10012, 1192, 3, 9, UNI_EA__H } /* ea=halfwidth */, - { 3, 3836, 9704, 17, 4, UNI_ORKH } /* scriptextensions=orkh */, - { 1, 7318, 10108, 10, 3, UNI_IN__6_DOT_1 } /* presentin=v61 */, - { 12, 5791, 6349, 13, 12, UNI_JG__MALAYALAMSSA } /* joininggroup=malayalamssa */, - { 0, 10048, 8744, 3, 4, UNI_NV__7000 } /* nv=7000 */, - { 0, 3367, 36, 18, 1, UNI__PERL_PATWS } /* patternwhitespace=t */, - { 0, 4853, 0, 15, 0, UNI_nfkdqc_values_index } /* nfkdquickcheck= */, - { 2, 9488, 809, 4, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* blk=enclosedideographicsupplement */, - { 4, 184, 749, 2, 30, UNI_ENCLOSEDALPHANUMSUP } /* isenclosedalphanumericsupplement */, - { 1, 9020, 10135, 6, 3, UNI_XPOSIXUPPER } /* upper=yes */, - { 1, 5986, 8750, 13, 5, UNI_NV__80000 } /* numericvalue=80000 */, - { 0, 9768, 8171, 4, 8, UNI_GUJR } /* scx=gujarati */, - { 0, 3379, 10135, 6, 3, UNI_XPOSIXSPACE } /* space=yes */, - { 1, 9768, 8582, 4, 7, UNI_PHAG } /* scx=phagspa */, - { 0, 3836, 3785, 17, 10, UNI_MANI } /* scriptextensions=manichaean */, - { 5, 9488, 4793, 4, 15, UNI_INMEROITICCURSIVE } /* blk=meroiticcursive */, - { 0, 184, 6277, 2, 12, UNI_MAHJONG } /* ismahjongtiles */, - { 0, 9997, 1353, 3, 3, UNI_BC__RLE } /* bc=rle */, - { 2, 184, 9245, 2, 4, UNI_DOGR } /* isdogr */, - { 32, 9768, 9644, 4, 4, UNI_MEDF } /* scx=medf */, - { 0, 9768, 6409, 4, 12, UNI_MEND } /* scx=mendekikakui */, - { 8, 10132, 5746, 3, 5, UNI_WB__EB } /* wb=ebase */, - { 0, 10048, 7826, 3, 2, UNI_NV__12 } /* nv=12 */, - { 6, 10132, 4856, 3, 2, UNI_WB__DQ } /* wb=dq */, - { 9, 10132, 34, 3, 6, UNI_WB__EXTEND } 
/* wb=extend */, - { 6, 10027, 4778, 3, 15, UNI_JG__MANICHAEANZAYIN } /* jg=manichaeanzayin */, - { 0, 8484, 0, 7, 0, UNI_MAND } /* mandaic */, - { 2, 184, 9888, 2, 4, UNI_ZANB } /* iszanb */, - { 1, 3367, 9255, 18, 5, -UNI__PERL_PATWS } /* patternwhitespace=false */, - { 1, 8589, 1222, 7, 4, UNI_SC__KANA } /* script=kana */, - { 11, 10024, 2061, 3, 14, UNI_LM } /* gc=modifierletter */, - { 2, 9488, 8786, 4, 6, UNI_INCARIAN } /* blk=carian */, - { 3, 9488, 78, 4, 6, UNI_INARABIC } /* blk=arabic */, - { 2, 5791, 7348, 13, 10, UNI_JG__REVERSEDPE } /* joininggroup=reversedpe */, - { 4, 10296, 5718, 7, 5, UNI_POSIXALNUM } /* isposixalnum */, - { 1, 8589, 6193, 7, 4, UNI_HEBR } /* script=hebr */, - { 2, 10048, 10142, 3, 2, UNI_NV__44 } /* nv=44 */, - { 1, 9070, 9255, 5, 5, -UNI_POSIXXDIGIT } /* ahex=false */, - { 5, 9768, 9452, 4, 4, UNI_AHOM } /* scx=ahom */, - { 6, 1966, 8307, 22, 8, UNI_INSC__TONEMARK } /* indicsyllabiccategory=tonemark */, - { 8, 2032, 0, 22, 0, UNI_nchar_values_index } /* noncharactercodepoint= */, - { 0, 184, 4049, 2, 16, UNI_GEORGIANEXT } /* isgeorgianextended */, - { 0, 9488, 539, 4, 30, UNI_CJKEXTB } /* blk=cjkunifiedideographsextensionb */, - { 0, 106, 0, 6, 0, UNI_S } /* symbol */, - { 1, 8780, 6481, 6, 12, UNI_INOLDHUNGARIAN } /* block=oldhungarian */, - { 2, 9997, 0, 4, 0, UNI_BC__B } /* bc=b */, - { 1, 8780, 6818, 6, 11, UNI_MYANMAREXTA } /* block=myanmarexta */, - { 12, 2760, 6763, 19, 3, UNI_LB__H3 } /* hangulsyllabletype=lvt */, - { 1, 8780, 4129, 6, 6, UNI_LATIN1 } /* block=latin1 */, - { 2, 5986, 7859, 13, 5, UNI_NV__20000 } /* numericvalue=20000 */, - { 6, 7218, 10158, 10, 2, UNI_LB__H2 } /* linebreak=h2 */, - { 0, 10048, 7931, 3, 8, UNI_NV__5_SLASH_12 } /* nv=4.17e-01 */, - { 10, 4916, 9817, 3, 3, UNI_TAVT } /* istavt */, - { 0, 4033, 25, 16, 1, UNI_S } /* generalcategory=s */, - { 1, 8131, 0, 8, 0, UNI_DUPL } /* duployan */, - { 1, 9716, 26, 4, 1, UNI_PCM } /* pcm=y */, - { 8, 10180, 0, 2, 0, UNI_ZS } /* zs */, - { 1, 9488, 3921, 
4, 16, UNI_ARABICSUP } /* blk=arabicsupplement */, - { 2, 10322, 3379, 5, 5, UNI_XPOSIXSPACE } /* xperlspace */, - { 1, 184, 183, 2, 20, UNI_MISCSYMBOLS } /* ismiscellaneoussymbols */, - { 0, 7318, 7931, 10, 3, UNI_IN__4_DOT_1 } /* presentin=4.1 */, - { 3, 8978, 0, 5, 0, UNI__PERL_PATWS } /* patws */, - { 0, 9556, 34, 4, 2, UNI_GCB__EX } /* gcb=ex */, - { 4, 9020, 1, 6, 1, -UNI_XPOSIXUPPER } /* upper=n */, - { 0, 5986, 8710, 13, 2, UNI_NV__60 } /* numericvalue=60 */, - { 0, 9544, 0, 4, 0, UNI_DIAK } /* diak */, - { 0, 10308, 0, 5, 0, UNI_XPOSIXPRINT } /* print */, - { 2, 1966, 5634, 22, 14, UNI_INSC__VOWELDEPENDENT } /* indicsyllabiccategory=voweldependent */, - { 1, 4033, 1171, 16, 2, UNI_TITLE } /* generalcategory=lt */, - { 4, 6231, 6098, 3, 11, UNI_CYRILLICEXTA } /* incyrillicexta */, - { 0, 7325, 9852, 3, 4, UNI_IN__12_DOT_1 } /* in=v121 */, - { 1, 5564, 36, 14, 1, UNI_QMARK } /* quotationmark=t */, - { 0, 9091, 8133, 4, 6, UNI_INDUPLOYAN } /* induployan */, - { 0, 8780, 2308, 6, 21, UNI_YIJING } /* block=yijinghexagramsymbols */, - { 8, 8930, 10135, 6, 3, UNI_XPOSIXLOWER } /* lower=yes */, - { 0, 8954, 10135, 6, 3, UNI__PERL_NCHAR } /* nchar=yes */, - { 2, 184, 3, 3, 1, UNI_CF } /* iscf */, - { 1, 8589, 3169, 7, 4, UNI_ETHI } /* script=ethi */, - { 7, 9637, 5690, 5, 10, UNI_BLOCKELEMENTS } /* inblockelements */, - { 0, 9508, 9111, 5, 4, UNI_CCC__16 } /* ccc=ccc16 */, - { 5, 8589, 9644, 7, 4, UNI_MEDF } /* script=medf */, - { 8, 5466, 0, 15, 0, UNI_DT__CAN } /* nfdquickcheck=n */, - { 1, 8589, 3079, 7, 6, UNI_SC__COPT } /* script=coptic */, - { 10, 8688, 183, 4, 2, UNI_ARMI } /* isarmi */, - { 4, 8589, 4703, 7, 15, UNI_ARMI } /* script=imperialaramaic */, - { 0, 3836, 9285, 17, 4, UNI_LIMB } /* scriptextensions=limb */, - { 0, 8589, 6884, 7, 11, UNI_HMNG } /* script=pahawhhmong */, - { 17, 184, 1033, 2, 27, UNI_ENCLOSEDCJK } /* isenclosedcjklettersandmonths */, - { 1, 8589, 9720, 7, 4, UNI_SC__PHLP } /* script=phlp */, - { 1, 339, 0, 2, 0, UNI_LO } /* lo */, - 
{ 3, 9488, 838, 4, 29, UNI_MISCARROWS } /* blk=miscellaneoussymbolsandarrows */, - { 4, 8966, 26, 6, 1, UNI_NFDQC__Y } /* nfdqc=y */, - { 1, 8780, 4369, 6, 16, UNI_SYRIACSUP } /* block=syriacsupplement */, - { 1, 1417, 9151, 25, 4, UNI_CCC__24 } /* canonicalcombiningclass=ccc24 */, - { 0, 21, 5200, 2, 7, UNI_KANASUP } /* inkanasup */, - { 5, 1273, 0, 20, 0, UNI_CE } /* compositionexclusion */, - { 1, 8780, 2950, 6, 19, UNI_SUPARROWSB } /* block=supplementalarrowsb */, - { 1, 3457, 0, 11, 0, UNI_TAIXUANJING } /* taixuanjing */, - { 0, 5578, 36, 15, 1, UNI_SB__ST } /* sentencebreak=st */, - { 2, 184, 43, 3, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* iscjkcompatibilityideographssupplement */, - { 0, 184, 4478, 2, 7, UNI_BRAI } /* isbraille */, - { 1, 8589, 4385, 7, 6, UNI_TANG } /* script=tangut */, - { 0, 10033, 9713, 3, 2, UNI_LB__SG } /* lb=sg */, - { 0, 1192, 0, 26, 0, UNI_HALFANDFULLFORMS } /* halfwidthandfullwidthforms */, - { 2, 38, 0, 2, 0, UNI_XPOSIXDIGIT } /* nd */, - { 1, 8589, 9305, 7, 5, UNI_NSHU } /* script=nushu */, - { 1, 9270, 9, 5, 2, UNI_INPC__NA } /* inpc=na */, - { 4, 1552, 2268, 9, 2, UNI_PD } /* category=pd */, - { 0, 629, 0, 30, 0, UNI_CJKEXTE } /* cjkunifiedideographsextensione */, - { 12, 7249, 5062, 4, 11, UNI_CI } /* iscaseignorable */, - { 3, 5986, 9412, 13, 4, UNI_NV__17_SLASH_2 } /* numericvalue=17/2 */, - { 0, 8589, 9588, 7, 4, UNI_HMNG } /* script=hmng */, - { 1, 7325, 9848, 3, 4, UNI_IN__12 } /* in=v120 */, - { 0, 8780, 8275, 6, 8, UNI_SPECIALS } /* block=specials */, - { 6, 9488, 7428, 4, 10, UNI_INWARANGCITI } /* blk=warangciti */, - { 6, 7228, 1, 10, 1, -UNI_XPOSIXLOWER } /* lowercase=n */, - { 6, 5986, 8726, 13, 6, UNI_NV__432000 } /* numericvalue=432000 */, - { 1, 1537, 6621, 3, 10, UNI_DOMINO } /* indominotiles */, - { 0, 9540, 3, 4, 1, -UNI_DIA } /* dia=f */, - { 0, 7155, 1514, 3, 23, UNI_HIGHPUSURROGATES } /* ishighprivateusesurrogates */, - { 0, 5032, 9836, 14, 4, UNI_POSIXXDIGIT } /* asciihexdigit=true */, - { 0, 10033, 10154, 3, 
2, UNI_LB__B2 } /* lb=b2 */, - { 6, 3904, 0, 17, 0, UNI_uideo_values_index } /* unifiedideograph= */, - { 1, 3385, 9255, 18, 5, -UNI_RI } /* regionalindicator=false */, - { 0, 9488, 3734, 4, 17, UNI_INDICSIYAQNUMBERS } /* blk=indicsiyaqnumbers */, - { 2, 9860, 0, 4, 0, UNI_VAI } /* vaii */, - { 4, 5791, 4209, 13, 16, UNI_JG__MANICHAEANSAMEKH } /* joininggroup=manichaeansamekh */, - { 0, 5791, 87, 13, 2, UNI_JG__HE } /* joininggroup=he */, - { 0, 8589, 9335, 7, 5, UNI_SC__TAKR } /* script=takri */, - { 13, 9277, 9708, 3, 4, UNI_SC__ORYA } /* sc=orya */, - { 1, 9277, 2061, 3, 4, UNI_SC__MODI } /* sc=modi */, - { 2, 10027, 6785, 3, 11, UNI_JG__MALAYALAMRA } /* jg=malayalamra */, - { 1, 7567, 0, 9, 0, UNI_SIND } /* khudawadi */, - { 0, 184, 728, 2, 6, UNI_N } /* isnumber */, - { 0, 9708, 0, 4, 0, UNI_ORYA } /* orya */, - { 1, 1906, 0, 16, 0, UNI_INDICNUMBERFORMS } /* indicnumberforms */, - { 0, 8780, 8924, 6, 6, UNI_INLEPCHA } /* block=lepcha */, - { 0, 10048, 9050, 3, 4, UNI_NV__1_SLASH_16 } /* nv=1/16 */, - { 0, 10288, 5718, 8, 5, UNI_XPOSIXALNUM } /* isxposixalnum */, - { 6, 9488, 5661, 4, 13, UNI_AEGEANNUMBERS } /* blk=aegeannumbers */, - { 8, 3983, 0, 18, 0, UNI_PE } /* isclosepunctuation */, - { 11, 3097, 4532, 18, 6, UNI_DT__MED } /* decompositiontype=medial */, - { 0, 10132, 6169, 3, 12, UNI_WB__EB } /* wb=glueafterzwj */, - { 0, 5791, 5895, 13, 13, UNI_JG__MANICHAEANONE } /* joininggroup=manichaeanone */, - { 0, 8954, 3, 6, 1, -UNI__PERL_NCHAR } /* nchar=f */, - { 3, 4658, 36, 15, 1, UNI_GREXT } /* graphemeextend=t */, - { 2, 7418, 10135, 10, 3, UNI_XPOSIXUPPER } /* uppercase=yes */, - { 1, 10296, 0, 4, 0, UNI_PO } /* ispo */, - { 0, 8589, 3785, 7, 4, UNI_SC__MANI } /* script=mani */, - { 1, 3836, 4703, 17, 15, UNI_ARMI } /* scriptextensions=imperialaramaic */, - { 1, 2224, 2932, 3, 18, UNI_SUPARROWSA } /* insupplementalarrowsa */, - { 13, 8780, 4401, 6, 9, UNI_TANGUTSUP } /* block=tangutsup */, - { 8, 8780, 7129, 7, 9, UNI_CJKSTROKES } /* block=cjkstrokes */, 
- { 0, 21, 8211, 2, 8, UNI_JAMOEXTB } /* injamoextb */, - { 0, 45, 0, 2, 0, UNI_CO } /* co */, - { 4, 3097, 6421, 18, 8, UNI_DT__NONCANON } /* decompositiontype=noncanon */, - { 16, 184, 1166, 2, 25, UNI_DI } /* isdefaultignorablecodepoint */, - { 2, 9277, 9860, 3, 3, UNI_VAI } /* sc=vai */, - { 1, 8491, 0, 7, 0, UNI_MARC } /* marchen */, - { 4, 184, 5564, 2, 13, UNI_QMARK } /* isquotationmark */, - { 2, 10024, 5713, 3, 13, UNI_XPOSIXDIGIT } /* gc=decimalnumber */, - { 1, 10033, 184, 3, 2, UNI_LB__IS } /* lb=is */, - { 1, 9315, 0, 5, 0, UNI_ORYA } /* oriya */, - { 0, 9812, 0, 4, 0, UNI_TAML } /* taml */, - { 0, 4989, 1868, 3, 4, UNI_XPOSIXUPPER } /* isupper */, - { 0, 5986, 5648, 13, 5, UNI_NV__10000 } /* numericvalue=10000 */, - { 16, 8780, 3026, 7, 10, UNI_CHEROKEESUP } /* block=cherokeesup */, - { 1, 8780, 8610, 6, 7, UNI_INSIDDHAM } /* block=siddham */, - { 1, 2161, 3, 21, 1, -UNI_EXTPICT } /* extendedpictographic=f */, - { 1, 9488, 8091, 4, 8, UNI_INARMENIAN } /* blk=armenian */, - { 1, 9277, 9065, 3, 5, UNI_SC__ADLM } /* sc=adlam */, - { 12, 3836, 8344, 17, 7, UNI_BENG } /* scriptextensions=bengali */, - { 0, 2032, 0, 21, 0, UNI__PERL_NCHAR } /* noncharactercodepoint */, - { 8, 3421, 0, 18, 0, UNI_RUMI } /* ruminumeralsymbols */, - { 1, 9277, 8115, 3, 4, UNI_BASS } /* sc=bass */, - { 1, 184, 3169, 2, 8, UNI_ETHI } /* isethiopic */, - { 0, 3836, 9824, 17, 4, UNI_TGLG } /* scriptextensions=tglg */, - { 0, 184, 8942, 2, 4, UNI_LYDI } /* islydi */, - { 0, 1812, 0, 22, 0, UNI_cwl_values_index } /* changeswhenlowercased= */, - { 3, 7318, 10105, 10, 3, UNI_IN__6 } /* presentin=v60 */, - { 5, 10296, 9721, 3, 3, UNI_PHLP } /* isphlp */, - { 3, 10132, 7603, 3, 9, UNI_WB__ML } /* wb=midletter */, - { 4, 2224, 7694, 3, 8, UNI_INSAMARITAN } /* insamaritan */, - { 4, 10048, 10148, 3, 2, UNI_NV__47 } /* nv=47 */, - { 1, 5986, 9409, 13, 3, UNI_NV__5_SLASH_2 } /* numericvalue=5/2 */, - { 5, 184, 4448, 2, 8, UNI_BAMUMSUP } /* isbamumsup */, - { 2, 9488, 509, 4, 30, UNI_CJKEXTA 
} /* blk=cjkunifiedideographsextensiona */, - { 0, 10027, 4733, 3, 15, UNI_JG__MANICHAEANALEPH } /* jg=manichaeanaleph */, - { 13, 10033, 10030, 3, 2, UNI_GCB__T } /* lb=jt */, - { 1, 9277, 6840, 3, 4, UNI_SC__NAND } /* sc=nand */, - { 2, 9997, 2798, 3, 19, UNI_BC__LRO } /* bc=lefttorightoverride */, - { 4, 1269, 10135, 25, 3, UNI_COMPEX } /* fullcompositionexclusion=yes */, - { 1, 8780, 2684, 6, 19, UNI_INEGYPTIANHIEROGLYPHS } /* block=egyptianhieroglyphs */, - { 0, 8589, 8611, 8, 3, UNI_SIDD } /* script=sidd */, - { 15, 1591, 2685, 3, 18, UNI_INEGYPTIANHIEROGLYPHS } /* inegyptianhieroglyphs */, - { 0, 10027, 7198, 3, 10, UNI_JG__KNOTTEDHEH } /* jg=knottedheh */, - { 1, 8589, 8611, 8, 6, UNI_SIDD } /* script=siddham */, - { 0, 9065, 0, 5, 0, UNI_ADLM } /* adlam */, - { 1, 8589, 6973, 8, 3, UNI_SC__SYLO } /* script=sylo */, - { 0, 1114, 26, 26, 1, UNI_CWKCF } /* changeswhennfkccasefolded=y */, - { 1, 9768, 2288, 5, 3, UNI_SINH } /* scx=sinh */, - { 7, 10009, 6421, 3, 8, UNI_DT__NONCANON } /* dt=noncanon */, - { 0, 9768, 8115, 4, 4, UNI_BASS } /* scx=bass */, - { 16, 6231, 720, 3, 8, UNI_INCUNEIFORM } /* incuneiform */, - { 19, 1417, 9211, 25, 4, UNI_CCC__36 } /* canonicalcombiningclass=ccc36 */, - { 9, 2569, 3511, 20, 18, UNI_VO__TU } /* verticalorientation=transformedupright */, - { 2, 2529, 1, 20, 1, -UNI_TERM } /* terminalpunctuation=n */, - { 0, 184, 1911, 2, 11, UNI_NUMBERFORMS } /* isnumberforms */, - { 0, 3836, 5843, 17, 9, UNI_MLYM } /* scriptextensions=malayalam */, - { 1, 9508, 9300, 4, 5, UNI_CCC__7 } /* ccc=nukta */, - { 0, 5674, 1, 13, 1, -UNI_BIDIM } /* bidimirrored=n */, - { 0, 10132, 1218, 3, 2, UNI_WB__KA } /* wb=ka */, - { 6, 10182, 25, 29, 1, UNI__PERL_PROBLEMATIC_LOCALE_FOLDS } /* _perl_problematic_locale_folds */, - { 0, 6554, 36, 11, 1, UNI_IDC } /* idcontinue=t */, - { 0, 1417, 8813, 24, 3, UNI_CCC__122 } /* canonicalcombiningclass=122 */, - { 1, 7218, 10160, 10, 2, UNI_LB__H3 } /* linebreak=h3 */, - { 14, 184, 9496, 2, 4, UNI_BUHD } /* 
isbuhd */, - { 21, 6231, 720, 3, 15, UNI_CUNEIFORMNUMBERS } /* incuneiformnumbers */, - { 1, 9277, 9712, 3, 4, UNI_OSGE } /* sc=osge */, - { 1, 10178, 0, 2, 0, UNI_ZP } /* zp */, - { 5, 9488, 8840, 4, 6, UNI_INCHAKMA } /* blk=chakma */, - { 2, 8589, 2429, 7, 20, UNI_PHLI } /* script=inscriptionalpahlavi */, - { 1, 5791, 4081, 13, 16, UNI_JG__HANIFIROHINGYAPA } /* joininggroup=hanifirohingyapa */, - { 2, 6928, 10135, 11, 3, UNI_SD } /* softdotted=yes */, - { 1, 7088, 3403, 10, 18, UNI_BC__RLI } /* bidiclass=righttoleftisolate */, - { 1, 8589, 1537, 8, 3, UNI_SC__SIND } /* script=sind */, - { 0, 5986, 9428, 13, 3, UNI_NV__3_SLASH_8 } /* numericvalue=3/8 */, - { 4, 3836, 4478, 17, 4, UNI_BRAI } /* scriptextensions=brai */, - { 0, 8984, 36, 6, 1, UNI_QMARK } /* qmark=t */, - { 0, 4791, 8499, 3, 6, UNI_INMULTANI } /* inmultani */, - { 9, 10024, 1899, 3, 2, UNI_PC } /* gc=pc */, - { 2, 3836, 9624, 17, 4, UNI_LAO } /* scriptextensions=laoo */, - { 4, 9488, 8526, 4, 7, UNI_NB } /* blk=noblock */, - { 1, 9277, 9038, 3, 6, UNI_SC__YEZI } /* sc=yezidi */, - { 2, 9768, 8611, 5, 6, UNI_SIDD } /* scx=siddham */, - { 0, 2741, 0, 19, 0, UNI_JAMOEXTB } /* hanguljamoextendedb */, - { 8, 8589, 1013, 7, 5, UNI_SC__GREK } /* script=greek */, - { 1, 9488, 7378, 4, 10, UNI_SUPARROWSA } /* blk=suparrowsa */, - { 0, 10290, 10308, 6, 5, UNI_XPOSIXPRINT } /* xposixprint */, - { 1, 5060, 26, 14, 1, UNI_CI } /* caseignorable=y */, - { 3, 184, 2245, 2, 11, UNI_MTEI } /* ismeeteimayek */, - { 1, 10063, 3, 3, 1, -UNI_SD } /* sd=f */, - { 6, 7318, 7923, 10, 3, UNI_IN__4 } /* presentin=4.0 */, - { 1, 8589, 4448, 7, 5, UNI_BAMU } /* script=bamum */, - { 1, 5986, 8750, 13, 2, UNI_NV__80 } /* numericvalue=80 */, - { 0, 9768, 9544, 4, 4, UNI_DIAK } /* scx=diak */, - { 0, 7155, 1418, 3, 3, UNI_HANO } /* ishano */, - { 3, 8780, 1442, 7, 9, UNI_CJKSYMBOLS } /* block=cjksymbols */, - { 0, 10009, 4017, 3, 3, UNI_DT__FIN } /* dt=fin */, - { 6, 8589, 7675, 7, 9, UNI_PALM } /* script=palmyrene */, - { 0, 9488, 
7657, 4, 9, UNI_INOLDPERMIC } /* blk=oldpermic */, - { 4, 1417, 7178, 24, 4, UNI_CCC__6 } /* canonicalcombiningclass=hanr */, - { 0, 6862, 0, 11, 0, UNI_NO } /* othernumber */, - { 0, 867, 0, 18, 0, UNI_PHONETICEXT } /* phoneticextensions */, - { 0, 10009, 3501, 3, 3, UNI_DT__MED } /* dt=med */, - { 5, 1417, 9156, 25, 4, UNI_CCC__25 } /* canonicalcombiningclass=ccc25 */, - { 3, 5986, 9055, 13, 5, UNI_NV__1_SLASH_320 } /* numericvalue=1/320 */, - { 0, 8589, 6792, 8, 3, UNI_SAMR } /* script=samr */, - { 0, 9488, 8463, 4, 7, UNI_KALI } /* blk=kayahli */, - { 24, 7076, 3938, 3, 10, UNI_BOPOMOFOEXT } /* inbopomofoext */, - { 1, 9508, 0, 4, 0, UNI_ccc_values_index } /* ccc= */, - { 1, 8780, 2969, 6, 19, UNI_SUPARROWSC } /* block=supplementalarrowsc */, - { 21, 4628, 4471, 15, 7, UNI_EA__N } /* eastasianwidth=neutral */, - { 2, 9277, 9038, 3, 4, UNI_SC__YEZI } /* sc=yezi */, - { 1, 8780, 5158, 6, 14, UNI_INGREEK } /* block=greekandcoptic */, - { 4, 9508, 9116, 5, 4, UNI_CCC__17 } /* ccc=ccc17 */, - { 5, 8780, 8366, 7, 6, UNI_CJKEXTC } /* block=cjkextc */, - { 0, 599, 0, 30, 0, UNI_CJKEXTD } /* cjkunifiedideographsextensiond */, - { 0, 21, 8219, 2, 8, UNI_INJAVANESE } /* injavanese */, - { 0, 9262, 34, 3, 6, UNI_SB__EX } /* sb=extend */, - { 1, 7438, 10174, 10, 2, UNI_WB__XX } /* wordbreak=xx */, - { 0, 8589, 7684, 7, 9, UNI_PAUC } /* script=paucinhau */, - { 0, 6469, 39, 12, 2, UNI_XPOSIXDIGIT } /* numerictype=de */, - { 0, 10003, 0, 3, 0, UNI_ci_values_index } /* ci= */, - { 0, 9488, 6253, 4, 5, UNI_INKHMER } /* blk=khmer */, - { 0, 9015, 36, 5, 1, UNI_IDEO } /* ideo=t */, - { 0, 1189, 39, 3, 2, UNI_XPOSIXDIGIT } /* nt=de */, - { 1, 4916, 8646, 3, 6, UNI_LANA } /* istaitham */, - { 4, 6193, 0, 6, 0, UNI_HEBR } /* hebrew */, - { 2, 7318, 9396, 10, 4, UNI_IN__12_DOT_1 } /* presentin=12.1 */, - { 7, 9488, 2703, 4, 19, UNI_ENCLOSEDALPHANUMSUP } /* blk=enclosedalphanumsup */, - { 8, 9277, 7558, 3, 9, UNI_SC__QAAI } /* sc=inherited */, - { 0, 8780, 3734, 6, 17, 
UNI_INDICSIYAQNUMBERS } /* block=indicsiyaqnumbers */, - { 1, 1269, 1025, 25, 2, -UNI_COMPEX } /* fullcompositionexclusion=no */, - { 1, 8966, 0, 8, 0, UNI_DT__CAN } /* nfdqc=no */, - { 0, 10033, 1186, 3, 2, UNI_LB__PO } /* lb=po */, - { 1, 8780, 114, 7, 34, UNI_DIACRITICALSFORSYMBOLS } /* block=combiningdiacriticalmarksforsymbols */, - { 0, 1184, 0, 3, 0, UNI_DEP } /* dep */, - { 1, 3836, 9560, 17, 4, UNI_GONG } /* scriptextensions=gong */, - { 35, 9070, 36, 5, 1, UNI_POSIXXDIGIT } /* ahex=t */, - { 0, 9768, 9572, 4, 4, UNI_GUJR } /* scx=gujr */, - { 0, 184, 9736, 2, 4, UNI_COPT } /* isqaac */, - { 0, 7249, 12, 5, 3, UNI_CARI } /* iscarian */, - { 3, 10027, 341, 3, 2, UNI_JG__PE } /* jg=pe */, - { 1, 10027, 5480, 3, 14, UNI_JG__NOJOININGGROUP } /* jg=nojoininggroup */, - { 0, 7325, 10120, 3, 3, UNI_IN__8 } /* in=v80 */, - { 2, 8780, 4340, 6, 13, UNI_MATHOPERATORS } /* block=mathoperators */, - { 3, 9492, 5904, 4, 4, UNI_BPT__N } /* bpt=none */, - { 4, 184, 8179, 2, 8, UNI_GURU } /* isgurmukhi */, - { 0, 9346, 10135, 4, 3, UNI_IDC } /* idc=yes */, - { 4, 7076, 1219, 3, 4, UNI_INBATAK } /* inbatak */, - { 5, 6928, 3, 11, 1, -UNI_SD } /* softdotted=f */, - { 0, 184, 9680, 2, 4, UNI_NBAT } /* isnbat */, - { 0, 9488, 4369, 4, 16, UNI_SYRIACSUP } /* blk=syriacsupplement */, - { 1, 8780, 5214, 6, 6, UNI_KANGXI } /* block=kangxi */, - { 1, 10132, 34, 3, 2, UNI_WB__EX } /* wb=ex */, - { 3, 9768, 8219, 4, 4, UNI_JAVA } /* scx=java */, - { 9, 9768, 3751, 4, 17, UNI_KITS } /* scx=khitansmallscript */, - { 5, 9556, 5633, 4, 2, UNI_LB__H2 } /* gcb=lv */, - { 3, 10132, 8144, 3, 3, UNI_WB__EB } /* wb=gaz */, - { 1, 4385, 0, 4, 0, UNI_TANG } /* tang */, - { 1, 3734, 0, 17, 0, UNI_INDICSIYAQNUMBERS } /* indicsiyaqnumbers */, - { 0, 9488, 4385, 4, 16, UNI_TANGUTCOMPONENTS } /* blk=tangutcomponents */, - { 8, 10048, 8756, 3, 4, UNI_NV__9000 } /* nv=9000 */, - { 6, 8780, 3457, 6, 18, UNI_TAIXUANJING } /* block=taixuanjingsymbols */, - { 2, 184, 3026, 3, 17, UNI_CHEROKEESUP } /* 
ischerokeesupplement */, - { 0, 9488, 8624, 4, 7, UNI_SUPPUAA } /* blk=suppuaa */, - { 1, 8774, 1025, 6, 2, -UNI_BIDIM } /* bidim=no */, - { 2, 7438, 108, 10, 2, UNI_WB__MB } /* wordbreak=mb */, - { 2, 1910, 0, 2, 0, UNI_CN } /* cn */, - { 4, 5564, 10135, 14, 3, UNI_QMARK } /* quotationmark=yes */, - { 1, 7218, 3, 11, 1, UNI_LB__LF } /* linebreak=lf */, - { 5, 4116, 5779, 3, 12, UNI_IPAEXT } /* isipaextensions */, - { 8, 9262, 138, 3, 2, UNI_SB__FO } /* sb=fo */, - { 0, 3097, 3439, 18, 5, UNI_DT__SML } /* decompositiontype=small */, - { 10, 8589, 6385, 7, 12, UNI_SC__GONM } /* script=masaramgondi */, - { 5, 4791, 2856, 3, 11, UNI_MONGOLIANSUP } /* inmongoliansup */, - { 2, 8780, 6397, 6, 12, UNI_MATHALPHANUM } /* block=mathalphanum */, - { 10, 8589, 2409, 7, 10, UNI_SC__GLAG } /* script=glagolitic */, - { 0, 8589, 9692, 7, 4, UNI_NSHU } /* script=nshu */, - { 0, 8780, 8491, 6, 7, UNI_INMARCHEN } /* block=marchen */, - { 4, 9488, 2329, 4, 20, UNI_INANATOLIANHIEROGLYPHS } /* blk=anatolianhieroglyphs */, - { 18, 3836, 9616, 17, 4, UNI_KTHI } /* scriptextensions=kthi */, - { 1, 6420, 6482, 3, 11, UNI_INOLDHUNGARIAN } /* inoldhungarian */, - { 0, 1505, 2254, 5, 5, UNI_GREEKEXT } /* ingreekext */, - { 2, 184, 8526, 2, 7, UNI_NB } /* isnoblock */, - { 0, 719, 0, 16, 0, UNI_CUNEIFORMNUMBERS } /* cuneiformnumbers */, - { 20, 9488, 2741, 4, 19, UNI_JAMOEXTB } /* blk=hanguljamoextendedb */, - { 0, 4688, 8259, 15, 8, UNI_IDENTIFIERTYPE__OBSOLETE } /* identifiertype=obsolete */, - { 8, 9488, 3921, 4, 9, UNI_ARABICSUP } /* blk=arabicsup */, - { 2, 5060, 10135, 14, 3, UNI_CI } /* caseignorable=yes */, - { 3, 9488, 7388, 4, 10, UNI_SUPARROWSB } /* blk=suparrowsb */, - { 9, 4033, 10178, 16, 2, UNI_ZP } /* generalcategory=zp */, - { 4, 8589, 8477, 7, 7, UNI_MAKA } /* script=makasar */, - { 0, 6469, 495, 12, 2, UNI_NT__NU } /* numerictype=nu */, - { 18, 10027, 5843, 3, 13, UNI_JG__MALAYALAMLLLA } /* jg=malayalamllla */, - { 0, 8780, 3052, 6, 9, UNI_HALFMARKS } /* block=halfmarks */, 
- { 2, 8780, 283, 6, 33, UNI_MISCMATHSYMBOLSB } /* block=miscellaneousmathematicalsymbolsb */, - { 3, 8978, 36, 6, 1, UNI__PERL_PATWS } /* patws=t */, - { 8, 3836, 8652, 17, 7, UNI_TAVT } /* scriptextensions=taiviet */, - { 5, 9444, 7408, 4, 10, UNI_AGE__NA } /* age=unassigned */, - { 10, 9260, 3, 5, 1, -UNI_IDSB } /* idsb=f */, - { 8, 4628, 865, 15, 1, UNI_EA__W } /* eastasianwidth=w */, - { 1, 9768, 6840, 4, 11, UNI_NAND } /* scx=nandinagari */, - { 2, 10048, 10146, 3, 2, UNI_NV__46 } /* nv=46 */, - { 2, 9230, 9836, 5, 4, UNI_CWCF } /* cwcf=true */, - { 4, 8894, 10135, 6, 3, UNI_JOINC } /* joinc=yes */, - { 3, 2032, 26, 22, 1, UNI__PERL_NCHAR } /* noncharactercodepoint=y */, - { 0, 184, 1066, 2, 2, UNI_CASEDLETTER } /* islc */, - { 4, 10048, 7877, 3, 2, UNI_NV__13 } /* nv=13 */, - { 0, 8780, 5214, 6, 14, UNI_KANGXI } /* block=kangxiradicals */, - { 0, 3836, 9320, 17, 5, UNI_OSGE } /* scriptextensions=osage */, - { 1, 10024, 0, 3, 0, UNI_gc_values_index } /* gc= */, - { 1, 21, 7594, 2, 9, UNI_LATINEXTD } /* inlatinextd */, - { 6, 9488, 5214, 4, 6, UNI_KANGXI } /* blk=kangxi */, - { 8, 9508, 3564, 4, 17, UNI_WB__EB } /* ccc=attachedbelowleft */, - { 26, 6193, 0, 4, 0, UNI_HEBR } /* hebr */, - { 2, 4289, 0, 16, 0, UNI_MYANMAREXTB } /* myanmarextendedb */, - { 4, 9277, 9804, 3, 4, UNI_SC__TALE } /* sc=tale */, - { 0, 9230, 3, 5, 1, -UNI_CWCF } /* cwcf=f */, - { 16, 6231, 7119, 3, 9, UNI_INCHORASMIAN } /* inchorasmian */, - { 2, 10048, 5648, 3, 2, UNI_NV__10 } /* nv=10 */, - { 0, 4916, 4402, 3, 8, UNI_TANGUTSUP } /* istangutsup */, - { 0, 8449, 10135, 7, 3, UNI_HYPHEN } /* hyphen=yes */, - { 16, 10182, 10270, 6, 9, UNI__PERL_ANY_FOLDS } /* _perl_any_folds */, - { 0, 10027, 9884, 3, 4, UNI_JG__ZAIN } /* jg=zain */, - { 12, 10250, 10265, 15, 5, UNI__PERL_CHARNAME_BEGIN } /* _perl_charname_begin */, - { 0, 3836, 719, 17, 9, UNI_XSUX } /* scriptextensions=cuneiform */, - { 0, 4033, 727, 16, 2, UNI_MN } /* generalcategory=mn */, - { 0, 184, 3044, 3, 17, UNI_HALFMARKS } /* 
iscombininghalfmarks */, - { 11, 7249, 1017, 4, 2, UNI_CAKM } /* iscakm */, - { 0, 7358, 0, 10, 0, UNI_SAUR } /* saurashtra */, - { 0, 10027, 5921, 3, 13, UNI_JG__MANICHAEANTEN } /* jg=manichaeanten */, - { 1, 9277, 2608, 3, 6, UNI_BRAH } /* sc=brahmi */, - { 0, 21, 4129, 2, 9, UNI_LATIN1 } /* inlatin1sup */, - { 0, 7531, 0, 9, 0, UNI_EMOTICONS } /* emoticons */, - { 13, 3836, 2608, 17, 4, UNI_BRAH } /* scriptextensions=brah */, - { 4, 9640, 9255, 4, 5, -UNI_LOE } /* loe=false */, - { 0, 8780, 3583, 8, 15, UNI_UCAS } /* block=canadiansyllabics */, - { 0, 9592, 0, 4, 0, UNI_HMNP } /* hmnp */, - { 9, 10027, 2637, 3, 3, UNI_JG__YEH } /* jg=yeh */, - { 3, 8780, 6939, 6, 11, UNI_INSORASOMPENG } /* block=sorasompeng */, - { 2, 6231, 6122, 3, 11, UNI_CYRILLICEXTC } /* incyrillicextc */, - { 4, 4033, 5817, 16, 13, UNI_ZL } /* generalcategory=lineseparator */, - { 1, 5791, 4733, 13, 15, UNI_JG__MANICHAEANALEPH } /* joininggroup=manichaeanaleph */, - { 1, 3836, 57, 17, 2, UNI_YI } /* scriptextensions=yi */, - { 5, 9444, 9396, 4, 4, UNI_AGE__12_DOT_1 } /* age=12.1 */, - { 1, 7318, 8043, 10, 3, UNI_IN__8 } /* presentin=8.0 */, - { 1, 5791, 6785, 13, 11, UNI_JG__MALAYALAMRA } /* joininggroup=malayalamra */, - { 0, 8870, 0, 5, 0, UNI_EPRES } /* epres */, - { 0, 8519, 26, 7, 1, UNI_DT__NONE } /* nfkdqc=y */, - { 2, 5578, 1823, 14, 5, UNI_SB__LO } /* sentencebreak=lower */, - { 1, 9277, 9728, 3, 4, UNI_MIAO } /* sc=plrd */, - { 0, 9008, 0, 6, 0, UNI_THAA } /* thaana */, - { 8, 25, 0, 1, 0, UNI_S } /* s */, - { 2, 4989, 8316, 3, 7, UNI_UGAR } /* isugaritic */, - { 0, 8984, 10135, 6, 3, UNI_QMARK } /* qmark=yes */, - { 0, 4718, 0, 15, 0, UNI_LOWERCASELETTER } /* lowercaseletter */, - { 0, 184, 4129, 2, 9, UNI_LATIN1 } /* islatin1sup */, - { 0, 8780, 2287, 6, 21, UNI_SINHALAARCHAICNUMBERS } /* block=sinhalaarchaicnumbers */, - { 0, 4033, 4718, 16, 15, UNI_LOWERCASELETTER } /* generalcategory=lowercaseletter */, - { 32, 8780, 867, 6, 11, UNI_PHONETICEXT } /* block=phoneticext */, - { 
0, 7218, 6193, 10, 12, UNI_LB__HL } /* linebreak=hebrewletter */, - { 1, 3133, 1, 18, 1, -UNI_EBASE } /* emojimodifierbase=n */, - { 0, 8780, 5606, 6, 14, UNI_SUPPUNCTUATION } /* block=suppunctuation */, - { 1, 1166, 0, 26, 0, UNI_di_values_index } /* defaultignorablecodepoint= */, - { 0, 10012, 9868, 3, 4, UNI_EA__W } /* ea=wide */, - { 1, 9488, 4479, 5, 6, UNI_BRAI } /* blk=braille */, - { 0, 9508, 3007, 4, 13, UNI_CCC__214 } /* ccc=attachedabove */, - { 1, 1417, 9161, 25, 4, UNI_CCC__26 } /* canonicalcombiningclass=ccc26 */, - { 0, 21, 8912, 2, 6, UNI_INKHOJKI } /* inkhojki */, - { 0, 8858, 26, 6, 1, UNI_ECOMP } /* ecomp=y */, - { 16, 9768, 9724, 4, 4, UNI_PHNX } /* scx=phnx */, - { 6, 9768, 8091, 4, 8, UNI_ARMN } /* scx=armenian */, - { 4, 9277, 8107, 3, 4, UNI_BALI } /* sc=bali */, - { 6, 10132, 10015, 3, 3, UNI_WB__EB } /* wb=ebg */, - { 0, 689, 0, 30, 0, UNI_CJKEXTG } /* cjkunifiedideographsextensiong */, - { 3, 6231, 3026, 3, 10, UNI_CHEROKEESUP } /* incherokeesup */, - { 1, 4703, 0, 15, 0, UNI_ARMI } /* imperialaramaic */, - { 0, 8589, 8924, 7, 6, UNI_LEPC } /* script=lepcha */, - { 0, 1552, 6035, 9, 2, UNI_PF } /* category=pf */, - { 18, 567, 0, 2, 0, UNI_NB } /* nb */, - { 4, 7218, 908, 10, 2, UNI_LB__PR } /* linebreak=pr */, - { 0, 4916, 9331, 3, 4, UNI_TALE } /* istaile */, - { 0, 21, 9038, 2, 6, UNI_INYEZIDI } /* inyezidi */, - { 6, 5986, 7789, 13, 2, UNI_NV__50 } /* numericvalue=50 */, - { 5, 10315, 3379, 5, 5, UNI_XPOSIXBLANK } /* horizspace */, - { 1, 184, 8841, 3, 5, UNI_CAKM } /* ischakma */, - { 1, 8884, 36, 4, 1, UNI_EXT } /* ext=t */, - { 0, 9768, 9812, 4, 4, UNI_TAML } /* scx=taml */, - { 0, 8780, 6620, 6, 6, UNI_DOMINO } /* block=domino */, - { 1, 8589, 8618, 8, 6, UNI_SOYO } /* script=soyombo */, - { 3, 3836, 2224, 17, 21, UNI_PRTI } /* scriptextensions=inscriptionalparthian */, - { 0, 8780, 43, 7, 2, UNI_CJK } /* block=cjk */, - { 0, 7318, 10078, 10, 3, UNI_IN__2_DOT_1 } /* presentin=v21 */, - { 5, 8780, 8359, 7, 6, UNI_CJKEXTB } /* 
block=cjkextb */, - { 6, 184, 3133, 2, 17, UNI_EBASE } /* isemojimodifierbase */, - { 0, 8780, 8912, 6, 6, UNI_INKHOJKI } /* block=khojki */, - { 0, 9277, 3785, 3, 10, UNI_SC__MANI } /* sc=manichaean */, - { 2, 10003, 36, 3, 1, UNI_CI } /* ci=t */, - { 1, 9277, 9512, 3, 4, UNI_CHRS } /* sc=chrs */, - { 3, 3367, 1, 18, 1, -UNI__PERL_PATWS } /* patternwhitespace=n */, - { 3, 8123, 0, 8, 0, UNI_BUGI } /* buginese */, - { 1, 10132, 4360, 3, 9, UNI_WB__EB } /* wb=emodifier */, - { 8, 8780, 2703, 6, 19, UNI_ENCLOSEDALPHANUMSUP } /* block=enclosedalphanumsup */, - { 1, 8780, 749, 6, 16, UNI_ENCLOSEDALPHANUM } /* block=enclosedalphanum */, - { 3, 8666, 0, 7, 0, UNI_TIRH } /* tirhuta */, - { 7, 9997, 10054, 3, 3, UNI_BC__PDF } /* bc=pdf */, - { 2, 8589, 9085, 7, 5, UNI_BATK } /* script=batak */, - { 1, 9488, 42, 4, 3, UNI_CJK } /* blk=cjk */, - { 1, 10033, 18, 3, 2, UNI_RI } /* lb=ri */, - { 1, 1188, 9003, 3, 5, UNI_INTELUGU } /* intelugu */, - { 17, 184, 1018, 2, 5, UNI_MUSIC } /* ismusic */, - { 3, 10024, 1587, 3, 1, UNI_Z } /* gc=z */, - { 1, 8491, 0, 4, 0, UNI_MARC } /* marc */, - { 14, 6231, 43, 3, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* incjkcompatibilityideographssupplement */, - { 0, 5037, 9836, 9, 4, UNI_XPOSIXXDIGIT } /* hexdigit=true */, - { 0, 6420, 7279, 3, 9, UNI_INOLDPERSIAN } /* inoldpersian */, - { 0, 9488, 8116, 5, 7, UNI_INBASSAVAH } /* blk=bassavah */, - { 6, 9235, 0, 4, 0, UNI_CWCM } /* cwcm */, - { 6, 9488, 7693, 4, 9, UNI_INSAMARITAN } /* blk=samaritan */, - { 8, 1417, 9206, 25, 4, UNI_CCC__35 } /* canonicalcombiningclass=ccc35 */, - { 0, 10296, 2, 3, 1, UNI_PI } /* ispi */, - { 2, 9768, 9464, 4, 4, UNI_ARMN } /* scx=armn */, - { 0, 5508, 3, 14, 1, -UNI_PATSYN } /* patternsyntax=f */, - { 0, 1008, 0, 2, 0, UNI_CI } /* ci */, - { 0, 9277, 7291, 3, 4, UNI_SC__SOGD } /* sc=sogd */, - { 11, 184, 6840, 2, 4, UNI_NAND } /* isnand */, - { 11, 8147, 1025, 8, 2, -UNI_EXTPICT } /* extpict=no */, - { 0, 184, 720, 3, 29, UNI_CUNEIFORMNUMBERS } /* 
iscuneiformnumbersandpunctuation */, - { 1, 5986, 7819, 13, 8, UNI_NV__3_SLASH_16 } /* numericvalue=1.88e-01 */, - { 0, 9488, 183, 4, 20, UNI_MISCSYMBOLS } /* blk=miscellaneoussymbols */, - { 0, 9488, 8407, 4, 7, UNI_DSRT } /* blk=deseret */, - { 0, 10129, 9255, 3, 5, -UNI_VS } /* vs=false */, - { 0, 5032, 3, 14, 1, -UNI_POSIXXDIGIT } /* asciihexdigit=f */, - { 1, 184, 5284, 2, 7, UNI_LISUSUP } /* islisusup */, - { 2, 9488, 8631, 4, 7, UNI_SUPPUAB } /* blk=suppuab */, - { 10, 1552, 7, 10, 1, UNI_SC } /* category=sc */, - { 4, 184, 720, 3, 15, UNI_CUNEIFORMNUMBERS } /* iscuneiformnumbers */, - { 10, 3151, 0, 18, 0, UNI_epres_values_index } /* emojipresentation= */, - { 6, 5791, 5382, 13, 14, UNI_JG__MANICHAEANQOPH } /* joininggroup=manichaeanqoph */, - { 1, 8267, 0, 8, 0, UNI_radical_values_index } /* radical= */, - { 3, 3374, 26, 11, 1, UNI_XPOSIXSPACE } /* whitespace=y */, - { 10, 9464, 0, 4, 0, UNI_ARMN } /* armn */, - { 3, 7028, 9039, 3, 3, UNI_YEZI } /* isyezi */, - { 1, 8780, 3026, 7, 7, UNI_INCHEROKEE } /* block=cherokee */, - { 0, 10063, 0, 3, 0, UNI_sd_values_index } /* sd= */, - { 2, 3836, 1537, 18, 3, UNI_SIND } /* scriptextensions=sind */, - { 0, 8894, 1, 6, 1, -UNI_JOINC } /* joinc=n */, - { 10, 10296, 9729, 3, 3, UNI_MIAO } /* isplrd */, - { 0, 9488, 2722, 4, 19, UNI_JAMOEXTA } /* blk=hanguljamoextendeda */, - { 1, 10009, 8948, 3, 6, UNI_DT__NAR } /* dt=narrow */, - { 1, 8780, 6884, 6, 11, UNI_INPAHAWHHMONG } /* block=pahawhhmong */, - { 2, 3836, 7308, 17, 10, UNI_PHNX } /* scriptextensions=phoenician */, - { 0, 9235, 36, 5, 1, UNI_CWCM } /* cwcm=t */, - { 8, 8589, 9688, 7, 4, UNI_NKO } /* script=nkoo */, - { 1, 9508, 7078, 4, 10, UNI_CCC__BR } /* ccc=belowright */, - { 4, 6133, 0, 12, 0, UNI_ETHIOPICEXTA } /* ethiopicexta */, - { 1, 10033, 10164, 3, 2, UNI_GCB__V } /* lb=jv */, - { 3, 9768, 1222, 4, 4, UNI_KANA } /* scx=kana */, - { 0, 10048, 9060, 3, 5, UNI_NV__11_SLASH_12 } /* nv=11/12 */, - { 2, 4033, 48, 16, 1, UNI_P } /* generalcategory=p */, - { 
7, 9997, 4321, 3, 16, UNI_BC__S } /* bc=segmentseparator */, - { 1, 9768, 9828, 4, 4, UNI_THAI } /* scx=thai */, - { 0, 184, 5508, 2, 13, UNI_PATSYN } /* ispatternsyntax */, - { 0, 9277, 2912, 3, 4, UNI_SUND } /* sc=sund */, - { 0, 3836, 9532, 17, 4, UNI_CYRL } /* scriptextensions=cyrl */, - { 1, 184, 43, 3, 15, UNI_CJKCOMPAT } /* iscjkcompatibility */, - { 2, 3529, 1, 18, 1, -UNI_VS } /* variationselector=n */, - { 0, 9768, 9668, 4, 4, UNI_MTEI } /* scx=mtei */, - { 0, 8589, 9752, 7, 4, UNI_SC__ROHG } /* script=rohg */, - { 14, 4583, 0, 4, 0, UNI_DASH } /* dash */, - { 6, 5986, 10152, 13, 2, UNI_NV__49 } /* numericvalue=49 */, - { 0, 184, 1060, 3, 3, UNI_COPT } /* iscopt */, - { 7, 117, 1908, 4, 14, UNI_INDICNUMBERFORMS } /* inindicnumberforms */, - { 3, 1899, 0, 2, 0, UNI_PC } /* pc */, - { 0, 7155, 5187, 3, 13, UNI_HIGHSURROGATES } /* ishighsurrogates */, - { 1, 2182, 34, 21, 2, UNI_GCB__EX } /* graphemeclusterbreak=ex */, - { 0, 10048, 7754, 3, 2, UNI_NV__11 } /* nv=11 */, - { 2, 3259, 0, 18, 0, UNI_idsb_values_index } /* idsbinaryoperator= */, - { 0, 21, 1677, 2, 9, UNI_LATINEXTE } /* inlatinexte */, - { 0, 8589, 2061, 7, 4, UNI_SC__MODI } /* script=modi */, - { 6, 7158, 1025, 10, 2, -UNI_DIA } /* diacritic=no */, - { 0, 10296, 909, 3, 9, UNI_CO } /* isprivateuse */, - { 0, 1417, 9201, 25, 4, UNI_CCC__34 } /* canonicalcombiningclass=ccc34 */, - { 0, 7739, 26, 8, 1, UNI_IDS } /* idstart=y */, - { 0, 809, 0, 22, 0, UNI_ENCLOSEDIDEOGRAPHICSUP } /* enclosedideographicsup */, - { 3, 9277, 2203, 3, 14, UNI_SC__ROHG } /* sc=hanifirohingya */, - { 8, 1537, 4600, 4, 13, UNI_DIACRITICALSEXT } /* indiacriticalsext */, - { 10, 3836, 9038, 17, 4, UNI_YEZI } /* scriptextensions=yezi */, - { 15, 9997, 3403, 3, 18, UNI_BC__RLI } /* bc=righttoleftisolate */, - { 0, 184, 6928, 2, 10, UNI_SD } /* issoftdotted */, - { 12, 9444, 9, 4, 2, UNI_AGE__NA } /* age=na */, - { 0, 21, 5256, 2, 14, UNI_LATINEXTD } /* inlatinextendedd */, - { 1, 7739, 9255, 8, 5, -UNI_IDS } /* idstart=false 
*/, - { 3, 184, 3937, 2, 4, UNI_BOPO } /* isbopo */, - { 22, 10290, 10303, 6, 5, UNI_XPOSIXBLANK } /* xposixblank */, - { 1, 3151, 3, 18, 1, -UNI_EPRES } /* emojipresentation=f */, - { 1, 5037, 36, 9, 1, UNI_XPOSIXXDIGIT } /* hexdigit=t */, - { 1, 3025, 0, 18, 0, UNI_CHEROKEESUP } /* cherokeesupplement */, - { 0, 7155, 4066, 3, 15, UNI_HALFANDFULLFORMS } /* ishalfandfullforms */, - { 0, 10340, 3379, 6, 5, UNI_VERTSPACE } /* isvertspace */, - { 4, 10012, 9, 3, 2, UNI_EA__NA } /* ea=na */, - { 6, 8780, 8990, 6, 6, UNI_INREJANG } /* block=rejang */, - { 0, 7228, 36, 10, 1, UNI_XPOSIXLOWER } /* lowercase=t */, - { 8, 3836, 9860, 17, 4, UNI_VAI } /* scriptextensions=vaii */, - { 0, 1417, 8799, 25, 5, UNI_CCC__107 } /* canonicalcombiningclass=ccc107 */, - { 1, 6231, 6110, 3, 11, UNI_CYRILLICEXTB } /* incyrillicextb */, - { 0, 9444, 7826, 4, 4, UNI_AGE__12 } /* age=12.0 */, - { 4, 1812, 10135, 22, 3, UNI_CWL } /* changeswhenlowercased=yes */, - { 0, 406, 0, 7, 0, UNI_XPOSIXCNTRL } /* control */, - { 1, 9488, 6884, 4, 11, UNI_INPAHAWHHMONG } /* blk=pahawhhmong */, - { 11, 8589, 9480, 7, 4, UNI_BATK } /* script=batk */, - { 3, 5739, 9255, 13, 5, -UNI_GRBASE } /* graphemebase=false */, - { 7, 8589, 8840, 7, 6, UNI_SC__CAKM } /* script=chakma */, - { 0, 9488, 7398, 4, 10, UNI_SUPARROWSC } /* blk=suparrowsc */, - { 0, 9768, 2409, 4, 4, UNI_GLAG } /* scx=glag */, - { 1, 9277, 2287, 3, 7, UNI_SC__SINH } /* sc=sinhala */, - { 12, 10024, 339, 3, 2, UNI_LO } /* gc=lo */, - { 0, 7438, 125, 10, 2, UNI_LB__CR } /* wordbreak=cr */, - { 0, 9277, 2855, 3, 9, UNI_SC__MONG } /* sc=mongolian */, - { 1, 8414, 0, 7, 0, UNI_ELBA } /* elbasan */, - { 0, 10296, 2571, 3, 3, UNI_PRTI } /* isprti */, - { 1, 3836, 3025, 17, 8, UNI_CHER } /* scriptextensions=cherokee */, - { 1, 1591, 3170, 3, 7, UNI_INETHIOPIC } /* inethiopic */, - { 0, 8780, 6620, 6, 11, UNI_DOMINO } /* block=dominotiles */, - { 0, 1417, 9166, 25, 4, UNI_CCC__27 } /* canonicalcombiningclass=ccc27 */, - { 2, 4116, 3278, 3, 17, UNI_PI 
} /* isinitialpunctuation */, - { 18, 8888, 0, 4, 0, UNI_HATR } /* hatr */, - { 0, 8589, 7292, 8, 6, UNI_SC__SOGD } /* script=sogdian */, - { 3, 4791, 2062, 3, 3, UNI_INMODI } /* inmodi */, - { 1, 2218, 9689, 3, 2, UNI_INNKO } /* innko */, - { 4, 8930, 9255, 6, 5, -UNI_XPOSIXLOWER } /* lower=false */, - { 1, 3836, 1654, 17, 6, UNI_HANG } /* scriptextensions=hangul */, - { 2, 8780, 1466, 7, 23, UNI_DIACRITICALSFORSYMBOLS } /* block=combiningmarksforsymbols */, - { 2, 8589, 8936, 7, 4, UNI_LYCI } /* script=lyci */, - { 6, 184, 7, 3, 1, UNI_XPOSIXCNTRL } /* iscc */, - { 1, 9277, 8786, 3, 4, UNI_CARI } /* sc=cari */, - { 2, 184, 114, 3, 24, UNI_DIACRITICALS } /* iscombiningdiacriticalmarks */, - { 5, 9488, 7278, 4, 10, UNI_INOLDPERSIAN } /* blk=oldpersian */, - { 20, 1552, 206, 9, 2, UNI_PI } /* category=pi */, - { 1, 9508, 10172, 4, 2, UNI_CCC__9 } /* ccc=vr */, - { 0, 184, 1442, 3, 23, UNI_CJKSYMBOLS } /* iscjksymbolsandpunctuation */, - { 2, 10024, 598, 3, 2, UNI_XPOSIXCNTRL } /* gc=cc */, - { 14, 7325, 10096, 3, 3, UNI_IN__5 } /* in=v50 */, - { 0, 9277, 8680, 3, 7, UNI_ZZZZ } /* sc=unknown */, - { 0, 9270, 2555, 5, 6, UNI_INPC__BOTTOM } /* inpc=bottom */, - { 4, 8589, 1176, 8, 3, UNI_SORA } /* script=sora */, - { 2, 659, 0, 30, 0, UNI_CJKEXTF } /* cjkunifiedideographsextensionf */, - { 0, 8960, 17, 7, 1, UNI_COMPEX } /* nfcqc=no */, - { 1, 1417, 9468, 24, 4, UNI_CCC__216 } /* canonicalcombiningclass=atar */, - { 4, 8694, 1025, 7, 2, -UNI_XPOSIXSPACE } /* wspace=no */, - { 0, 9888, 0, 4, 0, UNI_ZANB } /* zanb */, - { 14, 8780, 3341, 6, 8, UNI_DINGBATS } /* block=dingbats */, - { 1, 7218, 5746, 10, 5, UNI_EBASE } /* linebreak=ebase */, - { 1, 8575, 1, 7, 1, -UNI_PATSYN } /* patsyn=n */, - { 0, 10048, 9380, 3, 4, UNI_NV__1_SLASH_80 } /* nv=1/80 */, - { 3, 9800, 0, 4, 0, UNI_TAGS } /* tags */, - { 1, 10290, 5039, 6, 6, UNI_XPOSIXXDIGIT } /* xposixxdigit */, - { 0, 9488, 2874, 4, 19, UNI_OTTOMANSIYAQNUMBERS } /* blk=ottomansiyaqnumbers */, - { 1, 9997, 6049, 3, 12, 
UNI_BC__AN } /* bc=arabicnumber */, - { 0, 4916, 8292, 3, 7, UNI_TAGB } /* istagbanwa */, - { 1, 4628, 0, 15, 0, UNI_ea_values_index } /* eastasianwidth= */, - { 0, 184, 8924, 2, 6, UNI_LEPC } /* islepcha */, - { 0, 7693, 0, 9, 0, UNI_SAMR } /* samaritan */, - { 0, 7318, 10075, 10, 3, UNI_IN__2 } /* presentin=v20 */, - { 5, 9488, 1294, 4, 25, UNI_SUPERANDSUB } /* blk=superscriptsandsubscripts */, - { 0, 10048, 7859, 3, 4, UNI_NV__2000 } /* nv=2000 */, - { 12, 21, 7188, 2, 10, UNI_INKHAROSHTHI } /* inkharoshthi */, - { 7, 3836, 3937, 17, 8, UNI_BOPO } /* scriptextensions=bopomofo */, - { 0, 9556, 6178, 4, 3, UNI_LB__ZWJ } /* gcb=zwj */, - { 2, 184, 149, 3, 34, UNI_DIACRITICALSSUP } /* iscombiningdiacriticalmarkssupplement */, - { 14, 6420, 4869, 3, 14, UNI_NARB } /* inoldnortharabian */, - { 0, 10030, 0, 4, 0, UNI_JT__L } /* jt=l */, - { 1, 2203, 0, 14, 0, UNI_ROHG } /* hanifirohingya */, - { 1, 5791, 6346, 13, 3, UNI_JG__NYA } /* joininggroup=nya */, - { 0, 8780, 6505, 6, 8, UNI_PHAISTOS } /* block=phaistos */, - { 4, 184, 9684, 2, 4, UNI_NEWA } /* isnewa */, - { 32, 4033, 908, 16, 10, UNI_CO } /* generalcategory=privateuse */, - { 12, 9277, 9484, 3, 4, UNI_BHKS } /* sc=bhks */, - { 5, 509, 0, 20, 0, UNI_CJK } /* cjkunifiedideographs */, - { 1, 10027, 7048, 3, 10, UNI_JG__AFRICANQAF } /* jg=africanqaf */, - { 0, 7438, 5851, 10, 2, UNI_WB__ML } /* wordbreak=ml */, - { 3, 9612, 0, 4, 0, UNI_KNDA } /* knda */, - { 1, 9488, 148, 4, 35, UNI_DIACRITICALSSUP } /* blk=combiningdiacriticalmarkssupplement */, - { 3, 7325, 7755, 3, 3, UNI_IN__1_DOT_1 } /* in=1.1 */, - { 0, 1552, 32, 9, 2, UNI__PERL_SURROGATE } /* category=cs */, - { 2, 9508, 6445, 4, 12, UNI_CCC__0 } /* ccc=notreordered */, - { 0, 2218, 7631, 3, 8, UNI_INNEWTAILUE } /* innewtailue */, - { 4, 9488, 8227, 4, 8, UNI_KANAEXTA } /* blk=kanaexta */, - { 0, 1988, 1025, 22, 2, -UNI_LOE } /* logicalorderexception=no */, - { 26, 8960, 47, 6, 1, UNI_NFCQC__M } /* nfcqc=m */, - { 0, 5986, 7859, 13, 3, UNI_NV__200 } /* 
numericvalue=200 */, - { 4, 3937, 0, 4, 0, UNI_BOPO } /* bopo */, - { 0, 8894, 9255, 6, 5, -UNI_JOINC } /* joinc=false */, - { 0, 21, 8924, 2, 6, UNI_INLEPCHA } /* inlepcha */, - { 0, 6553, 0, 12, 0, UNI_xidc_values_index } /* xidcontinue= */, - { 7, 7076, 4449, 3, 4, UNI_INBAMUM } /* inbamum */, - { 1, 10027, 4773, 3, 3, UNI_JG__SAD } /* jg=sad */, - { 0, 7218, 10174, 10, 2, UNI_LB__XX } /* linebreak=xx */, - { 0, 8780, 5284, 6, 7, UNI_LISUSUP } /* block=lisusup */, - { 0, 5578, 9080, 14, 5, UNI_SB__AT } /* sentencebreak=aterm */, - { 0, 10033, 4360, 3, 9, UNI_EMOD } /* lb=emodifier */, - { 1, 9277, 1536, 3, 4, UNI_SC__SIND } /* sc=sind */, - { 1, 8589, 8484, 7, 7, UNI_SC__MAND } /* script=mandaic */, - { 0, 3385, 0, 18, 0, UNI_ri_values_index } /* regionalindicator= */, - { 6, 3836, 9888, 17, 4, UNI_ZANB } /* scriptextensions=zanb */, - { 4, 9768, 2560, 4, 4, UNI_MAND } /* scx=mand */, - { 0, 6517, 0, 12, 0, UNI_PLAYINGCARDS } /* playingcards */, - { 1, 8780, 43, 7, 25, UNI_CJKCOMPATIDEOGRAPHS } /* block=cjkcompatibilityideographs */, - { 3, 8147, 0, 9, 0, -UNI_EXTPICT } /* extpict=f */, - { 0, 8780, 6517, 6, 12, UNI_PLAYINGCARDS } /* block=playingcards */, - { 1, 10027, 5856, 3, 13, UNI_JG__MALAYALAMNNNA } /* jg=malayalamnnna */, - { 1, 6420, 3332, 3, 17, UNI_ORNAMENTALDINGBATS } /* inornamentaldingbats */, - { 0, 9277, 497, 5, 3, UNI_KHMR } /* sc=khmer */, - { 0, 8780, 8942, 6, 6, UNI_INLYDIAN } /* block=lydian */, - { 1, 9488, 749, 4, 21, UNI_ENCLOSEDALPHANUM } /* blk=enclosedalphanumerics */, - { 0, 4033, 132, 16, 2, UNI_LM } /* generalcategory=lm */, - { 0, 8780, 3457, 6, 11, UNI_TAIXUANJING } /* block=taixuanjing */, - { 2, 2224, 896, 3, 27, UNI_SUPPUAA } /* insupplementaryprivateuseareaa */, - { 0, 3379, 1025, 6, 2, -UNI_XPOSIXSPACE } /* space=no */, - { 0, 1812, 26, 22, 1, UNI_CWL } /* changeswhenlowercased=y */, - { 0, 9768, 9680, 4, 4, UNI_NBAT } /* scx=nbat */, - { 0, 4791, 393, 3, 2, UNI_INMRO } /* inmro */, - { 1, 184, 9664, 2, 3, UNI_MRO } /* ismro 
*/, - { 2, 9488, 5804, 4, 13, UNI_KANAEXTA } /* blk=kanaextendeda */, - { 0, 10132, 0, 3, 0, UNI_wb_values_index } /* wb= */, - { 0, 8924, 0, 4, 0, UNI_LEPC } /* lepc */, - { 6, 8659, 0, 7, 0, UNI_TIBT } /* tibetan */, - { 2, 184, 1060, 3, 5, UNI_COPT } /* iscoptic */, - { 22, 9508, 9026, 4, 6, UNI_CCC__9 } /* ccc=virama */, - { 1, 9270, 868, 3, 10, UNI_PHONETICEXT } /* inphoneticext */, - { 0, 1677, 0, 5, 0, UNI_LATN } /* latin */, - { 1, 3385, 9836, 18, 4, UNI_RI } /* regionalindicator=true */, - { 0, 1790, 36, 22, 1, UNI_CWCM } /* changeswhencasemapped=t */, - { 3, 8589, 9660, 7, 4, UNI_SC__MLYM } /* script=mlym */, - { 0, 10033, 6169, 3, 4, UNI_LB__GL } /* lb=glue */, - { 4, 1537, 2988, 24, 19, UNI_INPC__TOPANDBOTTOMANDLEFT } /* indicpositionalcategory=topandbottomandleft */, - { 3, 5791, 3819, 13, 17, UNI_JG__MANICHAEANTHAMEDH } /* joininggroup=manichaeanthamedh */, - { 4, 5986, 10150, 13, 2, UNI_NV__48 } /* numericvalue=48 */, - { 4, 184, 6796, 2, 11, UNI_MEDF } /* ismedefaidrin */, - { 18, 3382, 36, 3, 1, UNI_CE } /* ce=t */, - { 8, 10048, 7978, 3, 2, UNI_NV__16 } /* nv=16 */, - { 1, 7438, 73, 10, 2, UNI_WB__EB } /* wordbreak=em */, - { 2, 1417, 9196, 25, 4, UNI_CCC__33 } /* canonicalcombiningclass=ccc33 */, - { 19, 9768, 9620, 4, 4, UNI_LANA } /* scx=lana */, - { 2, 3382, 10135, 3, 3, UNI_CE } /* ce=yes */, - { 17, 8780, 4883, 6, 15, UNI_SARB } /* block=oldsoutharabian */, - { 17, 8243, 0, 8, 0, UNI_MAHJ } /* mahajani */, - { 1, 5674, 0, 13, 0, UNI_bidim_values_index } /* bidimirrored= */, - { 2, 9488, 867, 4, 18, UNI_PHONETICEXT } /* blk=phoneticextensions */, - { 0, 6229, 36, 12, 1, UNI_JOINC } /* joincontrol=t */, - { 16, 3836, 9576, 17, 4, UNI_GURU } /* scriptextensions=guru */, - { 4, 5791, 5620, 13, 10, UNI_JG__TEHMARBUTA } /* joininggroup=tehmarbuta */, - { 2, 10048, 9055, 3, 4, UNI_NV__1_SLASH_32 } /* nv=1/32 */, - { 0, 21, 5270, 2, 14, UNI_LATINEXTE } /* inlatinextendede */, - { 1, 10030, 0, 3, 1, UNI_JT__U } /* jt=u */, - { 0, 184, 9226, 3, 4, 
UNI_XPOSIXCNTRL } /* iscntrl */, - { 0, 7218, 25, 10, 2, UNI_LB__SY } /* linebreak=sy */, - { 7, 3097, 10066, 18, 3, UNI_DT__SML } /* decompositiontype=sml */, - { 12, 184, 9533, 3, 3, UNI_CYRL } /* iscyrl */, - { 1, 4791, 2856, 3, 18, UNI_MONGOLIANSUP } /* inmongoliansupplement */, - { 10, 4658, 9836, 15, 4, UNI_GREXT } /* graphemeextend=true */, - { 9, 7218, 10156, 10, 2, UNI_LB__BK } /* linebreak=bk */, - { 1, 9488, 4673, 4, 15, UNI_INHANGUL } /* blk=hangulsyllables */, - { 3, 184, 2010, 2, 22, UNI_MISCTECHNICAL } /* ismiscellaneoustechnical */, - { 3, 4033, 5592, 16, 14, UNI_ZS } /* generalcategory=spaceseparator */, - { 1, 10048, 9413, 3, 3, UNI_NV__7_SLASH_2 } /* nv=7/2 */, - { 0, 7088, 3773, 10, 3, UNI_BC__RLI } /* bidiclass=rli */, - { 4, 9488, 3683, 4, 17, UNI_ETHIOPICEXTA } /* blk=ethiopicextendeda */, - { 2, 9230, 26, 5, 1, UNI_CWCF } /* cwcf=y */, - { 0, 8589, 9002, 7, 6, UNI_SC__TELU } /* script=telugu */, - { 0, 10009, 45, 3, 6, UNI_DT__COM } /* dt=compat */, - { 0, 9240, 9255, 5, 5, -UNI_DASH } /* dash=false */, - { 0, 10024, 4718, 3, 15, UNI_LOWERCASELETTER } /* gc=lowercaseletter */, - { 1, 5986, 8720, 13, 3, UNI_NV__400 } /* numericvalue=400 */, - { 0, 2280, 9316, 3, 4, UNI_ORYA } /* isoriya */, - { 0, 3374, 1025, 11, 2, -UNI_XPOSIXSPACE } /* whitespace=no */, - { 1, 8688, 2314, 3, 3, UNI_POSIXXDIGIT } /* isahex */, - { 6, 9768, 9664, 4, 4, UNI_MRO } /* scx=mroo */, - { 0, 9768, 2855, 4, 9, UNI_MONG } /* scx=mongolian */, - { 0, 8780, 6086, 7, 11, UNI_CHESSSYMBOLS } /* block=chesssymbols */, - { 3, 184, 895, 2, 28, UNI_SUPPUAA } /* issupplementaryprivateuseareaa */, - { 8, 8882, 10135, 6, 3, UNI_GREXT } /* grext=yes */, - { 0, 9768, 9748, 4, 4, UNI_RJNG } /* scx=rjng */, - { 2, 8780, 690, 7, 29, UNI_CJKEXTG } /* block=cjkunifiedideographsextensiong */, - { 8, 2218, 8527, 3, 6, UNI_NB } /* innoblock */, - { 2, 8589, 9664, 7, 3, UNI_MRO } /* script=mro */, - { 0, 10063, 9255, 3, 5, -UNI_SD } /* sd=false */, - { 20, 4033, 106, 16, 6, UNI_S } /* 
generalcategory=symbol */, - { 2, 10027, 9456, 3, 4, UNI_JG__ALEF } /* jg=alef */, - { 0, 4916, 9009, 3, 5, UNI_THAA } /* isthaana */, - { 7, 7325, 7827, 3, 3, UNI_IN__2 } /* in=2.0 */, - { 0, 1417, 9131, 25, 4, UNI_CCC__20 } /* canonicalcombiningclass=ccc20 */, - { 1, 3374, 0, 10, 0, UNI_XPOSIXSPACE } /* whitespace */, - { 2, 184, 1700, 2, 23, UNI_SHORTHANDFORMATCONTROLS } /* isshorthandformatcontrols */, - { 0, 8638, 0, 7, 0, UNI_TGLG } /* tagalog */, - { 9, 8780, 9002, 6, 6, UNI_INTELUGU } /* block=telugu */, - { 10, 9488, 1654, 4, 6, UNI_INHANGUL } /* blk=hangul */, - { 4, 9488, 8610, 4, 7, UNI_INSIDDHAM } /* blk=siddham */, - { 1, 10012, 4471, 3, 7, UNI_EA__N } /* ea=neutral */, - { 1, 3836, 9732, 17, 4, UNI_PRTI } /* scriptextensions=prti */, - { 1, 184, 1218, 2, 26, UNI_KATAKANAEXT } /* iskatakanaphoneticextensions */, - { 7, 9277, 7569, 5, 7, UNI_SC__SIND } /* sc=khudawadi */, - { 0, 10291, 62, 5, 5, UNI_POSIXGRAPH } /* posixgraph */, - { 23, 184, 6620, 2, 11, UNI_DOMINO } /* isdominotiles */, - { 0, 9896, 0, 4, 0, UNI_ZYYY } /* zyyy */, - { 0, 10027, 5354, 3, 14, UNI_JG__MANICHAEANHETH } /* jg=manichaeanheth */, - { 4, 5986, 7468, 13, 9, UNI_NV___MINUS_1_SLASH_2 } /* numericvalue=-5.00e-01 */, - { 0, 10048, 8043, 3, 8, UNI_NV__4_SLASH_5 } /* nv=8.00e-01 */, - { 0, 3836, 7657, 17, 9, UNI_PERM } /* scriptextensions=oldpermic */, - { 1, 184, 1835, 3, 20, UNI_CWT } /* ischangeswhentitlecased */, - { 4, 9488, 1677, 4, 23, UNI_LATINEXTADDITIONAL } /* blk=latinextendedadditional */, - { 1, 2280, 9709, 3, 3, UNI_ORYA } /* isorya */, - { 2, 3836, 8924, 17, 6, UNI_LEPC } /* scriptextensions=lepcha */, - { 1, 9768, 6193, 4, 4, UNI_HEBR } /* scx=hebr */, - { 2, 9488, 5816, 5, 7, UNI_INBALINESE } /* blk=balinese */, - { 1, 9508, 2455, 4, 5, UNI_CCC__R } /* ccc=right */, - { 0, 1677, 0, 9, 0, UNI_LATINEXTE } /* latinexte */, - { 0, 9277, 2409, 3, 4, UNI_SC__GLAG } /* sc=glag */, - { 2, 9488, 5522, 4, 14, UNI_PHONETICEXTSUP } /* blk=phoneticextsup */, - { 0, 7438, 6917, 
10, 11, UNI_WB__SQ } /* wordbreak=singlequote */, - { 1, 2182, 5633, 21, 2, UNI_LB__H2 } /* graphemeclusterbreak=lv */, - { 40, 6231, 3026, 3, 17, UNI_CHEROKEESUP } /* incherokeesupplement */, - { 6, 467, 0, 5, 0, UNI_P } /* punct */, - { 1, 10024, 5817, 3, 13, UNI_ZL } /* gc=lineseparator */, - { 0, 9768, 8337, 4, 7, UNI_AVST } /* scx=avestan */, - { 1, 184, 114, 3, 34, UNI_DIACRITICALSFORSYMBOLS } /* iscombiningdiacriticalmarksforsymbols */, - { 4, 9488, 1513, 4, 24, UNI_HIGHPUSURROGATES } /* blk=highprivateusesurrogates */, - { 0, 9277, 4001, 3, 7, UNI_SC__CPRT } /* sc=cypriot */, - { 0, 5986, 9380, 13, 4, UNI_NV__1_SLASH_80 } /* numericvalue=1/80 */, - { 0, 10291, 5040, 5, 5, UNI_POSIXDIGIT } /* posixdigit */, - { 6, 8589, 9310, 7, 5, UNI_OGAM } /* script=ogham */, - { 0, 184, 2245, 2, 21, UNI_MEETEIMAYEKEXT } /* ismeeteimayekextensions */, - { 1, 3836, 8442, 17, 7, UNI_HANO } /* scriptextensions=hanunoo */, - { 1, 6241, 7258, 12, 10, UNI_JT__U } /* joiningtype=nonjoining */, - { 2, 10009, 4017, 3, 5, UNI_DT__FIN } /* dt=final */, - { 9, 3836, 6277, 17, 4, UNI_MAHJ } /* scriptextensions=mahj */, - { 3, 4989, 1129, 3, 3, UNI_UCAS } /* isucas */, - { 2, 8509, 2705, 4, 17, UNI_ENCLOSEDALPHANUMSUP } /* inenclosedalphanumsup */, - { 5, 10051, 0, 3, 0, UNI_OCR } /* ocr */, - { 1, 3717, 8330, 17, 7, UNI_IDENTIFIERSTATUS__ALLOWED } /* identifierstatus=allowed */, - { 0, 9768, 1628, 4, 4, UNI_PHAG } /* scx=phag */, - { 1, 10024, 6265, 3, 12, UNI_NL } /* gc=letternumber */, - { 0, 8996, 9837, 7, 3, UNI_STERM } /* sterm=true */, - { 0, 9488, 3683, 4, 11, UNI_ETHIOPICEXT } /* blk=ethiopicext */, - { 1, 9768, 6484, 4, 4, UNI_HUNG } /* scx=hung */, - { 9, 9038, 0, 6, 0, UNI_YEZI } /* yezidi */, - { 0, 6231, 7129, 3, 9, UNI_CJKSTROKES } /* incjkstrokes */, - { 2, 10033, 0, 3, 0, UNI_lb_values_index } /* lb= */, - { 0, 8960, 0, 7, 0, UNI_COMPEX } /* nfcqc=n */, - { 0, 1189, 5713, 3, 7, UNI_XPOSIXDIGIT } /* nt=decimal */, - { 4, 6241, 6, 12, 1, UNI_JT__D } /* joiningtype=d */, 
- { 0, 9277, 4883, 3, 15, UNI_SARB } /* sc=oldsoutharabian */, - { 0, 6805, 206, 6, 11, UNI_MISCPICTOGRAPHS } /* inmiscpictographs */, - { 8, 10024, 467, 3, 11, UNI_P } /* gc=punctuation */, - { 9, 9768, 8187, 4, 4, UNI_HIRA } /* scx=hira */, - { 4, 184, 7513, 2, 9, UNI_BHKS } /* isbhaiksuki */, - { 2, 5986, 9376, 13, 4, UNI_NV__1_SLASH_64 } /* numericvalue=1/64 */, - { 21, 9488, 7531, 4, 9, UNI_EMOTICONS } /* blk=emoticons */, - { 6, 7684, 0, 4, 0, UNI_PAUC } /* pauc */, - { 12, 4273, 0, 7, 0, UNI_MYMR } /* myanmar */, - { 12, 7657, 0, 9, 0, UNI_PERM } /* oldpermic */, - { 0, 6231, 510, 3, 19, UNI_CJK } /* incjkunifiedideographs */, - { 8, 184, 9644, 2, 4, UNI_MEDF } /* ismedf */, - { 3, 951, 0, 18, 0, UNI_INVS } /* variationselectors */, - { 0, 8780, 5018, 6, 14, UNI_ANCIENTSYMBOLS } /* block=ancientsymbols */, - { 5, 1417, 3015, 24, 10, UNI_CCC__AR } /* canonicalcombiningclass=aboveright */, - { 1, 4116, 3260, 3, 3, UNI_IDSB } /* isidsb */, - { 68, 1966, 2389, 22, 20, UNI_INSC__CONSONANTWITHSTACKER } /* indicsyllabiccategory=consonantwithstacker */, - { 3, 10126, 18, 3, 1, UNI_VO__R } /* vo=r */, - { 8, 8688, 9441, 3, 3, UNI_ADLM } /* isadlm */, - { 6, 9277, 2608, 3, 4, UNI_BRAH } /* sc=brah */, - { 10, 10333, 6, 3, 1, UNI_SD } /* issd */, - { 0, 4033, 27, 16, 2, UNI_LOWERCASELETTER } /* generalcategory=ll */, - { 9, 5791, 4778, 13, 15, UNI_JG__MANICHAEANZAYIN } /* joininggroup=manichaeanzayin */, - { 0, 8780, 1631, 6, 15, UNI_GEOMETRICSHAPES } /* block=geometricshapes */, - { 0, 8870, 0, 6, 0, UNI_epres_values_index } /* epres= */, - { 1, 9716, 36, 4, 1, UNI_PCM } /* pcm=t */, - { 0, 3836, 8498, 17, 7, UNI_MULT } /* scriptextensions=multani */, - { 0, 184, 4360, 2, 4, UNI_EMOD } /* isemod */, - { 0, 10033, 42, 3, 2, UNI_LB__CJ } /* lb=cj */, - { 1, 5986, 8744, 13, 4, UNI_NV__7000 } /* numericvalue=7000 */, - { 0, 1591, 7533, 4, 7, UNI_EMOTICONS } /* inemoticons */, - { 2, 9488, 10051, 4, 3, UNI_OCR } /* blk=ocr */, - { 9, 9768, 7292, 5, 3, UNI_SOGD } /* 
scx=sogd */, - { 0, 9768, 9564, 4, 4, UNI_GONM } /* scx=gonm */, - { 2, 3836, 8477, 17, 7, UNI_MAKA } /* scriptextensions=makasar */, - { 34, 3836, 6973, 18, 10, UNI_SYLO } /* scriptextensions=sylotinagri */, - { 2, 1417, 4134, 24, 1, UNI_CCC__1 } /* canonicalcombiningclass=1 */, - { 9, 9556, 6763, 4, 3, UNI_LB__H3 } /* gcb=lvt */, - { 0, 184, 1585, 2, 23, UNI_BYZANTINEMUSIC } /* isbyzantinemusicalsymbols */, - { 0, 1537, 0, 24, 0, UNI_inpc_values_index } /* indicpositionalcategory= */, - { 0, 1979, 4720, 11, 13, UNI_LOWERCASELETTER } /* category=lowercaseletter */, - { 0, 5986, 9404, 13, 4, UNI_NV__13_SLASH_2 } /* numericvalue=13/2 */, - { 0, 8780, 779, 6, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* block=symbolsandpictographsextendeda */, - { 17, 9277, 8428, 3, 4, UNI_SC__GRAN } /* sc=gran */, - { 0, 9768, 9692, 4, 4, UNI_NSHU } /* scx=nshu */, - { 0, 4273, 0, 16, 0, UNI_MYANMAREXTA } /* myanmarextendeda */, - { 0, 7218, 6178, 10, 3, UNI_LB__ZWJ } /* linebreak=zwj */, - { 1, 8768, 3, 6, 1, -UNI_BIDIC } /* bidic=f */, - { 3, 8930, 1025, 6, 2, -UNI_XPOSIXLOWER } /* lower=no */, - { 8, 10048, 7933, 3, 2, UNI_NV__17 } /* nv=17 */, - { 1, 1417, 9191, 25, 4, UNI_CCC__32 } /* canonicalcombiningclass=ccc32 */, - { 5, 9444, 10084, 4, 3, UNI_AGE__3_DOT_1 } /* age=v31 */, - { 0, 9488, 8582, 4, 7, UNI_INPHAGSPA } /* blk=phagspa */, - { 4, 8589, 2817, 7, 4, UNI_MERO } /* script=mero */, - { 8, 8449, 3, 7, 1, -UNI_HYPHEN } /* hyphen=f */, - { 13, 8997, 3, 5, 1, -UNI_TERM } /* term=f */, - { 0, 10048, 8708, 3, 6, UNI_NV__216000 } /* nv=216000 */, - { 0, 7438, 1194, 10, 2, UNI_LB__LF } /* wordbreak=lf */, - { 1, 3836, 6884, 17, 11, UNI_HMNG } /* scriptextensions=pahawhhmong */, - { 1, 10027, 9772, 3, 4, UNI_JG__SEEN } /* jg=seen */, - { 9, 3836, 9448, 17, 4, UNI_AGHB } /* scriptextensions=aghb */, - { 0, 3836, 3895, 18, 3, UNI_SGNW } /* scriptextensions=sgnw */, - { 32, 10030, 36, 3, 1, UNI_JT__T } /* jt=t */, - { 10, 3836, 8171, 17, 8, UNI_GUJR } /* scriptextensions=gujarati */, - { 
15, 21, 5228, 2, 14, UNI_LATINEXTB } /* inlatinextendedb */, - { 1, 9444, 9985, 4, 3, UNI_AGE__7 } /* age=7.0 */, - { 9, 4422, 3117, 4, 16, UNI_DEVANAGARIEXT } /* indevanagariextended */, - { 0, 184, 9480, 2, 4, UNI_BATK } /* isbatk */, - { 1, 10333, 7292, 3, 3, UNI_SOGD } /* issogd */, - { 0, 1812, 36, 22, 1, UNI_CWL } /* changeswhenlowercased=t */, - { 0, 8864, 1025, 6, 2, -UNI_EMOJI } /* emoji=no */, - { 2, 9508, 8795, 4, 3, UNI_CCC__103 } /* ccc=103 */, - { 6, 8603, 0, 7, 0, UNI_SHAW } /* shavian */, - { 0, 4145, 0, 7, 0, UNI_LINB } /* linearb */, - { 1, 1979, 1045, 10, 5, UNI_L } /* category=letter */, - { 4, 8456, 0, 7, 0, UNI_KNDA } /* kannada */, - { 0, 1552, 3349, 9, 18, UNI_ZP } /* category=paragraphseparator */, - { 2, 9277, 8421, 3, 4, UNI_ELYM } /* sc=elym */, - { 2, 4688, 7005, 15, 11, UNI_IDENTIFIERTYPE__UNCOMMONUSE } /* identifiertype=uncommonuse */, - { 1, 4688, 6895, 15, 11, UNI_IDENTIFIERTYPE__RECOMMENDED } /* identifiertype=recommended */, - { 0, 1417, 9136, 25, 4, UNI_CCC__21 } /* canonicalcombiningclass=ccc21 */, - { 0, 8688, 1395, 4, 22, UNI_ARABICPFB } /* isarabicpresentationformsb */, - { 1, 2224, 7292, 3, 6, UNI_INSOGDIAN } /* insogdian */, - { 9, 8589, 7630, 7, 9, UNI_TALU } /* script=newtailue */, - { 1, 8780, 4385, 6, 16, UNI_TANGUTCOMPONENTS } /* block=tangutcomponents */, - { 3, 4033, 3349, 16, 18, UNI_ZP } /* generalcategory=paragraphseparator */, - { 4, 10048, 7963, 3, 8, UNI_NV__11_SLASH_2 } /* nv=5.50e+00 */, - { 2, 8768, 0, 6, 0, UNI_bidic_values_index } /* bidic= */, - { 6, 184, 923, 2, 28, UNI_SUPPUAB } /* issupplementaryprivateuseareab */, - { 3, 9262, 10174, 3, 2, UNI_SB__XX } /* sb=xx */, - { 2, 2224, 7369, 3, 9, UNI_SMALLFORMS } /* insmallforms */, - { 0, 8864, 10135, 6, 3, UNI_EMOJI } /* emoji=yes */, - { 10, 10024, 132, 3, 2, UNI_LM } /* gc=lm */, - { 0, 8780, 4433, 6, 15, UNI_ARABICEXTA } /* block=arabicextendeda */, - { 5, 1171, 0, 2, 0, UNI_TITLE } /* lt */, - { 0, 9444, 10117, 4, 3, UNI_AGE__7 } /* age=v70 */, - { 0, 
8589, 78, 7, 6, UNI_SC__ARAB } /* script=arabic */, - { 1, 8780, 9330, 6, 5, UNI_INTAILE } /* block=taile */, - { 6, 9277, 3785, 3, 4, UNI_SC__MANI } /* sc=mani */, - { 0, 9997, 6037, 3, 12, UNI_BC__AL } /* bc=arabicletter */, - { 5, 6241, 0, 12, 0, UNI_jt_values_index } /* joiningtype= */, - { 0, 4791, 6819, 3, 10, UNI_MYANMAREXTA } /* inmyanmarexta */, - { 3, 9277, 8617, 3, 7, UNI_SOYO } /* sc=soyombo */, - { 0, 2288, 1195, 5, 23, UNI_HALFANDFULLFORMS } /* inhalfwidthandfullwidthforms */, - { 2, 8470, 0, 7, 0, UNI_LINA } /* lineara */, - { 5, 3374, 9836, 11, 4, UNI_XPOSIXSPACE } /* whitespace=true */, - { 5, 9014, 26, 6, 1, UNI_UIDEO } /* uideo=y */, - { 0, 9768, 9824, 4, 4, UNI_TGLG } /* scx=tglg */, - { 12, 5578, 10174, 14, 2, UNI_SB__XX } /* sentencebreak=xx */, - { 2, 1537, 2449, 24, 4, UNI_INPC__LEFT } /* indicpositionalcategory=left */, - { 2, 9488, 867, 4, 28, UNI_PHONETICEXTSUP } /* blk=phoneticextensionssupplement */, - { 1, 184, 3115, 2, 10, UNI_DEVA } /* isdevanagari */, - { 3, 9262, 49, 3, 2, UNI_SB__AT } /* sb=at */, - { 9, 8589, 8498, 7, 7, UNI_SC__MULT } /* script=multani */, - { 0, 9277, 9824, 3, 4, UNI_SC__TGLG } /* sc=tglg */, - { 2, 1087, 36, 27, 1, UNI_PCM } /* prependedconcatenationmark=t */, - { 0, 3311, 0, 3, 0, UNI_ALL } /* all */, - { 1, 8930, 1, 6, 1, -UNI_XPOSIXLOWER } /* lower=n */, - { 4, 3901, 6184, 5, 9, UNI_INGUNJALAGONDI } /* ingunjalagondi */, - { 0, 6420, 7667, 3, 8, UNI_INOLDTURKIC } /* inoldturkic */, - { 1, 8589, 9892, 7, 4, UNI_SC__QAAI } /* script=zinh */, - { 0, 184, 8876, 2, 4, UNI_GOTH } /* isgoth */, - { 5, 10003, 26, 3, 1, UNI_CI } /* ci=y */, - { 1, 10182, 8979, 7, 4, UNI__PERL_PATWS } /* _perl_patws */, - { 14, 7158, 1, 10, 1, -UNI_DIA } /* diacritic=n */, - { 1, 9488, 6253, 4, 12, UNI_KHMERSYMBOLS } /* blk=khmersymbols */, - { 5, 9290, 36, 5, 1, UNI_MATH } /* math=t */, - { 0, 184, 435, 2, 5, UNI__PERL_NCHAR } /* isnchar */, - { 3, 9596, 5633, 4, 2, UNI_LB__H2 } /* hst=lv */, - { 2, 9277, 9452, 3, 4, UNI_AHOM } /* 
sc=ahom */, - { 0, 184, 8477, 2, 4, UNI_MAKA } /* ismaka */, - { 3, 7594, 0, 9, 0, UNI_LATINEXTD } /* latinextd */, - { 1, 9277, 7358, 3, 4, UNI_SAUR } /* sc=saur */, - { 3, 9488, 5284, 4, 7, UNI_LISUSUP } /* blk=lisusup */, - { 0, 9020, 0, 6, 0, UNI_upper_values_index } /* upper= */, - { 6, 8864, 0, 6, 0, UNI_emoji_values_index } /* emoji= */, - { 0, 4422, 3117, 4, 11, UNI_DEVANAGARIEXT } /* indevanagariext */, - { 0, 8688, 80, 4, 33, UNI_ARABICMATH } /* isarabicmathematicalalphabeticsymbols */, - { 1, 3836, 0, 17, 0, UNI_scx_values_index } /* scriptextensions= */, - { 4, 9488, 7308, 4, 10, UNI_INPHOENICIAN } /* blk=phoenician */, - { 3, 5791, 6313, 13, 12, UNI_JG__MALAYALAMNGA } /* joininggroup=malayalamnga */, - { 9, 3836, 7168, 17, 10, UNI_DIAK } /* scriptextensions=divesakuru */, - { 1, 9277, 1219, 4, 7, UNI_SC__KANA } /* sc=katakana */, - { 0, 4033, 133, 16, 4, UNI_M } /* generalcategory=mark */, - { 1, 10048, 7939, 3, 8, UNI_NV__9_SLASH_2 } /* nv=4.50e+00 */, - { 1, 2288, 4098, 3, 15, UNI_HIGHPUSURROGATES } /* inhighpusurrogates */, - { 4, 9277, 9664, 3, 3, UNI_MRO } /* sc=mro */, - { 2, 7291, 0, 7, 0, UNI_SOGD } /* sogdian */, - { 1, 1417, 8837, 24, 3, UNI_WB__EB } /* canonicalcombiningclass=133 */, - { 0, 4033, 339, 16, 2, UNI_LO } /* generalcategory=lo */, - { 0, 7540, 36, 9, 1, UNI_EXT } /* extender=t */, - { 3, 10296, 6, 3, 1, UNI_PD } /* ispd */, - { 9, 9508, 24, 4, 1, UNI_CCC__L } /* ccc=l */, - { 0, 1417, 9952, 24, 3, UNI_CCC__IS } /* canonicalcombiningclass=240 */, - { 0, 7438, 727, 10, 2, UNI_WB__MN } /* wordbreak=mn */, - { 32, 9488, 1878, 4, 22, UNI_CJKCOMPATIDEOGRAPHSSUP } /* blk=cjkcompatideographssup */, - { 48, 184, 4145, 2, 16, UNI_LINEARBIDEOGRAMS } /* islinearbideograms */, - { 0, 3836, 9245, 17, 4, UNI_DOGR } /* scriptextensions=dogr */, - { 0, 1552, 6862, 9, 11, UNI_NO } /* category=othernumber */, - { 14, 184, 9656, 2, 4, UNI_MIAO } /* ismiao */, - { 0, 6576, 36, 11, 1, UNI_XPOSIXALPHA } /* alphabetic=t */, - { 0, 5791, 6162, 13, 7, 
UNI_JG__SEMKATH } /* joininggroup=semkath */, - { 5, 184, 8219, 2, 8, UNI_JAVA } /* isjavanese */, - { 3, 3836, 8491, 17, 7, UNI_MARC } /* scriptextensions=marchen */, - { 4, 4033, 400, 16, 6, UNI_CF } /* generalcategory=format */, - { 9, 8780, 4369, 6, 9, UNI_SYRIACSUP } /* block=syriacsup */, - { 0, 9488, 3581, 4, 17, UNI_UCAS } /* blk=canadiansyllabics */, - { 0, 10027, 2627, 3, 19, UNI_JG__BURUSHASKIYEHBARREE } /* jg=burushaskiyehbarree */, - { 1, 8780, 3080, 7, 17, UNI_COPTICEPACTNUMBERS } /* block=copticepactnumbers */, - { 1, 9277, 2287, 3, 4, UNI_SC__SINH } /* sc=sinh */, - { 6, 9716, 1025, 4, 2, -UNI_PCM } /* pcm=no */, - { 0, 184, 3937, 2, 16, UNI_BOPOMOFOEXT } /* isbopomofoextended */, - { 0, 8870, 3, 6, 1, -UNI_EPRES } /* epres=f */, - { 0, 3223, 0, 18, 0, UNI_INPUNCTUATION } /* generalpunctuation */, - { 3, 8589, 6277, 7, 4, UNI_SC__MAHJ } /* script=mahj */, - { 3, 9997, 32, 3, 2, UNI_BC__CS } /* bc=cs */, - { 0, 3151, 1025, 18, 2, -UNI_EPRES } /* emojipresentation=no */, - { 0, 184, 1677, 2, 9, UNI_LATINEXTE } /* islatinexte */, - { 0, 7438, 0, 4, 0, UNI_XPOSIXWORD } /* word */, - { 0, 4033, 112, 16, 2, UNI_SC } /* generalcategory=sc */, - { 1, 9488, 7621, 4, 9, UNI_INNABATAEAN } /* blk=nabataean */, - { 0, 9277, 9672, 3, 4, UNI_SC__MYMR } /* sc=mymr */, - { 3, 7218, 533, 10, 2, UNI_LB__NS } /* linebreak=ns */, - { 2, 8780, 8115, 6, 8, UNI_INBASSAVAH } /* block=bassavah */, - { 3, 951, 0, 17, 0, UNI_VS } /* variationselector */, - { 1, 8589, 9038, 7, 4, UNI_SC__YEZI } /* script=yezi */, - { 6, 9277, 9736, 3, 4, UNI_SC__COPT } /* sc=qaac */, - { 0, 8688, 97, 3, 4, UNI_XPOSIXALPHA } /* isalpha */, - { 2, 4033, 4305, 16, 16, UNI_PO } /* generalcategory=otherpunctuation */, - { 1, 10132, 6193, 3, 12, UNI_LB__HL } /* wb=hebrewletter */, - { 17, 1417, 6719, 24, 11, UNI_CCC__8 } /* canonicalcombiningclass=kanavoicing */, - { 2, 1188, 4386, 3, 5, UNI_INTANGUT } /* intangut */, - { 1, 9277, 4273, 3, 7, UNI_SC__MYMR } /* sc=myanmar */, - { 46, 8924, 0, 6, 0, 
UNI_LEPC } /* lepcha */, - { 1, 1417, 5649, 24, 1, UNI_CCC__0 } /* canonicalcombiningclass=0 */, - { 1, 8589, 9896, 7, 4, UNI_SC__ZYYY } /* script=zyyy */, - { 16, 10009, 0, 3, 0, UNI_dt_values_index } /* dt= */, - { 6, 2784, 863, 4, 4, UNI_ARROWS } /* inarrows */, - { 16, 9277, 4478, 3, 4, UNI_BRAI } /* sc=brai */, - { 11, 9444, 10081, 4, 3, UNI_AGE__3 } /* age=v30 */, - { 10, 9516, 0, 4, 0, UNI_CPRT } /* cprt */, - { 2, 184, 9668, 2, 4, UNI_MTEI } /* ismtei */, - { 0, 184, 6961, 2, 11, UNI_SUPERANDSUB } /* issuperandsub */, - { 0, 10048, 7930, 3, 2, UNI_NV__14 } /* nv=14 */, - { 1, 9270, 868, 3, 27, UNI_PHONETICEXTSUP } /* inphoneticextensionssupplement */, - { 0, 184, 5214, 2, 6, UNI_KANGXI } /* iskangxi */, - { 0, 9277, 8187, 3, 4, UNI_SC__HIRA } /* sc=hira */, - { 0, 184, 133, 2, 4, UNI_M } /* ismark */, - { 3, 7188, 0, 10, 0, UNI_KHAR } /* kharoshthi */, - { 0, 2280, 8549, 4, 5, UNI_OLCK } /* isolchiki */, - { 1, 184, 8131, 2, 4, UNI_DUPL } /* isdupl */, - { 0, 9444, 7806, 4, 1, UNI_AGE__6 } /* age=6 */, - { 0, 1417, 9186, 25, 4, UNI_CCC__31 } /* canonicalcombiningclass=ccc31 */, - { 0, 1878, 0, 19, 0, UNI_CJKCOMPATIDEOGRAPHS } /* cjkcompatideographs */, - { 2, 1417, 6642, 24, 11, UNI_CCC__DB } /* canonicalcombiningclass=doublebelow */, - { 0, 4916, 8292, 3, 3, UNI_TAGB } /* istagb */, - { 5, 10027, 6162, 3, 7, UNI_JG__SEMKATH } /* jg=semkath */, - { 6, 184, 2061, 2, 4, UNI_MODI } /* ismodi */, - { 4, 2784, 7497, 4, 7, UNI_ARABICPFA } /* inarabicpfa */, - { 0, 8780, 5778, 6, 6, UNI_IPAEXT } /* block=ipaext */, - { 1, 3836, 4149, 18, 3, UNI_SARB } /* scriptextensions=sarb */, - { 1, 10027, 4225, 3, 16, UNI_JG__MANICHAEANTWENTY } /* jg=manichaeantwenty */, - { 1, 21, 5242, 2, 14, UNI_LATINEXTC } /* inlatinextendedc */, - { 1, 5986, 7787, 13, 8, UNI_NV__3_SLASH_2 } /* numericvalue=1.50e+00 */, - { 2, 184, 7567, 2, 9, UNI_SIND } /* iskhudawadi */, - { 21, 184, 3169, 2, 11, UNI_ETHIOPICSUP } /* isethiopicsup */, - { 1, 2533, 982, 5, 24, UNI_ALPHABETICPF } /* 
inalphabeticpresentationforms */, - { 2, 9310, 0, 5, 0, UNI_OGAM } /* ogham */, - { 10, 5986, 9368, 13, 4, UNI_NV__1_SLASH_20 } /* numericvalue=1/20 */, - { 1, 7088, 3349, 10, 18, UNI_BC__B } /* bidiclass=paragraphseparator */, - { 5, 10048, 9392, 3, 4, UNI_NV__11_SLASH_2 } /* nv=11/2 */, - { 5, 10024, 27, 3, 2, UNI_LOWERCASELETTER } /* gc=ll */, - { 8, 9488, 749, 4, 16, UNI_ENCLOSEDALPHANUM } /* blk=enclosedalphanum */, - { 0, 9071, 3, 4, 1, -UNI_XPOSIXXDIGIT } /* hex=f */, - { 0, 9997, 0, 3, 0, UNI_bc_values_index } /* bc= */, - { 0, 5564, 1, 14, 1, -UNI_QMARK } /* quotationmark=n */, - { 0, 4113, 952, 3, 27, UNI_VSSUP } /* invariationselectorssupplement */, - { 7, 382, 0, 4, 0, UNI_EGYP } /* egyp */, - { 2, 7088, 5829, 10, 3, UNI_BC__RLO } /* bidiclass=rlo */, - { 1, 9488, 183, 4, 34, UNI_MISCPICTOGRAPHS } /* blk=miscellaneoussymbolsandpictographs */, - { 0, 8912, 0, 6, 0, UNI_KHOJ } /* khojki */, - { 1, 9804, 0, 4, 0, UNI_TALE } /* tale */, - { 0, 8688, 1007, 3, 16, UNI_ANCIENTGREEKMUSIC } /* isancientgreekmusic */, - { 6, 8575, 0, 7, 0, UNI_patsyn_values_index } /* patsyn= */, - { 2, 9768, 6385, 4, 12, UNI_GONM } /* scx=masaramgondi */, - { 20, 3385, 36, 18, 1, UNI_RI } /* regionalindicator=t */, - { 14, 21, 4129, 2, 6, UNI_LATIN1 } /* inlatin1 */, - { 7, 8780, 446, 6, 32, UNI_IDEOGRAPHICSYMBOLS } /* block=ideographicsymbolsandpunctuation */, - { 1, 8589, 7648, 7, 9, UNI_ITAL } /* script=olditalic */, - { 4, 5791, 10072, 13, 3, UNI_JG__TAH } /* joininggroup=tah */, - { 9, 1188, 4929, 3, 14, UNI_TAMILSUP } /* intamilsupplement */, - { 0, 9488, 8337, 4, 7, UNI_INAVESTAN } /* blk=avestan */, - { 0, 10033, 8449, 3, 6, UNI_LB__HY } /* lb=hyphen */, - { 0, 10333, 2529, 3, 4, UNI_STERM } /* issterm */, - { 11, 9508, 6719, 4, 11, UNI_CCC__8 } /* ccc=kanavoicing */, - { 1, 3836, 9315, 17, 5, UNI_ORYA } /* scriptextensions=oriya */, - { 4, 1287, 0, 2, 0, UNI_UPPERCASELETTER } /* lu */, - { 4, 1417, 7859, 24, 3, UNI_WB__EB } /* canonicalcombiningclass=200 */, - { 10, 
184, 478, 2, 31, UNI_MATHALPHANUM } /* ismathematicalalphanumericsymbols */, - { 18, 10033, 202, 3, 2, UNI_LB__SA } /* lb=sa */, - { 0, 1417, 9472, 24, 4, UNI_WB__EB } /* canonicalcombiningclass=atbl */, - { 0, 10296, 1823, 7, 5, UNI_POSIXLOWER } /* isposixlower */, - { 1, 1417, 9141, 25, 4, UNI_CCC__22 } /* canonicalcombiningclass=ccc22 */, - { 1, 10288, 10308, 8, 5, UNI_XPOSIXPRINT } /* isxposixprint */, - { 0, 113, 0, 25, 0, UNI_DIACRITICALS } /* combiningdiacriticalmarks */, - { 2, 7218, 42, 10, 2, UNI_LB__CJ } /* linebreak=cj */, - { 20, 2287, 0, 7, 0, UNI_SINH } /* sinhala */, - { 6, 9768, 9588, 4, 4, UNI_HMNG } /* scx=hmng */, - { 4, 2280, 6852, 3, 10, UNI_LO } /* isotherletter */, - { 0, 6205, 0, 12, 0, UNI_ideo_values_index } /* ideographic= */, - { 8, 8780, 7139, 7, 9, UNI_COMPATJAMO } /* block=compatjamo */, - { 0, 9488, 779, 4, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* blk=symbolsandpictographsextendeda */, - { 0, 10027, 4177, 3, 16, UNI_JG__MANICHAEANDALETH } /* jg=manichaeandaleth */, - { 3, 10024, 1910, 3, 2, UNI_CN } /* gc=cn */, - { 0, 1188, 3458, 3, 17, UNI_TAIXUANJING } /* intaixuanjingsymbols */, - { 0, 9640, 26, 4, 1, UNI_LOE } /* loe=y */, - { 2, 8688, 1371, 4, 22, UNI_ARABICPFA } /* isarabicpresentationformsa */, - { 0, 8589, 7660, 7, 4, UNI_SC__PERM } /* script=perm */, - { 3, 8852, 9836, 6, 4, UNI_CWKCF } /* cwkcf=true */, - { 0, 1845, 0, 5, 0, UNI_TITLE } /* title */, - { 70, 5986, 7875, 13, 8, UNI_NV__1_SLASH_32 } /* numericvalue=3.13e-02 */, - { 1, 1812, 0, 21, 0, UNI_CWL } /* changeswhenlowercased */, - { 13, 9548, 0, 4, 0, UNI_DSRT } /* dsrt */, - { 0, 1269, 26, 25, 1, UNI_COMPEX } /* fullcompositionexclusion=y */, - { 1, 8780, 8227, 6, 8, UNI_KANAEXTA } /* block=kanaexta */, - { 0, 3836, 9245, 17, 5, UNI_DOGR } /* scriptextensions=dogra */, - { 0, 5804, 0, 13, 0, UNI_KANAEXTA } /* kanaextendeda */, - { 4, 1966, 1244, 22, 9, UNI_INSC__CONSONANT } /* indicsyllabiccategory=consonant */, - { 1, 3836, 1218, 17, 8, UNI_KANA } /* 
scriptextensions=katakana */, - { 0, 9277, 9684, 3, 4, UNI_NEWA } /* sc=newa */, - { 5, 7155, 6194, 3, 5, UNI_HEBR } /* ishebrew */, - { 0, 3836, 9896, 17, 4, UNI_ZYYY } /* scriptextensions=zyyy */, - { 28, 4791, 2338, 10, 11, UNI_MERO } /* inmeroitichieroglyphs */, - { 1, 6609, 3, 11, 1, -UNI_DEP } /* deprecated=f */, - { 0, 184, 3223, 2, 18, UNI_INPUNCTUATION } /* isgeneralpunctuation */, - { 0, 8780, 4973, 6, 15, UNI_VEDICEXT } /* block=vedicextensions */, - { 8, 9488, 7069, 5, 9, UNI_ASCII } /* blk=basiclatin */, - { 1, 6505, 0, 8, 0, UNI_PHAISTOS } /* phaistos */, - { 0, 8780, 7458, 6, 10, UNI_YIRADICALS } /* block=yiradicals */, - { 4, 7621, 0, 9, 0, UNI_NBAT } /* nabataean */, - { 1, 5986, 8732, 13, 4, UNI_NV__5000 } /* numericvalue=5000 */, - { 1, 8589, 9476, 7, 4, UNI_AVST } /* script=avst */, - { 0, 8966, 10135, 6, 3, UNI_NFDQC__Y } /* nfdqc=yes */, - { 2, 8780, 3937, 6, 11, UNI_BOPOMOFOEXT } /* block=bopomofoext */, - { 2, 21, 1007, 3, 16, UNI_ANCIENTGREEKMUSIC } /* inancientgreekmusic */, - { 2, 10048, 9910, 3, 3, UNI_NV__1_SLASH_9 } /* nv=1/9 */, - { 0, 1417, 8831, 24, 3, UNI_CCC__132 } /* canonicalcombiningclass=132 */, - { 1, 10033, 395, 3, 2, UNI_LB__GL } /* lb=gl */, - { 3, 184, 8906, 2, 6, UNI_KANBUN } /* iskanbun */, - { 0, 8589, 865, 10, 1, UNI_SHAW } /* script=shaw */, - { 5, 9277, 9008, 3, 6, UNI_SC__THAA } /* sc=thaana */, - { 2, 10048, 8750, 3, 2, UNI_NV__80 } /* nv=80 */, - { 0, 1631, 0, 18, 0, UNI_GEOMETRICSHAPESEXT } /* geometricshapesext */, - { 33, 10327, 0, 4, 0, UNI_PE } /* ispe */, - { 1, 8780, 5960, 6, 13, UNI_MISCTECHNICAL } /* block=misctechnical */, - { 2, 184, 867, 2, 28, UNI_PHONETICEXTSUP } /* isphoneticextensionssupplement */, - { 0, 9488, 7630, 4, 9, UNI_INNEWTAILUE } /* blk=newtailue */, - { 0, 9277, 8315, 3, 8, UNI_UGAR } /* sc=ugaritic */, - { 1, 8884, 0, 4, 0, UNI_ext_values_index } /* ext= */, - { 0, 184, 720, 3, 8, UNI_XSUX } /* iscuneiform */, - { 0, 9275, 2844, 5, 10, UNI_INSC__TONELETTER } /* insc=toneletter */, - { 
0, 5791, 5420, 13, 4, UNI_JG__TETH } /* joininggroup=teth */, - { 1, 21, 5200, 2, 14, UNI_KANASUP } /* inkanasupplement */, - { 3, 186, 0, 2, 0, UNI_CE } /* ce */, - { 4, 9250, 26, 5, 1, UNI_EMOD } /* emod=y */, - { 1, 9235, 10135, 5, 3, UNI_CWCM } /* cwcm=yes */, - { 1, 2061, 0, 14, 0, UNI_LM } /* modifierletter */, - { 4, 9768, 9700, 4, 4, UNI_OLCK } /* scx=olck */, - { 0, 3382, 1, 3, 1, -UNI_CE } /* ce=n */, - { 20, 9270, 8583, 3, 6, UNI_INPHAGSPA } /* inphagspa */, - { 1, 7218, 6587, 10, 11, UNI_LB__BB } /* linebreak=breakbefore */, - { 0, 9768, 8491, 4, 7, UNI_MARC } /* scx=marchen */, - { 0, 9444, 9856, 4, 4, UNI_AGE__13 } /* age=v130 */, - { 0, 7418, 3, 10, 1, -UNI_XPOSIXUPPER } /* uppercase=f */, - { 1, 7651, 0, 4, 0, UNI_ITAL } /* ital */, - { 3, 184, 43, 3, 8, UNI_CJKCOMPAT } /* iscjkcompat */, - { 1, 3836, 9756, 17, 4, UNI_RUNR } /* scriptextensions=runr */, - { 2, 9277, 8924, 3, 6, UNI_LEPC } /* sc=lepcha */, - { 0, 9768, 3785, 4, 4, UNI_MANI } /* scx=mani */, - { 0, 184, 510, 3, 19, UNI_CJK } /* iscjkunifiedideographs */, - { 1, 10027, 5172, 3, 14, UNI_JG__HAMZAONHEHGOAL } /* jg=hamzaonhehgoal */, - { 4, 9492, 0, 4, 0, UNI_bpt_values_index } /* bpt= */, - { 13, 4791, 6411, 4, 10, UNI_INMENDEKIKAKUI } /* inmendekikakui */, - { 3, 9768, 6792, 5, 3, UNI_SAMR } /* scx=samr */, - { 2, 5791, 9648, 13, 4, UNI_JG__MEEM } /* joininggroup=meem */, - { 0, 9768, 9804, 4, 4, UNI_TALE } /* scx=tale */, - { 1, 9488, 1465, 4, 24, UNI_DIACRITICALSFORSYMBOLS } /* blk=combiningmarksforsymbols */, - { 8, 10048, 10138, 3, 2, UNI_NV__38 } /* nv=38 */, - { 0, 3379, 10183, 5, 4, UNI_XPOSIXSPACE } /* spaceperl */, - { 5, 2224, 924, 3, 27, UNI_SUPPUAB } /* insupplementaryprivateuseareab */, - { 1, 8589, 8618, 8, 3, UNI_SOYO } /* script=soyo */, - { 8, 4838, 26, 15, 1, UNI_NFKCQC__Y } /* nfkcquickcheck=y */, - { 10, 3836, 2913, 18, 3, UNI_SUND } /* scriptextensions=sund */, - { 1, 1417, 7814, 24, 1, UNI_CCC__7 } /* canonicalcombiningclass=7 */, - { 34, 1417, 78, 24, 2, 
UNI_CCC__AR } /* canonicalcombiningclass=ar */, - { 0, 10333, 3895, 3, 3, UNI_SGNW } /* issgnw */, - { 1, 184, 7139, 3, 9, UNI_COMPATJAMO } /* iscompatjamo */, - { 6, 1186, 0, 2, 0, UNI_PO } /* po */, - { 40, 10048, 9108, 3, 2, UNI_NV__15 } /* nv=15 */, - { 0, 9488, 1906, 4, 16, UNI_INDICNUMBERFORMS } /* blk=indicnumberforms */, - { 1, 9351, 9255, 4, 5, -UNI_IDS } /* ids=false */, - { 32, 3421, 0, 4, 0, UNI_RUMI } /* rumi */, - { 21, 9576, 0, 4, 0, UNI_GURU } /* guru */, - { 10, 10048, 7899, 3, 8, UNI_NV__7_SLASH_2 } /* nv=3.50e+00 */, - { 4, 184, 7594, 2, 9, UNI_LATINEXTD } /* islatinextd */, - { 1, 5986, 10144, 13, 2, UNI_NV__45 } /* numericvalue=45 */, - { 58, 9768, 8912, 4, 4, UNI_KHOJ } /* scx=khoj */, - { 0, 3836, 9310, 17, 5, UNI_OGAM } /* scriptextensions=ogham */, - { 0, 9351, 36, 4, 1, UNI_IDS } /* ids=t */, - { 16, 8864, 3, 6, 1, -UNI_EMOJI } /* emoji=f */, - { 1, 1417, 9181, 25, 4, UNI_CCC__30 } /* canonicalcombiningclass=ccc30 */, - { 0, 184, 8407, 2, 7, UNI_DSRT } /* isdeseret */, - { 0, 9444, 7814, 4, 1, UNI_AGE__7 } /* age=7 */, - { 14, 7088, 37, 10, 2, UNI_BC__EN } /* bidiclass=en */, - { 16, 184, 3115, 2, 4, UNI_DEVA } /* isdeva */, - { 0, 8589, 3785, 7, 10, UNI_SC__MANI } /* script=manichaean */, - { 8, 10296, 5039, 7, 6, UNI_POSIXXDIGIT } /* isposixxdigit */, - { 2, 9250, 0, 10, 0, -UNI_EMOD } /* emod=false */, - { 2, 9277, 2429, 3, 20, UNI_PHLI } /* sc=inscriptionalpahlavi */, - { 6, 1417, 7874, 24, 2, UNI_CCC__23 } /* canonicalcombiningclass=23 */, - { 0, 9488, 1700, 4, 23, UNI_SHORTHANDFORMATCONTROLS } /* blk=shorthandformatcontrols */, - { 32, 9277, 8123, 3, 4, UNI_SC__BUGI } /* sc=bugi */, - { 10, 4033, 9503, 16, 2, UNI_MC } /* generalcategory=mc */, - { 0, 9872, 0, 4, 0, UNI_XPEO } /* xpeo */, - { 20, 9540, 9836, 4, 4, UNI_DIA } /* dia=true */, - { 0, 2912, 0, 12, 0, UNI_SUNDANESESUP } /* sundanesesup */, - { 0, 7218, 5564, 10, 9, UNI_LB__QU } /* linebreak=quotation */, - { 6, 9768, 7168, 4, 10, UNI_DIAK } /* scx=divesakuru */, - { 0, 
1465, 0, 24, 0, UNI_DIACRITICALSFORSYMBOLS } /* combiningmarksforsymbols */, - { 16, 3836, 8936, 17, 6, UNI_LYCI } /* scriptextensions=lycian */, - { 8, 8589, 2409, 7, 4, UNI_SC__GLAG } /* script=glag */, - { 32, 9768, 9604, 4, 4, UNI_KHMR } /* scx=khmr */, - { 17, 8780, 3768, 6, 17, UNI_LETTERLIKESYMBOLS } /* block=letterlikesymbols */, - { 2, 8694, 0, 7, 0, UNI_wspace_values_index } /* wspace= */, - { 7, 8978, 10135, 6, 3, UNI__PERL_PATWS } /* patws=yes */, - { 5, 9275, 2369, 5, 20, UNI_INSC__CONSONANTPLACEHOLDER } /* insc=consonantplaceholder */, - { 1, 9768, 8291, 4, 8, UNI_TAGB } /* scx=tagbanwa */, - { 3, 3133, 0, 17, 0, UNI_EBASE } /* emojimodifierbase */, - { 0, 7218, 83, 10, 2, UNI_LB__CM } /* linebreak=cm */, - { 0, 9277, 9245, 3, 4, UNI_SC__DOGR } /* sc=dogr */, - { 0, 8780, 6193, 6, 6, UNI_INHEBREW } /* block=hebrew */, - { 1, 10288, 9877, 3, 3, UNI_XSUX } /* isxsux */, - { 0, 1417, 8793, 25, 5, UNI_CCC__103 } /* canonicalcombiningclass=ccc103 */, - { 16, 184, 3768, 2, 17, UNI_LETTERLIKESYMBOLS } /* isletterlikesymbols */, - { 0, 8780, 7675, 6, 9, UNI_PALM } /* block=palmyrene */, - { 0, 8780, 8582, 6, 7, UNI_INPHAGSPA } /* block=phagspa */, - { 0, 3115, 0, 4, 0, UNI_DEVA } /* deva */, - { 0, 1552, 4943, 9, 15, UNI_TITLE } /* category=titlecaseletter */, - { 1, 8780, 8428, 6, 7, UNI_INGRANTHA } /* block=grantha */, - { 0, 8435, 3, 7, 1, -UNI_GRBASE } /* grbase=f */, - { 2, 9768, 9480, 4, 4, UNI_BATK } /* scx=batk */, - { 0, 8589, 9820, 7, 4, UNI_TFNG } /* script=tfng */, - { 4, 10132, 5012, 3, 2, UNI_WB__SQ } /* wb=sq */, - { 0, 10027, 10045, 3, 3, UNI_JG__MIM } /* jg=mim */, - { 12, 7218, 34, 10, 2, UNI_LB__EX } /* linebreak=ex */, - { 0, 1790, 0, 22, 0, UNI_cwcm_values_index } /* changeswhencasemapped= */, - { 8, 4097, 0, 16, 0, UNI_HIGHPUSURROGATES } /* highpusurrogates */, - { 4, 1417, 3572, 24, 9, UNI_CCC__BL } /* canonicalcombiningclass=belowleft */, - { 2, 6609, 9836, 11, 4, UNI_DEP } /* deprecated=true */, - { 0, 3097, 4017, 18, 3, UNI_DT__FIN } 
/* decompositiontype=fin */, - { 0, 8589, 9572, 7, 4, UNI_SC__GUJR } /* script=gujr */, - { 2, 1033, 0, 11, 0, UNI_ENCLOSEDCJK } /* enclosedcjk */, - { 2, 1591, 3684, 3, 16, UNI_ETHIOPICEXTA } /* inethiopicextendeda */, - { 2, 1790, 9836, 22, 4, UNI_CWCM } /* changeswhencasemapped=true */, - { 1, 1417, 9146, 25, 4, UNI_CCC__23 } /* canonicalcombiningclass=ccc23 */, - { 0, 9345, 36, 5, 1, UNI_XIDC } /* xidc=t */, - { 2, 9277, 9584, 3, 4, UNI_HLUW } /* sc=hluw */, - { 32, 8858, 36, 6, 1, UNI_ECOMP } /* ecomp=t */, - { 0, 184, 5739, 2, 12, UNI_GRBASE } /* isgraphemebase */, - { 5, 184, 4161, 2, 16, UNI_LINEARBSYLLABARY } /* islinearbsyllabary */, - { 0, 184, 17, 3, 1, UNI_CO } /* isco */, - { 0, 1966, 4417, 22, 16, UNI_INSC__VOWELINDEPENDENT } /* indicsyllabiccategory=vowelindependent */, - { 0, 3836, 5550, 17, 14, UNI_PHLP } /* scriptextensions=psalterpahlavi */, - { 1, 1025, 0, 2, 0, UNI_NO } /* no */, - { 0, 5986, 7883, 13, 8, UNI_NV__1_SLASH_320 } /* numericvalue=3.13e-03 */, - { 1, 5791, 9456, 13, 4, UNI_JG__ALEF } /* joininggroup=alef */, - { 1, 8589, 7188, 7, 4, UNI_KHAR } /* script=khar */, - { 0, 3836, 8888, 17, 4, UNI_HATR } /* scriptextensions=hatr */, - { 0, 9640, 10135, 4, 3, UNI_LOE } /* loe=yes */, - { 11, 7228, 9255, 10, 5, -UNI_XPOSIXLOWER } /* lowercase=false */, - { 1, 8512, 9295, 7, 5, UNI_NFCQC__M } /* nfkcqc=maybe */, - { 33, 9508, 7859, 4, 2, UNI_CCC__20 } /* ccc=20 */, - { 8, 1856, 26, 22, 1, UNI_CWU } /* changeswhenuppercased=y */, - { 1, 8780, 9085, 6, 5, UNI_INBATAK } /* block=batak */, - { 9, 9536, 1025, 4, 2, -UNI_DEP } /* dep=no */, - { 17, 8688, 4435, 4, 13, UNI_ARABICEXTA } /* isarabicextendeda */, - { 0, 8780, 7630, 6, 9, UNI_INNEWTAILUE } /* block=newtailue */, - { 1, 10024, 4305, 3, 16, UNI_PO } /* gc=otherpunctuation */, - { 0, 8997, 1025, 5, 2, -UNI_TERM } /* term=no */, - { 65, 6554, 10135, 11, 3, UNI_IDC } /* idcontinue=yes */, - { 32, 9508, 9211, 5, 4, UNI_CCC__36 } /* ccc=ccc36 */, - { 10, 10033, 6697, 3, 11, UNI_LB__IN } /* 
lb=inseperable */, - { 1, 8936, 0, 4, 0, UNI_LYCI } /* lyci */, - { 2, 1269, 0, 24, 0, UNI_COMPEX } /* fullcompositionexclusion */, - { 0, 8589, 8291, 7, 4, UNI_SC__TAGB } /* script=tagb */, - { 1, 8780, 4161, 6, 16, UNI_LINEARBSYLLABARY } /* block=linearbsyllabary */, - { 1, 184, 9740, 2, 4, UNI_QAAI } /* isqaai */, - { 2, 8780, 8219, 6, 8, UNI_INJAVANESE } /* block=javanese */, - { 0, 8780, 2224, 6, 21, UNI_ININSCRIPTIONALPARTHIAN } /* block=inscriptionalparthian */, - { 3, 2874, 0, 19, 0, UNI_OTTOMANSIYAQNUMBERS } /* ottomansiyaqnumbers */, - { 6, 3259, 1, 18, 1, -UNI_IDSB } /* idsbinaryoperator=n */, - { 8, 2569, 3504, 20, 7, UNI_VO__R } /* verticalorientation=rotated */, - { 34, 9768, 7188, 4, 10, UNI_KHAR } /* scx=kharoshthi */, - { 16, 184, 1025, 2, 2, UNI_NO } /* isno */, - { 1, 10024, 133, 3, 4, UNI_M } /* gc=mark */, - { 2, 10024, 45, 3, 2, UNI_CO } /* gc=co */, - { 1, 9488, 3768, 4, 17, UNI_LETTERLIKESYMBOLS } /* blk=letterlikesymbols */, - { 81, 2224, 4338, 3, 15, UNI_SUPMATHOPERATORS } /* insupmathoperators */, - { 12, 2224, 317, 3, 32, UNI_SUPMATHOPERATORS } /* insupplementalmathematicaloperators */, - { 8, 7088, 4493, 10, 15, UNI_BC__CS } /* bidiclass=commonseparator */, - { 1, 10048, 9380, 3, 3, UNI_NV__1_SLASH_8 } /* nv=1/8 */, - { 1, 184, 1791, 3, 20, UNI_CWCM } /* ischangeswhencasemapped */, - { 2, 1834, 0, 21, 0, UNI_CWT } /* changeswhentitlecased */, - { 1, 9277, 7278, 3, 10, UNI_XPEO } /* sc=oldpersian */, - { 0, 3097, 7, 18, 3, UNI_DT__CAN } /* decompositiontype=can */, - { 20, 184, 7358, 2, 10, UNI_SAUR } /* issaurashtra */, - { 0, 5116, 10135, 14, 3, UNI_EMOD } /* emojimodifier=yes */, - { 3, 10296, 3, 3, 1, UNI_PF } /* ispf */, - { 0, 10132, 18, 3, 2, UNI_RI } /* wb=ri */, - { 7, 8512, 0, 7, 0, UNI_nfkcqc_values_index } /* nfkcqc= */, - { 16, 9488, 2912, 4, 9, UNI_INSUNDANESE } /* blk=sundanese */, - { 4, 9768, 8187, 4, 8, UNI_HIRA } /* scx=hiragana */, - { 2, 9608, 0, 4, 0, UNI_KITS } /* kits */, - { 5, 9768, 5550, 4, 14, UNI_PHLP } /* 
scx=psalterpahlavi */, - { 1, 1552, 4017, 9, 16, UNI_PF } /* category=finalpunctuation */, - { 0, 9512, 0, 4, 0, UNI_CHRS } /* chrs */, - { 1, 7325, 10102, 3, 3, UNI_IN__5_DOT_2 } /* in=v52 */, - { 32, 9277, 8115, 3, 8, UNI_BASS } /* sc=bassavah */, - { 0, 7218, 8701, 10, 7, UNI_LB__ZW } /* linebreak=zwspace */, - { 4, 3836, 7567, 17, 9, UNI_SIND } /* scriptextensions=khudawadi */, - { 4, 10048, 7814, 3, 1, UNI_NV__7 } /* nv=7 */, - { 0, 9768, 8942, 4, 6, UNI_LYDI } /* scx=lydian */, - { 2, 8930, 0, 6, 0, UNI_lower_values_index } /* lower= */, - { 5, 9768, 2913, 5, 8, UNI_SUND } /* scx=sundanese */, - { 0, 184, 2950, 2, 19, UNI_SUPARROWSB } /* issupplementalarrowsb */, - { 0, 3836, 9008, 17, 4, UNI_THAA } /* scriptextensions=thaa */, - { 0, 10048, 7971, 3, 8, UNI_NV__7_SLASH_12 } /* nv=5.83e-01 */, - { 12, 8589, 8414, 7, 4, UNI_ELBA } /* script=elba */, - { 0, 7738, 26, 9, 1, UNI_XIDS } /* xidstart=y */, - { 1, 8400, 10135, 7, 3, UNI_COMPEX } /* compex=yes */, - { 0, 9596, 6741, 4, 11, UNI_GCB__L } /* hst=leadingjamo */, - { 1, 8780, 4401, 6, 16, UNI_TANGUTSUP } /* block=tangutsupplement */, - { 1, 8589, 2913, 8, 3, UNI_SUND } /* script=sund */, - { 0, 10182, 6554, 6, 6, UNI__PERL_IDCONT } /* _perl_idcont */, - { 1, 9488, 9828, 4, 4, UNI_INTHAI } /* blk=thai */, - { 1, 8589, 9504, 7, 4, UNI_CANS } /* script=cans */, - { 2, 8589, 9496, 7, 4, UNI_SC__BUHD } /* script=buhd */, - { 1, 8780, 4145, 6, 16, UNI_LINEARBIDEOGRAMS } /* block=linearbideograms */, - { 0, 8780, 8477, 6, 7, UNI_INMAKASAR } /* block=makasar */, - { 0, 1552, 1587, 9, 1, UNI_Z } /* category=z */, - { 1, 10048, 10140, 3, 2, UNI_NV__39 } /* nv=39 */, - { 2, 9588, 0, 4, 0, UNI_HMNG } /* hmng */, - { 0, 2760, 6763, 19, 11, UNI_LB__H3 } /* hangulsyllabletype=lvtsyllable */, - { 3, 8978, 1, 6, 1, -UNI__PERL_PATWS } /* patws=n */, - { 5, 5791, 9355, 13, 5, UNI_JG__ZHAIN } /* joininggroup=zhain */, - { 2, 8589, 2485, 7, 4, UNI_SC__MONG } /* script=mong */, - { 0, 9556, 24, 4, 1, UNI_GCB__L } /* gcb=l */, - 
{ 2, 9444, 10087, 4, 3, UNI_AGE__3_DOT_2 } /* age=v32 */, - { 1, 1417, 7806, 24, 1, UNI_CCC__6 } /* canonicalcombiningclass=6 */, - { 0, 5986, 8750, 13, 4, UNI_NV__8000 } /* numericvalue=8000 */, - { 3, 9488, 1631, 4, 15, UNI_GEOMETRICSHAPES } /* blk=geometricshapes */, - { 5, 8780, 2409, 6, 20, UNI_GLAGOLITICSUP } /* block=glagoliticsupplement */, - { 1, 8780, 7358, 6, 10, UNI_INSAURASHTRA } /* block=saurashtra */, - { 3, 4791, 4290, 3, 15, UNI_MYANMAREXTB } /* inmyanmarextendedb */, - { 16, 7076, 8116, 3, 7, UNI_INBASSAVAH } /* inbassavah */, - { 1, 9528, 9836, 4, 4, UNI_CWU } /* cwu=true */, - { 5, 4033, 5497, 16, 11, UNI_MC } /* generalcategory=spacingmark */, - { 0, 5986, 10142, 13, 2, UNI_NV__44 } /* numericvalue=44 */, - { 4, 8780, 0, 12, 0, UNI_INCARIAN } /* block=carian */, - { 2, 9277, 8582, 3, 7, UNI_SC__PHAG } /* sc=phagspa */, - { 0, 9277, 9516, 3, 4, UNI_SC__CPRT } /* sc=cprt */, - { 5, 9444, 7781, 4, 1, UNI_AGE__4 } /* age=4 */, - { 0, 4113, 6013, 3, 12, UNI_VERTICALFORMS } /* inverticalforms */, - { 0, 5791, 3, 15, 1, UNI_JG__KAF } /* joininggroup=kaf */, - { 12, 10006, 1025, 3, 2, -UNI_DI } /* di=no */, - { 34, 1505, 5755, 5, 10, UNI_GREEKEXT } /* ingreekextended */, - { 2, 8589, 7675, 7, 4, UNI_PALM } /* script=palm */, - { 1, 1417, 7858, 24, 2, UNI_CCC__22 } /* canonicalcombiningclass=22 */, - { 17, 1417, 4912, 24, 2, UNI_CCC__0 } /* canonicalcombiningclass=nr */, - { 0, 7155, 8443, 3, 6, UNI_HANO } /* ishanunoo */, - { 2, 6061, 1025, 12, 2, -UNI_BIDIC } /* bidicontrol=no */, - { 1, 7438, 72, 10, 2, UNI_WB__LE } /* wordbreak=le */, - { 0, 8997, 0, 5, 0, UNI_term_values_index } /* term= */, - { 0, 10290, 5718, 6, 5, UNI_XPOSIXALNUM } /* xposixalnum */, - { 7, 10048, 9424, 3, 4, UNI_NV__3_SLASH_64 } /* nv=3/64 */, - { 0, 478, 0, 31, 0, UNI_MATHALPHANUM } /* mathematicalalphanumericsymbols */, - { 0, 1979, 7, 10, 1, UNI_CASEDLETTER } /* category=lc */, - { 0, 1114, 9836, 26, 4, UNI_CWKCF } /* changeswhennfkccasefolded=true */, - { 1, 21, 1677, 2, 
14, UNI_LATINEXTA } /* inlatinextendeda */, - { 2, 9997, 3349, 3, 18, UNI_BC__B } /* bc=paragraphseparator */, - { 0, 42, 0, 3, 0, UNI_CJK } /* cjk */, - { 15, 10333, 1176, 3, 3, UNI_SORA } /* issora */, - { 10, 9488, 4868, 4, 15, UNI_NARB } /* blk=oldnortharabian */, - { 15, 9488, 2855, 4, 9, UNI_INMONGOLIAN } /* blk=mongolian */, - { 0, 2203, 0, 4, 0, UNI_HAN } /* hani */, - { 0, 4116, 447, 3, 17, UNI_IDEOGRAPHICSYMBOLS } /* isideographicsymbols */, - { 5, 10012, 865, 3, 1, UNI_EA__W } /* ea=w */, - { 3, 8688, 29, 4, 4, UNI_ARAB } /* isarabic */, - { 1, 8589, 4273, 7, 7, UNI_SC__MYMR } /* script=myanmar */, - { 12, 7218, 6697, 10, 11, UNI_LB__IN } /* linebreak=inseperable */, - { 1, 6420, 9311, 3, 4, UNI_INOGHAM } /* inogham */, - { 5, 7228, 26, 10, 1, UNI_XPOSIXLOWER } /* lowercase=y */, - { 0, 7218, 751, 10, 2, UNI_LB__CL } /* linebreak=cl */, - { 8, 9508, 1179, 4, 2, UNI_CCC__BL } /* ccc=bl */, - { 19, 2760, 5973, 19, 13, UNI_HST__NA } /* hangulsyllabletype=notapplicable */, - { 8, 8589, 2140, 7, 8, UNI_SC__CYRL } /* script=cyrillic */, - { 0, 5739, 1025, 13, 2, -UNI_GRBASE } /* graphemebase=no */, - { 0, 3133, 36, 18, 1, UNI_EBASE } /* emojimodifierbase=t */, - { 0, 184, 1631, 2, 23, UNI_GEOMETRICSHAPESEXT } /* isgeometricshapesextended */, - { 1, 8589, 4448, 7, 4, UNI_BAMU } /* script=bamu */, - { 4, 9488, 3043, 4, 18, UNI_HALFMARKS } /* blk=combininghalfmarks */, - { 2, 1393, 0, 24, 0, UNI_ARABICPFB } /* arabicpresentationformsb */, - { 0, 9277, 4868, 3, 15, UNI_NARB } /* sc=oldnortharabian */, - { 1, 10290, 62, 6, 5, UNI_XPOSIXGRAPH } /* xposixgraph */, - { 0, 10027, 5420, 3, 4, UNI_JG__TETH } /* jg=teth */, - { 2, 184, 4569, 3, 14, UNI_CURRENCYSYMBOLS } /* iscurrencysymbols */, - { 2, 10024, 106, 3, 6, UNI_S } /* gc=symbol */, - { 1, 10048, 8756, 3, 5, UNI_NV__90000 } /* nv=90000 */, - { 0, 3836, 3751, 17, 17, UNI_KITS } /* scriptextensions=khitansmallscript */, - { 0, 184, 3080, 3, 17, UNI_COPTICEPACTNUMBERS } /* iscopticepactnumbers */, - { 6, 8780, 
8179, 6, 8, UNI_INGURMUKHI } /* block=gurmukhi */, - { 3, 3439, 0, 18, 0, UNI_SMALLKANAEXT } /* smallkanaextension */, - { 6, 1537, 2994, 24, 13, UNI_INPC__BOTTOMANDLEFT } /* indicpositionalcategory=bottomandleft */, - { 2, 1417, 9919, 24, 3, UNI_CCC__202 } /* canonicalcombiningclass=202 */, - { 64, 6231, 1467, 4, 22, UNI_DIACRITICALSFORSYMBOLS } /* incombiningmarksforsymbols */, - { 0, 8780, 1700, 6, 23, UNI_SHORTHANDFORMATCONTROLS } /* block=shorthandformatcontrols */, - { 0, 21, 3549, 4, 8, UNI_ALCHEMICAL } /* inalchemical */, - { 7, 21, 5284, 2, 7, UNI_LISUSUP } /* inlisusup */, - { 1, 2224, 3440, 3, 17, UNI_SMALLKANAEXT } /* insmallkanaextension */, - { 0, 184, 1, 3, 1, UNI_CN } /* iscn */, - { 0, 10132, 400, 3, 6, UNI_WB__FO } /* wb=format */, - { 1, 3836, 8942, 17, 6, UNI_LYDI } /* scriptextensions=lydian */, - { 3, 5060, 0, 14, 0, UNI_ci_values_index } /* caseignorable= */, - { 34, 9768, 3598, 4, 17, UNI_AGHB } /* scx=caucasianalbanian */, - { 1, 8509, 751, 4, 28, UNI_ENCLOSEDALPHANUMSUP } /* inenclosedalphanumericsupplement */, - { 11, 1822, 0, 2, 0, UNI_NL } /* nl */, - { 8, 9277, 4703, 3, 15, UNI_ARMI } /* sc=imperialaramaic */, - { 9, 8780, 5752, 6, 13, UNI_GREEKEXT } /* block=greekextended */, - { 0, 8589, 8123, 7, 8, UNI_SC__BUGI } /* script=buginese */, - { 6, 184, 3026, 3, 7, UNI_CHER } /* ischerokee */, - { 0, 1537, 2549, 24, 12, UNI_INPC__TOPANDBOTTOM } /* indicpositionalcategory=topandbottom */, - { 2, 9540, 1, 4, 1, -UNI_DIA } /* dia=n */, - { 0, 7318, 10102, 10, 3, UNI_IN__5_DOT_2 } /* presentin=v52 */, - { 0, 9508, 9468, 4, 4, UNI_CCC__216 } /* ccc=atar */, - { 0, 184, 9560, 2, 4, UNI_GONG } /* isgong */, - { 0, 2161, 0, 20, 0, UNI_EXTPICT } /* extendedpictographic */, - { 0, 8768, 1025, 6, 2, -UNI_BIDIC } /* bidic=no */, - { 14, 8780, 3295, 6, 9, UNI_LATINEXTA } /* block=latinexta */, - { 2, 2280, 2875, 3, 18, UNI_OTTOMANSIYAQNUMBERS } /* isottomansiyaqnumbers */, - { 3, 10296, 8979, 3, 4, UNI__PERL_PATWS } /* ispatws */, - { 1, 9508, 7778, 
4, 2, UNI_CCC__21 } /* ccc=21 */, - { 3, 7325, 9397, 3, 3, UNI_IN__2_DOT_1 } /* in=2.1 */, - { 4, 4868, 0, 15, 0, UNI_NARB } /* oldnortharabian */, - { 32, 2098, 0, 21, 0, UNI_CJKCOMPATFORMS } /* cjkcompatibilityforms */, - { 0, 3295, 0, 9, 0, UNI_LATINEXTA } /* latinexta */, - { 3, 3836, 8123, 17, 8, UNI_BUGI } /* scriptextensions=buginese */, - { 1, 9488, 3241, 4, 11, UNI_GEORGIANSUP } /* blk=georgiansup */, - { 8, 1417, 8805, 25, 5, UNI_CCC__118 } /* canonicalcombiningclass=ccc118 */, - { 2, 9277, 7666, 3, 9, UNI_ORKH } /* sc=oldturkic */, - { 1, 8774, 10135, 6, 3, UNI_BIDIM } /* bidim=yes */, - { 5, 8954, 0, 7, 0, -UNI__PERL_NCHAR } /* nchar=n */, - { 0, 184, 1822, 2, 2, UNI_NL } /* isnl */, - { 0, 10310, 8301, 4, 6, UNI_INTIFINAGH } /* intifinagh */, - { 0, 8780, 114, 7, 24, UNI_DIACRITICALS } /* block=combiningdiacriticalmarks */, - { 0, 1677, 0, 23, 0, UNI_LATINEXTADDITIONAL } /* latinextendedadditional */, - { 3, 2161, 1, 21, 1, -UNI_EXTPICT } /* extendedpictographic=n */, - { 2, 1552, 406, 9, 7, UNI_XPOSIXCNTRL } /* category=control */, - { 11, 7218, 58, 10, 2, UNI_LB__ID } /* linebreak=id */, - { 16, 4916, 1116, 3, 3, UNI_TANG } /* istang */, - { 0, 5578, 495, 14, 7, UNI_SB__NU } /* sentencebreak=numeric */, - { 0, 1417, 8825, 24, 3, UNI_CCC__130 } /* canonicalcombiningclass=130 */, - { 1, 10288, 5039, 8, 6, UNI_XPOSIXXDIGIT } /* isxposixxdigit */, - { 1, 9444, 9852, 4, 4, UNI_AGE__12_DOT_1 } /* age=v121 */, - { 0, 9277, 9448, 3, 4, UNI_AGHB } /* sc=aghb */, - { 0, 5986, 7827, 13, 8, UNI_NV__1_SLASH_5 } /* numericvalue=2.00e-01 */, - { 3, 1188, 8653, 3, 6, UNI_INTAIVIET } /* intaiviet */, - { 4, 2182, 5497, 21, 11, UNI_GCB__SM } /* graphemeclusterbreak=spacingmark */, - { 1, 8589, 9676, 7, 4, UNI_NARB } /* script=narb */, - { 2, 4369, 0, 6, 0, UNI_SYRC } /* syriac */, - { 2, 4305, 0, 16, 0, UNI_PO } /* otherpunctuation */, - { 0, 9524, 1025, 4, 2, -UNI_CWT } /* cwt=no */, - { 2, 1966, 728, 22, 6, UNI_INSC__NUMBER } /* indicsyllabiccategory=number */, - { 
12, 2287, 0, 4, 0, UNI_SINH } /* sinh */, - { 0, 10009, 5012, 3, 6, UNI_DT__SQR } /* dt=square */, - { 0, 9488, 8421, 4, 7, UNI_INELYMAIC } /* blk=elymaic */, - { 1, 9277, 7657, 3, 9, UNI_SC__PERM } /* sc=oldpermic */, - { 2, 9340, 0, 5, 0, UNI_VSSUP } /* vssup */, - { 1, 8882, 0, 6, 0, UNI_grext_values_index } /* grext= */, - { 0, 9277, 8219, 3, 8, UNI_SC__JAVA } /* sc=javanese */, - { 3, 5791, 2637, 13, 3, UNI_JG__YEH } /* joininggroup=yeh */, - { 21, 3836, 8498, 17, 4, UNI_MULT } /* scriptextensions=mult */, - { 5, 8774, 1, 6, 1, -UNI_BIDIM } /* bidim=n */, - { 16, 1188, 9336, 3, 4, UNI_INTAKRI } /* intakri */, - { 18, 10048, 7806, 3, 1, UNI_NV__6 } /* nv=6 */, - { 1, 3836, 8131, 17, 8, UNI_DUPL } /* scriptextensions=duployan */, - { 2, 5739, 1, 13, 1, -UNI_GRBASE } /* graphemebase=n */, - { 1, 8978, 9836, 6, 4, UNI__PERL_PATWS } /* patws=true */, - { 5, 9351, 1025, 4, 2, -UNI_IDS } /* ids=no */, - { 1, 10033, 96, 3, 10, UNI_LB__AL } /* lb=alphabetic */, - { 0, 7325, 10099, 3, 3, UNI_IN__5_DOT_1 } /* in=v51 */, - { 0, 1537, 6621, 3, 5, UNI_DOMINO } /* indomino */, - { 1, 9488, 719, 4, 9, UNI_INCUNEIFORM } /* blk=cuneiform */, - { 10, 9488, 8603, 4, 7, UNI_SHAW } /* blk=shavian */, - { 12, 9240, 0, 5, 0, UNI_dash_values_index } /* dash= */, - { 5, 10027, 6373, 3, 12, UNI_JG__MANICHAEANPE } /* jg=manichaeanpe */, - { 0, 1552, 4305, 9, 16, UNI_PO } /* category=otherpunctuation */, - { 1, 184, 8115, 2, 8, UNI_BASS } /* isbassavah */, - { 3, 8894, 36, 6, 1, UNI_JOINC } /* joinc=t */, - { 0, 9488, 6409, 4, 12, UNI_INMENDEKIKAKUI } /* blk=mendekikakui */, - { 0, 8449, 9255, 7, 5, -UNI_HYPHEN } /* hyphen=false */, - { 0, 8762, 26, 6, 1, UNI_XPOSIXALPHA } /* alpha=y */, - { 2, 9277, 7428, 3, 10, UNI_WARA } /* sc=warangciti */, - { 0, 2569, 3493, 20, 18, UNI_VO__TR } /* verticalorientation=transformedrotated */, - { 0, 3836, 8315, 17, 8, UNI_UGAR } /* scriptextensions=ugaritic */, - { 0, 8589, 5843, 7, 9, UNI_SC__MLYM } /* script=malayalam */, - { 1, 1585, 0, 14, 0, 
UNI_BYZANTINEMUSIC } /* byzantinemusic */, - { 0, 10027, 8155, 3, 8, UNI_JG__FARSIYEH } /* jg=farsiyeh */, - { 0, 6805, 287, 6, 29, UNI_MISCMATHSYMBOLSB } /* inmiscellaneousmathematicalsymbolsb */, - { 2, 9488, 9310, 4, 5, UNI_INOGHAM } /* blk=ogham */, - { 4, 6231, 3796, 3, 3, UNI_INCHAM } /* incham */, - { 8, 184, 2931, 2, 19, UNI_SUPARROWSA } /* issupplementalarrowsa */, - { 17, 7076, 7069, 3, 9, UNI_ASCII } /* inbasiclatin */, - { 0, 1441, 0, 24, 0, UNI_CJKSYMBOLS } /* cjksymbolsandpunctuation */, - { 2, 8589, 4145, 7, 7, UNI_SC__LINB } /* script=linearb */, - { 4, 7660, 0, 4, 0, UNI_PERM } /* perm */, - { 18, 9768, 3937, 4, 8, UNI_BOPO } /* scx=bopomofo */, - { 0, 9277, 3079, 3, 4, UNI_SC__COPT } /* sc=copt */, - { 3, 8617, 0, 7, 0, UNI_SOYO } /* soyombo */, - { 2, 4916, 8300, 3, 7, UNI_TFNG } /* istifinagh */, - { 2, 3836, 8912, 17, 4, UNI_KHOJ } /* scriptextensions=khoj */, - { 13, 9508, 7859, 4, 3, UNI_WB__EB } /* ccc=200 */, - { 0, 9768, 9732, 4, 4, UNI_PRTI } /* scx=prti */, - { 0, 2784, 7506, 4, 7, UNI_ARABICPFB } /* inarabicpfb */, - { 1, 6061, 0, 11, 0, UNI_BIDIC } /* bidicontrol */, - { 0, 9444, 7469, 4, 1, UNI_AGE__5 } /* age=5 */, - { 1, 9768, 9325, 4, 5, UNI_RUNR } /* scx=runic */, - { 0, 6231, 2141, 3, 20, UNI_CYRILLICSUP } /* incyrillicsupplementary */, - { 1, 8589, 9008, 7, 4, UNI_SC__THAA } /* script=thaa */, - { 0, 184, 5040, 2, 5, UNI_XPOSIXDIGIT } /* isdigit */, - { 1, 8589, 8876, 7, 6, UNI_GOTH } /* script=gothic */, - { 8, 9768, 57, 4, 2, UNI_YI } /* scx=yi */, - { 0, 4049, 0, 16, 0, UNI_GEORGIANEXT } /* georgianextended */, - { 0, 1189, 495, 3, 2, UNI_NT__NU } /* nt=nu */, - { 0, 3374, 36, 11, 1, UNI_XPOSIXSPACE } /* whitespace=t */, - { 0, 206, 0, 2, 0, UNI_PI } /* pi */, - { 2, 3379, 0, 5, 0, UNI_XPOSIXSPACE } /* space */, - { 20, 3836, 9285, 17, 5, UNI_LIMB } /* scriptextensions=limbu */, - { 5, 3836, 3169, 17, 4, UNI_ETHI } /* scriptextensions=ethi */, - { 0, 5578, 34, 14, 6, UNI_SB__EX } /* sentencebreak=extend */, - { 0, 3836, 7666, 
17, 9, UNI_ORKH } /* scriptextensions=oldturkic */, - { 0, 8780, 9325, 6, 5, UNI_INRUNIC } /* block=runic */, - { 1, 9014, 0, 5, 0, UNI_UIDEO } /* uideo */, - { 2, 10024, 406, 3, 7, UNI_XPOSIXCNTRL } /* gc=control */, - { 8, 184, 3349, 2, 18, UNI_ZP } /* isparagraphseparator */, - { 1, 10126, 3504, 3, 7, UNI_VO__R } /* vo=rotated */, - { 0, 10009, 2569, 3, 8, UNI_DT__VERT } /* dt=vertical */, - { 3, 5674, 3, 13, 1, -UNI_BIDIM } /* bidimirrored=f */, - { 0, 9488, 951, 4, 28, UNI_VSSUP } /* blk=variationselectorssupplement */, - { 37, 5324, 6279, 4, 10, UNI_MAHJONG } /* inmahjongtiles */, - { 18, 9508, 8801, 4, 3, UNI_CCC__107 } /* ccc=107 */, - { 0, 9768, 6884, 4, 11, UNI_HMNG } /* scx=pahawhhmong */, - { 1, 5986, 10148, 13, 2, UNI_NV__47 } /* numericvalue=47 */, - { 1, 8780, 5200, 6, 7, UNI_KANASUP } /* block=kanasup */, - { 4, 9768, 0, 4, 0, UNI_scx_values_index } /* scx= */, - { 28, 7738, 0, 4, 0, UNI_XIDS } /* xids */, - { 0, 5778, 0, 13, 0, UNI_IPAEXT } /* ipaextensions */, - { 2, 7738, 9836, 9, 4, UNI_XIDS } /* xidstart=true */, - { 0, 1768, 9255, 22, 5, -UNI_CWCF } /* changeswhencasefolded=false */, - { 0, 10048, 9913, 3, 3, UNI_NV__2_SLASH_3 } /* nv=2/3 */, - { 2, 6609, 26, 11, 1, UNI_DEP } /* deprecated=y */, - { 34, 21, 1007, 3, 26, UNI_ANCIENTGREEKMUSIC } /* inancientgreekmusicalnotation */, - { 0, 2182, 5585, 21, 2, UNI_WB__EB } /* graphemeclusterbreak=eb */, - { 0, 1988, 10135, 22, 3, UNI_LOE } /* logicalorderexception=yes */, - { 0, 184, 3367, 2, 17, UNI__PERL_PATWS } /* ispatternwhitespace */, - { 2, 3385, 26, 18, 1, UNI_RI } /* regionalindicator=y */, - { 1, 184, 6012, 2, 13, UNI_VERTICALFORMS } /* isverticalforms */, - { 1, 9270, 6885, 3, 10, UNI_INPAHAWHHMONG } /* inpahawhhmong */, - { 1, 9768, 7428, 4, 4, UNI_WARA } /* scx=wara */, - { 1, 8780, 2076, 6, 15, UNI_TRANSPORTANDMAP } /* block=transportandmap */, - { 2, 78, 0, 4, 0, UNI_ARAB } /* arab */, - { 0, 9275, 1489, 5, 24, UNI_INSC__CONSONANTSUCCEEDINGREPHA } /* insc=consonantsucceedingrepha */, 
- { 12, 9277, 7660, 3, 4, UNI_SC__PERM } /* sc=perm */, - { 3, 184, 1922, 2, 22, UNI_DIACRITICALSFORSYMBOLS } /* isdiacriticalsforsymbols */, - { 2, 8589, 9283, 7, 4, UNI_PHLI } /* script=phli */, - { 6, 10024, 1025, 3, 2, UNI_NO } /* gc=no */, - { 0, 10009, 2569, 3, 4, UNI_DT__VERT } /* dt=vert */, - { 6, 4033, 2349, 16, 20, UNI_PC } /* generalcategory=connectorpunctuation */, - { 0, 10027, 5908, 3, 13, UNI_JG__MANICHAEANTAW } /* jg=manichaeantaw */, - { 9, 10132, 1218, 3, 8, UNI_WB__KA } /* wb=katakana */, - { 8, 7228, 0, 10, 0, UNI_lower_values_index } /* lowercase= */, - { 0, 8780, 8841, 7, 5, UNI_INCHAKMA } /* block=chakma */, - { 1, 184, 2, 3, 1, UNI_CI } /* isci */, - { 0, 9768, 4928, 4, 5, UNI_TAML } /* scx=tamil */, - { 3, 5746, 10135, 6, 3, UNI_EBASE } /* ebase=yes */, - { 1, 9768, 1218, 4, 8, UNI_KANA } /* scx=katakana */, - { 1, 2224, 4370, 3, 8, UNI_SYRIACSUP } /* insyriacsup */, - { 0, 10024, 1822, 3, 2, UNI_NL } /* gc=nl */, - { 16, 184, 1823, 2, 9, UNI_XPOSIXLOWER } /* islowercase */, - { 16, 10048, 7979, 3, 8, UNI_NV__3_SLASH_5 } /* nv=6.00e-01 */, - { 3, 3379, 1, 6, 1, -UNI_XPOSIXSPACE } /* space=n */, - { 4, 1552, 1186, 9, 2, UNI_PO } /* category=po */, - { 0, 6623, 2876, 4, 17, UNI_OTTOMANSIYAQNUMBERS } /* inottomansiyaqnumbers */, - { 17, 9277, 8171, 3, 8, UNI_SC__GUJR } /* sc=gujarati */, - { 4, 9508, 9201, 5, 4, UNI_CCC__34 } /* ccc=ccc34 */, - { 2, 9488, 42, 4, 36, UNI_CJKCOMPATIDEOGRAPHSSUP } /* blk=cjkcompatibilityideographssupplement */, - { 0, 10048, 9420, 3, 4, UNI_NV__3_SLASH_20 } /* nv=3/20 */, - { 2, 9346, 0, 4, 0, UNI_idc_values_index } /* idc= */, - { 0, 10027, 1511, 3, 3, UNI_JG__HAH } /* jg=hah */, - { 0, 10027, 5340, 3, 14, UNI_JG__MANICHAEANFIVE } /* jg=manichaeanfive */, - { 0, 2912, 0, 19, 0, UNI_SUNDANESESUP } /* sundanesesupplement */, - { 17, 9768, 719, 4, 9, UNI_XSUX } /* scx=cuneiform */, - { 0, 3259, 0, 4, 0, UNI_IDSB } /* idsb */, - { 0, 8589, 8582, 7, 7, UNI_SC__PHAG } /* script=phagspa */, - { 17, 1552, 9503, 9, 2, 
UNI_MC } /* category=mc */, - { 14, 3836, 7684, 17, 9, UNI_PAUC } /* scriptextensions=paucinhau */, - { 0, 4916, 4944, 3, 14, UNI_TITLE } /* istitlecaseletter */, - { 5, 9496, 0, 4, 0, UNI_BUHD } /* buhd */, - { 0, 9508, 7858, 4, 2, UNI_CCC__22 } /* ccc=22 */, - { 1, 184, 1319, 2, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* issymbolsandpictographsexta */, - { 1, 10296, 0, 12, 0, UNI_POSIXBLANK } /* isposixblank */, - { 1, 6928, 1, 11, 1, -UNI_SD } /* softdotted=n */, - { 2, 3836, 9002, 17, 4, UNI_TELU } /* scriptextensions=telu */, - { 6, 184, 3683, 2, 11, UNI_ETHIOPICEXT } /* isethiopicext */, - { 9, 9290, 9255, 5, 5, -UNI_MATH } /* math=false */, - { 0, 8780, 895, 6, 28, UNI_SUPPUAA } /* block=supplementaryprivateuseareaa */, - { 16, 8219, 0, 4, 0, UNI_JAVA } /* java */, - { 0, 9488, 8442, 4, 7, UNI_INHANUNOO } /* blk=hanunoo */, - { 0, 5791, 4225, 13, 16, UNI_JG__MANICHAEANTWENTY } /* joininggroup=manichaeantwenty */, - { 19, 184, 6409, 2, 4, UNI_MEND } /* ismend */, - { 3, 5037, 9255, 9, 5, -UNI_XPOSIXXDIGIT } /* hexdigit=false */, - { 9, 9560, 0, 4, 0, UNI_GONG } /* gong */, - { 0, 117, 2226, 4, 19, UNI_ININSCRIPTIONALPARTHIAN } /* ininscriptionalparthian */, - { 3, 8589, 9512, 7, 4, UNI_CHRS } /* script=chrs */, - { 3, 5739, 0, 13, 0, UNI_grbase_values_index } /* graphemebase= */, - { 0, 7218, 6169, 10, 4, UNI_LB__GL } /* linebreak=glue */, - { 0, 184, 1901, 3, 21, UNI_INDICNUMBERFORMS } /* iscommonindicnumberforms */, - { 0, 10024, 7, 3, 1, UNI_C } /* gc=c */, - { 1, 117, 5779, 3, 5, UNI_IPAEXT } /* inipaext */, - { 1, 8688, 15, 4, 2, UNI_ARAB } /* isarab */, - { 4, 9444, 9848, 4, 4, UNI_AGE__12 } /* age=v120 */, - { 3, 9768, 9664, 4, 3, UNI_MRO } /* scx=mro */, - { 16, 9460, 0, 4, 0, UNI_ARMI } /* armi */, - { 1, 8589, 3895, 8, 3, UNI_SGNW } /* script=sgnw */, - { 2, 3836, 8407, 17, 7, UNI_DSRT } /* scriptextensions=deseret */, - { 0, 10048, 9050, 3, 5, UNI_NV__1_SLASH_160 } /* nv=1/160 */, - { 1, 9768, 9008, 4, 4, UNI_THAA } /* scx=thaa */, - { 14, 8960, 0, 6, 
0, UNI_nfcqc_values_index } /* nfcqc= */, - { 3, 9262, 8554, 3, 7, UNI_SB__LE } /* sb=oletter */, - { 1, 8267, 36, 8, 1, UNI_RADICAL } /* radical=t */, - { 0, 8855, 0, 2, 0, UNI_CF } /* cf */, - { 8, 1417, 184, 24, 2, UNI_CCC__IS } /* canonicalcombiningclass=is */, - { 0, 9250, 36, 5, 1, UNI_EMOD } /* emod=t */, - { 0, 7155, 8188, 3, 7, UNI_HIRA } /* ishiragana */, - { 19, 9556, 5497, 4, 11, UNI_GCB__SM } /* gcb=spacingmark */, - { 2, 184, 6061, 2, 5, UNI_BIDIC } /* isbidic */, - { 2, 7540, 10135, 9, 3, UNI_EXT } /* extender=yes */, - { 3, 8780, 8470, 6, 7, UNI_INLINEARA } /* block=lineara */, - { 8, 10291, 10308, 5, 5, UNI_POSIXPRINT } /* posixprint */, - { 0, 10027, 6313, 3, 12, UNI_JG__MALAYALAMNGA } /* jg=malayalamnga */, - { 3, 10048, 7469, 3, 1, UNI_NV__5 } /* nv=5 */, - { 51, 9351, 26, 4, 1, UNI_IDS } /* ids=y */, - { 1, 9997, 5829, 3, 3, UNI_BC__RLO } /* bc=rlo */, - { 0, 9488, 9684, 4, 4, UNI_INNEWA } /* blk=newa */, - { 2, 9768, 3025, 4, 8, UNI_CHER } /* scx=cherokee */, - { 0, 1417, 10172, 24, 2, UNI_CCC__9 } /* canonicalcombiningclass=vr */, - { 15, 10333, 7, 3, 1, UNI_SC } /* issc */, - { 0, 7318, 7950, 10, 1, UNI_IN__9 } /* presentin=9 */, - { 0, 2288, 5187, 3, 13, UNI_HIGHSURROGATES } /* inhighsurrogates */, - { 14, 10009, 4532, 3, 6, UNI_DT__MED } /* dt=medial */, - { 0, 6231, 2099, 3, 20, UNI_CJKCOMPATFORMS } /* incjkcompatibilityforms */, - { 16, 3241, 0, 8, 0, UNI_GEOR } /* georgian */, - { 0, 9270, 6506, 3, 11, UNI_PHAISTOS } /* inphaistosdisc */, - { 8, 4643, 0, 15, 0, UNI_ecomp_values_index } /* emojicomponent= */, - { 17, 5791, 8283, 13, 8, UNI_JG__SWASHKAF } /* joininggroup=swashkaf */, - { 0, 5986, 9050, 13, 4, UNI_NV__1_SLASH_16 } /* numericvalue=1/16 */, - { 5, 9508, 3015, 4, 10, UNI_CCC__AR } /* ccc=aboveright */, - { 4, 2280, 9713, 3, 3, UNI_OSGE } /* isosge */, - { 1, 9768, 4868, 4, 15, UNI_NARB } /* scx=oldnortharabian */, - { 1, 9260, 1, 5, 1, -UNI_IDSB } /* idsb=n */, - { 1, 5986, 7803, 13, 8, UNI_NV__1_SLASH_64 } /* 
numericvalue=1.56e-02 */, - { 2, 8179, 0, 8, 0, UNI_GURU } /* gurmukhi */, - { 3, 9488, 8179, 4, 8, UNI_INGURMUKHI } /* blk=gurmukhi */, - { 0, 9277, 7648, 3, 9, UNI_ITAL } /* sc=olditalic */, - { 1, 8882, 36, 6, 1, UNI_GREXT } /* grext=t */, - { 32, 9768, 9315, 4, 5, UNI_ORYA } /* scx=oriya */, - { 0, 10024, 3358, 3, 9, UNI_Z } /* gc=separator */, - { 1, 2429, 0, 20, 0, UNI_PHLI } /* inscriptionalpahlavi */, - { 3, 5986, 10146, 13, 2, UNI_NV__46 } /* numericvalue=46 */, - { 22, 10048, 8042, 3, 2, UNI_NV__18 } /* nv=18 */, - { 5, 8954, 9836, 6, 4, UNI__PERL_NCHAR } /* nchar=true */, - { 0, 4401, 0, 16, 0, UNI_TANGUTSUP } /* tangutsupplement */, - { 0, 8780, 5284, 6, 4, UNI_INLISU } /* block=lisu */, - { 0, 9536, 36, 4, 1, UNI_DEP } /* dep=t */, - { 19, 21, 7027, 2, 11, UNI_YISYLLABLES } /* inyisyllables */, - { 0, 9444, 7765, 4, 1, UNI_AGE__2 } /* age=2 */, - { 0, 9768, 3115, 4, 10, UNI_DEVA } /* scx=devanagari */, - { 0, 184, 3295, 2, 9, UNI_LATINEXTA } /* islatinexta */, - { 2, 4422, 8409, 4, 5, UNI_DSRT } /* indeseret */, - { 2, 4478, 0, 15, 0, UNI_BRAI } /* braillepatterns */, - { 0, 8589, 8470, 7, 7, UNI_SC__LINA } /* script=lineara */, - { 9, 1988, 1, 22, 1, -UNI_LOE } /* logicalorderexception=n */, - { 1, 1417, 7859, 24, 2, UNI_CCC__20 } /* canonicalcombiningclass=20 */, - { 13, 9488, 6517, 4, 12, UNI_PLAYINGCARDS } /* blk=playingcards */, - { 2, 895, 0, 28, 0, UNI_SUPPUAA } /* supplementaryprivateuseareaa */, - { 0, 10027, 6950, 3, 11, UNI_JG__STRAIGHTWAW } /* jg=straightwaw */, - { 0, 2722, 0, 10, 0, UNI_JAMO } /* hanguljamo */, - { 1, 2224, 5607, 3, 13, UNI_SUPPUNCTUATION } /* insuppunctuation */, - { 0, 9277, 3079, 3, 6, UNI_SC__COPT } /* sc=coptic */, - { 1, 5032, 0, 5, 0, UNI_ASCII } /* ascii */, - { 0, 3836, 9484, 17, 4, UNI_BHKS } /* scriptextensions=bhks */, - { 0, 10006, 26, 3, 1, UNI_DI } /* di=y */, - { 1, 10048, 9432, 3, 4, UNI_NV__5_SLASH_12 } /* nv=5/12 */, - { 0, 1979, 47, 10, 1, UNI_LM } /* category=lm */, - { 5, 9688, 0, 3, 0, UNI_NKO } /* 
nko */, - { 2, 9700, 0, 4, 0, UNI_OLCK } /* olck */, - { 1, 9580, 0, 4, 0, UNI_HANO } /* hano */, - { 3, 2182, 1910, 21, 2, UNI_GCB__CN } /* graphemeclusterbreak=cn */, - { 0, 8780, 9038, 6, 6, UNI_INYEZIDI } /* block=yezidi */, - { 0, 6553, 10135, 12, 3, UNI_XIDC } /* xidcontinue=yes */, - { 0, 184, 7428, 2, 4, UNI_WARA } /* iswara */, - { 9, 7088, 2798, 10, 19, UNI_BC__LRO } /* bidiclass=lefttorightoverride */, - { 1, 9768, 6409, 4, 4, UNI_MEND } /* scx=mend */, - { 4, 1417, 756, 24, 2, UNI_CCC__DA } /* canonicalcombiningclass=da */, - { 1, 9768, 6940, 5, 10, UNI_SORA } /* scx=sorasompeng */, - { 13, 400, 0, 6, 0, UNI_CF } /* format */, - { 3, 2182, 3385, 21, 17, UNI_RI } /* graphemeclusterbreak=regionalindicator */, - { 0, 10288, 467, 8, 5, UNI_XPOSIXPUNCT } /* isxposixpunct */, - { 0, 5452, 0, 14, 0, UNI_nfcqc_values_index } /* nfcquickcheck= */, - { 4, 10296, 131, 3, 3, UNI_PALM } /* ispalm */, - { 1, 4033, 1527, 16, 9, UNI__PERL_SURROGATE } /* generalcategory=surrogate */, - { 9, 3836, 4370, 18, 5, UNI_SYRC } /* scriptextensions=syriac */, - { 7, 8984, 1025, 6, 2, -UNI_QMARK } /* qmark=no */, - { 0, 4033, 32, 16, 2, UNI__PERL_SURROGATE } /* generalcategory=cs */, - { 2, 8575, 0, 6, 0, UNI_PATSYN } /* patsyn */, - { 15, 9488, 3295, 4, 18, UNI_LATINEXTADDITIONAL } /* blk=latinextadditional */, - { 1, 8589, 9864, 7, 4, UNI_WCHO } /* script=wcho */, - { 0, 8435, 1025, 7, 2, -UNI_GRBASE } /* grbase=no */, - { 11, 9277, 9796, 3, 4, UNI_SC__SYRC } /* sc=syrc */, - { 0, 8780, 3887, 6, 17, UNI_SUTTONSIGNWRITING } /* block=suttonsignwriting */, - { 1, 9277, 2560, 3, 4, UNI_SC__MAND } /* sc=mand */, - { 20, 3151, 0, 17, 0, UNI_EPRES } /* emojipresentation */, - { 41, 10012, 8948, 3, 6, UNI_EA__NA } /* ea=narrow */, - { 2, 184, 8414, 2, 7, UNI_ELBA } /* iselbasan */, - { 8, 8589, 7666, 7, 9, UNI_ORKH } /* script=oldturkic */, - { 1, 5578, 2529, 15, 4, UNI_SB__ST } /* sentencebreak=sterm */, - { 1, 9277, 7118, 3, 10, UNI_CHRS } /* sc=chorasmian */, - { 2, 4433, 0, 15, 0, 
UNI_ARABICEXTA } /* arabicextendeda */, - { 0, 2855, 0, 12, 0, UNI_MONGOLIANSUP } /* mongoliansup */, - { 1, 1166, 0, 25, 0, UNI_DI } /* defaultignorablecodepoint */, - { 0, 5508, 0, 13, 0, UNI_PATSYN } /* patternsyntax */, - { 0, 6796, 0, 11, 0, UNI_MEDF } /* medefaidrin */, - { 0, 184, 218, 3, 32, UNI_DIACRITICALSEXT } /* iscombiningdiacriticalmarksextended */, - { 1, 9488, 4973, 4, 15, UNI_VEDICEXT } /* blk=vedicextensions */, - { 4, 8400, 36, 7, 1, UNI_COMPEX } /* compex=t */, - { 0, 3836, 382, 17, 4, UNI_EGYP } /* scriptextensions=egyp */, - { 1, 9014, 36, 6, 1, UNI_UIDEO } /* uideo=t */, - { 1, 5791, 5179, 13, 7, UNI_JG__HEHGOAL } /* joininggroup=hehgoal */, - { 1, 6205, 9836, 12, 4, UNI_IDEO } /* ideographic=true */, - { 0, 8882, 1025, 6, 2, -UNI_GREXT } /* grext=no */, - { 1, 3259, 10135, 18, 3, UNI_IDSB } /* idsbinaryoperator=yes */, - { 9, 9275, 6463, 5, 6, UNI_LB__ZWJ } /* insc=joiner */, - { 0, 184, 43, 3, 25, UNI_CJKCOMPATIDEOGRAPHS } /* iscjkcompatibilityideographs */, - { 0, 10030, 7258, 3, 10, UNI_JT__U } /* jt=nonjoining */, - { 0, 7318, 10096, 10, 3, UNI_IN__5 } /* presentin=v50 */, - { 4, 10027, 5378, 3, 4, UNI_JG__KAPH } /* jg=kaph */, - { 18, 10048, 5648, 3, 11, UNI_NV__10000000000 } /* nv=10000000000 */, - { 0, 9345, 26, 5, 1, UNI_XIDC } /* xidc=y */, - { 0, 8997, 10135, 5, 3, UNI_TERM } /* term=yes */, - { 5, 8780, 7585, 6, 9, UNI_LATINEXTC } /* block=latinextc */, - { 5, 10030, 0, 3, 0, UNI_jt_values_index } /* jt= */, - { 4, 867, 0, 11, 0, UNI_PHONETICEXT } /* phoneticext */, - { 1, 8780, 43, 7, 15, UNI_CJKCOMPAT } /* block=cjkcompatibility */, - { 1, 3097, 9552, 18, 4, UNI_DT__FONT } /* decompositiontype=font */, - { 0, 184, 8936, 2, 4, UNI_LYCI } /* islyci */, - { 5, 7585, 0, 9, 0, UNI_LATINEXTC } /* latinextc */, - { 0, 9488, 8638, 4, 7, UNI_INTAGALOG } /* blk=tagalog */, - { 3, 9508, 7874, 4, 2, UNI_CCC__23 } /* ccc=23 */, - { 40, 7218, 1751, 10, 2, UNI_LB__AI } /* linebreak=ai */, - { 0, 9508, 9206, 5, 4, UNI_CCC__35 } /* ccc=ccc35 */, 
- { 0, 9488, 5830, 4, 13, UNI_LOWSURROGATES } /* blk=lowsurrogates */, - { 0, 9488, 7027, 4, 11, UNI_YISYLLABLES } /* blk=yisyllables */, - { 1, 4791, 2247, 4, 9, UNI_INMEETEIMAYEK } /* inmeeteimayek */, - { 8, 6231, 4569, 3, 14, UNI_CURRENCYSYMBOLS } /* incurrencysymbols */, - { 3, 9768, 2817, 4, 19, UNI_MERO } /* scx=meroitichieroglyphs */, - { 1, 8780, 2874, 6, 19, UNI_OTTOMANSIYAQNUMBERS } /* block=ottomansiyaqnumbers */, - { 0, 10048, 7781, 3, 1, UNI_NV__4 } /* nv=4 */, - { 0, 8780, 3937, 6, 16, UNI_BOPOMOFOEXT } /* block=bopomofoextended */, - { 6, 9508, 3564, 4, 13, UNI_CCC__202 } /* ccc=attachedbelow */, - { 1, 7076, 4479, 3, 14, UNI_BRAI } /* inbraillepatterns */, - { 4, 2280, 4306, 3, 4, UNI_C } /* isother */, - { 0, 9488, 8243, 4, 8, UNI_INMAHAJANI } /* blk=mahajani */, - { 17, 8780, 809, 6, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* block=enclosedideographicsupplement */, - { 2, 9768, 8243, 4, 8, UNI_MAHJ } /* scx=mahajani */, - { 1, 9492, 4898, 4, 4, UNI_BPT__O } /* bpt=open */, - { 9, 5791, 7048, 13, 10, UNI_JG__AFRICANQAF } /* joininggroup=africanqaf */, - { 0, 4916, 2532, 5, 16, UNI_TERM } /* isterminalpunctuation */, - { 1, 5986, 8714, 13, 6, UNI_NV__300000 } /* numericvalue=300000 */, - { 0, 4116, 415, 3, 10, UNI_IDEO } /* isideographic */, - { 21, 1465, 0, 13, 0, UNI_M } /* combiningmark */, - { 0, 8780, 923, 6, 28, UNI_SUPPUAB } /* block=supplementaryprivateuseareab */, - { 2, 9768, 6481, 4, 12, UNI_HUNG } /* scx=oldhungarian */, - { 2, 1417, 9026, 24, 6, UNI_CCC__9 } /* canonicalcombiningclass=virama */, - { 1, 9277, 7684, 3, 9, UNI_PAUC } /* sc=paucinhau */, - { 1, 184, 951, 2, 17, UNI_VS } /* isvariationselector */, - { 0, 184, 9604, 2, 4, UNI_KHMR } /* iskhmr */, - { 10, 6576, 26, 11, 1, UNI_XPOSIXALPHA } /* alphabetic=y */, - { 11, 7318, 7821, 10, 1, UNI_IN__8 } /* presentin=8 */, - { 1, 3097, 567, 18, 2, UNI_DT__NB } /* decompositiontype=nb */, - { 2, 7325, 9844, 3, 4, UNI_IN__11 } /* in=v110 */, - { 0, 8780, 9320, 6, 5, UNI_INOSAGE } /* 
block=osage */, - { 0, 4643, 1025, 15, 2, -UNI_ECOMP } /* emojicomponent=no */, - { 8, 3259, 9255, 18, 5, -UNI_IDSB } /* idsbinaryoperator=false */, - { 2, 184, 3341, 2, 8, UNI_DINGBATS } /* isdingbats */, - { 0, 184, 8227, 2, 8, UNI_KANAEXTA } /* iskanaexta */, - { 8, 8780, 8666, 6, 7, UNI_INTIRHUTA } /* block=tirhuta */, - { 1, 8589, 8344, 7, 7, UNI_SC__BENG } /* script=bengali */, - { 0, 5032, 1, 14, 1, -UNI_POSIXXDIGIT } /* asciihexdigit=n */, - { 6, 1417, 9300, 24, 5, UNI_CCC__7 } /* canonicalcombiningclass=nukta */, - { 1, 10298, 0, 10, 0, UNI_POSIXBLANK } /* posixblank */, - { 3, 10009, 10069, 3, 3, UNI_DT__SQR } /* dt=sqr */, - { 67, 8589, 8888, 7, 6, UNI_HATR } /* script=hatran */, - { 0, 2182, 10015, 21, 3, UNI_WB__EB } /* graphemeclusterbreak=ebg */, - { 3, 1417, 5765, 24, 13, UNI_CCC__IS } /* canonicalcombiningclass=iotasubscript */, - { 11, 5003, 0, 15, 0, UNI_ZANB } /* zanabazarsquare */, - { 24, 9277, 8123, 3, 8, UNI_SC__BUGI } /* sc=buginese */, - { 2, 9508, 78, 4, 2, UNI_CCC__AR } /* ccc=ar */, - { 0, 5432, 0, 3, 0, UNI_ANY } /* any */, - { 1, 8589, 9628, 7, 4, UNI_SC__LATN } /* script=latn */, - { 0, 10048, 9428, 3, 4, UNI_NV__3_SLASH_80 } /* nv=3/80 */, - { 1, 7438, 0, 10, 0, UNI_wb_values_index } /* wordbreak= */, - { 10, 184, 6229, 2, 5, UNI_JOINC } /* isjoinc */, - { 1, 9488, 8652, 4, 7, UNI_INTAIVIET } /* blk=taiviet */, - { 0, 8147, 26, 8, 1, UNI_EXTPICT } /* extpict=y */, - { 8, 10048, 9203, 3, 2, UNI_NV__34 } /* nv=34 */, - { 0, 9528, 9255, 4, 5, -UNI_CWU } /* cwu=false */, - { 1, 6553, 26, 12, 1, UNI_XIDC } /* xidcontinue=y */, - { 1, 3836, 6796, 17, 11, UNI_MEDF } /* scriptextensions=medefaidrin */, - { 16, 3836, 2409, 17, 10, UNI_GLAG } /* scriptextensions=glagolitic */, - { 2, 1114, 0, 26, 0, UNI_cwkcf_values_index } /* changeswhennfkccasefolded= */, - { 10, 9508, 9919, 4, 3, UNI_CCC__202 } /* ccc=202 */, - { 11, 8589, 9812, 7, 4, UNI_SC__TAML } /* script=taml */, - { 5, 9444, 7782, 4, 1, UNI_AGE__3 } /* age=3 */, - { 4, 184, 2969, 2, 
19, UNI_SUPARROWSC } /* issupplementalarrowsc */, - { 2, 10048, 8082, 3, 2, UNI_NV__19 } /* nv=19 */, - { 1, 6231, 43, 3, 2, UNI_CJK } /* incjk */, - { 0, 5074, 0, 14, 0, UNI_CJKCOMPATFORMS } /* cjkcompatforms */, - { 0, 8435, 0, 7, 0, UNI_grbase_values_index } /* grbase= */, - { 1, 8509, 1035, 4, 25, UNI_ENCLOSEDCJK } /* inenclosedcjklettersandmonths */, - { 3, 9508, 7178, 4, 4, UNI_CCC__6 } /* ccc=hanr */, - { 2, 6253, 0, 5, 0, UNI_KHMR } /* khmer */, - { 0, 8589, 3241, 7, 4, UNI_SC__GEOR } /* script=geor */, - { 8, 9488, 1586, 5, 22, UNI_BYZANTINEMUSIC } /* blk=byzantinemusicalsymbols */, - { 1, 10027, 2637, 3, 9, UNI_JG__YEHBARREE } /* jg=yehbarree */, - { 2, 10027, 5336, 3, 4, UNI_JG__BETH } /* jg=beth */, - { 0, 5986, 9379, 13, 2, UNI_NV__41 } /* numericvalue=41 */, - { 0, 7218, 8680, 10, 7, UNI_LB__XX } /* linebreak=unknown */, - { 4, 4658, 1025, 15, 2, -UNI_GREXT } /* graphemeextend=no */, - { 1, 8876, 0, 6, 0, UNI_GOTH } /* gothic */, - { 2, 7410, 0, 8, 0, UNI_ASSIGNED } /* assigned */, - { 1, 2912, 0, 9, 0, UNI_SUND } /* sundanese */, - { 2, 8780, 8638, 6, 7, UNI_INTAGALOG } /* block=tagalog */, - { 0, 7318, 9848, 10, 4, UNI_IN__12 } /* presentin=v120 */, - { 1, 1417, 9168, 24, 2, UNI_CCC__27 } /* canonicalcombiningclass=27 */, - { 3, 923, 0, 28, 0, UNI_SUPPUAB } /* supplementaryprivateuseareab */, - { 2, 9488, 2409, 4, 13, UNI_GLAGOLITICSUP } /* blk=glagoliticsup */, - { 5, 21, 6253, 2, 5, UNI_INKHMER } /* inkhmer */, - { 0, 5986, 7859, 13, 6, UNI_NV__200000 } /* numericvalue=200000 */, - { 0, 4989, 1, 3, 33, UNI_UCAS } /* isunifiedcanadianaboriginalsyllabics */, - { 2, 9520, 3, 4, 1, -UNI_CWL } /* cwl=f */, - { 4, 9768, 7, 4, 18, UNI_CANS } /* scx=canadianaboriginal */, - { 6, 8780, 7657, 6, 9, UNI_INOLDPERMIC } /* block=oldpermic */, - { 1, 3581, 0, 17, 0, UNI_UCAS } /* canadiansyllabics */, - { 0, 7325, 10123, 3, 3, UNI_IN__9 } /* in=v90 */, - { 0, 4791, 4274, 3, 15, UNI_MYANMAREXTA } /* inmyanmarextendeda */, - { 2, 1979, 24, 10, 1, 
UNI_LOWERCASELETTER } /* category=ll */, - { 3, 3133, 0, 13, 0, UNI_EMOD } /* emojimodifier */, - { 85, 9277, 8421, 3, 7, UNI_ELYM } /* sc=elymaic */, - { 0, 8780, 1631, 6, 23, UNI_GEOMETRICSHAPESEXT } /* block=geometricshapesextended */, - { 9, 5578, 4305, 14, 5, UNI_SB__XX } /* sentencebreak=other */, - { 2, 8688, 80, 4, 8, UNI_ARABICMATH } /* isarabicmath */, - { 0, 10030, 18, 3, 1, UNI_JT__R } /* jt=r */, - { 33, 10012, 66, 3, 1, UNI_EA__H } /* ea=h */, - { 5, 3836, 8604, 18, 6, UNI_SHAW } /* scriptextensions=shavian */, - { 2, 9488, 2469, 4, 20, UNI_INNYIAKENGPUACHUEHMONG } /* blk=nyiakengpuachuehmong */, - { 0, 6231, 43, 3, 25, UNI_CJKCOMPATIDEOGRAPHS } /* incjkcompatibilityideographs */, - { 0, 3836, 2608, 17, 6, UNI_BRAH } /* scriptextensions=brahmi */, - { 1, 10048, 9916, 3, 3, UNI_NV__2_SLASH_5 } /* nv=2/5 */, - { 0, 9277, 9888, 3, 4, UNI_ZANB } /* sc=zanb */, - { 0, 8509, 751, 4, 14, UNI_ENCLOSEDALPHANUM } /* inenclosedalphanum */, - { 5, 10033, 5536, 3, 14, UNI_LB__PO } /* lb=postfixnumeric */, - { 0, 7739, 9836, 8, 4, UNI_IDS } /* idstart=true */, - { 4, 10033, 4538, 3, 15, UNI_LB__CB } /* lb=contingentbreak */, - { 18, 9277, 9644, 3, 4, UNI_MEDF } /* sc=medf */, - { 18, 9556, 125, 4, 2, UNI_LB__CR } /* gcb=cr */, - { 3, 3836, 8611, 18, 6, UNI_SIDD } /* scriptextensions=siddham */, - { 3, 6265, 0, 12, 0, UNI_NL } /* letternumber */, - { 33, 184, 316, 2, 33, UNI_SUPMATHOPERATORS } /* issupplementalmathematicaloperators */, - { 1, 9997, 5130, 3, 14, UNI_BC__EN } /* bc=europeannumber */, - { 14, 9488, 7138, 4, 10, UNI_COMPATJAMO } /* blk=compatjamo */, - { 0, 8780, 8498, 6, 7, UNI_INMULTANI } /* block=multani */, - { 2, 9768, 8666, 4, 4, UNI_TIRH } /* scx=tirh */, - { 2, 8780, 1018, 6, 5, UNI_MUSIC } /* block=music */, - { 3, 9488, 3115, 4, 13, UNI_DEVANAGARIEXT } /* blk=devanagariext */, - { 1, 9277, 6972, 3, 11, UNI_SC__SYLO } /* sc=sylotinagri */, - { 0, 3836, 7660, 17, 4, UNI_PERM } /* scriptextensions=perm */, - { 0, 8589, 8337, 7, 7, UNI_AVST } /* 
script=avestan */, - { 4, 8589, 8456, 7, 7, UNI_SC__KNDA } /* script=kannada */, - { 6, 9768, 9560, 4, 4, UNI_GONG } /* scx=gong */, - { 0, 9768, 9660, 4, 4, UNI_MLYM } /* scx=mlym */, - { 0, 2280, 6323, 3, 3, UNI_OGAM } /* isogam */, - { 0, 8780, 7567, 6, 9, UNI_INKHUDAWADI } /* block=khudawadi */, - { 0, 9277, 7168, 3, 10, UNI_DIAK } /* sc=divesakuru */, - { 0, 7318, 10099, 10, 3, UNI_IN__5_DOT_1 } /* presentin=v51 */, - { 3, 8589, 8561, 7, 7, UNI_OSMA } /* script=osmanya */, - { 1, 8780, 951, 6, 18, UNI_INVS } /* block=variationselectors */, - { 9, 2665, 0, 19, 0, UNI_COUNTINGROD } /* countingrodnumerals */, - { 0, 8688, 97, 3, 9, UNI_XPOSIXALPHA } /* isalphabetic */, - { 3, 3374, 0, 11, 0, UNI_wspace_values_index } /* whitespace= */, - { 8, 9277, 18, 6, 1, UNI_KHAR } /* sc=khar */, - { 2, 6231, 115, 4, 23, UNI_DIACRITICALS } /* incombiningdiacriticalmarks */, - { 16, 9640, 36, 4, 1, UNI_LOE } /* loe=t */, - { 9, 1591, 383, 3, 31, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* inegyptianhieroglyphformatcontrols */, - { 20, 9488, 2140, 4, 18, UNI_CYRILLICSUP } /* blk=cyrillicsupplement */, - { 2, 8780, 2666, 7, 10, UNI_COUNTINGROD } /* block=countingrod */, - { 5, 8589, 8315, 7, 8, UNI_UGAR } /* script=ugaritic */, - { 0, 5986, 8738, 13, 6, UNI_NV__600000 } /* numericvalue=600000 */, - { 14, 1537, 2555, 24, 14, UNI_INPC__BOTTOMANDRIGHT } /* indicpositionalcategory=bottomandright */, - { 18, 8780, 7576, 6, 9, UNI_LATINEXTB } /* block=latinextb */, - { 1, 10296, 467, 7, 5, UNI_POSIXPUNCT } /* isposixpunct */, - { 2, 9020, 9255, 6, 5, -UNI_XPOSIXUPPER } /* upper=false */, - { 1, 4049, 0, 11, 0, UNI_GEORGIANEXT } /* georgianext */, - { 7, 3025, 0, 8, 0, UNI_CHER } /* cherokee */, - { 0, 8589, 9592, 7, 4, UNI_HMNP } /* script=hmnp */, - { 4, 10048, 7987, 3, 8, UNI_NV__5_SLASH_8 } /* nv=6.25e-01 */, - { 0, 10033, 1140, 3, 26, UNI_LB__CJ } /* lb=conditionaljapanesestarter */, - { 0, 6241, 6708, 12, 11, UNI_JT__C } /* joiningtype=joincausing */, - { 0, 2122, 0, 7, 0, 
UNI_RADICAL } /* radical */, - { 0, 3836, 3025, 17, 4, UNI_CHER } /* scriptextensions=cher */, - { 0, 10027, 5620, 3, 14, UNI_JG__HAMZAONHEHGOAL } /* jg=tehmarbutagoal */, - { 0, 7068, 0, 10, 0, UNI_ASCII } /* basiclatin */, - { 0, 3836, 9335, 17, 5, UNI_TAKR } /* scriptextensions=takri */, - { 9, 328, 0, 21, 0, UNI_MATHOPERATORS } /* mathematicaloperators */, - { 0, 21, 1218, 2, 8, UNI_INKATAKANA } /* inkatakana */, - { 2, 184, 6086, 3, 11, UNI_CHESSSYMBOLS } /* ischesssymbols */, - { 37, 10012, 0, 3, 0, UNI_ea_values_index } /* ea= */, - { 1, 5324, 6387, 4, 10, UNI_INMASARAMGONDI } /* inmasaramgondi */, - { 0, 8589, 7684, 7, 4, UNI_PAUC } /* script=pauc */, - { 16, 2140, 0, 11, 0, UNI_CYRILLICSUP } /* cyrillicsup */, - { 1, 5986, 10138, 13, 2, UNI_NV__38 } /* numericvalue=38 */, - { 3, 9488, 4097, 4, 16, UNI_HIGHPUSURROGATES } /* blk=highpusurrogates */, - { 1, 9488, 8124, 5, 7, UNI_INBUGINESE } /* blk=buginese */, - { 5, 184, 382, 2, 4, UNI_EGYP } /* isegyp */, - { 2, 8780, 3683, 6, 11, UNI_ETHIOPICEXT } /* block=ethiopicext */, - { 43, 1552, 5498, 10, 10, UNI_MC } /* category=spacingmark */, - { 4, 10048, 8750, 3, 3, UNI_NV__800 } /* nv=800 */, - { 1, 3529, 3, 18, 1, -UNI_VS } /* variationselector=f */, - { 12, 9768, 9002, 4, 4, UNI_TELU } /* scx=telu */, - { 0, 7028, 2, 3, 1, UNI_YI } /* isyi */, - { 0, 9528, 1025, 4, 2, -UNI_CWU } /* cwu=no */, - { 1, 4643, 1, 15, 1, -UNI_ECOMP } /* emojicomponent=n */, - { 0, 10009, 1294, 3, 5, UNI_DT__SUP } /* dt=super */, - { 1, 9524, 36, 4, 1, UNI_CWT } /* cwt=t */, - { 27, 8589, 3937, 7, 4, UNI_SC__BOPO } /* script=bopo */, - { 1, 7088, 5130, 10, 14, UNI_BC__EN } /* bidiclass=europeannumber */, - { 0, 10291, 5718, 5, 5, UNI_POSIXALNUM } /* posixalnum */, - { 14, 8858, 1025, 6, 2, -UNI_ECOMP } /* ecomp=no */, - { 25, 8780, 1879, 7, 18, UNI_CJKCOMPATIDEOGRAPHS } /* block=cjkcompatideographs */, - { 3, 8780, 510, 7, 19, UNI_CJK } /* block=cjkunifiedideographs */, - { 1, 4001, 0, 7, 0, UNI_CPRT } /* cypriot */, - { 1, 5986, 
9055, 13, 3, UNI_NV__1_SLASH_3 } /* numericvalue=1/3 */, - { 9, 9997, 6493, 3, 12, UNI_BC__ON } /* bc=otherneutral */, - { 15, 9508, 6642, 4, 11, UNI_CCC__DB } /* ccc=doublebelow */, - { 6, 8780, 9684, 6, 4, UNI_INNEWA } /* block=newa */, - { 0, 10033, 21, 3, 2, UNI_LB__IN } /* lb=in */, - { 2, 1537, 2549, 24, 3, UNI_INPC__TOP } /* indicpositionalcategory=top */, - { 28, 4017, 0, 16, 0, UNI_PF } /* finalpunctuation */, - { 0, 8996, 26, 6, 1, UNI_STERM } /* sterm=y */, - { 3, 8780, 1060, 6, 27, UNI_OCR } /* block=opticalcharacterrecognition */, - { 5, 10333, 8611, 3, 3, UNI_SIDD } /* issidd */, - { 0, 2140, 0, 8, 0, UNI_CYRL } /* cyrillic */, - { 0, 10048, 7782, 3, 1, UNI_NV__3 } /* nv=3 */, - { 4, 9997, 3773, 3, 3, UNI_BC__RLI } /* bc=rli */, - { 2, 3836, 3785, 17, 4, UNI_MANI } /* scriptextensions=mani */, - { 1, 10126, 0, 3, 1, UNI_VO__U } /* vo=u */, - { 2, 184, 5497, 2, 11, UNI_MC } /* isspacingmark */, - { 2, 2779, 26, 19, 1, UNI_IDST } /* idstrinaryoperator=y */, - { 3, 184, 2855, 2, 19, UNI_MONGOLIANSUP } /* ismongoliansupplement */, - { 2, 10033, 8236, 4, 7, UNI_LB__LF } /* lb=linefeed */, - { 38, 1768, 0, 22, 0, UNI_cwcf_values_index } /* changeswhencasefolded= */, - { 18, 10333, 47, 3, 1, UNI_SM } /* issm */, - { 0, 908, 0, 14, 0, UNI_PUA } /* privateusearea */, - { 1, 184, 510, 3, 29, UNI_CJKEXTA } /* iscjkunifiedideographsextensiona */, - { 1, 8435, 0, 6, 0, UNI_GRBASE } /* grbase */, - { 0, 10048, 9208, 3, 2, UNI_NV__35 } /* nv=35 */, - { 0, 7218, 495, 10, 2, UNI_LB__NU } /* linebreak=nu */, - { 0, 10048, 8744, 3, 6, UNI_NV__700000 } /* nv=700000 */, - { 17, 184, 9628, 2, 4, UNI_LATN } /* islatn */, - { 0, 8589, 9568, 7, 4, UNI_SC__GREK } /* script=grek */, - { 0, 8575, 3, 7, 1, -UNI_PATSYN } /* patsyn=f */, - { 1, 9508, 9191, 5, 4, UNI_CCC__32 } /* ccc=ccc32 */, - { 0, 10333, 8618, 3, 3, UNI_SOYO } /* issoyo */, - { 8, 7576, 0, 9, 0, UNI_LATINEXTB } /* latinextb */, - { 13, 3836, 8219, 17, 4, UNI_JAVA } /* scriptextensions=java */, - { 3, 3836, 9476, 
17, 4, UNI_AVST } /* scriptextensions=avst */, - { 2, 9640, 0, 3, 0, UNI_LOE } /* loe */, - { 1, 1966, 6463, 22, 6, UNI_LB__ZWJ } /* indicsyllabiccategory=joiner */, - { 0, 6805, 254, 6, 29, UNI_MISCMATHSYMBOLSA } /* inmiscellaneousmathematicalsymbolsa */, - { 0, 8780, 7058, 6, 10, UNI_ARABICEXTA } /* block=arabicexta */, - { 0, 184, 9325, 2, 5, UNI_RUNR } /* isrunic */, - { 7, 10024, 9225, 3, 5, UNI_XPOSIXCNTRL } /* gc=cntrl */, - { 8, 9596, 911, 4, 1, UNI_GCB__V } /* hst=v */, - { 0, 9277, 4385, 3, 6, UNI_TANG } /* sc=tangut */, - { 64, 8780, 1911, 6, 11, UNI_NUMBERFORMS } /* block=numberforms */, - { 38, 5986, 8720, 13, 2, UNI_NV__40 } /* numericvalue=40 */, - { 1, 8780, 0, 6, 34, UNI_UCAS } /* block=unifiedcanadianaboriginalsyllabics */, - { 1, 184, 7585, 2, 9, UNI_LATINEXTC } /* islatinextc */, - { 1, 3836, 9572, 17, 4, UNI_GUJR } /* scriptextensions=gujr */, - { 1, 8589, 2245, 7, 11, UNI_MTEI } /* script=meeteimayek */, - { 12, 9488, 3649, 4, 17, UNI_CYRILLICEXTB } /* blk=cyrillicextendedb */, - { 4, 7438, 8144, 10, 3, UNI_WB__EB } /* wordbreak=gaz */, - { 10, 7155, 5038, 3, 7, UNI_XPOSIXXDIGIT } /* ishexdigit */, - { 0, 7540, 1, 9, 1, -UNI_EXT } /* extender=n */, - { 0, 21, 7567, 2, 9, UNI_INKHUDAWADI } /* inkhudawadi */, - { 9, 9488, 1219, 5, 4, UNI_INBATAK } /* blk=batak */, - { 2, 7088, 426, 10, 2, UNI_BC__ES } /* bidiclass=es */, - { 2, 3836, 9676, 17, 4, UNI_NARB } /* scriptextensions=narb */, - { 2, 1417, 8002, 24, 2, UNI_CCC__26 } /* canonicalcombiningclass=26 */, - { 4, 10063, 1, 3, 1, -UNI_SD } /* sd=n */, - { 0, 4033, 1587, 16, 1, UNI_Z } /* generalcategory=z */, - { 6, 18, 0, 2, 0, UNI_RI } /* ri */, - { 0, 6554, 26, 11, 1, UNI_IDC } /* idcontinue=y */, - { 6, 6829, 0, 11, 0, UNI_MYANMAREXTB } /* myanmarextb */, - { 1, 7318, 9991, 10, 3, UNI_IN__9 } /* presentin=9.0 */, - { 0, 9277, 9330, 3, 5, UNI_SC__TALE } /* sc=taile */, - { 0, 9480, 0, 4, 0, UNI_BATK } /* batk */, - { 31, 1979, 0, 11, 0, UNI_LO } /* category=lo */, - { 2, 4116, 7559, 3, 8, 
UNI_QAAI } /* isinherited */, - { 0, 1417, 7778, 24, 2, UNI_CCC__21 } /* canonicalcombiningclass=21 */, - { 2, 8780, 6133, 6, 12, UNI_ETHIOPICEXTA } /* block=ethiopicexta */, - { 5, 7228, 10135, 10, 3, UNI_XPOSIXLOWER } /* lowercase=yes */, - { 0, 9277, 7308, 3, 10, UNI_PHNX } /* sc=phoenician */, - { 2, 9720, 0, 4, 0, UNI_PHLP } /* phlp */, - { 0, 8589, 9668, 7, 4, UNI_MTEI } /* script=mtei */, - { 0, 9768, 8876, 4, 6, UNI_GOTH } /* scx=gothic */, - { 0, 2224, 2913, 3, 8, UNI_INSUNDANESE } /* insundanese */, - { 41, 8780, 1344, 6, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* block=symbolsforlegacycomputing */, - { 0, 184, 9748, 2, 4, UNI_RJNG } /* isrjng */, - { 1, 10048, 8744, 3, 2, UNI_NV__70 } /* nv=70 */, - { 0, 5843, 0, 9, 0, UNI_MLYM } /* malayalam */, - { 7, 9275, 4417, 5, 16, UNI_INSC__VOWELINDEPENDENT } /* insc=vowelindependent */, - { 9, 9488, 8456, 4, 7, UNI_INKANNADA } /* blk=kannada */, - { 8, 10129, 26, 3, 1, UNI_VS } /* vs=y */, - { 1, 8780, 4973, 6, 8, UNI_VEDICEXT } /* block=vedicext */, - { 1, 10182, 435, 6, 5, UNI__PERL_NCHAR } /* _perl_nchar */, - { 2, 4791, 2247, 4, 19, UNI_MEETEIMAYEKEXT } /* inmeeteimayekextensions */, - { 28, 184, 1585, 2, 14, UNI_BYZANTINEMUSIC } /* isbyzantinemusic */, - { 3, 9270, 909, 3, 9, UNI_PUA } /* inprivateuse */, - { 1, 2182, 8144, 21, 3, UNI_WB__EB } /* graphemeclusterbreak=gaz */, - { 0, 9290, 10135, 5, 3, UNI_MATH } /* math=yes */, - { 0, 9277, 9310, 3, 5, UNI_OGAM } /* sc=ogham */, - { 0, 8449, 0, 6, 0, UNI_HYPHEN } /* hyphen */, - { 16, 11, 0, 2, 0, UNI_DI } /* di */, - { 0, 8688, 8338, 3, 6, UNI_AVST } /* isavestan */, - { 2, 10033, 7486, 3, 9, UNI_LB__AI } /* lb=ambiguous */, - { 0, 1828, 3, 6, 1, -UNI_CASED } /* cased=f */, - { 0, 10288, 9225, 8, 5, UNI_XPOSIXCNTRL } /* isxposixcntrl */, - { 7, 3169, 0, 4, 0, UNI_ETHI } /* ethi */, - { 24, 1552, 5713, 9, 13, UNI_XPOSIXDIGIT } /* category=decimalnumber */, - { 0, 8780, 78, 6, 6, UNI_INARABIC } /* block=arabic */, - { 1, 8780, 382, 6, 32, 
UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* block=egyptianhieroglyphformatcontrols */, - { 2, 1417, 9171, 25, 4, UNI_CCC__28 } /* canonicalcombiningclass=ccc28 */, - { 4, 8589, 7428, 7, 4, UNI_WARA } /* script=wara */, - { 50, 1768, 10135, 22, 3, UNI_CWCF } /* changeswhencasefolded=yes */, - { 0, 7438, 3385, 10, 17, UNI_RI } /* wordbreak=regionalindicator */, - { 0, 9536, 9255, 4, 5, -UNI_DEP } /* dep=false */, - { 32, 7218, 3379, 10, 5, UNI_LB__SP } /* linebreak=space */, - { 3, 1552, 5438, 9, 14, UNI_SK } /* category=modifiersymbol */, - { 5, 5791, 10045, 13, 3, UNI_JG__MIM } /* joininggroup=mim */, - { 2, 42, 0, 36, 0, UNI_CJKCOMPATIDEOGRAPHSSUP } /* cjkcompatibilityideographssupplement */, - { 7, 8780, 8596, 6, 7, UNI_SC__SHRD } /* block=sharada */, - { 3, 9488, 8414, 4, 7, UNI_INELBASAN } /* blk=elbasan */, - { 9, 9488, 5778, 4, 13, UNI_IPAEXT } /* blk=ipaextensions */, - { 19, 7288, 0, 10, 0, UNI_SOGO } /* oldsogdian */, - { 1, 10296, 83, 3, 2, UNI_PCM } /* ispcm */, - { 0, 6231, 6086, 3, 11, UNI_CHESSSYMBOLS } /* inchesssymbols */, - { 2, 3632, 0, 17, 0, UNI_CYRILLICEXTA } /* cyrillicextendeda */, - { 0, 8780, 9664, 6, 3, UNI_INMRO } /* block=mro */, - { 4, 10009, 9552, 3, 4, UNI_DT__FONT } /* dt=font */, - { 3, 5986, 8744, 13, 6, UNI_NV__700000 } /* numericvalue=700000 */, - { 6, 7438, 8323, 10, 7, UNI_WB__LE } /* wordbreak=aletter */, - { 0, 8930, 9836, 6, 4, UNI_XPOSIXLOWER } /* lower=true */, - { 4, 1417, 3015, 24, 5, UNI_CCC__A } /* canonicalcombiningclass=above */, - { 2, 9488, 8187, 4, 8, UNI_INHIRAGANA } /* blk=hiragana */, - { 0, 8780, 1677, 6, 9, UNI_LATINEXTE } /* block=latinexte */, - { 1, 5324, 8493, 4, 5, UNI_INMARCHEN } /* inmarchen */, - { 0, 9508, 7765, 4, 2, UNI_CCC__25 } /* ccc=25 */, - { 10, 9245, 0, 5, 0, UNI_DOGR } /* dogra */, - { 16, 184, 4658, 2, 14, UNI_GREXT } /* isgraphemeextend */, - { 0, 1966, 4823, 22, 15, UNI_INSC__MODIFYINGLETTER } /* indicsyllabiccategory=modifyingletter */, - { 0, 2182, 34, 21, 6, UNI_GCB__EX } /* 
graphemeclusterbreak=extend */, - { 0, 9508, 9196, 5, 4, UNI_CCC__33 } /* ccc=ccc33 */, - { 0, 5986, 10140, 13, 2, UNI_NV__39 } /* numericvalue=39 */, - { 4, 8780, 720, 7, 15, UNI_CUNEIFORMNUMBERS } /* block=cuneiformnumbers */, - { 14, 8780, 1013, 6, 5, UNI_INGREEK } /* block=greek */, - { 0, 4129, 0, 9, 0, UNI_LATIN1 } /* latin1sup */, - { 0, 10048, 7995, 3, 8, UNI_NV__1_SLASH_16 } /* nv=6.25e-02 */, - { 6, 9070, 26, 5, 1, UNI_POSIXXDIGIT } /* ahex=y */, - { 1, 8589, 2684, 7, 19, UNI_EGYP } /* script=egyptianhieroglyphs */, - { 0, 7218, 6178, 10, 2, UNI_LB__ZW } /* linebreak=zw */, - { 0, 184, 1677, 2, 23, UNI_LATINEXTADDITIONAL } /* islatinextendedadditional */, - { 0, 8589, 9065, 7, 5, UNI_SC__ADLM } /* script=adlam */, - { 32, 6231, 219, 4, 31, UNI_DIACRITICALSEXT } /* incombiningdiacriticalmarksextended */, - { 4, 8589, 4793, 7, 15, UNI_MERC } /* script=meroiticcursive */, - { 0, 3836, 9700, 17, 4, UNI_OLCK } /* scriptextensions=olck */, - { 0, 1966, 4417, 22, 5, UNI_INSC__VOWEL } /* indicsyllabiccategory=vowel */, - { 1, 10048, 5648, 3, 13, UNI_NV__1000000000000 } /* nv=1000000000000 */, - { 0, 10024, 4898, 3, 15, UNI_PS } /* gc=openpunctuation */, - { 1, 2218, 2470, 3, 19, UNI_INNYIAKENGPUACHUEHMONG } /* innyiakengpuachuehmong */, - { 0, 184, 7068, 2, 10, UNI_ASCII } /* isbasiclatin */, - { 2, 9488, 8131, 4, 8, UNI_INDUPLOYAN } /* blk=duployan */, - { 0, 5986, 7987, 13, 8, UNI_NV__5_SLASH_8 } /* numericvalue=6.25e-01 */, - { 0, 4989, 1368, 3, 3, UNI_UGAR } /* isugar */, - { 12, 1417, 8817, 25, 5, UNI_CCC__129 } /* canonicalcombiningclass=ccc129 */, - { 0, 9756, 0, 4, 0, UNI_RUNR } /* runr */, - { 1, 8780, 8456, 6, 7, UNI_INKANNADA } /* block=kannada */, - { 8, 8780, 838, 6, 29, UNI_MISCARROWS } /* block=miscellaneoussymbolsandarrows */, - { 3, 5791, 5368, 13, 14, UNI_JG__MANICHAEANKAPH } /* joininggroup=manichaeankaph */, - { 2, 184, 3421, 2, 18, UNI_RUMI } /* isruminumeralsymbols */, - { 0, 10296, 7, 3, 1, UNI_PC } /* ispc */, - { 5, 10048, 8010, 3, 2, 
UNI_NV__36 } /* nv=36 */, - { 41, 598, 0, 2, 0, UNI_XPOSIXCNTRL } /* cc */, - { 1, 5830, 0, 13, 0, UNI_LOWSURROGATES } /* lowsurrogates */, - { 1, 9488, 6972, 4, 11, UNI_INSYLOTINAGRI } /* blk=sylotinagri */, - { 2, 4688, 1284, 15, 9, UNI_IDENTIFIERTYPE__EXCLUSION } /* identifiertype=exclusion */, - { 32, 8852, 3, 6, 1, -UNI_CWKCF } /* cwkcf=f */, - { 0, 9508, 7922, 4, 2, UNI_CCC__24 } /* ccc=24 */, - { 1, 6397, 0, 12, 0, UNI_MATHALPHANUM } /* mathalphanum */, - { 1, 8780, 8888, 6, 6, UNI_INHATRAN } /* block=hatran */, - { 1, 10048, 7765, 3, 1, UNI_NV__2 } /* nv=2 */, - { 4, 5986, 9361, 13, 3, UNI_NV__1_SLASH_2 } /* numericvalue=1/2 */, - { 0, 1966, 4305, 22, 5, UNI_INSC__OTHER } /* indicsyllabiccategory=other */, - { 0, 4033, 74, 16, 2, UNI_ME } /* generalcategory=me */, - { 2, 5986, 7995, 13, 8, UNI_NV__1_SLASH_16 } /* numericvalue=6.25e-02 */, - { 2, 6231, 2141, 3, 10, UNI_CYRILLICSUP } /* incyrillicsup */, - { 8, 8996, 3, 6, 1, -UNI_STERM } /* sterm=f */, - { 0, 184, 9032, 2, 6, UNI_WCHO } /* iswancho */, - { 8, 3937, 0, 16, 0, UNI_BOPOMOFOEXT } /* bopomofoextended */, - { 10, 10048, 8066, 3, 2, UNI_NV__28 } /* nv=28 */, - { 8, 2779, 3, 19, 1, -UNI_IDST } /* idstrinaryoperator=f */, - { 6, 10009, 1417, 3, 9, UNI_DT__CAN } /* dt=canonical */, - { 1, 3836, 9748, 17, 4, UNI_RJNG } /* scriptextensions=rjng */, - { 22, 3836, 7675, 17, 9, UNI_PALM } /* scriptextensions=palmyrene */, - { 14, 4643, 10135, 15, 3, UNI_ECOMP } /* emojicomponent=yes */, - { 8, 10033, 125, 3, 2, UNI_LB__CR } /* lb=cr */, - { 0, 8780, 8187, 6, 8, UNI_INHIRAGANA } /* block=hiragana */, - { 12, 9500, 0, 4, 0, UNI_CAKM } /* cakm */, - { 0, 4542, 4051, 4, 14, UNI_GEORGIANEXT } /* ingeorgianextended */, - { 0, 9235, 1, 5, 1, -UNI_CWCM } /* cwcm=n */, - { 0, 8780, 4569, 7, 14, UNI_CURRENCYSYMBOLS } /* block=currencysymbols */, - { 9, 3836, 4273, 17, 7, UNI_MYMR } /* scriptextensions=myanmar */, - { 1, 3836, 3115, 17, 10, UNI_DEVA } /* scriptextensions=devanagari */, - { 0, 8589, 8786, 7, 6, 
UNI_CARI } /* script=carian */, - { 8, 9277, 9680, 3, 4, UNI_NBAT } /* sc=nbat */, - { 0, 1417, 7950, 24, 1, UNI_CCC__9 } /* canonicalcombiningclass=9 */, - { 1, 9277, 9900, 3, 4, UNI_ZZZZ } /* sc=zzzz */, - { 0, 9680, 0, 4, 0, UNI_NBAT } /* nbat */, - { 11, 3836, 9504, 17, 4, UNI_CANS } /* scriptextensions=cans */, - { 0, 1417, 7765, 24, 2, UNI_CCC__25 } /* canonicalcombiningclass=25 */, - { 0, 2032, 36, 22, 1, UNI__PERL_NCHAR } /* noncharactercodepoint=t */, - { 33, 10290, 467, 6, 5, UNI_XPOSIXPUNCT } /* xposixpunct */, - { 0, 2076, 0, 15, 0, UNI_TRANSPORTANDMAP } /* transportandmap */, - { 34, 9508, 5649, 4, 1, UNI_CCC__0 } /* ccc=0 */, - { 18, 9260, 9255, 5, 5, -UNI_IDSB } /* idsb=false */, - { 4, 5986, 7781, 13, 2, UNI_NV__43 } /* numericvalue=43 */, - { 1, 184, 9305, 2, 5, UNI_NSHU } /* isnushu */, - { 3, 5986, 7779, 13, 8, UNI_NV__1_SLASH_7 } /* numericvalue=1.43e-01 */, - { 0, 10132, 495, 3, 2, UNI_WB__NU } /* wb=nu */, - { 0, 10033, 5746, 3, 5, UNI_EBASE } /* lb=ebase */, - { 1, 1166, 26, 26, 1, UNI_DI } /* defaultignorablecodepoint=y */, - { 1, 9768, 1537, 5, 3, UNI_SIND } /* scx=sind */, - { 0, 7218, 4842, 10, 2, UNI_LB__QU } /* linebreak=qu */, - { 0, 3921, 0, 9, 0, UNI_ARABICSUP } /* arabicsup */, - { 1, 7088, 102, 10, 2, UNI_BC__ET } /* bidiclass=et */, - { 6, 8768, 1, 6, 1, -UNI_BIDIC } /* bidic=n */, - { 1, 1417, 2449, 24, 4, UNI_CCC__L } /* canonicalcombiningclass=left */, - { 0, 184, 7576, 2, 9, UNI_LATINEXTB } /* islatinextb */, - { 1, 9488, 3666, 4, 17, UNI_CYRILLICEXTC } /* blk=cyrillicextendedc */, - { 1, 7076, 2609, 3, 5, UNI_INBRAHMI } /* inbrahmi */, - { 0, 8449, 1, 7, 1, -UNI_HYPHEN } /* hyphen=n */, - { 86, 9556, 1087, 4, 7, UNI_GCB__PP } /* gcb=prepend */, - { 0, 8997, 1, 5, 1, -UNI_TERM } /* term=n */, - { 1, 9265, 0, 5, 0, UNI_idst_values_index } /* idst= */, - { 0, 4033, 2061, 16, 14, UNI_LM } /* generalcategory=modifierletter */, - { 0, 9488, 2245, 4, 14, UNI_MEETEIMAYEKEXT } /* blk=meeteimayekext */, - { 0, 8589, 8561, 7, 4, 
UNI_OSMA } /* script=osma */, - { 6, 3836, 2485, 17, 4, UNI_MONG } /* scriptextensions=mong */, - { 0, 2182, 262, 21, 2, UNI_GCB__SM } /* graphemeclusterbreak=sm */, - { 10, 8589, 3598, 7, 17, UNI_AGHB } /* script=caucasianalbanian */, - { 100, 3836, 2288, 18, 3, UNI_SINH } /* scriptextensions=sinh */, - { 14, 9768, 9880, 4, 4, UNI_YI } /* scx=yiii */, - { 1, 10027, 10000, 3, 3, UNI_JG__BEH } /* jg=beh */, - { 2, 9488, 4049, 4, 16, UNI_GEORGIANEXT } /* blk=georgianextended */, - { 1, 5037, 1025, 9, 2, -UNI_XPOSIXXDIGIT } /* hexdigit=no */, - { 0, 7684, 0, 9, 0, UNI_PAUC } /* paucinhau */, - { 2, 9070, 9836, 5, 4, UNI_POSIXXDIGIT } /* ahex=true */, - { 0, 8589, 8187, 7, 4, UNI_SC__HIRA } /* script=hira */, - { 16, 9768, 9628, 4, 4, UNI_LATN } /* scx=latn */, - { 0, 1417, 1755, 24, 2, UNI_CCC__DB } /* canonicalcombiningclass=db */, - { 6, 10048, 1249, 3, 3, UNI_NV__NAN } /* nv=nan */, - { 32, 2061, 0, 4, 0, UNI_MODI } /* modi */, - { 2, 9524, 9255, 4, 5, -UNI_CWT } /* cwt=false */, - { 5, 10288, 5040, 8, 5, UNI_XPOSIXDIGIT } /* isxposixdigit */, - { 5, 184, 4598, 2, 15, UNI_DIACRITICALSEXT } /* isdiacriticalsext */, - { 0, 9346, 9255, 4, 5, -UNI_IDC } /* idc=false */, - { 0, 6181, 0, 12, 0, UNI_GONG } /* gunjalagondi */, - { 4, 6928, 9836, 11, 4, UNI_SD } /* softdotted=true */, - { 0, 21, 1673, 2, 4, UNI_JAMO } /* injamo */, - { 0, 8762, 3, 6, 1, -UNI_XPOSIXALPHA } /* alpha=f */, - { 3, 1700, 0, 23, 0, UNI_SHORTHANDFORMATCONTROLS } /* shorthandformatcontrols */, - { 5, 8589, 9712, 7, 4, UNI_OSGE } /* script=osge */, - { 98, 1417, 9940, 24, 3, UNI_CCC__A } /* canonicalcombiningclass=230 */, - { 1, 5791, 756, 13, 3, UNI_JG__DAL } /* joininggroup=dal */, - { 4, 184, 122, 2, 9, UNI_DIA } /* isdiacritic */, - { 0, 7218, 5585, 10, 2, UNI_EBASE } /* linebreak=eb */, - { 0, 10291, 96, 5, 5, UNI_POSIXALPHA } /* posixalpha */, - { 1, 10024, 1287, 3, 2, UNI_UPPERCASELETTER } /* gc=lu */, - { 41, 9235, 1025, 5, 2, -UNI_CWCM } /* cwcm=no */, - { 2, 7408, 0, 10, 0, UNI_CN } /* 
unassigned */, - { 18, 9262, 0, 3, 0, UNI_sb_values_index } /* sb= */, - { 0, 3836, 9797, 18, 3, UNI_SYRC } /* scriptextensions=syrc */, - { 2, 7155, 1655, 3, 5, UNI_HANG } /* ishangul */, - { 1, 382, 0, 32, 0, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* egyptianhieroglyphformatcontrols */, - { 0, 5746, 3, 6, 1, -UNI_EBASE } /* ebase=f */, - { 1, 3385, 10135, 18, 3, UNI_RI } /* regionalindicator=yes */, - { 7, 9240, 9836, 5, 4, UNI_DASH } /* dash=true */, - { 1, 7218, 0, 10, 0, UNI_lb_values_index } /* linebreak= */, - { 4, 1417, 9176, 25, 4, UNI_CCC__29 } /* canonicalcombiningclass=ccc29 */, - { 1, 10288, 6554, 3, 3, UNI_XIDC } /* isxidc */, - { 0, 3901, 8173, 4, 6, UNI_INGUJARATI } /* ingujarati */, - { 1, 3649, 0, 17, 0, UNI_CYRILLICEXTB } /* cyrillicextendedb */, - { 0, 9277, 7684, 3, 4, UNI_PAUC } /* sc=pauc */, - { 1, 1417, 7978, 24, 2, UNI_CCC__16 } /* canonicalcombiningclass=16 */, - { 11, 5214, 0, 6, 0, UNI_KANGXI } /* kangxi */, - { 0, 5578, 400, 14, 6, UNI_SB__FO } /* sentencebreak=format */, - { 52, 9277, 2245, 3, 11, UNI_MTEI } /* sc=meeteimayek */, - { 1, 8780, 9315, 6, 5, UNI_INORIYA } /* block=oriya */, - { 0, 2218, 16, 3, 1, UNI_NB } /* innb */, - { 0, 9277, 3241, 3, 4, UNI_SC__GEOR } /* sc=geor */, - { 2, 1768, 0, 21, 0, UNI_CWCF } /* changeswhencasefolded */, - { 2, 1856, 36, 22, 1, UNI_CWU } /* changeswhenuppercased=t */, - { 8, 8589, 8942, 7, 6, UNI_LYDI } /* script=lydian */, - { 13, 9488, 7368, 4, 10, UNI_SMALLFORMS } /* blk=smallforms */, - { 0, 8930, 3, 6, 1, -UNI_XPOSIXLOWER } /* lower=f */, - { 20, 9488, 3600, 4, 4, UNI_UCAS } /* blk=ucas */, - { 0, 4033, 6851, 16, 11, UNI_LO } /* generalcategory=otherletter */, - { 16, 8780, 7594, 6, 9, UNI_LATINEXTD } /* block=latinextd */, - { 1, 7088, 3187, 10, 18, UNI_BC__ET } /* bidiclass=europeanterminator */, - { 18, 7318, 9982, 10, 3, UNI_IN__6_DOT_3 } /* presentin=6.3 */, - { 2, 9508, 8002, 4, 2, UNI_CCC__26 } /* ccc=26 */, - { 1, 8780, 3937, 6, 8, UNI_INBOPOMOFO } /* block=bopomofo */, - { 0, 
9508, 9181, 5, 4, UNI_CCC__30 } /* ccc=ccc30 */, - { 0, 5452, 26, 14, 1, UNI_NFCQC__Y } /* nfcquickcheck=y */, - { 0, 1867, 0, 5, 0, UNI_XPOSIXUPPER } /* upper */, - { 1, 10033, 3379, 3, 5, UNI_LB__SP } /* lb=space */, - { 1, 10009, 6421, 3, 12, UNI_DT__NONCANON } /* dt=noncanonical */, - { 1, 9488, 0, 4, 34, UNI_UCAS } /* blk=unifiedcanadianaboriginalsyllabics */, - { 0, 10048, 8003, 3, 8, UNI_NV__1_SLASH_160 } /* nv=6.25e-03 */, - { 0, 5116, 26, 14, 1, UNI_EMOD } /* emojimodifier=y */, - { 0, 8780, 478, 6, 31, UNI_MATHALPHANUM } /* block=mathematicalalphanumericsymbols */, - { 0, 10333, 8618, 3, 6, UNI_SOYO } /* issoyombo */, - { 6, 9488, 8666, 4, 7, UNI_INTIRHUTA } /* blk=tirhuta */, - { 0, 8996, 9255, 6, 5, -UNI_STERM } /* sterm=false */, - { 0, 8780, 4002, 7, 15, UNI_CYPRIOTSYLLABARY } /* block=cypriotsyllabary */, - { 1, 10290, 7438, 6, 4, UNI_XPOSIXWORD } /* xposixword */, - { 1, 1585, 0, 23, 0, UNI_BYZANTINEMUSIC } /* byzantinemusicalsymbols */, - { 0, 4113, 952, 3, 17, UNI_INVS } /* invariationselectors */, - { 0, 2280, 9321, 3, 4, UNI_OSGE } /* isosage */, - { 6, 9672, 0, 4, 0, UNI_MYMR } /* mymr */, - { 18, 9277, 0, 3, 0, UNI_sc_values_index } /* sc= */, - { 0, 9277, 9008, 3, 4, UNI_SC__THAA } /* sc=thaa */, - { 0, 9277, 7428, 3, 4, UNI_WARA } /* sc=wara */, - { 12, 184, 6385, 2, 12, UNI_GONM } /* ismasaramgondi */, - { 0, 5947, 0, 13, 0, UNI_MAYANNUMERALS } /* mayannumerals */, - { 0, 9277, 9628, 3, 4, UNI_SC__LATN } /* sc=latn */, - { 4, 8894, 0, 6, 0, UNI_joinc_values_index } /* joinc= */, - { 0, 9275, 6457, 5, 12, UNI_INSC__NUMBERJOINER } /* insc=numberjoiner */, - { 0, 5986, 9061, 13, 4, UNI_NV__1_SLASH_12 } /* numericvalue=1/12 */, - { 2, 8187, 0, 8, 0, UNI_HIRA } /* hiragana */, - { 0, 184, 1879, 3, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* iscjkcompatideographssup */, - { 9, 9508, 3572, 4, 9, UNI_CCC__BL } /* ccc=belowleft */, - { 1, 3683, 0, 16, 0, UNI_ETHIOPICEXT } /* ethiopicextended */, - { 0, 184, 3358, 2, 9, UNI_Z } /* isseparator */, - { 1, 
1966, 4523, 22, 15, UNI_INSC__CONSONANTMEDIAL } /* indicsyllabiccategory=consonantmedial */, - { 0, 9768, 9484, 4, 4, UNI_BHKS } /* scx=bhks */, - { 1, 8780, 4613, 6, 15, UNI_DIACRITICALSSUP } /* block=diacriticalssup */, - { 0, 9277, 9792, 3, 4, UNI_SOGO } /* sc=sogo */, - { 17, 184, 9692, 2, 4, UNI_NSHU } /* isnshu */, - { 1, 2182, 6169, 21, 12, UNI_WB__EB } /* graphemeclusterbreak=glueafterzwj */, - { 0, 7318, 9856, 10, 4, UNI_IN__13 } /* presentin=v130 */, - { 1, 3836, 9832, 17, 4, UNI_TIBT } /* scriptextensions=tibt */, - { 0, 9270, 468, 3, 10, UNI_INPUNCTUATION } /* inpunctuation */, - { 2, 5791, 5843, 13, 13, UNI_JG__MALAYALAMLLLA } /* joininggroup=malayalamllla */, - { 2, 3097, 45, 18, 3, UNI_DT__COM } /* decompositiontype=com */, - { 0, 10048, 4134, 3, 1, UNI_NV__1 } /* nv=1 */, - { 0, 8463, 0, 7, 0, UNI_KALI } /* kayahli */, - { 0, 8435, 9836, 7, 4, UNI_GRBASE } /* grbase=true */, - { 24, 6553, 3, 12, 1, -UNI_XIDC } /* xidcontinue=f */, - { 1, 4583, 0, 15, 0, UNI_PD } /* dashpunctuation */, - { 16, 10288, 5040, 3, 5, UNI_XPOSIXXDIGIT } /* isxdigit */, - { 0, 9768, 9736, 4, 4, UNI_COPT } /* scx=qaac */, - { 2, 8780, 4928, 6, 15, UNI_TAMILSUP } /* block=tamilsupplement */, - { 2, 9768, 9900, 4, 4, UNI_ZZZZ } /* scx=zzzz */, - { 44, 10333, 17, 3, 1, UNI_SO } /* isso */, - { 1, 8442, 0, 7, 0, UNI_HANO } /* hanunoo */, - { 1, 1828, 0, 5, 0, UNI_CASED } /* cased */, - { 0, 8894, 26, 6, 1, UNI_JOINC } /* joinc=y */, - { 1, 1834, 26, 22, 1, UNI_CWT } /* changeswhentitlecased=y */, - { 0, 78, 0, 35, 0, UNI_ARABICMATH } /* arabicmathematicalalphabeticsymbols */, - { 0, 10033, 3385, 3, 17, UNI_RI } /* lb=regionalindicator */, - { 1, 8589, 2288, 8, 6, UNI_SC__SINH } /* script=sinhala */, - { 0, 8688, 5033, 3, 12, UNI_POSIXXDIGIT } /* isasciihexdigit */, - { 8, 3374, 10135, 11, 3, UNI_XPOSIXSPACE } /* whitespace=yes */, - { 2, 7158, 3, 10, 1, -UNI_DIA } /* diacritic=f */, - { 2, 8589, 1218, 7, 8, UNI_SC__KANA } /* script=katakana */, - { 2, 5986, 9924, 13, 2, 
UNI_NV__42 } /* numericvalue=42 */, - { 4, 184, 8853, 3, 4, UNI_CWKCF } /* iscwkcf */, - { 3, 10048, 9984, 3, 2, UNI_NV__37 } /* nv=37 */, - { 0, 1845, 0, 9, 0, UNI_TITLE } /* titlecase */, - { 0, 9350, 0, 5, 0, UNI_xids_values_index } /* xids= */, - { 2, 8780, 6253, 6, 5, UNI_INKHMER } /* block=khmer */, - { 0, 184, 570, 3, 29, UNI_CJKEXTC } /* iscjkunifiedideographsextensionc */, - { 0, 5791, 7016, 13, 11, UNI_JG__YEHWITHTAIL } /* joininggroup=yehwithtail */, - { 3, 10009, 1253, 3, 7, UNI_DT__INIT } /* dt=initial */, - { 3, 184, 4808, 2, 15, UNI_MISCPICTOGRAPHS } /* ismiscpictographs */, - { 3, 9488, 2684, 4, 19, UNI_INEGYPTIANHIEROGLYPHS } /* blk=egyptianhieroglyphs */, - { 3, 2529, 26, 20, 1, UNI_TERM } /* terminalpunctuation=y */, - { 1, 9488, 4479, 5, 14, UNI_BRAI } /* blk=braillepatterns */, - { 1, 2224, 4370, 3, 15, UNI_SYRIACSUP } /* insyriacsupplement */, - { 0, 8589, 9516, 7, 4, UNI_SC__CPRT } /* script=cprt */, - { 0, 7088, 0, 11, 0, UNI_BC__B } /* bidiclass=b */, - { 0, 1417, 7922, 24, 2, UNI_CCC__24 } /* canonicalcombiningclass=24 */, - { 10, 3836, 8243, 17, 8, UNI_MAHJ } /* scriptextensions=mahajani */, - { 0, 8589, 9484, 7, 4, UNI_BHKS } /* script=bhks */, - { 5, 184, 6229, 2, 11, UNI_JOINC } /* isjoincontrol */, - { 0, 4033, 1217, 16, 2, UNI_SK } /* generalcategory=sk */, - { 3, 9640, 9836, 4, 4, UNI_LOE } /* loe=true */, - { 0, 7739, 36, 8, 1, UNI_IDS } /* idstart=t */, - { 2, 9277, 9668, 3, 4, UNI_MTEI } /* sc=mtei */, - { 0, 9997, 24, 3, 1, UNI_BC__L } /* bc=l */, - { 1, 184, 4448, 2, 4, UNI_BAMU } /* isbamu */, - { 3, 9277, 9592, 3, 4, UNI_HMNP } /* sc=hmnp */, - { 34, 9277, 9776, 3, 4, UNI_SGNW } /* sc=sgnw */, - { 3, 6205, 36, 12, 1, UNI_IDEO } /* ideographic=t */, - { 16, 7088, 3756, 10, 3, UNI_BC__NSM } /* bidiclass=nsm */, - { 0, 21, 9032, 2, 6, UNI_INWANCHO } /* inwancho */, - { 3, 2182, 125, 21, 2, UNI_LB__CR } /* graphemeclusterbreak=cr */, - { 17, 8589, 8179, 7, 8, UNI_SC__GURU } /* script=gurmukhi */, - { 2, 9277, 8337, 3, 7, UNI_AVST 
} /* sc=avestan */, - { 0, 9536, 9836, 4, 4, UNI_DEP } /* dep=true */, - { 0, 9262, 69, 3, 2, UNI_SB__UP } /* sb=up */, - { 6, 2054, 0, 22, 0, UNI_MODIFIERLETTERS } /* spacingmodifierletters */, - { 1, 7218, 7512, 10, 2, UNI_LB__BB } /* linebreak=bb */, - { 0, 5674, 0, 12, 0, UNI_BIDIM } /* bidimirrored */, - { 2, 9488, 6481, 4, 12, UNI_INOLDHUNGARIAN } /* blk=oldhungarian */, - { 10, 184, 11, 2, 3, UNI_DIA } /* isdia */, - { 6, 4116, 3260, 3, 16, UNI_IDSB } /* isidsbinaryoperator */, - { 1, 5037, 26, 9, 1, UNI_XPOSIXXDIGIT } /* hexdigit=y */, - { 32, 9508, 7890, 4, 2, UNI_CCC__33 } /* ccc=33 */, - { 0, 9277, 9548, 3, 4, UNI_DSRT } /* sc=dsrt */, - { 0, 5791, 7055, 13, 3, UNI_JG__QAF } /* joininggroup=qaf */, - { 4, 21, 9285, 2, 5, UNI_INLIMBU } /* inlimbu */, - { 16, 9277, 719, 3, 9, UNI_XSUX } /* sc=cuneiform */, - { 8, 8780, 1218, 6, 8, UNI_INKATAKANA } /* block=katakana */, - { 2, 9488, 1319, 4, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* blk=symbolsandpictographsexta */, - { 0, 1417, 7821, 24, 1, UNI_CCC__8 } /* canonicalcombiningclass=8 */, - { 6, 10296, 96, 7, 5, UNI_POSIXALPHA } /* isposixalpha */, - { 0, 8780, 4448, 6, 15, UNI_BAMUMSUP } /* block=bamumsupplement */, - { 8, 7218, 3385, 10, 17, UNI_RI } /* linebreak=regionalindicator */, - { 1, 9636, 0, 4, 0, UNI_LINB } /* linb */, - { 0, 9488, 467, 4, 11, UNI_INPUNCTUATION } /* blk=punctuation */, - { 17, 9277, 8942, 3, 6, UNI_LYDI } /* sc=lydian */, - { 2, 10024, 1171, 3, 2, UNI_TITLE } /* gc=lt */, - { 0, 4033, 4017, 16, 16, UNI_PF } /* generalcategory=finalpunctuation */, - { 0, 10033, 6179, 3, 2, UNI_LB__WJ } /* lb=wj */, - { 38, 4658, 9255, 15, 5, -UNI_GREXT } /* graphemeextend=false */, - { 16, 10048, 8714, 3, 3, UNI_NV__300 } /* nv=300 */, - { 1, 9235, 0, 5, 0, UNI_cwcm_values_index } /* cwcm= */, - { 0, 9596, 36, 4, 1, UNI_GCB__T } /* hst=t */, - { 20, 9768, 9283, 4, 4, UNI_PHLI } /* scx=phli */, - { 0, 8762, 9255, 6, 5, -UNI_XPOSIXALPHA } /* alpha=false */, - { 4, 3836, 8561, 17, 7, UNI_OSMA } /* 
scriptextensions=osmanya */, - { 0, 8589, 7, 7, 18, UNI_CANS } /* script=canadianaboriginal */, - { 1, 9488, 6554, 4, 3, UNI_INIDC } /* blk=idc */, - { 0, 8984, 1, 6, 1, -UNI_QMARK } /* qmark=n */, - { 24, 10027, 6301, 3, 12, UNI_JG__MALAYALAMLLA } /* jg=malayalamlla */, - { 3, 184, 9564, 2, 4, UNI_GONM } /* isgonm */, - { 0, 4033, 6873, 16, 11, UNI_SO } /* generalcategory=othersymbol */, - { 0, 8780, 6385, 6, 12, UNI_INMASARAMGONDI } /* block=masaramgondi */, - { 49, 8762, 9836, 6, 4, UNI_XPOSIXALPHA } /* alpha=true */, - { 0, 184, 10170, 2, 2, UNI_CASEDLETTER } /* isl_ */, - { 0, 8589, 9900, 7, 4, UNI_ZZZZ } /* script=zzzz */, - { 0, 10063, 9836, 3, 4, UNI_SD } /* sd=true */, - { 0, 9488, 3169, 4, 18, UNI_ETHIOPICSUP } /* blk=ethiopicsupplement */, - { 2, 6229, 0, 11, 0, UNI_JOINC } /* joincontrol */, - { 1, 9277, 9002, 3, 6, UNI_SC__TELU } /* sc=telugu */, - { 1, 8780, 7119, 7, 9, UNI_INCHORASMIAN } /* block=chorasmian */, - { 13, 6553, 9255, 12, 5, -UNI_XIDC } /* xidcontinue=false */, - { 2, 9277, 9335, 3, 5, UNI_SC__TAKR } /* sc=takri */, - { 0, 4829, 2411, 4, 18, UNI_GLAGOLITICSUP } /* inglagoliticsupplement */, - { 2, 8589, 8491, 7, 7, UNI_MARC } /* script=marchen */, - { 0, 1856, 9255, 22, 5, -UNI_CWU } /* changeswhenuppercased=false */, - { 4, 10048, 7923, 3, 8, UNI_NV__2_SLASH_5 } /* nv=4.00e-01 */, - { 49, 9768, 8942, 4, 4, UNI_LYDI } /* scx=lydi */, - { 4, 7318, 7987, 10, 3, UNI_IN__6_DOT_2 } /* presentin=6.2 */, - { 0, 3666, 0, 17, 0, UNI_CYRILLICEXTC } /* cyrillicextendedc */, - { 5, 9032, 0, 6, 0, UNI_WCHO } /* wancho */, - { 1, 10027, 6157, 3, 12, UNI_JG__FINALSEMKATH } /* jg=finalsemkath */, - { 0, 9540, 36, 4, 1, UNI_DIA } /* dia=t */, - { 0, 3836, 9516, 17, 4, UNI_CPRT } /* scriptextensions=cprt */, - { 2, 9277, 7, 3, 18, UNI_CANS } /* sc=canadianaboriginal */, - { 2, 9277, 3025, 3, 4, UNI_CHER } /* sc=cher */, - { 2, 184, 9752, 2, 4, UNI_ROHG } /* isrohg */, - { 0, 5564, 3, 14, 1, -UNI_QMARK } /* quotationmark=f */, - { 1, 9508, 9186, 5, 4, 
UNI_CCC__31 } /* ccc=ccc31 */, - { 3, 8780, 9310, 6, 5, UNI_INOGHAM } /* block=ogham */, - { 1, 9277, 2224, 3, 21, UNI_PRTI } /* sc=inscriptionalparthian */, - { 0, 1552, 1465, 9, 13, UNI_M } /* category=combiningmark */, - { 1, 2280, 125, 3, 2, UNI_OCR } /* isocr */, - { 0, 9508, 9223, 4, 2, UNI_CCC__91 } /* ccc=91 */, - { 12, 5791, 65, 15, 2, UNI_JG__KAPH } /* joininggroup=kaph */, - { 0, 184, 951, 2, 18, UNI_INVS } /* isvariationselectors */, - { 1, 10126, 3511, 3, 18, UNI_VO__TU } /* vo=transformedupright */, - { 5, 9277, 1115, 3, 4, UNI_SC__HANG } /* sc=hang */, - { 32, 7218, 21, 10, 2, UNI_LB__IN } /* linebreak=in */, - { 5, 4916, 9336, 3, 4, UNI_TAKR } /* istakri */, - { 1, 9277, 8407, 3, 7, UNI_DSRT } /* sc=deseret */, - { 50, 10132, 8505, 3, 7, UNI_WB__NL } /* wb=newline */, - { 0, 1417, 7933, 24, 2, UNI_CCC__17 } /* canonicalcombiningclass=17 */, - { 6, 5791, 2627, 13, 19, UNI_JG__BURUSHASKIYEHBARREE } /* joininggroup=burushaskiyehbarree */, - { 0, 8780, 2141, 7, 7, UNI_INCYRILLIC } /* block=cyrillic */, - { 6, 10333, 8604, 3, 6, UNI_SHAW } /* isshavian */, - { 2, 10027, 5934, 3, 13, UNI_JG__MANICHAEANWAW } /* jg=manichaeanwaw */, - { 0, 184, 5494, 2, 14, UNI_MN } /* isnonspacingmark */, - { 9, 5986, 8003, 13, 8, UNI_NV__1_SLASH_160 } /* numericvalue=6.25e-03 */, - { 0, 10132, 72, 3, 2, UNI_WB__LE } /* wb=le */, - { 14, 7076, 8346, 4, 5, UNI_INBENGALI } /* inbengali */, - { 18, 21, 9624, 2, 3, UNI_INLAO } /* inlao */, - { 1, 9488, 2076, 4, 22, UNI_TRANSPORTANDMAP } /* blk=transportandmapsymbols */, - { 0, 1988, 0, 21, 0, UNI_LOE } /* logicalorderexception */, - { 10, 4916, 2077, 3, 14, UNI_TRANSPORTANDMAP } /* istransportandmap */, - { 2, 5578, 0, 14, 0, UNI_sb_values_index } /* sentencebreak= */, - { 2, 4791, 6830, 3, 10, UNI_MYANMAREXTB } /* inmyanmarextb */, - { 0, 8780, 5661, 6, 13, UNI_AEGEANNUMBERS } /* block=aegeannumbers */, - { 0, 10024, 5592, 3, 14, UNI_ZS } /* gc=spaceseparator */, - { 6, 2140, 0, 21, 0, UNI_CYRILLICSUP } /* 
cyrillicsupplementary */, - { 0, 8852, 10135, 6, 3, UNI_CWKCF } /* cwkcf=yes */, - { 0, 9488, 923, 4, 28, UNI_SUPPUAB } /* blk=supplementaryprivateuseareab */, - { 3, 8147, 1942, 10, 3, -UNI_EXTPICT } /* extpict=false */, - { 2, 8780, 6181, 6, 12, UNI_INGUNJALAGONDI } /* block=gunjalagondi */, - { 3, 8589, 9732, 7, 4, UNI_PRTI } /* script=prti */, - { 6, 3382, 3, 3, 1, -UNI_CE } /* ce=f */, - { 8, 10048, 5649, 3, 1, UNI_NV__0 } /* nv=0 */, - { 0, 9508, 4134, 4, 1, UNI_CCC__1 } /* ccc=1 */, - { 0, 7218, 7486, 10, 9, UNI_LB__AI } /* linebreak=ambiguous */, - { 0, 7308, 0, 10, 0, UNI_PHNX } /* phoenician */, - { 1, 9277, 57, 3, 2, UNI_SC__YI } /* sc=yi */, - { 1, 8589, 9832, 7, 4, UNI_TIBT } /* script=tibt */, - { 2, 1552, 5593, 10, 13, UNI_ZS } /* category=spaceseparator */, - { 0, 8547, 0, 7, 0, UNI_OLCK } /* olchiki */, - { 4, 3836, 7621, 17, 9, UNI_NBAT } /* scriptextensions=nabataean */, - { 0, 6805, 187, 6, 16, UNI_MISCSYMBOLS } /* inmiscellaneoussymbols */, - { 0, 749, 0, 21, 0, UNI_ENCLOSEDALPHANUM } /* enclosedalphanumerics */, - { 8, 9768, 8123, 4, 4, UNI_BUGI } /* scx=bugi */, - { 1, 21, 5033, 3, 4, UNI_ASCII } /* inascii */, - { 2, 3836, 8942, 17, 4, UNI_LYDI } /* scriptextensions=lydi */, - { 1, 9768, 9872, 4, 4, UNI_XPEO } /* scx=xpeo */, - { 28, 10033, 414, 3, 11, UNI_LB__ID } /* lb=ideographic */, - { 19, 9444, 10120, 4, 3, UNI_AGE__8 } /* age=v80 */, - { 4, 10033, 988, 3, 2, UNI_LB__CP } /* lb=cp */, - { 0, 10048, 8714, 3, 2, UNI_NV__30 } /* nv=30 */, - { 43, 5791, 5892, 13, 3, UNI_JG__NUN } /* joininggroup=nun */, - { 1, 10129, 9836, 3, 4, UNI_VS } /* vs=true */, - { 3, 184, 540, 3, 29, UNI_CJKEXTB } /* iscjkunifiedideographsextensionb */, - { 0, 1552, 0, 10, 0, UNI_S } /* category=s */, - { 1, 8780, 4793, 6, 15, UNI_INMEROITICCURSIVE } /* block=meroiticcursive */, - { 4, 9997, 2509, 3, 20, UNI_BC__RLE } /* bc=righttoleftembedding */, - { 11, 3836, 9592, 17, 4, UNI_HMNP } /* scriptextensions=hmnp */, - { 0, 3079, 0, 18, 0, UNI_COPTICEPACTNUMBERS } /* 
copticepactnumbers */, - { 40, 3836, 9604, 17, 4, UNI_KHMR } /* scriptextensions=khmr */, - { 0, 8780, 3683, 6, 17, UNI_ETHIOPICEXTA } /* block=ethiopicextendeda */, - { 0, 7158, 26, 10, 1, UNI_DIA } /* diacritic=y */, - { 1, 4916, 1846, 3, 8, UNI_TITLE } /* istitlecase */, - { 1, 8400, 0, 6, 0, UNI_COMPEX } /* compex */, - { 0, 6469, 5713, 12, 7, UNI_XPOSIXDIGIT } /* numerictype=decimal */, - { 64, 10024, 728, 3, 6, UNI_N } /* gc=number */, - { 1, 9508, 7806, 4, 1, UNI_CCC__6 } /* ccc=6 */, - { 0, 3836, 7630, 17, 9, UNI_TALU } /* scriptextensions=newtailue */, - { 17, 9277, 9095, 3, 5, UNI_SC__BUHD } /* sc=buhid */, - { 2, 9728, 0, 4, 0, UNI_MIAO } /* plrd */, - { 2, 7088, 4321, 10, 16, UNI_BC__S } /* bidiclass=segmentseparator */, - { 17, 8780, 1294, 6, 25, UNI_SUPERANDSUB } /* block=superscriptsandsubscripts */, - { 2, 5674, 26, 13, 1, UNI_BIDIM } /* bidimirrored=y */, - { 9, 9488, 3632, 4, 17, UNI_CYRILLICEXTA } /* blk=cyrillicextendeda */, - { 0, 3836, 9812, 17, 4, UNI_TAML } /* scriptextensions=taml */, - { 0, 21, 6253, 2, 12, UNI_KHMERSYMBOLS } /* inkhmersymbols */, - { 0, 8694, 36, 7, 1, UNI_XPOSIXSPACE } /* wspace=t */, - { 0, 8864, 1, 6, 1, -UNI_EMOJI } /* emoji=n */, - { 0, 3836, 8618, 18, 3, UNI_SOYO } /* scriptextensions=soyo */, - { 3, 8589, 9560, 7, 4, UNI_SC__GONG } /* script=gong */, - { 32, 184, 4478, 2, 15, UNI_BRAI } /* isbraillepatterns */, - { 1, 7155, 8889, 3, 5, UNI_HATR } /* ishatran */, - { 1, 9488, 8275, 4, 8, UNI_SPECIALS } /* blk=specials */, - { 0, 9508, 8727, 4, 2, UNI_CCC__32 } /* ccc=32 */, - { 0, 9768, 9704, 4, 4, UNI_ORKH } /* scx=orkh */, - { 2, 3097, 749, 18, 3, UNI_DT__ENC } /* decompositiontype=enc */, - { 0, 9768, 1176, 5, 3, UNI_SORA } /* scx=sora */, - { 0, 10327, 47, 5, 1, UNI_PERM } /* isperm */, - { 17, 5060, 9836, 14, 4, UNI_CI } /* caseignorable=true */, - { 2, 8267, 1025, 8, 2, -UNI_RADICAL } /* radical=no */, - { 1, 10048, 5648, 3, 9, UNI_NV__100000000 } /* nv=100000000 */, - { 0, 184, 9612, 2, 4, UNI_KNDA } /* 
isknda */, - { 0, 7325, 7754, 3, 2, UNI_IN__11 } /* in=11 */, - { 0, 5791, 6325, 13, 12, UNI_JG__MALAYALAMNNA } /* joininggroup=malayalamnna */, - { 0, 5060, 3, 14, 1, -UNI_CI } /* caseignorable=f */, - { 45, 6818, 0, 11, 0, UNI_MYANMAREXTA } /* myanmarexta */, - { 1, 5578, 34, 14, 2, UNI_SB__EX } /* sentencebreak=ex */, - { 0, 8589, 8786, 7, 4, UNI_CARI } /* script=cari */, - { 3, 1552, 728, 9, 6, UNI_N } /* category=number */, - { 6, 5986, 7947, 13, 8, UNI_NV__3_SLASH_64 } /* numericvalue=4.69e-02 */, - { 0, 8589, 9448, 7, 4, UNI_AGHB } /* script=aghb */, - { 0, 4116, 5779, 3, 5, UNI_IPAEXT } /* isipaext */, - { 7, 8780, 720, 7, 29, UNI_CUNEIFORMNUMBERS } /* block=cuneiformnumbersandpunctuation */, - { 1, 10320, 17, 5, 1, UNI_XPEO } /* isxpeo */, - { 14, 9508, 9121, 5, 4, UNI_CCC__18 } /* ccc=ccc18 */, - { 0, 6231, 2120, 3, 13, UNI_CJKRADICALSSUP } /* incjkradicalssup */, - { 1, 9277, 6385, 3, 12, UNI_SC__GONM } /* sc=masaramgondi */, - { 0, 8575, 9836, 7, 4, UNI_PATSYN } /* patsyn=true */, - { 4, 8589, 8491, 7, 4, UNI_MARC } /* script=marc */, - { 3, 9277, 8840, 3, 6, UNI_SC__CAKM } /* sc=chakma */, - { 0, 1417, 9943, 24, 3, UNI_CCC__AR } /* canonicalcombiningclass=232 */, - { 2, 2784, 3923, 4, 14, UNI_ARABICSUP } /* inarabicsupplement */, - { 0, 9768, 8315, 4, 8, UNI_UGAR } /* scx=ugaritic */, - { 0, 9632, 0, 4, 0, UNI_LINA } /* lina */, - { 0, 10027, 4773, 3, 5, UNI_JG__SADHE } /* jg=sadhe */, - { 1, 7249, 9, 4, 16, UNI_CANS } /* iscanadianaboriginal */, - { 0, 2182, 70, 21, 2, UNI_GCB__PP } /* graphemeclusterbreak=pp */, - { 1, 6928, 1025, 11, 2, -UNI_SD } /* softdotted=no */, - { 2, 10129, 36, 3, 1, UNI_VS } /* vs=t */, - { 13, 9768, 1654, 4, 6, UNI_HANG } /* scx=hangul */, - { 7, 8780, 749, 6, 30, UNI_ENCLOSEDALPHANUMSUP } /* block=enclosedalphanumericsupplement */, - { 0, 7249, 754, 4, 3, UNI_CASED } /* iscased */, - { 2, 3295, 0, 18, 0, UNI_LATINEXTADDITIONAL } /* latinextadditional */, - { 34, 8882, 9836, 6, 4, UNI_GREXT } /* grext=true */, - { 0, 5578, 
7, 15, 1, UNI_SB__SC } /* sentencebreak=sc */, - { 0, 2529, 9837, 21, 3, UNI_TERM } /* terminalpunctuation=true */, - { 0, 316, 0, 33, 0, UNI_SUPMATHOPERATORS } /* supplementalmathematicaloperators */, - { 0, 9262, 3358, 3, 3, UNI_SB__SE } /* sb=sep */, - { 0, 6231, 3045, 4, 16, UNI_HALFMARKS } /* incombininghalfmarks */, - { 16, 184, 1857, 3, 20, UNI_CWU } /* ischangeswhenuppercased */, - { 1, 10009, 435, 4, 2, UNI_DT__ENC } /* dt=enc */, - { 0, 1552, 4898, 9, 15, UNI_PS } /* category=openpunctuation */, - { 0, 8589, 6973, 8, 10, UNI_SC__SYLO } /* script=sylotinagri */, - { 6, 184, 5752, 2, 13, UNI_GREEKEXT } /* isgreekextended */, - { 3, 7458, 0, 10, 0, UNI_YIRADICALS } /* yiradicals */, - { 0, 10027, 4203, 3, 3, UNI_JG__LAM } /* jg=lam */, - { 0, 1828, 1025, 6, 2, -UNI_CASED } /* cased=no */, - { 0, 10048, 8820, 3, 2, UNI_NV__29 } /* nv=29 */, - { 0, 1087, 1, 27, 1, -UNI_PCM } /* prependedconcatenationmark=n */, - { 3, 9768, 8315, 4, 4, UNI_UGAR } /* scx=ugar */, - { 0, 5564, 9255, 14, 5, -UNI_QMARK } /* quotationmark=false */, - { 1, 7218, 6686, 10, 11, UNI_LB__IN } /* linebreak=inseparable */, - { 8, 7738, 1025, 9, 2, -UNI_XIDS } /* xidstart=no */, - { 8, 42, 0, 9, 0, UNI_CJKCOMPAT } /* cjkcompat */, - { 2, 8617, 0, 4, 0, UNI_SOYO } /* soyo */, - { 6, 3598, 0, 17, 0, UNI_AGHB } /* caucasianalbanian */, - { 0, 9768, 8107, 4, 8, UNI_BALI } /* scx=balinese */, - { 2, 8996, 0, 6, 0, UNI_sterm_values_index } /* sterm= */, - { 0, 6409, 0, 4, 0, UNI_MEND } /* mend */, - { 1, 7318, 9979, 10, 3, UNI_IN__6_DOT_1 } /* presentin=6.1 */, - { 0, 1552, 74, 9, 2, UNI_ME } /* category=me */, - { 0, 6620, 0, 11, 0, UNI_DOMINO } /* dominotiles */, - { 0, 9488, 2076, 4, 15, UNI_TRANSPORTANDMAP } /* blk=transportandmap */, - { 0, 1922, 0, 22, 0, UNI_DIACRITICALSFORSYMBOLS } /* diacriticalsforsymbols */, - { 16, 7218, 7108, 10, 10, UNI_LB__BA } /* linebreak=breakafter */, - { 0, 9444, 10090, 4, 3, UNI_AGE__4 } /* age=v40 */, - { 4, 9245, 0, 4, 0, UNI_DOGR } /* dogr */, - { 5, 5986, 
7811, 13, 8, UNI_NV__1_SLASH_6 } /* numericvalue=1.67e-01 */, - { 21, 4033, 1822, 16, 2, UNI_NL } /* generalcategory=nl */, - { 0, 7218, 23, 10, 2, UNI_LB__AL } /* linebreak=al */, - { 0, 8589, 8407, 7, 7, UNI_DSRT } /* script=deseret */, - { 0, 9488, 3079, 4, 18, UNI_COPTICEPACTNUMBERS } /* blk=copticepactnumbers */, - { 0, 9768, 9708, 4, 4, UNI_ORYA } /* scx=orya */, - { 3, 6205, 1025, 12, 2, -UNI_IDEO } /* ideographic=no */, - { 2, 184, 3241, 2, 8, UNI_GEOR } /* isgeorgian */, - { 0, 5746, 0, 6, 0, UNI_ebase_values_index } /* ebase= */, - { 3, 184, 34, 2, 3, UNI_EXT } /* isext */, - { 1, 10027, 8283, 3, 8, UNI_JG__SWASHKAF } /* jg=swashkaf */, - { 1, 184, 8990, 2, 6, UNI_RJNG } /* isrejang */, - { 4, 8780, 2836, 6, 19, UNI_MODIFIERTONELETTERS } /* block=modifiertoneletters */, - { 0, 184, 9620, 2, 4, UNI_LANA } /* islana */, - { 1, 5791, 10021, 13, 3, UNI_JG__GAF } /* joininggroup=gaf */, - { 18, 184, 3439, 2, 18, UNI_SMALLKANAEXT } /* issmallkanaextension */, - { 1, 10132, 1194, 3, 2, UNI_LB__LF } /* wb=lf */, - { 9, 9071, 9836, 4, 4, UNI_XPOSIXXDIGIT } /* hex=true */, - { 0, 1417, 7930, 24, 2, UNI_CCC__14 } /* canonicalcombiningclass=14 */, - { 8, 9277, 8442, 3, 7, UNI_SC__HANO } /* sc=hanunoo */, - { 1, 6231, 1879, 3, 18, UNI_CJKCOMPATIDEOGRAPHS } /* incjkcompatideographs */, - { 1, 6469, 5040, 12, 5, UNI_NT__DI } /* numerictype=digit */, - { 0, 2032, 10135, 22, 3, UNI__PERL_NCHAR } /* noncharactercodepoint=yes */, - { 1, 5986, 9364, 13, 4, UNI_NV__1_SLASH_10 } /* numericvalue=1/10 */, - { 16, 3904, 1, 17, 1, -UNI_UIDEO } /* unifiedideograph=n */, - { 11, 5791, 7045, 13, 2, UNI_JG__FE } /* joininggroup=fe */, - { 17, 9584, 0, 4, 0, UNI_HLUW } /* hluw */, - { 4, 113, 0, 35, 0, UNI_DIACRITICALSFORSYMBOLS } /* combiningdiacriticalmarksforsymbols */, - { 1, 5791, 9044, 13, 6, UNI_JG__YUDHHE } /* joininggroup=yudhhe */, - { 0, 7318, 7782, 10, 1, UNI_IN__3 } /* presentin=3 */, - { 3, 9508, 8066, 4, 2, UNI_CCC__28 } /* ccc=28 */, - { 6, 9277, 9740, 3, 4, 
UNI_SC__QAAI } /* sc=qaai */, - { 0, 9508, 8831, 4, 3, UNI_CCC__132 } /* ccc=132 */, - { 8, 184, 4289, 2, 16, UNI_MYANMAREXTB } /* ismyanmarextendedb */, - { 1, 9488, 7058, 4, 10, UNI_ARABICEXTA } /* blk=arabicexta */, - { 8, 6553, 9836, 12, 4, UNI_XIDC } /* xidcontinue=true */, - { 0, 9556, 8139, 4, 8, UNI_WB__EB } /* gcb=ebasegaz */, - { 1, 7291, 0, 4, 0, UNI_SOGD } /* sogd */, - { 0, 5986, 9907, 13, 3, UNI_NV__1_SLASH_7 } /* numericvalue=1/7 */, - { 2, 7028, 2309, 3, 5, UNI_YIJING } /* isyijing */, - { 97, 9768, 8900, 4, 6, UNI_KTHI } /* scx=kaithi */, - { 0, 9768, 7308, 4, 10, UNI_PHNX } /* scx=phoenician */, - { 0, 10027, 5895, 3, 13, UNI_JG__MANICHAEANONE } /* jg=manichaeanone */, - { 0, 10003, 9255, 3, 5, -UNI_CI } /* ci=false */, - { 44, 3751, 0, 17, 0, UNI_KITS } /* khitansmallscript */, - { 3, 8780, 8344, 6, 7, UNI_INBENGALI } /* block=bengali */, - { 0, 8780, 7666, 6, 9, UNI_INOLDTURKIC } /* block=oldturkic */, - { 34, 7218, 6179, 10, 2, UNI_LB__WJ } /* linebreak=wj */, - { 0, 3836, 9828, 17, 4, UNI_THAI } /* scriptextensions=thai */, - { 0, 9488, 8299, 4, 8, UNI_INTIFINAGH } /* blk=tifinagh */, - { 2, 8780, 4097, 6, 16, UNI_HIGHPUSURROGATES } /* block=highpusurrogates */, - { 0, 8780, 3547, 6, 17, UNI_ALCHEMICAL } /* block=alchemicalsymbols */, - { 0, 7325, 9400, 3, 4, UNI_IN__13 } /* in=13.0 */, - { 0, 2760, 24, 19, 1, UNI_GCB__L } /* hangulsyllabletype=l */, - { 8, 4113, 1751, 3, 2, UNI_INVAI } /* invai */, - { 3, 4916, 9821, 3, 3, UNI_TFNG } /* istfng */, - { 0, 4033, 7, 16, 1, UNI_C } /* generalcategory=c */, - { 0, 184, 630, 3, 29, UNI_CJKEXTE } /* iscjkunifiedideographsextensione */, - { 0, 9345, 10135, 5, 3, UNI_XIDC } /* xidc=yes */, - { 0, 9488, 8547, 4, 7, UNI_OLCK } /* blk=olchiki */, - { 33, 9768, 9532, 4, 4, UNI_CYRL } /* scx=cyrl */, - { 0, 6939, 0, 4, 0, UNI_SORA } /* sora */, - { 3, 10033, 6686, 3, 11, UNI_LB__IN } /* lb=inseparable */, - { 0, 8400, 9836, 7, 4, UNI_COMPEX } /* compex=true */, - { 6, 8978, 3, 6, 1, -UNI__PERL_PATWS } /* 
patws=f */, - { 2, 9488, 446, 4, 32, UNI_IDEOGRAPHICSYMBOLS } /* blk=ideographicsymbolsandpunctuation */, - { 0, 7138, 0, 10, 0, UNI_COMPATJAMO } /* compatjamo */, - { 0, 4989, 1, 3, 41, UNI_UCASEXT } /* isunifiedcanadianaboriginalsyllabicsextended */, - { 1, 184, 3385, 2, 17, UNI_RI } /* isregionalindicator */, - { 0, 5508, 1025, 14, 2, -UNI_PATSYN } /* patternsyntax=no */, - { 6, 10290, 3379, 6, 5, UNI_XPOSIXSPACE } /* xposixspace */, - { 0, 184, 2409, 2, 13, UNI_GLAGOLITICSUP } /* isglagoliticsup */, - { 0, 9508, 7814, 4, 1, UNI_CCC__7 } /* ccc=7 */, - { 8, 8561, 0, 7, 0, UNI_OSMA } /* osmanya */, - { 14, 7438, 6193, 10, 12, UNI_LB__HL } /* wordbreak=hebrewletter */, - { 2, 184, 8203, 2, 8, UNI_JAMOEXTA } /* isjamoexta */, - { 5, 1166, 36, 26, 1, UNI_DI } /* defaultignorablecodepoint=t */, - { 7, 8774, 9255, 6, 5, -UNI_BIDIM } /* bidim=false */, - { 9, 7088, 24, 10, 1, UNI_BC__L } /* bidiclass=l */, - { 24, 9277, 8936, 3, 4, UNI_LYCI } /* sc=lyci */, - { 0, 9277, 8914, 5, 4, UNI_SC__KHOJ } /* sc=khojki */, - { 0, 9528, 3, 4, 1, -UNI_CWU } /* cwu=f */, - { 0, 4033, 262, 16, 2, UNI_SM } /* generalcategory=sm */, - { 2, 6609, 1025, 11, 2, -UNI_DEP } /* deprecated=no */, - { 0, 9768, 7684, 4, 4, UNI_PAUC } /* scx=pauc */, - { 4, 7325, 5648, 3, 2, UNI_IN__10 } /* in=10 */, - { 1, 9997, 18, 3, 1, UNI_BC__R } /* bc=r */, - { 30, 9085, 0, 5, 0, UNI_BATK } /* batak */, - { 1, 184, 2409, 2, 10, UNI_GLAG } /* isglagolitic */, - { 0, 9768, 2608, 4, 6, UNI_BRAH } /* scx=brahmi */, - { 0, 8780, 8299, 6, 8, UNI_INTIFINAGH } /* block=tifinagh */, - { 1, 8780, 6025, 6, 12, UNI_ALPHABETICPF } /* block=alphabeticpf */, - { 4, 119, 8877, 3, 5, UNI_INGOTHIC } /* ingothic */, - { 0, 10024, 32, 3, 2, UNI__PERL_SURROGATE } /* gc=cs */, - { 45, 3115, 0, 10, 0, UNI_DEVA } /* devanagari */, - { 0, 9270, 6506, 3, 7, UNI_PHAISTOS } /* inphaistos */, - { 14, 184, 4145, 2, 7, UNI_LINB } /* islinearb */, - { 3, 9508, 9126, 5, 4, UNI_CCC__19 } /* ccc=ccc19 */, - { 0, 10033, 6073, 3, 12, 
UNI_LB__SY } /* lb=breaksymbols */, - { 0, 9277, 2912, 3, 9, UNI_SUND } /* sc=sundanese */, - { 1, 3259, 0, 17, 0, UNI_IDSB } /* idsbinaryoperator */, - { 0, 3836, 2245, 17, 11, UNI_MTEI } /* scriptextensions=meeteimayek */, - { 1, 1856, 0, 22, 0, UNI_cwu_values_index } /* changeswhenuppercased= */, - { 6, 24, 0, 1, 0, UNI_L } /* l */, - { 2, 184, 4643, 2, 14, UNI_ECOMP } /* isemojicomponent */, - { 1, 7218, 8449, 10, 6, UNI_LB__HY } /* linebreak=hyphen */, - { 1, 10048, 9408, 3, 4, UNI_NV__15_SLASH_2 } /* nv=15/2 */, - { 1, 7028, 5219, 3, 9, UNI_YIRADICALS } /* isyiradicals */, - { 5, 7076, 9096, 3, 4, UNI_INBUHID } /* inbuhid */, - { 1, 184, 7632, 3, 2, UNI_CWT } /* iscwt */, - { 34, 9277, 9760, 3, 4, UNI_SAMR } /* sc=samr */, - { 3, 9488, 3223, 4, 18, UNI_INPUNCTUATION } /* blk=generalpunctuation */, - { 12, 7088, 1353, 10, 3, UNI_BC__RLE } /* bidiclass=rle */, - { 1, 8780, 3044, 7, 17, UNI_HALFMARKS } /* block=combininghalfmarks */, - { 0, 21, 7428, 2, 10, UNI_INWARANGCITI } /* inwarangciti */, - { 19, 1417, 9946, 24, 3, UNI_CCC__DB } /* canonicalcombiningclass=233 */, - { 1, 184, 1922, 2, 12, UNI_DIACRITICALS } /* isdiacriticals */, - { 0, 9768, 9728, 4, 4, UNI_MIAO } /* scx=plrd */, - { 2, 9768, 8344, 4, 7, UNI_BENG } /* scx=bengali */, - { 1, 9326, 1183, 4, 3, UNI_ANY } /* unicode */, - { 23, 8589, 7359, 8, 3, UNI_SAUR } /* script=saur */, - { 12, 5752, 0, 13, 0, UNI_GREEKEXT } /* greekextended */, - { 0, 4542, 3243, 4, 9, UNI_GEORGIANSUP } /* ingeorgiansup */, - { 4, 4658, 0, 14, 0, UNI_GREXT } /* graphemeextend */, - { 0, 9275, 9090, 5, 5, UNI_INSC__BINDU } /* insc=bindu */, - { 0, 2308, 0, 6, 0, UNI_YIJING } /* yijing */, - { 1, 9277, 8561, 3, 7, UNI_OSMA } /* sc=osmanya */, - { 0, 3358, 0, 9, 0, UNI_Z } /* separator */, - { 0, 8589, 9604, 7, 4, UNI_KHMR } /* script=khmr */, - { 1, 2529, 0, 19, 0, UNI_TERM } /* terminalpunctuation */, - { 1, 10027, 6337, 3, 12, UNI_JG__MALAYALAMNYA } /* jg=malayalamnya */, - { 1, 3259, 1025, 18, 2, -UNI_IDSB } /* 
idsbinaryoperator=no */, - { 0, 184, 5687, 2, 13, UNI_BLOCKELEMENTS } /* isblockelements */, - { 8, 8984, 0, 6, 0, UNI_qmark_values_index } /* qmark= */, - { 8, 4688, 8540, 15, 7, UNI_IDENTIFIERTYPE__NOTNFKC } /* identifiertype=notnfkc */, - { 2, 10132, 73, 3, 2, UNI_WB__EB } /* wb=em */, - { 1, 7438, 7612, 10, 9, UNI_WB__MB } /* wordbreak=midnumlet */, - { 1, 9692, 0, 4, 0, UNI_NSHU } /* nshu */, - { 14, 1966, 7328, 22, 10, UNI_INSC__PUREKILLER } /* indicsyllabiccategory=purekiller */, - { 19, 8589, 1677, 7, 5, UNI_SC__LATN } /* script=latin */, - { 1, 9488, 9656, 4, 4, UNI_INMIAO } /* blk=miao */, - { 18, 10126, 3522, 3, 7, UNI_VO__U } /* vo=upright */, - { 0, 2569, 3522, 20, 7, UNI_VO__U } /* verticalorientation=upright */, - { 0, 3836, 3241, 17, 8, UNI_GEOR } /* scriptextensions=georgian */, - { 17, 9768, 7428, 4, 10, UNI_WARA } /* scx=warangciti */, - { 2, 8688, 8093, 4, 6, UNI_ARMN } /* isarmenian */, - { 0, 7218, 340, 10, 2, UNI_LB__OP } /* linebreak=op */, - { 0, 184, 838, 2, 29, UNI_MISCARROWS } /* ismiscellaneoussymbolsandarrows */, - { 12, 5791, 6361, 13, 12, UNI_JG__MALAYALAMTTA } /* joininggroup=malayalamtta */, - { 0, 8984, 0, 5, 0, UNI_QMARK } /* qmark */, - { 3, 10003, 3, 3, 1, -UNI_CI } /* ci=f */, - { 1, 3836, 3894, 18, 10, UNI_SGNW } /* scriptextensions=signwriting */, - { 0, 3424, 8316, 3, 7, UNI_INUGARITIC } /* inugaritic */, - { 0, 184, 2120, 3, 20, UNI_CJKRADICALSSUP } /* iscjkradicalssupplement */, - { 102, 8780, 6730, 6, 11, UNI_KATAKANAEXT } /* block=katakanaext */, - { 0, 9071, 0, 4, 0, UNI_hex_values_index } /* hex= */, - { 4, 9508, 8820, 4, 2, UNI_CCC__29 } /* ccc=29 */, - { 2, 4829, 2411, 4, 8, UNI_INGLAGOLITIC } /* inglagolitic */, - { 1, 8780, 3439, 6, 18, UNI_SMALLKANAEXT } /* block=smallkanaextension */, - { 0, 7318, 7979, 10, 3, UNI_IN__6 } /* presentin=6.0 */, - { 0, 3836, 2061, 17, 4, UNI_MODI } /* scriptextensions=modi */, - { 10, 9290, 26, 5, 1, UNI_MATH } /* math=y */, - { 1, 9444, 10093, 4, 3, UNI_AGE__4_DOT_1 } /* age=v41 
*/, - { 16, 7418, 1025, 10, 2, -UNI_XPOSIXUPPER } /* uppercase=no */, - { 0, 8780, 630, 7, 29, UNI_CJKEXTE } /* block=cjkunifiedideographsextensione */, - { 11, 10327, 7438, 6, 4, UNI_POSIXWORD } /* isperlword */, - { 10, 184, 38, 2, 2, UNI_XPOSIXDIGIT } /* isnd */, - { 1, 1188, 4929, 3, 4, UNI_INTAMIL } /* intamil */, - { 0, 9508, 3572, 4, 5, UNI_CCC__B } /* ccc=below */, - { 0, 5986, 9420, 13, 4, UNI_NV__3_SLASH_20 } /* numericvalue=3/20 */, - { 11, 10063, 1025, 3, 2, -UNI_SD } /* sd=no */, - { 36, 3853, 9836, 17, 4, UNI_STERM } /* sentenceterminal=true */, - { 17, 3870, 0, 17, 0, UNI_SMALLFORMS } /* smallformvariants */, - { 0, 4916, 5994, 3, 3, UNI_TALU } /* istalu */, - { 1, 5791, 5326, 13, 14, UNI_JG__MANICHAEANBETH } /* joininggroup=manichaeanbeth */, - { 3, 2280, 9311, 3, 4, UNI_OGAM } /* isogham */, - { 0, 1417, 9108, 24, 2, UNI_CCC__15 } /* canonicalcombiningclass=15 */, - { 0, 10048, 5648, 3, 7, UNI_NV__1000000 } /* nv=1000000 */, - { 1, 9488, 6730, 4, 11, UNI_KATAKANAEXT } /* blk=katakanaext */, - { 0, 8884, 1025, 4, 2, -UNI_EXT } /* ext=no */, - { 4, 6231, 3667, 3, 16, UNI_CYRILLICEXTC } /* incyrillicextendedc */, - { 54, 10009, 8533, 3, 7, UNI_DT__NB } /* dt=nobreak */, - { 13, 9768, 9888, 4, 4, UNI_ZANB } /* scx=zanb */, - { 0, 10296, 8576, 3, 5, UNI_PATSYN } /* ispatsyn */, - { 20, 4478, 0, 4, 0, UNI_BRAI } /* brai */, - { 0, 4033, 6265, 16, 12, UNI_NL } /* generalcategory=letternumber */, - { 1, 9488, 8365, 4, 7, UNI_CJKEXTC } /* blk=cjkextc */, - { 4, 7318, 7765, 10, 1, UNI_IN__2 } /* presentin=2 */, - { 0, 5116, 36, 14, 1, UNI_EMOD } /* emojimodifier=t */, - { 0, 2569, 3379, 4, 5, UNI_VERTSPACE } /* vertspace */, - { 0, 8996, 10135, 6, 3, UNI_STERM } /* sterm=yes */, - { 0, 5687, 0, 13, 0, UNI_BLOCKELEMENTS } /* blockelements */, - { 1, 9488, 8645, 4, 7, UNI_INTAITHAM } /* blk=taitham */, - { 2, 10303, 0, 5, 0, UNI_XPOSIXBLANK } /* blank */, - { 0, 8589, 9500, 7, 4, UNI_SC__CAKM } /* script=cakm */, - { 0, 8589, 9245, 7, 4, UNI_SC__DOGR } /* 
script=dogr */, - { 0, 5986, 8750, 13, 6, UNI_NV__800000 } /* numericvalue=800000 */, - { 0, 3904, 10135, 17, 3, UNI_UIDEO } /* unifiedideograph=yes */, - { 2, 3836, 3079, 17, 4, UNI_COPT } /* scriptextensions=copt */, - { 1, 9768, 6253, 4, 5, UNI_KHMR } /* scx=khmer */, - { 1, 8996, 1025, 6, 2, -UNI_STERM } /* sterm=no */, - { 64, 9768, 8990, 4, 6, UNI_RJNG } /* scx=rejang */, - { 1, 1188, 9331, 3, 4, UNI_INTAILE } /* intaile */, - { 5, 8780, 7278, 6, 10, UNI_INOLDPERSIAN } /* block=oldpersian */, - { 1, 8774, 3, 6, 1, -UNI_BIDIM } /* bidim=f */, - { 0, 4809, 1162, 4, 2, UNI_CPRT } /* iscprt */, - { 0, 9508, 8837, 4, 3, UNI_WB__EB } /* ccc=133 */, - { 8, 10033, 6193, 3, 12, UNI_LB__HL } /* lb=hebrewletter */, - { 1, 10048, 9428, 3, 3, UNI_NV__3_SLASH_8 } /* nv=3/8 */, - { 1, 8519, 0, 7, 0, UNI_nfkdqc_values_index } /* nfkdqc= */, - { 8, 9488, 7248, 4, 10, UNI_MISCARROWS } /* blk=miscarrows */, - { 32, 184, 4002, 3, 15, UNI_CYPRIOTSYLLABARY } /* iscypriotsyllabary */, - { 0, 1966, 5700, 22, 13, UNI_INSC__CONSONANTDEAD } /* indicsyllabiccategory=consonantdead */, - { 0, 1834, 36, 22, 1, UNI_CWT } /* changeswhentitlecased=t */, - { 121, 9277, 8091, 3, 8, UNI_ARMN } /* sc=armenian */, - { 6, 10048, 8727, 3, 2, UNI_NV__32 } /* nv=32 */, - { 0, 1505, 1016, 5, 2, UNI_INGREEK } /* ingreek */, - { 1, 3836, 4448, 17, 5, UNI_BAMU } /* scriptextensions=bamum */, - { 2, 9488, 113, 4, 35, UNI_DIACRITICALSFORSYMBOLS } /* blk=combiningdiacriticalmarksforsymbols */, - { 1, 8942, 0, 6, 0, UNI_LYDI } /* lydian */, - { 3, 9277, 9476, 3, 4, UNI_AVST } /* sc=avst */, - { 0, 7418, 1, 10, 1, -UNI_XPOSIXUPPER } /* uppercase=n */, - { 6, 9488, 719, 4, 16, UNI_CUNEIFORMNUMBERS } /* blk=cuneiformnumbers */, - { 0, 4853, 10135, 15, 3, UNI_DT__NONE } /* nfkdquickcheck=yes */, - { 0, 8589, 8666, 7, 7, UNI_SC__TIRH } /* script=tirhuta */, - { 4, 184, 328, 2, 21, UNI_MATHOPERATORS } /* ismathematicaloperators */, - { 1, 184, 600, 3, 29, UNI_CJKEXTD } /* iscjkunifiedideographsextensiond */, - { 0, 
9488, 6193, 4, 6, UNI_INHEBREW } /* blk=hebrew */, - { 3, 8780, 720, 7, 8, UNI_INCUNEIFORM } /* block=cuneiform */, - { 9, 9508, 6631, 4, 11, UNI_CCC__DA } /* ccc=doubleabove */, - { 0, 4628, 3, 15, 1, UNI_EA__F } /* eastasianwidth=f */, - { 9, 9488, 1060, 4, 27, UNI_OCR } /* blk=opticalcharacterrecognition */, - { 0, 8589, 9440, 7, 4, UNI_SC__ADLM } /* script=adlm */, - { 9, 10296, 7309, 3, 9, UNI_PHNX } /* isphoenician */, - { 4, 184, 3853, 2, 16, UNI_STERM } /* issentenceterminal */, - { 9, 9277, 9496, 3, 4, UNI_SC__BUHD } /* sc=buhd */, - { 25, 10027, 0, 3, 0, UNI_jg_values_index } /* jg= */, - { 4, 3836, 6193, 17, 6, UNI_HEBR } /* scriptextensions=hebrew */, - { 0, 3097, 1417, 18, 9, UNI_DT__CAN } /* decompositiontype=canonical */, - { 1, 7076, 7514, 3, 8, UNI_INBHAIKSUKI } /* inbhaiksuki */, - { 3, 3836, 7359, 18, 3, UNI_SAUR } /* scriptextensions=saur */, - { 1, 3836, 9728, 17, 4, UNI_MIAO } /* scriptextensions=plrd */, - { 0, 3836, 8876, 17, 6, UNI_GOTH } /* scriptextensions=gothic */, - { 0, 1273, 3, 21, 1, -UNI_CE } /* compositionexclusion=f */, - { 5, 3836, 8547, 17, 7, UNI_OLCK } /* scriptextensions=olchiki */, - { 2, 9768, 4385, 4, 4, UNI_TANG } /* scx=tang */, - { 5, 9997, 25, 3, 1, UNI_BC__S } /* bc=s */, - { 0, 6229, 26, 12, 1, UNI_JOINC } /* joincontrol=y */, - { 61, 10048, 8051, 3, 8, UNI_NV__5_SLASH_6 } /* nv=8.33e-01 */, - { 7, 9014, 9255, 6, 5, -UNI_UIDEO } /* uideo=false */, - { 32, 9768, 7292, 5, 6, UNI_SOGD } /* scx=sogdian */, - { 2, 3151, 26, 18, 1, UNI_EPRES } /* emojipresentation=y */, - { 3, 8589, 8131, 7, 4, UNI_SC__DUPL } /* script=dupl */, - { 1, 7218, 2640, 10, 2, UNI_LB__BA } /* linebreak=ba */, - { 1, 8780, 5843, 6, 9, UNI_INMALAYALAM } /* block=malayalam */, - { 17, 4916, 8667, 3, 3, UNI_TIRH } /* istirh */, - { 0, 5324, 330, 4, 19, UNI_MATHOPERATORS } /* inmathematicaloperators */, - { 7, 1417, 8820, 24, 2, UNI_CCC__29 } /* canonicalcombiningclass=29 */, - { 7, 4916, 9833, 3, 3, UNI_TIBT } /* istibt */, - { 0, 9508, 8714, 4, 2, 
UNI_CCC__30 } /* ccc=30 */, - { 0, 9277, 8645, 3, 7, UNI_LANA } /* sc=taitham */, - { 17, 6229, 9255, 12, 5, -UNI_JOINC } /* joincontrol=false */, - { 2, 4033, 5438, 16, 14, UNI_SK } /* generalcategory=modifiersymbol */, - { 8, 7218, 10154, 10, 2, UNI_LB__B2 } /* linebreak=b2 */, - { 0, 47, 0, 1, 0, UNI_M } /* m */, - { 3, 10333, 9797, 3, 3, UNI_SYRC } /* issyrc */, - { 9, 184, 8211, 2, 8, UNI_JAMOEXTB } /* isjamoextb */, - { 1, 10168, 0, 2, 0, UNI_CASEDLETTER } /* l& */, - { 0, 9277, 9880, 3, 4, UNI_SC__YI } /* sc=yiii */, - { 0, 8589, 7657, 7, 9, UNI_SC__PERM } /* script=oldpermic */, - { 2, 9488, 2409, 4, 20, UNI_GLAGOLITICSUP } /* blk=glagoliticsupplement */, - { 1, 184, 7188, 2, 10, UNI_KHAR } /* iskharoshthi */, - { 4, 184, 9529, 3, 2, UNI_CWU } /* iscwu */, - { 71, 8147, 10135, 8, 3, UNI_EXTPICT } /* extpict=yes */, - { 6, 7325, 7923, 3, 3, UNI_IN__4 } /* in=4.0 */, - { 0, 1417, 9949, 24, 3, UNI_CCC__DA } /* canonicalcombiningclass=234 */, - { 5, 10291, 1823, 5, 5, UNI_POSIXLOWER } /* posixlower */, - { 0, 2224, 6973, 3, 10, UNI_INSYLOTINAGRI } /* insylotinagri */, - { 3, 7076, 4449, 3, 7, UNI_BAMUMSUP } /* inbamumsup */, - { 21, 9768, 9038, 4, 6, UNI_YEZI } /* scx=yezidi */, - { 22, 9476, 0, 4, 0, UNI_AVST } /* avst */, - { 0, 8780, 3223, 6, 18, UNI_INPUNCTUATION } /* block=generalpunctuation */, - { 6, 9488, 8428, 4, 7, UNI_INGRANTHA } /* blk=grantha */, - { 0, 7325, 7877, 3, 2, UNI_IN__13 } /* in=13 */, - { 2, 5578, 5, 15, 1, UNI_SB__SE } /* sentencebreak=se */, - { 3, 9508, 9188, 4, 2, UNI_CCC__31 } /* ccc=31 */, - { 7, 9488, 8358, 4, 7, UNI_CJKEXTB } /* blk=cjkextb */, - { 0, 9277, 9624, 3, 3, UNI_LAO } /* sc=lao */, - { 0, 184, 9548, 2, 4, UNI_DSRT } /* isdsrt */, - { 96, 7325, 10111, 3, 3, UNI_IN__6_DOT_2 } /* in=v62 */, - { 10, 9508, 8823, 5, 5, UNI_CCC__130 } /* ccc=ccc130 */, - { 32, 9488, 1561, 4, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* blk=supsymbolsandpictographs */, - { 0, 10340, 25, 3, 1, UNI_VS } /* isvs */, - { 0, 5032, 36, 14, 1, 
UNI_POSIXXDIGIT } /* asciihexdigit=t */, - { 0, 9524, 9836, 4, 4, UNI_CWT } /* cwt=true */, - { 19, 7438, 10015, 10, 3, UNI_WB__EB } /* wordbreak=ebg */, - { 5, 10048, 8059, 3, 8, UNI_NV__1_SLASH_12 } /* nv=8.33e-02 */, - { 4, 10290, 1823, 6, 5, UNI_XPOSIXLOWER } /* xposixlower */, - { 1, 5739, 3, 13, 1, -UNI_GRBASE } /* graphemebase=f */, - { 0, 184, 5242, 2, 14, UNI_LATINEXTC } /* islatinextendedc */, - { 48, 3379, 3, 6, 1, -UNI_XPOSIXSPACE } /* space=f */, - { 1, 10024, 38, 3, 2, UNI_XPOSIXDIGIT } /* gc=nd */, - { 0, 10027, 6346, 3, 3, UNI_JG__NYA } /* jg=nya */, - { 2, 2224, 8276, 3, 7, UNI_SPECIALS } /* inspecials */, - { 2, 8780, 7308, 6, 10, UNI_INPHOENICIAN } /* block=phoenician */, - { 3, 8780, 8337, 6, 7, UNI_INAVESTAN } /* block=avestan */, - { 0, 9488, 4401, 4, 9, UNI_TANGUTSUP } /* blk=tangutsup */, - { 9, 8780, 7098, 6, 10, UNI_BOXDRAWING } /* block=boxdrawing */, - { 0, 10048, 9168, 3, 2, UNI_NV__27 } /* nv=27 */, - { 6, 4916, 1846, 3, 4, UNI_TITLE } /* istitle */, - { 2, 184, 9896, 2, 4, UNI_ZYYY } /* iszyyy */, - { 1, 184, 3241, 2, 18, UNI_GEORGIANSUP } /* isgeorgiansupplement */, - { 18, 10048, 9188, 3, 2, UNI_NV__31 } /* nv=31 */, - { 0, 10033, 1751, 3, 2, UNI_LB__AI } /* lb=ai */, - { 0, 10048, 8744, 3, 5, UNI_NV__70000 } /* nv=70000 */, - { 2, 10012, 1, 3, 1, UNI_EA__N } /* ea=n */, - { 0, 1269, 36, 25, 1, UNI_COMPEX } /* fullcompositionexclusion=t */, - { 0, 3836, 9789, 18, 3, UNI_SHRD } /* scriptextensions=shrd */, - { 32, 9540, 26, 4, 1, UNI_DIA } /* dia=y */, - { 27, 1552, 0, 9, 0, UNI_gc_values_index } /* category= */, - { 0, 9488, 5947, 4, 13, UNI_MAYANNUMERALS } /* blk=mayannumerals */, - { 1, 7438, 1218, 10, 8, UNI_WB__KA } /* wordbreak=katakana */, - { 0, 2329, 0, 20, 0, UNI_HLUW } /* anatolianhieroglyphs */, - { 1, 10027, 5312, 3, 14, UNI_JG__MANICHAEANAYIN } /* jg=manichaeanayin */, - { 0, 7318, 7469, 10, 3, UNI_IN__5 } /* presentin=5.0 */, - { 0, 1417, 8829, 25, 5, UNI_CCC__132 } /* canonicalcombiningclass=ccc132 */, - { 26, 3097, 
68, 18, 3, UNI_DT__SUP } /* decompositiontype=sup */, - { 20, 9240, 36, 5, 1, UNI_DASH } /* dash=t */, - { 11, 8780, 600, 7, 29, UNI_CJKEXTD } /* block=cjkunifiedideographsextensiond */, - { 1, 8780, 9656, 6, 4, UNI_INMIAO } /* block=miao */, - { 20, 9997, 10039, 3, 3, UNI_BC__LRI } /* bc=lri */, - { 0, 7325, 10114, 3, 3, UNI_IN__6_DOT_3 } /* in=v63 */, - { 6, 5986, 9376, 13, 3, UNI_NV__1_SLASH_6 } /* numericvalue=1/6 */, - { 0, 184, 9688, 2, 4, UNI_NKO } /* isnkoo */, - { 0, 8780, 9245, 6, 5, UNI_INDOGRA } /* block=dogra */, - { 5, 1417, 7826, 24, 2, UNI_CCC__12 } /* canonicalcombiningclass=12 */, - { 1, 8589, 9724, 7, 4, UNI_PHNX } /* script=phnx */, - { 0, 5791, 7711, 13, 9, UNI_JG__SYRIACWAW } /* joininggroup=syriacwaw */, - { 0, 58, 0, 4, 0, UNI_IDEO } /* ideo */, - { 2, 8780, 9860, 6, 3, UNI_INVAI } /* block=vai */, - { 1, 9508, 5765, 4, 13, UNI_CCC__IS } /* ccc=iotasubscript */, - { 0, 9768, 7694, 5, 8, UNI_SAMR } /* scx=samaritan */, - { 0, 9277, 2684, 3, 19, UNI_EGYP } /* sc=egyptianhieroglyphs */, - { 2, 5324, 6399, 4, 10, UNI_MATHALPHANUM } /* inmathalphanum */, - { 0, 2784, 29, 4, 4, UNI_INARABIC } /* inarabic */, - { 0, 2608, 0, 4, 0, UNI_BRAH } /* brah */, - { 0, 4658, 10135, 15, 3, UNI_GREXT } /* graphemeextend=yes */, - { 5, 9488, 5843, 4, 9, UNI_INMALAYALAM } /* blk=malayalam */, - { 6, 1417, 7178, 24, 10, UNI_CCC__6 } /* canonicalcombiningclass=hanreading */, - { 0, 4643, 9836, 15, 4, UNI_ECOMP } /* emojicomponent=true */, - { 2, 10033, 4842, 3, 2, UNI_LB__QU } /* lb=qu */, - { 0, 9768, 7630, 4, 9, UNI_TALU } /* scx=newtailue */, - { 0, 9508, 8825, 4, 3, UNI_CCC__130 } /* ccc=130 */, - { 0, 9488, 895, 4, 28, UNI_SUPPUAA } /* blk=supplementaryprivateuseareaa */, - { 5, 3836, 9876, 17, 4, UNI_XSUX } /* scriptextensions=xsux */, - { 1, 184, 9095, 2, 5, UNI_BUHD } /* isbuhid */, - { 0, 9277, 859, 4, 3, UNI_SC__KNDA } /* sc=knda */, - { 0, 5324, 6279, 4, 5, UNI_MAHJONG } /* inmahjong */, - { 0, 4553, 0, 15, 0, UNI_CONTROLPICTURES } /* controlpictures 
*/, - { 0, 5986, 9904, 13, 3, UNI_NV__1_SLASH_5 } /* numericvalue=1/5 */, - { 2, 3424, 8674, 3, 6, UNI_UCASEXT } /* inucasext */, - { 5, 8589, 9624, 7, 3, UNI_LAO } /* script=lao */, - { 17, 8589, 8421, 7, 7, UNI_ELYM } /* script=elymaic */, - { 1, 184, 3633, 3, 16, UNI_CYRILLICEXTA } /* iscyrillicextendeda */, - { 7, 8589, 9616, 7, 4, UNI_SC__KTHI } /* script=kthi */, - { 0, 9488, 6818, 4, 11, UNI_MYANMAREXTA } /* blk=myanmarexta */, - { 10, 1834, 9255, 22, 5, -UNI_CWT } /* changeswhentitlecased=false */, - { 1, 1828, 9836, 6, 4, UNI_CASED } /* cased=true */, - { 0, 9444, 7827, 4, 3, UNI_AGE__2 } /* age=2.0 */, - { 0, 9277, 493, 3, 3, UNI_SC__HAN } /* sc=han */, - { 194, 184, 2245, 2, 14, UNI_MEETEIMAYEKEXT } /* ismeeteimayekext */, - { 0, 1552, 48, 9, 1, UNI_P } /* category=p */, - { 1, 9768, 3115, 4, 4, UNI_DEVA } /* scx=deva */, - { 0, 10333, 44, 3, 1, UNI_SK } /* issk */, - { 0, 7218, 8236, 11, 7, UNI_LB__LF } /* linebreak=linefeed */, - { 1, 9277, 7693, 3, 9, UNI_SAMR } /* sc=samaritan */, - { 18, 5986, 7755, 13, 8, UNI_NV__1_SLASH_9 } /* numericvalue=1.11e-01 */, - { 7, 184, 4049, 2, 11, UNI_GEORGIANEXT } /* isgeorgianext */, - { 2, 8960, 9295, 6, 5, UNI_NFCQC__M } /* nfcqc=maybe */, - { 4, 9014, 9836, 6, 4, UNI_UIDEO } /* uideo=true */, - { 16, 10048, 7890, 3, 2, UNI_NV__33 } /* nv=33 */, - { 0, 8589, 5171, 7, 4, UNI_CHAM } /* script=cham */, - { 3, 5791, 4763, 13, 15, UNI_JG__MANICHAEANSADHE } /* joininggroup=manichaeansadhe */, - { 0, 10048, 8714, 3, 6, UNI_NV__300000 } /* nv=300000 */, - { 1, 9277, 9732, 3, 4, UNI_PRTI } /* sc=prti */, - { 1, 8780, 5075, 7, 13, UNI_CJKCOMPATFORMS } /* block=cjkcompatforms */, - { 20, 184, 690, 3, 29, UNI_CJKEXTG } /* iscjkunifiedideographsextensiong */, - { 1, 184, 5522, 2, 14, UNI_PHONETICEXTSUP } /* isphoneticextsup */, - { 34, 7248, 0, 10, 0, UNI_MISCARROWS } /* miscarrows */, - { 3, 1966, 8687, 22, 7, UNI_INSC__VISARGA } /* indicsyllabiccategory=visarga */, - { 17, 9508, 8835, 5, 5, UNI_WB__EB } /* ccc=ccc133 */, - { 
9, 9283, 0, 4, 0, UNI_PHLI } /* phli */, - { 0, 9624, 0, 4, 0, UNI_LAO } /* laoo */, - { 6, 10333, 7359, 3, 3, UNI_SAUR } /* issaur */, - { 0, 6469, 495, 12, 7, UNI_NT__NU } /* numerictype=numeric */, - { 1, 184, 727, 2, 2, UNI_MN } /* ismn */, - { 51, 10033, 58, 3, 2, UNI_LB__ID } /* lb=id */, - { 1, 9488, 9624, 4, 3, UNI_INLAO } /* blk=lao */, - { 1, 1988, 3, 22, 1, -UNI_LOE } /* logicalorderexception=f */, - { 0, 1513, 0, 24, 0, UNI_HIGHPUSURROGATES } /* highprivateusesurrogates */, - { 8, 1552, 1025, 9, 2, UNI_NO } /* category=no */, - { 1, 9768, 8428, 4, 7, UNI_GRAN } /* scx=grantha */, - { 1, 10048, 8075, 3, 8, UNI_NV__7_SLASH_8 } /* nv=8.75e-01 */, - { 0, 8780, 7621, 6, 9, UNI_INNABATAEAN } /* block=nabataean */, - { 0, 184, 1274, 3, 19, UNI_CE } /* iscompositionexclusion */, - { 0, 5791, 1511, 13, 3, UNI_JG__HAH } /* joininggroup=hah */, - { 0, 9277, 9808, 3, 4, UNI_TALU } /* sc=talu */, - { 2, 4033, 1059, 16, 2, UNI_SO } /* generalcategory=so */, - { 17, 6554, 9836, 11, 4, UNI_IDC } /* idcontinue=true */, - { 3, 3836, 4883, 17, 15, UNI_SARB } /* scriptextensions=oldsoutharabian */, - { 8, 184, 2122, 2, 7, UNI_RADICAL } /* isradical */, - { 1, 7325, 7826, 3, 2, UNI_IN__12 } /* in=12 */, - { 17, 7158, 10135, 10, 3, UNI_DIA } /* diacritic=yes */, - { 1, 8589, 7168, 7, 10, UNI_DIAK } /* script=divesakuru */, - { 0, 9330, 0, 5, 0, UNI_TALE } /* taile */, - { 1, 1417, 8066, 24, 2, UNI_CCC__28 } /* canonicalcombiningclass=28 */, - { 0, 10296, 7438, 7, 4, UNI_POSIXWORD } /* isposixword */, - { 2, 184, 1033, 2, 11, UNI_ENCLOSEDCJK } /* isenclosedcjk */, - { 34, 7368, 0, 10, 0, UNI_SMALLFORMS } /* smallforms */, - { 4, 184, 9900, 2, 4, UNI_ZZZZ } /* iszzzz */, - { 3, 10027, 4748, 3, 15, UNI_JG__MANICHAEANGIMEL } /* jg=manichaeangimel */, - { 9, 3836, 6409, 17, 4, UNI_MEND } /* scriptextensions=mend */, - { 0, 10012, 8, 3, 1, UNI_EA__A } /* ea=a */, - { 0, 1834, 1025, 22, 2, -UNI_CWT } /* changeswhentitlecased=no */, - { 2, 7155, 4674, 3, 14, UNI_INHANGUL } /* 
ishangulsyllables */, - { 128, 10033, 3985, 3, 16, UNI_LB__CL } /* lb=closepunctuation */, - { 7, 10132, 495, 3, 7, UNI_WB__NU } /* wb=numeric */, - { 0, 1, 0, 1, 0, UNI_N } /* n */, - { 131, 5986, 8710, 13, 3, UNI_NV__600 } /* numericvalue=600 */, - { 0, 9768, 6193, 4, 6, UNI_HEBR } /* scx=hebrew */, - { 1, 1115, 0, 4, 0, UNI_HANG } /* hang */, - { 0, 1417, 9121, 25, 4, UNI_CCC__18 } /* canonicalcombiningclass=ccc18 */, - { 0, 7325, 7931, 3, 3, UNI_IN__4_DOT_1 } /* in=4.1 */, - { 0, 9277, 8610, 3, 4, UNI_SIDD } /* sc=sidd */, - { 0, 184, 3115, 2, 18, UNI_DEVANAGARIEXT } /* isdevanagariextended */, - { 2, 9277, 2240, 4, 3, UNI_SC__KTHI } /* sc=kthi */, - { 0, 5986, 7891, 13, 8, UNI_NV__1_SLASH_3 } /* numericvalue=3.33e-01 */, - { 0, 7218, 8251, 10, 8, UNI_LB__NL } /* linebreak=nextline */, - { 3, 9768, 9896, 4, 4, UNI_ZYYY } /* scx=zyyy */, - { 0, 7218, 6217, 10, 12, UNI_LB__IS } /* linebreak=infixnumeric */, - { 4, 9277, 9756, 3, 4, UNI_RUNR } /* sc=runr */, - { 8, 9488, 9008, 4, 6, UNI_INTHAANA } /* blk=thaana */, - { 0, 6409, 0, 12, 0, UNI_MEND } /* mendekikakui */, - { 0, 4305, 0, 5, 0, UNI_C } /* other */, - { 0, 7325, 8043, 3, 3, UNI_IN__8 } /* in=8.0 */, - { 1, 9277, 9480, 3, 4, UNI_BATK } /* sc=batk */, - { 0, 8589, 9608, 7, 4, UNI_KITS } /* script=kits */, - { 3, 3785, 0, 4, 0, UNI_MANI } /* mani */, - { 0, 9660, 0, 4, 0, UNI_MLYM } /* mlym */, - { 9, 6061, 36, 12, 1, UNI_BIDIC } /* bidicontrol=t */, - { 1, 9652, 0, 4, 0, UNI_MERC } /* merc */, - { 0, 10024, 4568, 3, 14, UNI_SC } /* gc=currencysymbol */, - { 168, 1856, 1025, 22, 2, -UNI_CWU } /* changeswhenuppercased=no */, - { 0, 9488, 2203, 4, 14, UNI_INHANIFIROHINGYA } /* blk=hanifirohingya */, - { 2, 184, 8435, 2, 6, UNI_GRBASE } /* isgrbase */, - { 4, 8688, 5033, 3, 4, UNI_ASCII } /* isascii */, - { 9, 9768, 4478, 4, 7, UNI_BRAI } /* scx=braille */, - { 0, 9768, 8547, 4, 7, UNI_OLCK } /* scx=olchiki */, - { 4, 7648, 0, 9, 0, UNI_ITAL } /* olditalic */, - { 0, 9277, 8942, 3, 4, UNI_LYDI } /* sc=lydi 
*/, - { 19, 1552, 4245, 9, 10, UNI_SM } /* category=mathsymbol */, - { 0, 8589, 8547, 7, 7, UNI_OLCK } /* script=olchiki */, - { 1, 10132, 6917, 3, 11, UNI_WB__SQ } /* wb=singlequote */, - { 1, 8780, 8936, 6, 6, UNI_INLYCIAN } /* block=lycian */, - { 1, 9488, 4257, 4, 16, UNI_MISCMATHSYMBOLSB } /* blk=miscmathsymbolsb */, - { 3, 4033, 4305, 16, 5, UNI_C } /* generalcategory=other */, - { 0, 8780, 9065, 6, 5, UNI_INADLAM } /* block=adlam */, - { 0, 8780, 9340, 6, 5, UNI_VSSUP } /* block=vssup */, - { 0, 10236, 10220, 14, 11, UNI__PERL_FOLDS_TO_MULTI_CHAR } /* _perl_folds_to_multi_char */, - { 1, 3836, 4385, 17, 4, UNI_TANG } /* scriptextensions=tang */, - { 2, 10048, 8002, 3, 2, UNI_NV__26 } /* nv=26 */, - { 1, 6884, 0, 11, 0, UNI_HMNG } /* pahawhhmong */, - { 10, 2288, 2076, 4, 4, UNI_INHATRAN } /* inhatran */, - { 32, 184, 5200, 2, 14, UNI_KANASUP } /* iskanasupplement */, - { 33, 3097, 45, 18, 6, UNI_DT__COM } /* decompositiontype=compat */, - { 0, 7218, 3969, 10, 16, UNI_LB__CP } /* linebreak=closeparenthesis */, - { 16, 7318, 9967, 10, 3, UNI_IN__5_DOT_1 } /* presentin=5.1 */, - { 0, 2032, 9255, 22, 5, -UNI__PERL_NCHAR } /* noncharactercodepoint=false */, - { 9, 1417, 7877, 24, 2, UNI_CCC__13 } /* canonicalcombiningclass=13 */, - { 11, 9997, 865, 3, 2, UNI_BC__WS } /* bc=ws */, - { 1, 184, 5713, 2, 13, UNI_XPOSIXDIGIT } /* isdecimalnumber */, - { 4, 3836, 3115, 17, 4, UNI_DEVA } /* scriptextensions=deva */, - { 0, 8780, 2120, 7, 13, UNI_CJKRADICALSSUP } /* block=cjkradicalssup */, - { 38, 9488, 3341, 4, 8, UNI_DINGBATS } /* blk=dingbats */, - { 0, 5158, 0, 14, 0, UNI_INGREEK } /* greekandcoptic */, - { 0, 3079, 0, 4, 0, UNI_COPT } /* copt */, - { 0, 8589, 9032, 7, 6, UNI_WCHO } /* script=wancho */, - { 0, 9277, 5171, 3, 4, UNI_CHAM } /* sc=cham */, - { 0, 9277, 9724, 3, 4, UNI_PHNX } /* sc=phnx */, - { 0, 9860, 0, 3, 0, UNI_VAI } /* vai */, - { 4, 184, 7248, 2, 10, UNI_MISCARROWS } /* ismiscarrows */, - { 68, 7738, 10135, 9, 3, UNI_XIDS } /* xidstart=yes */, - 
{ 21, 184, 567, 2, 2, UNI_NB } /* isnb */, - { 8, 1417, 9216, 25, 4, UNI_CCC__84 } /* canonicalcombiningclass=ccc84 */, - { 0, 21, 3421, 2, 4, UNI_RUMI } /* inrumi */, - { 0, 4448, 0, 5, 0, UNI_BAMU } /* bamum */, - { 1, 8589, 9460, 7, 4, UNI_ARMI } /* script=armi */, - { 0, 7325, 7821, 3, 1, UNI_IN__8 } /* in=8 */, - { 4, 9768, 4448, 4, 4, UNI_BAMU } /* scx=bamu */, - { 16, 9488, 6012, 4, 13, UNI_VERTICALFORMS } /* blk=verticalforms */, - { 34, 8589, 9728, 7, 4, UNI_MIAO } /* script=plrd */, - { 0, 9444, 9397, 4, 3, UNI_AGE__2_DOT_1 } /* age=2.1 */, - { 0, 719, 0, 30, 0, UNI_CUNEIFORMNUMBERS } /* cuneiformnumbersandpunctuation */, - { 0, 9768, 3169, 4, 4, UNI_ETHI } /* scx=ethi */, - { 0, 8780, 2010, 6, 22, UNI_MISCTECHNICAL } /* block=miscellaneoustechnical */, - { 0, 10126, 0, 3, 0, UNI_vo_values_index } /* vo= */, - { 7, 1988, 9836, 22, 4, UNI_LOE } /* logicalorderexception=true */, - { 2, 8589, 57, 7, 2, UNI_SC__YI } /* script=yi */, - { 0, 8400, 1025, 7, 2, -UNI_COMPEX } /* compex=no */, - { 1, 3836, 8666, 17, 4, UNI_TIRH } /* scriptextensions=tirh */, - { 1, 10060, 0, 3, 0, UNI_ri_values_index } /* ri= */, - { 1, 8449, 0, 7, 0, UNI_hyphen_values_index } /* hyphen= */, - { 0, 9488, 6829, 4, 11, UNI_MYANMAREXTB } /* blk=myanmarextb */, - { 0, 5578, 8554, 14, 7, UNI_SB__LE } /* sentencebreak=oletter */, - { 50, 6231, 3633, 3, 16, UNI_CYRILLICEXTA } /* incyrillicextendeda */, - { 4, 10033, 10174, 3, 2, UNI_LB__XX } /* lb=xx */, - { 0, 184, 9236, 3, 3, UNI_CWCM } /* iscwcm */, - { 1, 3836, 8414, 17, 4, UNI_ELBA } /* scriptextensions=elba */, - { 0, 184, 6277, 2, 7, UNI_MAHJONG } /* ismahjong */, - { 0, 5791, 6906, 13, 11, UNI_JG__ROHINGYAYEH } /* joininggroup=rohingyayeh */, + { 2, 9474, 729, 5, 6, UNI_INSC__NUMBER } /* insc=number */, + { 0, 10553, 1177, 3, 3, UNI_SORA } /* issora */, + { 0, 9731, 0, 3, 0, UNI_CWT } /* cwt */, + { 3, 7580, 7772, 10, 9, UNI_WB__MB } /* wordbreak=midnumlet */, + { 0, 9711, 9028, 5, 5, UNI_WB__EB } /* ccc=ccc133 */, + { 0, 9087, 
9454, 6, 5, -UNI_JOINC } /* joinc=false */, + { 1, 10011, 0, 4, 0, UNI_TAGS } /* tags */, + { 0, 218, 0, 33, 0, UNI_DIACRITICALSEXT } /* combiningdiacriticalmarksextended */, + { 0, 9476, 9519, 3, 5, UNI_OSGE } /* sc=osage */, + { 1, 8973, 5771, 6, 13, UNI_BLOCKELEMENTS } /* block=blockelements */, + { 1, 3121, 2593, 18, 8, UNI_DT__VERT } /* decompositiontype=vertical */, + { 0, 9691, 1007, 4, 17, UNI_ANCIENTGREEKMUSIC } /* blk=ancientgreekmusic */, + { 0, 6083, 8108, 13, 8, UNI_NV__9_SLASH_2 } /* numericvalue=4.50e+00 */, + { 0, 9979, 9207, 4, 4, UNI_THAA } /* scx=thaa */, + { 2, 185, 5758, 2, 12, UNI_BIDIM } /* isbidimirrored */, + { 0, 5116, 1026, 14, 2, -UNI_CI } /* caseignorable=no */, + { 5, 9214, 10055, 5, 4, UNI_IDEO } /* ideo=true */, + { 2, 7060, 10355, 11, 3, UNI_SD } /* softdotted=yes */, + { 2, 8973, 3463, 6, 18, UNI_SMALLKANAEXT } /* block=smallkanaextension */, + { 1, 6340, 8545, 3, 6, UNI_CJKEXTA } /* incjkexta */, + { 0, 10247, 7490, 3, 10, UNI_JG__REVERSEDPE } /* jg=reversedpe */, + { 0, 9979, 6924, 5, 3, UNI_SAMR } /* scx=samr */, + { 1, 4847, 2880, 3, 18, UNI_MONGOLIANSUP } /* inmongoliansupplement */, + { 0, 9979, 10027, 4, 4, UNI_TAVT } /* scx=tavt */, + { 1, 10244, 48, 3, 1, UNI_M } /* gc=m */, + { 0, 9979, 9529, 4, 5, UNI_TALE } /* scx=taile */, + { 2, 9476, 9183, 3, 6, UNI_RJNG } /* sc=rejang */, + { 0, 10268, 8068, 3, 8, UNI_NV__7_SLASH_2 } /* nv=3.50e+00 */, + { 2, 1836, 0, 22, 0, UNI_cwl_values_index } /* changeswhenlowercased= */, + { 3, 4909, 26, 15, 1, UNI_DT__NONE } /* nfkdquickcheck=y */, + { 2, 1537, 0, 4, 0, UNI_SIND } /* sind */, + { 1, 3391, 1, 18, 1, -UNI__PERL_PATWS } /* patternwhitespace=n */, + { 0, 6506, 0, 12, 0, UNI_MATHALPHANUM } /* mathalphanum */, + { 2, 9459, 0, 5, 0, UNI_idsb_values_index } /* idsb= */, + { 0, 7230, 2473, 10, 20, UNI_BC__LRE } /* bidiclass=lefttorightembedding */, + { 2, 1990, 3085, 22, 18, UNI_INSC__CONSONANTSUBJOINED } /* indicsyllabiccategory=consonantsubjoined */, + { 0, 9469, 2573, 5, 12, 
UNI_INPC__TOPANDBOTTOM } /* inpc=topandbottom */, + { 5, 10244, 4026, 3, 16, UNI_PE } /* gc=closepunctuation */, + { 1, 9476, 4314, 3, 7, UNI_SC__MYMR } /* sc=myanmar */, + { 1, 185, 4610, 3, 14, UNI_CONTROLPICTURES } /* iscontrolpictures */, + { 7, 8973, 3139, 6, 13, UNI_DEVANAGARIEXT } /* block=devanagariext */, + { 0, 185, 7500, 2, 10, UNI_SAUR } /* issaurashtra */, + { 0, 185, 4669, 2, 15, UNI_DIACRITICALSSUP } /* isdiacriticalssup */, + { 8, 9691, 5326, 4, 14, UNI_LATINEXTE } /* blk=latinextendede */, + { 0, 7297, 6430, 3, 3, UNI_HMNG } /* ishmng */, + { 0, 6697, 10055, 11, 4, UNI_XPOSIXALPHA } /* alphabetic=true */, + { 0, 10226, 26, 3, 1, UNI_DI } /* di=y */, + { 1, 9691, 7826, 4, 9, UNI_INOLDTURKIC } /* blk=oldturkic */, + { 1, 6083, 7948, 13, 8, UNI_NV__1_SLASH_7 } /* numericvalue=1.43e-01 */, + { 0, 9979, 2453, 4, 20, UNI_PHLI } /* scx=inscriptionalpahlavi */, + { 12, 9691, 9117, 4, 6, UNI_INLEPCHA } /* blk=lepcha */, + { 0, 9979, 9033, 4, 6, UNI_CAKM } /* scx=chakma */, + { 2, 185, 750, 2, 21, UNI_ENCLOSEDALPHANUM } /* isenclosedalphanumerics */, + { 0, 4074, 4026, 16, 16, UNI_PE } /* generalcategory=closepunctuation */, + { 3, 6083, 9560, 13, 3, UNI_NV__1_SLASH_2 } /* numericvalue=1/2 */, + { 0, 7300, 10055, 10, 4, UNI_DIA } /* diacritic=true */, + { 1, 7467, 10316, 3, 3, UNI_IN__5 } /* in=v50 */, + { 1, 185, 3894, 2, 16, UNI_STERM } /* issentenceterminal */, + { 21, 2803, 0, 19, 0, UNI_idst_values_index } /* idstrinaryoperator= */, + { 0, 9691, 8544, 4, 7, UNI_CJKEXTA } /* blk=cjkexta */, + { 2, 10247, 4266, 3, 16, UNI_JG__MANICHAEANTWENTY } /* jg=manichaeantwenty */, + { 0, 7460, 7995, 10, 2, UNI_IN__12 } /* presentin=12 */, + { 6, 8782, 9524, 7, 5, UNI_RUNR } /* script=runic */, + { 1, 9075, 36, 6, 1, UNI_GREXT } /* grext=t */, + { 5, 185, 2012, 2, 21, UNI_LOE } /* islogicalorderexception */, + { 0, 9979, 9651, 4, 4, UNI_AGHB } /* scx=aghb */, + { 5, 6340, 2691, 4, 9, UNI_COUNTINGROD } /* incountingrod */, + { 0, 1538, 2573, 24, 20, 
UNI_INPC__TOPANDBOTTOMANDRIGHT } /* indicpositionalcategory=topandbottomandright */, + { 1, 2584, 0, 4, 0, UNI_MAND } /* mand */, + { 3, 7297, 1194, 3, 25, UNI_HALFANDFULLFORMS } /* ishalfwidthandfullwidthforms */, + { 1, 9476, 9683, 3, 4, UNI_BATK } /* sc=batk */, + { 1, 5045, 1892, 3, 8, UNI_XPOSIXUPPER } /* isuppercase */, + { 1, 3121, 10286, 18, 3, UNI_DT__SML } /* decompositiontype=sml */, + { 3, 9476, 3826, 3, 4, UNI_SC__MANI } /* sc=mani */, + { 1, 6350, 7400, 12, 10, UNI_JT__U } /* joiningtype=nonjoining */, + { 1, 9691, 4106, 4, 16, UNI_HALFANDFULLFORMS } /* blk=halfandfullforms */, + { 0, 3406, 1026, 3, 2, -UNI_CE } /* ce=no */, + { 0, 10268, 8907, 3, 4, UNI_NV__3000 } /* nv=3000 */, + { 1, 6083, 8028, 13, 8, UNI_NV__20000000 } /* numericvalue=20000000 */, + { 8, 9691, 8420, 4, 8, UNI_INMAHAJANI } /* blk=mahajani */, + { 2, 9691, 8600, 4, 7, UNI_DSRT } /* blk=deseret */, + { 1, 185, 5326, 2, 14, UNI_LATINEXTE } /* islatinextendede */, + { 0, 9476, 3265, 3, 8, UNI_SC__GEOR } /* sc=georgian */, + { 0, 10268, 8028, 3, 2, UNI_NV__20 } /* nv=20 */, + { 2, 9691, 7330, 4, 10, UNI_INKHAROSHTHI } /* blk=kharoshthi */, + { 2, 10470, 10485, 15, 5, UNI__PERL_CHARNAME_BEGIN } /* _perl_charname_begin */, + { 4, 6529, 9515, 3, 4, UNI_INORIYA } /* inoriya */, + { 0, 10244, 6983, 3, 11, UNI_LO } /* gc=otherletter */, + { 0, 21, 7754, 2, 9, UNI_LATINEXTG } /* inlatinextg */, + { 1, 5029, 0, 15, 0, UNI_VEDICEXT } /* vedicextensions */, + { 2, 10352, 4401, 3, 9, UNI_WB__EB } /* wb=emodifier */, + { 7, 9476, 8356, 3, 4, UNI_SC__HIRA } /* sc=hira */, + { 2, 185, 5368, 2, 4, UNI_LISU } /* islisu */, + { 1, 3175, 0, 18, 0, UNI_epres_values_index } /* emojipresentation= */, + { 1, 10268, 8119, 3, 1, UNI_NV__9 } /* nv=9 */, + { 4, 3877, 8348, 17, 8, UNI_GURU } /* scriptextensions=gurmukhi */, + { 5, 9051, 9454, 6, 5, -UNI_ECOMP } /* ecomp=false */, + { 1, 8973, 1443, 7, 9, UNI_CJKSYMBOLS } /* block=cjksymbols */, + { 3, 9979, 58, 4, 2, UNI_YI } /* scx=yi */, + { 1, 1553, 9706, 9, 
2, UNI_MC } /* category=mc */, + { 1, 7460, 0, 10, 0, UNI_in_values_index } /* presentin= */, + { 0, 8691, 0, 7, 0, UNI_MULT } /* multani */, + { 1, 10123, 0, 4, 0, UNI_ZZZZ } /* zzzz */, + { 3, 9434, 0, 5, 0, UNI_cwcm_values_index } /* cwcm= */, + { 1, 9711, 9024, 4, 3, UNI_CCC__132 } /* ccc=132 */, + { 16, 7060, 10055, 11, 4, UNI_SD } /* softdotted=true */, + { 0, 3877, 79, 17, 6, UNI_ARAB } /* scriptextensions=arabic */, + { 30, 9476, 10019, 3, 4, UNI_TALU } /* sc=talu */, + { 0, 10510, 63, 6, 5, UNI_XPOSIXGRAPH } /* xposixgraph */, + { 6, 10247, 5420, 3, 4, UNI_JG__BETH } /* jg=beth */, + { 2, 185, 8284, 2, 8, UNI_BASS } /* isbassavah */, + { 6, 4598, 3267, 4, 9, UNI_GEORGIANSUP } /* ingeorgiansup */, + { 1, 8782, 9799, 7, 4, UNI_HMNP } /* script=hmnp */, + { 7, 7510, 0, 10, 0, UNI_SMALLFORMS } /* smallforms */, + { 0, 8754, 0, 7, 0, UNI_OSMA } /* osmanya */, + { 0, 7460, 10334, 10, 3, UNI_IN__6_DOT_3 } /* presentin=v63 */, + { 0, 5408, 6388, 4, 5, UNI_MAHJONG } /* inmahjong */, + { 1, 9711, 9407, 4, 2, UNI_CCC__35 } /* ccc=35 */, + { 1, 8973, 2765, 6, 19, UNI_JAMOEXTB } /* block=hanguljamoextendedb */, + { 0, 5662, 496, 14, 2, UNI_SB__NU } /* sentencebreak=nu */, + { 13, 9476, 9117, 3, 6, UNI_LEPC } /* sc=lepcha */, + { 10, 8973, 44, 7, 25, UNI_CJKCOMPATIDEOGRAPHS } /* block=cjkcompatibilityideographs */, + { 0, 8973, 2879, 6, 19, UNI_MONGOLIANSUP } /* block=mongoliansupplement */, + { 0, 185, 4534, 2, 7, UNI_BRAI } /* isbraille */, + { 0, 3877, 1116, 17, 4, UNI_HANG } /* scriptextensions=hang */, + { 1, 9979, 9859, 4, 4, UNI_MERC } /* scx=merc */, + { 0, 10268, 8156, 3, 8, UNI_NV__5_SLASH_8 } /* nv=6.25e-01 */, + { 3, 9647, 7950, 4, 1, UNI_AGE__4 } /* age=4 */, + { 3, 2808, 1396, 4, 22, UNI_ARABICPFB } /* inarabicpresentationformsb */, + { 0, 9691, 5227, 4, 4, UNI_INCHAM } /* blk=cham */, + { 2, 1990, 5784, 22, 13, UNI_INSC__CONSONANTDEAD } /* indicsyllabiccategory=consonantdead */, + { 9, 7580, 8516, 10, 7, UNI_WB__LE } /* wordbreak=aletter */, + { 1, 8961, 
26, 6, 1, UNI_BIDIC } /* bidic=y */, + { 2, 10268, 9307, 3, 2, UNI_NV__15 } /* nv=15 */, + { 2, 2304, 7422, 4, 8, UNI_XPEO } /* isoldpersian */, + { 5, 9979, 9201, 4, 4, UNI_TELU } /* scx=telu */, + { 1, 10352, 126, 3, 2, UNI_LB__CR } /* wb=cr */, + { 1, 6340, 6207, 3, 11, UNI_CYRILLICEXTB } /* incyrillicextb */, + { 3, 9979, 8537, 4, 4, UNI_BENG } /* scx=beng */, + { 1, 3877, 9883, 17, 4, UNI_NARB } /* scriptextensions=narb */, + { 0, 10247, 6455, 3, 3, UNI_JG__NYA } /* jg=nya */, + { 1, 9691, 8775, 4, 7, UNI_INPHAGSPA } /* blk=phagspa */, + { 1, 4972, 4427, 3, 15, UNI_TANGUTCOMPONENTS } /* istangutcomponents */, + { 2, 10533, 3403, 7, 5, UNI_XPOSIXBLANK } /* ishorizspace */, + { 0, 9691, 8824, 4, 7, UNI_SUPPUAB } /* blk=suppuab */, + { 2, 8881, 3964, 4, 14, UNI_ARABICSUP } /* isarabicsupplement */, + { 2, 7655, 0, 9, 0, UNI_BHKS } /* bhaiksuki */, + { 3, 9927, 0, 3, 0, UNI_PCM } /* pcm */, + { 2, 6340, 2165, 3, 10, UNI_CYRILLICSUP } /* incyrillicsup */, + { 1, 9057, 9454, 6, 5, -UNI_EMOJI } /* emoji=false */, + { 3, 1880, 1026, 22, 2, -UNI_CWU } /* changeswhenuppercased=no */, + { 0, 9691, 7310, 4, 10, UNI_INDIVESAKURU } /* blk=divesakuru */, + { 2, 6362, 0, 5, 0, UNI_KHMR } /* khmer */, + { 5, 6158, 3, 12, 1, -UNI_BIDIC } /* bidicontrol=f */, + { 3, 4074, 4954, 16, 15, UNI_PS } /* generalcategory=openpunctuation */, + { 3, 3877, 4504, 17, 4, UNI_BAMU } /* scriptextensions=bamu */, + { 2, 5408, 6388, 4, 10, UNI_MAHJONG } /* inmahjongtiles */, + { 4, 185, 9779, 2, 4, UNI_GUJR } /* isgujr */, + { 0, 8973, 79, 6, 10, UNI_ARABICMATH } /* block=arabicmath */, + { 3, 10352, 8698, 3, 7, UNI_WB__NL } /* wb=newline */, + { 0, 1418, 9022, 25, 5, UNI_CCC__132 } /* canonicalcombiningclass=ccc132 */, + { 8, 5875, 7341, 14, 9, UNI_JG__KNOTTEDHEH } /* joininggroup=knottedheh */, + { 0, 4894, 0, 16, 0, UNI_NFKCQC__N } /* nfkcquickcheck=n */, + { 0, 2689, 0, 11, 0, UNI_COUNTINGROD } /* countingrod */, + { 0, 9979, 3936, 5, 3, UNI_SGNW } /* scx=sgnw */, + { 0, 10217, 23, 3, 2, 
UNI_BC__AL } /* bc=al */, + { 2, 10253, 21, 3, 2, UNI_LB__IN } /* lb=in */, + { 2, 8973, 2332, 6, 21, UNI_YIJING } /* block=yijinghexagramsymbols */, + { 0, 3403, 10355, 6, 3, UNI_XPOSIXSPACE } /* space=yes */, + { 0, 185, 85, 2, 4, UNI_MATH } /* ismath */, + { 1, 3877, 3936, 18, 3, UNI_SGNW } /* scriptextensions=sgnw */, + { 3, 9979, 10119, 4, 4, UNI_ZYYY } /* scx=zyyy */, + { 1, 5256, 0, 7, 0, UNI_KANASUP } /* kanasup */, + { 0, 9077, 1026, 4, 2, -UNI_EXT } /* ext=no */, + { 12, 8593, 10355, 7, 3, UNI_COMPEX } /* compex=yes */, + { 0, 8684, 0, 7, 0, UNI_MARC } /* marchen */, + { 0, 9461, 1891, 3, 5, UNI_SB__UP } /* sb=upper */, + { 0, 10349, 26, 3, 1, UNI_VS } /* vs=y */, + { 0, 9476, 2936, 3, 9, UNI_SUND } /* sc=sundanese */, + { 0, 2248, 897, 3, 27, UNI_SUPPUAA } /* insupplementaryprivateuseareaa */, + { 0, 9190, 1026, 5, 2, -UNI_TERM } /* term=no */, + { 4, 9476, 8691, 3, 4, UNI_SC__MULT } /* sc=mult */, + { 3, 7467, 8036, 3, 3, UNI_IN__3_DOT_1 } /* in=3.1 */, + { 1, 2593, 0, 20, 0, UNI_vo_values_index } /* verticalorientation= */, + { 0, 2206, 5830, 21, 5, UNI_WB__EB } /* graphemeclusterbreak=ebase */, + { 1, 8782, 10027, 7, 4, UNI_TAVT } /* script=tavt */, + { 2, 3391, 0, 17, 0, UNI__PERL_PATWS } /* patternwhitespace */, + { 3, 10553, 8790, 3, 6, UNI_SHRD } /* issharada */, + { 0, 3877, 7844, 17, 9, UNI_PALM } /* scriptextensions=palmyrene */, + { 0, 5823, 0, 12, 0, UNI_GRBASE } /* graphemebase */, + { 4, 185, 1034, 2, 11, UNI_ENCLOSEDCJK } /* isenclosedcjk */, + { 0, 7460, 8119, 10, 1, UNI_IN__9 } /* presentin=9 */, + { 2, 10346, 0, 3, 0, UNI_vo_values_index } /* vo= */, + { 1, 6593, 0, 4, 0, UNI_HUNG } /* hung */, + { 0, 10253, 496, 3, 7, UNI_LB__NU } /* lb=numeric */, + { 1, 185, 7261, 3, 9, UNI_CHRS } /* ischorasmian */, + { 0, 9831, 0, 4, 0, UNI_LAO } /* laoo */, + { 0, 1538, 4671, 4, 13, UNI_DIACRITICALSSUP } /* indiacriticalssup */, + { 0, 185, 5901, 2, 13, UNI_KANAEXTB } /* iskanaextendedb */, + { 0, 3103, 0, 18, 0, UNI_COPTICEPACTNUMBERS } /* 
copticepactnumbers */, + { 1, 8670, 0, 7, 0, UNI_MAKA } /* makasar */, + { 0, 8973, 2453, 6, 20, UNI_ININSCRIPTIONALPAHLAVI } /* block=inscriptionalpahlavi */, + { 0, 1553, 5014, 9, 15, UNI_UPPERCASELETTER } /* category=uppercaseletter */, + { 0, 8782, 4314, 7, 7, UNI_SC__MYMR } /* script=myanmar */, + { 3, 8973, 468, 6, 11, UNI_INPUNCTUATION } /* block=punctuation */, + { 9, 10268, 9612, 3, 3, UNI_NV__5_SLASH_2 } /* nv=5/2 */, + { 2, 8316, 0, 7, 0, UNI_EXTPICT } /* extpict */, + { 1, 8973, 2165, 7, 17, UNI_CYRILLICSUP } /* block=cyrillicsupplement */, + { 5, 5875, 6446, 13, 12, UNI_JG__MALAYALAMNYA } /* joininggroup=malayalamnya */, + { 0, 8973, 7330, 6, 10, UNI_INKHAROSHTHI } /* block=kharoshthi */, + { 3, 6182, 0, 12, 0, UNI_CHESSSYMBOLS } /* chesssymbols */, + { 2, 185, 9875, 2, 4, UNI_MTEI } /* ismtei */, + { 0, 10268, 5732, 3, 7, UNI_NV__1000000 } /* nv=1000000 */, + { 6, 6083, 9635, 13, 4, UNI_NV__5_SLASH_12 } /* numericvalue=5/12 */, + { 1, 9476, 9851, 3, 4, UNI_MEDF } /* sc=medf */, + { 2, 10247, 5564, 3, 14, UNI_JG__NOJOININGGROUP } /* jg=nojoininggroup */, + { 0, 185, 1793, 3, 20, UNI_CWCF } /* ischangeswhencasefolded */, + { 5, 10247, 6410, 3, 12, UNI_JG__MALAYALAMLLA } /* jg=malayalamlla */, + { 3, 9476, 9899, 3, 4, UNI_NSHU } /* sc=nshu */, + { 16, 9075, 1026, 6, 2, -UNI_GREXT } /* grext=no */, + { 4, 9691, 2227, 4, 14, UNI_INHANIFIROHINGYA } /* blk=hanifirohingya */, + { 0, 540, 0, 30, 0, UNI_CJKEXTB } /* cjkunifiedideographsextensionb */, + { 1, 9647, 7923, 4, 2, UNI_AGE__11 } /* age=11 */, + { 0, 10247, 6917, 3, 11, UNI_JG__MALAYALAMRA } /* jg=malayalamra */, + { 10, 9269, 1, 5, 1, -UNI_POSIXXDIGIT } /* ahex=n */, + { 1, 3877, 10004, 18, 3, UNI_SOGO } /* scriptextensions=sogo */, + { 0, 9476, 9959, 3, 4, UNI_RJNG } /* sc=rjng */, + { 1, 7360, 7410, 10, 10, UNI_LB__NS } /* linebreak=nonstarter */, + { 0, 3877, 7330, 17, 4, UNI_KHAR } /* scriptextensions=khar */, + { 3, 4847, 6962, 3, 10, UNI_MYANMAREXTB } /* inmyanmarextb */, + { 0, 6083, 8925, 13, 
3, UNI_NV__500 } /* numericvalue=500 */, + { 0, 6083, 9579, 13, 3, UNI_NV__1_SLASH_8 } /* numericvalue=1/8 */, + { 0, 10229, 7, 3, 3, UNI_DT__CAN } /* dt=can */, + { 0, 185, 6290, 2, 12, UNI_GONG } /* isgunjalagondi */, + { 0, 3877, 7817, 17, 9, UNI_PERM } /* scriptextensions=oldpermic */, + { 0, 9691, 9891, 4, 4, UNI_INNEWA } /* blk=newa */, + { 2, 7230, 103, 10, 2, UNI_BC__ET } /* bidiclass=et */, + { 3, 9691, 8586, 4, 7, UNI_CJKEXTG } /* blk=cjkextg */, + { 1, 9763, 407, 4, 7, UNI_GCB__CN } /* gcb=control */, + { 1, 10268, 8028, 3, 6, UNI_NV__200000 } /* nv=200000 */, + { 4, 6350, 6796, 12, 11, UNI_JT__D } /* joiningtype=dualjoining */, + { 0, 10283, 26, 3, 1, UNI_SD } /* sd=y */, + { 9, 3121, 1418, 18, 9, UNI_DT__CAN } /* decompositiontype=canonical */, + { 2, 9979, 8607, 4, 7, UNI_ELBA } /* scx=elbasan */, + { 1, 7360, 84, 10, 2, UNI_LB__CM } /* linebreak=cm */, + { 0, 5368, 0, 4, 0, UNI_LISU } /* lisu */, + { 0, 8444, 1, 8, 1, -UNI_RADICAL } /* radical=n */, + { 0, 6338, 9454, 12, 5, -UNI_JOINC } /* joincontrol=false */, + { 0, 10516, 5802, 7, 5, UNI_POSIXALNUM } /* isposixalnum */, + { 0, 8973, 1925, 7, 21, UNI_INDICNUMBERFORMS } /* block=commonindicnumberforms */, + { 0, 185, 5298, 2, 14, UNI_LATINEXTC } /* islatinextendedc */, + { 7, 79, 0, 10, 0, UNI_ARABICMATH } /* arabicmath */, + { 0, 3877, 2353, 17, 20, UNI_HLUW } /* scriptextensions=anatolianhieroglyphs */, + { 0, 9979, 7835, 4, 9, UNI_OUGR } /* scx=olduyghur */, + { 1, 9691, 1219, 4, 8, UNI_INKATAKANA } /* blk=katakana */, + { 1, 8492, 0, 7, 0, UNI_UCASEXT } /* ucasext */, + { 0, 7754, 0, 9, 0, UNI_LATINEXTG } /* latinextg */, + { 0, 3877, 9715, 17, 4, UNI_CHRS } /* scriptextensions=chrs */, + { 1, 9691, 8293, 5, 7, UNI_INBUGINESE } /* blk=buginese */, + { 0, 10229, 568, 3, 2, UNI_DT__NB } /* dt=nb */, + { 0, 7230, 23, 10, 2, UNI_BC__AL } /* bidiclass=al */, + { 1, 6158, 0, 11, 0, UNI_BIDIC } /* bidicontrol */, + { 1, 8782, 3049, 7, 8, UNI_CHER } /* script=cherokee */, + { 1, 4138, 0, 16, 0, 
UNI_HIGHPUSURROGATES } /* highpusurrogates */, + { 10, 5662, 5, 15, 1, UNI_SB__SE } /* sentencebreak=se */, + { 1, 9979, 383, 4, 4, UNI_EGYP } /* scx=egyp */, + { 0, 6083, 7990, 13, 1, UNI_NV__8 } /* numericvalue=8 */, + { 2, 6083, 10370, 13, 2, UNI_NV__48 } /* numericvalue=48 */, + { 1, 8973, 1034, 6, 11, UNI_ENCLOSEDCJK } /* block=enclosedcjk */, + { 0, 9711, 1780, 4, 2, UNI_CCC__BR } /* ccc=br */, + { 0, 3553, 0, 18, 0, UNI_vs_values_index } /* variationselector= */, + { 0, 9691, 2311, 4, 7, UNI_INSINHALA } /* blk=sinhala */, + { 1, 9691, 1014, 4, 5, UNI_INGREEK } /* blk=greek */, + { 4, 8973, 2936, 6, 12, UNI_SUNDANESESUP } /* block=sundanesesup */, + { 4, 9476, 8476, 3, 8, UNI_TFNG } /* sc=tifinagh */, + { 3, 7467, 10334, 3, 3, UNI_IN__6_DOT_3 } /* in=v63 */, + { 0, 4847, 2861, 3, 18, UNI_MODIFIERTONELETTERS } /* inmodifiertoneletters */, + { 0, 3877, 8300, 17, 8, UNI_DUPL } /* scriptextensions=duployan */, + { 0, 7230, 18, 10, 1, UNI_BC__R } /* bidiclass=r */, + { 0, 8973, 9129, 6, 6, UNI_INLYCIAN } /* block=lycian */, + { 0, 1418, 8179, 24, 2, UNI_CCC__36 } /* canonicalcombiningclass=36 */, + { 1, 1190, 11, 3, 2, UNI_NT__DI } /* nt=di */, + { 5, 10268, 7983, 3, 1, UNI_NV__7 } /* nv=7 */, + { 1, 9647, 10328, 4, 3, UNI_AGE__6_DOT_1 } /* age=v61 */, + { 12, 21, 9831, 2, 3, UNI_INLAO } /* inlao */, + { 1, 10247, 4218, 3, 16, UNI_JG__MANICHAEANDALETH } /* jg=manichaeandaleth */, + { 0, 7297, 1117, 3, 3, UNI_HANG } /* ishang */, + { 1, 9691, 1193, 4, 26, UNI_HALFANDFULLFORMS } /* blk=halfwidthandfullwidthforms */, + { 2, 10247, 5989, 3, 3, UNI_JG__NUN } /* jg=nun */, { 0, 11, 0, 3, 0, UNI_DIA } /* dia */, - { 1, 9488, 3547, 4, 10, UNI_ALCHEMICAL } /* blk=alchemical */, - { 0, 10060, 1025, 3, 2, -UNI_RI } /* ri=no */, - { 23, 8954, 9255, 6, 5, -UNI__PERL_NCHAR } /* nchar=false */, - { 11, 7738, 36, 9, 1, UNI_XIDS } /* xidstart=t */, - { 16, 1628, 0, 4, 0, UNI_PHAG } /* phag */, - { 0, 9488, 8351, 4, 7, UNI_CJKEXTA } /* blk=cjkexta */, - { 5, 4916, 9825, 3, 3, 
UNI_TGLG } /* istglg */, - { 2, 1417, 8835, 25, 5, UNI_WB__EB } /* canonicalcombiningclass=ccc133 */, - { 1, 184, 3650, 3, 16, UNI_CYRILLICEXTB } /* iscyrillicextendedb */, - { 7, 5986, 9372, 13, 3, UNI_NV__1_SLASH_4 } /* numericvalue=1/4 */, - { 1, 10033, 6178, 3, 2, UNI_LB__ZW } /* lb=zw */, - { 79, 1591, 3684, 3, 15, UNI_ETHIOPICEXT } /* inethiopicextended */, - { 0, 8780, 4673, 6, 15, UNI_INHANGUL } /* block=hangulsyllables */, - { 0, 4116, 2780, 3, 3, UNI_IDST } /* isidst */, - { 0, 8780, 3169, 6, 18, UNI_ETHIOPICSUP } /* block=ethiopicsupplement */, - { 195, 7325, 9991, 3, 3, UNI_IN__9 } /* in=9.0 */, - { 1, 1537, 2549, 24, 20, UNI_INPC__TOPANDBOTTOMANDRIGHT } /* indicpositionalcategory=topandbottomandright */, - { 2, 8589, 8888, 7, 4, UNI_HATR } /* script=hatr */, - { 24, 9225, 0, 5, 0, UNI_XPOSIXCNTRL } /* cntrl */, - { 17, 9768, 9568, 4, 4, UNI_GREK } /* scx=grek */, - { 0, 9290, 0, 5, 0, UNI_math_values_index } /* math= */, - { 0, 7218, 73, 10, 2, UNI_EMOD } /* linebreak=em */, - { 0, 10333, 8597, 3, 6, UNI_SHRD } /* issharada */, - { 1, 10129, 1025, 3, 2, -UNI_VS } /* vs=no */, - { 0, 184, 660, 3, 29, UNI_CJKEXTF } /* iscjkunifiedideographsextensionf */, - { 21, 9488, 6133, 4, 12, UNI_ETHIOPICEXTA } /* blk=ethiopicexta */, - { 0, 9768, 9038, 4, 4, UNI_YEZI } /* scx=yezi */, - { 0, 5791, 341, 13, 2, UNI_JG__PE } /* joininggroup=pe */, - { 3, 9346, 3, 4, 1, -UNI_IDC } /* idc=f */, - { 1, 9508, 8829, 5, 5, UNI_CCC__132 } /* ccc=ccc132 */, - { 8, 2032, 1, 22, 1, -UNI__PERL_NCHAR } /* noncharactercodepoint=n */, - { 0, 8780, 4129, 6, 9, UNI_LATIN1 } /* block=latin1sup */, - { 0, 184, 11, 2, 2, UNI_DI } /* isdi */, - { 5, 9230, 1025, 5, 2, -UNI_CWCF } /* cwcf=no */, - { 1, 10063, 10135, 3, 3, UNI_SD } /* sd=yes */, - { 3, 5986, 8059, 13, 8, UNI_NV__1_SLASH_12 } /* numericvalue=8.33e-02 */, - { 17, 10009, 68, 3, 3, UNI_DT__SUP } /* dt=sup */, - { 12, 9528, 10135, 4, 3, UNI_CWU } /* cwu=yes */, - { 0, 7318, 10093, 10, 3, UNI_IN__4_DOT_1 } /* presentin=v41 */, - 
{ 11, 184, 5228, 2, 14, UNI_LATINEXTB } /* islatinextendedb */, - { 32, 62, 0, 5, 0, UNI_XPOSIXGRAPH } /* graph */, - { 49, 3836, 8299, 17, 8, UNI_TFNG } /* scriptextensions=tifinagh */, - { 11, 9277, 9688, 3, 4, UNI_NKO } /* sc=nkoo */, - { 0, 184, 4273, 2, 16, UNI_MYANMAREXTA } /* ismyanmarextendeda */, - { 1, 10060, 26, 3, 1, UNI_RI } /* ri=y */, - { 19, 10310, 8661, 4, 5, UNI_INTIBETAN } /* intibetan */, - { 8, 9768, 2608, 4, 4, UNI_BRAH } /* scx=brah */, - { 0, 2288, 2743, 4, 17, UNI_JAMOEXTB } /* inhanguljamoextendedb */, - { 0, 8509, 1035, 4, 9, UNI_ENCLOSEDCJK } /* inenclosedcjk */, - { 0, 1273, 1025, 21, 2, -UNI_CE } /* compositionexclusion=no */, - { 0, 8894, 9836, 6, 4, UNI_JOINC } /* joinc=true */, - { 1, 9488, 7567, 4, 9, UNI_INKHUDAWADI } /* blk=khudawadi */, - { 6, 9556, 5585, 4, 2, UNI_WB__EB } /* gcb=eb */, - { 1, 3836, 2469, 17, 20, UNI_HMNP } /* scriptextensions=nyiakengpuachuehmong */, - { 0, 9768, 9892, 4, 4, UNI_QAAI } /* scx=zinh */, - { 1, 9444, 9844, 4, 4, UNI_AGE__11 } /* age=v110 */, - { 5, 9768, 4793, 4, 15, UNI_MERC } /* scx=meroiticcursive */, - { 16, 9275, 7328, 5, 10, UNI_INSC__PUREKILLER } /* insc=purekiller */, - { 2, 9488, 3547, 4, 17, UNI_ALCHEMICAL } /* blk=alchemicalsymbols */, - { 0, 9071, 1025, 4, 2, -UNI_XPOSIXXDIGIT } /* hex=no */, - { 1, 9277, 9696, 3, 4, UNI_OGAM } /* sc=ogam */, - { 2, 9768, 2684, 4, 19, UNI_EGYP } /* scx=egyptianhieroglyphs */, - { 3, 9536, 10135, 4, 3, UNI_DEP } /* dep=yes */, - { 7, 6554, 0, 11, 0, UNI_idc_values_index } /* idcontinue= */, - { 1, 7438, 5585, 10, 2, UNI_WB__EB } /* wordbreak=eb */, - { 3, 9768, 9820, 4, 4, UNI_TFNG } /* scx=tfng */, - { 0, 4033, 406, 16, 7, UNI_XPOSIXCNTRL } /* generalcategory=control */, - { 0, 8984, 3, 6, 1, -UNI_QMARK } /* qmark=f */, - { 0, 9768, 9335, 4, 5, UNI_TAKR } /* scx=takri */, - { 16, 8147, 0, 7, 0, UNI_EXTPICT } /* extpict */, - { 44, 4688, 1166, 15, 16, UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE } /* identifiertype=defaultignorable */, - { 0, 8780, 9624, 6, 3, 
UNI_INLAO } /* block=lao */, - { 24, 10027, 5944, 3, 3, UNI_JG__WAW } /* jg=waw */, - { 1, 3836, 8840, 17, 6, UNI_CAKM } /* scriptextensions=chakma */, - { 2, 8519, 0, 8, 0, UNI_NFKDQC__N } /* nfkdqc=n */, - { 2, 2182, 8139, 21, 8, UNI_WB__EB } /* graphemeclusterbreak=ebasegaz */, - { 5, 10024, 74, 3, 2, UNI_ME } /* gc=me */, - { 1, 9520, 1, 4, 1, -UNI_CWL } /* cwl=n */, - { 21, 10048, 8738, 3, 5, UNI_NV__60000 } /* nv=60000 */, - { 3, 10063, 36, 3, 1, UNI_SD } /* sd=t */, - { 0, 184, 1013, 2, 5, UNI_GREK } /* isgreek */, - { 2, 9240, 10135, 5, 3, UNI_DASH } /* dash=yes */, - { 14, 9768, 9832, 4, 4, UNI_TIBT } /* scx=tibt */, - { 0, 8780, 979, 6, 27, UNI_ALPHABETICPF } /* block=alphabeticpresentationforms */, - { 2, 8780, 3295, 6, 18, UNI_LATINEXTADDITIONAL } /* block=latinextadditional */, - { 0, 184, 779, 2, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* issymbolsandpictographsextendeda */, - { 0, 9488, 6961, 4, 11, UNI_SUPERANDSUB } /* blk=superandsub */, - { 1, 9350, 3, 5, 1, -UNI_XIDS } /* xids=f */, - { 2, 8589, 8243, 7, 8, UNI_SC__MAHJ } /* script=mahajani */, - { 0, 2409, 0, 4, 0, UNI_GLAG } /* glag */, - { 0, 5986, 8051, 13, 8, UNI_NV__5_SLASH_6 } /* numericvalue=8.33e-01 */, - { 0, 1552, 10176, 9, 2, UNI_ZL } /* category=zl */, - { 4, 3133, 26, 18, 1, UNI_EBASE } /* emojimodifierbase=y */, - { 1, 7325, 10105, 3, 3, UNI_IN__6 } /* in=v60 */, - { 0, 10048, 8720, 3, 4, UNI_NV__4000 } /* nv=4000 */, - { 1, 1417, 9126, 25, 4, UNI_CCC__19 } /* canonicalcombiningclass=ccc19 */, - { 43, 3836, 9305, 17, 5, UNI_NSHU } /* scriptextensions=nushu */, - { 0, 10027, 6325, 3, 12, UNI_JG__MALAYALAMNNA } /* jg=malayalamnna */, - { 1, 9508, 8010, 4, 2, UNI_CCC__36 } /* ccc=36 */, - { 0, 8780, 2722, 6, 10, UNI_JAMO } /* block=hanguljamo */, - { 1, 6808, 0, 4, 0, UNI__PERL_SURROGATE } /* iscs */, - { 0, 42, 0, 16, 0, UNI_CJKCOMPAT } /* cjkcompatibility */, - { 14, 8589, 6796, 7, 11, UNI_MEDF } /* script=medefaidrin */, - { 1, 5508, 0, 14, 0, UNI_patsyn_values_index } /* 
patternsyntax= */, - { 0, 10288, 1867, 8, 5, UNI_XPOSIXUPPER } /* isxposixupper */, - { 3, 8589, 7567, 7, 9, UNI_SC__SIND } /* script=khudawadi */, - { 0, 7325, 10075, 3, 3, UNI_IN__2 } /* in=v20 */, - { 24, 9604, 0, 4, 0, UNI_KHMR } /* khmr */, - { 1, 8780, 0, 6, 42, UNI_UCASEXT } /* block=unifiedcanadianaboriginalsyllabicsextended */, - { 1, 1537, 61, 3, 4, UNI_INDOGRA } /* indogra */, - { 38, 10027, 6565, 3, 11, UNI_JG__AFRICANNOON } /* jg=africannoon */, - { 1, 184, 9285, 2, 4, UNI_LIMB } /* islimb */, - { 3, 5466, 0, 16, 0, UNI_DT__CAN } /* nfdquickcheck=no */, - { 0, 7438, 6145, 10, 12, UNI_WB__EX } /* wordbreak=extendnumlet */, - { 7, 1790, 10135, 22, 3, UNI_CWCM } /* changeswhencasemapped=yes */, - { 1, 8421, 0, 4, 0, UNI_ELYM } /* elym */, - { 0, 9488, 4001, 4, 16, UNI_CYPRIOTSYLLABARY } /* blk=cypriotsyllabary */, - { 1, 3836, 8179, 17, 8, UNI_GURU } /* scriptextensions=gurmukhi */, - { 3, 10006, 9255, 3, 5, -UNI_DI } /* di=false */, - { 4, 9277, 8187, 3, 8, UNI_SC__HIRA } /* sc=hiragana */, - { 1, 10009, 45, 3, 3, UNI_DT__COM } /* dt=com */, - { 1, 6598, 0, 11, 0, UNI_CASEDLETTER } /* casedletter */, - { 1, 9351, 0, 4, 0, UNI_ids_values_index } /* ids= */, - { 0, 2950, 0, 19, 0, UNI_SUPARROWSB } /* supplementalarrowsb */, - { 0, 2784, 8093, 4, 6, UNI_INARMENIAN } /* inarmenian */, - { 16, 9768, 8115, 4, 8, UNI_BASS } /* scx=bassavah */, - { 8, 8610, 0, 4, 0, UNI_SIDD } /* sidd */, - { 2, 5032, 1025, 14, 2, -UNI_POSIXXDIGIT } /* asciihexdigit=no */, - { 1, 8780, 660, 7, 29, UNI_CJKEXTF } /* block=cjkunifiedideographsextensionf */, - { 35, 8589, 8171, 7, 8, UNI_SC__GUJR } /* script=gujarati */, - { 5, 184, 8912, 2, 6, UNI_KHOJ } /* iskhojki */, - { 0, 3836, 9708, 17, 4, UNI_ORYA } /* scriptextensions=orya */, - { 7, 7325, 7950, 3, 1, UNI_IN__9 } /* in=9 */, - { 0, 5986, 8714, 13, 2, UNI_NV__30 } /* numericvalue=30 */, - { 1, 9488, 5018, 4, 14, UNI_ANCIENTSYMBOLS } /* blk=ancientsymbols */, - { 0, 2224, 6940, 3, 10, UNI_INSORASOMPENG } /* insorasompeng */, 
- { 5, 3367, 9836, 18, 4, UNI__PERL_PATWS } /* patternwhitespace=true */, - { 4, 9488, 6025, 4, 12, UNI_ALPHABETICPF } /* blk=alphabeticpf */, - { 0, 1417, 5648, 24, 2, UNI_CCC__10 } /* canonicalcombiningclass=10 */, - { 3, 10024, 47, 3, 1, UNI_M } /* gc=m */, - { 0, 3836, 8107, 17, 8, UNI_BALI } /* scriptextensions=balinese */, - { 0, 2224, 2055, 3, 21, UNI_MODIFIERLETTERS } /* inspacingmodifierletters */, - { 8, 3836, 7513, 17, 9, UNI_BHKS } /* scriptextensions=bhaiksuki */, - { 38, 3836, 8484, 17, 7, UNI_MAND } /* scriptextensions=mandaic */, - { 3, 5791, 2637, 13, 9, UNI_JG__YEHBARREE } /* joininggroup=yehbarree */, - { 0, 4643, 3, 15, 1, -UNI_ECOMP } /* emojicomponent=f */, - { 3, 1417, 8823, 25, 5, UNI_CCC__130 } /* canonicalcombiningclass=ccc130 */, - { 4, 7325, 10078, 3, 3, UNI_IN__2_DOT_1 } /* in=v21 */, - { 25, 3836, 9612, 17, 4, UNI_KNDA } /* scriptextensions=knda */, - { 1, 10048, 9404, 3, 4, UNI_NV__13_SLASH_2 } /* nv=13/2 */, - { 2, 21, 8338, 3, 6, UNI_INAVESTAN } /* inavestan */, - { 2, 184, 3026, 3, 3, UNI_CHER } /* ischer */, - { 1, 3836, 9720, 17, 4, UNI_PHLP } /* scriptextensions=phlp */, - { 0, 7318, 7814, 10, 1, UNI_IN__7 } /* presentin=7 */, - { 0, 9488, 5214, 4, 14, UNI_KANGXI } /* blk=kangxiradicals */, - { 2, 3836, 8131, 17, 4, UNI_DUPL } /* scriptextensions=dupl */, - { 16, 8780, 2141, 7, 20, UNI_CYRILLICSUP } /* block=cyrillicsupplementary */, - { 1, 4928, 0, 15, 0, UNI_TAMILSUP } /* tamilsupplement */, - { 1, 184, 8401, 3, 5, UNI_COMPEX } /* iscompex */, - { 50, 1537, 3475, 24, 10, UNI_INPC__TOPANDLEFT } /* indicpositionalcategory=topandleft */, - { 1, 7325, 9955, 3, 3, UNI_IN__3_DOT_2 } /* in=3.2 */, - { 37, 9277, 5550, 3, 14, UNI_SC__PHLP } /* sc=psalterpahlavi */, - { 51, 10288, 7739, 3, 7, UNI_XIDS } /* isxidstart */, - { 4, 7318, 9970, 10, 3, UNI_IN__5_DOT_2 } /* presentin=5.2 */, - { 0, 3547, 0, 10, 0, UNI_ALCHEMICAL } /* alchemical */, - { 32, 9997, 3205, 3, 18, UNI_BC__FSI } /* bc=firststrongisolate */, - { 0, 5986, 8732, 13, 5, 
UNI_NV__50000 } /* numericvalue=50000 */, - { 32, 9536, 0, 4, 0, UNI_dep_values_index } /* dep= */, - { 1, 8780, 78, 6, 10, UNI_ARABICMATH } /* block=arabicmath */, - { 3, 184, 407, 3, 6, UNI_XPOSIXCNTRL } /* iscontrol */, - { 0, 184, 1677, 2, 14, UNI_LATINEXTA } /* islatinextendeda */, - { 2, 3836, 9584, 17, 4, UNI_HLUW } /* scriptextensions=hluw */, - { 2, 9488, 0, 4, 0, UNI_blk_values_index } /* blk= */, - { 0, 8589, 78, 7, 4, UNI_SC__ARAB } /* script=arab */, - { 1, 184, 3667, 3, 16, UNI_CYRILLICEXTC } /* iscyrillicextendedc */, - { 0, 8774, 26, 6, 1, UNI_BIDIM } /* bidim=y */, - { 179, 184, 5726, 2, 13, UNI_ME } /* isenclosingmark */, - { 5, 9270, 2549, 5, 3, UNI_INPC__TOP } /* inpc=top */, - { 5, 9488, 9340, 4, 5, UNI_VSSUP } /* blk=vssup */, - { 44, 8589, 8414, 7, 7, UNI_ELBA } /* script=elbasan */, - { 4, 1189, 495, 3, 7, UNI_NT__NU } /* nt=numeric */, - { 1, 4033, 1044, 16, 6, UNI_L } /* generalcategory=letter */, - { 0, 4033, 5494, 16, 14, UNI_MN } /* generalcategory=nonspacingmark */, - { 11, 10340, 1751, 3, 2, UNI_VAI } /* isvai */, - { 20, 184, 9572, 2, 4, UNI_GUJR } /* isgujr */, - { 8, 3836, 8291, 17, 4, UNI_TAGB } /* scriptextensions=tagb */, - { 0, 8589, 9688, 7, 3, UNI_NKO } /* script=nko */, - { 60, 2855, 0, 9, 0, UNI_MONG } /* mongolian */, - { 2, 184, 2608, 2, 6, UNI_BRAH } /* isbrahmi */, - { 0, 184, 1218, 2, 8, UNI_KANA } /* iskatakana */, - { 0, 9536, 1, 4, 1, -UNI_DEP } /* dep=n */, - { 3, 8780, 1513, 6, 24, UNI_HIGHPUSURROGATES } /* block=highprivateusesurrogates */, - { 0, 7318, 10090, 10, 3, UNI_IN__4 } /* presentin=v40 */, - { 0, 4628, 8, 15, 1, UNI_EA__A } /* eastasianwidth=a */, - { 1, 78, 0, 10, 0, UNI_ARABICMATH } /* arabicmath */, - { 12, 9277, 6939, 3, 4, UNI_SORA } /* sc=sora */, - { 1, 4791, 1019, 3, 4, UNI_MUSIC } /* inmusic */, - { 0, 7218, 2444, 10, 2, UNI_LB__HL } /* linebreak=hl */, - { 33, 4673, 0, 15, 0, UNI_INHANGUL } /* hangulsyllables */, - { 1, 184, 8428, 2, 7, UNI_GRAN } /* isgrantha */, - { 4, 3382, 9255, 3, 5, 
-UNI_CE } /* ce=false */, - { 2, 4033, 1563, 16, 2, UNI_PS } /* generalcategory=ps */, - { 0, 1746, 752, 23, 4, UNI_BPT__C } /* bidipairedbrackettype=close */, - { 0, 184, 8882, 2, 5, UNI_GREXT } /* isgrext */, - { 3, 6231, 3026, 3, 7, UNI_INCHEROKEE } /* incherokee */, - { 0, 184, 7098, 2, 10, UNI_BOXDRAWING } /* isboxdrawing */, - { 0, 7540, 3, 9, 1, -UNI_EXT } /* extender=f */, - { 0, 1591, 6134, 3, 11, UNI_ETHIOPICEXTA } /* inethiopicexta */, - { 0, 10340, 67, 3, 4, UNI_VSSUP } /* isvssup */, - { 2, 9520, 9836, 4, 4, UNI_CWL } /* cwl=true */, - { 57, 8780, 6796, 6, 11, UNI_INMEDEFAIDRIN } /* block=medefaidrin */, - { 6, 9488, 3421, 4, 18, UNI_RUMI } /* blk=ruminumeralsymbols */, - { 12, 9265, 3, 5, 1, -UNI_IDST } /* idst=f */, - { 4, 9508, 9208, 4, 2, UNI_CCC__35 } /* ccc=35 */, - { 1, 6805, 187, 6, 30, UNI_MISCPICTOGRAPHS } /* inmiscellaneoussymbolsandpictographs */, - { 5, 5466, 0, 14, 0, UNI_nfdqc_values_index } /* nfdquickcheck= */, - { 1, 9488, 6939, 4, 11, UNI_INSORASOMPENG } /* blk=sorasompeng */, - { 0, 9230, 36, 5, 1, UNI_CWCF } /* cwcf=t */, - { 1, 9444, 7821, 4, 1, UNI_AGE__8 } /* age=8 */, - { 0, 6554, 9255, 11, 5, -UNI_IDC } /* idcontinue=false */, - { 0, 9277, 7291, 3, 7, UNI_SC__SOGD } /* sc=sogdian */, - { 13, 8589, 9285, 7, 4, UNI_SC__LIMB } /* script=limb */, - { 3, 3836, 9496, 17, 4, UNI_BUHD } /* scriptextensions=buhd */, - { 0, 2931, 0, 19, 0, UNI_SUPARROWSA } /* supplementalarrowsa */, - { 64, 184, 2684, 2, 19, UNI_EGYP } /* isegyptianhieroglyphs */, - { 2, 8509, 811, 4, 27, UNI_ENCLOSEDIDEOGRAPHICSUP } /* inenclosedideographicsupplement */, - { 0, 9277, 6793, 5, 2, UNI_KHMR } /* sc=khmr */, - { 0, 8780, 1319, 6, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* block=symbolsandpictographsexta */, - { 69, 5986, 8820, 13, 2, UNI_NV__29 } /* numericvalue=29 */, - { 0, 184, 5947, 2, 13, UNI_MAYANNUMERALS } /* ismayannumerals */, - { 9, 6805, 2023, 6, 9, UNI_MISCTECHNICAL } /* inmisctechnical */, - { 1, 9277, 8603, 3, 7, UNI_SHAW } /* sc=shavian */, - { 
0, 1828, 10135, 6, 3, UNI_CASED } /* cased=yes */, - { 0, 9768, 4478, 4, 4, UNI_BRAI } /* scx=brai */, - { 5, 9768, 8666, 4, 7, UNI_TIRH } /* scx=tirhuta */, - { 0, 9275, 7639, 5, 9, UNI_INSC__NONJOINER } /* insc=nonjoiner */, - { 1, 1114, 36, 26, 1, UNI_CWKCF } /* changeswhennfkccasefolded=t */, - { 0, 3836, 9564, 17, 4, UNI_GONM } /* scriptextensions=gonm */, - { 0, 8589, 9612, 7, 4, UNI_SC__KNDA } /* script=knda */, - { 0, 4958, 0, 15, 0, UNI_UPPERCASELETTER } /* uppercaseletter */, - { 1, 10333, 4149, 3, 3, UNI_SARB } /* issarb */, - { 7, 1828, 1, 6, 1, -UNI_CASED } /* cased=n */, - { 0, 9277, 9002, 3, 4, UNI_SC__TELU } /* sc=telu */, - { 0, 9444, 9384, 4, 4, UNI_AGE__10 } /* age=10.0 */, - { 0, 8780, 3921, 6, 16, UNI_ARABICSUP } /* block=arabicsupplement */, - { 0, 8589, 9532, 7, 4, UNI_SC__CYRL } /* script=cyrl */, - { 1, 5986, 9436, 13, 4, UNI_NV__7_SLASH_12 } /* numericvalue=7/12 */, - { 1, 1561, 0, 24, 0, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* supsymbolsandpictographs */, - { 0, 4916, 4402, 3, 15, UNI_TANGUTSUP } /* istangutsupplement */, - { 48, 7325, 9840, 3, 4, UNI_IN__10 } /* in=v100 */, - { 1, 7325, 10108, 3, 3, UNI_IN__6_DOT_1 } /* in=v61 */, - { 2, 7318, 7755, 10, 3, UNI_IN__1_DOT_1 } /* presentin=1.1 */, - { 7, 9070, 0, 4, 0, UNI_POSIXXDIGIT } /* ahex */, - { 1, 3836, 7188, 17, 4, UNI_KHAR } /* scriptextensions=khar */, - { 0, 719, 0, 9, 0, UNI_XSUX } /* cuneiform */, - { 96, 8780, 4448, 6, 8, UNI_BAMUMSUP } /* block=bamumsup */, - { 0, 9488, 1441, 4, 10, UNI_CJKSYMBOLS } /* blk=cjksymbols */, - { 21, 10132, 6653, 3, 11, UNI_WB__DQ } /* wb=doublequote */, - { 1, 8780, 6972, 6, 11, UNI_INSYLOTINAGRI } /* block=sylotinagri */, - { 0, 3836, 2817, 17, 19, UNI_MERO } /* scriptextensions=meroitichieroglyphs */, - { 0, 184, 3683, 2, 16, UNI_ETHIOPICEXT } /* isethiopicextended */, - { 0, 9014, 1, 6, 1, -UNI_UIDEO } /* uideo=n */, - { 1, 8400, 1, 7, 1, -UNI_COMPEX } /* compex=n */, - { 0, 9277, 8888, 3, 6, UNI_HATR } /* sc=hatran */, - { 0, 1166, 9836, 26, 4, 
UNI_DI } /* defaultignorablecodepoint=true */, - { 0, 10291, 1867, 5, 5, UNI_POSIXUPPER } /* posixupper */, - { 0, 6231, 3650, 3, 16, UNI_CYRILLICEXTB } /* incyrillicextendedb */, - { 1, 8589, 493, 7, 3, UNI_SC__HAN } /* script=han */, - { 0, 8780, 2099, 7, 20, UNI_CJKCOMPATFORMS } /* block=cjkcompatibilityforms */, - { 2, 5986, 7979, 13, 8, UNI_NV__3_SLASH_5 } /* numericvalue=6.00e-01 */, - { 2, 10048, 7922, 3, 2, UNI_NV__24 } /* nv=24 */, - { 3, 2469, 0, 20, 0, UNI_HMNP } /* nyiakengpuachuehmong */, - { 25, 4829, 2411, 4, 11, UNI_GLAGOLITICSUP } /* inglagoliticsup */, - { 3, 21, 4145, 2, 16, UNI_LINEARBIDEOGRAMS } /* inlinearbideograms */, - { 0, 809, 0, 29, 0, UNI_ENCLOSEDIDEOGRAPHICSUP } /* enclosedideographicsupplement */, - { 0, 1856, 1, 22, 1, -UNI_CWU } /* changeswhenuppercased=n */, - { 0, 184, 2141, 3, 20, UNI_CYRILLICSUP } /* iscyrillicsupplementary */, - { 0, 5986, 9188, 13, 2, UNI_NV__31 } /* numericvalue=31 */, - { 2, 8780, 43, 7, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* block=cjkcompatibilityideographssupplement */, - { 1, 10033, 23, 3, 2, UNI_LB__AL } /* lb=al */, - { 0, 10027, 87, 3, 2, UNI_JG__HE } /* jg=he */, - { 4, 10132, 108, 3, 2, UNI_WB__MB } /* wb=mb */, - { 2, 4033, 1465, 16, 13, UNI_M } /* generalcategory=combiningmark */, - { 1, 9325, 0, 5, 0, UNI_RUNR } /* runic */, - { 1, 1552, 727, 9, 2, UNI_MN } /* category=mn */, - { 0, 7088, 10054, 10, 3, UNI_BC__PDF } /* bidiclass=pdf */, - { 1, 9656, 0, 4, 0, UNI_MIAO } /* miao */, - { 0, 2969, 0, 19, 0, UNI_SUPARROWSC } /* supplementalarrowsc */, - { 1, 9508, 8708, 4, 3, UNI_CCC__216 } /* ccc=216 */, - { 0, 9768, 9616, 4, 4, UNI_KTHI } /* scx=kthi */, - { 0, 6609, 36, 11, 1, UNI_DEP } /* deprecated=t */, - { 0, 8780, 510, 7, 29, UNI_CJKEXTA } /* block=cjkunifiedideographsextensiona */, - { 6, 10027, 6572, 3, 4, UNI_JG__NOON } /* jg=noon */, - { 1, 2182, 1194, 21, 2, UNI_LB__LF } /* graphemeclusterbreak=lf */, - { 0, 8589, 4478, 7, 4, UNI_BRAI } /* script=brai */, - { 1, 9768, 9576, 4, 4, UNI_GURU } 
/* scx=guru */, - { 0, 8780, 1006, 6, 27, UNI_ANCIENTGREEKMUSIC } /* block=ancientgreekmusicalnotation */, - { 0, 8858, 9836, 6, 4, UNI_ECOMP } /* ecomp=true */, - { 16, 8780, 3241, 6, 8, UNI_INGEORGIAN } /* block=georgian */, - { 0, 5739, 0, 12, 0, UNI_GRBASE } /* graphemebase */, - { 40, 4928, 0, 5, 0, UNI_TAML } /* tamil */, - { 0, 10024, 24, 3, 1, UNI_L } /* gc=l */, - { 0, 9768, 9793, 5, 3, UNI_SOGO } /* scx=sogo */, - { 25, 1768, 3, 22, 1, -UNI_CWCF } /* changeswhencasefolded=f */, - { 29, 1417, 7754, 24, 2, UNI_CCC__11 } /* canonicalcombiningclass=11 */, - { 0, 8589, 7651, 7, 4, UNI_ITAL } /* script=ital */, - { 0, 9488, 8393, 4, 7, UNI_CJKEXTG } /* blk=cjkextg */, - { 1, 9508, 18, 4, 1, UNI_CCC__R } /* ccc=r */, - { 34, 8688, 7411, 3, 7, UNI_ASSIGNED } /* isassigned */, - { 0, 21, 3295, 2, 18, UNI_LATINEXTADDITIONAL } /* inlatinextadditional */, - { 1, 9997, 4464, 4, 14, UNI_BC__BN } /* bc=boundaryneutral */, - { 0, 2760, 9, 19, 2, UNI_HST__NA } /* hangulsyllabletype=na */, - { 1, 7318, 7806, 10, 1, UNI_IN__6 } /* presentin=6 */, - { 43, 10033, 6587, 3, 11, UNI_LB__BB } /* lb=breakbefore */, - { 1, 9716, 0, 4, 0, UNI_pcm_values_index } /* pcm= */, - { 0, 9277, 1628, 3, 4, UNI_SC__PHAG } /* sc=phag */, - { 3, 2529, 9255, 20, 5, -UNI_TERM } /* terminalpunctuation=false */, - { 0, 9488, 5032, 4, 5, UNI_ASCII } /* blk=ascii */, - { 0, 9488, 8484, 4, 7, UNI_INMANDAIC } /* blk=mandaic */, - { 8, 8852, 1, 6, 1, -UNI_CWKCF } /* cwkcf=n */, - { 4, 7325, 7867, 3, 3, UNI_IN__3_DOT_1 } /* in=3.1 */, - { 0, 9275, 1608, 5, 23, UNI_INSC__CONSONANTPRECEDINGREPHA } /* insc=consonantprecedingrepha */, - { 0, 1273, 9255, 21, 5, -UNI_CE } /* compositionexclusion=false */, - { 1, 8996, 1, 6, 1, -UNI_STERM } /* sterm=n */, - { 1, 9792, 0, 4, 0, UNI_SOGO } /* sogo */, - { 0, 184, 6409, 2, 12, UNI_MEND } /* ismendekikakui */, - { 3, 9508, 9168, 4, 2, UNI_CCC__27 } /* ccc=27 */, - { 5, 4853, 26, 15, 1, UNI_DT__NONE } /* nfkdquickcheck=y */, - { 6, 9277, 8344, 3, 7, UNI_SC__BENG } 
/* sc=bengali */, - { 2, 9277, 2469, 3, 20, UNI_HMNP } /* sc=nyiakengpuachuehmong */, - { 1, 1417, 9928, 24, 3, UNI_CCC__BR } /* canonicalcombiningclass=222 */, - { 0, 3836, 3937, 17, 4, UNI_BOPO } /* scriptextensions=bopo */, - { 4, 3836, 7118, 17, 10, UNI_CHRS } /* scriptextensions=chorasmian */, - { 6, 8589, 9756, 7, 4, UNI_RUNR } /* script=runr */, - { 0, 9277, 5003, 3, 15, UNI_ZANB } /* sc=zanabazarsquare */, - { 0, 2182, 6178, 21, 3, UNI_LB__ZWJ } /* graphemeclusterbreak=zwj */, - { 2, 9508, 5377, 4, 2, UNI_CCC__7 } /* ccc=nk */, - { 0, 2779, 1, 19, 1, -UNI_IDST } /* idstrinaryoperator=n */, - { 2, 9488, 2010, 4, 22, UNI_MISCTECHNICAL } /* blk=miscellaneoustechnical */, - { 19, 1966, 0, 22, 0, UNI_insc_values_index } /* indicsyllabiccategory= */, - { 0, 9277, 7288, 3, 10, UNI_SOGO } /* sc=oldsogdian */, - { 2, 9488, 9688, 4, 3, UNI_INNKO } /* blk=nko */, - { 16, 8589, 8123, 7, 4, UNI_SC__BUGI } /* script=bugi */, - { 1, 5986, 8756, 13, 3, UNI_NV__900 } /* numericvalue=900 */, - { 0, 9235, 3, 5, 1, -UNI_CWCM } /* cwcm=f */, - { 6, 8589, 9704, 7, 4, UNI_ORKH } /* script=orkh */, - { 4, 8780, 4808, 6, 15, UNI_MISCPICTOGRAPHS } /* block=miscpictographs */, - { 2, 9520, 1025, 4, 2, -UNI_CWL } /* cwl=no */, - { 0, 9277, 9720, 3, 4, UNI_SC__PHLP } /* sc=phlp */, - { 64, 7738, 0, 8, 0, UNI_XIDS } /* xidstart */, - { 42, 9768, 5284, 4, 4, UNI_LISU } /* scx=lisu */, - { 0, 8561, 0, 4, 0, UNI_OSMA } /* osma */, - { 145, 6241, 6664, 12, 11, UNI_JT__D } /* joiningtype=dualjoining */, - { 4, 8882, 26, 6, 1, UNI_GREXT } /* grext=y */, - { 3, 1552, 1822, 9, 2, UNI_NL } /* category=nl */, - { 5, 3529, 10135, 18, 3, UNI_VS } /* variationselector=yes */, - { 0, 7675, 0, 4, 0, UNI_PALM } /* palm */, - { 0, 10009, 8195, 3, 8, UNI_DT__ISO } /* dt=isolated */, - { 16, 7504, 0, 9, 0, UNI_ARABICPFB } /* arabicpfb */, - { 0, 9760, 0, 4, 0, UNI_SAMR } /* samr */, - { 1, 9508, 7821, 4, 1, UNI_CCC__8 } /* ccc=8 */, - { 2, 184, 9503, 2, 2, UNI_MC } /* ismc */, - { 2, 3836, 8924, 17, 4, 
UNI_LEPC } /* scriptextensions=lepc */, - { 0, 9556, 70, 4, 2, UNI_GCB__PP } /* gcb=pp */, - { 3, 184, 8428, 2, 4, UNI_GRAN } /* isgran */, - { 49, 6576, 9836, 11, 4, UNI_XPOSIXALPHA } /* alphabetic=true */, - { 0, 10048, 9368, 3, 4, UNI_NV__1_SLASH_20 } /* nv=1/20 */, - { 15, 9488, 78, 4, 10, UNI_ARABICMATH } /* blk=arabicmath */, - { 0, 8864, 36, 6, 1, UNI_EMOJI } /* emoji=t */, - { 1, 9350, 9255, 5, 5, -UNI_XIDS } /* xids=false */, - { 1, 7438, 6178, 10, 3, UNI_LB__ZWJ } /* wordbreak=zwj */, - { 40, 4928, 0, 8, 0, UNI_TAMILSUP } /* tamilsup */, - { 0, 9270, 6518, 3, 11, UNI_PLAYINGCARDS } /* inplayingcards */, - { 31, 9275, 4823, 5, 15, UNI_INSC__MODIFYINGLETTER } /* insc=modifyingletter */, - { 0, 3836, 9085, 17, 5, UNI_BATK } /* scriptextensions=batak */, - { 0, 8688, 3548, 3, 16, UNI_ALCHEMICAL } /* isalchemicalsymbols */, - { 0, 9508, 9203, 4, 2, UNI_CCC__34 } /* ccc=34 */, - { 7, 2589, 0, 19, 0, UNI_ANCIENTGREEKNUMBERS } /* ancientgreeknumbers */, - { 2, 10006, 36, 3, 1, UNI_DI } /* di=t */, - { 0, 8997, 9255, 5, 5, -UNI_TERM } /* term=false */, - { 0, 10030, 6, 3, 1, UNI_JT__D } /* jt=d */, - { 1, 9768, 2203, 4, 14, UNI_ROHG } /* scx=hanifirohingya */, - { 1, 184, 24, 2, 1, UNI_L } /* isl */, - { 1, 2760, 7238, 19, 10, UNI_LB__H2 } /* hangulsyllabletype=lvsyllable */, - { 4, 8589, 8498, 7, 4, UNI_SC__MULT } /* script=mult */, - { 0, 1114, 10135, 26, 3, UNI_CWKCF } /* changeswhennfkccasefolded=yes */, - { 0, 3985, 0, 16, 0, UNI_PE } /* closepunctuation */, - { 10, 9768, 8491, 4, 4, UNI_MARC } /* scx=marc */, - { 1, 9768, 4273, 4, 7, UNI_MYMR } /* scx=myanmar */, - { 4, 5466, 10135, 14, 3, UNI_NFDQC__Y } /* nfdquickcheck=yes */, - { 1, 5986, 8066, 13, 2, UNI_NV__28 } /* numericvalue=28 */, - { 1, 7228, 3, 10, 1, -UNI_XPOSIXLOWER } /* lowercase=f */, - { 139, 8780, 2912, 6, 9, UNI_INSUNDANESE } /* block=sundanese */, - { 0, 5746, 9836, 6, 4, UNI_EBASE } /* ebase=true */, - { 1, 5791, 9044, 13, 4, UNI_JG__YUDH } /* joininggroup=yudh */, - { 0, 8780, 1654, 6, 
23, UNI_COMPATJAMO } /* block=hangulcompatibilityjamo */, - { 22, 10132, 138, 3, 2, UNI_WB__FO } /* wb=fo */, - { 0, 10027, 10057, 3, 3, UNI_JG__REH } /* jg=reh */, - { 0, 5986, 9424, 13, 4, UNI_NV__3_SLASH_64 } /* numericvalue=3/64 */, - { 0, 8589, 7359, 8, 9, UNI_SAUR } /* script=saurashtra */, - { 4, 1417, 3564, 24, 17, UNI_WB__EB } /* canonicalcombiningclass=attachedbelowleft */, - { 0, 10033, 6178, 3, 3, UNI_LB__ZWJ } /* lb=zwj */, - { 3, 8762, 1, 6, 1, -UNI_XPOSIXALPHA } /* alpha=n */, - { 8, 7088, 8, 10, 2, UNI_BC__AN } /* bidiclass=an */, - { 1, 184, 18, 2, 2, UNI_RI } /* isri */, - { 17, 10027, 5382, 3, 14, UNI_JG__MANICHAEANQOPH } /* jg=manichaeanqoph */, - { 1, 9768, 7660, 4, 4, UNI_PERM } /* scx=perm */, - { 0, 3836, 9464, 17, 4, UNI_ARMN } /* scriptextensions=armn */, - { 0, 512, 0, 16, 0, UNI_UIDEO } /* unifiedideograph */, - { 0, 9488, 2245, 4, 21, UNI_MEETEIMAYEKEXT } /* blk=meeteimayekextensions */, - { 3, 7738, 9255, 9, 5, -UNI_XIDS } /* xidstart=false */, - { 33, 8694, 10135, 7, 3, UNI_XPOSIXSPACE } /* wspace=yes */, - { 17, 9444, 7950, 4, 1, UNI_AGE__9 } /* age=9 */, - { 74, 2817, 0, 19, 0, UNI_MERO } /* meroitichieroglyphs */, - { 0, 8589, 9620, 7, 4, UNI_LANA } /* script=lana */, - { 0, 9768, 5003, 4, 15, UNI_ZANB } /* scx=zanabazarsquare */, - { 1, 5746, 1, 6, 1, -UNI_EBASE } /* ebase=n */, - { 0, 8780, 9032, 6, 6, UNI_INWANCHO } /* block=wancho */, - { 8, 5284, 0, 4, 0, UNI_LISU } /* lisu */, - { 20, 1900, 0, 22, 0, UNI_INDICNUMBERFORMS } /* commonindicnumberforms */, - { 0, 6576, 10135, 11, 3, UNI_XPOSIXALPHA } /* alphabetic=yes */, - { 0, 1006, 0, 17, 0, UNI_ANCIENTGREEKMUSIC } /* ancientgreekmusic */, - { 0, 5986, 8714, 13, 3, UNI_NV__300 } /* numericvalue=300 */, - { 0, 3043, 0, 18, 0, UNI_HALFMARKS } /* combininghalfmarks */, - { 0, 9277, 9335, 3, 4, UNI_SC__TAKR } /* sc=takr */, - { 8, 7738, 0, 9, 0, UNI_xids_values_index } /* xidstart= */, - { 0, 184, 9756, 2, 4, UNI_RUNR } /* isrunr */, - { 1, 184, 7188, 2, 4, UNI_KHAR } /* iskhar 
*/, - { 3, 8884, 1, 4, 1, -UNI_EXT } /* ext=n */, - { 4, 9351, 10135, 4, 3, UNI_IDS } /* ids=yes */, - { 1, 184, 3169, 2, 4, UNI_ETHI } /* isethi */, - { 10, 2224, 1345, 3, 24, UNI_SYMBOLSFORLEGACYCOMPUTING } /* insymbolsforlegacycomputing */, - { 2, 8780, 3026, 7, 17, UNI_CHEROKEESUP } /* block=cherokeesupplement */, - { 4, 9444, 9844, 4, 3, UNI_IN__1_DOT_1 } /* age=v11 */, - { 0, 9768, 382, 4, 4, UNI_EGYP } /* scx=egyp */, - { 89, 3277, 0, 18, 0, UNI_PI } /* initialpunctuation */, - { 4, 9488, 9664, 4, 3, UNI_INMRO } /* blk=mro */, - { 0, 9277, 8561, 3, 4, UNI_OSMA } /* sc=osma */, - { 0, 3098, 0, 5, 0, UNI_ECOMP } /* ecomp */, - { 0, 10012, 1204, 3, 9, UNI_EA__F } /* ea=fullwidth */, - { 16, 1537, 9, 24, 2, UNI_INPC__NA } /* indicpositionalcategory=na */, - { 0, 10048, 7874, 3, 2, UNI_NV__23 } /* nv=23 */, - { 0, 5791, 5354, 13, 14, UNI_JG__MANICHAEANHETH } /* joininggroup=manichaeanheth */, - { 1, 1114, 1025, 26, 2, -UNI_CWKCF } /* changeswhennfkccasefolded=no */, - { 2, 3853, 9255, 17, 5, -UNI_STERM } /* sentenceterminal=false */, - { 0, 7088, 2268, 10, 3, UNI_BC__PDI } /* bidiclass=pdi */, - { 2, 184, 9616, 2, 4, UNI_KTHI } /* iskthi */, - { 4, 10027, 5, 3, 1, UNI_JG__E } /* jg=e */, - { 0, 1344, 0, 25, 0, UNI_SYMBOLSFORLEGACYCOMPUTING } /* symbolsforlegacycomputing */, - { 0, 2703, 0, 19, 0, UNI_ENCLOSEDALPHANUMSUP } /* enclosedalphanumsup */, - { 1, 7318, 9852, 10, 4, UNI_IN__12_DOT_1 } /* presentin=v121 */, - { 1, 8589, 2608, 7, 4, UNI_BRAH } /* script=brah */, - { 58, 9488, 6109, 4, 12, UNI_CYRILLICEXTB } /* blk=cyrillicextb */, - { 35, 6231, 720, 3, 29, UNI_CUNEIFORMNUMBERS } /* incuneiformnumbersandpunctuation */, - { 98, 9277, 9828, 3, 4, UNI_THAI } /* sc=thai */, - { 37, 2288, 3055, 5, 6, UNI_HALFMARKS } /* inhalfmarks */, - { 7, 5986, 8727, 13, 2, UNI_NV__32 } /* numericvalue=32 */, - { 0, 8852, 0, 5, 0, UNI_CWKCF } /* cwkcf */, - { 2, 9488, 6807, 4, 11, UNI_MISCSYMBOLS } /* blk=miscsymbols */, - { 1, 8589, 9872, 7, 4, UNI_XPEO } /* script=xpeo */, - 
{ 3, 1979, 5818, 10, 12, UNI_ZL } /* category=lineseparator */, - { 3, 1417, 3572, 24, 5, UNI_CCC__B } /* canonicalcombiningclass=below */, - { 17, 1369, 0, 24, 0, UNI_ARABICPFA } /* arabicpresentationformsa */, - { 82, 9262, 751, 3, 5, UNI_SB__CL } /* sb=close */, - { 13, 2529, 0, 21, 0, UNI_TERM } /* terminalpunctuation=t */, - { 3, 9488, 4241, 4, 16, UNI_MISCMATHSYMBOLSA } /* blk=miscmathsymbolsa */, - { 0, 9488, 8386, 4, 7, UNI_CJKEXTF } /* blk=cjkextf */, - { 12, 8780, 1033, 6, 11, UNI_ENCLOSEDCJK } /* block=enclosedcjk */, - { 1, 9277, 8428, 3, 7, UNI_SC__GRAN } /* sc=grantha */, - { 0, 749, 0, 16, 0, UNI_ENCLOSEDALPHANUM } /* enclosedalphanum */, - { 0, 9488, 1369, 4, 24, UNI_ARABICPFA } /* blk=arabicpresentationformsa */, - { 2, 3331, 0, 18, 0, UNI_ORNAMENTALDINGBATS } /* ornamentaldingbats */, - { 1, 9524, 1, 4, 1, -UNI_CWT } /* cwt=n */, - { 0, 7076, 4449, 3, 14, UNI_BAMUMSUP } /* inbamumsupplement */, - { 2, 7318, 7469, 10, 1, UNI_IN__5 } /* presentin=5 */, - { 0, 9230, 0, 4, 0, UNI_CWCF } /* cwcf */, - { 1, 9277, 9688, 3, 3, UNI_NKO } /* sc=nko */, - { 0, 8631, 0, 7, 0, UNI_SUPPUAB } /* suppuab */, - { 142, 9540, 9255, 4, 5, -UNI_DIA } /* dia=false */, - { 2, 4033, 4568, 16, 14, UNI_SC } /* generalcategory=currencysymbol */, - { 30, 8870, 26, 6, 1, UNI_EPRES } /* epres=y */, - { 1, 9768, 6886, 5, 3, UNI_SHAW } /* scx=shaw */, - { 1, 5032, 26, 14, 1, UNI_POSIXXDIGIT } /* asciihexdigit=y */, - { 6, 5986, 9910, 13, 3, UNI_NV__1_SLASH_9 } /* numericvalue=1/9 */, - { 0, 3836, 9688, 17, 4, UNI_NKO } /* scriptextensions=nkoo */, - { 0, 9277, 9780, 3, 4, UNI_SHAW } /* sc=shaw */, - { 6, 10048, 7950, 3, 1, UNI_NV__9 } /* nv=9 */, - { 0, 7325, 9401, 3, 3, UNI_IN__3 } /* in=3.0 */, - { 24, 5739, 26, 13, 1, UNI_GRBASE } /* graphemebase=y */, - { 3, 184, 2836, 2, 19, UNI_MODIFIERTONELETTERS } /* ismodifiertoneletters */, - { 2, 1834, 0, 22, 0, UNI_cwt_values_index } /* changeswhentitlecased= */, - { 0, 184, 951, 2, 28, UNI_VSSUP } /* isvariationselectorssupplement 
*/, - { 0, 9768, 9448, 4, 4, UNI_AGHB } /* scx=aghb */, - { 1, 9768, 9789, 5, 3, UNI_SHRD } /* scx=shrd */, - { 0, 9508, 8805, 5, 5, UNI_CCC__118 } /* ccc=ccc118 */, - { 6, 6085, 0, 12, 0, UNI_CHESSSYMBOLS } /* chesssymbols */, - { 3, 10048, 8710, 3, 2, UNI_NV__60 } /* nv=60 */, - { 0, 3097, 10069, 18, 3, UNI_DT__SQR } /* decompositiontype=sqr */, - { 1, 6553, 1, 12, 1, -UNI_XIDC } /* xidcontinue=n */, - { 0, 8147, 36, 8, 1, UNI_EXTPICT } /* extpict=t */, - { 1, 8780, 809, 6, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* block=enclosedideographicsup */, - { 5, 117, 4704, 3, 14, UNI_INIMPERIALARAMAIC } /* inimperialaramaic */, - { 24, 9277, 3937, 3, 8, UNI_SC__BOPO } /* sc=bopomofo */, - { 0, 8996, 0, 5, 0, UNI_STERM } /* sterm */, - { 5, 184, 6620, 2, 6, UNI_DOMINO } /* isdomino */, - { 0, 3836, 4478, 17, 7, UNI_BRAI } /* scriptextensions=braille */, - { 3, 8147, 0, 8, 0, UNI_extpict_values_index } /* extpict= */, - { 1, 4422, 3117, 4, 8, UNI_INDEVANAGARI } /* indevanagari */, - { 0, 5578, 751, 14, 2, UNI_SB__CL } /* sentencebreak=cl */, - { 0, 10048, 7765, 3, 2, UNI_NV__25 } /* nv=25 */, - { 7, 8954, 0, 6, 0, UNI_nchar_values_index } /* nchar= */, - { 26, 9488, 7118, 4, 10, UNI_INCHORASMIAN } /* blk=chorasmian */, - { 5, 184, 1466, 3, 12, UNI_M } /* iscombiningmark */, - { 0, 10296, 10309, 3, 4, UNI_XPOSIXPRINT } /* isprint */, - { 1, 10048, 0, 3, 0, UNI_nv_values_index } /* nv= */, - { 8, 7218, 7268, 10, 10, UNI_LB__NS } /* linebreak=nonstarter */, - { 2, 5791, 4177, 13, 16, UNI_JG__MANICHAEANDALETH } /* joininggroup=manichaeandaleth */, - { 5, 8589, 8606, 10, 4, UNI_SHAW } /* script=shavian */, - { 1, 9688, 0, 4, 0, UNI_NKO } /* nkoo */, - { 0, 8780, 2589, 6, 19, UNI_ANCIENTGREEKNUMBERS } /* block=ancientgreeknumbers */, - { 0, 8589, 9696, 7, 4, UNI_OGAM } /* script=ogam */, - { 33, 10027, 6774, 3, 11, UNI_JG__MALAYALAMJA } /* jg=malayalamja */, - { 0, 3853, 10135, 17, 3, UNI_STERM } /* sentenceterminal=yes */, - { 17, 2288, 2724, 4, 17, UNI_JAMOEXTA } /* 
inhanguljamoextendeda */, - { 0, 7155, 9585, 3, 3, UNI_HLUW } /* ishluw */, - { 0, 10048, 9376, 3, 4, UNI_NV__1_SLASH_64 } /* nv=1/64 */, - { 0, 184, 3133, 2, 5, UNI_EMOJI } /* isemoji */, - { 42, 2140, 0, 18, 0, UNI_CYRILLICSUP } /* cyrillicsupplement */, - { 4, 184, 4793, 2, 15, UNI_MERC } /* ismeroiticcursive */, - { 11, 7540, 9836, 9, 4, UNI_EXT } /* extender=true */, - { 0, 78, 0, 6, 0, UNI_ARAB } /* arabic */, - { 0, 9520, 9255, 4, 5, -UNI_CWL } /* cwl=false */, - { 1, 184, 2032, 2, 21, UNI__PERL_NCHAR } /* isnoncharactercodepoint */, - { 5, 8351, 0, 7, 0, UNI_CJKEXTA } /* cjkexta */, - { 5, 7438, 4856, 10, 2, UNI_WB__DQ } /* wordbreak=dq */, - { 0, 8589, 8299, 7, 8, UNI_TFNG } /* script=tifinagh */, - { 13, 4628, 1192, 15, 9, UNI_EA__H } /* eastasianwidth=halfwidth */, - { 2, 9508, 9934, 4, 3, UNI_CCC__R } /* ccc=226 */, - { 0, 8589, 8990, 7, 6, UNI_RJNG } /* script=rejang */, - { 29, 10048, 7803, 3, 8, UNI_NV__1_SLASH_64 } /* nv=1.56e-02 */, - { 0, 8780, 951, 6, 28, UNI_VSSUP } /* block=variationselectorssupplement */, - { 0, 6484, 0, 4, 0, UNI_HUNG } /* hung */, - { 2, 3097, 6421, 18, 12, UNI_DT__NONCANON } /* decompositiontype=noncanonical */, - { 0, 3836, 7428, 17, 4, UNI_WARA } /* scriptextensions=wara */, - { 6, 10060, 36, 3, 1, UNI_RI } /* ri=t */, - { 2, 1188, 8292, 3, 7, UNI_INTAGBANWA } /* intagbanwa */, - { 3, 184, 47, 2, 1, UNI_M } /* ism */, - { 12, 6710, 3881, 4, 4, UNI_INCARIAN } /* incarian */, - { 0, 8780, 4273, 6, 7, UNI_INMYANMAR } /* block=myanmar */, - { 3, 9275, 3061, 5, 18, UNI_INSC__CONSONANTSUBJOINED } /* insc=consonantsubjoined */, - { 0, 9508, 9221, 5, 4, UNI_CCC__91 } /* ccc=ccc91 */, - { 13, 8589, 4385, 7, 4, UNI_TANG } /* script=tang */, - { 0, 7088, 2893, 10, 19, UNI_BC__RLO } /* bidiclass=righttoleftoverride */, - { 0, 8589, 7558, 7, 9, UNI_SC__QAAI } /* script=inherited */, - { 1, 7088, 10018, 10, 3, UNI_BC__FSI } /* bidiclass=fsi */, - { 3, 8780, 6505, 6, 12, UNI_PHAISTOS } /* block=phaistosdisc */, - { 0, 10024, 10168, 3, 
2, UNI_CASEDLETTER } /* gc=l& */, - { 2, 10033, 5564, 3, 9, UNI_LB__QU } /* lb=quotation */, - { 3, 9488, 1033, 4, 27, UNI_ENCLOSEDCJK } /* blk=enclosedcjklettersandmonths */, - { 6, 2224, 780, 3, 29, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* insymbolsandpictographsextendeda */, - { 1, 184, 3870, 2, 17, UNI_SMALLFORMS } /* issmallformvariants */, - { 0, 9808, 0, 4, 0, UNI_TALU } /* talu */, - { 5, 6805, 4261, 6, 12, UNI_MISCMATHSYMBOLSB } /* inmiscmathsymbolsb */, - { 8, 3836, 9008, 17, 6, UNI_THAA } /* scriptextensions=thaana */, - { 6, 9277, 78, 3, 4, UNI_SC__ARAB } /* sc=arab */, - { 1, 2218, 9685, 3, 3, UNI_INNEWA } /* innewa */, - { 1, 3367, 0, 18, 0, UNI_patws_values_index } /* patternwhitespace= */, - { 1, 6061, 10135, 12, 3, UNI_BIDIC } /* bidicontrol=yes */, - { 0, 8780, 9305, 6, 5, UNI_INNUSHU } /* block=nushu */, - { 1, 9488, 8596, 4, 7, UNI_SC__SHRD } /* blk=sharada */, - { 0, 9768, 8344, 4, 4, UNI_BENG } /* scx=beng */, - { 6, 3853, 3, 17, 1, -UNI_STERM } /* sentenceterminal=f */, - { 1, 779, 0, 30, 0, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* symbolsandpictographsextendeda */, - { 1, 9260, 1025, 5, 2, -UNI_IDSB } /* idsb=no */, - { 1, 9768, 7621, 4, 9, UNI_NBAT } /* scx=nabataean */, - { 3, 8780, 2076, 6, 22, UNI_TRANSPORTANDMAP } /* block=transportandmapsymbols */, - { 0, 6469, 0, 12, 0, UNI_nt_values_index } /* numerictype= */, - { 0, 7218, 7522, 10, 9, UNI_LB__B2 } /* linebreak=breakboth */, - { 0, 9277, 9245, 3, 5, UNI_SC__DOGR } /* sc=dogra */, - { 0, 9488, 908, 4, 10, UNI_PUA } /* blk=privateuse */, - { 7, 10027, 6906, 3, 11, UNI_JG__ROHINGYAYEH } /* jg=rohingyayeh */, - { 3, 2288, 1656, 4, 21, UNI_COMPATJAMO } /* inhangulcompatibilityjamo */, - { 2, 3097, 1294, 18, 5, UNI_DT__SUP } /* decompositiontype=super */, - { 2, 9488, 4598, 4, 15, UNI_DIACRITICALSEXT } /* blk=diacriticalsext */, - { 0, 9508, 7950, 4, 1, UNI_CCC__9 } /* ccc=9 */, - { 5, 4065, 0, 16, 0, UNI_HALFANDFULLFORMS } /* halfandfullforms */, - { 2, 7088, 3700, 10, 17, UNI_BC__ES } /* 
bidiclass=europeanseparator */, - { 48, 8589, 2855, 7, 9, UNI_SC__MONG } /* script=mongolian */, - { 0, 7218, 395, 10, 2, UNI_LB__GL } /* linebreak=gl */, - { 1, 9008, 0, 4, 0, UNI_THAA } /* thaa */, - { 3, 9488, 6121, 4, 12, UNI_CYRILLICEXTC } /* blk=cyrillicextc */, - { 4, 184, 1944, 2, 22, UNI_EARLYDYNASTICCUNEIFORM } /* isearlydynasticcuneiform */, - { 8, 10024, 6035, 3, 2, UNI_PF } /* gc=pf */, - { 0, 10048, 8750, 3, 4, UNI_NV__8000 } /* nv=8000 */, - { 2, 4116, 6, 3, 2, UNI_IDC } /* isidc */, - { 7, 10048, 7858, 3, 2, UNI_NV__22 } /* nv=22 */, - { 1, 9488, 2609, 5, 5, UNI_INBRAHMI } /* blk=brahmi */, - { 0, 8115, 0, 4, 0, UNI_BASS } /* bass */, - { 2, 9768, 8477, 4, 7, UNI_MAKA } /* scx=makasar */, - { 0, 8780, 570, 7, 29, UNI_CJKEXTC } /* block=cjkunifiedideographsextensionc */, - { 0, 10033, 5585, 3, 2, UNI_EBASE } /* lb=eb */, - { 14, 2119, 0, 14, 0, UNI_CJKRADICALSSUP } /* cjkradicalssup */, - { 0, 493, 0, 3, 0, UNI_HAN } /* han */, - { 1, 3836, 2817, 17, 4, UNI_MERO } /* scriptextensions=mero */, - { 1, 10288, 6554, 3, 10, UNI_XIDC } /* isxidcontinue */, - { 65, 184, 6807, 2, 11, UNI_MISCSYMBOLS } /* ismiscsymbols */, - { 65, 9508, 9922, 4, 3, UNI_CCC__214 } /* ccc=214 */, - { 100, 8275, 0, 8, 0, UNI_SPECIALS } /* specials */, - { 0, 5986, 7890, 13, 2, UNI_NV__33 } /* numericvalue=33 */, - { 0, 2288, 1514, 3, 23, UNI_HIGHPUSURROGATES } /* inhighprivateusesurrogates */, - { 24, 2760, 5633, 19, 2, UNI_LB__H2 } /* hangulsyllabletype=lv */, - { 17, 184, 908, 2, 14, UNI_PUA } /* isprivateusearea */, - { 0, 9768, 8659, 4, 7, UNI_TIBT } /* scx=tibetan */, - { 4, 10129, 10135, 3, 3, UNI_VS } /* vs=yes */, - { 1, 7540, 9255, 9, 5, -UNI_EXT } /* extender=false */, - { 1, 9350, 1025, 5, 2, -UNI_XIDS } /* xids=no */, - { 1, 9768, 8645, 4, 7, UNI_LANA } /* scx=taitham */, - { 0, 8589, 2817, 7, 19, UNI_MERO } /* script=meroitichieroglyphs */, - { 11, 9504, 0, 4, 0, UNI_CANS } /* cans */, - { 0, 9277, 9580, 3, 4, UNI_SC__HANO } /* sc=hano */, - { 15, 10024, 1, 3, 1, 
UNI_N } /* gc=n */, - { 21, 3836, 9740, 17, 4, UNI_QAAI } /* scriptextensions=qaai */, - { 22, 10033, 5088, 3, 14, UNI_LB__SA } /* lb=complexcontext */, - { 0, 1417, 9223, 24, 2, UNI_CCC__91 } /* canonicalcombiningclass=91 */, - { 0, 9596, 6541, 4, 12, UNI_GCB__T } /* hst=trailingjamo */, - { 0, 8688, 3923, 4, 14, UNI_ARABICSUP } /* isarabicsupplement */, - { 4, 184, 3893, 2, 11, UNI_SGNW } /* issignwriting */, - { 0, 7118, 0, 10, 0, UNI_CHRS } /* chorasmian */, - { 4, 0, 0, 42, 0, UNI_UCASEXT } /* unifiedcanadianaboriginalsyllabicsextended */, - { 3, 10333, 6973, 3, 3, UNI_SYLO } /* issylo */, - { 5, 7088, 2509, 10, 11, UNI_BC__R } /* bidiclass=righttoleft */, - { 5, 9275, 4417, 5, 5, UNI_INSC__VOWEL } /* insc=vowel */, - { 0, 10024, 5494, 3, 14, UNI_MN } /* gc=nonspacingmark */, - { 32, 1552, 9225, 9, 5, UNI_XPOSIXCNTRL } /* category=cntrl */, - { 16, 9262, 9080, 3, 5, UNI_SB__AT } /* sb=aterm */, - { 0, 10033, 908, 3, 2, UNI_LB__PR } /* lb=pr */, - { 0, 7318, 7781, 10, 1, UNI_IN__4 } /* presentin=4 */, - { 0, 4883, 0, 15, 0, UNI_SARB } /* oldsoutharabian */, - { 0, 5791, 4773, 13, 3, UNI_JG__SAD } /* joininggroup=sad */, - { 1, 183, 0, 20, 0, UNI_MISCSYMBOLS } /* miscellaneoussymbols */, - { 1, 6231, 3081, 4, 16, UNI_COPTICEPACTNUMBERS } /* incopticepactnumbers */, - { 1, 5116, 1, 14, 1, -UNI_EMOD } /* emojimodifier=n */, - { 0, 3836, 9636, 17, 4, UNI_LINB } /* scriptextensions=linb */, - { 32, 8780, 349, 6, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* block=supplementalsymbolsandpictographs */, - { 0, 5018, 0, 14, 0, UNI_ANCIENTSYMBOLS } /* ancientsymbols */, - { 4, 10048, 7821, 3, 1, UNI_NV__8 } /* nv=8 */, - { 3, 5986, 9380, 13, 3, UNI_NV__1_SLASH_8 } /* numericvalue=1/8 */, - { 3, 9488, 8379, 4, 7, UNI_CJKEXTE } /* blk=cjkexte */, - { 24, 4916, 3458, 3, 10, UNI_TAIXUANJING } /* istaixuanjing */, - { 1, 8864, 9255, 6, 5, -UNI_EMOJI } /* emoji=false */, - { 1, 3836, 2560, 17, 4, UNI_MAND } /* scriptextensions=mand */, - { 1, 8912, 0, 4, 0, UNI_KHOJ } /* khoj */, - { 
0, 8780, 8243, 6, 8, UNI_INMAHAJANI } /* block=mahajani */, - { 1, 9277, 3241, 3, 8, UNI_SC__GEOR } /* sc=georgian */, - { 1, 8187, 0, 4, 0, UNI_HIRA } /* hira */, - { 23, 184, 2054, 2, 22, UNI_MODIFIERLETTERS } /* isspacingmodifierletters */, - { 0, 1417, 7858, 24, 3, UNI_CCC__B } /* canonicalcombiningclass=220 */, - { 0, 9290, 9836, 5, 4, UNI_MATH } /* math=true */, - { 1, 5986, 9432, 13, 4, UNI_NV__5_SLASH_12 } /* numericvalue=5/12 */, - { 1, 9768, 9808, 4, 4, UNI_TALU } /* scx=talu */, - { 15, 3529, 9255, 18, 5, -UNI_VS } /* variationselector=false */, - { 0, 1537, 7170, 4, 8, UNI_INDIVESAKURU } /* indivesakuru */, - { 1, 3529, 9836, 18, 4, UNI_VS } /* variationselector=true */, - { 8, 1834, 1, 22, 1, -UNI_CWT } /* changeswhentitlecased=n */, - { 0, 3097, 2569, 18, 4, UNI_DT__VERT } /* decompositiontype=vert */, - { 2, 4916, 2297, 3, 3, UNI_THAI } /* isthai */, - { 51, 9556, 34, 4, 6, UNI_GCB__EX } /* gcb=extend */, - { 1, 184, 2350, 3, 19, UNI_PC } /* isconnectorpunctuation */, - { 8, 7158, 0, 10, 0, UNI_dia_values_index } /* diacritic= */, - { 2, 4033, 728, 16, 6, UNI_N } /* generalcategory=number */, - { 0, 10048, 8756, 3, 3, UNI_NV__900 } /* nv=900 */, - { 2, 9488, 113, 4, 25, UNI_DIACRITICALS } /* blk=combiningdiacriticalmarks */, - { 1, 96, 0, 10, 0, UNI_XPOSIXALPHA } /* alphabetic */, - { 0, 9488, 1677, 4, 9, UNI_LATINEXTE } /* blk=latinexte */, - { 0, 184, 809, 2, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* isenclosedideographicsupplement */, - { 3, 8589, 8876, 7, 4, UNI_GOTH } /* script=goth */, - { 0, 10048, 7778, 3, 2, UNI_NV__21 } /* nv=21 */, - { 1, 2529, 1025, 20, 2, -UNI_TERM } /* terminalpunctuation=no */, - { 1, 184, 5746, 2, 5, UNI_EBASE } /* isebase */, - { 0, 8589, 1115, 7, 4, UNI_SC__HANG } /* script=hang */, - { 54, 184, 3295, 2, 18, UNI_LATINEXTADDITIONAL } /* islatinextadditional */, - { 31, 9488, 3683, 4, 16, UNI_ETHIOPICEXT } /* blk=ethiopicextended */, - { 3, 7438, 5746, 10, 5, UNI_WB__EB } /* wordbreak=ebase */, - { 5, 8589, 8091, 7, 8, 
UNI_ARMN } /* script=armenian */, - { 22, 7076, 1586, 3, 22, UNI_BYZANTINEMUSIC } /* inbyzantinemusicalsymbols */, - { 0, 7155, 8450, 3, 5, UNI_HYPHEN } /* ishyphen */, - { 0, 5791, 5, 13, 1, UNI_JG__E } /* joininggroup=e */, - { 1, 9277, 9656, 3, 4, UNI_MIAO } /* sc=miao */, - { 3, 10132, 8139, 3, 8, UNI_WB__EB } /* wb=ebasegaz */, - { 2, 1417, 0, 24, 0, UNI_ccc_values_index } /* canonicalcombiningclass= */, - { 1, 2529, 10135, 20, 3, UNI_TERM } /* terminalpunctuation=yes */, - { 4, 9816, 0, 4, 0, UNI_TAVT } /* tavt */, - { 5, 8768, 36, 6, 1, UNI_BIDIC } /* bidic=t */, - { 0, 9768, 8107, 4, 4, UNI_BALI } /* scx=bali */, - { 0, 8449, 36, 7, 1, UNI_HYPHEN } /* hyphen=t */, - { 1, 9444, 10102, 4, 3, UNI_AGE__5_DOT_2 } /* age=v52 */, - { 14, 5986, 8732, 13, 6, UNI_NV__500000 } /* numericvalue=500000 */, - { 0, 4916, 8584, 3, 3, UNI_TAGS } /* istags */, - { 8, 9788, 0, 4, 0, UNI_SHRD } /* shrd */, - { 2, 9488, 4973, 4, 8, UNI_VEDICEXT } /* blk=vedicext */, - { 1, 9488, 2855, 4, 12, UNI_MONGOLIANSUP } /* blk=mongoliansup */, - { 0, 9020, 36, 6, 1, UNI_XPOSIXUPPER } /* upper=t */, - { 24, 1417, 9221, 25, 4, UNI_CCC__91 } /* canonicalcombiningclass=ccc91 */, - { 1, 9488, 2429, 4, 20, UNI_ININSCRIPTIONALPAHLAVI } /* blk=inscriptionalpahlavi */, - { 1, 6277, 0, 12, 0, UNI_MAHJONG } /* mahjongtiles */, - { 0, 184, 8484, 2, 7, UNI_MAND } /* ismandaic */, - { 3, 8780, 2666, 7, 18, UNI_COUNTINGROD } /* block=countingrodnumerals */, - { 1, 184, 9864, 2, 4, UNI_WCHO } /* iswcho */, - { 33, 5060, 1, 14, 1, -UNI_CI } /* caseignorable=n */, - { 0, 184, 1, 2, 1, UNI_N } /* isn */, - { 7, 8780, 4478, 6, 7, UNI_BRAI } /* block=braille */, - { 8, 5578, 1867, 14, 5, UNI_SB__UP } /* sentencebreak=upper */, - { 6, 9768, 7651, 4, 4, UNI_ITAL } /* scx=ital */, - { 4, 10048, 8738, 3, 6, UNI_NV__600000 } /* nv=600000 */, - { 13, 3079, 0, 6, 0, UNI_COPT } /* coptic */, - { 8, 8589, 2224, 7, 21, UNI_PRTI } /* script=inscriptionalparthian */, - { 1, 3836, 9600, 17, 4, UNI_KALI } /* 
scriptextensions=kali */, - { 47, 1417, 16, 24, 1, UNI_CCC__B } /* canonicalcombiningclass=b */, - { 1, 8589, 2913, 8, 8, UNI_SUND } /* script=sundanese */, - { 33, 10048, 8019, 3, 8, UNI_NV__2_SLASH_3 } /* nv=6.67e-01 */, - { 32, 3424, 1, 3, 41, UNI_UCASEXT } /* inunifiedcanadianaboriginalsyllabicsextended */, - { 16, 9768, 8442, 4, 7, UNI_HANO } /* scx=hanunoo */, - { 26, 9070, 1025, 5, 2, -UNI_POSIXXDIGIT } /* ahex=no */, - { 0, 184, 8936, 2, 6, UNI_LYCI } /* islycian */, - { 1, 6253, 0, 12, 0, UNI_KHMERSYMBOLS } /* khmersymbols */, - { 0, 9768, 5843, 4, 9, UNI_MLYM } /* scx=malayalam */, - { 0, 10024, 341, 3, 2, UNI_PE } /* gc=pe */, - { 7, 9488, 3331, 4, 18, UNI_ORNAMENTALDINGBATS } /* blk=ornamentaldingbats */, - { 4, 9508, 3015, 4, 5, UNI_CCC__A } /* ccc=above */, - { 1, 9488, 3457, 4, 18, UNI_TAIXUANJING } /* blk=taixuanjingsymbols */, - { 0, 5791, 7199, 14, 9, UNI_JG__KNOTTEDHEH } /* joininggroup=knottedheh */, - { 5, 1417, 8795, 24, 3, UNI_CCC__103 } /* canonicalcombiningclass=103 */, - { 1, 5791, 10057, 13, 3, UNI_JG__REH } /* joininggroup=reh */, - { 3, 9488, 5688, 5, 12, UNI_BLOCKELEMENTS } /* blk=blockelements */, - { 0, 1878, 0, 22, 0, UNI_CJKCOMPATIDEOGRAPHSSUP } /* cjkcompatideographssup */, - { 1, 7318, 9840, 10, 4, UNI_IN__10 } /* presentin=v100 */, - { 0, 8780, 7291, 6, 7, UNI_INSOGDIAN } /* block=sogdian */, - { 24, 9277, 8990, 3, 6, UNI_RJNG } /* sc=rejang */, - { 0, 10027, 9648, 3, 4, UNI_JG__MEEM } /* jg=meem */, - { 5, 9724, 0, 4, 0, UNI_PHNX } /* phnx */, - { 2, 184, 2855, 2, 12, UNI_MONGOLIANSUP } /* ismongoliansup */, - { 1, 9768, 3241, 4, 8, UNI_GEOR } /* scx=georgian */, - { 4, 10033, 10160, 3, 2, UNI_LB__H3 } /* lb=h3 */, - { 2, 9492, 751, 4, 5, UNI_BPT__C } /* bpt=close */, - { 8, 8407, 0, 7, 0, UNI_DSRT } /* deseret */, - { 56, 10048, 8750, 3, 6, UNI_NV__800000 } /* nv=800000 */, - { 1, 2409, 0, 13, 0, UNI_GLAGOLITICSUP } /* glagoliticsup */, - { 16, 9768, 9592, 4, 4, UNI_HMNP } /* scx=hmnp */, - { 9, 8589, 9584, 7, 4, UNI_HLUW } /* 
script=hluw */, - { 1, 2280, 4885, 4, 13, UNI_SARB } /* isoldsoutharabian */, - { 1, 3836, 9664, 17, 4, UNI_MRO } /* scriptextensions=mroo */, - { 176, 6420, 9321, 3, 4, UNI_INOSAGE } /* inosage */, - { 1, 8780, 8906, 6, 6, UNI_KANBUN } /* block=kanbun */, - { 81, 1944, 0, 22, 0, UNI_EARLYDYNASTICCUNEIFORM } /* earlydynasticcuneiform */, - { 2, 9277, 382, 3, 4, UNI_EGYP } /* sc=egyp */, - { 0, 1087, 3, 27, 1, -UNI_PCM } /* prependedconcatenationmark=f */, - { 0, 8589, 7288, 7, 10, UNI_SOGO } /* script=oldsogdian */, - { 10, 9488, 5270, 4, 14, UNI_LATINEXTE } /* blk=latinextendede */, - { 112, 3836, 9900, 17, 4, UNI_ZZZZ } /* scriptextensions=zzzz */, - { 0, 8688, 2590, 3, 18, UNI_ANCIENTGREEKNUMBERS } /* isancientgreeknumbers */, - { 65, 9997, 10042, 3, 3, UNI_BC__LRO } /* bc=lro */, - { 0, 10033, 1465, 3, 13, UNI_LB__CM } /* lb=combiningmark */, - { 28, 8780, 43, 7, 8, UNI_CJKCOMPAT } /* block=cjkcompat */, - { 32, 7630, 0, 9, 0, UNI_TALU } /* newtailue */, - { 3, 9768, 493, 4, 3, UNI_HAN } /* scx=han */, - { 4, 10340, 9861, 3, 3, UNI_VAI } /* isvaii */, - { 4, 10027, 7045, 3, 3, UNI_JG__FEH } /* jg=feh */, - { 1, 6710, 3583, 4, 15, UNI_UCAS } /* incanadiansyllabics */, - { 2, 4791, 6798, 4, 9, UNI_INMEDEFAIDRIN } /* inmedefaidrin */, - { 4, 9768, 8456, 4, 7, UNI_KNDA } /* scx=kannada */, - { 56, 1527, 0, 9, 0, UNI__PERL_SURROGATE } /* surrogate */, - { 1, 8780, 2855, 6, 12, UNI_MONGOLIANSUP } /* block=mongoliansup */, - { 0, 6807, 0, 11, 0, UNI_MISCSYMBOLS } /* miscsymbols */, - { 1, 9290, 3, 5, 1, -UNI_MATH } /* math=f */, - { 0, 8780, 1677, 6, 23, UNI_LATINEXTADDITIONAL } /* block=latinextendedadditional */, - { 7, 9071, 10135, 4, 3, UNI_XPOSIXXDIGIT } /* hex=yes */, - { 0, 5986, 9203, 13, 2, UNI_NV__34 } /* numericvalue=34 */, - { 2, 8780, 540, 7, 29, UNI_CJKEXTB } /* block=cjkunifiedideographsextensionb */, - { 0, 9038, 0, 4, 0, UNI_YEZI } /* yezi */, - { 33, 5284, 0, 14, 0, UNI_LISUSUP } /* lisusupplement */, - { 9, 4033, 4958, 16, 15, UNI_UPPERCASELETTER } 
/* generalcategory=uppercaseletter */, - { 0, 3836, 9808, 17, 4, UNI_TALU } /* scriptextensions=talu */, - { 8, 3836, 9860, 17, 3, UNI_VAI } /* scriptextensions=vai */, - { 5, 9768, 9008, 4, 6, UNI_THAA } /* scx=thaana */, - { 0, 8589, 7278, 7, 10, UNI_XPEO } /* script=oldpersian */, - { 0, 3836, 3169, 17, 8, UNI_ETHI } /* scriptextensions=ethiopic */, - { 9, 1828, 9255, 6, 5, -UNI_CASED } /* cased=false */, - { 0, 10030, 6994, 3, 11, UNI_JT__T } /* jt=transparent */, - { 0, 9768, 8421, 4, 4, UNI_ELYM } /* scx=elym */, - { 2, 9488, 2061, 4, 15, UNI_MODIFIERLETTERS } /* blk=modifierletters */, - { 1, 8589, 9464, 7, 4, UNI_ARMN } /* script=armn */, - { 7, 9488, 8372, 4, 7, UNI_CJKEXTD } /* blk=cjkextd */, - { 100, 8589, 8912, 7, 6, UNI_SC__KHOJ } /* script=khojki */, - { 0, 9488, 4449, 5, 4, UNI_INBAMUM } /* blk=bamum */, - { 57, 8780, 8659, 6, 7, UNI_INTIBETAN } /* block=tibetan */, - { 2, 9235, 9255, 5, 5, -UNI_CWCM } /* cwcm=false */, - { 0, 3904, 3, 17, 1, -UNI_UIDEO } /* unifiedideograph=f */, - { 0, 7188, 0, 4, 0, UNI_KHAR } /* khar */, - { 2, 8780, 2477, 6, 3, UNI_PUA } /* block=pua */, - { 32, 8780, 7248, 6, 10, UNI_MISCARROWS } /* block=miscarrows */, - { 138, 9270, 5523, 3, 13, UNI_PHONETICEXTSUP } /* inphoneticextsup */, - { 0, 4916, 4929, 3, 14, UNI_TAMILSUP } /* istamilsupplement */, - { 1, 3836, 9632, 17, 4, UNI_LINA } /* scriptextensions=lina */, - { 0, 8780, 0, 6, 0, UNI_blk_values_index } /* block= */, - { 68, 8589, 9002, 7, 4, UNI_SC__TELU } /* script=telu */, - { 22, 5578, 339, 14, 2, UNI_SB__LO } /* sentencebreak=lo */, - { 0, 2349, 0, 20, 0, UNI_PC } /* connectorpunctuation */, - { 1, 184, 5674, 2, 5, UNI_BIDIM } /* isbidim */, - { 24, 10024, 908, 3, 10, UNI_CO } /* gc=privateuse */, - { 64, 21, 2308, 2, 21, UNI_YIJING } /* inyijinghexagramsymbols */, - { 0, 3836, 7648, 17, 9, UNI_ITAL } /* scriptextensions=olditalic */, - { 0, 9508, 3007, 4, 18, UNI_CCC__216 } /* ccc=attachedaboveright */, - { 2, 9503, 0, 2, 0, UNI_MC } /* mc */, - { 8, 9277, 
5843, 3, 9, UNI_SC__MLYM } /* sc=malayalam */, - { 0, 9716, 1, 4, 1, -UNI_PCM } /* pcm=n */, - { 29, 9997, 2266, 3, 21, UNI_BC__PDI } /* bc=popdirectionalisolate */, - { 0, 10296, 10308, 7, 5, UNI_POSIXPRINT } /* isposixprint */, - { 32, 10027, 4193, 3, 16, UNI_JG__MANICHAEANLAMEDH } /* jg=manichaeanlamedh */, - { 138, 10333, 6886, 3, 3, UNI_SHAW } /* isshaw */, - { 0, 9488, 5074, 4, 14, UNI_CJKCOMPATFORMS } /* blk=cjkcompatforms */, - { 31, 3683, 0, 11, 0, UNI_ETHIOPICEXT } /* ethiopicext */, - { 17, 9768, 9740, 4, 4, UNI_QAAI } /* scx=qaai */, - { 3, 7218, 495, 10, 7, UNI_LB__NU } /* linebreak=numeric */, - { 6, 9540, 0, 4, 0, UNI_dia_values_index } /* dia= */, - { 0, 9070, 0, 5, 0, UNI_ahex_values_index } /* ahex= */, - { 0, 8780, 3633, 7, 16, UNI_CYRILLICEXTA } /* block=cyrillicextendeda */, - { 2, 4385, 0, 16, 0, UNI_TANGUTCOMPONENTS } /* tangutcomponents */, - { 50, 8780, 6098, 7, 11, UNI_CYRILLICEXTA } /* block=cyrillicexta */, - { 0, 9275, 4113, 5, 16, UNI_INSC__INVISIBLESTACKER } /* insc=invisiblestacker */, - { 0, 9488, 1344, 4, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* blk=symbolsforlegacycomputing */, - { 1, 4542, 1633, 4, 13, UNI_GEOMETRICSHAPES } /* ingeometricshapes */, - { 4, 9488, 6397, 4, 12, UNI_MATHALPHANUM } /* blk=mathalphanum */, - { 4, 9345, 0, 5, 0, UNI_xidc_values_index } /* xidc= */, - { 1, 3836, 9588, 17, 4, UNI_HMNG } /* scriptextensions=hmng */, - { 0, 7228, 9836, 10, 4, UNI_XPOSIXLOWER } /* lowercase=true */, - { 166, 10024, 400, 3, 6, UNI_CF } /* gc=format */, - { 2, 9488, 5158, 4, 14, UNI_INGREEK } /* blk=greekandcoptic */, - { 1, 838, 0, 29, 0, UNI_MISCARROWS } /* miscellaneoussymbolsandarrows */, - { 4, 8882, 3, 6, 1, -UNI_GREXT } /* grext=f */, - { 16, 2288, 4675, 4, 13, UNI_INHANGUL } /* inhangulsyllables */, - { 0, 9270, 2549, 5, 20, UNI_INPC__TOPANDBOTTOMANDRIGHT } /* inpc=topandbottomandright */, - { 0, 3921, 0, 16, 0, UNI_ARABICSUP } /* arabicsupplement */, - { 8, 21, 2308, 2, 6, UNI_YIJING } /* inyijing */, - { 0, 7495, 0, 9, 
0, UNI_ARABICPFA } /* arabicpfa */, - { 0, 184, 4340, 2, 13, UNI_MATHOPERATORS } /* ismathoperators */, - { 0, 9488, 5778, 4, 6, UNI_IPAEXT } /* blk=ipaext */, - { 0, 10027, 5620, 3, 10, UNI_JG__TEHMARBUTA } /* jg=tehmarbuta */, - { 0, 2182, 73, 21, 2, UNI_WB__EB } /* graphemeclusterbreak=em */, - { 0, 1979, 10169, 10, 1, UNI_CASEDLETTER } /* category=l& */, - { 0, 9528, 1, 4, 1, -UNI_CWU } /* cwu=n */, - { 0, 2760, 7720, 19, 9, UNI_GCB__V } /* hangulsyllabletype=voweljamo */, - { 5, 184, 10168, 2, 2, UNI_CASEDLETTER } /* isl& */, - { 182, 8365, 0, 7, 0, UNI_CJKEXTC } /* cjkextc */, - { 4, 9768, 2224, 4, 21, UNI_PRTI } /* scx=inscriptionalparthian */, - { 2, 9320, 0, 5, 0, UNI_OSGE } /* osage */, - { 144, 9020, 1025, 6, 2, -UNI_XPOSIXUPPER } /* upper=no */, - { 0, 9488, 1900, 4, 22, UNI_INDICNUMBERFORMS } /* blk=commonindicnumberforms */, - { 1, 5986, 8075, 13, 8, UNI_NV__7_SLASH_8 } /* numericvalue=8.75e-01 */, - { 0, 5116, 1025, 14, 2, -UNI_EMOD } /* emojimodifier=no */, - { 141, 9444, 10099, 4, 3, UNI_AGE__5_DOT_1 } /* age=v51 */, - { 0, 8688, 5719, 3, 4, UNI_XPOSIXALNUM } /* isalnum */, - { 12, 10333, 0, 7, 0, UNI_XPOSIXSPACE } /* isspace */, - { 2, 1631, 0, 23, 0, UNI_GEOMETRICSHAPESEXT } /* geometricshapesextended */, - { 1, 2288, 8188, 3, 7, UNI_INHIRAGANA } /* inhiragana */, - { 3, 9230, 10135, 5, 3, UNI_CWCF } /* cwcf=yes */, - { 9, 9508, 9931, 4, 3, UNI_CCC__L } /* ccc=224 */, - { 8, 9768, 9245, 4, 4, UNI_DOGR } /* scx=dogr */, - { 1, 6420, 7649, 3, 8, UNI_INOLDITALIC } /* inolditalic */, - { 0, 9768, 6973, 5, 3, UNI_SYLO } /* scx=sylo */, - { 37, 5578, 69, 14, 2, UNI_SB__UP } /* sentencebreak=up */, - { 2, 2280, 7290, 4, 8, UNI_SOGO } /* isoldsogdian */, - { 0, 5116, 9836, 14, 4, UNI_EMOD } /* emojimodifier=true */, - { 0, 9277, 6409, 3, 4, UNI_MEND } /* sc=mend */, - { 113, 10333, 2913, 3, 8, UNI_SUND } /* issundanese */, - { 2, 3836, 7675, 17, 4, UNI_PALM } /* scriptextensions=palm */, - { 34, 8589, 9548, 7, 4, UNI_DSRT } /* script=dsrt */, - { 10, 
9768, 7118, 4, 10, UNI_CHRS } /* scx=chorasmian */, - { 0, 9997, 3374, 3, 10, UNI_BC__WS } /* bc=whitespace */, - { 1, 8852, 1025, 6, 2, -UNI_CWKCF } /* cwkcf=no */, - { 7, 2477, 0, 3, 0, UNI_PUA } /* pua */, - { 1, 184, 809, 2, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* isenclosedideographicsup */, - { 0, 1417, 8, 24, 1, UNI_CCC__A } /* canonicalcombiningclass=a */, - { 46, 5466, 26, 14, 1, UNI_NFDQC__Y } /* nfdquickcheck=y */, - { 0, 2182, 24, 21, 1, UNI_GCB__L } /* graphemeclusterbreak=l */, - { 5, 9275, 1244, 5, 9, UNI_INSC__CONSONANT } /* insc=consonant */, - { 1, 10048, 8732, 3, 5, UNI_NV__50000 } /* nv=50000 */, - { 0, 10024, 10176, 3, 2, UNI_ZL } /* gc=zl */, - { 5, 9488, 4883, 4, 15, UNI_SARB } /* blk=oldsoutharabian */, - { 43, 184, 5270, 2, 14, UNI_LATINEXTE } /* islatinextendede */, - { 0, 10063, 26, 3, 1, UNI_SD } /* sd=y */, - { 0, 5791, 5918, 13, 3, UNI_JG__TAW } /* joininggroup=taw */, - { 10, 3385, 3, 18, 1, -UNI_RI } /* regionalindicator=f */, - { 2, 9488, 7594, 4, 9, UNI_LATINEXTD } /* blk=latinextd */, - { 0, 3836, 1900, 17, 6, UNI_ZYYY } /* scriptextensions=common */, - { 0, 10033, 10158, 3, 2, UNI_LB__H2 } /* lb=h2 */, - { 144, 9768, 7359, 5, 3, UNI_SAUR } /* scx=saur */, - { 1, 10048, 7859, 3, 6, UNI_NV__200000 } /* nv=200000 */, - { 0, 5986, 7923, 13, 8, UNI_NV__2_SLASH_5 } /* numericvalue=4.00e-01 */, - { 32, 184, 2141, 3, 10, UNI_CYRILLICSUP } /* iscyrillicsup */, - { 0, 4916, 3458, 3, 17, UNI_TAIXUANJING } /* istaixuanjingsymbols */, - { 4, 8780, 2141, 7, 17, UNI_CYRILLICSUP } /* block=cyrillicsupplement */, - { 7, 8780, 4448, 6, 5, UNI_INBAMUM } /* block=bamum */, - { 1, 8091, 0, 8, 0, UNI_ARMN } /* armenian */, - { 32, 184, 0, 3, 0, UNI_C } /* isc */, - { 0, 184, 8115, 2, 4, UNI_BASS } /* isbass */, - { 3, 184, 4583, 2, 4, UNI_DASH } /* isdash */, - { 1, 9488, 4401, 4, 16, UNI_TANGUTSUP } /* blk=tangutsupplement */, - { 1, 8780, 4257, 6, 16, UNI_MISCMATHSYMBOLSB } /* block=miscmathsymbolsb */, - { 2, 9015, 1, 5, 1, -UNI_IDEO } /* ideo=n */, - 
{ 0, 184, 1677, 2, 5, UNI_LATN } /* islatin */, - { 12, 10288, 3379, 8, 5, UNI_XPOSIXSPACE } /* isxposixspace */, - { 89, 9488, 3439, 4, 18, UNI_SMALLKANAEXT } /* blk=smallkanaextension */, - { 1, 2569, 0, 20, 0, UNI_vo_values_index } /* verticalorientation= */, - { 0, 10024, 2268, 3, 2, UNI_PD } /* gc=pd */, - { 30, 9488, 5256, 4, 14, UNI_LATINEXTD } /* blk=latinextendedd */, - { 0, 8780, 567, 6, 2, UNI_NB } /* block=nb */, - { 4, 10048, 7859, 3, 2, UNI_NV__20 } /* nv=20 */, - { 0, 9444, 10123, 4, 3, UNI_AGE__9 } /* age=v90 */, - { 0, 1417, 8811, 25, 5, UNI_CCC__122 } /* canonicalcombiningclass=ccc122 */, - { 0, 9488, 7291, 4, 7, UNI_INSOGDIAN } /* blk=sogdian */, - { 36, 10003, 1, 3, 1, -UNI_CI } /* ci=n */, - { 1, 9277, 2817, 3, 4, UNI_MERO } /* sc=mero */, - { 0, 10030, 6529, 3, 12, UNI_JT__R } /* jt=rightjoining */, - { 2, 3836, 9325, 17, 5, UNI_RUNR } /* scriptextensions=runic */, - { 0, 7058, 0, 10, 0, UNI_ARABICEXTA } /* arabicexta */, - { 0, 3836, 8786, 17, 6, UNI_CARI } /* scriptextensions=carian */, - { 8, 4658, 1, 15, 1, -UNI_GREXT } /* graphemeextend=n */, - { 6, 9768, 1900, 4, 6, UNI_ZYYY } /* scx=common */, - { 25, 9488, 2817, 4, 19, UNI_MERO } /* blk=meroitichieroglyphs */, - { 0, 21, 5214, 2, 6, UNI_KANGXI } /* inkangxi */, - { 65, 9488, 8990, 4, 6, UNI_INREJANG } /* blk=rejang */, - { 0, 7318, 9955, 10, 3, UNI_IN__3_DOT_2 } /* presentin=3.2 */, - { 0, 7325, 9388, 3, 4, UNI_IN__11 } /* in=11.0 */, - { 1, 5791, 4193, 13, 16, UNI_JG__MANICHAEANLAMEDH } /* joininggroup=manichaeanlamedh */, - { 3, 10027, 3785, 3, 17, UNI_JG__MANICHAEANDHAMEDH } /* jg=manichaeandhamedh */, - { 2, 2855, 0, 19, 0, UNI_MONGOLIANSUP } /* mongoliansupplement */, - { 0, 749, 0, 30, 0, UNI_ENCLOSEDALPHANUMSUP } /* enclosedalphanumericsupplement */, - { 0, 8780, 6012, 6, 13, UNI_VERTICALFORMS } /* block=verticalforms */, - { 1, 7325, 7765, 3, 1, UNI_IN__2 } /* in=2 */, - { 2, 9488, 6097, 4, 12, UNI_CYRILLICEXTA } /* blk=cyrillicexta */, - { 2, 8589, 0, 7, 0, UNI_sc_values_index 
} /* script= */, - { 3, 446, 0, 18, 0, UNI_IDEOGRAPHICSYMBOLS } /* ideographicsymbols */, - { 0, 5986, 9208, 13, 2, UNI_NV__35 } /* numericvalue=35 */, - { 0, 9277, 2203, 3, 4, UNI_SC__HAN } /* sc=hani */, - { 10, 9277, 2409, 3, 10, UNI_SC__GLAG } /* sc=glagolitic */, - { 2, 8984, 9836, 6, 4, UNI_QMARK } /* qmark=true */, - { 3, 5452, 9295, 14, 5, UNI_NFCQC__M } /* nfcquickcheck=maybe */, - { 0, 9508, 9218, 4, 2, UNI_CCC__84 } /* ccc=84 */, - { 1, 5791, 5312, 13, 14, UNI_JG__MANICHAEANAYIN } /* joininggroup=manichaeanayin */, - { 3, 184, 3683, 2, 17, UNI_ETHIOPICEXTA } /* isethiopicextendeda */, - { 2, 10027, 7055, 3, 3, UNI_JG__QAF } /* jg=qaf */, - { 0, 2076, 0, 22, 0, UNI_TRANSPORTANDMAP } /* transportandmapsymbols */, - { 2, 21, 8900, 2, 6, UNI_INKAITHI } /* inkaithi */, - { 0, 8882, 0, 5, 0, UNI_GREXT } /* grext */, - { 24, 9488, 1393, 4, 24, UNI_ARABICPFB } /* blk=arabicpresentationformsb */, - { 64, 1552, 4583, 9, 15, UNI_PD } /* category=dashpunctuation */, - { 0, 7438, 7730, 11, 8, UNI_WB__WSEGSPACE } /* wordbreak=wsegspace */, - { 0, 9768, 9864, 4, 4, UNI_WCHO } /* scx=wcho */, - { 1, 10024, 10178, 3, 2, UNI_ZP } /* gc=zp */, - { 0, 10027, 6361, 3, 12, UNI_JG__MALAYALAMTTA } /* jg=malayalamtta */, - { 40, 5986, 9408, 13, 4, UNI_NV__15_SLASH_2 } /* numericvalue=15/2 */, - { 5, 5791, 5410, 13, 14, UNI_JG__MANICHAEANTETH } /* joininggroup=manichaeanteth */, - { 13, 7088, 6493, 10, 12, UNI_BC__ON } /* bidiclass=otherneutral */, - { 32, 8780, 1060, 7, 5, UNI_INCOPTIC } /* block=coptic */, - { 32, 9488, 5186, 4, 14, UNI_HIGHSURROGATES } /* blk=highsurrogates */, - { 8, 9768, 7648, 4, 9, UNI_ITAL } /* scx=olditalic */, - { 37, 3529, 0, 18, 0, UNI_vs_values_index } /* variationselector= */, - { 3, 8624, 0, 7, 0, UNI_SUPPUAA } /* suppuaa */, - { 0, 1188, 2077, 3, 14, UNI_TRANSPORTANDMAP } /* intransportandmap */, - { 97, 9488, 4449, 5, 7, UNI_BAMUMSUP } /* blk=bamumsup */, - { 1, 184, 8344, 2, 4, UNI_BENG } /* isbeng */, - { 1, 1417, 9934, 24, 3, UNI_CCC__R } /* 
canonicalcombiningclass=226 */, - { 6, 9768, 9816, 4, 4, UNI_TAVT } /* scx=tavt */, - { 82, 7738, 1, 9, 1, -UNI_XIDS } /* xidstart=n */, - { 2, 8123, 0, 4, 0, UNI_BUGI } /* bugi */, - { 166, 4257, 0, 16, 0, UNI_MISCMATHSYMBOLSB } /* miscmathsymbolsb */, - { 56, 5986, 9416, 13, 4, UNI_NV__3_SLASH_16 } /* numericvalue=3/16 */, - { 0, 9768, 8924, 4, 6, UNI_LEPC } /* scx=lepcha */, - { 33, 8966, 0, 6, 0, UNI_nfdqc_values_index } /* nfdqc= */, - { 0, 1087, 9255, 27, 5, -UNI_PCM } /* prependedconcatenationmark=false */, - { 0, 8780, 3169, 6, 8, UNI_INETHIOPIC } /* block=ethiopic */, - { 0, 184, 5256, 2, 14, UNI_LATINEXTD } /* islatinextendedd */, - { 0, 8589, 8115, 7, 4, UNI_BASS } /* script=bass */, - { 0, 7155, 1655, 3, 22, UNI_COMPATJAMO } /* ishangulcompatibilityjamo */, - { 0, 8780, 3650, 7, 16, UNI_CYRILLICEXTB } /* block=cyrillicextendedb */, - { 53, 9997, 5494, 3, 14, UNI_BC__NSM } /* bc=nonspacingmark */, - { 0, 5791, 5396, 13, 14, UNI_JG__MANICHAEANRESH } /* joininggroup=manichaeanresh */, - { 2, 9556, 18, 4, 2, UNI_RI } /* gcb=ri */, - { 2, 8780, 6110, 7, 11, UNI_CYRILLICEXTB } /* block=cyrillicextb */, - { 3, 9488, 3079, 4, 6, UNI_INCOPTIC } /* blk=coptic */, - { 8, 7155, 6485, 3, 3, UNI_HUNG } /* ishung */, - { 0, 5791, 5882, 13, 13, UNI_JG__MANICHAEANNUN } /* joininggroup=manichaeannun */, - { 1, 5791, 7038, 13, 10, UNI_JG__AFRICANFEH } /* joininggroup=africanfeh */, - { 2, 4628, 1, 15, 1, UNI_EA__N } /* eastasianwidth=n */, - { 1, 9768, 3169, 4, 8, UNI_ETHI } /* scx=ethiopic */, - { 1, 8780, 7504, 6, 9, UNI_ARABICPFB } /* block=arabicpfb */, - { 0, 10033, 10162, 3, 2, UNI_GCB__L } /* lb=jl */, - { 0, 9277, 9764, 3, 4, UNI_SARB } /* sc=sarb */, - { 3, 21, 5284, 2, 4, UNI_INLISU } /* inlisu */, - { 0, 8780, 9452, 6, 4, UNI_INAHOM } /* block=ahom */, - { 0, 3097, 8163, 18, 3, UNI_DT__FRA } /* decompositiontype=fra */, - { 1, 9260, 10135, 5, 3, UNI_IDSB } /* idsb=yes */, - { 3, 9262, 112, 3, 2, UNI_SB__SC } /* sb=sc */, - { 6, 9768, 3937, 4, 4, UNI_BOPO } /* 
scx=bopo */, - { 3, 3382, 0, 3, 0, UNI_ce_values_index } /* ce= */, - { 0, 5986, 5648, 13, 3, UNI_NV__100 } /* numericvalue=100 */, - { 1, 7438, 138, 10, 2, UNI_WB__FO } /* wordbreak=fo */, - { 214, 8882, 9255, 6, 5, -UNI_GREXT } /* grext=false */, - { 1, 9351, 3, 4, 1, -UNI_IDS } /* ids=f */, - { 0, 1273, 1, 21, 1, -UNI_CE } /* compositionexclusion=n */, - { 1, 9277, 9788, 3, 4, UNI_SC__SHRD } /* sc=shrd */, - { 1, 9488, 4161, 4, 16, UNI_LINEARBSYLLABARY } /* blk=linearbsyllabary */, - { 0, 21, 8456, 2, 7, UNI_INKANNADA } /* inkannada */, - { 0, 8589, 6181, 7, 12, UNI_SC__GONG } /* script=gunjalagondi */, - { 16, 8358, 0, 7, 0, UNI_CJKEXTB } /* cjkextb */, - { 1, 9262, 125, 3, 2, UNI_LB__CR } /* sb=cr */, - { 1, 10027, 5882, 3, 13, UNI_JG__MANICHAEANNUN } /* jg=manichaeannun */, - { 2, 8589, 9564, 7, 4, UNI_SC__GONM } /* script=gonm */, - { 0, 9768, 9095, 4, 5, UNI_BUHD } /* scx=buhid */, - { 0, 9444, 10096, 4, 3, UNI_AGE__5 } /* age=v50 */, - { 2, 1188, 4929, 3, 7, UNI_TAMILSUP } /* intamilsup */, - { 8, 7218, 202, 10, 2, UNI_LB__SA } /* linebreak=sa */, - { 33, 9277, 7358, 3, 10, UNI_SAUR } /* sc=saurashtra */, - { 0, 7218, 988, 10, 2, UNI_LB__CP } /* linebreak=cp */, - { 1, 7088, 2489, 10, 20, UNI_BC__PDF } /* bidiclass=popdirectionalformat */, - { 5, 10027, 5179, 3, 7, UNI_JG__HEHGOAL } /* jg=hehgoal */, - { 8, 10024, 2349, 3, 20, UNI_PC } /* gc=connectorpunctuation */, - { 9, 1966, 3061, 22, 18, UNI_INSC__CONSONANTSUBJOINED } /* indicsyllabiccategory=consonantsubjoined */, - { 48, 7325, 9396, 3, 4, UNI_IN__12_DOT_1 } /* in=12.1 */, - { 0, 7438, 34, 10, 2, UNI_WB__EX } /* wordbreak=ex */, - { 24, 10012, 3, 3, 1, UNI_EA__F } /* ea=f */, - { 1, 4033, 5040, 16, 5, UNI_XPOSIXDIGIT } /* generalcategory=digit */, - { 2, 10333, 8632, 3, 6, UNI_SUPPUAB } /* issuppuab */, - { 105, 9768, 9684, 4, 4, UNI_NEWA } /* scx=newa */, - { 32, 1166, 1025, 26, 2, -UNI_DI } /* defaultignorablecodepoint=no */, - { 3, 9488, 7128, 4, 10, UNI_CJKSTROKES } /* blk=cjkstrokes */, - { 0, 
5791, 4773, 13, 5, UNI_JG__SADHE } /* joininggroup=sadhe */, - { 14, 4033, 467, 16, 11, UNI_P } /* generalcategory=punctuation */, - { 0, 8780, 8291, 6, 8, UNI_INTAGBANWA } /* block=tagbanwa */, - { 1, 6553, 0, 4, 0, UNI_XIDC } /* xidc */, - { 10, 8435, 26, 7, 1, UNI_GRBASE } /* grbase=y */, - { 16, 9488, 809, 4, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* blk=enclosedideographicsup */, - { 36, 6805, 4245, 6, 12, UNI_MISCMATHSYMBOLSA } /* inmiscmathsymbolsa */, - { 137, 184, 5752, 2, 8, UNI_GREEKEXT } /* isgreekext */, - { 3, 7088, 2266, 10, 21, UNI_BC__PDI } /* bidiclass=popdirectionalisolate */, - { 67, 9270, 2455, 5, 5, UNI_INPC__RIGHT } /* inpc=right */, - { 0, 1417, 7078, 24, 10, UNI_CCC__BR } /* canonicalcombiningclass=belowright */, - { 4, 4916, 4929, 3, 4, UNI_TAML } /* istamil */, - { 65, 7088, 2509, 10, 20, UNI_BC__RLE } /* bidiclass=righttoleftembedding */, - { 0, 9768, 8421, 4, 7, UNI_ELYM } /* scx=elymaic */, - { 9, 8694, 9836, 7, 4, UNI_XPOSIXSPACE } /* wspace=true */, - { 0, 3836, 7359, 18, 9, UNI_SAUR } /* scriptextensions=saurashtra */, - { 4, 7076, 8124, 3, 7, UNI_INBUGINESE } /* inbuginese */, - { 0, 1966, 5102, 22, 14, UNI_INSC__CONSONANTFINAL } /* indicsyllabiccategory=consonantfinal */, - { 4, 9768, 8131, 4, 4, UNI_DUPL } /* scx=dupl */, - { 0, 8780, 1006, 6, 17, UNI_ANCIENTGREEKMUSIC } /* block=ancientgreekmusic */, - { 1, 9488, 8291, 4, 8, UNI_INTAGBANWA } /* blk=tagbanwa */, - { 3, 184, 4129, 2, 16, UNI_LATIN1 } /* islatin1supplement */, - { 0, 9265, 9836, 5, 4, UNI_IDST } /* idst=true */, - { 42, 9488, 5171, 4, 4, UNI_INCHAM } /* blk=cham */, - { 3, 9488, 2287, 4, 21, UNI_SINHALAARCHAICNUMBERS } /* blk=sinhalaarchaicnumbers */, - { 1, 9488, 7585, 4, 9, UNI_LATINEXTC } /* blk=latinextc */, - { 0, 9488, 328, 4, 21, UNI_MATHOPERATORS } /* blk=mathematicaloperators */, - { 0, 4628, 9868, 15, 4, UNI_EA__W } /* eastasianwidth=wide */, - { 57, 10333, 2288, 3, 6, UNI_SINH } /* issinhala */, - { 0, 4033, 3358, 16, 9, UNI_Z } /* generalcategory=separator 
*/, - { 12, 5791, 6323, 13, 5, UNI_JG__GAMAL } /* joininggroup=gamal */, - { 0, 9488, 5003, 4, 15, UNI_INZANABAZARSQUARE } /* blk=zanabazarsquare */, - { 2, 9345, 3, 5, 1, -UNI_XIDC } /* xidc=f */, - { 16, 3836, 9880, 17, 4, UNI_YI } /* scriptextensions=yiii */, - { 260, 3836, 8666, 17, 7, UNI_TIRH } /* scriptextensions=tirhuta */, - { 0, 5791, 8155, 13, 8, UNI_JG__FARSIYEH } /* joininggroup=farsiyeh */, - { 0, 8780, 4241, 6, 16, UNI_MISCMATHSYMBOLSA } /* block=miscmathsymbolsa */, - { 3, 10009, 5904, 3, 4, UNI_DT__NONE } /* dt=none */, - { 275, 184, 8352, 3, 6, UNI_CJKEXTA } /* iscjkexta */, - { 0, 9277, 6884, 3, 11, UNI_HMNG } /* sc=pahawhhmong */, - { 19, 10033, 5046, 3, 14, UNI_LB__CR } /* lb=carriagereturn */, - { 2, 2224, 1562, 3, 23, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* insupsymbolsandpictographs */, - { 5, 9488, 42, 4, 26, UNI_CJKCOMPATIDEOGRAPHS } /* blk=cjkcompatibilityideographs */, - { 93, 7088, 23, 10, 2, UNI_BC__AL } /* bidiclass=al */, - { 9, 8780, 5270, 6, 14, UNI_LATINEXTE } /* block=latinextendede */, - { 1, 9488, 7168, 4, 10, UNI_INDIVESAKURU } /* blk=divesakuru */, - { 2, 184, 4017, 2, 16, UNI_PF } /* isfinalpunctuation */, - { 2, 5986, 8067, 13, 8, UNI_NV__17_SLASH_2 } /* numericvalue=8.50e+00 */, - { 0, 8780, 8484, 6, 7, UNI_INMANDAIC } /* block=mandaic */, - { 6, 8780, 3421, 6, 4, UNI_RUMI } /* block=rumi */, - { 0, 10027, 5326, 3, 14, UNI_JG__MANICHAEANBETH } /* jg=manichaeanbeth */, - { 0, 3836, 78, 17, 4, UNI_ARAB } /* scriptextensions=arab */, - { 5, 3836, 8645, 17, 7, UNI_LANA } /* scriptextensions=taitham */, - { 1, 9277, 8477, 3, 4, UNI_MAKA } /* sc=maka */, - { 1, 1537, 7298, 24, 10, UNI_INPC__OVERSTRUCK } /* indicpositionalcategory=overstruck */, - { 1, 9488, 9800, 4, 4, UNI_TAGS } /* blk=tags */, - { 0, 5606, 0, 14, 0, UNI_SUPPUNCTUATION } /* suppunctuation */, - { 0, 6554, 0, 3, 0, UNI_IDC } /* idc */, - { 86, 3836, 5284, 17, 4, UNI_LISU } /* scriptextensions=lisu */, - { 1, 9488, 3887, 4, 17, UNI_SUTTONSIGNWRITING } /* 
blk=suttonsignwriting */, - { 0, 8435, 10135, 7, 3, UNI_GRBASE } /* grbase=yes */, - { 0, 184, 4002, 3, 6, UNI_CPRT } /* iscypriot */, - { 0, 10033, 9557, 3, 2, UNI_LB__CB } /* lb=cb */, - { 0, 8780, 2141, 7, 10, UNI_CYRILLICSUP } /* block=cyrillicsup */, - { 1, 3836, 78, 17, 6, UNI_ARAB } /* scriptextensions=arabic */, - { 13, 184, 9608, 2, 4, UNI_KITS } /* iskits */, - { 137, 184, 7540, 2, 8, UNI_EXT } /* isextender */, - { 1, 7325, 7782, 3, 1, UNI_IN__3 } /* in=3 */, - { 36, 2308, 0, 21, 0, UNI_YIJING } /* yijinghexagramsymbols */, - { 0, 5986, 8010, 13, 2, UNI_NV__36 } /* numericvalue=36 */, - { 1, 5578, 1089, 15, 2, UNI_SB__SE } /* sentencebreak=sep */, - { 3, 9668, 0, 4, 0, UNI_MTEI } /* mtei */, - { 2, 3379, 9836, 6, 4, UNI_XPOSIXSPACE } /* space=true */, - { 0, 6061, 9255, 12, 5, -UNI_BIDIC } /* bidicontrol=false */, - { 0, 6609, 0, 10, 0, UNI_DEP } /* deprecated */, - { 2, 10048, 7947, 3, 8, UNI_NV__3_SLASH_64 } /* nv=4.69e-02 */, - { 3, 4643, 9255, 15, 5, -UNI_ECOMP } /* emojicomponent=false */, - { 64, 8780, 8631, 6, 7, UNI_SUPPUAB } /* block=suppuab */, - { 3, 184, 8498, 2, 4, UNI_MULT } /* ismult */, - { 1, 9644, 0, 4, 0, UNI_MEDF } /* medf */, - { 0, 10048, 9416, 3, 4, UNI_NV__3_SLASH_16 } /* nv=3/16 */, - { 1, 9265, 1025, 5, 2, -UNI_IDST } /* idst=no */, - { 0, 1006, 0, 27, 0, UNI_ANCIENTGREEKMUSIC } /* ancientgreekmusicalnotation */, - { 1, 8589, 9672, 7, 4, UNI_SC__MYMR } /* script=mymr */, - { 1, 21, 3751, 2, 17, UNI_INKHITANSMALLSCRIPT } /* inkhitansmallscript */, - { 0, 4116, 415, 3, 31, UNI_INIDC } /* isideographicdescriptioncharacters */, - { 3, 10024, 10180, 3, 2, UNI_ZS } /* gc=zs */, - { 1, 10033, 340, 3, 2, UNI_LB__OP } /* lb=op */, - { 5, 9488, 749, 4, 30, UNI_ENCLOSEDALPHANUMSUP } /* blk=enclosedalphanumericsupplement */, - { 14, 184, 1184, 2, 3, UNI_DEP } /* isdep */, - { 2, 6231, 2667, 4, 17, UNI_COUNTINGROD } /* incountingrodnumerals */, - { 0, 8780, 8526, 6, 7, UNI_NB } /* block=noblock */, - { 79, 7438, 7612, 10, 6, UNI_WB__MN } /* 
wordbreak=midnum */, - { 136, 5986, 7955, 13, 8, UNI_NV__1_SLASH_20 } /* numericvalue=5.00e-02 */, - { 5, 184, 2161, 2, 20, UNI_EXTPICT } /* isextendedpictographic */, - { 3, 2280, 1759, 4, 2, UNI_OLCK } /* isolck */, - { 0, 184, 1115, 3, 24, UNI_CWKCF } /* ischangeswhennfkccasefolded */, - { 2, 9071, 9255, 4, 5, -UNI_XPOSIXXDIGIT } /* hex=false */, - { 0, 184, 1044, 2, 6, UNI_L } /* isletter */, - { 0, 9768, 3785, 4, 10, UNI_MANI } /* scx=manichaean */, - { 4, 3836, 6484, 17, 4, UNI_HUNG } /* scriptextensions=hung */, - { 0, 9488, 979, 4, 27, UNI_ALPHABETICPF } /* blk=alphabeticpresentationforms */, - { 4, 5791, 9884, 13, 4, UNI_JG__ZAIN } /* joininggroup=zain */, - { 31, 8780, 7239, 6, 2, UNI_INVS } /* block=vs */, - { 72, 9997, 4493, 3, 15, UNI_BC__CS } /* bc=commonseparator */, - { 2, 1768, 9836, 22, 4, UNI_CWCF } /* changeswhencasefolded=true */, - { 0, 7318, 0, 10, 0, UNI_in_values_index } /* presentin= */, - { 13, 10024, 4017, 3, 16, UNI_PF } /* gc=finalpunctuation */, - { 2, 10048, 9360, 3, 4, UNI_NV___MINUS_1_SLASH_2 } /* nv=-1/2 */, - { 0, 4241, 0, 16, 0, UNI_MISCMATHSYMBOLSA } /* miscmathsymbolsa */, - { 0, 10048, 8726, 3, 6, UNI_NV__432000 } /* nv=432000 */, - { 0, 3836, 9688, 17, 3, UNI_NKO } /* scriptextensions=nko */, - { 1, 8780, 6122, 7, 11, UNI_CYRILLICEXTC } /* block=cyrillicextc */, - { 4, 8780, 2061, 6, 15, UNI_MODIFIERLETTERS } /* block=modifierletters */, - { 0, 8780, 8123, 6, 8, UNI_INBUGINESE } /* block=buginese */, - { 3, 8780, 3667, 7, 16, UNI_CYRILLICEXTC } /* block=cyrillicextendedc */, - { 137, 414, 0, 32, 0, UNI_INIDC } /* ideographicdescriptioncharacters */, - { 290, 9488, 7288, 4, 10, UNI_INOLDSOGDIAN } /* blk=oldsogdian */, - { 0, 9786, 8598, 4, 5, UNI_SC__SHRD } /* insharada */, - { 0, 9768, 8463, 4, 7, UNI_KALI } /* scx=kayahli */, - { 0, 1188, 4402, 3, 8, UNI_TANGUTSUP } /* intangutsup */, - { 0, 184, 867, 2, 11, UNI_PHONETICEXT } /* isphoneticext */, - { 4, 10296, 7207, 3, 3, UNI_PHLI } /* isphli */, - { 11, 9508, 9928, 4, 3, 
UNI_CCC__BR } /* ccc=222 */, - { 8, 3367, 0, 17, 0, UNI__PERL_PATWS } /* patternwhitespace */, - { 1, 5986, 7859, 13, 8, UNI_NV__20000000 } /* numericvalue=20000000 */, - { 0, 728, 0, 6, 0, UNI_N } /* number */, - { 1, 10048, 7779, 3, 8, UNI_NV__1_SLASH_7 } /* nv=1.43e-01 */, - { 1, 1166, 1, 26, 1, -UNI_DI } /* defaultignorablecodepoint=n */, - { 9, 9752, 0, 4, 0, UNI_ROHG } /* rohg */, - { 0, 1966, 3615, 22, 17, UNI_INSC__CONSONANTPREFIXED } /* indicsyllabiccategory=consonantprefixed */, - { 6, 8780, 7388, 6, 10, UNI_SUPARROWSB } /* block=suparrowsb */, - { 2, 1966, 2369, 22, 20, UNI_INSC__CONSONANTPLACEHOLDER } /* indicsyllabiccategory=consonantplaceholder */, - { 0, 5986, 7859, 13, 4, UNI_NV__2000 } /* numericvalue=2000 */, - { 4, 4129, 0, 6, 0, UNI_LATIN1 } /* latin1 */, - { 4, 10033, 3, 4, 1, UNI_LB__LF } /* lb=lf */, - { 5, 9275, 3953, 5, 16, UNI_INSC__CANTILLATIONMARK } /* insc=cantillationmark */, - { 36, 4033, 206, 16, 2, UNI_PI } /* generalcategory=pi */, - { 7, 9572, 0, 4, 0, UNI_GUJR } /* gujr */, - { 1, 6961, 0, 11, 0, UNI_SUPERANDSUB } /* superandsub */, - { 5, 9488, 509, 4, 20, UNI_CJK } /* blk=cjkunifiedideographs */, - { 0, 1294, 0, 25, 0, UNI_SUPERANDSUB } /* superscriptsandsubscripts */, - { 76, 9277, 8659, 3, 7, UNI_TIBT } /* sc=tibetan */, - { 1, 7249, 6600, 4, 9, UNI_CASEDLETTER } /* iscasedletter */, - { 0, 4033, 3985, 16, 16, UNI_PE } /* generalcategory=closepunctuation */, - { 0, 9270, 3475, 5, 10, UNI_INPC__TOPANDLEFT } /* inpc=topandleft */, - { 1, 3836, 8115, 17, 4, UNI_BASS } /* scriptextensions=bass */, - { 2, 8780, 7027, 6, 11, UNI_YISYLLABLES } /* block=yisyllables */, - { 1, 9351, 9836, 4, 4, UNI_IDS } /* ids=true */, - { 0, 8379, 0, 7, 0, UNI_CJKEXTE } /* cjkexte */, - { 0, 8780, 4129, 6, 16, UNI_LATIN1 } /* block=latin1supplement */, - { 43, 9277, 9876, 3, 4, UNI_XSUX } /* sc=xsux */, - { 0, 10030, 7, 3, 1, UNI_JT__C } /* jt=c */, - { 0, 5986, 7874, 13, 2, UNI_NV__23 } /* numericvalue=23 */, - { 0, 9488, 6620, 4, 6, UNI_DOMINO } 
/* blk=domino */, - { 8, 9508, 8568, 4, 7, UNI_CCC__1 } /* ccc=overlay */, - { 3, 184, 7388, 2, 10, UNI_SUPARROWSB } /* issuparrowsb */, - { 0, 3836, 8597, 18, 6, UNI_SHRD } /* scriptextensions=sharada */, - { 39, 9488, 3751, 4, 17, UNI_INKHITANSMALLSCRIPT } /* blk=khitansmallscript */, - { 0, 9488, 7576, 4, 9, UNI_LATINEXTB } /* blk=latinextb */, - { 31, 8589, 7694, 8, 8, UNI_SAMR } /* script=samaritan */, - { 82, 9997, 2449, 3, 20, UNI_BC__LRE } /* bc=lefttorightembedding */, - { 1, 9768, 1677, 4, 5, UNI_LATN } /* scx=latin */, - { 32, 1537, 4615, 4, 13, UNI_DIACRITICALSSUP } /* indiacriticalssup */, - { 0, 4116, 2225, 3, 20, UNI_PRTI } /* isinscriptionalparthian */, - { 2, 5037, 0, 9, 0, UNI_hex_values_index } /* hexdigit= */, - { 0, 1966, 9300, 22, 5, UNI_INSC__NUKTA } /* indicsyllabiccategory=nukta */, - { 1, 6710, 3601, 5, 14, UNI_INCAUCASIANALBANIAN } /* incaucasianalbanian */, - { 26, 7155, 5585, 3, 3, UNI_HEBR } /* ishebr */, - { 0, 7325, 9967, 3, 3, UNI_IN__5_DOT_1 } /* in=5.1 */, - { 65, 1746, 0, 23, 0, UNI_BPT__C } /* bidipairedbrackettype=c */, - { 0, 10003, 1025, 3, 2, -UNI_CI } /* ci=no */, - { 74, 4033, 598, 16, 2, UNI_XPOSIXCNTRL } /* generalcategory=cc */, - { 0, 184, 9085, 2, 5, UNI_BATK } /* isbatak */, - { 1, 9488, 4613, 4, 15, UNI_DIACRITICALSSUP } /* blk=diacriticalssup */, - { 0, 9488, 2140, 4, 8, UNI_INCYRILLIC } /* blk=cyrillic */, - { 1, 3379, 9255, 6, 5, -UNI_XPOSIXSPACE } /* space=false */, - { 1, 3836, 6481, 17, 12, UNI_HUNG } /* scriptextensions=oldhungarian */, - { 2, 8780, 1192, 6, 26, UNI_HALFANDFULLFORMS } /* block=halfwidthandfullwidthforms */, - { 0, 1189, 5040, 3, 5, UNI_NT__DI } /* nt=digit */, - { 55, 3836, 3079, 17, 6, UNI_COPT } /* scriptextensions=coptic */, - { 16, 184, 5438, 2, 14, UNI_SK } /* ismodifiersymbol */, - { 0, 10183, 3379, 4, 5, UNI_POSIXSPACE } /* perlspace */, - { 2, 5986, 9413, 13, 3, UNI_NV__7_SLASH_2 } /* numericvalue=7/2 */, - { 3, 3133, 10135, 18, 3, UNI_EBASE } /* emojimodifierbase=yes */, - { 2, 
10027, 7038, 3, 10, UNI_JG__AFRICANFEH } /* jg=africanfeh */, - { 1, 8858, 1, 6, 1, -UNI_ECOMP } /* ecomp=n */, - { 0, 9488, 1673, 4, 4, UNI_JAMO } /* blk=jamo */, - { 0, 5578, 125, 14, 2, UNI_LB__CR } /* sentencebreak=cr */, - { 3, 3382, 9836, 3, 4, UNI_CE } /* ce=true */, - { 0, 3836, 9668, 17, 4, UNI_MTEI } /* scriptextensions=mtei */, - { 2, 8978, 0, 6, 0, UNI_patws_values_index } /* patws= */, - { 0, 9768, 7675, 4, 4, UNI_PALM } /* scx=palm */, - { 3, 3836, 6193, 17, 4, UNI_HEBR } /* scriptextensions=hebr */, - { 1, 3904, 9836, 17, 4, UNI_UIDEO } /* unifiedideograph=true */, - { 13, 1552, 1563, 9, 2, UNI_PS } /* category=ps */, - { 0, 184, 349, 2, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* issupplementalsymbolsandpictographs */, - { 68, 1087, 1025, 27, 2, -UNI_PCM } /* prependedconcatenationmark=no */, - { 73, 9277, 8131, 3, 4, UNI_SC__DUPL } /* sc=dupl */, - { 0, 9488, 2140, 4, 11, UNI_CYRILLICSUP } /* blk=cyrillicsup */, - { 8, 10340, 4975, 4, 6, UNI_VEDICEXT } /* isvedicext */, - { 64, 9488, 8876, 4, 6, UNI_INGOTHIC } /* blk=gothic */, - { 1, 8589, 7188, 7, 10, UNI_KHAR } /* script=kharoshthi */, - { 2, 1417, 8708, 24, 3, UNI_CCC__216 } /* canonicalcombiningclass=216 */, - { 11, 1591, 8415, 3, 6, UNI_INELBASAN } /* inelbasan */, - { 142, 8780, 5256, 6, 14, UNI_LATINEXTD } /* block=latinextendedd */, - { 138, 9768, 1115, 4, 4, UNI_HANG } /* scx=hang */, - { 33, 4688, 7550, 16, 8, UNI_IDENTIFIERTYPE__INCLUSION } /* identifiertype=inclusion */, - { 48, 8589, 9684, 7, 4, UNI_NEWA } /* script=newa */, - { 58, 9768, 9476, 4, 4, UNI_AVST } /* scx=avst */, - { 158, 5508, 26, 14, 1, UNI_PATSYN } /* patternsyntax=y */, - { 0, 5986, 9964, 13, 3, UNI_NV__4_SLASH_5 } /* numericvalue=4/5 */, - { 0, 9900, 0, 4, 0, UNI_ZZZZ } /* zzzz */, - { 24, 10048, 7907, 3, 8, UNI_NV__3_SLASH_8 } /* nv=3.75e-01 */, - { 3, 9488, 4273, 4, 16, UNI_MYANMAREXTA } /* blk=myanmarextendeda */, - { 0, 9768, 9624, 4, 4, UNI_LAO } /* scx=laoo */, - { 1, 5739, 10135, 13, 3, UNI_GRBASE } /* 
graphemebase=yes */, - { 0, 10048, 5648, 3, 3, UNI_NV__100 } /* nv=100 */, - { 5, 8852, 36, 6, 1, UNI_CWKCF } /* cwkcf=t */, - { 9, 184, 8107, 2, 8, UNI_BALI } /* isbalinese */, - { 2, 10048, 9964, 3, 3, UNI_NV__4_SLASH_5 } /* nv=4/5 */, - { 1, 9508, 9925, 4, 3, UNI_CCC__BL } /* ccc=218 */, - { 0, 9768, 4703, 4, 15, UNI_ARMI } /* scx=imperialaramaic */, - { 0, 9488, 5200, 4, 14, UNI_KANASUP } /* blk=kanasupplement */, - { 20, 5986, 9984, 13, 2, UNI_NV__37 } /* numericvalue=37 */, - { 1, 21, 8227, 2, 8, UNI_KANAEXTA } /* inkanaexta */, - { 2, 8131, 0, 4, 0, UNI_DUPL } /* dupl */, - { 3, 9768, 9688, 4, 4, UNI_NKO } /* scx=nkoo */, - { 0, 3836, 9892, 17, 4, UNI_QAAI } /* scriptextensions=zinh */, - { 6, 7218, 7448, 10, 10, UNI_LB__WJ } /* linebreak=wordjoiner */, - { 2, 9488, 2245, 4, 11, UNI_INMEETEIMAYEK } /* blk=meeteimayek */, - { 5, 9768, 8840, 4, 6, UNI_CAKM } /* scx=chakma */, - { 37, 9488, 478, 4, 31, UNI_MATHALPHANUM } /* blk=mathematicalalphanumericsymbols */, - { 1, 5791, 5340, 13, 14, UNI_JG__MANICHAEANFIVE } /* joininggroup=manichaeanfive */, - { 1, 10048, 9405, 3, 3, UNI_NV__3_SLASH_2 } /* nv=3/2 */, - { 1, 184, 7129, 3, 9, UNI_CJKSTROKES } /* iscjkstrokes */, - { 0, 3836, 2429, 17, 20, UNI_PHLI } /* scriptextensions=inscriptionalpahlavi */, - { 1, 9488, 2409, 4, 10, UNI_INGLAGOLITIC } /* blk=glagolitic */, - { 1, 9556, 6170, 5, 11, UNI_WB__EB } /* gcb=glueafterzwj */, - { 0, 9997, 37, 3, 2, UNI_BC__EN } /* bc=en */, - { 33, 9768, 2469, 4, 20, UNI_HMNP } /* scx=nyiakengpuachuehmong */, - { 0, 184, 5817, 2, 13, UNI_ZL } /* islineseparator */, - { 13, 3904, 26, 17, 1, UNI_UIDEO } /* unifiedideograph=y */, - { 0, 9768, 2485, 4, 4, UNI_MONG } /* scx=mong */, - { 0, 5116, 0, 14, 0, UNI_emod_values_index } /* emojimodifier= */, - { 0, 10288, 1823, 8, 5, UNI_XPOSIXLOWER } /* isxposixlower */, - { 7, 9768, 7278, 4, 10, UNI_XPEO } /* scx=oldpersian */, - { 0, 9262, 495, 3, 2, UNI_SB__NU } /* sb=nu */, - { 2, 9508, 7477, 4, 9, UNI_CCC__AL } /* ccc=aboveleft */, - 
{ 1, 8449, 9836, 7, 4, UNI_HYPHEN } /* hyphen=true */, - { 2, 3836, 9568, 17, 4, UNI_GREK } /* scriptextensions=grek */, - { 84, 10048, 8720, 3, 6, UNI_NV__400000 } /* nv=400000 */, - { 1, 1552, 7408, 9, 10, UNI_CN } /* category=unassigned */, - { 0, 7418, 0, 10, 0, UNI_upper_values_index } /* uppercase= */, - { 1, 4033, 10176, 16, 2, UNI_ZL } /* generalcategory=zl */, - { 2, 4793, 0, 15, 0, UNI_MERC } /* meroiticcursive */, - { 0, 8589, 6484, 7, 4, UNI_HUNG } /* script=hung */, - { 0, 184, 8942, 2, 6, UNI_LYDI } /* islydian */, - { 0, 3367, 3, 18, 1, -UNI__PERL_PATWS } /* patternwhitespace=f */, - { 48, 5791, 9744, 13, 4, UNI_JG__QAPH } /* joininggroup=qaph */, - { 90, 4916, 8660, 3, 6, UNI_TIBT } /* istibetan */, - { 1, 3097, 8163, 18, 8, UNI_DT__FRA } /* decompositiontype=fraction */, - { 2, 2784, 3923, 4, 7, UNI_ARABICSUP } /* inarabicsup */, - { 3, 184, 3796, 3, 3, UNI_CHAM } /* ischam */, - { 0, 4116, 1907, 3, 15, UNI_INDICNUMBERFORMS } /* isindicnumberforms */, - { 1, 3836, 2203, 17, 14, UNI_ROHG } /* scriptextensions=hanifirohingya */, - { 1, 1966, 4353, 22, 16, UNI_INSC__SYLLABLEMODIFIER } /* indicsyllabiccategory=syllablemodifier */, - { 1, 1417, 9931, 24, 3, UNI_CCC__L } /* canonicalcombiningclass=224 */, - { 1, 9488, 7099, 5, 9, UNI_BOXDRAWING } /* blk=boxdrawing */, - { 0, 8589, 8428, 7, 7, UNI_SC__GRAN } /* script=grantha */, - { 1, 9768, 8912, 4, 6, UNI_KHOJ } /* scx=khojki */, - { 5, 9488, 9065, 4, 5, UNI_INADLAM } /* blk=adlam */, - { 0, 184, 5960, 2, 13, UNI_MISCTECHNICAL } /* ismisctechnical */, - { 66, 7325, 7408, 3, 10, UNI_AGE__NA } /* in=unassigned */, - { 0, 9556, 911, 4, 1, UNI_GCB__V } /* gcb=v */, - { 0, 9275, 4305, 5, 5, UNI_INSC__OTHER } /* insc=other */, - { 1, 9600, 0, 4, 0, UNI_KALI } /* kali */, - { 0, 8852, 9255, 6, 5, -UNI_CWKCF } /* cwkcf=false */, - { 10, 10296, 9225, 7, 5, UNI_POSIXCNTRL } /* isposixcntrl */, - { 1, 7318, 9401, 10, 3, UNI_IN__3 } /* presentin=3.0 */, - { 28, 8267, 10135, 8, 3, UNI_RADICAL } /* radical=yes */, - 
{ 0, 9768, 7513, 4, 9, UNI_BHKS } /* scx=bhaiksuki */, - { 0, 5039, 0, 6, 0, UNI_XPOSIXXDIGIT } /* xdigit */, - { 0, 9488, 5284, 4, 4, UNI_INLISU } /* blk=lisu */, - { 1, 5986, 8708, 13, 6, UNI_NV__216000 } /* numericvalue=216000 */, - { 3, 8780, 4928, 6, 8, UNI_TAMILSUP } /* block=tamilsup */, - { 16, 8780, 9335, 6, 5, UNI_INTAKRI } /* block=takri */, - { 0, 9346, 1, 4, 1, -UNI_IDC } /* idc=n */, - { 0, 2032, 3, 22, 1, -UNI__PERL_NCHAR } /* noncharactercodepoint=f */, - { 1, 6928, 0, 10, 0, UNI_SD } /* softdotted */, - { 0, 3893, 0, 11, 0, UNI_SGNW } /* signwriting */, - { 3, 8780, 4065, 6, 16, UNI_HALFANDFULLFORMS } /* block=halfandfullforms */, - { 0, 9440, 0, 4, 0, UNI_ADLM } /* adlm */, - { 1, 9262, 33, 3, 2, UNI_SB__SE } /* sb=se */, - { 0, 4628, 66, 15, 1, UNI_EA__H } /* eastasianwidth=h */, - { 66, 1988, 26, 22, 1, UNI_LOE } /* logicalorderexception=y */, - { 0, 8780, 7398, 6, 10, UNI_SUPARROWSC } /* block=suparrowsc */, - { 20, 7028, 2309, 3, 20, UNI_YIJING } /* isyijinghexagramsymbols */, - { 3, 184, 7398, 2, 10, UNI_SUPARROWSC } /* issuparrowsc */, - { 0, 9768, 8618, 5, 3, UNI_SOYO } /* scx=soyo */, - { 9, 8780, 908, 6, 10, UNI_PUA } /* block=privateuse */, - { 0, 1790, 1, 22, 1, -UNI_CWCM } /* changeswhencasemapped=n */, - { 34, 8589, 9600, 7, 4, UNI_SC__KALI } /* script=kali */, - { 16, 8372, 0, 7, 0, UNI_CJKEXTD } /* cjkextd */, - { 0, 1188, 4402, 3, 15, UNI_TANGUTSUP } /* intangutsupplement */, - { 69, 9275, 5144, 5, 14, UNI_INSC__GEMINATIONMARK } /* insc=geminationmark */, - { 6, 8780, 3169, 6, 11, UNI_ETHIOPICSUP } /* block=ethiopicsup */, - { 7, 9488, 414, 4, 32, UNI_INIDC } /* blk=ideographicdescriptioncharacters */, - { 1, 8589, 9320, 7, 5, UNI_OSGE } /* script=osage */, - { 0, 9768, 8561, 4, 7, UNI_OSMA } /* scx=osmanya */, - { 33, 8780, 5522, 6, 14, UNI_PHONETICEXTSUP } /* block=phoneticextsup */, - { 4, 10006, 1, 3, 1, -UNI_DI } /* di=n */, - { 72, 184, 2061, 2, 15, UNI_MODIFIERLETTERS } /* ismodifierletters */, - { 0, 9508, 1756, 4, 2, 
UNI_CCC__BR } /* ccc=br */, - { 0, 5986, 7858, 13, 2, UNI_NV__22 } /* numericvalue=22 */, - { 1, 9540, 10135, 4, 3, UNI_DIA } /* dia=yes */, - { 35, 6205, 26, 12, 1, UNI_IDEO } /* ideographic=y */, - { 4, 4146, 1947, 5, 19, UNI_EARLYDYNASTICCUNEIFORM } /* inearlydynasticcuneiform */, - { 1, 6231, 600, 3, 29, UNI_CJKEXTD } /* incjkunifiedideographsextensiond */, - { 1, 5674, 36, 13, 1, UNI_BIDIM } /* bidimirrored=t */, - { 5, 3836, 8115, 17, 8, UNI_BASS } /* scriptextensions=bassavah */, - { 0, 9508, 8082, 4, 2, UNI_CCC__19 } /* ccc=19 */, - { 3, 7325, 7469, 3, 3, UNI_IN__5 } /* in=5.0 */, - { 2, 7438, 8505, 10, 7, UNI_WB__NL } /* wordbreak=newline */, - { 1, 7218, 125, 10, 2, UNI_LB__CR } /* linebreak=cr */, - { 7, 9444, 7755, 4, 3, UNI_IN__1_DOT_1 } /* age=1.1 */, - { 78, 9488, 2836, 4, 19, UNI_MODIFIERTONELETTERS } /* blk=modifiertoneletters */, - { 1, 9488, 4289, 4, 16, UNI_MYANMAREXTB } /* blk=myanmarextendedb */, - { 2, 10296, 5040, 7, 5, UNI_POSIXDIGIT } /* isposixdigit */, - { 1, 5791, 9281, 14, 4, UNI_JG__KHAPH } /* joininggroup=khaph */, - { 0, 7325, 9856, 3, 4, UNI_IN__13 } /* in=v130 */, - { 2, 3853, 1025, 17, 2, -UNI_STERM } /* sentenceterminal=no */, - { 0, 10024, 4958, 3, 15, UNI_UPPERCASELETTER } /* gc=uppercaseletter */, - { 0, 184, 8131, 2, 8, UNI_DUPL } /* isduployan */, - { 2, 21, 3768, 2, 17, UNI_LETTERLIKESYMBOLS } /* inletterlikesymbols */, - { 7, 7325, 10084, 3, 3, UNI_IN__3_DOT_1 } /* in=v31 */, - { 0, 7155, 5219, 3, 3, UNI_HIRA } /* ishira */, - { 2, 9508, 184, 4, 2, UNI_CCC__IS } /* ccc=is */, - { 197, 1417, 8801, 24, 3, UNI_CCC__107 } /* canonicalcombiningclass=107 */, - { 68, 9768, 7288, 4, 10, UNI_SOGO } /* scx=oldsogdian */, - { 3, 184, 74, 2, 2, UNI_ME } /* isme */, - { 1, 9997, 10018, 3, 3, UNI_BC__FSI } /* bc=fsi */, - { 40, 9350, 1, 5, 1, -UNI_XIDS } /* xids=n */, - { 10, 7325, 7826, 3, 4, UNI_IN__12 } /* in=12.0 */, - { 1, 9488, 3295, 4, 9, UNI_LATINEXTA } /* blk=latinexta */, - { 124, 5986, 8720, 13, 4, UNI_NV__4000 } /* 
numericvalue=4000 */, - { 0, 5791, 6301, 13, 12, UNI_JG__MALAYALAMLLA } /* joininggroup=malayalamlla */, - { 4, 1631, 0, 15, 0, UNI_GEOMETRICSHAPES } /* geometricshapes */, - { 34, 1087, 0, 26, 0, UNI_PCM } /* prependedconcatenationmark */, - { 1, 1746, 5904, 22, 4, UNI_BPT__N } /* bidipairedbrackettype=none */, - { 1, 2161, 9255, 21, 5, -UNI_EXTPICT } /* extendedpictographic=false */, - { 18, 8589, 8107, 7, 4, UNI_BALI } /* script=bali */, - { 0, 8673, 0, 7, 0, UNI_UCASEXT } /* ucasext */, - { 35, 1417, 1179, 24, 2, UNI_CCC__BL } /* canonicalcombiningclass=bl */, - { 0, 8780, 5242, 6, 14, UNI_LATINEXTC } /* block=latinextendedc */, - { 1, 184, 8366, 3, 6, UNI_CJKEXTC } /* iscjkextc */, - { 0, 9305, 0, 5, 0, UNI_NSHU } /* nushu */, - { 6, 9488, 2061, 4, 4, UNI_INMODI } /* blk=modi */, - { 0, 2061, 0, 15, 0, UNI_MODIFIERLETTERS } /* modifierletters */, - { 149, 8780, 8107, 6, 8, UNI_INBALINESE } /* block=balinese */, - { 3, 4628, 8948, 15, 6, UNI_EA__NA } /* eastasianwidth=narrow */, - { 0, 7318, 7867, 10, 3, UNI_IN__3_DOT_1 } /* presentin=3.1 */, - { 128, 10024, 206, 3, 2, UNI_PI } /* gc=pi */, - { 40, 7155, 2507, 3, 3, UNI_HATR } /* ishatr */, - { 0, 10310, 8668, 4, 5, UNI_INTIRHUTA } /* intirhuta */, - { 10, 9488, 1677, 4, 14, UNI_LATINEXTA } /* blk=latinextendeda */, - { 8, 4568, 0, 15, 0, UNI_CURRENCYSYMBOLS } /* currencysymbols */, - { 16, 9768, 8123, 4, 8, UNI_BUGI } /* scx=buginese */, - { 0, 8780, 8407, 6, 7, UNI_DSRT } /* block=deseret */, - { 100, 21, 4161, 2, 16, UNI_LINEARBSYLLABARY } /* inlinearbsyllabary */, - { 23, 184, 4337, 2, 16, UNI_SUPMATHOPERATORS } /* issupmathoperators */, - { 2, 8780, 183, 6, 34, UNI_MISCPICTOGRAPHS } /* block=miscellaneoussymbolsandpictographs */, - { 0, 9556, 4360, 4, 9, UNI_WB__EB } /* gcb=emodifier */, - { 0, 8589, 9808, 7, 4, UNI_TALU } /* script=talu */, - { 3, 9488, 1218, 4, 26, UNI_KATAKANAEXT } /* blk=katakanaphoneticextensions */, - { 0, 9596, 6763, 4, 3, UNI_LB__H3 } /* hst=lvt */, - { 0, 9596, 0, 4, 0, 
UNI_hst_values_index } /* hst= */, - { 0, 8171, 0, 8, 0, UNI_GUJR } /* gujarati */, - { 34, 9277, 8617, 3, 4, UNI_SOYO } /* sc=soyo */, - { 1, 3259, 36, 18, 1, UNI_IDSB } /* idsbinaryoperator=t */, - { 2, 8575, 9255, 7, 5, -UNI_PATSYN } /* patsyn=false */, - { 0, 10048, 7915, 3, 8, UNI_NV__3_SLASH_80 } /* nv=3.75e-02 */, - { 104, 5778, 0, 6, 0, UNI_IPAEXT } /* ipaext */, - { 0, 3367, 1025, 18, 2, -UNI__PERL_PATWS } /* patternwhitespace=no */, - { 201, 9488, 4273, 4, 7, UNI_INMYANMAR } /* blk=myanmar */, - { 1, 349, 0, 33, 0, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* supplementalsymbolsandpictographs */, - { 251, 10126, 409, 3, 2, UNI_VO__TR } /* vo=tr */, - { 2, 2161, 36, 21, 1, UNI_EXTPICT } /* extendedpictographic=t */, - { 1, 9508, 9146, 5, 4, UNI_CCC__23 } /* ccc=ccc23 */, - { 0, 6420, 125, 3, 2, UNI_OCR } /* inocr */, - { 16, 8589, 0, 14, 0, UNI_SC__SHRD } /* script=sharada */, - { 2, 8694, 26, 7, 1, UNI_XPOSIXSPACE } /* wspace=y */, - { 195, 1417, 8042, 24, 2, UNI_CCC__18 } /* canonicalcombiningclass=18 */, - { 1, 7318, 10123, 10, 3, UNI_IN__9 } /* presentin=v90 */, - { 0, 8954, 36, 6, 1, UNI__PERL_NCHAR } /* nchar=t */, - { 5, 4628, 7486, 15, 9, UNI_EA__A } /* eastasianwidth=ambiguous */, - { 4, 184, 3241, 2, 11, UNI_GEORGIANSUP } /* isgeorgiansup */, - { 0, 2224, 3440, 3, 11, UNI_SMALLKANAEXT } /* insmallkanaext */, - { 1, 7318, 9400, 10, 4, UNI_IN__13 } /* presentin=13.0 */, - { 0, 8589, 2203, 7, 14, UNI_SC__ROHG } /* script=hanifirohingya */, - { 0, 1552, 1910, 9, 2, UNI_CN } /* category=cn */, - { 2, 184, 4554, 3, 14, UNI_CONTROLPICTURES } /* iscontrolpictures */, - { 3, 10027, 6289, 3, 12, UNI_JG__MALAYALAMBHA } /* jg=malayalambha */, - { 2, 4116, 7740, 3, 6, UNI_IDS } /* isidstart */, - { 6, 9768, 2288, 5, 6, UNI_SINH } /* scx=sinhala */, - { 16, 6241, 18, 12, 1, UNI_JT__R } /* joiningtype=r */, - { 6, 7318, 7827, 10, 3, UNI_IN__2 } /* presentin=2.0 */, - { 0, 10132, 4305, 3, 5, UNI_WB__XX } /* wb=other */, - { 4, 10048, 9961, 3, 3, UNI_NV__3_SLASH_5 } /* 
nv=3/5 */, - { 13, 9556, 5008, 5, 2, UNI_WB__EB } /* gcb=gaz */, - { 0, 9768, 3079, 4, 6, UNI_COPT } /* scx=coptic */, - { 0, 9768, 9612, 4, 4, UNI_KNDA } /* scx=knda */, - { 0, 9235, 9836, 5, 4, UNI_CWCM } /* cwcm=true */, - { 0, 8780, 5003, 6, 15, UNI_INZANABAZARSQUARE } /* block=zanabazarsquare */, - { 8, 5674, 0, 5, 0, UNI_BIDIM } /* bidim */, - { 7, 2161, 0, 21, 0, UNI_extpict_values_index } /* extendedpictographic= */, - { 1, 9768, 9624, 4, 3, UNI_LAO } /* scx=lao */, - { 0, 8780, 2409, 6, 10, UNI_INGLAGOLITIC } /* block=glagolitic */, - { 0, 3836, 8936, 17, 4, UNI_LYCI } /* scriptextensions=lyci */, - { 5, 4791, 4274, 3, 6, UNI_INMYANMAR } /* inmyanmar */, - { 83, 8589, 8680, 7, 7, UNI_ZZZZ } /* script=unknown */, - { 1, 9277, 2278, 4, 3, UNI_SC__KALI } /* sc=kali */, - { 3, 9488, 8477, 4, 7, UNI_INMAKASAR } /* blk=makasar */, - { 32, 4568, 0, 14, 0, UNI_SC } /* currencysymbol */, - { 0, 184, 7693, 2, 9, UNI_SAMR } /* issamaritan */, - { 2, 5986, 5648, 13, 9, UNI_NV__100000000 } /* numericvalue=100000000 */, - { 0, 184, 3026, 3, 10, UNI_CHEROKEESUP } /* ischerokeesup */, - { 3, 5718, 0, 5, 0, UNI_XPOSIXALNUM } /* alnum */, - { 32, 8780, 414, 6, 32, UNI_INIDC } /* block=ideographicdescriptioncharacters */, - { 0, 9488, 6085, 4, 12, UNI_CHESSSYMBOLS } /* blk=chesssymbols */, - { 193, 8780, 2409, 6, 13, UNI_GLAGOLITICSUP } /* block=glagoliticsup */, - { 2, 8589, 6840, 7, 11, UNI_SC__NAND } /* script=nandinagari */, - { 4, 9277, 8498, 3, 7, UNI_SC__MULT } /* sc=multani */, - { 1, 7155, 2723, 3, 18, UNI_JAMOEXTA } /* ishanguljamoextendeda */, - { 11, 184, 250, 2, 33, UNI_MISCMATHSYMBOLSA } /* ismiscellaneousmathematicalsymbolsa */, - { 0, 9488, 7675, 4, 9, UNI_PALM } /* blk=palmyrene */, - { 9, 9262, 7702, 3, 9, UNI_SB__SC } /* sb=scontinue */, - { 1, 10132, 6178, 3, 3, UNI_LB__ZWJ } /* wb=zwj */, - { 4, 8589, 4370, 8, 5, UNI_SC__SYRC } /* script=syriac */, - { 33, 9768, 8611, 5, 3, UNI_SIDD } /* scx=sidd */, - { 11, 5986, 7939, 13, 8, UNI_NV__9_SLASH_2 } /* 
numericvalue=4.50e+00 */, - { 0, 7158, 36, 10, 1, UNI_DIA } /* diacritic=t */, - { 1, 1552, 1, 9, 1, UNI_N } /* category=n */, - { 83, 3836, 8618, 18, 6, UNI_SOYO } /* scriptextensions=soyombo */, - { 3, 184, 5200, 2, 7, UNI_KANASUP } /* iskanasup */, - { 5, 9277, 9283, 3, 4, UNI_PHLI } /* sc=phli */, - { 96, 9275, 0, 5, 0, UNI_insc_values_index } /* insc= */, - { 0, 8428, 0, 4, 0, UNI_GRAN } /* gran */, - { 0, 9346, 9836, 4, 4, UNI_IDC } /* idc=true */, - { 2, 3836, 9624, 17, 3, UNI_LAO } /* scriptextensions=lao */, - { 0, 21, 1218, 2, 26, UNI_KATAKANAEXT } /* inkatakanaphoneticextensions */, - { 17, 2161, 1025, 21, 2, -UNI_EXTPICT } /* extendedpictographic=no */, - { 0, 8780, 1218, 6, 26, UNI_KATAKANAEXT } /* block=katakanaphoneticextensions */, - { 12, 9768, 2913, 5, 3, UNI_SUND } /* scx=sund */, - { 0, 184, 1269, 2, 24, UNI_COMPEX } /* isfullcompositionexclusion */, - { 1, 10048, 7827, 3, 8, UNI_NV__1_SLASH_5 } /* nv=2.00e-01 */, - { 3, 9488, 6277, 4, 12, UNI_MAHJONG } /* blk=mahjongtiles */, - { 352, 9262, 495, 3, 7, UNI_SB__NU } /* sb=numeric */, - { 1, 10296, 9725, 3, 3, UNI_PHNX } /* isphnx */, - { 2, 8780, 7495, 6, 9, UNI_ARABICPFA } /* block=arabicpfa */, - { 0, 6805, 0, 13, 0, UNI_MISCSYMBOLS } /* inmiscsymbols */, - { 0, 9716, 0, 3, 0, UNI_PCM } /* pcm */, - { 258, 9277, 3598, 3, 17, UNI_AGHB } /* sc=caucasianalbanian */, - { 4, 8768, 26, 6, 1, UNI_BIDIC } /* bidic=y */, - { 2, 8780, 9095, 6, 5, UNI_INBUHID } /* block=buhid */, - { 1, 8393, 0, 7, 0, UNI_CJKEXTG } /* cjkextg */, - { 3, 117, 415, 3, 31, UNI_INIDC } /* inideographicdescriptioncharacters */, - { 0, 1417, 6631, 24, 11, UNI_CCC__DA } /* canonicalcombiningclass=doubleabove */, - { 80, 9265, 1, 5, 1, -UNI_IDST } /* idst=n */, - { 63, 9488, 3115, 4, 10, UNI_INDEVANAGARI } /* blk=devanagari */, - { 0, 2224, 4370, 3, 5, UNI_INSYRIAC } /* insyriac */, - { 0, 6205, 3, 12, 1, -UNI_IDEO } /* ideographic=f */, - { 37, 184, 9660, 2, 4, UNI_MLYM } /* ismlym */, - { 1, 5791, 4748, 13, 15, 
UNI_JG__MANICHAEANGIMEL } /* joininggroup=manichaeangimel */, - { 1, 184, 5592, 2, 14, UNI_ZS } /* isspaceseparator */, - { 9, 6554, 3, 11, 1, -UNI_IDC } /* idcontinue=f */, - { 3, 5986, 7778, 13, 2, UNI_NV__21 } /* numericvalue=21 */, - { 2, 9508, 7858, 4, 3, UNI_CCC__B } /* ccc=220 */, - { 0, 1900, 0, 6, 0, UNI_ZYYY } /* common */, - { 25, 3836, 9452, 17, 4, UNI_AHOM } /* scriptextensions=ahom */, - { 0, 9508, 9136, 5, 4, UNI_CCC__21 } /* ccc=ccc21 */, - { 0, 2529, 0, 20, 0, UNI_term_values_index } /* terminalpunctuation= */, - { 1, 8768, 9836, 6, 4, UNI_BIDIC } /* bidic=true */, - { 0, 8780, 3785, 6, 10, UNI_INMANICHAEAN } /* block=manichaean */, - { 8, 10333, 8625, 3, 6, UNI_SUPPUAA } /* issuppuaa */, - { 256, 10024, 112, 3, 2, UNI_SC } /* gc=sc */, - { 4, 9508, 8042, 4, 2, UNI_CCC__18 } /* ccc=18 */, - { 177, 10048, 8067, 3, 8, UNI_NV__17_SLASH_2 } /* nv=8.50e+00 */, - { 96, 9768, 8638, 4, 7, UNI_TGLG } /* scx=tagalog */, - { 0, 4791, 2856, 3, 8, UNI_INMONGOLIAN } /* inmongolian */, - { 0, 8688, 9477, 3, 3, UNI_AVST } /* isavst */, - { 11, 9488, 8498, 4, 7, UNI_INMULTANI } /* blk=multani */, - { 42, 6231, 630, 3, 29, UNI_CJKEXTE } /* incjkunifiedideographsextensione */, - { 2, 6231, 1061, 4, 4, UNI_INCOPTIC } /* incoptic */, - { 1, 7325, 10081, 3, 3, UNI_IN__3 } /* in=v30 */, - { 5, 1552, 908, 9, 10, UNI_CO } /* category=privateuse */, - { 0, 1591, 8422, 3, 6, UNI_INELYMAIC } /* inelymaic */, - { 64, 9275, 9300, 5, 5, UNI_INSC__NUKTA } /* insc=nukta */, - { 5, 3836, 9460, 17, 4, UNI_ARMI } /* scriptextensions=armi */, - { 0, 8688, 9449, 3, 3, UNI_AGHB } /* isaghb */, - { 0, 3097, 3501, 18, 3, UNI_DT__MED } /* decompositiontype=med */, - { 0, 184, 8123, 2, 4, UNI_BUGI } /* isbugi */, - { 8, 9014, 10135, 6, 3, UNI_UIDEO } /* uideo=yes */, - { 5, 9536, 3, 4, 1, -UNI_DEP } /* dep=f */, - { 2, 8589, 9888, 7, 4, UNI_ZANB } /* script=zanb */, - { 9, 10048, 8732, 3, 3, UNI_NV__500 } /* nv=500 */, - { 1, 184, 8870, 2, 5, UNI_EPRES } /* isepres */, - { 0, 9277, 8477, 3, 
7, UNI_MAKA } /* sc=makasar */, - { 10, 3382, 1025, 3, 2, -UNI_CE } /* ce=no */, - { 10, 5324, 480, 4, 29, UNI_MATHALPHANUM } /* inmathematicalalphanumericsymbols */, - { 1, 10033, 5999, 3, 13, UNI_LB__PR } /* lb=prefixnumeric */, - { 1, 2779, 0, 18, 0, UNI_IDST } /* idstrinaryoperator */, - { 0, 4033, 5726, 16, 13, UNI_ME } /* generalcategory=enclosingmark */, - { 0, 10027, 5364, 3, 4, UNI_JG__HETH } /* jg=heth */, - { 0, 1979, 6266, 10, 11, UNI_NL } /* category=letternumber */, - { 3, 9488, 2665, 4, 19, UNI_COUNTINGROD } /* blk=countingrodnumerals */, - { 208, 8780, 7188, 6, 10, UNI_INKHAROSHTHI } /* block=kharoshthi */, - { 84, 184, 8359, 3, 6, UNI_CJKEXTB } /* iscjkextb */, - { 0, 9768, 2203, 4, 4, UNI_HAN } /* scx=hani */, - { 0, 2182, 1087, 21, 7, UNI_GCB__PP } /* graphemeclusterbreak=prepend */, - { 288, 2409, 0, 20, 0, UNI_GLAGOLITICSUP } /* glagoliticsupplement */, - { 256, 9488, 2912, 4, 12, UNI_SUNDANESESUP } /* blk=sundanesesup */, - { 0, 8780, 4703, 6, 15, UNI_INIMPERIALARAMAIC } /* block=imperialaramaic */, - { 6, 9014, 3, 6, 1, -UNI_UIDEO } /* uideo=f */, - { 0, 7218, 1186, 10, 2, UNI_LB__PO } /* linebreak=po */, - { 0, 7438, 6169, 10, 12, UNI_WB__EB } /* wordbreak=glueafterzwj */, - { 0, 184, 6181, 2, 12, UNI_GONG } /* isgunjalagondi */, - { 1, 10033, 34, 3, 2, UNI_LB__EX } /* lb=ex */, - { 2, 2280, 6874, 3, 10, UNI_SO } /* isothersymbol */, - { 1, 9277, 3115, 3, 4, UNI_SC__DEVA } /* sc=deva */, - { 0, 9488, 6505, 4, 12, UNI_PHAISTOS } /* blk=phaistosdisc */, - { 176, 8780, 5228, 6, 14, UNI_LATINEXTB } /* block=latinextendedb */, - { 25, 2533, 6028, 5, 9, UNI_ALPHABETICPF } /* inalphabeticpf */, - { 5, 9997, 2509, 3, 11, UNI_BC__R } /* bc=righttoleft */, - { 0, 8780, 7288, 6, 10, UNI_INOLDSOGDIAN } /* block=oldsogdian */, - { 186, 9277, 8131, 3, 8, UNI_SC__DUPL } /* sc=duployan */, - { 45, 1673, 0, 4, 0, UNI_JAMO } /* jamo */, - { 66, 6061, 0, 12, 0, UNI_bidic_values_index } /* bidicontrol= */, - { 0, 8589, 9038, 7, 6, UNI_SC__YEZI } /* 
script=yezidi */, - { 0, 1856, 3, 22, 1, -UNI_CWU } /* changeswhenuppercased=f */, - { 256, 10183, 7438, 4, 4, UNI_POSIXWORD } /* perlword */, - { 1, 9070, 3, 5, 1, -UNI_POSIXXDIGIT } /* ahex=f */, - { 0, 9277, 8596, 3, 7, UNI_SC__SHRD } /* sc=sharada */, - { 3, 5986, 0, 13, 0, UNI_nv_values_index } /* numericvalue= */, - { 3, 184, 8243, 2, 8, UNI_MAHJ } /* ismahajani */, - { 0, 9240, 26, 5, 1, UNI_DASH } /* dash=y */, - { 4, 3025, 0, 11, 0, UNI_CHEROKEESUP } /* cherokeesup */, - { 2, 6420, 4884, 3, 14, UNI_SARB } /* inoldsoutharabian */, - { 1, 9262, 72, 3, 2, UNI_SB__LE } /* sb=le */, - { 0, 9520, 0, 4, 0, UNI_cwl_values_index } /* cwl= */, - { 2, 7325, 7806, 3, 1, UNI_IN__6 } /* in=6 */, - { 2, 1417, 9922, 24, 3, UNI_CCC__214 } /* canonicalcombiningclass=214 */, - { 0, 3836, 9283, 17, 4, UNI_PHLI } /* scriptextensions=phli */, - { 0, 4916, 47, 5, 1, UNI_TERM } /* isterm */, - { 104, 7318, 9388, 10, 4, UNI_IN__11 } /* presentin=11.0 */, - { 0, 1417, 8082, 24, 2, UNI_CCC__19 } /* canonicalcombiningclass=19 */, - { 0, 2182, 911, 21, 1, UNI_GCB__V } /* graphemeclusterbreak=v */, - { 1, 262, 0, 2, 0, UNI_SM } /* sm */, - { 98, 1552, 5494, 9, 14, UNI_MN } /* category=nonspacingmark */, - { 1, 184, 1222, 2, 4, UNI_KANA } /* iskana */, - { 1, 5986, 7469, 13, 8, UNI_NV__1_SLASH_2 } /* numericvalue=5.00e-01 */, - { 57, 8780, 8624, 6, 7, UNI_SUPPUAA } /* block=suppuaa */, - { 3, 21, 5019, 3, 13, UNI_ANCIENTSYMBOLS } /* inancientsymbols */, - { 0, 3836, 4928, 17, 5, UNI_TAML } /* scriptextensions=tamil */, - { 0, 1552, 45, 9, 2, UNI_CO } /* category=co */, - { 3, 9444, 9388, 4, 4, UNI_AGE__11 } /* age=11.0 */, - { 1, 4161, 0, 16, 0, UNI_LINEARBSYLLABARY } /* linearbsyllabary */, - { 0, 9768, 2245, 4, 11, UNI_MTEI } /* scx=meeteimayek */, - { 3, 10024, 4305, 3, 5, UNI_C } /* gc=other */, - { 1, 1768, 1, 22, 1, -UNI_CWCF } /* changeswhencasefolded=n */, - { 2, 5752, 0, 8, 0, UNI_GREEKEXT } /* greekext */, - { 34, 9768, 8477, 4, 4, UNI_MAKA } /* scx=maka */, - { 2, 10048, 
9958, 3, 3, UNI_NV__3_SLASH_4 } /* nv=3/4 */, - { 20, 184, 749, 2, 16, UNI_ENCLOSEDALPHANUM } /* isenclosedalphanum */, - { 0, 9488, 9320, 4, 5, UNI_INOSAGE } /* blk=osage */, - { 0, 8227, 0, 8, 0, UNI_KANAEXTA } /* kanaexta */, - { 22, 4448, 0, 8, 0, UNI_BAMUMSUP } /* bamumsup */, - { 65, 3836, 8888, 17, 6, UNI_HATR } /* scriptextensions=hatran */, - { 0, 3904, 9255, 17, 5, -UNI_UIDEO } /* unifiedideograph=false */, - { 3, 9444, 9840, 4, 4, UNI_AGE__10 } /* age=v100 */, - { 36, 3836, 9548, 17, 4, UNI_DSRT } /* scriptextensions=dsrt */, - { 128, 10048, 7795, 3, 8, UNI_NV__3_SLASH_20 } /* nv=1.50e-01 */, - { 11, 3529, 1025, 18, 2, -UNI_VS } /* variationselector=no */, - { 0, 3768, 0, 17, 0, UNI_LETTERLIKESYMBOLS } /* letterlikesymbols */, - { 40, 8400, 3, 7, 1, -UNI_COMPEX } /* compex=f */, - { 0, 184, 3751, 2, 17, UNI_KITS } /* iskhitansmallscript */, - { 0, 9488, 1654, 4, 23, UNI_COMPATJAMO } /* blk=hangulcompatibilityjamo */, - { 1, 10027, 3819, 3, 17, UNI_JG__MANICHAEANTHAMEDH } /* jg=manichaeanthamedh */, - { 0, 414, 0, 11, 0, UNI_IDEO } /* ideographic */, - { 16, 184, 4448, 2, 5, UNI_BAMU } /* isbamum */, - { 259, 10048, 7859, 3, 5, UNI_NV__20000 } /* nv=20000 */, - { 1, 1966, 7639, 22, 9, UNI_INSC__NONJOINER } /* indicsyllabiccategory=nonjoiner */, - { 0, 9488, 1218, 4, 8, UNI_INKATAKANA } /* blk=katakana */, - { 288, 1591, 3170, 3, 10, UNI_ETHIOPICSUP } /* inethiopicsup */, - { 9, 8780, 4049, 6, 11, UNI_GEORGIANEXT } /* block=georgianext */, - { 4, 9768, 8470, 4, 7, UNI_LINA } /* scx=lineara */, - { 1, 3097, 2569, 18, 8, UNI_DT__VERT } /* decompositiontype=vertical */, - { 2, 3133, 9255, 18, 5, -UNI_EBASE } /* emojimodifierbase=false */, - { 4, 7325, 10117, 3, 3, UNI_IN__7 } /* in=v70 */, - { 6, 4033, 1, 16, 1, UNI_N } /* generalcategory=n */, - { 296, 9556, 36, 4, 1, UNI_GCB__T } /* gcb=t */, - { 0, 1552, 47, 9, 1, UNI_M } /* category=m */, - { 1, 5791, 9772, 13, 4, UNI_JG__SEEN } /* joininggroup=seen */, - { 1, 9270, 3475, 5, 18, 
UNI_INPC__TOPANDLEFTANDRIGHT } /* inpc=topandleftandright */, - { 33, 9532, 0, 4, 0, UNI_CYRL } /* cyrl */, - { 2, 1087, 10135, 27, 3, UNI_PCM } /* prependedconcatenationmark=yes */, - { 1, 7318, 9384, 10, 4, UNI_IN__10 } /* presentin=10.0 */, - { 0, 5986, 7950, 13, 1, UNI_NV__9 } /* numericvalue=9 */, - { 1, 4116, 2780, 3, 17, UNI_IDST } /* isidstrinaryoperator */, - { 49, 9768, 8888, 4, 4, UNI_HATR } /* scx=hatr */, - { 0, 4116, 59, 3, 3, UNI_IDEO } /* isideo */, - { 0, 9488, 951, 4, 18, UNI_INVS } /* blk=variationselectors */, - { 289, 3385, 0, 17, 0, UNI_RI } /* regionalindicator */, - { 1, 8780, 7378, 6, 10, UNI_SUPARROWSA } /* block=suparrowsa */, - { 8, 7088, 25, 10, 1, UNI_BC__S } /* bidiclass=s */, - { 1, 1552, 38, 9, 2, UNI_XPOSIXDIGIT } /* category=nd */, - { 65, 4448, 0, 4, 0, UNI_BAMU } /* bamu */, - { 0, 7438, 495, 10, 2, UNI_WB__NU } /* wordbreak=nu */, - { 1, 5324, 5845, 4, 7, UNI_INMALAYALAM } /* inmalayalam */, - { 18, 9488, 1922, 4, 22, UNI_DIACRITICALSFORSYMBOLS } /* blk=diacriticalsforsymbols */, - { 3, 3785, 0, 10, 0, UNI_MANI } /* manichaean */, - { 98, 6231, 150, 4, 33, UNI_DIACRITICALSSUP } /* incombiningdiacriticalmarkssupplement */, - { 10, 1273, 9836, 21, 4, UNI_CE } /* compositionexclusion=true */, - { 1, 6481, 0, 12, 0, UNI_HUNG } /* oldhungarian */, - { 0, 8386, 0, 7, 0, UNI_CJKEXTF } /* cjkextf */, - { 4, 3385, 1025, 18, 2, -UNI_RI } /* regionalindicator=no */, - { 16, 2224, 2288, 3, 6, UNI_INSINHALA } /* insinhala */, - { 0, 8589, 6409, 7, 12, UNI_MEND } /* script=mendekikakui */, - { 1, 4989, 1868, 3, 8, UNI_XPOSIXUPPER } /* isuppercase */, - { 0, 5791, 2223, 13, 3, UNI_JG__AIN } /* joininggroup=ain */, - { 197, 8780, 328, 6, 21, UNI_MATHOPERATORS } /* block=mathematicaloperators */, - { 0, 6420, 8548, 3, 6, UNI_OLCK } /* inolchiki */, - { 0, 9488, 8345, 5, 6, UNI_INBENGALI } /* blk=bengali */, - { 0, 9488, 4553, 4, 15, UNI_CONTROLPICTURES } /* blk=controlpictures */, - { 130, 184, 7378, 2, 10, UNI_SUPARROWSA } /* issuparrowsa */, 
- { 4, 10048, 8750, 3, 5, UNI_NV__80000 } /* nv=80000 */, - { 17, 9488, 7666, 4, 9, UNI_INOLDTURKIC } /* blk=oldturkic */, - { 5, 3836, 8582, 17, 7, UNI_PHAG } /* scriptextensions=phagspa */, - { 2, 1552, 133, 9, 4, UNI_M } /* category=mark */, - { 1, 5986, 7859, 13, 2, UNI_NV__20 } /* numericvalue=20 */, - { 32, 9776, 0, 4, 0, UNI_SGNW } /* sgnw */, - { 1, 8780, 4337, 6, 16, UNI_SUPMATHOPERATORS } /* block=supmathoperators */, - { 0, 6231, 660, 3, 29, UNI_CJKEXTF } /* incjkunifiedideographsextensionf */, - { 0, 9508, 9131, 5, 4, UNI_CCC__20 } /* ccc=ccc20 */, - { 0, 7428, 0, 10, 0, UNI_WARA } /* warangciti */, - { 0, 7438, 6653, 10, 11, UNI_WB__DQ } /* wordbreak=doublequote */, - { 1, 250, 0, 33, 0, UNI_MISCMATHSYMBOLSA } /* miscellaneousmathematicalsymbolsa */, - { 0, 3367, 10135, 18, 3, UNI__PERL_PATWS } /* patternwhitespace=yes */, - { 21, 9277, 2329, 3, 20, UNI_HLUW } /* sc=anatolianhieroglyphs */, - { 3, 1033, 0, 27, 0, UNI_ENCLOSEDCJK } /* enclosedcjklettersandmonths */, - { 3, 9768, 9584, 4, 4, UNI_HLUW } /* scx=hluw */, - { 35, 6231, 8359, 3, 6, UNI_CJKEXTB } /* incjkextb */, - { 0, 7325, 9970, 3, 3, UNI_IN__5_DOT_2 } /* in=5.2 */, - { 1, 8512, 26, 7, 1, UNI_NFKCQC__Y } /* nfkcqc=y */, - { 0, 8589, 9325, 7, 5, UNI_RUNR } /* script=runic */, - { 0, 3836, 9095, 17, 5, UNI_BUHD } /* scriptextensions=buhid */, - { 0, 9488, 2912, 4, 19, UNI_SUNDANESESUP } /* blk=sundanesesupplement */, - { 1, 184, 8984, 2, 5, UNI_QMARK } /* isqmark */, - { 1, 10170, 0, 2, 0, UNI_CASEDLETTER } /* l_ */, - { 0, 4033, 8855, 16, 2, UNI_CF } /* generalcategory=cf */, - { 1, 10290, 9225, 6, 5, UNI_XPOSIXCNTRL } /* xposixcntrl */, - { 18, 9488, 1013, 4, 5, UNI_INGREEK } /* blk=greek */, - { 64, 9488, 3025, 4, 11, UNI_CHEROKEESUP } /* blk=cherokeesup */, - { 0, 2560, 0, 4, 0, UNI_MAND } /* mand */, - { 3, 9270, 7298, 5, 10, UNI_INPC__OVERSTRUCK } /* inpc=overstruck */, - { 0, 9277, 9860, 3, 4, UNI_VAI } /* sc=vaii */, - { 97, 3836, 9480, 17, 4, UNI_BATK } /* scriptextensions=batk */, - 
{ 12, 9488, 9452, 4, 4, UNI_INAHOM } /* blk=ahom */, - { 0, 9277, 3169, 3, 4, UNI_ETHI } /* sc=ethi */, - { 47, 184, 10180, 2, 2, UNI_ZS } /* iszs */, - { 0, 5171, 0, 4, 0, UNI_CHAM } /* cham */, - { 4, 5674, 1025, 13, 2, -UNI_BIDIM } /* bidimirrored=no */, - { 19, 2684, 0, 19, 0, UNI_EGYP } /* egyptianhieroglyphs */, - { 0, 10009, 3439, 3, 5, UNI_DT__SML } /* dt=small */, - { 1, 8780, 9285, 6, 5, UNI_INLIMBU } /* block=limbu */, - { 0, 9596, 7238, 4, 10, UNI_LB__H2 } /* hst=lvsyllable */, - { 5, 7318, 9397, 10, 3, UNI_IN__2_DOT_1 } /* presentin=2.1 */, - { 36, 6229, 10135, 12, 3, UNI_JOINC } /* joincontrol=yes */, - { 130, 9768, 3894, 5, 10, UNI_SGNW } /* scx=signwriting */, - { 6, 3717, 0, 17, 0, UNI_identifierstatus_values_index } /* identifierstatus= */, - { 112, 8589, 6253, 7, 5, UNI_KHMR } /* script=khmer */, - { 2, 8780, 2329, 6, 20, UNI_INANATOLIANHIEROGLYPHS } /* block=anatolianhieroglyphs */, - { 0, 1273, 0, 21, 0, UNI_ce_values_index } /* compositionexclusion= */, - { 1, 10024, 1186, 3, 2, UNI_PO } /* gc=po */, - { 4, 9488, 8659, 4, 7, UNI_INTIBETAN } /* blk=tibetan */, - { 394, 5674, 9255, 13, 5, -UNI_BIDIM } /* bidimirrored=false */, - { 22, 9488, 5242, 4, 14, UNI_LATINEXTC } /* blk=latinextendedc */, - { 1, 8780, 1677, 6, 14, UNI_LATINEXTA } /* block=latinextendeda */, - { 0, 184, 8380, 3, 6, UNI_CJKEXTE } /* iscjkexte */, - { 0, 9488, 2855, 4, 19, UNI_MONGOLIANSUP } /* blk=mongoliansupplement */, - { 0, 3052, 0, 9, 0, UNI_HALFMARKS } /* halfmarks */, - { 0, 8780, 1944, 6, 22, UNI_EARLYDYNASTICCUNEIFORM } /* block=earlydynasticcuneiform */, - { 0, 8780, 9008, 6, 6, UNI_INTHAANA } /* block=thaana */, - { 6, 8884, 3, 4, 1, -UNI_EXT } /* ext=f */, - { 2, 184, 1988, 2, 21, UNI_LOE } /* islogicalorderexception */, - { 0, 5986, 8738, 13, 5, UNI_NV__60000 } /* numericvalue=60000 */, - { 0, 21, 3549, 4, 15, UNI_ALCHEMICAL } /* inalchemicalsymbols */, - { 2, 5986, 7867, 13, 8, UNI_NV__1_SLASH_32 } /* numericvalue=3.12e-02 */, - { 0, 5986, 7971, 13, 8, 
UNI_NV__7_SLASH_12 } /* numericvalue=5.83e-01 */, - { 0, 5508, 36, 14, 1, UNI_PATSYN } /* patternsyntax=t */, - { 0, 5739, 9836, 13, 4, UNI_GRBASE } /* graphemebase=true */, - { 0, 2182, 18, 21, 2, UNI_RI } /* graphemeclusterbreak=ri */, - { 4, 4033, 6862, 16, 11, UNI_NO } /* generalcategory=othernumber */, - { 0, 8780, 5778, 6, 13, UNI_IPAEXT } /* block=ipaextensions */, - { 0, 9768, 9712, 4, 4, UNI_OSGE } /* scx=osge */, - { 0, 9262, 1194, 3, 2, UNI_LB__LF } /* sb=lf */, - { 182, 2218, 9306, 3, 4, UNI_INNUSHU } /* innushu */, - { 0, 117, 2431, 4, 18, UNI_ININSCRIPTIONALPAHLAVI } /* ininscriptionalpahlavi */, - { 0, 3836, 1628, 17, 4, UNI_PHAG } /* scriptextensions=phag */, - { 2, 5284, 0, 7, 0, UNI_LISUSUP } /* lisusup */, - { 0, 7325, 7814, 3, 1, UNI_IN__7 } /* in=7 */, - { 1, 9997, 10036, 3, 3, UNI_BC__LRE } /* bc=lre */, - { 10, 6231, 2141, 3, 17, UNI_CYRILLICSUP } /* incyrillicsupplement */, - { 0, 8780, 9800, 6, 4, UNI_TAGS } /* block=tags */, - { 56, 10048, 8714, 3, 4, UNI_NV__3000 } /* nv=3000 */, - { 0, 8780, 3439, 6, 12, UNI_SMALLKANAEXT } /* block=smallkanaext */, - { 0, 1591, 3684, 3, 10, UNI_ETHIOPICEXT } /* inethiopicext */, - { 0, 7318, 10081, 10, 3, UNI_IN__3 } /* presentin=v30 */, - { 3, 10009, 7, 3, 3, UNI_DT__CAN } /* dt=can */, - { 0, 5791, 5424, 13, 14, UNI_JG__MANICHAEANYODH } /* joininggroup=manichaeanyodh */, - { 3, 1188, 2297, 3, 3, UNI_INTHAI } /* inthai */, - { 0, 8589, 6940, 8, 10, UNI_SORA } /* script=sorasompeng */, - { 0, 9277, 7191, 6, 7, UNI_KHAR } /* sc=kharoshthi */, - { 20, 184, 9513, 3, 3, UNI_CHRS } /* ischrs */, - { 0, 8780, 5687, 6, 13, UNI_BLOCKELEMENTS } /* block=blockelements */, - { 5, 1552, 6851, 9, 11, UNI_LO } /* category=otherletter */, - { 0, 9488, 3241, 4, 18, UNI_GEORGIANSUP } /* blk=georgiansupplement */, - { 11, 3836, 9684, 17, 4, UNI_NEWA } /* scriptextensions=newa */, - { 0, 9524, 3, 4, 1, -UNI_CWT } /* cwt=f */, - { 2, 9488, 8924, 4, 6, UNI_INLEPCHA } /* blk=lepcha */, - { 32, 1441, 0, 10, 0, UNI_CJKSYMBOLS } 
/* cjksymbols */, - { 0, 6420, 7289, 3, 9, UNI_INOLDSOGDIAN } /* inoldsogdian */, - { 1, 7438, 495, 10, 7, UNI_WB__NU } /* wordbreak=numeric */, - { 0, 8589, 5550, 7, 14, UNI_SC__PHLP } /* script=psalterpahlavi */, - { 3, 10048, 7755, 3, 8, UNI_NV__1_SLASH_9 } /* nv=1.11e-01 */, - { 0, 8589, 9828, 7, 4, UNI_THAI } /* script=thai */, - { 2, 10033, 6217, 3, 12, UNI_LB__IS } /* lb=infixnumeric */, - { 0, 8852, 26, 6, 1, UNI_CWKCF } /* cwkcf=y */, - { 3, 184, 2409, 2, 4, UNI_GLAG } /* isglag */, - { 2, 6061, 0, 5, 0, UNI_BIDIC } /* bidic */, - { 85, 5578, 72, 14, 2, UNI_SB__LE } /* sentencebreak=le */, - { 162, 1966, 1489, 22, 24, UNI_INSC__CONSONANTSUCCEEDINGREPHA } /* indicsyllabiccategory=consonantsucceedingrepha */, - { 0, 3836, 9664, 17, 3, UNI_MRO } /* scriptextensions=mro */, - { 0, 5986, 5648, 13, 8, UNI_NV__10000000 } /* numericvalue=10000000 */, - { 0, 184, 5075, 3, 13, UNI_CJKCOMPATFORMS } /* iscjkcompatforms */, - { 0, 10033, 7108, 3, 10, UNI_LB__BA } /* lb=breakafter */, - { 0, 2182, 4360, 21, 9, UNI_WB__EB } /* graphemeclusterbreak=emodifier */, - { 21, 6231, 1442, 3, 23, UNI_CJKSYMBOLS } /* incjksymbolsandpunctuation */, - { 35, 6873, 0, 11, 0, UNI_SO } /* othersymbol */, - { 0, 8589, 9860, 7, 3, UNI_VAI } /* script=vai */, - { 0, 8688, 6026, 3, 11, UNI_ALPHABETICPF } /* isalphabeticpf */, - { 0, 9277, 8457, 4, 6, UNI_SC__KNDA } /* sc=kannada */, - { 38, 6805, 5176, 4, 2, UNI_INMIAO } /* inmiao */, - { 8, 9768, 8888, 4, 6, UNI_HATR } /* scx=hatran */, - { 0, 184, 749, 2, 21, UNI_ENCLOSEDALPHANUM } /* isenclosedalphanumerics */, - { 0, 8589, 9315, 7, 5, UNI_SC__ORYA } /* script=oriya */, - { 133, 7438, 5012, 10, 2, UNI_WB__SQ } /* wordbreak=sq */, - { 0, 9275, 9026, 5, 6, UNI_INSC__VIRAMA } /* insc=virama */, - { 2, 4973, 0, 8, 0, UNI_VEDICEXT } /* vedicext */, - { 52, 74, 0, 2, 0, UNI_ME } /* me */, - { 26, 1979, 0, 10, 0, UNI_L } /* category=l */, - { 0, 5986, 9060, 13, 5, UNI_NV__11_SLASH_12 } /* numericvalue=11/12 */, - { 1, 8589, 8219, 7, 4, 
UNI_SC__JAVA } /* script=java */, - { 0, 4033, 47, 16, 1, UNI_M } /* generalcategory=m */, - { 6, 10048, 7787, 3, 8, UNI_NV__3_SLASH_2 } /* nv=1.50e+00 */, - { 1, 1966, 4113, 22, 16, UNI_INSC__INVISIBLESTACKER } /* indicsyllabiccategory=invisiblestacker */, - { 1, 4033, 4943, 16, 15, UNI_TITLE } /* generalcategory=titlecaseletter */, - { 0, 8589, 6840, 7, 4, UNI_SC__NAND } /* script=nand */, - { 1, 10060, 10135, 3, 3, UNI_RI } /* ri=yes */, - { 256, 9488, 78, 4, 35, UNI_ARABICMATH } /* blk=arabicmathematicalalphabeticsymbols */, - { 0, 9716, 10135, 4, 3, UNI_PCM } /* pcm=yes */, - { 6, 9768, 9285, 4, 5, UNI_LIMB } /* scx=limbu */, - { 1, 9768, 8484, 4, 7, UNI_MAND } /* scx=mandaic */, - { 5, 3836, 1013, 17, 5, UNI_GREK } /* scriptextensions=greek */, - { 6, 7325, 10087, 3, 3, UNI_IN__3_DOT_2 } /* in=v32 */, - { 0, 5324, 4342, 4, 11, UNI_MATHOPERATORS } /* inmathoperators */, - { 1, 4001, 0, 16, 0, UNI_CYPRIOTSYLLABARY } /* cypriotsyllabary */, - { 0, 8299, 0, 8, 0, UNI_TFNG } /* tifinagh */, - { 196, 2288, 1656, 4, 4, UNI_INHANGUL } /* inhangul */, - { 2, 5986, 7821, 13, 1, UNI_NV__8 } /* numericvalue=8 */, - { 64, 184, 7428, 2, 10, UNI_WARA } /* iswarangciti */, - { 1, 3836, 6409, 17, 12, UNI_MEND } /* scriptextensions=mendekikakui */, - { 3, 5986, 8744, 13, 5, UNI_NV__70000 } /* numericvalue=70000 */, - { 1, 9488, 4129, 4, 9, UNI_LATIN1 } /* blk=latin1sup */, - { 0, 7088, 18, 10, 1, UNI_BC__R } /* bidiclass=r */, - { 0, 6231, 8366, 3, 6, UNI_CJKEXTC } /* incjkextc */, - { 2, 183, 0, 34, 0, UNI_MISCPICTOGRAPHS } /* miscellaneoussymbolsandpictographs */, - { 0, 2280, 6863, 3, 10, UNI_NO } /* isothernumber */, - { 0, 9528, 36, 4, 1, UNI_CWU } /* cwu=t */, - { 265, 8589, 8900, 7, 6, UNI_SC__KTHI } /* script=kaithi */, - { 46, 6231, 43, 3, 15, UNI_CJKCOMPAT } /* incjkcompatibility */, - { 0, 9277, 8484, 3, 7, UNI_SC__MAND } /* sc=mandaic */, - { 4, 184, 9624, 2, 4, UNI_LAO } /* islaoo */, - { 3, 3836, 9692, 17, 4, UNI_NSHU } /* scriptextensions=nshu */, - { 1, 3151, 
36, 18, 1, UNI_EPRES } /* emojipresentation=t */, - { 58, 3836, 7292, 18, 3, UNI_SOGD } /* scriptextensions=sogd */, - { 81, 9488, 8561, 4, 7, UNI_INOSMANYA } /* blk=osmanya */, - { 3, 21, 8990, 2, 6, UNI_INREJANG } /* inrejang */, - { 32, 7088, 10039, 10, 3, UNI_BC__LRI } /* bidiclass=lri */, - { 4, 10024, 1563, 3, 2, UNI_PS } /* gc=ps */, - { 1, 3836, 8680, 17, 7, UNI_ZZZZ } /* scriptextensions=unknown */, - { 1, 9768, 9672, 4, 4, UNI_MYMR } /* scx=mymr */, - { 0, 9071, 26, 4, 1, UNI_XPOSIXXDIGIT } /* hex=y */, - { 0, 5986, 9168, 13, 2, UNI_NV__27 } /* numericvalue=27 */, - { 0, 10033, 495, 3, 2, UNI_LB__NU } /* lb=nu */, - { 31, 8780, 2722, 6, 19, UNI_JAMOEXTA } /* block=hanguljamoextendeda */, - { 1, 184, 8414, 2, 4, UNI_ELBA } /* iselba */, - { 99, 2784, 80, 4, 33, UNI_ARABICMATH } /* inarabicmathematicalalphabeticsymbols */, - { 0, 6277, 0, 4, 0, UNI_MAHJ } /* mahj */, - { 35, 117, 3736, 4, 15, UNI_INDICSIYAQNUMBERS } /* inindicsiyaqnumbers */, - { 1, 8589, 9330, 7, 5, UNI_SC__TALE } /* script=taile */, - { 0, 9277, 9085, 3, 5, UNI_BATK } /* sc=batak */, - { 0, 9488, 4928, 4, 5, UNI_INTAMIL } /* blk=tamil */, - { 49, 3341, 0, 8, 0, UNI_DINGBATS } /* dingbats */, - { 0, 9488, 2665, 4, 11, UNI_COUNTINGROD } /* blk=countingrod */, - { 35, 4033, 0, 16, 0, UNI_gc_values_index } /* generalcategory= */, - { 4, 1114, 1, 26, 1, -UNI_CWKCF } /* changeswhennfkccasefolded=n */, - { 7, 6231, 690, 3, 29, UNI_CJKEXTG } /* incjkunifiedideographsextensiong */, - { 3, 7438, 18, 10, 2, UNI_RI } /* wordbreak=ri */, - { 0, 184, 10178, 2, 2, UNI_ZP } /* iszp */, - { 3, 5986, 9916, 13, 3, UNI_NV__2_SLASH_5 } /* numericvalue=2/5 */, - { 2, 8780, 8900, 6, 6, UNI_INKAITHI } /* block=kaithi */, - { 0, 2817, 0, 4, 0, UNI_MERO } /* mero */, - { 0, 10024, 4583, 3, 15, UNI_PD } /* gc=dashpunctuation */, - { 0, 7675, 0, 9, 0, UNI_PALM } /* palmyrene */, - { 16, 184, 2141, 3, 17, UNI_CYRILLICSUP } /* iscyrillicsupplement */, - { 3, 8780, 5830, 6, 13, UNI_LOWSURROGATES } /* 
block=lowsurrogates */, - { 0, 4033, 9225, 16, 5, UNI_XPOSIXCNTRL } /* generalcategory=cntrl */, - { 8, 21, 8936, 2, 6, UNI_INLYCIAN } /* inlycian */, - { 16, 5791, 9075, 13, 5, UNI_JG__ALAPH } /* joininggroup=alaph */, - { 3, 4989, 4959, 3, 14, UNI_UPPERCASELETTER } /* isuppercaseletter */, - { 120, 184, 3937, 2, 8, UNI_BOPO } /* isbopomofo */, - { 0, 10132, 8323, 3, 7, UNI_WB__LE } /* wb=aletter */, - { 4, 8589, 9245, 7, 5, UNI_SC__DOGR } /* script=dogra */, - { 67, 3853, 1, 17, 1, -UNI_STERM } /* sentenceterminal=n */, - { 0, 10182, 1159, 33, 5, UNI__PERL_PROBLEMATIC_LOCALE_FOLDEDS_START } /* _perl_problematic_locale_foldeds_start */, - { 3, 9768, 9002, 4, 6, UNI_TELU } /* scx=telugu */, - { 0, 5040, 0, 5, 0, UNI_XPOSIXDIGIT } /* digit */, - { 2, 5564, 1025, 14, 2, -UNI_QMARK } /* quotationmark=no */, - { 0, 7, 0, 1, 0, UNI_C } /* c */, - { 1, 9640, 1, 4, 1, -UNI_LOE } /* loe=n */, - { 0, 8780, 3921, 6, 9, UNI_ARABICSUP } /* block=arabicsup */, - { 0, 9828, 0, 4, 0, UNI_THAI } /* thai */, - { 0, 9488, 3241, 4, 8, UNI_INGEORGIAN } /* blk=georgian */, - { 0, 3836, 9440, 17, 4, UNI_ADLM } /* scriptextensions=adlm */, - { 163, 6609, 10135, 11, 3, UNI_DEP } /* deprecated=yes */, - { 4, 10296, 62, 7, 5, UNI_POSIXGRAPH } /* isposixgraph */, - { 0, 184, 8373, 3, 6, UNI_CJKEXTD } /* iscjkextd */, - { 103, 9488, 5228, 4, 14, UNI_LATINEXTB } /* blk=latinextendedb */, - { 1, 4791, 0, 17, 0, UNI_INMEROITICCURSIVE } /* inmeroiticcursive */, - { 4, 1812, 9255, 22, 5, -UNI_CWL } /* changeswhenlowercased=false */, - { 0, 9768, 8498, 4, 7, UNI_MULT } /* scx=multani */, - { 1, 9277, 4369, 3, 6, UNI_SC__SYRC } /* sc=syriac */, - { 1, 9270, 7676, 3, 8, UNI_PALM } /* inpalmyrene */, - { 0, 9277, 9325, 3, 5, UNI_RUNR } /* sc=runic */, - { 474, 1552, 467, 9, 5, UNI_P } /* category=punct */, - { 0, 4116, 6555, 3, 9, UNI_IDC } /* isidcontinue */, - { 0, 9716, 3, 4, 1, -UNI_PCM } /* pcm=f */, - { 0, 6620, 0, 6, 0, UNI_DOMINO } /* domino */, - { 0, 3836, 4868, 17, 15, UNI_NARB } /* 
scriptextensions=oldnortharabian */, - { 2, 184, 4973, 2, 15, UNI_VEDICEXT } /* isvedicextensions */, - { 11, 1828, 36, 6, 1, UNI_CASED } /* cased=t */, - { 20, 9488, 8315, 4, 8, UNI_INUGARITIC } /* blk=ugaritic */, - { 0, 7218, 184, 10, 2, UNI_LB__IS } /* linebreak=is */, - { 0, 7739, 1025, 8, 2, -UNI_IDS } /* idstart=no */, - { 4, 9488, 9038, 4, 6, UNI_INYEZIDI } /* blk=yezidi */, - { 0, 8589, 9285, 7, 5, UNI_SC__LIMB } /* script=limbu */, - { 2, 7325, 7987, 3, 3, UNI_IN__6_DOT_2 } /* in=6.2 */, - { 3, 7155, 2723, 3, 9, UNI_JAMO } /* ishanguljamo */, - { 0, 7318, 10084, 10, 3, UNI_IN__3_DOT_1 } /* presentin=v31 */, - { 1, 3097, 9868, 18, 4, UNI_EA__F } /* decompositiontype=wide */, - { 106, 9277, 6939, 3, 11, UNI_SORA } /* sc=sorasompeng */, - { 0, 9488, 8211, 4, 8, UNI_JAMOEXTB } /* blk=jamoextb */, - { 12, 9556, 0, 4, 0, UNI_gcb_values_index } /* gcb= */, - { 41, 2182, 36, 21, 1, UNI_GCB__T } /* graphemeclusterbreak=t */, - { 0, 7325, 7781, 3, 1, UNI_IN__4 } /* in=4 */, - { 3, 8762, 10135, 6, 3, UNI_XPOSIXALPHA } /* alpha=yes */, - { 0, 1552, 6873, 9, 11, UNI_SO } /* category=othersymbol */, - { 5, 1059, 0, 2, 0, UNI_SO } /* so */, - { 0, 9556, 1194, 4, 2, UNI_LB__LF } /* gcb=lf */, - { 0, 3836, 8786, 17, 4, UNI_CARI } /* scriptextensions=cari */, - { 0, 10333, 8611, 3, 6, UNI_SIDD } /* issiddham */, - { 7, 5986, 9994, 13, 3, UNI_NV__9_SLASH_2 } /* numericvalue=9/2 */, - { 48, 5578, 138, 14, 2, UNI_SB__FO } /* sentencebreak=fo */, - { 6, 9277, 8638, 3, 7, UNI_SC__TGLG } /* sc=tagalog */, - { 69, 4643, 26, 15, 1, UNI_ECOMP } /* emojicomponent=y */, - { 128, 5200, 0, 14, 0, UNI_KANASUP } /* kanasupplement */, - { 1, 5986, 8042, 13, 2, UNI_NV__18 } /* numericvalue=18 */, - { 0, 8906, 0, 6, 0, UNI_KANBUN } /* kanbun */, - { 2, 4916, 9336, 3, 3, UNI_TAKR } /* istakr */, - { 1, 184, 2120, 3, 13, UNI_CJKRADICALSSUP } /* iscjkradicalssup */, - { 18, 3097, 1253, 18, 4, UNI_DT__INIT } /* decompositiontype=init */, - { 3, 9640, 0, 4, 0, UNI_loe_values_index } /* loe= */, 
- { 25, 3097, 5904, 18, 4, UNI_DT__NONE } /* decompositiontype=none */, - { 9, 7318, 10120, 10, 3, UNI_IN__8 } /* presentin=v80 */, - { 0, 6097, 0, 12, 0, UNI_CYRILLICEXTA } /* cyrillicexta */, - { 88, 9488, 2119, 4, 21, UNI_CJKRADICALSSUP } /* blk=cjkradicalssupplement */, - { 6, 184, 7621, 2, 9, UNI_NBAT } /* isnabataean */, - { 1, 8780, 7368, 6, 10, UNI_SMALLFORMS } /* block=smallforms */, - { 1, 8884, 9836, 4, 4, UNI_EXT } /* ext=true */, - { 3, 8610, 0, 7, 0, UNI_SIDD } /* siddham */, - { 344, 5116, 3, 14, 1, -UNI_EMOD } /* emojimodifier=f */, - { 0, 9508, 9940, 4, 3, UNI_CCC__A } /* ccc=230 */, - { 1, 908, 0, 10, 0, UNI_CO } /* privateuse */, - { 1, 184, 10303, 2, 5, UNI_XPOSIXBLANK } /* isblank */, - { 0, 3836, 9672, 17, 4, UNI_MYMR } /* scriptextensions=mymr */, - { 0, 9768, 9512, 4, 4, UNI_CHRS } /* scx=chrs */, - { 38, 6231, 5075, 3, 13, UNI_CJKCOMPATFORMS } /* incjkcompatforms */, - { 5, 5564, 0, 13, 0, UNI_QMARK } /* quotationmark */, - { 0, 184, 283, 2, 33, UNI_MISCMATHSYMBOLSB } /* ismiscellaneousmathematicalsymbolsb */, - { 5, 1417, 9937, 24, 3, UNI_CCC__AL } /* canonicalcombiningclass=228 */, - { 1, 1188, 9009, 3, 5, UNI_INTHAANA } /* inthaana */, - { 0, 4033, 24, 16, 1, UNI_L } /* generalcategory=l */, - { 8, 9277, 2817, 3, 19, UNI_MERO } /* sc=meroitichieroglyphs */, - { 4, 3836, 9628, 17, 4, UNI_LATN } /* scriptextensions=latn */, - { 1, 1834, 3, 22, 1, -UNI_CWT } /* changeswhentitlecased=f */, - { 2, 8774, 36, 6, 1, UNI_BIDIM } /* bidim=t */, - { 0, 5791, 5856, 13, 13, UNI_JG__MALAYALAMNNNA } /* joininggroup=malayalamnnna */, - { 11, 5791, 6289, 13, 12, UNI_JG__MALAYALAMBHA } /* joininggroup=malayalambha */, - { 99, 7218, 4538, 10, 15, UNI_LB__CB } /* linebreak=contingentbreak */, - { 84, 2218, 6842, 4, 9, UNI_INNANDINAGARI } /* innandinagari */, - { 5, 4916, 9009, 3, 3, UNI_THAA } /* isthaa */, - { 1, 1552, 7, 9, 1, UNI_C } /* category=c */, - { 150, 2218, 1912, 3, 10, UNI_NUMBERFORMS } /* innumberforms */, - { 5, 9277, 9285, 3, 5, UNI_SC__LIMB 
} /* sc=limbu */, - { 135, 9768, 9797, 5, 3, UNI_SYRC } /* scx=syrc */, - { 10, 184, 4273, 2, 7, UNI_MYMR } /* ismyanmar */, - { 3, 8780, 4598, 6, 15, UNI_DIACRITICALSEXT } /* block=diacriticalsext */, - { 0, 9488, 3025, 4, 18, UNI_CHEROKEESUP } /* blk=cherokeesupplement */, - { 1, 1790, 0, 21, 0, UNI_CWCM } /* changeswhencasemapped */, - { 1, 7155, 2742, 3, 18, UNI_JAMOEXTB } /* ishanguljamoextendedb */, - { 23, 8780, 4478, 6, 15, UNI_BRAI } /* block=braillepatterns */, - { 0, 10333, 10183, 7, 4, UNI_XPOSIXSPACE } /* isspaceperl */, - { 6, 10027, 5179, 3, 3, UNI_JG__HEH } /* jg=heh */, - { 0, 8589, 9580, 7, 4, UNI_SC__HANO } /* script=hano */, - { 26, 10182, 7739, 6, 7, UNI__PERL_IDSTART } /* _perl_idstart */, - { 0, 9350, 36, 5, 1, UNI_XIDS } /* xids=t */, - { 306, 2224, 3888, 3, 16, UNI_SUTTONSIGNWRITING } /* insuttonsignwriting */, - { 88, 7325, 9982, 3, 3, UNI_IN__6_DOT_3 } /* in=6.3 */, - { 258, 10006, 9836, 3, 4, UNI_DI } /* di=true */, - { 0, 8954, 17, 7, 1, -UNI__PERL_NCHAR } /* nchar=no */, - { 0, 184, 1723, 2, 23, UNI_SUPPUNCTUATION } /* issupplementalpunctuation */, - { 0, 10024, 1527, 3, 9, UNI__PERL_SURROGATE } /* gc=surrogate */, - { 0, 3836, 9724, 17, 4, UNI_PHNX } /* scriptextensions=phnx */, - { 232, 6840, 0, 4, 0, UNI_NAND } /* nand */, - { 1, 10027, 5892, 3, 3, UNI_JG__NUN } /* jg=nun */, - { 32, 10327, 3379, 6, 5, UNI_POSIXSPACE } /* isperlspace */, - { 0, 7168, 0, 10, 0, UNI_DIAK } /* divesakuru */, - { 1, 2836, 0, 19, 0, UNI_MODIFIERTONELETTERS } /* modifiertoneletters */, - { 1, 8858, 10135, 6, 3, UNI_ECOMP } /* ecomp=yes */, - { 0, 9768, 9500, 4, 4, UNI_CAKM } /* scx=cakm */, - { 1, 7218, 9713, 10, 2, UNI_LB__SG } /* linebreak=sg */, - { 0, 9768, 7558, 4, 9, UNI_QAAI } /* scx=inherited */, - { 33, 9250, 10135, 5, 3, UNI_EMOD } /* emod=yes */, - { 0, 1273, 36, 21, 1, UNI_CE } /* compositionexclusion=t */, - { 0, 1417, 5377, 24, 2, UNI_CCC__7 } /* canonicalcombiningclass=nk */, - { 0, 1979, 0, 10, 1, UNI_UPPERCASELETTER } /* category=lu */, - 
{ 1, 9488, 6181, 4, 12, UNI_INGUNJALAGONDI } /* blk=gunjalagondi */, - { 0, 9277, 9305, 3, 5, UNI_NSHU } /* sc=nushu */, - { 2, 7128, 0, 10, 0, UNI_CJKSTROKES } /* cjkstrokes */, - { 1, 9488, 7358, 4, 10, UNI_INSAURASHTRA } /* blk=saurashtra */, - { 2, 184, 9624, 2, 3, UNI_LAO } /* islao */, - { 0, 5986, 8002, 13, 2, UNI_NV__26 } /* numericvalue=26 */, - { 0, 7218, 10162, 10, 2, UNI_GCB__L } /* linebreak=jl */, - { 32, 9508, 9141, 5, 4, UNI_CCC__22 } /* ccc=ccc22 */, - { 3, 3836, 8900, 17, 6, UNI_KTHI } /* scriptextensions=kaithi */, - { 1, 4360, 0, 4, 0, UNI_EMOD } /* emod */, - { 97, 10132, 1822, 3, 2, UNI_WB__NL } /* wb=nl */, - { 1, 3836, 9500, 17, 4, UNI_CAKM } /* scriptextensions=cakm */, - { 1, 9768, 2429, 4, 20, UNI_PHLI } /* scx=inscriptionalpahlavi */, - { 0, 9488, 9335, 4, 5, UNI_INTAKRI } /* blk=takri */, - { 0, 5438, 0, 14, 0, UNI_SK } /* modifiersymbol */, - { 0, 8512, 10135, 7, 3, UNI_NFKCQC__Y } /* nfkcqc=yes */, - { 64, 9768, 9876, 4, 4, UNI_XSUX } /* scx=xsux */, - { 0, 5037, 10135, 9, 3, UNI_XPOSIXXDIGIT } /* hexdigit=yes */, - { 11, 2161, 10135, 21, 3, UNI_EXTPICT } /* extendedpictographic=yes */, - { 1, 6928, 9255, 11, 5, -UNI_SD } /* softdotted=false */, - { 0, 1189, 5904, 3, 4, UNI_NV__NAN } /* nt=none */, - { 32, 1856, 10135, 22, 3, UNI_CWU } /* changeswhenuppercased=yes */, - { 4, 9488, 0, 4, 42, UNI_UCASEXT } /* blk=unifiedcanadianaboriginalsyllabicsextended */, - { 6, 8315, 0, 4, 0, UNI_UGAR } /* ugar */, - { 81, 5986, 8732, 13, 3, UNI_NV__500 } /* numericvalue=500 */, - { 12, 6928, 0, 11, 0, UNI_sd_values_index } /* softdotted= */, - { 0, 9277, 7675, 3, 9, UNI_PALM } /* sc=palmyrene */, - { 1, 9768, 4370, 5, 5, UNI_SYRC } /* scx=syriac */, - { 2, 7438, 1218, 10, 2, UNI_WB__KA } /* wordbreak=ka */, - { 4, 9768, 9676, 4, 4, UNI_NARB } /* scx=narb */, - { 0, 2760, 0, 19, 0, UNI_hst_values_index } /* hangulsyllabletype= */, - { 9, 2760, 6541, 19, 12, UNI_GCB__T } /* hangulsyllabletype=trailingjamo */, - { 3, 3836, 6886, 18, 3, UNI_SHAW } /* 
scriptextensions=shaw */, - { 332, 6061, 26, 12, 1, UNI_BIDIC } /* bidicontrol=y */, - { 0, 3836, 7, 17, 18, UNI_CANS } /* scriptextensions=canadianaboriginal */, - { 30, 7228, 1025, 10, 2, -UNI_XPOSIXLOWER } /* lowercase=no */, - { 8, 9444, 9400, 4, 4, UNI_AGE__13 } /* age=13.0 */, - { 4, 2032, 9836, 22, 4, UNI__PERL_NCHAR } /* noncharactercodepoint=true */, - { 0, 6840, 0, 11, 0, UNI_NAND } /* nandinagari */, - { 1, 10333, 6792, 3, 3, UNI_SAMR } /* issamr */, - { 0, 9488, 2119, 4, 14, UNI_CJKRADICALSSUP } /* blk=cjkradicalssup */, - { 0, 5550, 0, 14, 0, UNI_PHLP } /* psalterpahlavi */, - { 0, 9768, 9496, 4, 4, UNI_BUHD } /* scx=buhd */, - { 0, 2280, 7650, 4, 7, UNI_ITAL } /* isolditalic */, - { 4, 10048, 7789, 3, 2, UNI_NV__50 } /* nv=50 */, - { 532, 9277, 9532, 3, 4, UNI_SC__CYRL } /* sc=cyrl */, - { 117, 5791, 10000, 13, 3, UNI_JG__BEH } /* joininggroup=beh */, - { 0, 8589, 8942, 7, 4, UNI_LYDI } /* script=lydi */, - { 4, 8589, 8666, 7, 4, UNI_SC__TIRH } /* script=tirh */, - { 512, 9277, 3169, 3, 8, UNI_ETHI } /* sc=ethiopic */, - { 0, 9768, 9860, 4, 3, UNI_VAI } /* scx=vai */, - { 544, 4688, 7208, 15, 10, UNI_IDENTIFIERTYPE__LIMITEDUSE } /* identifiertype=limiteduse */, - { 0, 9488, 1723, 4, 23, UNI_SUPPUNCTUATION } /* blk=supplementalpunctuation */, - { 0, 7218, 5046, 10, 14, UNI_LB__CR } /* linebreak=carriagereturn */, - { 0, 184, 8394, 3, 6, UNI_CJKEXTG } /* iscjkextg */, - { 2, 4916, 4188, 3, 3, UNI_TALE } /* istale */, - { 0, 6609, 9255, 11, 5, -UNI_DEP } /* deprecated=false */, - { 26, 8780, 3115, 6, 18, UNI_DEVANAGARIEXT } /* block=devanagariextended */, - { 1, 9488, 2589, 4, 19, UNI_ANCIENTGREEKNUMBERS } /* blk=ancientgreeknumbers */, - { 0, 5324, 8245, 4, 6, UNI_INMAHAJANI } /* inmahajani */, - { 0, 8858, 3, 6, 1, -UNI_ECOMP } /* ecomp=f */, - { 0, 9768, 6796, 4, 11, UNI_MEDF } /* scx=medefaidrin */, - { 0, 5986, 8082, 13, 2, UNI_NV__19 } /* numericvalue=19 */, - { 0, 7318, 7408, 10, 10, UNI_AGE__NA } /* presentin=unassigned */, - { 32, 6231, 8841, 3, 
5, UNI_INCHAKMA } /* inchakma */, - { 0, 1087, 0, 27, 0, UNI_pcm_values_index } /* prependedconcatenationmark= */, - { 1, 8780, 9828, 6, 4, UNI_INTHAI } /* block=thai */, - { 0, 2287, 0, 21, 0, UNI_SINHALAARCHAICNUMBERS } /* sinhalaarchaicnumbers */, - { 0, 9290, 1, 5, 1, -UNI_MATH } /* math=n */, - { 40, 9768, 2061, 4, 4, UNI_MODI } /* scx=modi */, - { 0, 1060, 0, 27, 0, UNI_OCR } /* opticalcharacterrecognition */, - { 0, 3097, 1309, 18, 3, UNI_DT__SUB } /* decompositiontype=sub */, - { 82, 10027, 7148, 3, 10, UNI_JG__DALATHRISH } /* jg=dalathrish */, - { 0, 7318, 10087, 10, 3, UNI_IN__3_DOT_2 } /* presentin=v32 */, - { 65, 10033, 751, 3, 2, UNI_LB__CL } /* lb=cl */, - { 0, 9240, 3, 5, 1, -UNI_DASH } /* dash=f */, - { 0, 3836, 9544, 17, 4, UNI_DIAK } /* scriptextensions=diak */, - { 0, 9275, 1244, 5, 25, UNI_INSC__CONSONANTINITIALPOSTFIXED } /* insc=consonantinitialpostfixed */, - { 1, 4116, 447, 3, 31, UNI_IDEOGRAPHICSYMBOLS } /* isideographicsymbolsandpunctuation */, - { 0, 9488, 7648, 4, 9, UNI_INOLDITALIC } /* blk=olditalic */, - { 1, 7325, 7469, 3, 1, UNI_IN__5 } /* in=5 */, - { 11, 4628, 1204, 15, 9, UNI_EA__F } /* eastasianwidth=fullwidth */, - { 9, 3133, 9836, 18, 4, UNI_EBASE } /* emojimodifierbase=true */, - { 73, 9277, 6972, 3, 4, UNI_SC__SYLO } /* sc=sylo */, - { 4, 6061, 9836, 12, 4, UNI_BIDIC } /* bidicontrol=true */, - { 0, 184, 5284, 2, 4, UNI_LISU } /* islisu */, - { 1, 3836, 8421, 17, 7, UNI_ELYM } /* scriptextensions=elymaic */, - { 0, 9230, 0, 5, 0, UNI_cwcf_values_index } /* cwcf= */, - { 0, 184, 1561, 2, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* issupsymbolsandpictographs */, - { 0, 4658, 3, 15, 1, -UNI_GREXT } /* graphemeextend=f */, - { 1, 9488, 217, 4, 33, UNI_DIACRITICALSEXT } /* blk=combiningdiacriticalmarksextended */, - { 1, 5578, 6556, 15, 8, UNI_SB__SC } /* sentencebreak=scontinue */, - { 3, 9250, 9836, 5, 4, UNI_EMOD } /* emod=true */, - { 98, 9260, 36, 5, 1, UNI_IDSB } /* idsb=t */, - { 173, 1966, 6457, 22, 12, UNI_INSC__NUMBERJOINER } 
/* indicsyllabiccategory=numberjoiner */, - { 104, 4688, 0, 15, 0, UNI_identifiertype_values_index } /* identifiertype= */, - { 260, 8589, 9576, 7, 4, UNI_SC__GURU } /* script=guru */, - { 16, 3836, 9696, 17, 4, UNI_OGAM } /* scriptextensions=ogam */, - { 1, 8400, 9255, 7, 5, -UNI_COMPEX } /* compex=false */, - { 36, 10296, 3379, 7, 5, UNI_POSIXSPACE } /* isposixspace */, - { 0, 9508, 9946, 4, 3, UNI_CCC__DB } /* ccc=233 */, - { 0, 6109, 0, 12, 0, UNI_CYRILLICEXTB } /* cyrillicextb */, - { 0, 184, 8900, 2, 6, UNI_KTHI } /* iskaithi */, - { 0, 951, 0, 28, 0, UNI_VSSUP } /* variationselectorssupplement */, - { 276, 9596, 5973, 4, 13, UNI_HST__NA } /* hst=notapplicable */, - { 61, 1723, 0, 23, 0, UNI_SUPPUNCTUATION } /* supplementalpunctuation */, - { 3, 3097, 4017, 18, 5, UNI_DT__FIN } /* decompositiontype=final */, - { 0, 9345, 9836, 5, 4, UNI_XIDC } /* xidc=true */, - { 461, 8589, 9793, 8, 3, UNI_SOGO } /* script=sogo */, - { 0, 8780, 5032, 6, 5, UNI_ASCII } /* block=ascii */, - { 0, 8589, 9624, 7, 4, UNI_LAO } /* script=laoo */, - { 5, 2288, 2205, 4, 12, UNI_INHANIFIROHINGYA } /* inhanifirohingya */, - { 3, 42, 0, 26, 0, UNI_CJKCOMPATIDEOGRAPHS } /* cjkcompatibilityideographs */, - { 1, 8780, 5284, 6, 14, UNI_LISUSUP } /* block=lisusupplement */, - { 0, 8291, 0, 4, 0, UNI_TAGB } /* tagb */, - { 0, 4989, 7409, 3, 9, UNI_CN } /* isunassigned */, - { 10, 8870, 36, 6, 1, UNI_EPRES } /* epres=t */, - { 1, 9488, 5960, 4, 13, UNI_MISCTECHNICAL } /* blk=misctechnical */, - { 6, 8589, 8645, 7, 7, UNI_LANA } /* script=taitham */, - { 5, 9488, 1006, 4, 27, UNI_ANCIENTGREEKMUSIC } /* blk=ancientgreekmusicalnotation */, - { 0, 4113, 4974, 3, 7, UNI_VEDICEXT } /* invedicext */, - { 2, 122, 0, 9, 0, UNI_DIA } /* diacritic */, - { 0, 1812, 1, 22, 1, -UNI_CWL } /* changeswhenlowercased=n */, - { 71, 9488, 3870, 4, 17, UNI_SMALLFORMS } /* blk=smallformvariants */, - { 0, 2224, 1724, 3, 22, UNI_SUPPUNCTUATION } /* insupplementalpunctuation */, - { 32, 184, 84, 2, 4, UNI_MATH } /* 
ismath */, - { 0, 6231, 1879, 3, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* incjkcompatideographssup */, - { 0, 8780, 7648, 6, 9, UNI_INOLDITALIC } /* block=olditalic */, - { 0, 9768, 8179, 4, 8, UNI_GURU } /* scx=gurmukhi */, - { 3, 184, 1171, 2, 2, UNI_TITLE } /* islt */, - { 0, 3836, 6840, 17, 11, UNI_NAND } /* scriptextensions=nandinagari */, - { 0, 1966, 2844, 22, 10, UNI_INSC__TONELETTER } /* indicsyllabiccategory=toneletter */, - { 1, 3547, 0, 17, 0, UNI_ALCHEMICAL } /* alchemicalsymbols */, - { 0, 8421, 0, 7, 0, UNI_ELYM } /* elymaic */, - { 3, 10048, 10152, 3, 2, UNI_NV__49 } /* nv=49 */, - { 0, 9488, 9315, 4, 5, UNI_INORIYA } /* blk=oriya */, - { 35, 9277, 8315, 3, 4, UNI_UGAR } /* sc=ugar */, - { 0, 9508, 9156, 5, 4, UNI_CCC__25 } /* ccc=ccc25 */, - { 36, 3836, 5171, 17, 4, UNI_CHAM } /* scriptextensions=cham */, - { 6, 4033, 1186, 16, 2, UNI_PO } /* generalcategory=po */, - { 2, 8882, 1, 6, 1, -UNI_GREXT } /* grext=n */, - { 17, 9277, 9816, 3, 4, UNI_TAVT } /* sc=tavt */, - { 0, 1563, 0, 2, 0, UNI_PS } /* ps */, - { 66, 9488, 8906, 4, 6, UNI_KANBUN } /* blk=kanbun */, - { 0, 9444, 8043, 4, 3, UNI_AGE__8 } /* age=8.0 */, - { 0, 9290, 1025, 5, 2, -UNI_MATH } /* math=no */, - { 11, 1979, 36, 10, 1, UNI_TITLE } /* category=lt */, - { 3, 10048, 9976, 3, 3, UNI_NV__5_SLASH_8 } /* nv=5/8 */, - { 0, 8997, 0, 6, 0, UNI_TERM } /* term=t */, - { 0, 184, 6730, 2, 11, UNI_KATAKANAEXT } /* iskatakanaext */, - { 262, 8780, 3600, 6, 4, UNI_UCAS } /* block=ucas */, - { 8, 7155, 9593, 3, 3, UNI_HMNP } /* ishmnp */, - { 5, 7155, 1193, 3, 25, UNI_HALFANDFULLFORMS } /* ishalfwidthandfullwidthforms */, - { 316, 9768, 8597, 5, 6, UNI_SHRD } /* scx=sharada */, - { 0, 1988, 36, 22, 1, UNI_LOE } /* logicalorderexception=t */, - { 0, 3374, 1, 11, 1, -UNI_XPOSIXSPACE } /* whitespace=n */, - { 0, 9444, 10075, 4, 3, UNI_AGE__2 } /* age=v20 */, - { 8, 9444, 9955, 4, 3, UNI_AGE__3_DOT_2 } /* age=3.2 */, - { 0, 2288, 8444, 4, 5, UNI_INHANUNOO } /* inhanunoo */, - { 0, 6231, 510, 3, 29, 
UNI_CJKEXTA } /* incjkunifiedideographsextensiona */, - { 2, 184, 6098, 3, 11, UNI_CYRILLICEXTA } /* iscyrillicexta */, - { 0, 10060, 1, 3, 1, -UNI_RI } /* ri=n */, - { 0, 6231, 8352, 3, 6, UNI_CJKEXTA } /* incjkexta */, - { 0, 1988, 9255, 22, 5, -UNI_LOE } /* logicalorderexception=false */, - { 2, 5791, 7045, 13, 3, UNI_JG__FEH } /* joininggroup=feh */, - { 64, 4116, 325, 3, 3, UNI_ITAL } /* isital */, - { 0, 7088, 10042, 10, 3, UNI_BC__LRO } /* bidiclass=lro */, - { 47, 7155, 8, 3, 2, UNI_HAN } /* ishan */, - { 0, 5986, 7765, 13, 2, UNI_NV__25 } /* numericvalue=25 */, - { 3, 9488, 4340, 4, 13, UNI_MATHOPERATORS } /* blk=mathoperators */, - { 0, 10033, 8680, 3, 7, UNI_LB__XX } /* lb=unknown */, - { 2, 10024, 1059, 3, 2, UNI_SO } /* gc=so */, - { 8, 7088, 407, 10, 2, UNI_BC__ON } /* bidiclass=on */, - { 3, 4245, 0, 10, 0, UNI_SM } /* mathsymbol */, - { 32, 8780, 4928, 6, 5, UNI_INTAMIL } /* block=tamil */, - { 0, 9488, 5550, 4, 14, UNI_INPSALTERPAHLAVI } /* blk=psalterpahlavi */, - { 3, 8870, 1025, 6, 2, -UNI_EPRES } /* epres=no */, - { 4, 9876, 0, 4, 0, UNI_XSUX } /* xsux */, - { 3, 8966, 0, 7, 0, UNI_DT__CAN } /* nfdqc=n */, - { 4, 9265, 9255, 5, 5, -UNI_IDST } /* idst=false */, - { 11, 7218, 5088, 10, 14, UNI_LB__SA } /* linebreak=complexcontext */, - { 1, 3836, 3598, 17, 17, UNI_AGHB } /* scriptextensions=caucasianalbanian */, - { 0, 8780, 4049, 6, 16, UNI_GEORGIANEXT } /* block=georgianextended */, - { 10, 3385, 1, 18, 1, -UNI_RI } /* regionalindicator=n */, - { 0, 8589, 9095, 7, 5, UNI_SC__BUHD } /* script=buhid */, - { 1, 10024, 10170, 3, 2, UNI_CASEDLETTER } /* gc=l_ */, - { 1, 5791, 6774, 13, 11, UNI_JG__MALAYALAMJA } /* joininggroup=malayalamja */, - { 4, 117, 5779, 3, 12, UNI_IPAEXT } /* inipaextensions */, - { 56, 5986, 8756, 13, 6, UNI_NV__900000 } /* numericvalue=900000 */, - { 2, 8589, 3169, 7, 8, UNI_ETHI } /* script=ethiopic */, - { 0, 10033, 2444, 3, 2, UNI_LB__HL } /* lb=hl */, - { 6, 1114, 9255, 26, 5, -UNI_CWKCF } /* 
changeswhennfkccasefolded=false */, - { 0, 10027, 9044, 3, 4, UNI_JG__YUDH } /* jg=yudh */, - { 2, 4385, 0, 6, 0, UNI_TANG } /* tangut */, - { 2, 8780, 2245, 6, 14, UNI_MEETEIMAYEKEXT } /* block=meeteimayekext */, - { 32, 3836, 9330, 17, 5, UNI_TALE } /* scriptextensions=taile */, - { 0, 3836, 8107, 17, 4, UNI_BALI } /* scriptextensions=bali */, - { 32, 5986, 5648, 13, 7, UNI_NV__1000000 } /* numericvalue=1000000 */, - { 24, 8780, 4369, 6, 6, UNI_INSYRIAC } /* block=syriac */, - { 206, 4838, 17, 16, 1, UNI_NFKCQC__N } /* nfkcquickcheck=no */, - { 2, 6061, 3, 12, 1, -UNI_BIDIC } /* bidicontrol=f */, - { 0, 9277, 8344, 3, 4, UNI_SC__BENG } /* sc=beng */, - { 0, 9277, 9544, 3, 4, UNI_DIAK } /* sc=diak */, - { 426, 4369, 0, 16, 0, UNI_SYRIACSUP } /* syriacsupplement */, - { 1, 6231, 1902, 4, 20, UNI_INDICNUMBERFORMS } /* incommonindicnumberforms */, - { 1, 10027, 9075, 3, 5, UNI_JG__ALAPH } /* jg=alaph */, - { 2, 4478, 0, 7, 0, UNI_BRAI } /* braille */, - { 1, 8589, 1654, 7, 6, UNI_SC__HANG } /* script=hangul */, - { 68, 9508, 8817, 5, 5, UNI_CCC__129 } /* ccc=ccc129 */, - { 0, 9015, 3, 5, 1, -UNI_IDEO } /* ideo=f */, - { 8, 1417, 9472, 24, 3, UNI_CCC__202 } /* canonicalcombiningclass=atb */, - { 24, 184, 4613, 2, 15, UNI_DIACRITICALSSUP } /* isdiacriticalssup */, - { 0, 9488, 4337, 4, 16, UNI_SUPMATHOPERATORS } /* blk=supmathoperators */, - { 7, 1594, 0, 14, 0, UNI_MUSIC } /* musicalsymbols */, - { 97, 4791, 2247, 4, 12, UNI_MEETEIMAYEKEXT } /* inmeeteimayekext */, - { 3, 184, 1344, 2, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* issymbolsforlegacycomputing */, - { 51, 9488, 446, 4, 18, UNI_IDEOGRAPHICSYMBOLS } /* blk=ideographicsymbols */, - { 10, 9488, 5284, 4, 14, UNI_LISUSUP } /* blk=lisusupplement */, - { 0, 9620, 0, 4, 0, UNI_LANA } /* lana */, - { 0, 9488, 1631, 4, 23, UNI_GEOMETRICSHAPESEXT } /* blk=geometricshapesextended */, - { 0, 6231, 1442, 3, 9, UNI_CJKSYMBOLS } /* incjksymbols */, - { 0, 10132, 727, 3, 2, UNI_WB__MN } /* wb=mn */, - { 68, 1166, 10135, 26, 3, 
UNI_DI } /* defaultignorablecodepoint=yes */, - { 0, 1188, 8639, 3, 6, UNI_INTAGALOG } /* intagalog */, - { 320, 9488, 6796, 4, 11, UNI_INMEDEFAIDRIN } /* blk=medefaidrin */, - { 402, 3836, 8491, 17, 4, UNI_MARC } /* scriptextensions=marc */, - { 4, 9488, 5752, 4, 8, UNI_GREEKEXT } /* blk=greekext */, - { 1, 7088, 4465, 12, 13, UNI_BC__BN } /* bidiclass=boundaryneutral */, - { 91, 8688, 863, 4, 4, UNI_ARROWS } /* isarrows */, - { 0, 184, 867, 2, 18, UNI_PHONETICEXT } /* isphoneticextensions */, - { 0, 8107, 0, 4, 0, UNI_BALI } /* bali */, - { 1, 10333, 4370, 3, 8, UNI_SYRIACSUP } /* issyriacsup */, - { 0, 8337, 0, 7, 0, UNI_AVST } /* avestan */, - { 8, 184, 43, 3, 2, UNI_CJK } /* iscjk */, - { 0, 9488, 8470, 4, 7, UNI_INLINEARA } /* blk=lineara */, - { 0, 9768, 4145, 4, 7, UNI_LINB } /* scx=linearb */, - { 496, 7325, 7979, 3, 3, UNI_IN__6 } /* in=6.0 */, - { 0, 2218, 7623, 4, 7, UNI_INNABATAEAN } /* innabataean */, - { 22, 9748, 0, 4, 0, UNI_RJNG } /* rjng */, - { 0, 3836, 9736, 17, 4, UNI_COPT } /* scriptextensions=qaac */, - { 97, 2784, 4435, 4, 13, UNI_ARABICEXTA } /* inarabicextendeda */, - { 38, 9444, 9967, 4, 3, UNI_AGE__5_DOT_1 } /* age=5.1 */, - { 121, 3836, 8876, 17, 4, UNI_GOTH } /* scriptextensions=goth */, - { 5, 10033, 83, 3, 2, UNI_LB__CM } /* lb=cm */, - { 4, 9997, 102, 3, 2, UNI_BC__ET } /* bc=et */, - { 0, 5452, 10135, 14, 3, UNI_NFCQC__Y } /* nfcquickcheck=yes */, - { 12, 9488, 3025, 4, 8, UNI_INCHEROKEE } /* blk=cherokee */, - { 72, 9524, 10135, 4, 3, UNI_CWT } /* cwt=yes */, - { 22, 9277, 2485, 3, 4, UNI_SC__MONG } /* sc=mong */, - { 136, 8267, 1, 8, 1, -UNI_RADICAL } /* radical=n */, - { 68, 8219, 0, 8, 0, UNI_JAVA } /* javanese */, - { 1, 21, 9066, 3, 4, UNI_INADLAM } /* inadlam */, - { 385, 1966, 1608, 22, 23, UNI_INSC__CONSONANTPRECEDINGREPHA } /* indicsyllabiccategory=consonantprecedingrepha */, - { 0, 6576, 3, 11, 1, -UNI_XPOSIXALPHA } /* alphabetic=f */, - { 8, 5986, 7978, 13, 2, UNI_NV__16 } /* numericvalue=16 */, - { 41, 1552, 598, 9, 
2, UNI_XPOSIXCNTRL } /* category=cc */, - { 8, 6241, 0, 12, 1, UNI_JT__U } /* joiningtype=u */, - { 2, 10024, 6598, 3, 11, UNI_CASEDLETTER } /* gc=casedletter */, - { 0, 9250, 1, 5, 1, -UNI_EMOD } /* emod=n */, - { 1, 6121, 0, 12, 0, UNI_CYRILLICEXTC } /* cyrillicextc */, - { 0, 6554, 0, 10, 0, UNI_IDC } /* idcontinue */, - { 0, 2760, 6741, 19, 11, UNI_GCB__L } /* hangulsyllabletype=leadingjamo */, - { 2, 5986, 9988, 13, 3, UNI_NV__7_SLASH_8 } /* numericvalue=7/8 */, - { 38, 5578, 1194, 14, 2, UNI_LB__LF } /* sentencebreak=lf */, - { 7, 10132, 3385, 3, 17, UNI_RI } /* wb=regionalindicator */, - { 2, 8589, 8428, 7, 4, UNI_SC__GRAN } /* script=gran */, - { 1, 4838, 9295, 15, 5, UNI_NFCQC__M } /* nfkcquickcheck=maybe */, - { 0, 9768, 9310, 4, 5, UNI_OGAM } /* scx=ogham */, - { 1, 3424, 1, 3, 33, UNI_UCAS } /* inunifiedcanadianaboriginalsyllabics */, - { 12, 21, 5804, 2, 13, UNI_KANAEXTA } /* inkanaextendeda */, - { 1, 1044, 0, 6, 0, UNI_L } /* letter */, - { 106, 9508, 9943, 4, 3, UNI_CCC__AR } /* ccc=232 */, - { 0, 7738, 3, 9, 1, -UNI_XIDS } /* xidstart=f */, - { 0, 184, 8491, 2, 7, UNI_MARC } /* ismarchen */, - { 32, 8589, 3751, 7, 17, UNI_KITS } /* script=khitansmallscript */, - { 0, 2280, 4899, 3, 14, UNI_PS } /* isopenpunctuation */, - { 1, 8780, 3241, 6, 11, UNI_GEORGIANSUP } /* block=georgiansup */, - { 1, 5791, 2203, 13, 21, UNI_JG__HANIFIROHINGYAKINNAYA } /* joininggroup=hanifirohingyakinnaya */, - { 92, 1966, 5144, 22, 14, UNI_INSC__GEMINATIONMARK } /* indicsyllabiccategory=geminationmark */, - { 0, 9768, 9085, 4, 5, UNI_BATK } /* scx=batak */, - { 1, 9768, 9652, 4, 4, UNI_MERC } /* scx=merc */, - { 0, 96, 0, 5, 0, UNI_XPOSIXALPHA } /* alpha */, - { 12, 8589, 9632, 7, 4, UNI_SC__LINA } /* script=lina */, - { 4, 8498, 0, 7, 0, UNI_MULT } /* multani */, - { 17, 1966, 9026, 22, 6, UNI_INSC__VIRAMA } /* indicsyllabiccategory=virama */, - { 0, 7438, 2444, 10, 2, UNI_LB__HL } /* wordbreak=hl */, - { 258, 7318, 9844, 10, 4, UNI_IN__11 } /* presentin=v110 */, - { 0, 
9768, 9440, 4, 4, UNI_ADLM } /* scx=adlm */, - { 0, 8589, 7118, 7, 10, UNI_CHRS } /* script=chorasmian */, - { 36, 5508, 9836, 14, 4, UNI_PATSYN } /* patternsyntax=true */, - { 2, 3836, 9656, 17, 4, UNI_MIAO } /* scriptextensions=miao */, - { 25, 3097, 8195, 18, 8, UNI_DT__ISO } /* decompositiontype=isolated */, - { 45, 5791, 5336, 13, 4, UNI_JG__BETH } /* joininggroup=beth */, - { 3, 10048, 10150, 3, 2, UNI_NV__48 } /* nv=48 */, - { 4, 4853, 1025, 15, 2, UNI_NFKDQC__N } /* nfkdquickcheck=no */, - { 1, 10048, 8756, 3, 6, UNI_NV__900000 } /* nv=900000 */, - { 7, 9346, 36, 4, 1, UNI_IDC } /* idc=t */, - { 1, 10024, 5438, 3, 14, UNI_SK } /* gc=modifiersymbol */, - { 0, 9444, 7923, 4, 3, UNI_AGE__4 } /* age=4.0 */, - { 1, 9488, 4369, 4, 6, UNI_INSYRIAC } /* blk=syriac */, - { 69, 4916, 9004, 4, 4, UNI_TELU } /* istelugu */, - { 8, 184, 1287, 2, 2, UNI_UPPERCASELETTER } /* islu */, - { 0, 8589, 2203, 7, 4, UNI_SC__HAN } /* script=hani */, - { 1, 6928, 36, 11, 1, UNI_SD } /* softdotted=t */, - { 14, 9508, 9472, 4, 3, UNI_CCC__202 } /* ccc=atb */, - { 3, 3836, 9816, 17, 4, UNI_TAVT } /* scriptextensions=tavt */, - { 0, 9277, 9620, 3, 4, UNI_LANA } /* sc=lana */, - { 0, 7739, 1, 8, 1, -UNI_IDS } /* idstart=n */, - { 5, 7218, 8449, 10, 2, UNI_LB__HY } /* linebreak=hy */, - { 49, 8780, 3331, 6, 18, UNI_ORNAMENTALDINGBATS } /* block=ornamentaldingbats */, - { 0, 8780, 8091, 6, 8, UNI_INARMENIAN } /* block=armenian */, - { 41, 9488, 4049, 4, 11, UNI_GEORGIANEXT } /* blk=georgianext */, - { 0, 9351, 1, 4, 1, -UNI_IDS } /* ids=n */, - { 49, 9444, 10078, 4, 3, UNI_AGE__2_DOT_1 } /* age=v21 */, - { 134, 10009, 1309, 3, 3, UNI_DT__SUB } /* dt=sub */, - { 296, 9277, 9464, 3, 4, UNI_ARMN } /* sc=armn */, - { 6, 8780, 7168, 6, 10, UNI_INDIVESAKURU } /* block=divesakuru */, - { 0, 8694, 3, 7, 1, -UNI_XPOSIXSPACE } /* wspace=f */, - { 100, 10132, 7729, 3, 9, UNI_WB__WSEGSPACE } /* wb=wsegspace */, - { 1, 5791, 5480, 13, 14, UNI_JG__NOJOININGGROUP } /* joininggroup=nojoininggroup */, - { 
257, 3259, 9836, 18, 4, UNI_IDSB } /* idsbinaryoperator=true */, - { 590, 5986, 9961, 13, 3, UNI_NV__3_SLASH_5 } /* numericvalue=3/5 */, - { 2, 7218, 5536, 10, 14, UNI_LB__PO } /* linebreak=postfixnumeric */, - { 39, 7428, 0, 4, 0, UNI_WARA } /* wara */, - { 0, 6231, 8387, 3, 6, UNI_CJKEXTF } /* incjkextf */, - { 0, 184, 8123, 2, 8, UNI_BUGI } /* isbuginese */, - { 0, 8509, 811, 4, 20, UNI_ENCLOSEDIDEOGRAPHICSUP } /* inenclosedideographicsup */, - { 1, 5986, 7922, 13, 2, UNI_NV__24 } /* numericvalue=24 */, - { 0, 9277, 7630, 3, 9, UNI_TALU } /* sc=newtailue */, - { 32, 8780, 2741, 6, 19, UNI_JAMOEXTB } /* block=hanguljamoextendedb */, - { 2, 10346, 1182, 5, 4, UNI_ANY } /* isunicode */, - { 128, 5060, 36, 14, 1, UNI_CI } /* caseignorable=t */, - { 0, 9508, 9151, 5, 4, UNI_CCC__24 } /* ccc=ccc24 */, - { 0, 9071, 36, 4, 1, UNI_XPOSIXXDIGIT } /* hex=t */, - { 0, 6231, 540, 3, 29, UNI_CJKEXTB } /* incjkunifiedideographsextensionb */, - { 107, 10296, 0, 3, 0, UNI_P } /* isp */, - { 0, 8115, 0, 8, 0, UNI_BASS } /* bassavah */, - { 16, 7540, 0, 9, 0, UNI_ext_values_index } /* extender= */, - { 128, 184, 9484, 2, 4, UNI_BHKS } /* isbhks */, - { 21, 8864, 26, 6, 1, UNI_EMOJI } /* emoji=y */, - { 0, 5986, 5648, 13, 11, UNI_NV__10000000000 } /* numericvalue=10000000000 */, - { 0, 4340, 0, 13, 0, UNI_MATHOPERATORS } /* mathoperators */, - { 0, 9768, 7359, 5, 9, UNI_SAUR } /* scx=saurashtra */, - { 6, 10132, 7612, 3, 9, UNI_WB__MB } /* wb=midnumlet */, - { 66, 1066, 0, 2, 0, UNI_CASEDLETTER } /* lc */, - { 0, 10027, 7112, 3, 3, UNI_JG__KAF } /* jg=kaf */, - { 0, 8876, 0, 4, 0, UNI_GOTH } /* goth */, - { 6, 6231, 2141, 3, 7, UNI_INCYRILLIC } /* incyrillic */, - { 0, 8589, 1165, 9, 2, UNI_SC__SHRD } /* script=shrd */, - { 40, 1552, 10180, 9, 2, UNI_ZS } /* category=zs */, - { 0, 4033, 5713, 16, 13, UNI_XPOSIXDIGIT } /* generalcategory=decimalnumber */, - { 577, 9015, 9255, 5, 5, -UNI_IDEO } /* ideo=false */, - { 0, 8780, 9688, 6, 3, UNI_INNKO } /* block=nko */, - { 132, 9277, 
8414, 3, 7, UNI_ELBA } /* sc=elbasan */, - { 0, 10048, 8720, 3, 3, UNI_NV__400 } /* nv=400 */, - { 2, 1828, 26, 6, 1, UNI_CASED } /* cased=y */, - { 0, 184, 8912, 2, 4, UNI_KHOJ } /* iskhoj */, - { 32, 9768, 6181, 4, 12, UNI_GONG } /* scx=gunjalagondi */, - { 21, 184, 6517, 2, 12, UNI_PLAYINGCARDS } /* isplayingcards */, - { 0, 3097, 2280, 18, 3, UNI_DT__ISO } /* decompositiontype=iso */, - { 0, 4033, 6598, 16, 11, UNI_CASEDLETTER } /* generalcategory=casedletter */, - { 10, 8780, 4868, 6, 15, UNI_NARB } /* block=oldnortharabian */, - { 0, 184, 3133, 2, 13, UNI_EMOD } /* isemojimodifier */, - { 68, 10048, 8720, 3, 5, UNI_NV__40000 } /* nv=40000 */, - { 4, 10048, 7819, 3, 8, UNI_NV__3_SLASH_16 } /* nv=1.88e-01 */, - { 2, 9488, 6620, 4, 11, UNI_DOMINO } /* blk=dominotiles */, - { 428, 9345, 1, 5, 1, -UNI_XIDC } /* xidc=n */, - { 0, 3836, 2855, 17, 9, UNI_MONG } /* scriptextensions=mongolian */, - { 5, 10333, 8277, 4, 6, UNI_SPECIALS } /* isspecials */, - { 32, 10048, 7867, 3, 8, UNI_NV__1_SLASH_32 } /* nv=3.12e-02 */, - { 0, 7088, 32, 10, 2, UNI_BC__CS } /* bidiclass=cs */, - { 1, 9488, 7458, 4, 10, UNI_YIRADICALS } /* blk=yiradicals */, - { 0, 4838, 0, 15, 0, UNI_nfkcqc_values_index } /* nfkcquickcheck= */, - { 1, 8589, 8115, 7, 8, UNI_BASS } /* script=bassavah */, - { 71, 7438, 4305, 10, 5, UNI_WB__XX } /* wordbreak=other */, - { 1, 9277, 8498, 3, 4, UNI_SC__MULT } /* sc=mult */, - { 3, 5817, 0, 13, 0, UNI_ZL } /* lineseparator */, - { 5, 9277, 9832, 3, 4, UNI_TIBT } /* sc=tibt */, - { 1, 10033, 10156, 3, 2, UNI_LB__BK } /* lb=bk */, - { 0, 10030, 6664, 3, 11, UNI_JT__D } /* jt=dualjoining */, - { 17, 184, 8344, 2, 7, UNI_BENG } /* isbengali */, - { 108, 6231, 115, 4, 33, UNI_DIACRITICALSFORSYMBOLS } /* incombiningdiacriticalmarksforsymbols */, - { 0, 9277, 8666, 3, 4, UNI_SC__TIRH } /* sc=tirh */, - { 39, 184, 6110, 3, 11, UNI_CYRILLICEXTB } /* iscyrillicextb */, - { 1, 6972, 0, 4, 0, UNI_SYLO } /* sylo */, - { 60, 84, 0, 4, 0, UNI_MATH } /* math */, - { 3, 1552, 
3985, 9, 16, UNI_PE } /* category=closepunctuation */, - { 0, 9768, 9032, 4, 6, UNI_WCHO } /* scx=wancho */, - { 5, 7325, 9979, 3, 3, UNI_IN__6_DOT_1 } /* in=6.1 */, - { 0, 1269, 9836, 25, 4, UNI_COMPEX } /* fullcompositionexclusion=true */, - { 0, 6231, 4002, 3, 15, UNI_CYPRIOTSYLLABARY } /* incypriotsyllabary */, - { 16, 7438, 34, 10, 6, UNI_WB__EXTEND } /* wordbreak=extend */, - { 0, 9275, 2389, 5, 20, UNI_INSC__CONSONANTWITHSTACKER } /* insc=consonantwithstacker */, - { 20, 9277, 9664, 3, 4, UNI_MRO } /* sc=mroo */, - { 0, 1417, 6445, 24, 12, UNI_CCC__0 } /* canonicalcombiningclass=notreordered */, - { 100, 9277, 9564, 3, 4, UNI_SC__GONM } /* sc=gonm */, - { 0, 9444, 7867, 4, 3, UNI_AGE__3_DOT_1 } /* age=3.1 */, - { 0, 4145, 0, 16, 0, UNI_LINEARBIDEOGRAMS } /* linearbideograms */, - { 1, 7076, 3938, 3, 15, UNI_BOPOMOFOEXT } /* inbopomofoextended */, - { 1, 8780, 7428, 6, 10, UNI_INWARANGCITI } /* block=warangciti */, - { 1, 5564, 0, 14, 0, UNI_qmark_values_index } /* quotationmark= */, - { 27, 9444, 7469, 4, 3, UNI_AGE__5 } /* age=5.0 */, - { 0, 9488, 8203, 4, 8, UNI_JAMOEXTA } /* blk=jamoexta */, - { 16, 8780, 1654, 6, 6, UNI_INHANGUL } /* block=hangul */, - { 1, 8884, 10135, 4, 3, UNI_EXT } /* ext=yes */, - { 0, 9002, 0, 4, 0, UNI_TELU } /* telu */, - { 1, 10003, 10135, 3, 3, UNI_CI } /* ci=yes */, - { 3, 9768, 4149, 5, 3, UNI_SARB } /* scx=sarb */, - { 1, 5986, 7963, 13, 8, UNI_NV__11_SLASH_2 } /* numericvalue=5.50e+00 */, - { 549, 6231, 7140, 4, 8, UNI_COMPATJAMO } /* incompatjamo */, - { 0, 8780, 3241, 6, 18, UNI_GEORGIANSUP } /* block=georgiansupplement */, - { 3, 4643, 36, 15, 1, UNI_ECOMP } /* emojicomponent=t */, - { 0, 1269, 9255, 25, 5, -UNI_COMPEX } /* fullcompositionexclusion=false */, - { 4, 1552, 467, 9, 11, UNI_P } /* category=punctuation */, - { 3, 6241, 36, 12, 1, UNI_JT__T } /* joiningtype=t */, - { 3, 21, 8463, 2, 7, UNI_KALI } /* inkayahli */, - { 334, 9508, 2449, 4, 4, UNI_CCC__L } /* ccc=left */, - { 41, 10033, 8251, 3, 8, UNI_LB__NL } /* 
lb=nextline */, - { 6, 9335, 0, 5, 0, UNI_TAKR } /* takri */, - { 2, 9488, 861, 4, 6, UNI_ARROWS } /* blk=arrows */, - { 0, 9350, 9836, 5, 4, UNI_XIDS } /* xids=true */, - { 7, 5986, 7933, 13, 2, UNI_NV__17 } /* numericvalue=17 */, - { 0, 184, 8107, 2, 4, UNI_BALI } /* isbali */, - { 0, 8780, 8617, 6, 7, UNI_INSOYOMBO } /* block=soyombo */, - { 0, 10048, 7955, 3, 8, UNI_NV__1_SLASH_20 } /* nv=5.00e-02 */, - { 4, 3836, 8187, 17, 8, UNI_HIRA } /* scriptextensions=hiragana */, - { 512, 3836, 8611, 18, 3, UNI_SIDD } /* scriptextensions=sidd */, - { 0, 9488, 8912, 4, 6, UNI_INKHOJKI } /* blk=khojki */, - { 3, 9444, 0, 4, 0, UNI_age_values_index } /* age= */, - { 67, 7666, 0, 9, 0, UNI_ORKH } /* oldturkic */, - { 1, 10333, 4370, 3, 5, UNI_SYRC } /* issyriac */, - { 399, 184, 8694, 2, 6, UNI_XPOSIXSPACE } /* iswspace */, - { 64, 184, 1594, 2, 14, UNI_MUSIC } /* ismusicalsymbols */, - { 16, 9488, 6505, 4, 8, UNI_PHAISTOS } /* blk=phaistos */, - { 4, 9277, 7513, 3, 9, UNI_BHKS } /* sc=bhaiksuki */, - { 164, 3836, 8337, 17, 7, UNI_AVST } /* scriptextensions=avestan */, - { 5, 8589, 7513, 7, 9, UNI_BHKS } /* script=bhaiksuki */, - { 18, 9508, 23, 4, 2, UNI_CCC__AL } /* ccc=al */, - { 0, 8780, 6409, 6, 12, UNI_INMENDEKIKAKUI } /* block=mendekikakui */, - { 104, 9768, 9752, 4, 4, UNI_ROHG } /* scx=rohg */, - { 234, 2010, 0, 22, 0, UNI_MISCTECHNICAL } /* miscellaneoustechnical */, - { 0, 3836, 2203, 17, 4, UNI_HAN } /* scriptextensions=hani */, - { 6, 10333, 107, 3, 5, UNI_S } /* issymbol */, - { 0, 6851, 0, 11, 0, UNI_LO } /* otherletter */, - { 1, 5791, 4203, 13, 3, UNI_JG__LAM } /* joininggroup=lam */, - { 0, 7438, 4360, 10, 9, UNI_WB__EB } /* wordbreak=emodifier */, - { 263, 10027, 2203, 3, 21, UNI_JG__HANIFIROHINGYAKINNAYA } /* jg=hanifirohingyakinnaya */, - { 0, 7218, 3985, 10, 16, UNI_LB__CL } /* linebreak=closepunctuation */, - { 0, 9277, 9872, 3, 4, UNI_XPEO } /* sc=xpeo */, - { 128, 10320, 3379, 7, 5, UNI_XPOSIXSPACE } /* isxperlspace */, - { 280, 9488, 1878, 4, 19, 
UNI_CJKCOMPATIDEOGRAPHS } /* blk=cjkcompatideographs */, - { 0, 8780, 2287, 6, 7, UNI_INSINHALA } /* block=sinhala */, - { 2, 10033, 8701, 3, 7, UNI_LB__ZW } /* lb=zwspace */, - { 7, 9488, 1594, 4, 14, UNI_MUSIC } /* blk=musicalsymbols */, - { 64, 10288, 96, 8, 5, UNI_XPOSIXALPHA } /* isxposixalpha */, - { 0, 184, 3169, 2, 18, UNI_ETHIOPICSUP } /* isethiopicsupplement */, - { 0, 8688, 7060, 4, 8, UNI_ARABICEXTA } /* isarabicexta */, - { 38, 10033, 6675, 3, 11, UNI_LB__EX } /* lb=exclamation */, - { 12, 6231, 8394, 3, 6, UNI_CJKEXTG } /* incjkextg */, - { 1, 9277, 9896, 3, 4, UNI_SC__ZYYY } /* sc=zyyy */, - { 0, 5986, 9372, 13, 4, UNI_NV__1_SLASH_40 } /* numericvalue=1/40 */, - { 2, 21, 9453, 3, 3, UNI_INAHOM } /* inahom */, - { 512, 9277, 9752, 3, 4, UNI_SC__ROHG } /* sc=rohg */, - { 11, 9444, 7931, 4, 3, UNI_AGE__4_DOT_1 } /* age=4.1 */, - { 0, 4838, 10135, 15, 3, UNI_NFKCQC__Y } /* nfkcquickcheck=yes */, - { 0, 8780, 3683, 6, 16, UNI_ETHIOPICEXT } /* block=ethiopicextended */, - { 7, 9508, 1219, 4, 3, UNI_CCC__214 } /* ccc=ata */, - { 0, 9277, 9460, 3, 4, UNI_ARMI } /* sc=armi */, - { 512, 184, 2666, 3, 18, UNI_COUNTINGROD } /* iscountingrodnumerals */, - { 3, 9277, 1900, 3, 6, UNI_SC__ZYYY } /* sc=common */, - { 0, 5986, 8043, 13, 8, UNI_NV__4_SLASH_5 } /* numericvalue=8.00e-01 */, - { 1, 7218, 6073, 10, 12, UNI_LB__SY } /* linebreak=breaksymbols */, - { 0, 3836, 2140, 17, 8, UNI_CYRL } /* scriptextensions=cyrillic */, - { 2, 867, 0, 28, 0, UNI_PHONETICEXTSUP } /* phoneticextensionssupplement */, - { 2, 8780, 1033, 6, 27, UNI_ENCLOSEDCJK } /* block=enclosedcjklettersandmonths */, - { 0, 8449, 26, 7, 1, UNI_HYPHEN } /* hyphen=y */, - { 4, 1166, 3, 26, 1, -UNI_DI } /* defaultignorablecodepoint=f */, - { 0, 1273, 26, 21, 1, UNI_CE } /* compositionexclusion=y */, - { 132, 10048, 7875, 3, 8, UNI_NV__1_SLASH_32 } /* nv=3.13e-02 */, - { 17, 8589, 9708, 7, 4, UNI_SC__ORYA } /* script=orya */, - { 0, 9997, 2268, 3, 3, UNI_BC__PDI } /* bc=pdi */, - { 44, 9265, 36, 5, 1, 
UNI_IDST } /* idst=t */, - { 35, 1552, 4958, 9, 15, UNI_UPPERCASELETTER } /* category=uppercaseletter */, - { 6, 9556, 73, 4, 2, UNI_WB__EB } /* gcb=em */, - { 0, 10048, 8011, 3, 8, UNI_NV__13_SLASH_2 } /* nv=6.50e+00 */, - { 1, 9250, 1025, 5, 2, -UNI_EMOD } /* emod=no */, - { 0, 5986, 7763, 13, 8, UNI_NV__1_SLASH_8 } /* numericvalue=1.25e-01 */, - { 0, 9020, 26, 6, 1, UNI_XPOSIXUPPER } /* upper=y */, - { 0, 9277, 6277, 3, 4, UNI_SC__MAHJ } /* sc=mahj */, - { 0, 5037, 3, 9, 1, -UNI_XPOSIXXDIGIT } /* hexdigit=f */, - { 135, 9277, 1677, 3, 5, UNI_SC__LATN } /* sc=latin */, - { 36, 10024, 1044, 3, 6, UNI_L } /* gc=letter */, - { 15, 4033, 1066, 16, 2, UNI_CASEDLETTER } /* generalcategory=lc */, - { 0, 10048, 8744, 3, 3, UNI_NV__700 } /* nv=700 */, - { 0, 9508, 9166, 5, 4, UNI_CCC__27 } /* ccc=ccc27 */, - { 3, 184, 6122, 3, 11, UNI_CYRILLICEXTC } /* iscyrillicextc */, - { 64, 9262, 34, 3, 2, UNI_SB__EX } /* sb=ex */, - { 0, 184, 9892, 2, 4, UNI_QAAI } /* iszinh */, - { 1, 10024, 262, 3, 2, UNI_SM } /* gc=sm */, - { 393, 9768, 7567, 4, 9, UNI_SIND } /* scx=khudawadi */, - { 0, 10129, 1, 3, 1, -UNI_VS } /* vs=n */, - { 2, 4369, 0, 9, 0, UNI_SYRIACSUP } /* syriacsup */, - { 177, 21, 2590, 3, 18, UNI_ANCIENTGREEKNUMBERS } /* inancientgreeknumbers */, - { 2, 3836, 4385, 17, 6, UNI_TANG } /* scriptextensions=tangut */, - { 5, 10048, 8714, 3, 5, UNI_NV__30000 } /* nv=30000 */, - { 2, 5986, 7747, 13, 8, UNI_NV__1_SLASH_10 } /* numericvalue=1.00e-01 */, - { 1, 184, 9672, 2, 4, UNI_MYMR } /* ismymr */, - { 1, 3836, 9065, 17, 5, UNI_ADLM } /* scriptextensions=adlam */, - { 17, 8997, 9837, 6, 3, UNI_TERM } /* term=true */, - { 0, 9556, 3385, 4, 17, UNI_RI } /* gcb=regionalindicator */, - { 1, 7318, 9985, 10, 3, UNI_IN__7 } /* presentin=7.0 */, - { 0, 10132, 6145, 3, 12, UNI_WB__EX } /* wb=extendnumlet */, - { 0, 10333, 7292, 3, 6, UNI_SOGD } /* issogdian */, - { 1, 7513, 0, 9, 0, UNI_BHKS } /* bhaiksuki */, - { 0, 1114, 0, 25, 0, UNI_CWKCF } /* changeswhennfkccasefolded */, - { 1, 
3836, 7292, 18, 6, UNI_SOGD } /* scriptextensions=sogdian */, - { 6, 1966, 2608, 22, 19, UNI_INSC__BRAHMIJOININGNUMBER } /* indicsyllabiccategory=brahmijoiningnumber */, - { 3, 10033, 866, 3, 2, UNI_LB__SP } /* lb=sp */, - { 22, 9488, 5200, 4, 7, UNI_KANASUP } /* blk=kanasup */, - { 0, 184, 6253, 2, 5, UNI_KHMR } /* iskhmer */, - { 4, 9664, 0, 3, 0, UNI_MRO } /* mro */, - { 1, 1911, 0, 11, 0, UNI_NUMBERFORMS } /* numberforms */, - { 3, 9768, 9600, 4, 4, UNI_KALI } /* scx=kali */, - { 1, 10033, 4898, 3, 15, UNI_LB__OP } /* lb=openpunctuation */, - { 1, 4033, 4245, 16, 10, UNI_SM } /* generalcategory=mathsymbol */, - { 0, 8589, 7621, 7, 9, UNI_NBAT } /* script=nabataean */, - { 5, 9488, 3938, 5, 7, UNI_INBOPOMOFO } /* blk=bopomofo */, - { 0, 9488, 3115, 4, 18, UNI_DEVANAGARIEXT } /* blk=devanagariextended */, - { 5, 117, 6, 3, 2, UNI_INIDC } /* inidc */, - { 5, 9277, 3135, 5, 2, UNI_SC__KHOJ } /* sc=khoj */, - { 598, 1319, 0, 25, 0, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* symbolsandpictographsexta */, - { 0, 9768, 9580, 4, 4, UNI_HANO } /* scx=hano */, - { 79, 8780, 1594, 6, 14, UNI_MUSIC } /* block=musicalsymbols */, - { 0, 5791, 6157, 13, 12, UNI_JG__FINALSEMKATH } /* joininggroup=finalsemkath */, - { 64, 4033, 4898, 16, 15, UNI_PS } /* generalcategory=openpunctuation */, - { 1, 4989, 8674, 3, 6, UNI_UCASEXT } /* isucasext */, - { 0, 184, 3785, 2, 10, UNI_MANI } /* ismanichaean */, - { 0, 184, 1813, 3, 20, UNI_CWL } /* ischangeswhenlowercased */, - { 0, 9740, 0, 4, 0, UNI_QAAI } /* qaai */, - { 0, 5986, 8083, 13, 8, UNI_NV__11_SLASH_12 } /* numericvalue=9.17e-01 */, - { 0, 9488, 1631, 4, 18, UNI_GEOMETRICSHAPESEXT } /* blk=geometricshapesext */, - { 0, 184, 8463, 2, 7, UNI_KALI } /* iskayahli */, - { 4, 10027, 4081, 3, 16, UNI_JG__HANIFIROHINGYAPA } /* jg=hanifirohingyapa */, - { 0, 3836, 9512, 17, 4, UNI_CHRS } /* scriptextensions=chrs */, - { 19, 7318, 7826, 10, 2, UNI_IN__12 } /* presentin=12 */, - { 64, 9556, 262, 4, 2, UNI_GCB__SM } /* gcb=sm */, - { 3, 10132, 
5851, 3, 2, UNI_WB__ML } /* wb=ml */, - { 1, 9488, 1586, 5, 13, UNI_BYZANTINEMUSIC } /* blk=byzantinemusic */, - { 3, 3133, 0, 18, 0, UNI_ebase_values_index } /* emojimodifierbase= */, - { 206, 10027, 9355, 3, 5, UNI_JG__ZHAIN } /* jg=zhain */, - { 204, 9277, 3937, 3, 4, UNI_SC__BOPO } /* sc=bopo */, - { 1, 10291, 9225, 5, 5, UNI_POSIXCNTRL } /* posixcntrl */, - { 3, 34, 0, 3, 0, UNI_EXT } /* ext */, - { 25, 7088, 2449, 10, 11, UNI_BC__L } /* bidiclass=lefttoright */, - { 2, 5986, 9958, 13, 3, UNI_NV__3_SLASH_4 } /* numericvalue=3/4 */, - { 66, 4973, 0, 15, 0, UNI_VEDICEXT } /* vedicextensions */, - { 1, 9444, 9401, 4, 3, UNI_AGE__3 } /* age=3.0 */, - { 41, 9014, 0, 6, 0, UNI_uideo_values_index } /* uideo= */, - { 26, 9768, 3079, 4, 4, UNI_COPT } /* scx=copt */, - { 0, 10024, 6873, 3, 11, UNI_SO } /* gc=othersymbol */, - { 14, 9277, 6484, 3, 4, UNI_HUNG } /* sc=hung */, - { 0, 1834, 9836, 22, 4, UNI_CWT } /* changeswhentitlecased=true */, - { 0, 6277, 0, 7, 0, UNI_MAHJONG } /* mahjong */, - { 41, 9015, 1025, 5, 2, -UNI_IDEO } /* ideo=no */, - { 208, 9488, 8219, 4, 8, UNI_INJAVANESE } /* blk=javanese */, - { 1, 9488, 1033, 4, 11, UNI_ENCLOSEDCJK } /* blk=enclosedcjk */, - { 5, 9277, 6193, 3, 4, UNI_HEBR } /* sc=hebr */, - { 0, 1217, 0, 2, 0, UNI_SK } /* sk */, - { 4, 10024, 7408, 3, 10, UNI_CN } /* gc=unassigned */, - { 0, 10030, 6753, 4, 10, UNI_JT__L } /* jt=leftjoining */, - { 0, 9277, 9032, 3, 6, UNI_WCHO } /* sc=wancho */, - { 16, 9444, 5648, 4, 2, UNI_AGE__10 } /* age=10 */, - { 0, 2280, 9705, 3, 3, UNI_ORKH } /* isorkh */, - { 0, 4658, 26, 15, 1, UNI_GREXT } /* graphemeextend=y */, - { 0, 9997, 3187, 3, 18, UNI_BC__ET } /* bc=europeanterminator */, - { 329, 7155, 2204, 3, 13, UNI_ROHG } /* ishanifirohingya */, - { 0, 9508, 8799, 5, 5, UNI_CCC__107 } /* ccc=ccc107 */, - { 74, 9508, 9216, 5, 4, UNI_CCC__84 } /* ccc=ccc84 */, - { 1, 8589, 8463, 7, 7, UNI_SC__KALI } /* script=kayahli */, - { 0, 10291, 467, 5, 5, UNI_POSIXPUNCT } /* posixpunct */, - { 0, 8780, 
2855, 6, 19, UNI_MONGOLIANSUP } /* block=mongoliansupplement */, - { 0, 5986, 7930, 13, 2, UNI_NV__14 } /* numericvalue=14 */, - { 1, 8589, 3894, 8, 10, UNI_SGNW } /* script=signwriting */, - { 88, 10182, 10215, 6, 21, UNI__PERL_IS_IN_MULTI_CHAR_FOLD } /* _perl_is_in_multi_char_fold */, - { 14, 8589, 3115, 7, 4, UNI_SC__DEVA } /* script=deva */, - { 5, 7318, 5648, 10, 2, UNI_IN__10 } /* presentin=10 */, - { 9, 6229, 9836, 12, 4, UNI_JOINC } /* joincontrol=true */, - { 4, 9508, 8793, 5, 5, UNI_CCC__103 } /* ccc=ccc103 */, - { 10, 9488, 1944, 4, 22, UNI_EARLYDYNASTICCUNEIFORM } /* blk=earlydynasticcuneiform */, - { 1, 9508, 9949, 4, 3, UNI_CCC__DA } /* ccc=234 */, - { 224, 3836, 9620, 17, 4, UNI_LANA } /* scriptextensions=lana */, - { 292, 9488, 4433, 4, 15, UNI_ARABICEXTA } /* blk=arabicextendeda */, - { 0, 2224, 8625, 3, 6, UNI_SUPPUAA } /* insuppuaa */, - { 1, 184, 8387, 3, 6, UNI_CJKEXTF } /* iscjkextf */, - { 1, 3424, 1129, 3, 3, UNI_UCAS } /* inucas */, - { 516, 5508, 10135, 14, 3, UNI_PATSYN } /* patternsyntax=yes */, - { 5, 8688, 27, 3, 2, UNI_ALL } /* isall */, - { 0, 184, 8876, 2, 6, UNI_GOTH } /* isgothic */, - { 0, 5739, 36, 13, 1, UNI_GRBASE } /* graphemebase=t */, - { 2, 9556, 4305, 4, 5, UNI_GCB__XX } /* gcb=other */, - { 21, 21, 1677, 2, 23, UNI_LATINEXTADDITIONAL } /* inlatinextendedadditional */, - { 0, 184, 400, 2, 6, UNI_CF } /* isformat */, - { 261, 7739, 0, 8, 0, UNI_ids_values_index } /* idstart= */, - { 0, 21, 8906, 2, 6, UNI_KANBUN } /* inkanbun */, - { 37, 21, 5214, 2, 14, UNI_KANGXI } /* inkangxiradicals */, - { 334, 9235, 26, 5, 1, UNI_CWCM } /* cwcm=y */, - { 37, 8780, 6253, 6, 12, UNI_KHMERSYMBOLS } /* block=khmersymbols */, - { 0, 10048, 7883, 3, 8, UNI_NV__1_SLASH_320 } /* nv=3.13e-03 */, - { 36, 4033, 10170, 16, 2, UNI_CASEDLETTER } /* generalcategory=l_ */, - { 0, 184, 4369, 2, 16, UNI_SYRIACSUP } /* issyriacsupplement */, - { 5, 8688, 7506, 4, 7, UNI_ARABICPFB } /* isarabicpfb */, - { 0, 7739, 0, 7, 0, UNI_IDS } /* idstart */, - { 
1, 184, 6939, 2, 11, UNI_SORA } /* issorasompeng */, - { 0, 7088, 2449, 10, 20, UNI_BC__LRE } /* bidiclass=lefttorightembedding */, - { 0, 1966, 2646, 22, 19, UNI_INSC__CONSONANTHEADLETTER } /* indicsyllabiccategory=consonantheadletter */, - { 135, 7218, 1822, 10, 2, UNI_LB__NL } /* linebreak=nl */, - { 1, 9768, 2409, 4, 10, UNI_GLAG } /* scx=glagolitic */, - { 0, 8589, 4883, 7, 15, UNI_SARB } /* script=oldsoutharabian */, - { 207, 3133, 0, 5, 0, UNI_EMOJI } /* emoji */, - { 5, 9444, 7754, 4, 2, UNI_AGE__11 } /* age=11 */, - { 0, 4033, 4583, 16, 15, UNI_PD } /* generalcategory=dashpunctuation */, - { 32, 5522, 0, 14, 0, UNI_PHONETICEXTSUP } /* phoneticextsup */, - { 128, 9508, 1755, 4, 2, UNI_CCC__DB } /* ccc=db */, - { 0, 9488, 6840, 4, 11, UNI_INNANDINAGARI } /* blk=nandinagari */, - { 392, 1537, 3481, 24, 12, UNI_INPC__LEFTANDRIGHT } /* indicpositionalcategory=leftandright */, - { 0, 8997, 26, 5, 1, UNI_TERM } /* term=y */, - { 1, 9277, 9748, 3, 4, UNI_RJNG } /* sc=rjng */, - { 0, 1790, 3, 22, 1, -UNI_CWCM } /* changeswhencasemapped=f */, - { 0, 184, 6133, 2, 12, UNI_ETHIOPICEXTA } /* isethiopicexta */, - { 26, 3241, 0, 18, 0, UNI_GEORGIANSUP } /* georgiansupplement */, - { 0, 2280, 7659, 4, 7, UNI_PERM } /* isoldpermic */, - { 8, 5986, 7782, 13, 1, UNI_NV__3 } /* numericvalue=3 */, - { 9, 9488, 9330, 4, 5, UNI_INTAILE } /* blk=taile */, - { 33, 6229, 3, 12, 1, -UNI_JOINC } /* joincontrol=f */, - { 128, 184, 1879, 3, 18, UNI_CJKCOMPATIDEOGRAPHS } /* iscjkcompatideographs */, - { 3, 10030, 6708, 3, 11, UNI_JT__C } /* jt=joincausing */, - { 141, 6231, 570, 3, 29, UNI_CJKEXTC } /* incjkunifiedideographsextensionc */, - { 32, 9277, 3025, 3, 8, UNI_CHER } /* sc=cherokee */, - { 0, 3836, 8344, 17, 4, UNI_BENG } /* scriptextensions=beng */, - { 2, 3151, 9836, 18, 4, UNI_EPRES } /* emojipresentation=true */, - { 0, 9262, 751, 3, 2, UNI_SB__CL } /* sb=cl */, - { 37, 6231, 8373, 3, 6, UNI_CJKEXTD } /* incjkextd */, - { 4, 3836, 9793, 18, 3, UNI_SOGO } /* 
scriptextensions=sogo */, - { 1, 3836, 8456, 17, 7, UNI_KNDA } /* scriptextensions=kannada */, - { 4, 9488, 4385, 4, 6, UNI_INTANGUT } /* blk=tangut */, - { 17, 8428, 0, 7, 0, UNI_GRAN } /* grantha */, - { 48, 10006, 3, 3, 1, -UNI_DI } /* di=f */, - { 32, 1552, 1529, 11, 7, UNI__PERL_SURROGATE } /* category=surrogate */, - { 18, 10313, 3379, 7, 5, UNI_XPOSIXBLANK } /* ishorizspace */, - { 0, 8589, 3025, 7, 4, UNI_CHER } /* script=cher */, - { 193, 9270, 6983, 5, 11, UNI_INPC__TOPANDRIGHT } /* inpc=topandright */, - { 0, 2779, 10135, 19, 3, UNI_IDST } /* idstrinaryoperator=yes */, - { 0, 10027, 5424, 3, 14, UNI_JG__MANICHAEANYODH } /* jg=manichaeanyodh */, - { 1, 10296, 468, 3, 4, UNI_P } /* ispunct */, - { 0, 9508, 9161, 5, 4, UNI_CCC__26 } /* ccc=ccc26 */, - { 290, 5986, 8744, 13, 2, UNI_NV__70 } /* numericvalue=70 */, - { 1, 7218, 4898, 10, 15, UNI_LB__OP } /* linebreak=openpunctuation */, - { 0, 7088, 3205, 10, 18, UNI_BC__FSI } /* bidiclass=firststrongisolate */, - { 3, 6025, 0, 12, 0, UNI_ALPHABETICPF } /* alphabeticpf */, - { 0, 9768, 9065, 4, 5, UNI_ADLM } /* scx=adlam */, - { 257, 8519, 0, 9, 0, UNI_NFKDQC__N } /* nfkdqc=no */, - { 4, 9488, 3785, 4, 10, UNI_INMANICHAEAN } /* blk=manichaean */, - { 0, 117, 447, 3, 17, UNI_IDEOGRAPHICSYMBOLS } /* inideographicsymbols */, - { 10, 8780, 867, 6, 28, UNI_PHONETICEXTSUP } /* block=phoneticextensionssupplement */, - { 33, 8589, 9008, 7, 6, UNI_SC__THAA } /* script=thaana */, - { 1, 2314, 0, 3, 0, UNI_XPOSIXXDIGIT } /* hex */, - { 1, 9508, 7754, 4, 2, UNI_CCC__11 } /* ccc=11 */, - { 34, 5791, 5908, 13, 13, UNI_JG__MANICHAEANTAW } /* joininggroup=manichaeantaw */, - { 0, 3836, 8123, 17, 4, UNI_BUGI } /* scriptextensions=bugi */, - { 118, 10048, 7891, 3, 8, UNI_NV__1_SLASH_3 } /* nv=3.33e-01 */, - { 0, 8575, 1025, 7, 2, -UNI_PATSYN } /* patsyn=no */, - { 0, 184, 1087, 2, 26, UNI_PCM } /* isprependedconcatenationmark */, - { 0, 9015, 10135, 5, 3, UNI_IDEO } /* ideo=yes */, - { 75, 10296, 468, 3, 10, UNI_P } /* 
ispunctuation */, - { 108, 5986, 8756, 13, 5, UNI_NV__90000 } /* numericvalue=90000 */, - { 32, 8589, 8652, 7, 7, UNI_TAVT } /* script=taiviet */, - { 4, 2224, 1320, 3, 24, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* insymbolsandpictographsexta */, - { 90, 8435, 9255, 7, 5, -UNI_GRBASE } /* grbase=false */, - { 30, 1552, 3277, 9, 18, UNI_PI } /* category=initialpunctuation */, - { 0, 8344, 0, 4, 0, UNI_BENG } /* beng */, - { 1, 3169, 0, 8, 0, UNI_ETHI } /* ethiopic */, - { 1, 1417, 8714, 24, 2, UNI_CCC__30 } /* canonicalcombiningclass=30 */, - { 0, 9508, 16, 4, 1, UNI_CCC__B } /* ccc=b */, - { 593, 9488, 9325, 4, 5, UNI_INRUNIC } /* blk=runic */, - { 1, 7218, 5298, 10, 14, UNI_LB__BK } /* linebreak=mandatorybreak */, - { 96, 3439, 0, 12, 0, UNI_SMALLKANAEXT } /* smallkanaext */, - { 321, 3836, 9002, 17, 6, UNI_TELU } /* scriptextensions=telugu */, - { 2, 9768, 9504, 4, 4, UNI_CANS } /* scx=cans */, - { 338, 8688, 9453, 3, 3, UNI_AHOM } /* isahom */, - { 0, 7318, 7826, 10, 4, UNI_IN__12 } /* presentin=12.0 */, - { 518, 8688, 980, 3, 26, UNI_ALPHABETICPF } /* isalphabeticpresentationforms */, - { 0, 2409, 0, 10, 0, UNI_GLAG } /* glagolitic */, - { 1, 9508, 8813, 4, 3, UNI_CCC__122 } /* ccc=122 */, - { 185, 1417, 1219, 24, 3, UNI_CCC__214 } /* canonicalcombiningclass=ata */, - { 47, 9444, 9970, 4, 3, UNI_AGE__5_DOT_2 } /* age=5.2 */, - { 70, 9260, 9836, 5, 4, UNI_IDSB } /* idsb=true */, - { 416, 2224, 2913, 3, 18, UNI_SUNDANESESUP } /* insundanesesupplement */, - { 0, 10048, 5648, 3, 5, UNI_NV__10000 } /* nv=10000 */, - { 0, 10027, 5869, 3, 13, UNI_JG__MANICHAEANMEM } /* jg=manichaeanmem */, - { 72, 10132, 5585, 3, 2, UNI_WB__EB } /* wb=eb */, - { 1, 6241, 6752, 12, 11, UNI_JT__L } /* joiningtype=leftjoining */, - { 129, 7318, 7877, 10, 2, UNI_IN__13 } /* presentin=13 */, - { 0, 8575, 26, 7, 1, UNI_PATSYN } /* patsyn=y */, - { 68, 9270, 4988, 5, 15, UNI_LOE } /* inpc=visualorderleft */, - { 8, 5674, 9836, 13, 4, UNI_BIDIM } /* bidimirrored=true */, - { 1, 5746, 0, 5, 0, 
UNI_EBASE } /* ebase */, - { 7, 10027, 9280, 3, 5, UNI_JG__KHAPH } /* jg=khaph */, - { 0, 9277, 8924, 3, 4, UNI_LEPC } /* sc=lepc */, - { 0, 9277, 9676, 3, 4, UNI_NARB } /* sc=narb */, - { 0, 21, 5284, 2, 14, UNI_LISUSUP } /* inlisusupplement */, - { 2, 10024, 3349, 3, 18, UNI_ZP } /* gc=paragraphseparator */, - { 84, 10126, 3493, 3, 18, UNI_VO__TR } /* vo=transformedrotated */, - { 0, 9277, 9660, 3, 4, UNI_SC__MLYM } /* sc=mlym */, - { 192, 9768, 3895, 5, 3, UNI_SGNW } /* scx=sgnw */, - { 25, 6229, 0, 12, 0, UNI_joinc_values_index } /* joincontrol= */, - { 0, 184, 1769, 3, 20, UNI_CWCF } /* ischangeswhencasefolded */, - { 0, 8780, 1901, 7, 21, UNI_INDICNUMBERFORMS } /* block=commonindicnumberforms */, - { 0, 9768, 7666, 4, 9, UNI_ORKH } /* scx=oldturkic */, - { 5, 8780, 8463, 6, 7, UNI_KALI } /* block=kayahli */, - { 6, 8147, 9836, 8, 4, UNI_EXTPICT } /* extpict=true */, - { 0, 8780, 2245, 6, 11, UNI_INMEETEIMAYEK } /* block=meeteimayek */, - { 3, 9277, 9692, 3, 4, UNI_NSHU } /* sc=nshu */, - { 2, 2245, 0, 11, 0, UNI_MTEI } /* meeteimayek */, - { 512, 9508, 8807, 4, 3, UNI_CCC__118 } /* ccc=118 */, - { 135, 9270, 2988, 5, 19, UNI_INPC__TOPANDBOTTOMANDLEFT } /* inpc=topandbottomandleft */, - { 1, 2485, 0, 4, 0, UNI_MONG } /* mong */, - { 0, 9488, 3457, 4, 11, UNI_TAIXUANJING } /* blk=taixuanjing */, - { 150, 10048, 5648, 3, 8, UNI_NV__10000000 } /* nv=10000000 */, - { 2, 9488, 8888, 4, 6, UNI_INHATRAN } /* blk=hatran */, - { 0, 2280, 8562, 3, 6, UNI_OSMA } /* isosmanya */, - { 1, 9488, 9860, 4, 3, UNI_INVAI } /* blk=vai */, - { 714, 9277, 8901, 4, 5, UNI_SC__KTHI } /* sc=kaithi */, - { 69, 10296, 3599, 3, 3, UNI_PAUC } /* ispauc */, - { 184, 1552, 8855, 9, 2, UNI_CF } /* category=cf */, - { 2, 10027, 7045, 3, 2, UNI_JG__FE } /* jg=fe */, - { 198, 10048, 7859, 3, 3, UNI_NV__200 } /* nv=200 */, - { 288, 10027, 10072, 3, 3, UNI_JG__TAH } /* jg=tah */, - { 128, 3097, 1253, 18, 7, UNI_DT__INIT } /* decompositiontype=initial */, - { 1, 3836, 8912, 17, 6, UNI_KHOJ } /* 
scriptextensions=khojki */, - { 0, 3836, 7684, 17, 4, UNI_PAUC } /* scriptextensions=pauc */, - { 0, 5242, 0, 14, 0, UNI_LATINEXTC } /* latinextendedc */, - { 11, 2569, 0, 20, 1, UNI_VO__U } /* verticalorientation=u */, - { 585, 5986, 9108, 13, 2, UNI_NV__15 } /* numericvalue=15 */, - { 0, 3241, 0, 4, 0, UNI_GEOR } /* geor */, - { 0, 1013, 0, 5, 0, UNI_GREK } /* greek */, - { 0, 184, 5214, 2, 14, UNI_KANGXI } /* iskangxiradicals */, - { 12, 4943, 0, 15, 0, UNI_TITLE } /* titlecaseletter */, - { 11, 9596, 6763, 4, 11, UNI_LB__H3 } /* hst=lvtsyllable */, - { 0, 5324, 8487, 5, 4, UNI_INMANDAIC } /* inmandaic */, - { 0, 6576, 0, 11, 0, UNI_alpha_values_index } /* alphabetic= */, - { 0, 3836, 8428, 17, 7, UNI_GRAN } /* scriptextensions=grantha */, - { 513, 5986, 8744, 13, 3, UNI_NV__700 } /* numericvalue=700 */, - { 0, 10009, 567, 3, 2, UNI_DT__NB } /* dt=nb */, - { 4, 8589, 8219, 7, 8, UNI_SC__JAVA } /* script=javanese */, - { 9, 8780, 2054, 6, 22, UNI_MODIFIERLETTERS } /* block=spacingmodifierletters */, - { 516, 3457, 0, 18, 0, UNI_TAIXUANJING } /* taixuanjingsymbols */, - { 4, 7088, 6037, 10, 12, UNI_BC__AL } /* bidiclass=arabicletter */, - { 128, 9488, 382, 4, 32, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* blk=egyptianhieroglyphformatcontrols */, - { 25, 148, 0, 35, 0, UNI_DIACRITICALSSUP } /* combiningdiacriticalmarkssupplement */, - { 0, 1552, 2061, 9, 14, UNI_LM } /* category=modifierletter */, - { 2, 9015, 9836, 5, 4, UNI_IDEO } /* ideo=true */, - { 2, 7325, 10090, 3, 3, UNI_IN__4 } /* in=v40 */, - { 1, 7158, 9255, 10, 5, -UNI_DIA } /* diacritic=false */, - { 2, 3836, 9580, 17, 4, UNI_HANO } /* scriptextensions=hano */, - { 7, 8780, 1585, 6, 23, UNI_BYZANTINEMUSIC } /* block=byzantinemusicalsymbols */, - { 0, 5791, 5172, 13, 14, UNI_JG__HAMZAONHEHGOAL } /* joininggroup=hamzaonhehgoal */, - { 13, 2280, 6483, 4, 10, UNI_HUNG } /* isoldhungarian */, - { 0, 8589, 9636, 7, 4, UNI_SC__LINB } /* script=linb */, - { 0, 8780, 78, 6, 35, UNI_ARABICMATH } /* 
block=arabicmathematicalalphabeticsymbols */, - { 0, 8344, 0, 7, 0, UNI_BENG } /* bengali */, - { 0, 8291, 0, 8, 0, UNI_TAGB } /* tagbanwa */, - { 3, 10132, 2444, 3, 2, UNI_LB__HL } /* wb=hl */, - { 0, 8589, 9860, 7, 4, UNI_VAI } /* script=vaii */, - { 320, 8589, 8936, 7, 6, UNI_LYCI } /* script=lycian */, - { 0, 9260, 26, 5, 1, UNI_IDSB } /* idsb=y */, - { 20, 9524, 0, 3, 0, UNI_CWT } /* cwt */, - { 512, 8978, 26, 6, 1, UNI__PERL_PATWS } /* patws=y */, - { 256, 9892, 0, 4, 0, UNI_QAAI } /* zinh */, - { 3, 10048, 8732, 3, 4, UNI_NV__5000 } /* nv=5000 */, - { 0, 9488, 7514, 5, 8, UNI_INBHAIKSUKI } /* blk=bhaiksuki */, - { 99, 9488, 2950, 4, 19, UNI_SUPARROWSB } /* blk=supplementalarrowsb */, - { 11, 8786, 0, 4, 0, UNI_CARI } /* cari */, - { 2, 2779, 9255, 19, 5, -UNI_IDST } /* idstrinaryoperator=false */, - { 2, 5986, 7765, 13, 1, UNI_NV__2 } /* numericvalue=2 */, - { 129, 184, 8498, 2, 7, UNI_MULT } /* ismultani */, - { 3, 10027, 3802, 3, 17, UNI_JG__MANICHAEANHUNDRED } /* jg=manichaeanhundred */, - { 27, 4033, 1899, 16, 2, UNI_PC } /* generalcategory=pc */, - { 2, 10024, 6862, 3, 11, UNI_NO } /* gc=othernumber */, - { 0, 184, 4257, 2, 16, UNI_MISCMATHSYMBOLSB } /* ismiscmathsymbolsb */, - { 65, 3887, 0, 17, 0, UNI_SUTTONSIGNWRITING } /* suttonsignwriting */, - { 0, 8519, 10135, 7, 3, UNI_DT__NONE } /* nfkdqc=yes */, - { 47, 7249, 2, 5, 1, UNI_CARI } /* iscari */, - { 0, 8888, 0, 6, 0, UNI_HATR } /* hatran */, - { 0, 3097, 8948, 18, 6, UNI_DT__NAR } /* decompositiontype=narrow */, - { 3, 9488, 9305, 4, 5, UNI_INNUSHU } /* blk=nushu */, - { 12, 9277, 9609, 4, 3, UNI_KITS } /* sc=kits */, - { 0, 9346, 26, 4, 1, UNI_IDC } /* idc=y */, - { 0, 6928, 26, 11, 1, UNI_SD } /* softdotted=y */, - { 1, 184, 3374, 2, 10, UNI_XPOSIXSPACE } /* iswhitespace */, - { 290, 6554, 1, 11, 1, -UNI_IDC } /* idcontinue=n */, - { 48, 7438, 1822, 10, 2, UNI_WB__NL } /* wordbreak=nl */, - { 53, 4916, 1287, 4, 2, UNI_TELU } /* istelu */, - { 97, 184, 2141, 3, 7, UNI_CYRL } /* iscyrillic */, - 
{ 513, 9277, 4928, 3, 5, UNI_SC__TAML } /* sc=tamil */, - { 6, 3836, 8477, 17, 4, UNI_MAKA } /* scriptextensions=maka */, - { 1, 6205, 1, 12, 1, -UNI_IDEO } /* ideographic=n */, - { 153, 184, 5606, 2, 14, UNI_SUPPUNCTUATION } /* issuppunctuation */, - { 2, 7358, 0, 4, 0, UNI_SAUR } /* saur */, - { 4, 9508, 9937, 4, 3, UNI_CCC__AL } /* ccc=228 */, - { 0, 8780, 5200, 6, 14, UNI_KANASUP } /* block=kanasupplement */, - { 9, 9277, 8179, 3, 8, UNI_SC__GURU } /* sc=gurmukhi */, - { 0, 9488, 9002, 4, 6, UNI_INTELUGU } /* blk=telugu */, - { 6, 6231, 8380, 3, 6, UNI_CJKEXTE } /* incjkexte */, - { 249, 10333, 0, 3, 0, UNI_S } /* iss */, - { 1, 8589, 9740, 7, 4, UNI_SC__QAAI } /* script=qaai */, - { 1, 9508, 9176, 5, 4, UNI_CCC__29 } /* ccc=ccc29 */, - { 7, 10033, 533, 3, 2, UNI_LB__NS } /* lb=ns */, - { 24, 7540, 0, 8, 0, UNI_EXT } /* extender */, - { 1, 8780, 3115, 6, 10, UNI_INDEVANAGARI } /* block=devanagari */, - { 1, 9277, 78, 3, 6, UNI_SC__ARAB } /* sc=arabic */, - { 3, 9768, 9720, 4, 4, UNI_PHLP } /* scx=phlp */, - { 0, 8589, 9452, 7, 4, UNI_AHOM } /* script=ahom */, - { 10, 8414, 0, 4, 0, UNI_ELBA } /* elba */, - { 0, 9508, 5648, 4, 2, UNI_CCC__10 } /* ccc=10 */, - { 0, 10024, 1217, 3, 2, UNI_SK } /* gc=sk */, - { 4, 10182, 10279, 6, 9, UNI__PERL_QUOTEMETA } /* _perl_quotemeta */, - { 0, 4033, 38, 16, 2, UNI_XPOSIXDIGIT } /* generalcategory=nd */, - { 131, 3853, 0, 16, 0, UNI_STERM } /* sentenceterminal */, - { 37, 184, 5804, 2, 13, UNI_KANAEXTA } /* iskanaextendeda */, - { 357, 861, 0, 6, 0, UNI_ARROWS } /* arrows */, - { 133, 184, 8147, 2, 7, UNI_EXTPICT } /* isextpict */, - { 64, 3836, 8638, 17, 7, UNI_TGLG } /* scriptextensions=tagalog */, - { 1, 21, 2330, 3, 19, UNI_INANATOLIANHIEROGLYPHS } /* inanatolianhieroglyphs */, - { 7, 184, 7438, 2, 4, UNI_XPOSIXWORD } /* isword */, - { 2, 184, 7630, 2, 9, UNI_TALU } /* isnewtailue */, - { 35, 5986, 9913, 13, 3, UNI_NV__2_SLASH_3 } /* numericvalue=2/3 */, - { 146, 9350, 26, 5, 1, UNI_XIDS } /* xids=y */, - { 0, 8780, 
2120, 7, 20, UNI_CJKRADICALSSUP } /* block=cjkradicalssupplement */, - { 33, 1922, 0, 12, 0, UNI_DIACRITICALS } /* diacriticals */, - { 0, 1552, 10178, 9, 2, UNI_ZP } /* category=zp */, - { 0, 10027, 8918, 3, 6, UNI_JG__LAMADH } /* jg=lamadh */, - { 0, 8400, 0, 7, 0, UNI_compex_values_index } /* compex= */, - { 215, 7278, 0, 10, 0, UNI_XPEO } /* oldpersian */, - { 256, 4916, 4386, 3, 5, UNI_TANG } /* istangut */, - { 516, 3853, 36, 17, 1, UNI_STERM } /* sentenceterminal=t */, - { 0, 10333, 2288, 3, 3, UNI_SINH } /* issinh */, - { 0, 9277, 3893, 3, 11, UNI_SGNW } /* sc=signwriting */, - { 171, 1269, 1, 25, 1, -UNI_COMPEX } /* fullcompositionexclusion=n */, - { 311, 9270, 2555, 5, 14, UNI_INPC__BOTTOMANDRIGHT } /* inpc=bottomandright */, - { 0, 2224, 6962, 3, 10, UNI_SUPERANDSUB } /* insuperandsub */, - { 314, 3241, 0, 11, 0, UNI_GEORGIANSUP } /* georgiansup */, - { 0, 5791, 5869, 13, 13, UNI_JG__MANICHAEANMEM } /* joininggroup=manichaeanmem */, - { 152, 5986, 8035, 13, 8, UNI_NV__3_SLASH_4 } /* numericvalue=7.50e-01 */, - { 288, 8858, 0, 6, 0, UNI_ecomp_values_index } /* ecomp= */, - { 0, 7739, 10135, 8, 3, UNI_IDS } /* idstart=yes */, - { 1, 8780, 2912, 6, 19, UNI_SUNDANESESUP } /* block=sundanesesupplement */, - { 512, 10060, 9255, 3, 5, -UNI_RI } /* ri=false */, - { 4, 8589, 8477, 7, 4, UNI_MAKA } /* script=maka */, - { 0, 9616, 0, 4, 0, UNI_KTHI } /* kthi */, - { 35, 8589, 8442, 7, 7, UNI_SC__HANO } /* script=hanunoo */, - { 603, 5791, 7148, 13, 10, UNI_JG__DALATHRISH } /* joininggroup=dalathrish */, - { 2, 7088, 1, 11, 1, UNI_BC__BN } /* bidiclass=bn */, - { 265, 2779, 0, 4, 0, UNI_IDST } /* idst */, - { 28, 10048, 8035, 3, 8, UNI_NV__3_SLASH_4 } /* nv=7.50e-01 */, - { 0, 10033, 495, 3, 7, UNI_LB__NU } /* lb=numeric */, - { 0, 4989, 58, 3, 4, UNI_UIDEO } /* isuideo */, - { 13, 8768, 9255, 6, 5, -UNI_BIDIC } /* bidic=false */, - { 292, 3836, 2409, 17, 4, UNI_GLAG } /* scriptextensions=glag */, - { 1, 9277, 9652, 3, 4, UNI_MERC } /* sc=merc */, - { 1, 9277, 8666, 
3, 7, UNI_SC__TIRH } /* sc=tirhuta */, - { 64, 9277, 8291, 3, 4, UNI_SC__TAGB } /* sc=tagb */, - { 13, 4916, 8639, 3, 6, UNI_TGLG } /* istagalog */, - { 0, 9277, 8470, 3, 7, UNI_SC__LINA } /* sc=lineara */, - { 5, 184, 5830, 2, 13, UNI_LOWSURROGATES } /* islowsurrogates */, - { 714, 184, 2855, 2, 9, UNI_MONG } /* ismongolian */, - { 73, 9070, 1, 5, 1, -UNI_POSIXXDIGIT } /* ahex=n */, - { 36, 9488, 1018, 4, 5, UNI_MUSIC } /* blk=music */, - { 65, 5746, 1025, 6, 2, -UNI_EBASE } /* ebase=no */, - { 161, 10288, 7438, 8, 4, UNI_XPOSIXWORD } /* isxposixword */, - { 25, 8107, 0, 8, 0, UNI_BALI } /* balinese */, - { 2, 4613, 0, 15, 0, UNI_DIACRITICALSSUP } /* diacriticalssup */, - { 0, 9596, 7720, 4, 9, UNI_GCB__V } /* hst=voweljamo */, - { 212, 8780, 7684, 6, 9, UNI_INPAUCINHAU } /* block=paucinhau */, - { 1, 9262, 1823, 3, 5, UNI_SB__LO } /* sb=lower */, - { 0, 8498, 0, 4, 0, UNI_MULT } /* mult */, - { 0, 2245, 0, 21, 0, UNI_MEETEIMAYEKEXT } /* meeteimayekextensions */, - { 0, 9275, 2608, 5, 19, UNI_INSC__BRAHMIJOININGNUMBER } /* insc=brahmijoiningnumber */, - { 543, 9488, 3052, 4, 9, UNI_HALFMARKS } /* blk=halfmarks */, - { 0, 3097, 2785, 18, 3, UNI_DT__NAR } /* decompositiontype=nar */, - { 16, 4916, 5850, 3, 3, UNI_TAML } /* istaml */, - { 0, 3717, 7338, 17, 10, UNI_IDENTIFIERSTATUS__RESTRICTED } /* identifierstatus=restricted */, - { 3, 4129, 0, 16, 0, UNI_LATIN1 } /* latin1supplement */, - { 0, 3836, 2329, 17, 20, UNI_HLUW } /* scriptextensions=anatolianhieroglyphs */, - { 0, 10024, 4245, 3, 10, UNI_SM } /* gc=mathsymbol */, - { 389, 184, 1294, 2, 25, UNI_SUPERANDSUB } /* issuperscriptsandsubscripts */, - { 0, 5674, 10135, 13, 3, UNI_BIDIM } /* bidimirrored=yes */, - { 73, 4542, 1633, 4, 21, UNI_GEOMETRICSHAPESEXT } /* ingeometricshapesextended */, - { 1, 9768, 9860, 4, 4, UNI_VAI } /* scx=vaii */, - { 1024, 6576, 9255, 11, 5, -UNI_XPOSIXALPHA } /* alphabetic=false */, - { 0, 5228, 0, 14, 0, UNI_LATINEXTB } /* latinextendedb */, - { 0, 21, 3421, 2, 18, UNI_RUMI } /* 
inruminumeralsymbols */, - { 0, 5986, 7826, 13, 2, UNI_NV__12 } /* numericvalue=12 */, - { 513, 9488, 4129, 4, 16, UNI_LATIN1 } /* blk=latin1supplement */, - { 1, 10291, 7438, 5, 4, UNI_POSIXWORD } /* posixword */, - { 0, 8960, 26, 6, 1, UNI_NFCQC__Y } /* nfcqc=y */, - { 199, 9508, 9472, 4, 4, UNI_WB__EB } /* ccc=atbl */, - { 2, 9277, 8610, 3, 7, UNI_SIDD } /* sc=siddham */, - { 0, 10009, 9868, 3, 4, UNI_EA__F } /* dt=wide */, - { 0, 10048, 7469, 3, 8, UNI_NV__1_SLASH_2 } /* nv=5.00e-01 */, - { 16, 5986, 8756, 13, 2, UNI_NV__90 } /* numericvalue=90 */, - { 3, 2760, 36, 19, 1, UNI_GCB__T } /* hangulsyllabletype=t */, - { 31, 9568, 0, 4, 0, UNI_GREK } /* grek */, - { 0, 184, 8421, 2, 7, UNI_ELYM } /* iselymaic */, - { 5, 3937, 0, 8, 0, UNI_BOPO } /* bopomofo */, - { 815, 8680, 0, 7, 0, UNI_ZZZZ } /* unknown */, - { 3, 5324, 0, 12, 0, UNI_INMANICHAEAN } /* inmanichaean */, - { 2, 3836, 1222, 17, 4, UNI_KANA } /* scriptextensions=kana */, - { 0, 9285, 0, 4, 0, UNI_LIMB } /* limb */, - { 71, 184, 3115, 2, 13, UNI_DEVANAGARIEXT } /* isdevanagariext */, - { 518, 1505, 3827, 4, 5, UNI_INGRANTHA } /* ingrantha */, - { 151, 10033, 5298, 3, 14, UNI_LB__BK } /* lb=mandatorybreak */, - { 0, 8589, 9816, 7, 4, UNI_TAVT } /* script=tavt */, - { 67, 9488, 9245, 4, 5, UNI_INDOGRA } /* blk=dogra */, - { 0, 3836, 9752, 17, 4, UNI_ROHG } /* scriptextensions=rohg */, - { 32, 9270, 2549, 5, 12, UNI_INPC__TOPANDBOTTOM } /* inpc=topandbottom */, - { 0, 184, 5003, 2, 15, UNI_ZANB } /* iszanabazarsquare */, - { 6, 8203, 0, 8, 0, UNI_JAMOEXTA } /* jamoexta */, - { 1, 5037, 0, 8, 0, UNI_XPOSIXXDIGIT } /* hexdigit */, - { 48, 9335, 0, 4, 0, UNI_TAKR } /* takr */, - { 0, 1537, 1924, 4, 10, UNI_DIACRITICALS } /* indiacriticals */, - { 1, 9444, 7877, 4, 2, UNI_AGE__13 } /* age=13 */, - { 0, 727, 0, 2, 0, UNI_MN } /* mn */, - { 1, 9488, 2969, 4, 19, UNI_SUPARROWSC } /* blk=supplementalarrowsc */, - { 1, 5986, 8027, 13, 8, UNI_NV__15_SLASH_2 } /* numericvalue=7.50e+00 */, - { 34, 4838, 0, 16, 0, 
UNI_NFKCQC__N } /* nfkcquickcheck=n */, - { 0, 4401, 0, 9, 0, UNI_TANGUTSUP } /* tangutsup */, - { 32, 8589, 8131, 7, 8, UNI_SC__DUPL } /* script=duployan */, - { 21, 9275, 4913, 5, 15, UNI_INSC__REGISTERSHIFTER } /* insc=registershifter */, - { 52, 9528, 0, 3, 0, UNI_CWU } /* cwu */, - { 2, 184, 6061, 2, 11, UNI_BIDIC } /* isbidicontrol */, - { 0, 10033, 3969, 3, 16, UNI_LB__CP } /* lb=closeparenthesis */, - { 128, 9488, 4703, 4, 15, UNI_INIMPERIALARAMAIC } /* blk=imperialaramaic */, - { 84, 3529, 26, 18, 1, UNI_VS } /* variationselector=y */, - { 0, 8582, 0, 7, 0, UNI_PHAG } /* phagspa */, - { 545, 9277, 8491, 3, 4, UNI_MARC } /* sc=marc */, - { 0, 10048, 8083, 3, 8, UNI_NV__11_SLASH_12 } /* nv=9.17e-01 */, - { 0, 9768, 78, 4, 6, UNI_ARAB } /* scx=arabic */, - { 4, 9452, 0, 4, 0, UNI_AHOM } /* ahom */, - { 5, 184, 4241, 2, 16, UNI_MISCMATHSYMBOLSA } /* ismiscmathsymbolsa */, - { 129, 9488, 3169, 4, 11, UNI_ETHIOPICSUP } /* blk=ethiopicsup */, - { 0, 6229, 0, 5, 0, UNI_JOINC } /* joinc */, - { 0, 9277, 5284, 3, 4, UNI_LISU } /* sc=lisu */, - { 928, 8315, 0, 8, 0, UNI_UGAR } /* ugaritic */, - { 0, 1552, 400, 9, 6, UNI_CF } /* category=format */, - { 0, 10048, 9994, 3, 3, UNI_NV__9_SLASH_2 } /* nv=9/2 */, - { 279, 10048, 7811, 3, 8, UNI_NV__1_SLASH_6 } /* nv=1.67e-01 */, - { 0, 8978, 9255, 6, 5, -UNI__PERL_PATWS } /* patws=false */, - { 581, 3836, 1677, 17, 5, UNI_LATN } /* scriptextensions=latin */, - { 562, 9488, 1441, 4, 24, UNI_CJKSYMBOLS } /* blk=cjksymbolsandpunctuation */, - { 32, 1417, 8819, 24, 3, UNI_CCC__129 } /* canonicalcombiningclass=129 */, - { 1, 5452, 17, 15, 1, UNI_COMPEX } /* nfcquickcheck=no */, - { 128, 9277, 9504, 3, 4, UNI_CANS } /* sc=cans */, - { 0, 10006, 0, 3, 0, UNI_di_values_index } /* di= */, - { 2, 8780, 6277, 6, 7, UNI_MAHJONG } /* block=mahjong */, - { 145, 8780, 5186, 6, 14, UNI_HIGHSURROGATES } /* block=highsurrogates */, - { 0, 1417, 9188, 24, 2, UNI_CCC__31 } /* canonicalcombiningclass=31 */, - { 0, 1856, 9836, 22, 4, UNI_CWU } 
/* changeswhenuppercased=true */, - { 139, 9277, 9588, 3, 4, UNI_HMNG } /* sc=hmng */, - { 716, 9265, 26, 5, 1, UNI_IDST } /* idst=y */, - { 12, 4688, 2023, 15, 9, UNI_IDENTIFIERTYPE__TECHNICAL } /* identifiertype=technical */, - { 0, 7218, 10164, 10, 2, UNI_GCB__V } /* linebreak=jv */, - { 1, 10182, 1527, 6, 9, UNI__PERL_SURROGATE } /* _perl_surrogate */, - { 0, 2224, 350, 3, 32, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* insupplementalsymbolsandpictographs */, - { 0, 1505, 5161, 5, 11, UNI_INGREEK } /* ingreekandcoptic */, - { 65, 8589, 4868, 7, 15, UNI_NARB } /* script=oldnortharabian */, - { 0, 8589, 9656, 7, 4, UNI_MIAO } /* script=miao */, - { 301, 184, 4583, 2, 15, UNI_PD } /* isdashpunctuation */, - { 1, 9508, 9171, 5, 4, UNI_CCC__28 } /* ccc=ccc28 */, - { 1, 4113, 67, 3, 4, UNI_VSSUP } /* invssup */, - { 390, 2280, 4306, 3, 15, UNI_PO } /* isotherpunctuation */, - { 138, 10024, 1465, 3, 13, UNI_M } /* gc=combiningmark */, - { 1, 9508, 7877, 4, 2, UNI_CCC__13 } /* ccc=13 */, - { 4, 184, 4129, 2, 6, UNI_LATIN1 } /* islatin1 */, - { 147, 6241, 6529, 12, 12, UNI_JT__R } /* joiningtype=rightjoining */, - { 2, 6231, 2667, 4, 9, UNI_COUNTINGROD } /* incountingrod */, - { 2, 2280, 3332, 3, 17, UNI_ORNAMENTALDINGBATS } /* isornamentaldingbats */, - { 0, 5986, 7771, 13, 8, UNI_NV__1_SLASH_80 } /* numericvalue=1.25e-02 */, - { 0, 1417, 24, 24, 1, UNI_CCC__L } /* canonicalcombiningclass=l */, - { 2, 9020, 3, 6, 1, -UNI_XPOSIXUPPER } /* upper=f */, - { 3, 1746, 1, 22, 1, UNI_BPT__N } /* bidipairedbrackettype=n */, - { 1, 6730, 0, 11, 0, UNI_KATAKANAEXT } /* katakanaext */, - { 1, 9880, 0, 4, 0, UNI_YI } /* yiii */, - { 321, 9556, 406, 4, 7, UNI_GCB__CN } /* gcb=control */, - { 0, 9488, 3169, 4, 8, UNI_INETHIOPIC } /* blk=ethiopic */, - { 0, 9768, 8291, 4, 4, UNI_TAGB } /* scx=tagb */, - { 0, 10009, 8846, 3, 6, UNI_DT__ENC } /* dt=circle */, - { 0, 4033, 1910, 16, 2, UNI_CN } /* generalcategory=cn */, - { 0, 9508, 8811, 5, 5, UNI_CCC__122 } /* ccc=ccc122 */, - { 0, 9768, 7684, 
4, 9, UNI_PAUC } /* scx=paucinhau */, - { 0, 2224, 8632, 3, 6, UNI_SUPPUAB } /* insuppuab */, - { 38, 9768, 8407, 4, 7, UNI_DSRT } /* scx=deseret */, - { 1, 8589, 3937, 7, 8, UNI_SC__BOPO } /* script=bopomofo */, - { 0, 10027, 756, 3, 3, UNI_JG__DAL } /* jg=dal */, - { 555, 435, 0, 5, 0, UNI__PERL_NCHAR } /* nchar */, - { 19, 3836, 8428, 17, 4, UNI_GRAN } /* scriptextensions=gran */, - { 0, 3097, 0, 18, 0, UNI_dt_values_index } /* decompositiontype= */, - { 3, 7076, 7099, 3, 9, UNI_BOXDRAWING } /* inboxdrawing */, - { 2, 1988, 0, 22, 0, UNI_loe_values_index } /* logicalorderexception= */, - { 641, 1966, 3953, 22, 16, UNI_INSC__CANTILLATIONMARK } /* indicsyllabiccategory=cantillationmark */, - { 0, 8870, 10135, 6, 3, UNI_EPRES } /* epres=yes */, - { 523, 1790, 1025, 22, 2, -UNI_CWCM } /* changeswhencasemapped=no */, - { 0, 9488, 2287, 4, 7, UNI_INSINHALA } /* blk=sinhala */, - { 16, 1087, 26, 27, 1, UNI_PCM } /* prependedconcatenationmark=y */, - { 0, 8780, 1561, 6, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* block=supsymbolsandpictographs */, - { 0, 2665, 0, 11, 0, UNI_COUNTINGROD } /* countingrod */, - { 0, 1417, 9106, 25, 4, UNI_CCC__15 } /* canonicalcombiningclass=ccc15 */, - { 1, 8780, 8876, 6, 6, UNI_INGOTHIC } /* block=gothic */, - { 0, 21, 7458, 2, 10, UNI_YIRADICALS } /* inyiradicals */, - { 4, 3836, 9680, 17, 4, UNI_NBAT } /* scriptextensions=nbat */, - { 1, 8780, 2429, 6, 20, UNI_ININSCRIPTIONALPAHLAVI } /* block=inscriptionalpahlavi */, - { 9, 10003, 9836, 3, 4, UNI_CI } /* ci=true */, - { 768, 7076, 5816, 3, 7, UNI_INBALINESE } /* inbalinese */, - { 5, 2779, 0, 19, 0, UNI_idst_values_index } /* idstrinaryoperator= */, - { 0, 8930, 26, 6, 1, UNI_XPOSIXLOWER } /* lower=y */, - { 0, 9277, 4448, 3, 4, UNI_BAMU } /* sc=bamu */, - { 14, 7318, 7754, 10, 2, UNI_IN__11 } /* presentin=11 */, - { 0, 3115, 0, 18, 0, UNI_DEVANAGARIEXT } /* devanagariextended */, - { 0, 9095, 0, 5, 0, UNI_BUHD } /* buhid */, - { 32, 5452, 0, 15, 0, UNI_COMPEX } /* nfcquickcheck=n */, - { 
0, 1746, 0, 22, 0, UNI_bpt_values_index } /* bidipairedbrackettype= */, - { 22, 3374, 9255, 11, 5, -UNI_XPOSIXSPACE } /* whitespace=false */, - { 27, 8688, 2330, 3, 19, UNI_HLUW } /* isanatolianhieroglyphs */, - { 40, 5497, 0, 11, 0, UNI_MC } /* spacingmark */, - { 2, 9768, 9608, 4, 4, UNI_KITS } /* scx=kits */, - { 43, 2784, 1395, 4, 22, UNI_ARABICPFB } /* inarabicpresentationformsb */, - { 0, 9768, 6840, 4, 4, UNI_NAND } /* scx=nand */, - { 104, 3836, 7188, 17, 10, UNI_KHAR } /* scriptextensions=kharoshthi */, - { 23, 5986, 9392, 13, 4, UNI_NV__11_SLASH_2 } /* numericvalue=11/2 */, - { 320, 10048, 9372, 3, 4, UNI_NV__1_SLASH_40 } /* nv=1/40 */, - { 0, 9768, 6277, 4, 4, UNI_MAHJ } /* scx=mahj */, - { 6, 9997, 407, 3, 2, UNI_BC__ON } /* bc=on */, - { 72, 6205, 9255, 12, 5, -UNI_IDEO } /* ideographic=false */, - { 258, 184, 6277, 2, 4, UNI_MAHJ } /* ismahj */, - { 192, 7540, 1025, 9, 2, -UNI_EXT } /* extender=no */, - { 0, 9277, 9892, 3, 4, UNI_SC__QAAI } /* sc=zinh */, - { 9, 2912, 0, 4, 0, UNI_SUND } /* sund */, - { 0, 8688, 1007, 3, 26, UNI_ANCIENTGREEKMUSIC } /* isancientgreekmusicalnotation */, - { 379, 9488, 719, 4, 30, UNI_CUNEIFORMNUMBERS } /* blk=cuneiformnumbersandpunctuation */, - { 0, 21, 8470, 2, 7, UNI_INLINEARA } /* inlineara */, - { 0, 9277, 9624, 3, 4, UNI_LAO } /* sc=laoo */, - { 1, 5791, 5364, 13, 4, UNI_JG__HETH } /* joininggroup=heth */, - { 1, 3025, 0, 4, 0, UNI_CHER } /* cher */, - { 38, 10048, 9907, 3, 3, UNI_NV__1_SLASH_7 } /* nv=1/7 */, - { 0, 2224, 7399, 3, 9, UNI_SUPARROWSC } /* insuparrowsc */, - { 6, 7325, 10093, 3, 3, UNI_IN__4_DOT_1 } /* in=v41 */, - { 1, 10024, 48, 3, 1, UNI_P } /* gc=p */, - { 0, 1921, 0, 2, 0, UNI_SD } /* sd */, - { 0, 9488, 42, 4, 9, UNI_CJKCOMPAT } /* blk=cjkcompat */, - { 0, 5791, 9784, 13, 4, UNI_JG__SHIN } /* joininggroup=shin */, - { 0, 8589, 9544, 7, 4, UNI_DIAK } /* script=diak */, - { 105, 9997, 426, 3, 2, UNI_BC__ES } /* bc=es */, - { 459, 3904, 36, 17, 1, UNI_UIDEO } /* unifiedideograph=t */, - { 40, 
9345, 1025, 5, 2, -UNI_XIDC } /* xidc=no */, - { 0, 5986, 7877, 13, 2, UNI_NV__13 } /* numericvalue=13 */, - { 0, 1677, 0, 14, 0, UNI_LATINEXTA } /* latinextendeda */, - { 0, 7218, 96, 10, 10, UNI_LB__AL } /* linebreak=alphabetic */, - { 0, 10009, 2785, 3, 3, UNI_DT__NAR } /* dt=nar */, - { 572, 283, 0, 33, 0, UNI_MISCMATHSYMBOLSB } /* miscellaneousmathematicalsymbolsb */, - { 2, 9768, 4883, 4, 15, UNI_SARB } /* scx=oldsoutharabian */, - { 0, 8526, 0, 7, 0, UNI_NB } /* noblock */, - { 20, 9824, 0, 4, 0, UNI_TGLG } /* tglg */, - { 0, 9768, 8561, 4, 4, UNI_OSMA } /* scx=osma */, - { 0, 9285, 0, 5, 0, UNI_LIMB } /* limbu */, - { 6, 9277, 4145, 3, 7, UNI_SC__LINB } /* sc=linearb */, - { 330, 9275, 4508, 5, 15, UNI_INSC__CONSONANTKILLER } /* insc=consonantkiller */, - { 0, 5986, 4134, 13, 1, UNI_NV__1 } /* numericvalue=1 */, - { 20, 9640, 3, 4, 1, -UNI_LOE } /* loe=f */, - { 0, 3836, 4001, 17, 7, UNI_CPRT } /* scriptextensions=cypriot */, - { 0, 6972, 0, 11, 0, UNI_SYLO } /* sylotinagri */, - { 306, 5986, 8710, 13, 4, UNI_NV__6000 } /* numericvalue=6000 */, - { 11, 5746, 9255, 6, 5, -UNI_EBASE } /* ebase=false */, - { 962, 184, 6397, 2, 12, UNI_MATHALPHANUM } /* ismathalphanum */, - { 1, 5032, 0, 13, 0, UNI_POSIXXDIGIT } /* asciihexdigit */, - { 0, 9277, 1013, 3, 5, UNI_SC__GREK } /* sc=greek */, - { 0, 1979, 10171, 10, 1, UNI_CASEDLETTER } /* category=l_ */, - { 0, 10126, 471, 3, 2, UNI_VO__TU } /* vo=tu */, - { 0, 9508, 4912, 4, 2, UNI_CCC__0 } /* ccc=nr */, - { 0, 9832, 0, 4, 0, UNI_TIBT } /* tibt */, - { 1, 8435, 36, 7, 1, UNI_GRBASE } /* grbase=t */, - { 0, 9508, 756, 4, 2, UNI_CCC__DA } /* ccc=da */, - { 4, 8211, 0, 8, 0, UNI_JAMOEXTB } /* jamoextb */, - { 125, 1537, 4988, 24, 15, UNI_LOE } /* indicpositionalcategory=visualorderleft */, - { 0, 10048, 7843, 3, 8, UNI_NV__1_SLASH_4 } /* nv=2.50e-01 */, - { 0, 5200, 0, 7, 0, UNI_KANASUP } /* kanasup */, - { 0, 8780, 861, 6, 6, UNI_ARROWS } /* block=arrows */, - { 1, 6805, 842, 6, 25, UNI_MISCARROWS } /* 
inmiscellaneoussymbolsandarrows */, - { 0, 9596, 24, 4, 1, UNI_GCB__L } /* hst=l */, - { 0, 5986, 8714, 13, 5, UNI_NV__30000 } /* numericvalue=30000 */, - { 8, 9277, 4385, 3, 4, UNI_TANG } /* sc=tang */, - { 0, 8575, 10135, 7, 3, UNI_PATSYN } /* patsyn=yes */, - { 0, 1218, 0, 26, 0, UNI_KATAKANAEXT } /* katakanaphoneticextensions */, - { 3, 5986, 5649, 13, 1, UNI_NV__0 } /* numericvalue=0 */, - { 64, 10027, 5368, 3, 14, UNI_JG__MANICHAEANKAPH } /* jg=manichaeankaph */, - { 0, 10048, 9409, 3, 3, UNI_NV__5_SLASH_2 } /* nv=5/2 */, - { 776, 184, 5843, 2, 9, UNI_MLYM } /* ismalayalam */, - { 0, 4116, 2430, 3, 19, UNI_PHLI } /* isinscriptionalpahlavi */, - { 557, 9444, 7826, 4, 2, UNI_AGE__12 } /* age=12 */, - { 9, 10009, 10066, 3, 3, UNI_DT__SML } /* dt=sml */, - { 0, 9488, 4808, 4, 15, UNI_MISCPICTOGRAPHS } /* blk=miscpictographs */, - { 0, 8589, 9652, 7, 4, UNI_MERC } /* script=merc */, - { 1, 8589, 8315, 7, 4, UNI_UGAR } /* script=ugar */, - { 3, 8589, 3025, 7, 8, UNI_CHER } /* script=cherokee */, - { 0, 2529, 3, 20, 1, -UNI_TERM } /* terminalpunctuation=f */, - { 66, 9262, 8996, 3, 5, UNI_SB__ST } /* sb=sterm */, - { 0, 6012, 0, 13, 0, UNI_VERTICALFORMS } /* verticalforms */, - { 0, 8990, 0, 6, 0, UNI_RJNG } /* rejang */, - { 0, 9488, 6385, 4, 12, UNI_INMASARAMGONDI } /* blk=masaramgondi */, - { 0, 8960, 10135, 6, 3, UNI_NFCQC__Y } /* nfcqc=yes */, - { 4, 9520, 36, 4, 1, UNI_CWL } /* cwl=t */, - { 75, 1222, 0, 4, 0, UNI_KANA } /* kana */, - { 41, 4033, 341, 16, 2, UNI_PE } /* generalcategory=pe */, - { 11, 9820, 0, 4, 0, UNI_TFNG } /* tfng */, - { 0, 2288, 4068, 5, 13, UNI_HALFANDFULLFORMS } /* inhalfandfullforms */, - { 10, 5060, 1025, 14, 2, -UNI_CI } /* caseignorable=no */, - { 0, 9262, 4305, 3, 5, UNI_SB__XX } /* sb=other */, - { 90, 7155, 3053, 3, 8, UNI_HALFMARKS } /* ishalfmarks */, - { 404, 10290, 5040, 6, 5, UNI_XPOSIXDIGIT } /* xposixdigit */, - { 0, 10027, 7711, 3, 9, UNI_JG__SYRIACWAW } /* jg=syriacwaw */, - { 672, 7098, 0, 10, 0, UNI_BOXDRAWING } /* 
boxdrawing */, - { 1, 9768, 1013, 4, 5, UNI_GREK } /* scx=greek */, - { 0, 9444, 7987, 4, 3, UNI_AGE__6_DOT_2 } /* age=6.2 */, - { 0, 3133, 1025, 18, 2, -UNI_EBASE } /* emojimodifierbase=no */, - { 16, 1812, 9836, 22, 4, UNI_CWL } /* changeswhenlowercased=true */, - { 1, 117, 447, 3, 31, UNI_IDEOGRAPHICSYMBOLS } /* inideographicsymbolsandpunctuation */, - { 87, 1417, 8727, 24, 2, UNI_CCC__32 } /* canonicalcombiningclass=32 */, - { 546, 9768, 7675, 4, 9, UNI_PALM } /* scx=palmyrene */, - { 32, 9768, 3241, 4, 4, UNI_GEOR } /* scx=geor */, - { 0, 9764, 0, 4, 0, UNI_SARB } /* sarb */, - { 0, 10033, 73, 3, 2, UNI_EMOD } /* lb=em */, - { 4, 3836, 9335, 17, 4, UNI_TAKR } /* scriptextensions=takr */, - { 1097, 10291, 5039, 5, 6, UNI_POSIXXDIGIT } /* posixxdigit */, - { 128, 7249, 3583, 4, 15, UNI_UCAS } /* iscanadiansyllabics */, - { 268, 8589, 7308, 7, 10, UNI_PHNX } /* script=phoenician */, - { 36, 184, 2485, 2, 4, UNI_MONG } /* ismong */, - { 0, 8694, 0, 6, 0, UNI_XPOSIXSPACE } /* wspace */, - { 2, 9508, 7826, 4, 2, UNI_CCC__12 } /* ccc=12 */, - { 15, 1587, 0, 1, 0, UNI_Z } /* z */, - { 10, 10048, 9436, 3, 4, UNI_NV__7_SLASH_12 } /* nv=7/12 */, - { 2, 9488, 2308, 4, 6, UNI_YIJING } /* blk=yijing */, - { 0, 2182, 10174, 21, 2, UNI_GCB__XX } /* graphemeclusterbreak=xx */, - { 0, 1746, 17, 22, 1, UNI_BPT__O } /* bidipairedbrackettype=o */, - { 0, 3836, 493, 17, 3, UNI_HAN } /* scriptextensions=han */, - { 1, 1087, 9836, 27, 4, UNI_PCM } /* prependedconcatenationmark=true */, - { 0, 7418, 9255, 10, 5, -UNI_XPOSIXUPPER } /* uppercase=false */, - { 4, 1114, 3, 26, 1, -UNI_CWKCF } /* changeswhennfkccasefolded=f */, - { 0, 7028, 9881, 3, 3, UNI_YI } /* isyiii */, - { 4, 4033, 45, 16, 2, UNI_CO } /* generalcategory=co */, - { 0, 4916, 2077, 3, 21, UNI_TRANSPORTANDMAP } /* istransportandmapsymbols */, - { 0, 8780, 8203, 6, 8, UNI_JAMOEXTA } /* block=jamoexta */, - { 7, 7155, 1116, 3, 3, UNI_HANG } /* ishang */, - { 89, 8780, 2308, 6, 6, UNI_YIJING } /* block=yijing */, - { 21, 
184, 8171, 2, 8, UNI_GUJR } /* isgujarati */, - { 1024, 9768, 8924, 4, 4, UNI_LEPC } /* scx=lepc */, - { 5, 10129, 0, 3, 0, UNI_vs_values_index } /* vs= */, - { 3, 9664, 0, 4, 0, UNI_MRO } /* mroo */, - { 0, 8780, 2245, 6, 21, UNI_MEETEIMAYEKEXT } /* block=meeteimayekextensions */, - { 0, 6576, 1025, 11, 2, -UNI_XPOSIXALPHA } /* alphabetic=no */, - { 29, 184, 382, 2, 32, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* isegyptianhieroglyphformatcontrols */, - { 2, 9270, 868, 3, 17, UNI_PHONETICEXT } /* inphoneticextensions */, - { 9, 9015, 0, 5, 0, UNI_ideo_values_index } /* ideo= */, - { 0, 10033, 7448, 3, 10, UNI_LB__WJ } /* lb=wordjoiner */, - { 7, 7239, 0, 2, 0, UNI_VS } /* vs */, - { 352, 9488, 3938, 5, 15, UNI_BOPOMOFOEXT } /* blk=bopomofoextended */, - { 0, 9488, 2477, 4, 3, UNI_PUA } /* blk=pua */, - { 7, 184, 2817, 2, 4, UNI_MERO } /* ismero */, - { 0, 5960, 0, 13, 0, UNI_MISCTECHNICAL } /* misctechnical */, - { 160, 8840, 0, 6, 0, UNI_CAKM } /* chakma */, - { 521, 5726, 0, 13, 0, UNI_ME } /* enclosingmark */, - { 23, 1417, 9101, 25, 4, UNI_CCC__14 } /* canonicalcombiningclass=ccc14 */, - { 2, 8688, 727, 4, 2, UNI_ARMN } /* isarmn */, - { 2, 184, 2469, 2, 20, UNI_HMNP } /* isnyiakengpuachuehmong */, - { 757, 10290, 1867, 6, 5, UNI_XPOSIXUPPER } /* xposixupper */, - { 8, 10132, 125, 3, 2, UNI_LB__CR } /* wb=cr */, - { 161, 9768, 4001, 4, 7, UNI_CPRT } /* scx=cypriot */, - { 0, 184, 1442, 3, 9, UNI_CJKSYMBOLS } /* iscjksymbols */, - { 0, 9768, 9548, 4, 4, UNI_DSRT } /* scx=dsrt */, - { 0, 3836, 6792, 18, 3, UNI_SAMR } /* scriptextensions=samr */, - { 144, 4542, 3226, 5, 15, UNI_INPUNCTUATION } /* ingeneralpunctuation */, - { 634, 4116, 1308, 3, 2, UNI_IDS } /* isids */, - { 10, 9346, 1025, 4, 2, -UNI_IDC } /* idc=no */, - { 32, 184, 8421, 2, 4, UNI_ELYM } /* iselym */, - { 4, 9275, 8099, 5, 8, UNI_INSC__AVAGRAHA } /* insc=avagraha */, - { 132, 8575, 36, 7, 1, UNI_PATSYN } /* patsyn=t */, - { 0, 3836, 8091, 17, 8, UNI_ARMN } /* scriptextensions=armenian */, - { 0, 
5791, 6565, 13, 11, UNI_JG__AFRICANNOON } /* joininggroup=africannoon */, - { 1, 2288, 2724, 4, 8, UNI_JAMO } /* inhanguljamo */, - { 0, 5452, 47, 14, 1, UNI_NFCQC__M } /* nfcquickcheck=m */, - { 1, 9684, 0, 4, 0, UNI_NEWA } /* newa */, - { 549, 9488, 867, 4, 11, UNI_PHONETICEXT } /* blk=phoneticext */, - { 513, 8762, 1025, 6, 2, -UNI_XPOSIXALPHA } /* alpha=no */, - { 455, 8780, 5804, 6, 13, UNI_KANAEXTA } /* block=kanaextendeda */, - { 1, 184, 3937, 2, 11, UNI_BOPOMOFOEXT } /* isbopomofoext */, - { 783, 5986, 9050, 13, 5, UNI_NV__1_SLASH_160 } /* numericvalue=1/160 */, - { 7, 10024, 3277, 3, 18, UNI_PI } /* gc=initialpunctuation */, - { 0, 9262, 339, 3, 2, UNI_SB__LO } /* sb=lo */, - { 0, 2161, 26, 21, 1, UNI_EXTPICT } /* extendedpictographic=y */, - { 1140, 7249, 3600, 4, 15, UNI_AGHB } /* iscaucasianalbanian */, - { 3, 9768, 9320, 4, 5, UNI_OSGE } /* scx=osage */, - { 0, 5060, 0, 13, 0, UNI_CI } /* caseignorable */, - { 147, 10048, 9376, 3, 3, UNI_NV__1_SLASH_6 } /* nv=1/6 */, - { 301, 7027, 0, 11, 0, UNI_YISYLLABLES } /* yisyllables */, - { 9, 10033, 7268, 3, 10, UNI_LB__NS } /* lb=nonstarter */, - { 192, 5508, 9255, 14, 5, -UNI_PATSYN } /* patternsyntax=false */, - { 1, 8954, 26, 6, 1, UNI__PERL_NCHAR } /* nchar=y */, - { 1, 5986, 5648, 13, 6, UNI_NV__100000 } /* numericvalue=100000 */, - { 5, 2224, 7389, 3, 9, UNI_SUPARROWSB } /* insuparrowsb */, - { 0, 10024, 25, 3, 1, UNI_S } /* gc=s */, - { 0, 5986, 7835, 13, 8, UNI_NV__5_SLASH_2 } /* numericvalue=2.50e+00 */, - { 303, 5986, 1249, 13, 3, UNI_NV__NAN } /* numericvalue=nan */, - { 1, 1768, 36, 22, 1, UNI_CWCF } /* changeswhencasefolded=t */, - { 0, 8688, 7497, 4, 7, UNI_ARABICPFA } /* isarabicpfa */, - { 264, 8780, 183, 6, 20, UNI_MISCSYMBOLS } /* block=miscellaneoussymbols */, - { 0, 9277, 6796, 3, 11, UNI_MEDF } /* sc=medefaidrin */, - { 672, 184, 1466, 3, 23, UNI_DIACRITICALSFORSYMBOLS } /* iscombiningmarksforsymbols */, - { 3, 9997, 3756, 3, 3, UNI_BC__NSM } /* bc=nsm */, - { 4, 2569, 18, 20, 1, 
UNI_VO__R } /* verticalorientation=r */, - { 3, 9508, 10166, 4, 2, UNI_CCC__8 } /* ccc=kv */, - { 0, 8762, 0, 6, 0, UNI_alpha_values_index } /* alpha= */, - { 13, 9768, 8498, 4, 4, UNI_MULT } /* scx=mult */, - { 2, 5986, 5648, 13, 2, UNI_NV__10 } /* numericvalue=10 */, - { 0, 8864, 9836, 6, 4, UNI_EMOJI } /* emoji=true */, - { 0, 2224, 7359, 3, 9, UNI_INSAURASHTRA } /* insaurashtra */, - { 514, 9444, 10111, 4, 3, UNI_AGE__6_DOT_2 } /* age=v62 */, - { 1, 184, 2703, 2, 19, UNI_ENCLOSEDALPHANUMSUP } /* isenclosedalphanumsup */, - { 0, 9768, 9305, 4, 5, UNI_NSHU } /* scx=nushu */, - { 152, 1746, 4898, 22, 4, UNI_BPT__O } /* bidipairedbrackettype=open */, - { 15, 184, 183, 2, 34, UNI_MISCPICTOGRAPHS } /* ismiscellaneoussymbolsandpictographs */, - { 617, 7438, 7603, 10, 9, UNI_WB__ML } /* wordbreak=midletter */, - { 0, 5986, 8019, 13, 8, UNI_NV__2_SLASH_3 } /* numericvalue=6.67e-01 */, - { 2306, 9277, 9700, 3, 4, UNI_OLCK } /* sc=olck */, - { 2184, 9488, 349, 4, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* blk=supplementalsymbolsandpictographs */, - { 3, 5324, 8479, 4, 5, UNI_INMAKASAR } /* inmakasar */, - { 1, 9277, 9500, 3, 4, UNI_SC__CAKM } /* sc=cakm */, - { 2, 3836, 1176, 18, 3, UNI_SORA } /* scriptextensions=sora */, - { 0, 8589, 7292, 8, 3, UNI_SC__SOGD } /* script=sogd */, - { 0, 3836, 9038, 17, 6, UNI_YEZI } /* scriptextensions=yezidi */, - { 0, 5791, 5944, 13, 3, UNI_JG__WAW } /* joininggroup=waw */, - { 22, 6505, 0, 12, 0, UNI_PHAISTOS } /* phaistosdisc */, - { 9, 8858, 9255, 6, 5, -UNI_ECOMP } /* ecomp=false */, - { 1, 9020, 9836, 6, 4, UNI_XPOSIXUPPER } /* upper=true */, - { 355, 2760, 911, 19, 1, UNI_GCB__V } /* hangulsyllabletype=v */, - { 0, 1417, 8010, 24, 2, UNI_CCC__36 } /* canonicalcombiningclass=36 */, - { 0, 9277, 9820, 3, 4, UNI_TFNG } /* sc=tfng */, - { 1, 1537, 6983, 24, 11, UNI_INPC__TOPANDRIGHT } /* indicpositionalcategory=topandright */, - { 0, 9277, 8, 4, 3, UNI_SC__KANA } /* sc=kana */, - { 1, 184, 4718, 2, 15, UNI_LOWERCASELETTER } /* 
islowercaseletter */, - { 1, 2529, 0, 4, 0, UNI_TERM } /* term */, - { 90, 9768, 5171, 4, 4, UNI_CHAM } /* scx=cham */, - { 1157, 8589, 3079, 7, 4, UNI_SC__COPT } /* script=copt */, - { 1116, 9488, 2931, 4, 19, UNI_SUPARROWSA } /* blk=supplementalarrowsa */, - { 1, 8589, 4928, 7, 5, UNI_SC__TAML } /* script=tamil */, - { 2148, 4598, 0, 15, 0, UNI_DIACRITICALSEXT } /* diacriticalsext */, - { 10, 9277, 8652, 3, 7, UNI_TAVT } /* sc=taiviet */, - { 0, 9277, 6181, 3, 12, UNI_SC__GONG } /* sc=gunjalagondi */, - { 531, 9277, 4448, 3, 5, UNI_BAMU } /* sc=bamum */, - { 49, 6420, 9316, 3, 4, UNI_INORIYA } /* inoriya */, - { 1, 10048, 7859, 3, 8, UNI_NV__20000000 } /* nv=20000000 */, - { 0, 10048, 7851, 3, 8, UNI_NV__1_SLASH_40 } /* nv=2.50e-02 */, - { 6, 9768, 8786, 4, 6, UNI_CARI } /* scx=carian */, - { 1, 5986, 7814, 13, 1, UNI_NV__7 } /* numericvalue=7 */, - { 1, 4033, 3277, 16, 18, UNI_PI } /* generalcategory=initialpunctuation */, - { 0, 4916, 4386, 3, 15, UNI_TANGUTCOMPONENTS } /* istangutcomponents */, - { 253, 8652, 0, 7, 0, UNI_TAVT } /* taiviet */, - { 0, 9488, 908, 4, 14, UNI_PUA } /* blk=privateusearea */, - { 0, 10288, 10303, 8, 5, UNI_XPOSIXBLANK } /* isxposixblank */, - { 0, 10048, 7763, 3, 8, UNI_NV__1_SLASH_8 } /* nv=1.25e-01 */, - { 26, 9488, 3421, 4, 4, UNI_RUMI } /* blk=rumi */, - { 4, 9488, 4928, 4, 8, UNI_TAMILSUP } /* blk=tamilsup */, - { 1540, 7088, 3313, 10, 18, UNI_BC__LRI } /* bidiclass=lefttorightisolate */, - { 0, 3151, 10135, 18, 3, UNI_EPRES } /* emojipresentation=yes */, - { 0, 4033, 2268, 16, 2, UNI_PD } /* generalcategory=pd */, - { 2343, 4113, 4974, 3, 14, UNI_VEDICEXT } /* invedicextensions */, - { 100, 9768, 8936, 4, 4, UNI_LYCI } /* scx=lyci */, - { 0, 3836, 8291, 17, 8, UNI_TAGB } /* scriptextensions=tagbanwa */, - { 0, 467, 0, 11, 0, UNI_P } /* punctuation */, - { 17, 10048, 8710, 3, 3, UNI_NV__600 } /* nv=600 */, - { 0, 3836, 8421, 17, 4, UNI_ELYM } /* scriptextensions=elym */, - { 66, 8589, 8924, 7, 4, UNI_LEPC } /* script=lepc */, - 
{ 2, 9230, 1, 5, 1, -UNI_CWCF } /* cwcf=n */, - { 6, 9488, 8617, 4, 7, UNI_INSOYOMBO } /* blk=soyombo */, - { 0, 2608, 0, 6, 0, UNI_BRAH } /* brahmi */, - { 357, 184, 6829, 2, 11, UNI_MYANMAREXTB } /* ismyanmarextb */, - { 2136, 9444, 9982, 4, 3, UNI_AGE__6_DOT_3 } /* age=6.3 */, - { 1655, 9768, 9688, 4, 3, UNI_NKO } /* scx=nko */, - { 1541, 1417, 7890, 24, 2, UNI_CCC__33 } /* canonicalcombiningclass=33 */, - { 1, 8774, 0, 6, 0, UNI_bidim_values_index } /* bidim= */, - { 0, 9768, 9245, 4, 5, UNI_DOGR } /* scx=dogra */, - { 12, 9508, 9108, 4, 2, UNI_CCC__15 } /* ccc=15 */, - { 0, 10027, 9784, 3, 4, UNI_JG__SHIN } /* jg=shin */, - { 280, 8589, 8659, 7, 7, UNI_TIBT } /* script=tibetan */, - { 17, 10033, 1822, 3, 2, UNI_LB__NL } /* lb=nl */, - { 1, 3904, 1025, 17, 2, -UNI_UIDEO } /* unifiedideograph=no */, - { 227, 10048, 9988, 3, 3, UNI_NV__7_SLASH_8 } /* nv=7/8 */, - { 0, 9768, 3025, 4, 4, UNI_CHER } /* scx=cher */, - { 2, 3836, 9652, 17, 4, UNI_MERC } /* scriptextensions=merc */, - { 0, 1417, 18, 24, 1, UNI_CCC__R } /* canonicalcombiningclass=r */, - { 1, 3836, 8219, 17, 8, UNI_JAVA } /* scriptextensions=javanese */, - { 0, 4989, 513, 3, 15, UNI_UIDEO } /* isunifiedideograph */, - { 3, 184, 4478, 2, 4, UNI_BRAI } /* isbrai */, - { 17, 184, 5158, 2, 14, UNI_INGREEK } /* isgreekandcoptic */, - { 304, 3836, 7428, 17, 10, UNI_WARA } /* scriptextensions=warangciti */, - { 832, 2779, 9836, 19, 4, UNI_IDST } /* idstrinaryoperator=true */, - { 192, 9768, 9285, 4, 4, UNI_LIMB } /* scx=limb */, - { 5, 3853, 0, 17, 0, UNI_sterm_values_index } /* sentenceterminal= */, - { 0, 10024, 3985, 3, 16, UNI_PE } /* gc=closepunctuation */, - { 0, 7088, 5494, 10, 14, UNI_BC__NSM } /* bidiclass=nonspacingmark */, - { 1232, 4542, 3243, 4, 16, UNI_GEORGIANSUP } /* ingeorgiansupplement */, - { 1026, 8780, 8211, 6, 8, UNI_JAMOEXTB } /* block=jamoextb */, - { 8, 9556, 1910, 4, 2, UNI_GCB__CN } /* gcb=cn */, - { 1, 3133, 3, 18, 1, -UNI_EBASE } /* emojimodifierbase=f */, - { 0, 8589, 8912, 7, 4, 
UNI_SC__KHOJ } /* script=khoj */, - { 0, 184, 8470, 2, 7, UNI_LINA } /* islineara */, - { 1, 7218, 10030, 10, 2, UNI_GCB__T } /* linebreak=jt */, - { 136, 10291, 3379, 5, 5, UNI_POSIXSPACE } /* posixspace */, - { 26, 4116, 4704, 3, 14, UNI_ARMI } /* isimperialaramaic */, - { 0, 5592, 0, 14, 0, UNI_ZS } /* spaceseparator */, - { 39, 10048, 7468, 3, 9, UNI_NV___MINUS_1_SLASH_2 } /* nv=-5.00e-01 */, - { 2405, 8984, 9255, 6, 5, -UNI_QMARK } /* qmark=false */, - { 1, 8589, 9880, 7, 4, UNI_SC__YI } /* script=yiii */, - { 0, 21, 6730, 2, 11, UNI_KATAKANAEXT } /* inkatakanaext */, - { 776, 184, 8477, 2, 7, UNI_MAKA } /* ismakasar */, - { 1, 2224, 2288, 3, 20, UNI_SINHALAARCHAICNUMBERS } /* insinhalaarchaicnumbers */, - { 1540, 10296, 8583, 3, 6, UNI_PHAG } /* isphagspa */, - { 19, 9508, 8793, 5, 4, UNI_CCC__10 } /* ccc=ccc10 */, - { 0, 9270, 5551, 3, 13, UNI_INPSALTERPAHLAVI } /* inpsalterpahlavi */, - { 36, 2032, 1025, 22, 2, -UNI__PERL_NCHAR } /* noncharactercodepoint=no */, - { 23, 9488, 4145, 4, 16, UNI_LINEARBIDEOGRAMS } /* blk=linearbideograms */, - { 617, 3379, 26, 6, 1, UNI_XPOSIXSPACE } /* space=y */, - { 137, 184, 2912, 2, 19, UNI_SUNDANESESUP } /* issundanesesupplement */, - { 770, 9508, 2809, 4, 2, UNI_CCC__1 } /* ccc=ov */, - { 0, 1417, 9116, 25, 4, UNI_CCC__17 } /* canonicalcombiningclass=ccc17 */, - { 271, 5986, 7907, 13, 8, UNI_NV__3_SLASH_8 } /* numericvalue=3.75e-01 */, - { 1028, 8780, 4554, 7, 14, UNI_CONTROLPICTURES } /* block=controlpictures */, - { 400, 8780, 8421, 6, 7, UNI_INELYMAIC } /* block=elymaic */, - { 0, 9270, 2449, 5, 4, UNI_INPC__LEFT } /* inpc=left */, - { 0, 8688, 9066, 3, 4, UNI_ADLM } /* isadlam */, - { 0, 8589, 9748, 7, 4, UNI_RJNG } /* script=rjng */, - { 0, 9230, 9255, 5, 5, -UNI_CWCF } /* cwcf=false */, - { 3, 5116, 9255, 14, 5, -UNI_EMOD } /* emojimodifier=false */, - { 259, 5578, 49, 14, 2, UNI_SB__AT } /* sentencebreak=at */, - { 0, 9277, 7621, 3, 9, UNI_NBAT } /* sc=nabataean */, - { 2, 184, 3098, 2, 5, UNI_ECOMP } /* isecomp 
*/, - { 36, 3836, 9872, 17, 4, UNI_XPEO } /* scriptextensions=xpeo */, - { 1808, 10027, 2223, 3, 3, UNI_JG__AIN } /* jg=ain */, - { 0, 4116, 3735, 3, 16, UNI_INDICSIYAQNUMBERS } /* isindicsiyaqnumbers */, - { 0, 10033, 2640, 3, 2, UNI_LB__BA } /* lb=ba */, - { 0, 10346, 8682, 4, 5, UNI_ZZZZ } /* isunknown */, - { 1, 9277, 9560, 3, 4, UNI_SC__GONG } /* sc=gong */, - { 14, 5508, 1, 14, 1, -UNI_PATSYN } /* patternsyntax=n */, - { 1, 10009, 8163, 3, 8, UNI_DT__FRA } /* dt=fraction */, - { 13, 8589, 382, 7, 4, UNI_EGYP } /* script=egyp */, - { 0, 2182, 5746, 21, 5, UNI_WB__EB } /* graphemeclusterbreak=ebase */, - { 542, 184, 7368, 2, 10, UNI_SMALLFORMS } /* issmallforms */, - { 0, 9240, 1, 5, 1, -UNI_DASH } /* dash=n */, - { 0, 3836, 6840, 17, 4, UNI_NAND } /* scriptextensions=nand */, - { 0, 9277, 6840, 3, 11, UNI_SC__NAND } /* sc=nandinagari */, - { 0, 8780, 1723, 6, 23, UNI_SUPPUNCTUATION } /* block=supplementalpunctuation */, - { 0, 9492, 17, 4, 1, UNI_BPT__O } /* bpt=o */, - { 1, 3600, 0, 4, 0, UNI_UCAS } /* ucas */, - { 329, 5578, 495, 14, 2, UNI_SB__NU } /* sentencebreak=nu */, - { 0, 8780, 10051, 6, 3, UNI_OCR } /* block=ocr */, - { 1295, 10296, 6506, 3, 7, UNI_PHAISTOS } /* isphaistos */, - { 72, 3836, 9804, 17, 4, UNI_TALE } /* scriptextensions=tale */, - { 0, 10027, 5396, 3, 14, UNI_JG__MANICHAEANRESH } /* jg=manichaeanresh */, - { 4, 10048, 9904, 3, 3, UNI_NV__1_SLASH_5 } /* nv=1/5 */, - { 2184, 133, 0, 4, 0, UNI_M } /* mark */, - { 1, 184, 6609, 2, 10, UNI_DEP } /* isdeprecated */, - { 76, 4688, 6433, 15, 12, UNI_IDENTIFIERTYPE__NOTCHARACTER } /* identifiertype=notcharacter */, - { 0, 2224, 1295, 3, 24, UNI_SUPERANDSUB } /* insuperscriptsandsubscripts */, - { 0, 9277, 3115, 3, 10, UNI_SC__DEVA } /* sc=devanagari */, - { 0, 2224, 7379, 3, 9, UNI_SUPARROWSA } /* insuparrowsa */, - { 0, 10048, 8027, 3, 8, UNI_NV__15_SLASH_2 } /* nv=7.50e+00 */, - { 12, 1552, 44, 10, 1, UNI_SK } /* category=sk */, - { 0, 184, 2560, 2, 4, UNI_MAND } /* ismand */, - { 0, 9508, 8, 
4, 1, UNI_CCC__A } /* ccc=a */, - { 261, 6385, 0, 12, 0, UNI_GONM } /* masaramgondi */, - { 1, 8780, 1393, 6, 24, UNI_ARABICPFB } /* block=arabicpresentationformsb */, - { 62, 1417, 8568, 24, 7, UNI_CCC__1 } /* canonicalcombiningclass=overlay */, - { 386, 5986, 7754, 13, 2, UNI_NV__11 } /* numericvalue=11 */, - { 0, 9628, 0, 4, 0, UNI_LATN } /* latn */, - { 0, 9275, 5634, 5, 14, UNI_INSC__VOWELDEPENDENT } /* insc=voweldependent */, - { 0, 9444, 10114, 4, 3, UNI_AGE__6_DOT_3 } /* age=v63 */, - { 139, 8780, 2608, 6, 6, UNI_INBRAHMI } /* block=brahmi */, - { 0, 8780, 4289, 6, 16, UNI_MYANMAREXTB } /* block=myanmarextendedb */, - { 91, 10060, 3, 3, 1, -UNI_RI } /* ri=f */, - { 74, 8589, 9824, 7, 4, UNI_SC__TGLG } /* script=tglg */, - { 15, 9277, 3753, 5, 15, UNI_KITS } /* sc=khitansmallscript */, - { 0, 9676, 0, 4, 0, UNI_NARB } /* narb */, - { 1, 2784, 7060, 4, 8, UNI_ARABICEXTA } /* inarabicexta */, - { 6, 8589, 9876, 7, 4, UNI_XSUX } /* script=xsux */, - { 0, 2280, 7280, 4, 8, UNI_XPEO } /* isoldpersian */, - { 0, 184, 5674, 2, 12, UNI_BIDIM } /* isbidimirrored */, - { 1305, 8894, 3, 6, 1, -UNI_JOINC } /* joinc=f */, - { 13, 5791, 6337, 13, 12, UNI_JG__MALAYALAMNYA } /* joininggroup=malayalamnya */, - { 798, 184, 1631, 2, 15, UNI_GEOMETRICSHAPES } /* isgeometricshapes */, - { 1, 1188, 4386, 3, 15, UNI_TANGUTCOMPONENTS } /* intangutcomponents */, - { 513, 10033, 1527, 3, 9, UNI_LB__SG } /* lb=surrogate */, - { 5, 184, 7119, 3, 9, UNI_CHRS } /* ischorasmian */, - { 224, 9712, 0, 4, 0, UNI_OSGE } /* osge */, - { 0, 8267, 9836, 8, 4, UNI_RADICAL } /* radical=true */, - { 59, 9768, 6973, 5, 10, UNI_SYLO } /* scx=sylotinagri */, - { 1, 8780, 218, 7, 32, UNI_DIACRITICALSEXT } /* block=combiningdiacriticalmarksextended */, - { 608, 5986, 9976, 13, 3, UNI_NV__5_SLASH_8 } /* numericvalue=5/8 */, - { 2, 5986, 9360, 13, 4, UNI_NV___MINUS_1_SLASH_2 } /* numericvalue=-1/2 */, - { 705, 10024, 5726, 3, 13, UNI_ME } /* gc=enclosingmark */, - { 82, 8589, 4149, 8, 3, UNI_SARB } /* 
script=sarb */, - { 0, 7418, 36, 10, 1, UNI_XPOSIXUPPER } /* uppercase=t */, - { 0, 5791, 8918, 13, 6, UNI_JG__LAMADH } /* joininggroup=lamadh */, - { 514, 8589, 8107, 7, 8, UNI_BALI } /* script=balinese */, - { 0, 2161, 9836, 21, 4, UNI_EXTPICT } /* extendedpictographic=true */, - { 64, 3836, 8187, 17, 4, UNI_HIRA } /* scriptextensions=hira */, - { 16, 9488, 7239, 4, 2, UNI_INVS } /* blk=vs */, - { 1616, 8589, 7428, 7, 10, UNI_WARA } /* script=warangciti */, - { 0, 10288, 62, 8, 5, UNI_XPOSIXGRAPH } /* isxposixgraph */, - { 1, 3379, 0, 6, 0, UNI_wspace_values_index } /* space= */, - { 1042, 4658, 0, 15, 0, UNI_grext_values_index } /* graphemeextend= */, - { 1, 10048, 9379, 3, 2, UNI_NV__41 } /* nv=41 */, - { 5, 2280, 262, 3, 3, UNI_OSMA } /* isosma */, - { 0, 1966, 4913, 22, 15, UNI_INSC__REGISTERSHIFTER } /* indicsyllabiccategory=registershifter */, - { 0, 1812, 3, 22, 1, -UNI_CWL } /* changeswhenlowercased=f */, - { 0, 184, 27, 2, 2, UNI_LOWERCASELETTER } /* isll */, - { 0, 8780, 1879, 7, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* block=cjkcompatideographssup */, - { 0, 10048, 9412, 3, 4, UNI_NV__17_SLASH_2 } /* nv=17/2 */, - { 0, 9262, 866, 3, 2, UNI_SB__SP } /* sb=sp */, - { 37, 4838, 47, 15, 1, UNI_NFCQC__M } /* nfkcquickcheck=m */, - { 224, 8589, 9664, 7, 4, UNI_MRO } /* script=mroo */, - { 1, 9488, 689, 4, 30, UNI_CJKEXTG } /* blk=cjkunifiedideographsextensiong */, - { 1, 184, 9285, 2, 5, UNI_LIMB } /* islimbu */, - { 17, 5986, 7806, 13, 1, UNI_NV__6 } /* numericvalue=6 */, - { 0, 7540, 26, 9, 1, UNI_EXT } /* extender=y */, - { 607, 9277, 9320, 3, 5, UNI_OSGE } /* sc=osage */, - { 2, 9768, 8618, 5, 6, UNI_SOYO } /* scx=soyombo */, - { 0, 5746, 36, 6, 1, UNI_EBASE } /* ebase=t */, - { 0, 3836, 8990, 17, 6, UNI_RJNG } /* scriptextensions=rejang */, - { 5, 9768, 9696, 4, 4, UNI_OGAM } /* scx=ogam */, - { 4, 3374, 3, 11, 1, -UNI_XPOSIXSPACE } /* whitespace=f */, - { 12, 184, 1901, 3, 5, UNI_ZYYY } /* iscommon */, - { 546, 10296, 7685, 3, 8, UNI_PAUC } /* ispaucinhau 
*/, - { 0, 6469, 5904, 12, 4, UNI_NV__NAN } /* numerictype=none */, - { 80, 9277, 4793, 3, 15, UNI_MERC } /* sc=meroiticcursive */, - { 128, 8780, 6554, 6, 3, UNI_INIDC } /* block=idc */, - { 2, 9444, 7979, 4, 3, UNI_AGE__6 } /* age=6.0 */, - { 0, 1269, 0, 25, 0, UNI_compex_values_index } /* fullcompositionexclusion= */, - { 1040, 9277, 8464, 4, 6, UNI_SC__KALI } /* sc=kayahli */, - { 1, 1417, 9203, 24, 2, UNI_CCC__34 } /* canonicalcombiningclass=34 */, - { 29, 3836, 6181, 17, 12, UNI_GONG } /* scriptextensions=gunjalagondi */, - { 0, 3151, 1, 18, 1, -UNI_EPRES } /* emojipresentation=n */, - { 45, 5791, 6373, 13, 12, UNI_JG__MANICHAEANPE } /* joininggroup=manichaeanpe */, - { 0, 2224, 8611, 3, 6, UNI_INSIDDHAM } /* insiddham */, - { 24, 6061, 1, 12, 1, -UNI_BIDIC } /* bidicontrol=n */, - { 4, 184, 6505, 2, 12, UNI_PHAISTOS } /* isphaistosdisc */, - { 0, 5986, 9405, 13, 3, UNI_NV__3_SLASH_2 } /* numericvalue=3/2 */, - { 0, 1552, 4568, 9, 14, UNI_SC } /* category=currencysymbol */, - { 80, 10333, 9789, 3, 3, UNI_SHRD } /* isshrd */, - { 3, 9275, 3615, 5, 17, UNI_INSC__CONSONANTPREFIXED } /* insc=consonantprefixed */, - { 0, 9508, 7930, 4, 2, UNI_CCC__14 } /* ccc=14 */, - { 0, 9277, 6409, 3, 12, UNI_MEND } /* sc=mendekikakui */, - { 33, 9277, 9576, 3, 4, UNI_SC__GURU } /* sc=guru */, - { 0, 4916, 4929, 3, 7, UNI_TAMILSUP } /* istamilsup */, - { 18, 9488, 3938, 5, 10, UNI_BOPOMOFOEXT } /* blk=bopomofoext */, - { 19, 184, 2608, 2, 4, UNI_BRAH } /* isbrah */, - { 1, 9488, 8900, 4, 6, UNI_INKAITHI } /* blk=kaithi */, - { 0, 5791, 6950, 13, 11, UNI_JG__STRAIGHTWAW } /* joininggroup=straightwaw */, - { 16, 9262, 1867, 3, 5, UNI_SB__UP } /* sb=upper */, - { 2, 4916, 8667, 3, 6, UNI_TIRH } /* istirhuta */, - { 3, 8267, 9255, 8, 5, -UNI_RADICAL } /* radical=false */, - { 2185, 9488, 4129, 4, 6, UNI_LATIN1 } /* blk=latin1 */, - { 986, 184, 2099, 3, 20, UNI_CJKCOMPATFORMS } /* iscjkcompatibilityforms */, - { 680, 3901, 8181, 4, 6, UNI_INGURMUKHI } /* ingurmukhi */, - { 1185, 
1188, 8584, 3, 3, UNI_TAGS } /* intags */, - { 242, 9768, 8604, 5, 6, UNI_SHAW } /* scx=shavian */, - { 0, 184, 3576, 3, 2, UNI_CWL } /* iscwl */, - { 0, 1417, 9925, 24, 3, UNI_CCC__BL } /* canonicalcombiningclass=218 */, - { 436, 3836, 6385, 17, 12, UNI_GONM } /* scriptextensions=masaramgondi */, - { 0, 184, 9568, 2, 4, UNI_GREK } /* isgrek */, - { 6, 4542, 4051, 4, 9, UNI_GEORGIANEXT } /* ingeorgianext */, - { 0, 3836, 9032, 17, 6, UNI_WCHO } /* scriptextensions=wancho */, - { 0, 4688, 8972, 15, 6, UNI_IDENTIFIERTYPE__NOTXID } /* identifiertype=notxid */, - { 1, 9520, 10135, 4, 3, UNI_CWL } /* cwl=yes */, - { 232, 184, 1823, 2, 5, UNI_XPOSIXLOWER } /* islower */, - { 2, 184, 6265, 2, 12, UNI_NL } /* isletternumber */, - { 462, 9508, 9952, 4, 3, UNI_CCC__IS } /* ccc=240 */, - { 133, 3836, 8470, 17, 7, UNI_LINA } /* scriptextensions=lineara */, - { 164, 9716, 9255, 4, 5, -UNI_PCM } /* pcm=false */, - { 1876, 10333, 1537, 3, 3, UNI_SIND } /* issind */, - { 0, 9508, 8805, 5, 4, UNI_CCC__11 } /* ccc=ccc11 */, - { 3, 8589, 4478, 7, 7, UNI_BRAI } /* script=braille */, - { 17, 9508, 8819, 4, 3, UNI_CCC__129 } /* ccc=129 */, - { 1, 3349, 0, 18, 0, UNI_ZP } /* paragraphseparator */, - { 2098, 8780, 4385, 6, 6, UNI_INTANGUT } /* block=tangut */, - { 0, 10027, 10021, 3, 3, UNI_JG__GAF } /* jg=gaf */, - { 0, 7218, 5999, 10, 13, UNI_LB__PR } /* linebreak=prefixnumeric */, - { 49, 1417, 9111, 25, 4, UNI_CCC__16 } /* canonicalcombiningclass=ccc16 */, - { 45, 2779, 1025, 19, 2, -UNI_IDST } /* idstrinaryoperator=no */, - { 0, 5324, 5949, 4, 11, UNI_MAYANNUMERALS } /* inmayannumerals */, - { 216, 7218, 1465, 10, 13, UNI_LB__CM } /* linebreak=combiningmark */, - { 1408, 4337, 0, 16, 0, UNI_SUPMATHOPERATORS } /* supmathoperators */, - { 0, 1552, 2349, 9, 20, UNI_PC } /* category=connectorpunctuation */, - { 0, 8930, 36, 6, 1, UNI_XPOSIXLOWER } /* lower=t */, - { 0, 5578, 751, 14, 5, UNI_SB__CL } /* sentencebreak=close */, - { 0, 5791, 0, 13, 0, UNI_jg_values_index } /* joininggroup= 
*/, - { 8, 184, 2912, 2, 12, UNI_SUNDANESESUP } /* issundanesesup */, - { 1363, 5494, 0, 14, 0, UNI_MN } /* nonspacingmark */, - { 0, 9488, 8491, 4, 7, UNI_INMARCHEN } /* blk=marchen */, - { 0, 3836, 6973, 18, 3, UNI_SYLO } /* scriptextensions=sylo */, - { 0, 7388, 0, 10, 0, UNI_SUPARROWSB } /* suparrowsb */, - { 927, 9768, 9756, 4, 4, UNI_RUNR } /* scx=runr */, - { 0, 3151, 9255, 18, 5, -UNI_EPRES } /* emojipresentation=false */, - { 0, 6420, 8562, 3, 6, UNI_INOSMANYA } /* inosmanya */, - { 5, 9488, 1006, 4, 17, UNI_ANCIENTGREEKMUSIC } /* blk=ancientgreekmusic */, - { 0, 9556, 10015, 4, 3, UNI_WB__EB } /* gcb=ebg */, - { 0, 8780, 867, 6, 18, UNI_PHONETICEXT } /* block=phoneticextensions */, - { 0, 3836, 9644, 17, 4, UNI_MEDF } /* scriptextensions=medf */, - { 0, 5986, 7931, 13, 8, UNI_NV__5_SLASH_12 } /* numericvalue=4.17e-01 */, - { 0, 9275, 728, 5, 6, UNI_INSC__NUMBER } /* insc=number */, - { 1, 5986, 8720, 13, 5, UNI_NV__40000 } /* numericvalue=40000 */, - { 769, 5791, 5934, 13, 13, UNI_JG__MANICHAEANWAW } /* joininggroup=manichaeanwaw */, - { 2308, 3836, 5003, 17, 15, UNI_ZANB } /* scriptextensions=zanabazarsquare */, - { 10, 2784, 1371, 4, 22, UNI_ARABICPFA } /* inarabicpresentationformsa */, - { 0, 9492, 1, 4, 1, UNI_BPT__N } /* bpt=n */, - { 1, 9780, 0, 4, 0, UNI_SHAW } /* shaw */, - { 40, 7076, 1586, 3, 13, UNI_BYZANTINEMUSIC } /* inbyzantinemusic */, - { 0, 9488, 9096, 5, 4, UNI_INBUHID } /* blk=buhid */, - { 1364, 8589, 2560, 7, 4, UNI_SC__MAND } /* script=mand */, - { 541, 2280, 7668, 4, 7, UNI_ORKH } /* isoldturkic */, - { 11, 10048, 9372, 3, 3, UNI_NV__1_SLASH_4 } /* nv=1/4 */, - { 0, 3836, 9608, 17, 4, UNI_KITS } /* scriptextensions=kits */, - { 1, 9277, 7651, 3, 4, UNI_ITAL } /* sc=ital */, - { 0, 8780, 8171, 6, 8, UNI_INGUJARATI } /* block=gujarati */, - { 4, 10027, 4763, 3, 15, UNI_JG__MANICHAEANSADHE } /* jg=manichaeansadhe */, - { 2560, 8780, 3421, 6, 18, UNI_RUMI } /* block=ruminumeralsymbols */, - { 691, 10027, 5918, 3, 3, UNI_JG__TAW } /* 
jg=taw */, - { 1, 10024, 5040, 3, 5, UNI_XPOSIXDIGIT } /* gc=digit */, - { 0, 8780, 1922, 6, 22, UNI_DIACRITICALSFORSYMBOLS } /* block=diacriticalsforsymbols */, - { 7, 9768, 9460, 4, 4, UNI_ARMI } /* scx=armi */, - { 0, 9768, 2329, 4, 20, UNI_HLUW } /* scx=anatolianhieroglyphs */, - { 786, 1552, 5726, 9, 13, UNI_ME } /* category=enclosingmark */, - { 5, 8267, 3, 8, 1, -UNI_RADICAL } /* radical=f */, - { 3779, 8780, 1369, 6, 24, UNI_ARABICPFA } /* block=arabicpresentationformsa */, - { 0, 7438, 400, 10, 6, UNI_WB__FO } /* wordbreak=format */, - { 1028, 7218, 1527, 10, 9, UNI_LB__SG } /* linebreak=surrogate */, - { 0, 9768, 9656, 4, 4, UNI_MIAO } /* scx=miao */, - { 0, 9277, 9285, 3, 4, UNI_SC__LIMB } /* sc=limb */, - { 21, 9444, 10105, 4, 3, UNI_AGE__6 } /* age=v60 */, - { 0, 4448, 0, 15, 0, UNI_BAMUMSUP } /* bamumsupplement */, - { 404, 184, 9245, 2, 5, UNI_DOGR } /* isdogra */, - { 0, 3169, 0, 11, 0, UNI_ETHIOPICSUP } /* ethiopicsup */, - { 833, 184, 4448, 2, 15, UNI_BAMUMSUP } /* isbamumsupplement */, - { 0, 9488, 2722, 4, 10, UNI_JAMO } /* blk=hanguljamo */, - { 11, 9696, 0, 4, 0, UNI_OGAM } /* ogam */, - { 1713, 8589, 9335, 7, 4, UNI_SC__TAKR } /* script=takr */, - { 5, 10060, 9836, 3, 4, UNI_RI } /* ri=true */, - { 0, 8780, 7068, 6, 10, UNI_ASCII } /* block=basiclatin */, - { 16, 9796, 0, 4, 0, UNI_SYRC } /* syrc */, - { 1097, 6576, 1, 11, 1, -UNI_XPOSIXALPHA } /* alphabetic=n */, - { 0, 4033, 10168, 16, 2, UNI_CASEDLETTER } /* generalcategory=l& */, - { 0, 7076, 3938, 3, 7, UNI_INBOPOMOFO } /* inbopomofo */, - { 0, 8780, 3796, 7, 3, UNI_INCHAM } /* block=cham */, - { 18, 184, 6884, 2, 11, UNI_HMNG } /* ispahawhhmong */, - { 1061, 8147, 1, 8, 1, -UNI_EXTPICT } /* extpict=n */, - { 1898, 10296, 472, 3, 2, UNI_PUA } /* ispua */, - { 1, 9786, 1702, 4, 21, UNI_SHORTHANDFORMATCONTROLS } /* inshorthandformatcontrols */, - { 1921, 8780, 1442, 7, 23, UNI_CJKSYMBOLS } /* block=cjksymbolsandpunctuation */, - { 5, 4808, 0, 15, 0, UNI_MISCPICTOGRAPHS } /* miscpictographs 
*/, - { 0, 1966, 1244, 22, 25, UNI_INSC__CONSONANTINITIALPOSTFIXED } /* indicsyllabiccategory=consonantinitialpostfixed */, - { 576, 5986, 8756, 13, 4, UNI_NV__9000 } /* numericvalue=9000 */, - { 2, 8780, 8380, 7, 6, UNI_CJKEXTE } /* block=cjkexte */, - { 0, 9488, 316, 4, 33, UNI_SUPMATHOPERATORS } /* blk=supplementalmathematicaloperators */, - { 243, 9488, 659, 4, 30, UNI_CJKEXTF } /* blk=cjkunifiedideographsextensionf */, - { 0, 184, 9664, 2, 4, UNI_MRO } /* ismroo */, - { 0, 9488, 3439, 4, 12, UNI_SMALLKANAEXT } /* blk=smallkanaext */, - { 184, 184, 6253, 2, 12, UNI_KHMERSYMBOLS } /* iskhmersymbols */, - { 476, 3836, 7278, 17, 10, UNI_XPEO } /* scriptextensions=oldpersian */, - { 0, 8666, 0, 4, 0, UNI_TIRH } /* tirh */, - { 224, 184, 2409, 2, 20, UNI_GLAGOLITICSUP } /* isglagoliticsupplement */, - { 626, 8589, 5284, 7, 4, UNI_LISU } /* script=lisu */, - { 20, 2280, 1061, 3, 26, UNI_OCR } /* isopticalcharacterrecognition */, - { 568, 9277, 8299, 3, 8, UNI_TFNG } /* sc=tifinagh */, - { 0, 6205, 10135, 12, 3, UNI_IDEO } /* ideographic=yes */, - { 0, 5713, 0, 13, 0, UNI_XPOSIXDIGIT } /* decimalnumber */, - { 0, 21, 7576, 2, 9, UNI_LATINEXTB } /* inlatinextb */, - { 3194, 10048, 8720, 3, 2, UNI_NV__40 } /* nv=40 */, - { 0, 5791, 5921, 13, 13, UNI_JG__MANICHAEANTEN } /* joininggroup=manichaeanten */, - { 4, 6231, 4560, 9, 8, UNI_CONTROLPICTURES } /* incontrolpictures */, - { 1284, 8768, 10135, 6, 3, UNI_BIDIC } /* bidic=yes */, - { 3068, 2268, 0, 2, 0, UNI_PD } /* pd */, - { 0, 6553, 1025, 12, 2, -UNI_XIDC } /* xidcontinue=no */, - { 14, 184, 132, 2, 2, UNI_LM } /* islm */, - { 8, 8589, 6481, 7, 12, UNI_HUNG } /* script=oldhungarian */, - { 0, 10132, 7612, 3, 6, UNI_WB__MN } /* wb=midnum */, - { 0, 4033, 6035, 16, 2, UNI_PF } /* generalcategory=pf */, - { 4, 9520, 26, 4, 1, UNI_CWL } /* cwl=y */, - { 1, 5986, 7469, 13, 1, UNI_NV__5 } /* numericvalue=5 */, - { 0, 9488, 4449, 5, 14, UNI_BAMUMSUP } /* blk=bamumsupplement */, - { 4, 8780, 908, 6, 14, UNI_PUA } /* 
block=privateusearea */, - { 2707, 8694, 1, 7, 1, -UNI_XPOSIXSPACE } /* wspace=n */, - { 292, 3683, 0, 17, 0, UNI_ETHIOPICEXTA } /* ethiopicextendeda */, - { 0, 9768, 8680, 4, 7, UNI_ZZZZ } /* scx=unknown */, - { 323, 4791, 2062, 3, 14, UNI_MODIFIERLETTERS } /* inmodifierletters */, - { 20, 7028, 7028, 3, 10, UNI_YISYLLABLES } /* isyisyllables */, - { 1, 9624, 0, 3, 0, UNI_LAO } /* lao */, - { 2, 8870, 9255, 6, 5, -UNI_EPRES } /* epres=false */, - { 529, 3836, 7694, 18, 8, UNI_SAMR } /* scriptextensions=samaritan */, - { 3055, 9444, 9979, 4, 3, UNI_AGE__6_DOT_1 } /* age=6.1 */, - { 3202, 10012, 7486, 3, 9, UNI_EA__A } /* ea=ambiguous */, - { 0, 1417, 9208, 24, 2, UNI_CCC__35 } /* canonicalcombiningclass=35 */, - { 1, 184, 9688, 2, 3, UNI_NKO } /* isnko */, - { 0, 9350, 10135, 5, 3, UNI_XIDS } /* xids=yes */, - { 161, 7418, 9836, 10, 4, UNI_XPOSIXUPPER } /* uppercase=true */, - { 0, 1552, 47, 10, 1, UNI_SM } /* category=sm */, - { 0, 9277, 9568, 3, 4, UNI_SC__GREK } /* sc=grek */, - { 0, 8589, 6193, 7, 6, UNI_HEBR } /* script=hebrew */, - { 3120, 184, 5550, 2, 14, UNI_PHLP } /* ispsalterpahlavi */, - { 1046, 7155, 6321, 3, 3, UNI_HMNG } /* ishmng */, - { 0, 8984, 26, 6, 1, UNI_QMARK } /* qmark=y */, - { 73, 1218, 0, 8, 0, UNI_KANA } /* katakana */, - { 0, 8589, 8344, 7, 4, UNI_SC__BENG } /* script=beng */, - { 1289, 7, 0, 18, 0, UNI_CANS } /* canadianaboriginal */, - { 1836, 1591, 3170, 3, 17, UNI_ETHIOPICSUP } /* inethiopicsupplement */, - { 3201, 5032, 10135, 14, 3, UNI_POSIXXDIGIT } /* asciihexdigit=yes */, - { 7, 8449, 1025, 7, 2, -UNI_HYPHEN } /* hyphen=no */, - { 136, 9488, 1911, 4, 11, UNI_NUMBERFORMS } /* blk=numberforms */, - { 1674, 9508, 7933, 4, 2, UNI_CCC__17 } /* ccc=17 */, - { 0, 8512, 47, 7, 1, UNI_NFCQC__M } /* nfkcqc=m */, - { 139, 9786, 8605, 4, 5, UNI_SHAW } /* inshavian */, - { 0, 6420, 7658, 3, 8, UNI_INOLDPERMIC } /* inoldpermic */, - { 0, 1654, 0, 6, 0, UNI_HANG } /* hangul */, - { 0, 5578, 0, 16, 0, UNI_SB__SP } /* sentencebreak=sp */, - { 
332, 4033, 1025, 16, 2, UNI_NO } /* generalcategory=no */, - { 2690, 1417, 9218, 24, 2, UNI_CCC__84 } /* canonicalcombiningclass=84 */, - { 0, 1189, 11, 3, 2, UNI_NT__DI } /* nt=di */, - { 12, 7218, 1140, 10, 26, UNI_LB__CJ } /* linebreak=conditionaljapanesestarter */, - { 3801, 6241, 6994, 12, 11, UNI_JT__T } /* joiningtype=transparent */, - { 0, 8688, 3548, 3, 9, UNI_ALCHEMICAL } /* isalchemical */, - { 816, 6554, 1025, 11, 2, -UNI_IDC } /* idcontinue=no */, - { 1, 10176, 0, 2, 0, UNI_ZL } /* zl */, - { 24, 9250, 0, 6, 0, -UNI_EMOD } /* emod=f */, - { 0, 1790, 9255, 22, 5, -UNI_CWCM } /* changeswhencasemapped=false */, - { 2428, 10027, 9744, 3, 4, UNI_JG__QAPH } /* jg=qaph */, - { 1, 3853, 26, 17, 1, UNI_STERM } /* sentenceterminal=y */, - { 2398, 4542, 3243, 4, 6, UNI_INGEORGIAN } /* ingeorgian */, - { 531, 184, 9676, 2, 4, UNI_NARB } /* isnarb */, - { 12, 8780, 7693, 6, 9, UNI_INSAMARITAN } /* block=samaritan */, - { 5, 1417, 8805, 25, 4, UNI_CCC__11 } /* canonicalcombiningclass=ccc11 */, - { 0, 9488, 4369, 4, 9, UNI_SYRIACSUP } /* blk=syriacsup */, - { 4367, 8780, 5752, 6, 8, UNI_GREEKEXT } /* block=greekext */, - { 0, 1537, 1924, 4, 20, UNI_DIACRITICALSFORSYMBOLS } /* indiacriticalsforsymbols */, - { 0, 3836, 8561, 17, 4, UNI_OSMA } /* scriptextensions=osma */, - { 3590, 9508, 8811, 5, 4, UNI_CCC__12 } /* ccc=ccc12 */, - { 7694, 509, 0, 30, 0, UNI_CJKEXTA } /* cjkunifiedideographsextensiona */, - { 0, 8780, 6277, 6, 12, UNI_MAHJONG } /* block=mahjongtiles */, - { 4, 5986, 5648, 13, 4, UNI_NV__1000 } /* numericvalue=1000 */, - { 0, 2280, 4870, 4, 13, UNI_NARB } /* isoldnortharabian */, - { 7122, 8780, 3751, 6, 17, UNI_INKHITANSMALLSCRIPT } /* block=khitansmallscript */, - { 5, 9277, 8219, 3, 4, UNI_SC__JAVA } /* sc=java */ + { 1, 8782, 2584, 7, 4, UNI_SC__MAND } /* script=mand */, + { 0, 9691, 2936, 4, 12, UNI_SUNDANESESUP } /* blk=sundanesesup */, + { 2, 1990, 2393, 22, 20, UNI_INSC__CONSONANTPLACEHOLDER } /* indicsyllabiccategory=consonantplaceholder */, + { 
0, 9647, 7934, 4, 1, UNI_AGE__2 } /* age=2 */, + { 0, 2248, 2937, 3, 11, UNI_SUNDANESESUP } /* insundanesesup */, + { 0, 2206, 3409, 21, 17, UNI_RI } /* graphemeclusterbreak=regionalindicator */, + { 0, 10253, 4010, 3, 16, UNI_LB__CP } /* lb=closeparenthesis */, + { 0, 3877, 7700, 17, 9, UNI_QAAI } /* scriptextensions=inherited */, + { 0, 9747, 10355, 4, 3, UNI_DIA } /* dia=yes */, + { 1, 2312, 1657, 4, 4, UNI_INHANGUL } /* inhangul */, + { 2, 185, 479, 2, 31, UNI_MATHALPHANUM } /* ismathematicalalphanumericsymbols */, + { 11, 7104, 0, 11, 0, UNI_SYLO } /* sylotinagri */, + { 0, 9979, 7781, 4, 9, UNI_NBAT } /* scx=nabataean */, + { 0, 3121, 5068, 18, 6, UNI_DT__SQR } /* decompositiontype=square */, + { 0, 10253, 18, 3, 2, UNI_RI } /* lb=ri */, + { 8, 4157, 7701, 3, 8, UNI_QAAI } /* isinherited */, + { 1, 9691, 7381, 4, 2, UNI_INVS } /* blk=vs */, + { 0, 10250, 7, 3, 1, UNI_JT__C } /* jt=c */, + { 1, 10268, 8046, 3, 2, UNI_NV__13 } /* nv=13 */, + { 3, 2248, 8825, 3, 6, UNI_SUPPUAB } /* insuppuab */, + { 0, 8973, 7673, 6, 9, UNI_EMOTICONS } /* block=emoticons */, + { 3, 9504, 0, 5, 0, UNI_NSHU } /* nushu */, + { 3, 3448, 1, 3, 42, UNI_UCASEXTA } /* inunifiedcanadianaboriginalsyllabicsextendeda */, + { 0, 10268, 7958, 3, 2, UNI_NV__50 } /* nv=50 */, + { 0, 8973, 9534, 6, 5, UNI_INTAKRI } /* block=takri */, + { 1, 7230, 4362, 10, 16, UNI_BC__S } /* bidiclass=segmentseparator */, + { 3, 2003, 10391, 10, 1, UNI_CASEDLETTER } /* category=l_ */, + { 3, 9476, 6518, 3, 4, UNI_MEND } /* sc=mend */, + { 4, 9476, 2302, 4, 3, UNI_SC__KALI } /* sc=kali */, + { 0, 43, 0, 16, 0, UNI_CJKCOMPAT } /* cjkcompatibility */, + { 2, 8782, 2433, 7, 10, UNI_SC__GLAG } /* script=glagolitic */, + { 2, 3403, 0, 5, 0, UNI_XPOSIXSPACE } /* space */, + { 0, 4847, 394, 3, 2, UNI_INMRO } /* inmro */, + { 6, 8500, 0, 4, 0, UNI_UGAR } /* ugar */, + { 7, 7360, 4594, 10, 15, UNI_LB__CB } /* linebreak=contingentbreak */, + { 1, 9476, 79, 3, 4, UNI_SC__ARAB } /* sc=arab */, + { 3, 3121, 0, 18, 0, 
UNI_dt_values_index } /* decompositiontype= */, + { 1, 9979, 9687, 4, 4, UNI_BHKS } /* scx=bhks */, + { 6, 4410, 0, 6, 0, UNI_SYRC } /* syriac */, + { 2, 6083, 8943, 13, 3, UNI_NV__800 } /* numericvalue=800 */, + { 0, 185, 1288, 2, 2, UNI_UPPERCASELETTER } /* islu */, + { 9, 1270, 1026, 25, 2, -UNI_COMPEX } /* fullcompositionexclusion=no */, + { 1, 185, 1295, 2, 25, UNI_SUPERANDSUB } /* issuperscriptsandsubscripts */, + { 4, 8782, 8670, 7, 4, UNI_MAKA } /* script=maka */, + { 0, 2206, 4401, 21, 9, UNI_WB__EB } /* graphemeclusterbreak=emodifier */, + { 1, 1538, 4656, 4, 13, UNI_DIACRITICALSEXT } /* indiacriticalsext */, + { 4, 9691, 350, 4, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* blk=supplementalsymbolsandpictographs */, + { 4, 8284, 0, 4, 0, UNI_BASS } /* bass */, + { 0, 6083, 8076, 13, 8, UNI_NV__3_SLASH_8 } /* numericvalue=3.75e-01 */, + { 0, 5758, 0, 5, 0, UNI_BIDIM } /* bidim */, + { 4, 9763, 5717, 4, 2, UNI_LB__H2 } /* gcb=lv */, + { 3, 5550, 0, 16, 0, UNI_DT__CAN } /* nfdquickcheck=no */, + { 1, 4074, 9048, 16, 2, UNI_CF } /* generalcategory=cf */, + { 2, 600, 0, 30, 0, UNI_CJKEXTD } /* cjkunifiedideographsextensiond */, + { 1, 10268, 10358, 3, 2, UNI_NV__38 } /* nv=38 */, + { 0, 4534, 0, 7, 0, UNI_BRAI } /* braille */, + { 0, 7360, 0, 10, 0, UNI_lb_values_index } /* linebreak= */, + { 1, 3403, 10403, 5, 4, UNI_XPOSIXSPACE } /* spaceperl */, + { 6, 9691, 4939, 4, 15, UNI_SARB } /* blk=oldsoutharabian */, + { 0, 8530, 0, 7, 0, UNI_AVST } /* avestan */, + { 0, 9979, 9807, 4, 4, UNI_KALI } /* scx=kali */, + { 1, 9979, 9935, 4, 4, UNI_PHNX } /* scx=phnx */, + { 1, 3894, 0, 16, 0, UNI_STERM } /* sentenceterminal */, + { 4, 5368, 0, 14, 0, UNI_LISUSUP } /* lisusupplement */, + { 0, 9711, 8091, 4, 2, UNI_CCC__24 } /* ccc=24 */, + { 0, 3877, 3103, 17, 4, UNI_COPT } /* scriptextensions=copt */, + { 4, 8881, 9644, 3, 3, UNI_ADLM } /* isadlm */, + { 0, 5662, 496, 14, 7, UNI_SB__NU } /* sentencebreak=numeric */, + { 1, 7682, 26, 9, 1, UNI_EXT } /* extender=y */, + { 0, 
6083, 8907, 13, 4, UNI_NV__3000 } /* numericvalue=3000 */, + { 4, 9476, 9939, 3, 4, UNI_MIAO } /* sc=plrd */, + { 0, 7460, 7983, 10, 1, UNI_IN__7 } /* presentin=7 */, + { 0, 1115, 0, 25, 0, UNI_CWKCF } /* changeswhennfkccasefolded */, + { 1, 10253, 3403, 3, 5, UNI_LB__SP } /* lb=space */, + { 2, 8973, 9895, 6, 3, UNI_INNKO } /* block=nko */, + { 1, 9711, 6763, 4, 11, UNI_CCC__DA } /* ccc=doubleabove */, + { 0, 9979, 7817, 4, 9, UNI_PERM } /* scx=oldpermic */, + { 0, 10253, 43, 3, 2, UNI_LB__CJ } /* lb=cj */, + { 4, 7218, 2633, 3, 5, UNI_INBRAHMI } /* inbrahmi */, + { 0, 10244, 133, 3, 2, UNI_LM } /* gc=lm */, + { 4, 1060, 0, 2, 0, UNI_SO } /* so */, + { 1, 8973, 184, 6, 34, UNI_MISCPICTOGRAPHS } /* block=miscellaneoussymbolsandpictographs */, + { 3, 9979, 7853, 4, 4, UNI_PAUC } /* scx=pauc */, + { 0, 2248, 2956, 3, 18, UNI_SUPARROWSA } /* insupplementalarrowsa */, + { 7, 9123, 26, 6, 1, UNI_XPOSIXLOWER } /* lower=y */, + { 0, 9444, 0, 4, 0, UNI_DOGR } /* dogr */, + { 1, 2164, 0, 18, 0, UNI_CYRILLICSUP } /* cyrillicsupplement */, + { 1, 1770, 753, 23, 4, UNI_BPT__C } /* bidipairedbrackettype=close */, + { 0, 6083, 8907, 13, 6, UNI_NV__300000 } /* numericvalue=300000 */, + { 0, 9691, 6386, 4, 7, UNI_MAHJONG } /* blk=mahjong */, + { 5, 185, 3600, 3, 2, UNI_CWL } /* iscwl */, + { 8, 1592, 3725, 3, 16, UNI_ETHIOPICEXTB } /* inethiopicextendedb */, + { 6, 9979, 7260, 4, 10, UNI_CHRS } /* scx=chorasmian */, + { 3, 9979, 9943, 4, 4, UNI_PRTI } /* scx=prti */, + { 0, 2493, 0, 20, 0, UNI_HMNP } /* nyiakengpuachuehmong */, + { 2, 6109, 0, 13, 0, UNI_VERTICALFORMS } /* verticalforms */, + { 12, 10402, 9172, 7, 4, UNI__PERL_PATWS } /* _perl_patws */, + { 16, 8973, 5862, 6, 13, UNI_IPAEXT } /* block=ipaextensions */, + { 0, 6674, 0, 11, 0, UNI_XIDC } /* xidcontinue */, + { 5, 185, 9063, 2, 5, UNI_EPRES } /* isepres */, + { 8, 2304, 6984, 3, 10, UNI_LO } /* isotherletter */, + { 0, 185, 7530, 2, 10, UNI_SUPARROWSB } /* issuparrowsb */, + { 0, 9459, 9454, 5, 5, -UNI_IDSB } /* 
idsb=false */, + { 1, 185, 5270, 2, 14, UNI_KANGXI } /* iskangxiradicals */, + { 0, 9691, 5690, 4, 14, UNI_SUPPUNCTUATION } /* blk=suppunctuation */, + { 2, 10268, 7940, 3, 8, UNI_NV__1_SLASH_80 } /* nv=1.25e-02 */, + { 4, 8782, 383, 7, 4, UNI_EGYP } /* script=egyp */, + { 1, 7580, 7049, 10, 11, UNI_WB__SQ } /* wordbreak=singlequote */, + { 5, 9763, 24, 4, 1, UNI_GCB__L } /* gcb=l */, + { 3, 9979, 9715, 4, 4, UNI_CHRS } /* scx=chrs */, + { 1, 185, 9951, 2, 4, UNI_QAAI } /* isqaai */, + { 0, 21, 5270, 2, 14, UNI_KANGXI } /* inkangxiradicals */, + { 1, 8973, 2100, 6, 22, UNI_TRANSPORTANDMAP } /* block=transportandmapsymbols */, + { 6, 10253, 6807, 3, 11, UNI_LB__EX } /* lb=exclamation */, + { 0, 9691, 8356, 4, 8, UNI_INHIRAGANA } /* blk=hiragana */, + { 4, 185, 9831, 2, 3, UNI_LAO } /* islao */, + { 1, 8973, 4282, 6, 16, UNI_MISCMATHSYMBOLSA } /* block=miscmathsymbolsa */, + { 6, 6674, 1026, 12, 2, -UNI_XIDC } /* xidcontinue=no */, + { 0, 7218, 3979, 3, 15, UNI_BOPOMOFOEXT } /* inbopomofoextended */, + { 2, 8973, 10271, 6, 3, UNI_OCR } /* block=ocr */, + { 1, 8973, 2632, 6, 6, UNI_INBRAHMI } /* block=brahmi */, + { 2, 9979, 8468, 4, 8, UNI_TAGB } /* scx=tagbanwa */, + { 0, 9691, 43, 4, 16, UNI_CJKCOMPAT } /* blk=cjkcompatibility */, + { 10, 9476, 3139, 3, 10, UNI_SC__DEVA } /* sc=devanagari */, + { 1, 9469, 3499, 5, 10, UNI_INPC__TOPANDLEFT } /* inpc=topandleft */, + { 4, 1553, 4346, 9, 16, UNI_PO } /* category=otherpunctuation */, + { 0, 5662, 752, 14, 2, UNI_SB__CL } /* sentencebreak=cl */, + { 0, 8768, 9454, 7, 5, -UNI_PATSYN } /* patsyn=false */, + { 1, 185, 2146, 2, 7, UNI_RADICAL } /* isradical */, + { 1, 9997, 1703, 4, 21, UNI_SHORTHANDFORMATCONTROLS } /* inshorthandformatcontrols */, + { 0, 10352, 6785, 3, 11, UNI_WB__DQ } /* wb=doublequote */, + { 2, 8782, 9105, 7, 4, UNI_SC__KHOJ } /* script=khoj */, + { 2, 8789, 0, 7, 0, UNI_SHRD } /* sharada */, + { 4, 9647, 10322, 4, 3, UNI_AGE__5_DOT_2 } /* age=v52 */, + { 0, 9691, 8621, 4, 7, UNI_INGRANTHA } /* 
blk=grantha */, + { 0, 2085, 0, 15, 0, UNI_MODIFIERLETTERS } /* modifierletters */, + { 0, 5875, 10107, 13, 4, UNI_JG__ZAIN } /* joininggroup=zain */, + { 2, 9979, 3193, 4, 8, UNI_ETHI } /* scx=ethiopic */, + { 16, 8607, 0, 7, 0, UNI_ELBA } /* elbasan */, + { 1, 10247, 9243, 3, 4, UNI_JG__YUDH } /* jg=yudh */, + { 0, 8973, 631, 7, 29, UNI_CJKEXTE } /* block=cjkunifiedideographsextensione */, + { 0, 10268, 8920, 3, 2, UNI_NV__32 } /* nv=32 */, + { 0, 7908, 1, 8, 1, -UNI_IDS } /* idstart=n */, + { 0, 9691, 7754, 4, 9, UNI_LATINEXTG } /* blk=latinextg */, + { 26, 7297, 1515, 3, 23, UNI_HIGHPUSURROGATES } /* ishighprivateusesurrogates */, + { 1, 1115, 3, 26, 1, -UNI_CWKCF } /* changeswhennfkccasefolded=f */, + { 1, 6675, 0, 11, 0, UNI_idc_values_index } /* idcontinue= */, + { 1, 8973, 6386, 6, 12, UNI_MAHJONG } /* block=mahjongtiles */, + { 0, 5875, 6434, 13, 12, UNI_JG__MALAYALAMNNA } /* joininggroup=malayalamnna */, + { 0, 3877, 6972, 17, 4, UNI_NAND } /* scriptextensions=nand */, + { 1, 10280, 26, 3, 1, UNI_RI } /* ri=y */, + { 1, 6340, 1468, 4, 22, UNI_DIACRITICALSFORSYMBOLS } /* incombiningmarksforsymbols */, + { 8, 9476, 9871, 3, 4, UNI_MRO } /* sc=mroo */, + { 1, 3877, 9843, 17, 4, UNI_LINB } /* scriptextensions=linb */, + { 0, 4282, 0, 16, 0, UNI_MISCMATHSYMBOLSA } /* miscmathsymbolsa */, + { 0, 8782, 7820, 7, 4, UNI_SC__PERM } /* script=perm */, + { 1, 7230, 24, 10, 1, UNI_BC__L } /* bidiclass=l */, + { 7, 9803, 7889, 4, 9, UNI_GCB__V } /* hst=voweljamo */, + { 1, 8817, 0, 7, 0, UNI_SUPPUAA } /* suppuaa */, + { 2, 4684, 3, 15, 1, UNI_EA__F } /* eastasianwidth=f */, + { 4, 8642, 1, 7, 1, -UNI_HYPHEN } /* hyphen=n */, + { 1, 10553, 7501, 3, 3, UNI_SAUR } /* issaur */, + { 1, 9795, 0, 4, 0, UNI_HMNG } /* hmng */, + { 1, 8782, 8811, 8, 6, UNI_SOYO } /* script=soyombo */, + { 6, 5116, 10355, 14, 3, UNI_CI } /* caseignorable=yes */, + { 0, 9476, 8775, 3, 7, UNI_SC__PHAG } /* sc=phagspa */, + { 0, 1858, 1026, 22, 2, -UNI_CWT } /* changeswhentitlecased=no */, + { 0, 
9979, 5059, 4, 15, UNI_ZANB } /* scx=zanabazarsquare */, + { 1, 6340, 511, 3, 29, UNI_CJKEXTA } /* incjkunifiedideographsextensiona */, + { 6, 1538, 6753, 3, 10, UNI_DOMINO } /* indominotiles */, + { 4, 9459, 10055, 5, 4, UNI_IDSB } /* idsb=true */, + { 1, 9979, 79, 4, 4, UNI_ARAB } /* scx=arab */, + { 0, 1836, 3, 22, 1, -UNI_CWL } /* changeswhenlowercased=f */, + { 1, 5875, 5235, 13, 7, UNI_JG__HEHGOAL } /* joininggroup=hehgoal */, + { 1, 6314, 1, 12, 1, -UNI_IDEO } /* ideographic=n */, + { 0, 2012, 9454, 22, 5, -UNI_LOE } /* logicalorderexception=false */, + { 1, 9214, 26, 5, 1, UNI_IDEO } /* ideo=y */, + { 1, 8973, 8754, 6, 7, UNI_INOSMANYA } /* block=osmanya */, + { 3, 1553, 4999, 9, 15, UNI_TITLE } /* category=titlecaseletter */, + { 16, 1270, 10355, 25, 3, UNI_COMPEX } /* fullcompositionexclusion=yes */, + { 1, 2808, 3964, 4, 14, UNI_ARABICSUP } /* inarabicsupplement */, + { 0, 4909, 0, 15, 0, UNI_nfkdqc_values_index } /* nfkdquickcheck= */, + { 0, 3877, 10087, 17, 4, UNI_WCHO } /* scriptextensions=wcho */, + { 0, 7360, 6278, 10, 4, UNI_LB__GL } /* linebreak=glue */, + { 0, 9691, 5901, 4, 13, UNI_KANAEXTB } /* blk=kanaextendedb */, + { 2, 9979, 9117, 4, 6, UNI_LEPC } /* scx=lepcha */, + { 11, 9476, 9835, 3, 4, UNI_SC__LATN } /* sc=latn */, + { 8, 5648, 0, 14, 0, UNI_qmark_values_index } /* quotationmark= */, + { 0, 9153, 0, 7, 0, UNI_COMPEX } /* nfcqc=n */, + { 5, 10253, 0, 3, 0, UNI_lb_values_index } /* lb= */, + { 0, 3877, 2708, 17, 19, UNI_EGYP } /* scriptextensions=egyptianhieroglyphs */, + { 5, 9647, 7990, 4, 1, UNI_AGE__8 } /* age=8 */, + { 3, 1274, 1, 21, 1, -UNI_CE } /* compositionexclusion=n */, + { 0, 3877, 10095, 17, 4, UNI_XPEO } /* scriptextensions=xpeo */, + { 1, 10508, 6675, 3, 10, UNI_XIDC } /* isxidcontinue */, + { 2, 9691, 447, 4, 32, UNI_IDEOGRAPHICSYMBOLS } /* blk=ideographicsymbolsandpunctuation */, + { 0, 10268, 8251, 3, 2, UNI_NV__19 } /* nv=19 */, + { 0, 8955, 10355, 6, 3, UNI_XPOSIXALPHA } /* alpha=yes */, + { 3, 10268, 9559, 3, 4, 
UNI_NV___MINUS_1_SLASH_2 } /* nv=-1/2 */, + { 6, 2632, 0, 6, 0, UNI_BRAH } /* brahmi */, + { 1, 10250, 6796, 3, 11, UNI_JT__D } /* jt=dualjoining */, + { 4, 10244, 2292, 3, 2, UNI_PD } /* gc=pd */, + { 3, 3877, 6924, 18, 3, UNI_SAMR } /* scriptextensions=samr */, + { 3, 9474, 7799, 5, 9, UNI_INSC__NONJOINER } /* insc=nonjoiner */, + { 0, 6674, 26, 12, 1, UNI_XIDC } /* xidcontinue=y */, + { 0, 21, 5298, 2, 14, UNI_LATINEXTC } /* inlatinextendedc */, + { 1, 7360, 1141, 10, 26, UNI_LB__CJ } /* linebreak=conditionaljapanesestarter */, + { 1, 1418, 9606, 24, 3, UNI_CCC__214 } /* canonicalcombiningclass=214 */, + { 0, 5875, 5452, 13, 14, UNI_JG__MANICHAEANKAPH } /* joininggroup=manichaeankaph */, + { 1, 6340, 7271, 3, 9, UNI_CJKSTROKES } /* incjkstrokes */, + { 1, 9763, 71, 4, 2, UNI_GCB__PP } /* gcb=pp */, + { 4, 9476, 494, 3, 3, UNI_SC__HAN } /* sc=han */, + { 3, 8973, 4426, 6, 16, UNI_TANGUTCOMPONENTS } /* block=tangutcomponents */, + { 10, 2879, 0, 19, 0, UNI_MONGOLIANSUP } /* mongoliansupplement */, + { 2, 5536, 0, 15, 0, UNI_COMPEX } /* nfcquickcheck=n */, + { 1, 10217, 32, 3, 2, UNI_BC__CS } /* bc=cs */, + { 0, 1418, 8119, 24, 1, UNI_CCC__9 } /* canonicalcombiningclass=9 */, + { 3, 8782, 6924, 8, 3, UNI_SAMR } /* script=samr */, + { 0, 7460, 9595, 10, 4, UNI_IN__12_DOT_1 } /* presentin=12.1 */, + { 5, 185, 5676, 2, 14, UNI_ZS } /* isspaceseparator */, + { 1, 9979, 8284, 4, 8, UNI_BASS } /* scx=bassavah */, + { 10, 10268, 7916, 3, 8, UNI_NV__1_SLASH_10 } /* nv=1.00e-01 */, + { 0, 8973, 7646, 6, 9, UNI_ARABICPFB } /* block=arabicpfb */, + { 0, 185, 2690, 3, 18, UNI_COUNTINGROD } /* iscountingrodnumerals */, + { 4, 114, 0, 25, 0, UNI_DIACRITICALS } /* combiningdiacriticalmarks */, + { 0, 3877, 6590, 17, 12, UNI_HUNG } /* scriptextensions=oldhungarian */, + { 2, 3826, 0, 10, 0, UNI_MANI } /* manichaean */, + { 5, 3877, 8775, 17, 7, UNI_PHAG } /* scriptextensions=phagspa */, + { 3, 1880, 26, 22, 1, UNI_CWU } /* changeswhenuppercased=y */, + { 1, 9474, 6566, 5, 12, 
UNI_INSC__NUMBERJOINER } /* insc=numberjoiner */, + { 1, 8973, 9529, 6, 5, UNI_INTAILE } /* block=taile */, + { 3, 4157, 2804, 3, 17, UNI_IDST } /* isidstrinaryoperator */, + { 7, 8973, 868, 6, 28, UNI_PHONETICEXTSUP } /* block=phoneticextensionssupplement */, + { 1, 9691, 3979, 5, 15, UNI_BOPOMOFOEXT } /* blk=bopomofoextended */, + { 0, 1553, 2373, 9, 20, UNI_PC } /* category=connectorpunctuation */, + { 1, 5875, 4122, 13, 16, UNI_JG__HANIFIROHINGYAPA } /* joininggroup=hanifirohingyapa */, + { 0, 185, 5256, 2, 7, UNI_KANASUP } /* iskanasup */, + { 0, 2304, 6995, 3, 10, UNI_NO } /* isothernumber */, + { 19, 10470, 6677, 15, 8, UNI__PERL_CHARNAME_CONTINUE } /* _perl_charname_continue */, + { 8, 185, 9831, 2, 4, UNI_LAO } /* islaoo */, + { 0, 479, 0, 31, 0, UNI_MATHALPHANUM } /* mathematicalalphanumericsymbols */, + { 0, 5875, 5410, 13, 14, UNI_JG__MANICHAEANBETH } /* joininggroup=manichaeanbeth */, + { 3, 10244, 1067, 3, 2, UNI_CASEDLETTER } /* gc=lc */, + { 0, 6083, 8028, 13, 5, UNI_NV__20000 } /* numericvalue=20000 */, + { 0, 10244, 4346, 3, 16, UNI_PO } /* gc=otherpunctuation */, + { 2, 9691, 7200, 4, 10, UNI_ARABICEXTB } /* blk=arabicextb */, + { 0, 6350, 36, 12, 1, UNI_JT__T } /* joiningtype=t */, + { 5, 185, 2165, 3, 7, UNI_CYRL } /* iscyrillic */, + { 0, 10346, 410, 3, 2, UNI_VO__TR } /* vo=tr */, + { 4, 5312, 0, 14, 0, UNI_LATINEXTD } /* latinextendedd */, + { 2, 10244, 5096, 3, 5, UNI_XPOSIXDIGIT } /* gc=digit */, + { 0, 6083, 9627, 13, 4, UNI_NV__3_SLASH_64 } /* numericvalue=3/64 */, + { 0, 9727, 0, 4, 0, UNI_cwl_values_index } /* cwl= */, + { 0, 9763, 74, 4, 2, UNI_WB__EB } /* gcb=em */, + { 24, 9691, 1902, 4, 22, UNI_CJKCOMPATIDEOGRAPHSSUP } /* blk=cjkcompatideographssup */, + { 1, 10253, 989, 3, 2, UNI_LB__CP } /* lb=cp */, + { 0, 8973, 4984, 6, 15, UNI_TAMILSUP } /* block=tamilsupplement */, + { 2, 2242, 7791, 3, 8, UNI_INNEWTAILUE } /* innewtailue */, + { 10, 3335, 0, 3, 0, UNI_ALL } /* all */, + { 3, 1846, 0, 2, 0, UNI_NL } /* nl */, + { 5, 3877, 
9875, 17, 4, UNI_MTEI } /* scriptextensions=mtei */, + { 2, 9979, 7018, 5, 3, UNI_SHAW } /* scx=shaw */, + { 0, 8973, 284, 6, 33, UNI_MISCMATHSYMBOLSB } /* block=miscellaneousmathematicalsymbolsb */, + { 4, 1223, 0, 4, 0, UNI_KANA } /* kana */, + { 1, 7907, 1, 9, 1, -UNI_XIDS } /* xidstart=n */, + { 0, 3877, 1924, 17, 6, UNI_ZYYY } /* scriptextensions=common */, + { 0, 2206, 34, 21, 6, UNI_GCB__EX } /* graphemeclusterbreak=extend */, + { 4, 185, 1632, 2, 23, UNI_GEOMETRICSHAPESEXT } /* isgeometricshapesextended */, + { 0, 8973, 8580, 7, 6, UNI_CJKEXTF } /* block=cjkextf */, + { 0, 1553, 207, 9, 2, UNI_PI } /* category=pi */, + { 2, 185, 3391, 2, 17, UNI__PERL_PATWS } /* ispatternwhitespace */, + { 10, 6937, 188, 6, 16, UNI_MISCSYMBOLS } /* inmiscellaneoussymbols */, + { 6, 1115, 0, 26, 0, UNI_cwkcf_values_index } /* changeswhennfkccasefolded= */, + { 2, 6083, 5732, 13, 3, UNI_NV__100 } /* numericvalue=100 */, + { 0, 1418, 7983, 24, 1, UNI_CCC__7 } /* canonicalcombiningclass=7 */, + { 2, 4885, 2435, 4, 18, UNI_GLAGOLITICSUP } /* inglagoliticsupplement */, + { 10, 10217, 103, 3, 2, UNI_BC__ET } /* bc=et */, + { 0, 8782, 7072, 8, 10, UNI_SORA } /* script=sorasompeng */, + { 4, 9476, 6302, 3, 4, UNI_HEBR } /* sc=hebr */, + { 1, 5875, 6662, 13, 12, UNI_JG__VERTICALTAIL } /* joininggroup=verticaltail */, + { 11, 9476, 10035, 3, 4, UNI_SC__TGLG } /* sc=tglg */, + { 0, 185, 10115, 2, 4, UNI_QAAI } /* iszinh */, + { 0, 9489, 3, 5, 1, -UNI_MATH } /* math=f */, + { 0, 10511, 5096, 5, 5, UNI_POSIXDIGIT } /* posixdigit */, + { 1, 185, 952, 2, 18, UNI_INVS } /* isvariationselectors */, + { 9, 1007, 0, 17, 0, UNI_ANCIENTGREEKMUSIC } /* ancientgreekmusic */, + { 1, 9979, 10111, 4, 4, UNI_ZANB } /* scx=zanb */, + { 0, 9979, 7700, 4, 9, UNI_QAAI } /* scx=inherited */, + { 0, 3877, 10119, 17, 4, UNI_ZYYY } /* scriptextensions=zyyy */, + { 0, 9201, 0, 4, 0, UNI_TELU } /* telu */, + { 0, 6578, 496, 12, 2, UNI_NT__NU } /* numerictype=nu */, + { 0, 185, 9947, 2, 4, UNI_COPT } /* isqaac 
*/, + { 0, 8973, 1193, 6, 26, UNI_HALFANDFULLFORMS } /* block=halfwidthandfullwidthforms */, + { 0, 9979, 8276, 4, 8, UNI_BALI } /* scx=balinese */, + { 0, 185, 9117, 2, 4, UNI_LEPC } /* islepc */, + { 2, 4074, 4624, 16, 14, UNI_SC } /* generalcategory=currencysymbol */, + { 3, 10244, 5522, 3, 14, UNI_SK } /* gc=modifiersymbol */, + { 0, 185, 7310, 2, 10, UNI_DIAK } /* isdivesakuru */, + { 1, 10280, 0, 3, 0, UNI_ri_values_index } /* ri= */, + { 20, 5093, 0, 9, 0, UNI_hex_values_index } /* hexdigit= */, + { 1, 9489, 1026, 5, 2, -UNI_MATH } /* math=no */, + { 1, 1553, 0, 9, 0, UNI_gc_values_index } /* category= */, + { 1, 185, 2993, 2, 19, UNI_SUPARROWSC } /* issupplementalarrowsc */, + { 5, 9691, 8277, 5, 7, UNI_INBALINESE } /* blk=balinese */, + { 0, 10247, 4804, 3, 15, UNI_JG__MANICHAEANGIMEL } /* jg=manichaeangimel */, + { 1, 9075, 3, 6, 1, -UNI_GREXT } /* grext=f */, + { 1, 6083, 8236, 13, 8, UNI_NV__17_SLASH_2 } /* numericvalue=8.50e+00 */, + { 16, 9099, 0, 6, 0, UNI_KANBUN } /* kanbun */, + { 3, 9979, 3978, 4, 8, UNI_BOPO } /* scx=bopomofo */, + { 0, 9045, 3, 6, 1, -UNI_CWKCF } /* cwkcf=f */, + { 0, 7230, 3814, 10, 3, UNI_BC__RLI } /* bidiclass=rli */, + { 1, 185, 1061, 3, 3, UNI_COPT } /* iscopt */, + { 2, 7360, 8873, 10, 7, UNI_LB__XX } /* linebreak=unknown */, + { 0, 21, 2354, 3, 19, UNI_INANATOLIANHIEROGLYPHS } /* inanatolianhieroglyphs */, + { 1, 185, 3463, 2, 12, UNI_SMALLKANAEXT } /* issmallkanaext */, + { 3, 7420, 0, 10, 0, UNI_XPEO } /* oldpersian */, + { 1, 10268, 9402, 3, 2, UNI_NV__34 } /* nv=34 */, + { 1, 4972, 8832, 3, 6, UNI_TGLG } /* istagalog */, + { 3, 10244, 1846, 3, 2, UNI_NL } /* gc=nl */, + { 5, 9476, 4042, 3, 7, UNI_SC__CPRT } /* sc=cypriot */, + { 1, 185, 9887, 2, 4, UNI_NBAT } /* isnbat */, + { 0, 6083, 8046, 13, 2, UNI_NV__13 } /* numericvalue=13 */, + { 1, 7460, 10071, 10, 4, UNI_IN__12_DOT_1 } /* presentin=v121 */, + { 6, 185, 9105, 2, 4, UNI_KHOJ } /* iskhoj */, + { 1, 7580, 10235, 10, 3, UNI_WB__EB } /* wordbreak=ebg */, + { 12, 
2784, 6070, 19, 13, UNI_HST__NA } /* hangulsyllabletype=notapplicable */, + { 0, 4074, 207, 16, 2, UNI_PI } /* generalcategory=pi */, + { 1, 3877, 9767, 17, 4, UNI_GONG } /* scriptextensions=gong */, + { 9, 2206, 912, 21, 1, UNI_GCB__V } /* graphemeclusterbreak=v */, + { 0, 8973, 4759, 6, 15, UNI_INIMPERIALARAMAIC } /* block=imperialaramaic */, + { 9, 185, 896, 2, 28, UNI_SUPPUAA } /* issupplementaryprivateuseareaa */, + { 1, 10516, 7, 3, 1, UNI_PC } /* ispc */, + { 0, 8887, 36, 7, 1, UNI_XPOSIXSPACE } /* wspace=t */, + { 1, 1418, 9420, 25, 4, UNI_CCC__91 } /* canonicalcombiningclass=ccc91 */, + { 0, 5116, 0, 14, 0, UNI_ci_values_index } /* caseignorable= */, + { 0, 10217, 5578, 3, 14, UNI_BC__NSM } /* bc=nonspacingmark */, + { 5, 10253, 396, 3, 2, UNI_LB__GL } /* lb=gl */, + { 1, 8642, 36, 7, 1, UNI_HYPHEN } /* hyphen=t */, + { 0, 7160, 9238, 3, 5, UNI_YEZI } /* isyezidi */, + { 0, 9051, 1, 6, 1, -UNI_ECOMP } /* ecomp=n */, + { 1, 185, 1632, 2, 15, UNI_GEOMETRICSHAPES } /* isgeometricshapes */, + { 7, 9691, 3265, 4, 8, UNI_INGEORGIAN } /* blk=georgian */, + { 0, 6083, 8132, 13, 8, UNI_NV__11_SLASH_2 } /* numericvalue=5.50e+00 */, + { 0, 3758, 0, 17, 0, UNI_identifierstatus_values_index } /* identifierstatus= */, + { 0, 185, 9871, 2, 4, UNI_MRO } /* ismroo */, + { 2, 9691, 2433, 4, 13, UNI_GLAGOLITICSUP } /* blk=glagoliticsup */, + { 6, 9711, 9004, 5, 5, UNI_CCC__122 } /* ccc=ccc122 */, + { 0, 185, 3193, 2, 4, UNI_ETHI } /* isethi */, + { 0, 8973, 2955, 6, 19, UNI_SUPARROWSA } /* block=supplementalarrowsa */, + { 1, 9476, 6518, 3, 12, UNI_MEND } /* sc=mendekikakui */, + { 0, 185, 10111, 2, 4, UNI_ZANB } /* iszanb */, + { 11, 185, 6195, 3, 11, UNI_CYRILLICEXTA } /* iscyrillicexta */, + { 0, 9691, 750, 4, 21, UNI_ENCLOSEDALPHANUM } /* blk=enclosedalphanumerics */, + { 4, 8782, 9915, 7, 4, UNI_SC__ORYA } /* script=orya */, + { 0, 3283, 10055, 18, 4, UNI_IDSB } /* idsbinaryoperator=true */, + { 2, 9647, 10190, 4, 3, UNI_AGE__5_DOT_2 } /* age=5.2 */, + { 2, 3877, 9783, 
17, 4, UNI_GURU } /* scriptextensions=guru */, + { 0, 5875, 5989, 13, 3, UNI_JG__NUN } /* joininggroup=nun */, + { 0, 7300, 1, 10, 1, -UNI_DIA } /* diacritic=n */, + { 1, 10217, 2917, 3, 19, UNI_BC__RLO } /* bc=righttoleftoverride */, + { 2, 7467, 7611, 3, 3, UNI_IN__5 } /* in=5.0 */, + { 1, 7360, 1187, 10, 2, UNI_LB__PO } /* linebreak=po */, + { 0, 9476, 2453, 3, 20, UNI_PHLI } /* sc=inscriptionalpahlavi */, + { 1, 8973, 3928, 6, 17, UNI_SUTTONSIGNWRITING } /* block=suttonsignwriting */, + { 0, 10247, 88, 3, 2, UNI_JG__HE } /* jg=he */, + { 1, 10217, 18, 3, 1, UNI_BC__R } /* bc=r */, + { 1, 10253, 10374, 3, 2, UNI_LB__B2 } /* lb=b2 */, + { 0, 7817, 0, 9, 0, UNI_PERM } /* oldpermic */, + { 0, 10217, 3337, 3, 18, UNI_BC__LRI } /* bc=lefttorightisolate */, + { 2, 10540, 3403, 7, 5, UNI_XPOSIXSPACE } /* isxperlspace */, + { 0, 8973, 7853, 6, 9, UNI_INPAUCINHAU } /* block=paucinhau */, + { 3, 6083, 10360, 13, 2, UNI_NV__39 } /* numericvalue=39 */, + { 4, 10268, 8244, 3, 8, UNI_NV__7_SLASH_8 } /* nv=8.75e-01 */, + { 0, 1270, 0, 25, 0, UNI_compex_values_index } /* fullcompositionexclusion= */, + { 8, 7460, 10313, 10, 3, UNI_IN__4_DOT_1 } /* presentin=v41 */, + { 1, 9476, 1014, 3, 5, UNI_SC__GREK } /* sc=greek */, + { 1, 1270, 3, 25, 1, -UNI_COMPEX } /* fullcompositionexclusion=f */, + { 3, 8782, 10087, 7, 4, UNI_WCHO } /* script=wcho */, + { 0, 2185, 10355, 21, 3, UNI_EXTPICT } /* extendedpictographic=yes */, + { 0, 2784, 7380, 19, 10, UNI_LB__H2 } /* hangulsyllabletype=lvsyllable */, + { 0, 9691, 8396, 4, 8, UNI_KANAEXTA } /* blk=kanaexta */, + { 0, 9153, 17, 7, 1, UNI_COMPEX } /* nfcqc=no */, + { 7, 2242, 8720, 3, 6, UNI_NB } /* innoblock */, + { 1, 10250, 7400, 3, 10, UNI_JT__U } /* jt=nonjoining */, + { 3, 7460, 7611, 10, 3, UNI_IN__5 } /* presentin=5.0 */, + { 0, 6083, 8204, 13, 8, UNI_NV__3_SLASH_4 } /* numericvalue=7.50e-01 */, + { 0, 6338, 0, 11, 0, UNI_JOINC } /* joincontrol */, + { 2, 10553, 3936, 3, 3, UNI_SGNW } /* issgnw */, + { 1, 9476, 5940, 3, 9, 
UNI_SC__MLYM } /* sc=malayalam */, + { 0, 2808, 7202, 4, 8, UNI_ARABICEXTB } /* inarabicextb */, + { 0, 10253, 6096, 3, 13, UNI_LB__PR } /* lb=prefixnumeric */, + { 0, 599, 0, 2, 0, UNI_XPOSIXCNTRL } /* cc */, + { 12, 9219, 3, 6, 1, -UNI_XPOSIXUPPER } /* upper=f */, + { 3, 10027, 0, 4, 0, UNI_TAVT } /* tavt */, + { 8, 8782, 7570, 7, 4, UNI_WARA } /* script=wara */, + { 1, 10516, 468, 7, 5, UNI_POSIXPUNCT } /* isposixpunct */, + { 0, 9476, 9751, 3, 4, UNI_DIAK } /* sc=diak */, + { 1, 6158, 10055, 12, 4, UNI_BIDIC } /* bidicontrol=true */, + { 3, 9711, 8027, 4, 3, UNI_CCC__B } /* ccc=220 */, + { 5, 185, 1443, 3, 9, UNI_CJKSYMBOLS } /* iscjksymbols */, + { 2, 185, 5059, 2, 15, UNI_ZANB } /* iszanabazarsquare */, + { 4, 1792, 0, 22, 0, UNI_cwcf_values_index } /* changeswhencasefolded= */, + { 0, 10553, 7434, 3, 3, UNI_SOGD } /* issogd */, + { 0, 9476, 10031, 3, 4, UNI_TFNG } /* sc=tfng */, + { 1, 1770, 6001, 22, 4, UNI_BPT__N } /* bidipairedbrackettype=none */, + { 0, 9476, 7835, 3, 9, UNI_SC__OUGR } /* sc=olduyghur */, + { 1, 185, 2085, 2, 14, UNI_LM } /* ismodifierletter */, + { 3, 3877, 9444, 17, 5, UNI_DOGR } /* scriptextensions=dogra */, + { 4, 8782, 8500, 7, 4, UNI_UGAR } /* script=ugar */, + { 8, 9691, 2269, 4, 14, UNI_MEETEIMAYEKEXT } /* blk=meeteimayekext */, + { 3, 21, 2614, 3, 18, UNI_ANCIENTGREEKNUMBERS } /* inancientgreeknumbers */, + { 4, 10352, 1846, 3, 2, UNI_WB__NL } /* wb=nl */, + { 1, 8887, 0, 7, 0, UNI_wspace_values_index } /* wspace= */, + { 0, 6083, 8043, 13, 2, UNI_NV__23 } /* numericvalue=23 */, + { 0, 10553, 108, 3, 5, UNI_S } /* issymbol */, + { 1, 10253, 10378, 3, 2, UNI_LB__H2 } /* lb=h2 */, + { 1, 185, 1223, 2, 4, UNI_KANA } /* iskana */, + { 5, 4534, 0, 15, 0, UNI_BRAI } /* braillepatterns */, + { 1, 7580, 401, 10, 6, UNI_WB__FO } /* wordbreak=format */, + { 0, 10244, 468, 3, 5, UNI_P } /* gc=punct */, + { 3, 9691, 2164, 4, 8, UNI_INCYRILLIC } /* blk=cyrillic */, + { 1, 9476, 9951, 3, 4, UNI_SC__QAAI } /* sc=qaai */, + { 4, 9691, 3265, 4, 
18, UNI_GEORGIANSUP } /* blk=georgiansupplement */, + { 26, 10217, 3211, 3, 18, UNI_BC__ET } /* bc=europeanterminator */, + { 6, 8316, 26, 8, 1, UNI_EXTPICT } /* extpict=y */, + { 0, 10402, 10499, 6, 9, UNI__PERL_QUOTEMETA } /* _perl_quotemeta */, + { 0, 185, 7682, 2, 8, UNI_EXT } /* isextender */, + { 1, 185, 3, 3, 1, UNI_CF } /* iscf */, + { 0, 10244, 9706, 3, 2, UNI_MC } /* gc=mc */, + { 1, 9735, 26, 4, 1, UNI_CWU } /* cwu=y */, + { 0, 9434, 3, 5, 1, -UNI_CWCM } /* cwcm=f */, + { 0, 1418, 79, 24, 2, UNI_CCC__AR } /* canonicalcombiningclass=ar */, + { 2, 9147, 36, 6, 1, UNI__PERL_NCHAR } /* nchar=t */, + { 16, 2056, 1026, 22, 2, -UNI__PERL_NCHAR } /* noncharactercodepoint=no */, + { 0, 1189, 4443, 3, 15, UNI_TANGUTSUP } /* intangutsupplement */, + { 0, 10516, 9172, 3, 4, UNI__PERL_PATWS } /* ispatws */, + { 0, 4157, 1309, 3, 2, UNI_IDS } /* isids */, + { 3, 9747, 9454, 4, 5, -UNI_DIA } /* dia=false */, + { 2, 9461, 34, 3, 6, UNI_SB__EX } /* sb=extend */, + { 1, 8782, 9903, 7, 4, UNI_OGAM } /* script=ogam */, + { 2, 2433, 0, 13, 0, UNI_GLAGOLITICSUP } /* glagoliticsup */, + { 0, 8705, 48, 7, 1, UNI_NFCQC__M } /* nfkcqc=m */, + { 1, 7270, 0, 10, 0, UNI_CJKSTROKES } /* cjkstrokes */, + { 0, 10553, 8804, 3, 6, UNI_SIDD } /* issiddham */, + { 0, 185, 3934, 2, 11, UNI_SGNW } /* issignwriting */, + { 1, 4972, 9208, 3, 3, UNI_THAA } /* isthaa */, + { 1, 2708, 0, 19, 0, UNI_EGYP } /* egyptianhieroglyphs */, + { 1, 4684, 9141, 15, 6, UNI_EA__NA } /* eastasianwidth=narrow */, + { 1, 7360, 10382, 10, 2, UNI_GCB__L } /* linebreak=jl */, + { 0, 1553, 1564, 9, 2, UNI_PS } /* category=ps */, + { 1, 9711, 8235, 4, 2, UNI_CCC__28 } /* ccc=28 */, + { 5, 3877, 9831, 17, 4, UNI_LAO } /* scriptextensions=laoo */, + { 3, 9851, 0, 4, 0, UNI_MEDF } /* medf */, + { 3, 9691, 9183, 4, 6, UNI_INREJANG } /* blk=rejang */, + { 5, 8973, 7844, 6, 9, UNI_PALM } /* block=palmyrene */, + { 0, 8973, 8260, 6, 8, UNI_INARMENIAN } /* block=armenian */, + { 2, 8973, 2690, 7, 18, UNI_COUNTINGROD } /* 
block=countingrodnumerals */, + { 1, 9476, 8670, 3, 7, UNI_MAKA } /* sc=makasar */, + { 0, 7060, 0, 10, 0, UNI_SD } /* softdotted */, + { 1, 9476, 6386, 3, 4, UNI_SC__MAHJ } /* sc=mahj */, + { 0, 8881, 81, 4, 8, UNI_ARABICMATH } /* isarabicmath */, + { 8, 9691, 3605, 4, 17, UNI_UCAS } /* blk=canadiansyllabics */, + { 2, 4154, 8510, 4, 6, UNI_INVITHKUQI } /* invithkuqi */, + { 9, 4744, 2047, 15, 9, UNI_IDENTIFIERTYPE__TECHNICAL } /* identifiertype=technical */, + { 0, 8782, 9069, 7, 6, UNI_GOTH } /* script=gothic */, + { 2, 5172, 26, 14, 1, UNI_EMOD } /* emojimodifier=y */, + { 2, 1858, 1, 22, 1, -UNI_CWT } /* changeswhentitlecased=n */, + { 3, 9979, 9775, 4, 4, UNI_GREK } /* scx=grek */, + { 0, 6578, 5797, 12, 7, UNI_XPOSIXDIGIT } /* numerictype=decimal */, + { 0, 5592, 3, 14, 1, -UNI_PATSYN } /* patternsyntax=f */, + { 2, 7781, 0, 9, 0, UNI_NBAT } /* nabataean */, + { 0, 9691, 5354, 4, 14, UNI_LATINEXTG } /* blk=latinextendedg */, + { 0, 6340, 7282, 4, 8, UNI_COMPATJAMO } /* incompatjamo */, + { 0, 9476, 9135, 3, 4, UNI_LYDI } /* sc=lydi */, + { 0, 2311, 0, 21, 0, UNI_SINHALAARCHAICNUMBERS } /* sinhalaarchaicnumbers */, + { 8, 9429, 3, 5, 1, -UNI_CWCF } /* cwcf=f */, + { 8, 10268, 8116, 3, 8, UNI_NV__3_SLASH_64 } /* nv=4.69e-02 */, + { 9, 9177, 0, 5, 0, UNI_QMARK } /* qmark */, + { 0, 2311, 0, 7, 0, UNI_SINH } /* sinhala */, + { 4, 4885, 2435, 4, 11, UNI_GLAGOLITICSUP } /* inglagoliticsup */, + { 0, 4504, 0, 15, 0, UNI_BAMUMSUP } /* bamumsupplement */, + { 2, 8782, 5634, 7, 14, UNI_SC__PHLP } /* script=psalterpahlavi */, + { 2, 185, 2841, 2, 19, UNI_MERO } /* ismeroitichieroglyphs */, + { 10, 9476, 8803, 3, 4, UNI_SIDD } /* sc=sidd */, + { 2, 10247, 6686, 3, 11, UNI_JG__AFRICANNOON } /* jg=africannoon */, + { 6, 8973, 9509, 6, 5, UNI_INOGHAM } /* block=ogham */, + { 3, 8782, 10035, 7, 4, UNI_SC__TGLG } /* script=tglg */, + { 0, 9691, 9264, 4, 5, UNI_INADLAM } /* blk=adlam */, + { 0, 9159, 0, 7, 0, UNI_DT__CAN } /* nfdqc=n */, + { 8, 10511, 9424, 5, 5, 
UNI_POSIXCNTRL } /* posixcntrl */, + { 0, 7230, 5926, 10, 3, UNI_BC__RLO } /* bidiclass=rlo */, + { 3, 9469, 5635, 3, 13, UNI_INPSALTERPAHLAVI } /* inpsalterpahlavi */, + { 1, 9979, 9069, 4, 6, UNI_GOTH } /* scx=gothic */, + { 0, 185, 6518, 2, 12, UNI_MEND } /* ismendekikakui */, + { 26, 8782, 8300, 7, 4, UNI_SC__DUPL } /* script=dupl */, + { 1, 9476, 2632, 3, 4, UNI_BRAH } /* sc=brah */, + { 10, 8782, 8356, 7, 8, UNI_SC__HIRA } /* script=hiragana */, + { 0, 2248, 7521, 3, 9, UNI_SUPARROWSA } /* insuparrowsa */, + { 0, 185, 6939, 2, 11, UNI_MISCSYMBOLS } /* ismiscsymbols */, + { 8, 1592, 8608, 3, 6, UNI_INELBASAN } /* inelbasan */, + { 2, 10247, 5424, 3, 14, UNI_JG__MANICHAEANFIVE } /* jg=manichaeanfive */, + { 2, 7700, 0, 9, 0, UNI_QAAI } /* inherited */, + { 2, 4074, 1923, 16, 2, UNI_PC } /* generalcategory=pc */, + { 8, 8887, 1, 7, 1, -UNI_XPOSIXSPACE } /* wspace=n */, + { 1, 9476, 9033, 3, 6, UNI_SC__CAKM } /* sc=chakma */, + { 0, 10253, 8428, 3, 8, UNI_LB__NL } /* lb=nextline */, + { 0, 2304, 9912, 3, 3, UNI_ORKH } /* isorkh */, + { 1, 5408, 8672, 4, 5, UNI_INMAKASAR } /* inmakasar */, + { 0, 10244, 4058, 3, 16, UNI_PF } /* gc=finalpunctuation */, + { 1, 9476, 2269, 3, 11, UNI_MTEI } /* sc=meeteimayek */, + { 2, 7360, 7590, 10, 10, UNI_LB__WJ } /* linebreak=wordjoiner */, + { 14, 9647, 8100, 4, 3, UNI_AGE__4_DOT_1 } /* age=4.1 */, + { 3, 185, 219, 3, 32, UNI_DIACRITICALSEXT } /* iscombiningdiacriticalmarksextended */, + { 0, 6083, 7934, 13, 1, UNI_NV__2 } /* numericvalue=2 */, + { 5, 7450, 0, 10, 0, UNI_PHNX } /* phoenician */, + { 2, 63, 0, 5, 0, UNI_XPOSIXGRAPH } /* graph */, + { 7, 8961, 1, 6, 1, -UNI_BIDIC } /* bidic=n */, + { 0, 9691, 6386, 4, 12, UNI_MAHJONG } /* blk=mahjongtiles */, + { 5, 9763, 6895, 4, 3, UNI_LB__H3 } /* gcb=lvt */, + { 5, 9476, 9887, 3, 4, UNI_NBAT } /* sc=nbat */, + { 0, 185, 1345, 2, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* issymbolsforlegacycomputing */, + { 0, 9979, 9811, 4, 4, UNI_KHMR } /* scx=khmr */, + { 0, 7467, 10202, 3, 3, 
UNI_IN__6_DOT_3 } /* in=6.3 */, + { 10, 7467, 10295, 3, 3, UNI_IN__2 } /* in=v20 */, + { 0, 8782, 9883, 7, 4, UNI_NARB } /* script=narb */, + { 7, 1418, 9375, 25, 4, UNI_CCC__29 } /* canonicalcombiningclass=ccc29 */, + { 2, 6578, 6001, 12, 4, UNI_NV__NAN } /* numerictype=none */, + { 2, 10247, 10241, 3, 3, UNI_JG__GAF } /* jg=gaf */, + { 2, 9979, 9823, 4, 4, UNI_KTHI } /* scx=kthi */, + { 1, 8705, 9494, 7, 5, UNI_NFCQC__M } /* nfkcqc=maybe */, + { 0, 2056, 26, 22, 1, UNI__PERL_NCHAR } /* noncharactercodepoint=y */, + { 5, 3406, 26, 3, 1, UNI_CE } /* ce=y */, + { 1, 8973, 8649, 6, 7, UNI_INKANNADA } /* block=kannada */, + { 10, 9691, 8649, 4, 7, UNI_INKANNADA } /* blk=kannada */, + { 3, 185, 27, 2, 2, UNI_LOWERCASELETTER } /* isll */, + { 4, 2056, 10055, 22, 4, UNI__PERL_NCHAR } /* noncharactercodepoint=true */, + { 1, 980, 0, 27, 0, UNI_ALPHABETICPF } /* alphabeticpresentationforms */, + { 2, 1592, 3194, 3, 7, UNI_INETHIOPIC } /* inethiopic */, + { 3, 3877, 10031, 17, 4, UNI_TFNG } /* scriptextensions=tfng */, + { 0, 3877, 8649, 17, 7, UNI_KNDA } /* scriptextensions=kannada */, + { 2, 3877, 9943, 17, 4, UNI_PRTI } /* scriptextensions=prti */, + { 0, 9711, 10386, 4, 2, UNI_CCC__8 } /* ccc=kv */, + { 1, 9691, 3067, 4, 18, UNI_HALFMARKS } /* blk=combininghalfmarks */, + { 3, 6083, 8059, 13, 2, UNI_NV__33 } /* numericvalue=33 */, + { 1, 9691, 8754, 4, 7, UNI_INOSMANYA } /* blk=osmanya */, + { 17, 4847, 4315, 3, 15, UNI_MYANMAREXTA } /* inmyanmarextendeda */, + { 3, 8973, 5368, 6, 14, UNI_LISUSUP } /* block=lisusupplement */, + { 1, 8782, 9843, 7, 4, UNI_SC__LINB } /* script=linb */, + { 0, 8768, 0, 7, 0, UNI_patsyn_values_index } /* patsyn= */, + { 8, 1792, 10055, 22, 4, UNI_CWCF } /* changeswhencasefolded=true */, + { 0, 9190, 0, 6, 0, UNI_TERM } /* term=t */, + { 4, 9691, 8468, 4, 8, UNI_INTAGBANWA } /* blk=tagbanwa */, + { 9, 9461, 1160, 3, 2, UNI_SB__ST } /* sb=st */, + { 0, 10268, 7924, 3, 8, UNI_NV__1_SLASH_9 } /* nv=1.11e-01 */, + { 1, 1288, 0, 2, 0, 
UNI_UPPERCASELETTER } /* lu */, + { 0, 9691, 2993, 4, 19, UNI_SUPARROWSC } /* blk=supplementalarrowsc */, + { 3, 7297, 4139, 3, 15, UNI_HIGHPUSURROGATES } /* ishighpusurrogates */, + { 0, 6083, 9254, 13, 5, UNI_NV__1_SLASH_320 } /* numericvalue=1/320 */, + { 0, 8973, 9195, 6, 6, UNI_INTANGSA } /* block=tangsa */, + { 3, 2312, 5243, 3, 13, UNI_HIGHSURROGATES } /* inhighsurrogates */, + { 9, 21, 8372, 2, 8, UNI_JAMOEXTA } /* injamoexta */, + { 1, 6529, 8741, 3, 6, UNI_OLCK } /* inolchiki */, + { 4, 185, 7673, 2, 9, UNI_EMOTICONS } /* isemoticons */, + { 12, 185, 9425, 3, 4, UNI_XPOSIXCNTRL } /* iscntrl */, + { 3, 9979, 8348, 4, 8, UNI_GURU } /* scx=gurmukhi */, + { 0, 1418, 9395, 25, 4, UNI_CCC__33 } /* canonicalcombiningclass=ccc33 */, + { 0, 9476, 9201, 3, 4, UNI_SC__TELU } /* sc=telu */, + { 0, 1418, 8091, 24, 2, UNI_CCC__24 } /* canonicalcombiningclass=24 */, + { 1, 1592, 7675, 4, 7, UNI_EMOTICONS } /* inemoticons */, + { 10, 8973, 44, 7, 8, UNI_CJKCOMPAT } /* block=cjkcompat */, + { 16, 5875, 7290, 13, 10, UNI_JG__DALATHRISH } /* joininggroup=dalathrish */, + { 2, 8973, 8607, 6, 7, UNI_INELBASAN } /* block=elbasan */, + { 1, 9979, 10043, 4, 4, UNI_TIBT } /* scx=tibt */, + { 1, 185, 8614, 2, 4, UNI_ELYM } /* iselym */, + { 1, 185, 401, 2, 6, UNI_CF } /* isformat */, + { 0, 9550, 9454, 4, 5, -UNI_IDS } /* ids=false */, + { 8, 8768, 10055, 7, 4, UNI_PATSYN } /* patsyn=true */, + { 0, 9482, 0, 4, 0, UNI_PHLI } /* phli */, + { 2, 185, 8545, 3, 6, UNI_CJKEXTA } /* iscjkexta */, + { 3, 9691, 7673, 4, 9, UNI_EMOTICONS } /* blk=emoticons */, + { 1, 1506, 2278, 5, 5, UNI_GREEKEXT } /* ingreekext */, + { 9, 10560, 1775, 3, 2, UNI_VAI } /* isvai */, + { 1, 8973, 6939, 6, 11, UNI_MISCSYMBOLS } /* block=miscsymbols */, + { 6, 3448, 1130, 3, 3, UNI_UCAS } /* inucas */, + { 0, 10268, 9563, 3, 4, UNI_NV__1_SLASH_10 } /* nv=1/10 */, + { 0, 9117, 0, 4, 0, UNI_LEPC } /* lepc */, + { 5, 6083, 9013, 13, 2, UNI_NV__29 } /* numericvalue=29 */, + { 1, 9647, 10313, 4, 3, UNI_AGE__4_DOT_1 
} /* age=v41 */, + { 1, 3877, 8356, 17, 4, UNI_HIRA } /* scriptextensions=hira */, + { 0, 9691, 0, 4, 0, UNI_blk_values_index } /* blk= */, + { 0, 1189, 3482, 3, 17, UNI_TAIXUANJING } /* intaixuanjingsymbols */, + { 1, 6937, 5232, 4, 2, UNI_INMIAO } /* inmiao */, + { 0, 3391, 26, 18, 1, UNI__PERL_PATWS } /* patternwhitespace=y */, + { 2, 10244, 1588, 3, 1, UNI_Z } /* gc=z */, + { 1, 9711, 5732, 4, 2, UNI_CCC__10 } /* ccc=10 */, + { 10, 8973, 6494, 6, 12, UNI_INMASARAMGONDI } /* block=masaramgondi */, + { 1, 185, 1026, 2, 2, UNI_NO } /* isno */, + { 0, 9476, 2085, 3, 4, UNI_SC__MODI } /* sc=modi */, + { 0, 9979, 9779, 4, 4, UNI_GUJR } /* scx=gujr */, + { 0, 1792, 1, 22, 1, -UNI_CWCF } /* changeswhencasefolded=n */, + { 0, 9711, 9315, 5, 4, UNI_CCC__17 } /* ccc=ccc17 */, + { 2, 185, 3724, 2, 17, UNI_ETHIOPICEXTB } /* isethiopicextendedb */, + { 5, 6340, 44, 3, 25, UNI_CJKCOMPATIDEOGRAPHS } /* incjkcompatibilityideographs */, + { 0, 4972, 8777, 3, 3, UNI_TAGS } /* istags */, + { 0, 10553, 10403, 7, 4, UNI_XPOSIXSPACE } /* isspaceperl */, + { 1, 10217, 4549, 3, 15, UNI_BC__CS } /* bc=commonseparator */, + { 4, 7280, 0, 10, 0, UNI_COMPATJAMO } /* compatjamo */, + { 11, 6158, 1026, 12, 2, -UNI_BIDIC } /* bidicontrol=no */, + { 5, 750, 0, 16, 0, UNI_ENCLOSEDALPHANUM } /* enclosedalphanum */, + { 8, 9691, 4505, 5, 7, UNI_BAMUMSUP } /* blk=bamumsup */, + { 1, 185, 4090, 2, 11, UNI_GEORGIANEXT } /* isgeorgianext */, + { 0, 185, 8621, 2, 4, UNI_GRAN } /* isgran */, + { 0, 3877, 10123, 17, 4, UNI_ZZZZ } /* scriptextensions=zzzz */, + { 0, 1418, 9012, 24, 3, UNI_CCC__129 } /* canonicalcombiningclass=129 */, + { 0, 9691, 2453, 4, 20, UNI_ININSCRIPTIONALPAHLAVI } /* blk=inscriptionalpahlavi */, + { 3, 9469, 3499, 5, 18, UNI_INPC__TOPANDLEFTANDRIGHT } /* inpc=topandleftandright */, + { 2, 9691, 9105, 4, 6, UNI_INKHOJKI } /* blk=khojki */, + { 0, 2593, 410, 20, 2, UNI_VO__TR } /* verticalorientation=tr */, + { 0, 3877, 9201, 17, 6, UNI_TELU } /* scriptextensions=telugu */, + { 0, 
3877, 9201, 17, 4, UNI_TELU } /* scriptextensions=telu */, + { 1, 9691, 4849, 4, 15, UNI_INMEROITICCURSIVE } /* blk=meroiticcursive */, + { 1, 8782, 9871, 7, 4, UNI_MRO } /* script=mroo */, + { 2, 9691, 1219, 4, 26, UNI_KATAKANAEXT } /* blk=katakanaphoneticextensions */, + { 8, 3445, 0, 18, 0, UNI_RUMI } /* ruminumeralsymbols */, + { 0, 3448, 8501, 3, 7, UNI_INUGARITIC } /* inugaritic */, + { 2, 10019, 0, 4, 0, UNI_TALU } /* talu */, + { 0, 2248, 8804, 3, 6, UNI_INSIDDHAM } /* insiddham */, + { 0, 8973, 2165, 7, 10, UNI_CYRILLICSUP } /* block=cyrillicsup */, + { 0, 10283, 1, 3, 1, -UNI_SD } /* sd=n */, + { 3, 3877, 9643, 17, 4, UNI_ADLM } /* scriptextensions=adlm */, + { 6, 8782, 10008, 8, 3, UNI_SC__SYRC } /* script=syrc */, + { 0, 952, 0, 17, 0, UNI_VS } /* variationselector */, + { 8, 3877, 9799, 17, 4, UNI_HMNP } /* scriptextensions=hmnp */, + { 0, 9476, 2433, 3, 4, UNI_SC__GLAG } /* sc=glag */, + { 2, 3877, 5227, 17, 4, UNI_CHAM } /* scriptextensions=cham */, + { 0, 251, 0, 33, 0, UNI_MISCMATHSYMBOLSA } /* miscellaneousmathematicalsymbolsa */, + { 4, 185, 4043, 3, 15, UNI_CYPRIOTSYLLABARY } /* iscypriotsyllabary */, + { 3, 3877, 1219, 17, 8, UNI_KANA } /* scriptextensions=katakana */, + { 2, 9213, 9454, 6, 5, -UNI_UIDEO } /* uideo=false */, + { 0, 9979, 7863, 5, 8, UNI_SAMR } /* scx=samaritan */, + { 1, 9999, 0, 4, 0, UNI_SHRD } /* shrd */, + { 4, 9476, 8600, 3, 7, UNI_DSRT } /* sc=deseret */, + { 4, 8782, 9231, 7, 6, UNI_WCHO } /* script=wancho */, + { 10, 8973, 3050, 7, 7, UNI_INCHEROKEE } /* block=cherokee */, + { 2, 9476, 8754, 3, 7, UNI_OSMA } /* sc=osmanya */, + { 0, 10268, 10184, 3, 3, UNI_NV__4_SLASH_5 } /* nv=4/5 */, + { 3, 9711, 16, 4, 1, UNI_CCC__B } /* ccc=b */, + { 3, 1553, 5797, 9, 13, UNI_XPOSIXDIGIT } /* category=decimalnumber */, + { 11, 5875, 4804, 13, 15, UNI_JG__MANICHAEANGIMEL } /* joininggroup=manichaeangimel */, + { 1, 3283, 0, 4, 0, UNI_IDSB } /* idsb */, + { 16, 6752, 0, 6, 0, UNI_DOMINO } /* domino */, + { 1, 3877, 4984, 17, 5, 
UNI_TAML } /* scriptextensions=tamil */, + { 8, 185, 4639, 2, 4, UNI_DASH } /* isdash */, + { 3, 9847, 10355, 4, 3, UNI_LOE } /* loe=yes */, + { 7, 10217, 1354, 3, 3, UNI_BC__RLE } /* bc=rle */, + { 0, 10244, 1060, 3, 2, UNI_SO } /* gc=so */, + { 1, 10268, 9616, 3, 3, UNI_NV__7_SLASH_2 } /* nv=7/2 */, + { 0, 1116, 0, 4, 0, UNI_HANG } /* hang */, + { 0, 9691, 5940, 4, 9, UNI_INMALAYALAM } /* blk=malayalam */, + { 1, 9691, 6752, 4, 11, UNI_DOMINO } /* blk=dominotiles */, + { 0, 185, 9839, 2, 4, UNI_LINA } /* islina */, + { 9, 8803, 0, 7, 0, UNI_SIDD } /* siddham */, + { 1, 185, 3978, 2, 11, UNI_BOPOMOFOEXT } /* isbopomofoext */, + { 5, 10530, 8868, 4, 5, UNI_INTIRHUTA } /* intirhuta */, + { 0, 9691, 1345, 4, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* blk=symbolsforlegacycomputing */, + { 0, 8973, 7433, 6, 7, UNI_INSOGDIAN } /* block=sogdian */, + { 1, 8316, 10055, 8, 4, UNI_EXTPICT } /* extpict=true */, + { 4, 9979, 1629, 4, 4, UNI_PHAG } /* scx=phag */, + { 0, 1814, 3, 22, 1, -UNI_CWCM } /* changeswhencasemapped=f */, + { 0, 1553, 599, 9, 2, UNI_XPOSIXCNTRL } /* category=cc */, + { 0, 185, 9484, 2, 4, UNI_LIMB } /* islimb */, + { 0, 10247, 6266, 3, 12, UNI_JG__FINALSEMKATH } /* jg=finalsemkath */, + { 2, 10244, 5676, 3, 14, UNI_ZS } /* gc=spaceseparator */, + { 1, 5662, 4346, 14, 5, UNI_SB__XX } /* sentencebreak=other */, + { 1, 2803, 1026, 19, 2, -UNI_IDST } /* idstrinaryoperator=no */, + { 8, 9979, 9787, 4, 4, UNI_HANO } /* scx=hano */, + { 1, 3877, 6494, 17, 12, UNI_GONM } /* scriptextensions=masaramgondi */, + { 9, 1115, 36, 26, 1, UNI_CWKCF } /* changeswhennfkccasefolded=t */, + { 0, 9979, 9831, 4, 3, UNI_LAO } /* scx=lao */, + { 2, 6083, 8140, 13, 8, UNI_NV__7_SLASH_12 } /* numericvalue=5.83e-01 */, + { 1, 9979, 8811, 5, 6, UNI_SOYO } /* scx=soyombo */, + { 0, 8593, 1, 7, 1, -UNI_COMPEX } /* compex=n */, + { 5, 1678, 0, 5, 0, UNI_LATN } /* latin */, + { 4, 4074, 342, 16, 2, UNI_PE } /* generalcategory=pe */, + { 0, 10403, 3403, 4, 5, UNI_POSIXSPACE } /* perlspace 
*/, + { 0, 7360, 4401, 10, 9, UNI_EMOD } /* linebreak=emodifier */, + { 16, 8973, 6675, 6, 3, UNI_INIDC } /* block=idc */, + { 5, 10553, 0, 7, 0, UNI_XPOSIXSPACE } /* isspace */, + { 0, 10268, 9575, 3, 3, UNI_NV__1_SLASH_6 } /* nv=1/6 */, + { 10, 9711, 9606, 4, 3, UNI_CCC__214 } /* ccc=214 */, + { 7, 7218, 3979, 3, 7, UNI_INBOPOMOFO } /* inbopomofo */, + { 0, 9691, 4609, 4, 15, UNI_CONTROLPICTURES } /* blk=controlpictures */, + { 11, 8973, 4090, 6, 11, UNI_GEORGIANEXT } /* block=georgianext */, + { 6, 8973, 7540, 6, 10, UNI_SUPARROWSC } /* block=suparrowsc */, + { 2, 10223, 1026, 3, 2, -UNI_CI } /* ci=no */, + { 1, 9691, 5242, 4, 14, UNI_HIGHSURROGATES } /* blk=highsurrogates */, + { 0, 1418, 9345, 25, 4, UNI_CCC__23 } /* canonicalcombiningclass=ccc23 */, + { 10, 9213, 0, 5, 0, UNI_UIDEO } /* uideo */, + { 1, 10226, 10355, 3, 3, UNI_DI } /* di=yes */, + { 2, 185, 1320, 2, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* issymbolsandpictographsexta */, + { 10, 8973, 9294, 6, 5, UNI_INBUHID } /* block=buhid */, + { 3, 9476, 8650, 4, 6, UNI_SC__KNDA } /* sc=kannada */, + { 1, 468, 0, 11, 0, UNI_P } /* punctuation */, + { 1, 10352, 73, 3, 2, UNI_WB__LE } /* wb=le */, + { 4, 3877, 8468, 17, 8, UNI_TAGB } /* scriptextensions=tagbanwa */, + { 3, 9979, 8340, 4, 8, UNI_GUJR } /* scx=gujarati */, + { 10, 4847, 6930, 4, 9, UNI_INMEDEFAIDRIN } /* inmedefaidrin */, + { 1, 9731, 1, 4, 1, -UNI_CWT } /* cwt=n */, + { 0, 9213, 3, 6, 1, -UNI_UIDEO } /* uideo=f */, + { 0, 3121, 8332, 18, 3, UNI_DT__FRA } /* decompositiontype=fra */, + { 0, 7580, 109, 10, 2, UNI_WB__MB } /* wordbreak=mb */, + { 1, 4744, 7350, 15, 10, UNI_IDENTIFIERTYPE__LIMITEDUSE } /* identifiertype=limiteduse */, + { 0, 9979, 9135, 4, 4, UNI_LYDI } /* scx=lydi */, + { 0, 8973, 2841, 6, 19, UNI_MERO } /* block=meroitichieroglyphs */, + { 0, 6083, 5732, 13, 5, UNI_NV__10000 } /* numericvalue=10000 */, + { 8, 10247, 0, 3, 0, UNI_jg_values_index } /* jg= */, + { 0, 5648, 3, 14, 1, -UNI_QMARK } /* quotationmark=f */, + { 1, 8973, 
1674, 6, 4, UNI_JAMO } /* block=jamo */, + { 0, 3877, 7844, 17, 4, UNI_PALM } /* scriptextensions=palm */, + { 0, 6083, 9623, 13, 4, UNI_NV__3_SLASH_20 } /* numericvalue=3/20 */, + { 0, 6083, 8004, 13, 8, UNI_NV__5_SLASH_2 } /* numericvalue=2.50e+00 */, + { 1, 185, 7727, 2, 9, UNI_LATINEXTC } /* islatinextc */, + { 0, 9476, 9987, 3, 4, UNI_SGNW } /* sc=sgnw */, + { 1, 9691, 6730, 4, 11, UNI_INCYPROMINOAN } /* blk=cyprominoan */, + { 5, 8782, 9237, 7, 6, UNI_SC__YEZI } /* script=yezidi */, + { 2, 4699, 0, 15, 0, UNI_ecomp_values_index } /* emojicomponent= */, + { 2, 7360, 10376, 10, 2, UNI_LB__BK } /* linebreak=bk */, + { 1, 9691, 909, 4, 14, UNI_PUA } /* blk=privateusearea */, + { 34, 134, 0, 4, 0, UNI_M } /* mark */, + { 0, 3265, 0, 11, 0, UNI_GEORGIANSUP } /* georgiansup */, + { 4, 10223, 9454, 3, 5, -UNI_CI } /* ci=false */, + { 0, 6083, 8937, 13, 6, UNI_NV__700000 } /* numericvalue=700000 */, + { 2, 6083, 9559, 13, 4, UNI_NV___MINUS_1_SLASH_2 } /* numericvalue=-1/2 */, + { 6, 7580, 7899, 11, 8, UNI_WB__WSEGSPACE } /* wordbreak=wsegspace */, + { 0, 8628, 10055, 7, 4, UNI_GRBASE } /* grbase=true */, + { 4, 9847, 26, 4, 1, UNI_LOE } /* loe=y */, + { 2, 9474, 8880, 5, 7, UNI_INSC__VISARGA } /* insc=visarga */, + { 0, 1418, 3039, 24, 10, UNI_CCC__AR } /* canonicalcombiningclass=aboveright */, + { 5, 10250, 6885, 4, 10, UNI_JT__L } /* jt=leftjoining */, + { 1, 5875, 10277, 13, 3, UNI_JG__REH } /* joininggroup=reh */, + { 1, 10553, 8797, 3, 6, UNI_SHAW } /* isshavian */, + { 2, 1990, 4458, 22, 5, UNI_INSC__VOWEL } /* indicsyllabiccategory=vowel */, + { 4, 1418, 8027, 24, 2, UNI_CCC__22 } /* canonicalcombiningclass=22 */, + { 0, 3877, 9484, 17, 5, UNI_LIMB } /* scriptextensions=limbu */, + { 5, 10268, 8931, 3, 5, UNI_NV__60000 } /* nv=60000 */, + { 8, 10349, 36, 3, 1, UNI_VS } /* vs=t */, + { 0, 10229, 5068, 3, 6, UNI_DT__SQR } /* dt=square */, + { 0, 9476, 9484, 3, 5, UNI_SC__LIMB } /* sc=limbu */, + { 3, 6340, 9034, 3, 5, UNI_INCHAKMA } /* inchakma */, + { 0, 185, 
115, 3, 34, UNI_DIACRITICALSFORSYMBOLS } /* iscombiningdiacriticalmarksforsymbols */, + { 1, 9691, 4410, 4, 6, UNI_INSYRIAC } /* blk=syriac */, + { 1, 185, 1925, 3, 21, UNI_INDICNUMBERFORMS } /* iscommonindicnumberforms */, + { 3, 9979, 2584, 4, 4, UNI_MAND } /* scx=mand */, + { 0, 9476, 8, 4, 3, UNI_SC__KANA } /* sc=kana */, + { 1, 6340, 7261, 3, 9, UNI_INCHORASMIAN } /* inchorasmian */, + { 1, 10229, 9141, 3, 6, UNI_DT__NAR } /* dt=narrow */, + { 0, 9647, 10340, 4, 3, UNI_AGE__8 } /* age=v80 */, + { 0, 8782, 9643, 7, 4, UNI_SC__ADLM } /* script=adlm */, + { 0, 3877, 9683, 17, 4, UNI_BATK } /* scriptextensions=batk */, + { 1, 10528, 0, 5, 0, UNI_XPOSIXPRINT } /* print */, + { 2, 10268, 9249, 3, 4, UNI_NV__1_SLASH_16 } /* nv=1/16 */, + { 6, 9476, 1629, 3, 4, UNI_SC__PHAG } /* sc=phag */, + { 3, 4074, 7550, 16, 10, UNI_CN } /* generalcategory=unassigned */, + { 1, 5408, 481, 4, 29, UNI_MATHALPHANUM } /* inmathematicalalphanumericsymbols */, + { 4, 9711, 9325, 5, 4, UNI_CCC__19 } /* ccc=ccc19 */, + { 1, 185, 5578, 2, 14, UNI_MN } /* isnonspacingmark */, + { 8, 10268, 8913, 3, 2, UNI_NV__40 } /* nv=40 */, + { 3, 2304, 9924, 3, 3, UNI_OUGR } /* isougr */, + { 13, 9461, 10394, 3, 2, UNI_SB__XX } /* sb=xx */, + { 18, 9077, 10355, 4, 3, UNI_EXT } /* ext=yes */, + { 4, 1190, 496, 3, 7, UNI_NT__NU } /* nt=numeric */, + { 1, 3877, 9183, 17, 6, UNI_RJNG } /* scriptextensions=rejang */, + { 0, 9476, 7071, 3, 4, UNI_SORA } /* sc=sora */, + { 0, 9711, 41, 4, 2, UNI_CCC__DA } /* ccc=da */, + { 0, 10268, 8236, 3, 8, UNI_NV__17_SLASH_2 } /* nv=8.50e+00 */, + { 12, 1185, 0, 3, 0, UNI_DEP } /* dep */, + { 0, 185, 3826, 2, 4, UNI_MANI } /* ismani */, + { 1, 8276, 0, 8, 0, UNI_BALI } /* balinese */, + { 0, 5830, 0, 5, 0, UNI_EBASE } /* ebase */, + { 0, 6083, 10127, 13, 3, UNI_NV__1_SLASH_5 } /* numericvalue=1/5 */, + { 0, 9691, 2433, 4, 10, UNI_INGLAGOLITIC } /* blk=glagolitic */, + { 12, 3877, 8284, 17, 4, UNI_BASS } /* scriptextensions=bass */, + { 0, 9159, 26, 6, 1, UNI_NFDQC__Y } 
/* nfdqc=y */, + { 0, 5901, 0, 13, 0, UNI_KANAEXTB } /* kanaextendedb */, + { 15, 3877, 3103, 17, 6, UNI_COPT } /* scriptextensions=coptic */, + { 10, 8782, 8859, 7, 7, UNI_TIBT } /* script=tibetan */, + { 1, 9476, 3193, 3, 4, UNI_ETHI } /* sc=ethi */, + { 0, 1553, 10398, 9, 2, UNI_ZP } /* category=zp */, + { 0, 8973, 6242, 6, 12, UNI_ETHIOPICEXTB } /* block=ethiopicextb */, + { 1, 10244, 1288, 3, 2, UNI_UPPERCASELETTER } /* gc=lu */, + { 42, 9476, 9967, 3, 4, UNI_RUNR } /* sc=runr */, + { 1, 9979, 8530, 4, 7, UNI_AVST } /* scx=avestan */, + { 1, 9763, 126, 4, 2, UNI_LB__CR } /* gcb=cr */, + { 8, 9476, 9791, 3, 4, UNI_HLUW } /* sc=hluw */, + { 0, 9476, 8530, 3, 7, UNI_AVST } /* sc=avestan */, + { 1, 9647, 9595, 4, 4, UNI_AGE__12_DOT_1 } /* age=12.1 */, + { 11, 9476, 10115, 3, 4, UNI_SC__QAAI } /* sc=zinh */, + { 2, 8973, 5606, 6, 14, UNI_PHONETICEXTSUP } /* block=phoneticextsup */, + { 1, 6083, 7980, 13, 8, UNI_NV__1_SLASH_6 } /* numericvalue=1.67e-01 */, + { 0, 9691, 4410, 4, 9, UNI_SYRIACSUP } /* blk=syriacsup */, + { 3, 185, 7792, 3, 2, UNI_CWT } /* iscwt */, + { 0, 8782, 9723, 7, 4, UNI_SC__CPRT } /* script=cprt */, + { 6, 9979, 9891, 4, 4, UNI_NEWA } /* scx=newa */, + { 0, 8551, 0, 7, 0, UNI_CJKEXTB } /* cjkextb */, + { 0, 8444, 9454, 8, 5, -UNI_RADICAL } /* radical=false */, + { 4, 8782, 8663, 7, 7, UNI_SC__LINA } /* script=lineara */, + { 2, 9691, 6590, 4, 12, UNI_INOLDHUNGARIAN } /* blk=oldhungarian */, + { 6, 8973, 2144, 7, 13, UNI_CJKRADICALSSUP } /* block=cjkradicalssup */, + { 2, 4074, 10398, 16, 2, UNI_ZP } /* generalcategory=zp */, + { 1, 6083, 9615, 13, 4, UNI_NV__17_SLASH_2 } /* numericvalue=17/2 */, + { 0, 7360, 126, 10, 2, UNI_LB__CR } /* linebreak=cr */, + { 0, 8973, 8635, 6, 7, UNI_INHANUNOO } /* block=hanunoo */, + { 3, 6083, 9249, 13, 4, UNI_NV__1_SLASH_16 } /* numericvalue=1/16 */, + { 0, 9691, 1701, 4, 23, UNI_SHORTHANDFORMATCONTROLS } /* blk=shorthandformatcontrols */, + { 1, 9489, 36, 5, 1, UNI_MATH } /* math=t */, + { 0, 4534, 0, 4, 0, 
UNI_BRAI } /* brai */, + { 11, 25, 0, 1, 0, UNI_S } /* s */, + { 2, 9464, 9454, 5, 5, -UNI_IDST } /* idst=false */, + { 2, 185, 8276, 2, 8, UNI_BALI } /* isbalinese */, + { 8, 7160, 7160, 3, 10, UNI_YISYLLABLES } /* isyisyllables */, + { 5, 8973, 1219, 6, 8, UNI_INKATAKANA } /* block=katakana */, + { 2, 2593, 3517, 20, 18, UNI_VO__TR } /* verticalorientation=transformedrotated */, + { 0, 6083, 7932, 13, 8, UNI_NV__1_SLASH_8 } /* numericvalue=1.25e-01 */, + { 3, 6083, 10364, 13, 2, UNI_NV__45 } /* numericvalue=45 */, + { 1, 9979, 8691, 4, 7, UNI_MULT } /* scx=multani */, + { 8, 2312, 3079, 5, 6, UNI_HALFMARKS } /* inhalfmarks */, + { 0, 8973, 2100, 6, 15, UNI_TRANSPORTANDMAP } /* block=transportandmap */, + { 0, 5662, 73, 14, 2, UNI_SB__LE } /* sentencebreak=le */, + { 1, 9476, 10039, 3, 4, UNI_THAI } /* sc=thai */, + { 2, 10553, 8454, 4, 6, UNI_SPECIALS } /* isspecials */, + { 0, 10217, 5926, 3, 3, UNI_BC__RLO } /* bc=rlo */, + { 1, 2206, 0, 21, 0, UNI_gcb_values_index } /* graphemeclusterbreak= */, + { 2, 1190, 6001, 3, 4, UNI_NV__NAN } /* nt=none */, + { 1, 9979, 9947, 4, 4, UNI_COPT } /* scx=qaac */, + { 0, 9979, 9643, 4, 4, UNI_ADLM } /* scx=adlm */, + { 0, 9763, 36, 4, 1, UNI_GCB__T } /* gcb=t */, + { 0, 3283, 0, 18, 0, UNI_idsb_values_index } /* idsbinaryoperator= */, + { 0, 3398, 26, 11, 1, UNI_XPOSIXSPACE } /* whitespace=y */, + { 0, 7230, 6146, 10, 12, UNI_BC__AN } /* bidiclass=arabicnumber */, + { 3, 185, 9093, 2, 6, UNI_KTHI } /* iskaithi */, + { 8, 9476, 7104, 3, 11, UNI_SC__SYLO } /* sc=sylotinagri */, + { 0, 10516, 9936, 3, 3, UNI_PHNX } /* isphnx */, + { 0, 6338, 1, 12, 1, -UNI_JOINC } /* joincontrol=n */, + { 0, 5662, 0, 16, 0, UNI_SB__SP } /* sentencebreak=sp */, + { 0, 6083, 0, 13, 0, UNI_nv_values_index } /* numericvalue= */, + { 5, 3877, 9117, 17, 4, UNI_LEPC } /* scriptextensions=lepc */, + { 1, 9979, 9799, 4, 4, UNI_HMNP } /* scx=hmnp */, + { 1, 10268, 8925, 3, 5, UNI_NV__50000 } /* nv=50000 */, + { 1, 185, 8684, 2, 4, UNI_MARC } /* ismarc */, 
+ { 0, 9979, 9875, 4, 4, UNI_MTEI } /* scx=mtei */, + { 1, 10253, 2468, 3, 2, UNI_LB__HL } /* lb=hl */, + { 0, 9979, 3622, 4, 17, UNI_AGHB } /* scx=caucasianalbanian */, + { 1, 9691, 1442, 4, 10, UNI_CJKSYMBOLS } /* blk=cjksymbols */, + { 6, 8967, 10355, 6, 3, UNI_BIDIM } /* bidim=yes */, + { 3, 9474, 2632, 5, 19, UNI_INSC__BRAHMIJOININGNUMBER } /* insc=brahmijoiningnumber */, + { 0, 3877, 9699, 17, 4, UNI_BUHD } /* scriptextensions=buhd */, + { 1, 6083, 8052, 13, 8, UNI_NV__1_SLASH_320 } /* numericvalue=3.13e-03 */, + { 1, 9464, 10055, 5, 4, UNI_IDST } /* idst=true */, + { 5, 10244, 5578, 3, 14, UNI_MN } /* gc=nonspacingmark */, + { 0, 1418, 8998, 25, 4, UNI_CCC__11 } /* canonicalcombiningclass=ccc11 */, + { 3, 9464, 1, 5, 1, -UNI_IDST } /* idst=n */, + { 0, 1538, 3499, 24, 10, UNI_INPC__TOPANDLEFT } /* indicpositionalcategory=topandleft */, + { 9, 5830, 1026, 6, 2, -UNI_EBASE } /* ebase=no */, + { 16, 185, 2493, 2, 20, UNI_HMNP } /* isnyiakengpuachuehmong */, + { 0, 185, 3265, 2, 4, UNI_GEOR } /* isgeor */, + { 2, 5408, 6508, 4, 10, UNI_MATHALPHANUM } /* inmathalphanum */, + { 1, 2353, 0, 20, 0, UNI_HLUW } /* anatolianhieroglyphs */, + { 2, 9051, 1026, 6, 2, -UNI_ECOMP } /* ecomp=no */, + { 0, 7560, 3, 10, 1, -UNI_XPOSIXUPPER } /* uppercase=f */, + { 2, 8973, 8530, 6, 7, UNI_INAVESTAN } /* block=avestan */, + { 1, 9509, 0, 5, 0, UNI_OGAM } /* ogham */, + { 0, 2248, 2937, 3, 8, UNI_INSUNDANESE } /* insundanese */, + { 3, 1990, 729, 22, 6, UNI_INSC__NUMBER } /* indicsyllabiccategory=number */, + { 9, 7360, 6302, 10, 12, UNI_LB__HL } /* linebreak=hebrewletter */, + { 0, 8973, 115, 7, 34, UNI_DIACRITICALSFORSYMBOLS } /* block=combiningdiacriticalmarksforsymbols */, + { 0, 185, 952, 2, 28, UNI_VSSUP } /* isvariationselectorssupplement */, + { 1, 8881, 1008, 3, 16, UNI_ANCIENTGREEKMUSIC } /* isancientgreekmusic */, + { 1, 3553, 10355, 18, 3, UNI_VS } /* variationselector=yes */, + { 6, 10232, 9, 3, 2, UNI_EA__NA } /* ea=na */, + { 1, 9459, 1, 5, 1, -UNI_IDSB } /* 
idsb=n */, + { 6, 7467, 5732, 3, 2, UNI_IN__10 } /* in=10 */, + { 0, 415, 0, 32, 0, UNI_INIDC } /* ideographicdescriptioncharacters */, + { 2, 21, 7330, 2, 10, UNI_INKHAROSHTHI } /* inkharoshthi */, + { 5, 1770, 0, 22, 0, UNI_bpt_values_index } /* bidipairedbrackettype= */, + { 1, 4157, 3776, 3, 16, UNI_INDICSIYAQNUMBERS } /* isindicsiyaqnumbers */, + { 0, 8973, 5074, 6, 14, UNI_ANCIENTSYMBOLS } /* block=ancientsymbols */, + { 1, 9476, 9699, 3, 4, UNI_SC__BUHD } /* sc=buhd */, + { 7, 9979, 2708, 4, 19, UNI_EGYP } /* scx=egyptianhieroglyphs */, + { 0, 10253, 5830, 3, 5, UNI_EBASE } /* lb=ebase */, + { 1, 9476, 9117, 3, 4, UNI_LEPC } /* sc=lepc */, + { 0, 7826, 0, 9, 0, UNI_ORKH } /* oldturkic */, + { 17, 9711, 9385, 5, 4, UNI_CCC__31 } /* ccc=ccc31 */, + { 4, 7467, 10071, 3, 4, UNI_IN__12_DOT_1 } /* in=v121 */, + { 1, 9087, 36, 6, 1, UNI_JOINC } /* joinc=t */, + { 0, 9691, 7260, 4, 10, UNI_INCHORASMIAN } /* blk=chorasmian */, + { 1, 1274, 0, 20, 0, UNI_CE } /* compositionexclusion */, + { 1, 8782, 9207, 7, 4, UNI_SC__THAA } /* script=thaa */, + { 0, 10516, 7854, 3, 8, UNI_PAUC } /* ispaucinhau */, + { 0, 3448, 1, 3, 33, UNI_UCAS } /* inunifiedcanadianaboriginalsyllabics */, + { 0, 9461, 34, 3, 2, UNI_SB__EX } /* sb=ex */, + { 1, 4154, 5030, 3, 14, UNI_VEDICEXT } /* invedicextensions */, + { 4, 1418, 5732, 24, 2, UNI_CCC__10 } /* canonicalcombiningclass=10 */, + { 2, 185, 631, 3, 29, UNI_CJKEXTE } /* iscjkunifiedideographsextensione */, + { 4, 9474, 4346, 5, 5, UNI_INSC__OTHER } /* insc=other */, + { 0, 9476, 4186, 3, 7, UNI_SC__LINB } /* sc=linearb */, + { 0, 1189, 10052, 3, 3, UNI_INTOTO } /* intoto */, + { 10, 8973, 3826, 6, 10, UNI_INMANICHAEAN } /* block=manichaean */, + { 5, 4972, 2101, 3, 21, UNI_TRANSPORTANDMAP } /* istransportandmapsymbols */, + { 2, 9429, 0, 4, 0, UNI_CWCF } /* cwcf */, + { 3, 7360, 2664, 10, 2, UNI_LB__BA } /* linebreak=ba */, + { 1, 7360, 6287, 10, 2, UNI_LB__ZW } /* linebreak=zw */, + { 0, 7560, 10355, 10, 3, UNI_XPOSIXUPPER } /* 
uppercase=yes */, + { 1, 3877, 6730, 17, 11, UNI_CPMN } /* scriptextensions=cyprominoan */, + { 0, 8973, 1903, 7, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* block=cjkcompatideographssup */, + { 2, 7360, 6829, 10, 11, UNI_LB__IN } /* linebreak=inseperable */, + { 1, 21, 8663, 2, 7, UNI_INLINEARA } /* inlineara */, + { 0, 9214, 10355, 5, 3, UNI_IDEO } /* ideo=yes */, + { 2, 2248, 8811, 3, 6, UNI_INSOYOMBO } /* insoyombo */, + { 7, 2248, 4411, 3, 8, UNI_SYRIACSUP } /* insyriacsup */, + { 10, 185, 4639, 2, 15, UNI_PD } /* isdashpunctuation */, + { 1, 3877, 8468, 17, 4, UNI_TAGB } /* scriptextensions=tagb */, + { 3, 4074, 4639, 16, 15, UNI_PD } /* generalcategory=dashpunctuation */, + { 1, 10244, 1528, 3, 9, UNI__PERL_SURROGATE } /* gc=surrogate */, + { 8, 1088, 10355, 27, 3, UNI_PCM } /* prependedconcatenationmark=yes */, + { 1, 10253, 5102, 3, 14, UNI_LB__CR } /* lb=carriagereturn */, + { 0, 4972, 8477, 3, 7, UNI_TFNG } /* istifinagh */, + { 12, 10217, 3741, 3, 17, UNI_BC__ES } /* bc=europeanseparator */, + { 0, 185, 8621, 2, 7, UNI_GRAN } /* isgrantha */, + { 0, 8854, 5275, 3, 9, UNI_YIRADICALS } /* inyiradicals */, + { 1, 9979, 3265, 4, 4, UNI_GEOR } /* scx=geor */, + { 0, 8973, 7381, 6, 2, UNI_INVS } /* block=vs */, + { 0, 7330, 0, 10, 0, UNI_KHAR } /* kharoshthi */, + { 0, 3877, 3826, 17, 10, UNI_MANI } /* scriptextensions=manichaean */, + { 10, 9731, 10055, 4, 4, UNI_CWT } /* cwt=true */, + { 1, 185, 436, 2, 5, UNI__PERL_NCHAR } /* isnchar */, + { 4, 3962, 0, 9, 0, UNI_ARABICSUP } /* arabicsup */, + { 2, 10217, 10238, 3, 3, UNI_BC__FSI } /* bc=fsi */, + { 4, 21, 9231, 2, 6, UNI_INWANCHO } /* inwancho */, + { 0, 5516, 0, 3, 0, UNI_ANY } /* any */, + { 0, 7460, 10059, 10, 4, UNI_IN__10 } /* presentin=v100 */, + { 3, 1990, 4154, 22, 16, UNI_INSC__INVISIBLESTACKER } /* indicsyllabiccategory=invisiblestacker */, + { 14, 185, 1, 2, 1, UNI_N } /* isn */, + { 4, 8973, 2085, 6, 4, UNI_INMODI } /* block=modi */, + { 8, 10253, 4898, 3, 2, UNI_LB__QU } /* lb=qu */, + { 1, 10244, 1, 
3, 1, UNI_N } /* gc=n */, + { 2, 9469, 9, 5, 2, UNI_INPC__NA } /* inpc=na */, + { 6, 10268, 8925, 3, 6, UNI_NV__500000 } /* nv=500000 */, + { 0, 9727, 36, 4, 1, UNI_CWL } /* cwl=t */, + { 1, 8628, 3, 7, 1, -UNI_GRBASE } /* grbase=f */, + { 7, 7460, 7923, 10, 2, UNI_IN__11 } /* presentin=11 */, + { 0, 10217, 3797, 3, 3, UNI_BC__NSM } /* bc=nsm */, + { 9, 6338, 10355, 12, 3, UNI_JOINC } /* joincontrol=yes */, + { 3, 9691, 7540, 4, 10, UNI_SUPARROWSC } /* blk=suparrowsc */, + { 4, 7673, 0, 9, 0, UNI_EMOTICONS } /* emoticons */, + { 0, 6350, 24, 12, 1, UNI_JT__L } /* joiningtype=l */, + { 1, 10253, 5144, 3, 14, UNI_LB__SA } /* lb=complexcontext */, + { 8, 4042, 0, 16, 0, UNI_CYPRIOTSYLLABARY } /* cypriotsyllabary */, + { 1, 9711, 185, 4, 2, UNI_CCC__IS } /* ccc=is */, + { 3, 4699, 36, 15, 1, UNI_ECOMP } /* emojicomponent=t */, + { 9, 1418, 9415, 25, 4, UNI_CCC__84 } /* canonicalcombiningclass=ccc84 */, + { 0, 7230, 1, 11, 1, UNI_BC__BN } /* bidiclass=bn */, + { 2, 9691, 8492, 4, 8, UNI_UCASEXTA } /* blk=ucasexta */, + { 9, 3877, 2085, 17, 4, UNI_MODI } /* scriptextensions=modi */, + { 0, 1418, 23, 24, 2, UNI_CCC__AL } /* canonicalcombiningclass=al */, + { 0, 8973, 8404, 6, 8, UNI_KANAEXTB } /* block=kanaextb */, + { 8, 9529, 0, 5, 0, UNI_TALE } /* taile */, + { 0, 7500, 0, 10, 0, UNI_SAUR } /* saurashtra */, + { 0, 6083, 9254, 13, 3, UNI_NV__1_SLASH_3 } /* numericvalue=1/3 */, + { 10, 4759, 0, 15, 0, UNI_ARMI } /* imperialaramaic */, + { 1, 10247, 5448, 3, 4, UNI_JG__HETH } /* jg=heth */, + { 0, 185, 75, 2, 2, UNI_ME } /* isme */, + { 0, 8782, 7808, 7, 9, UNI_ITAL } /* script=olditalic */, + { 2, 8973, 810, 6, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* block=enclosedideographicsupplement */, + { 0, 3877, 7790, 17, 9, UNI_TALU } /* scriptextensions=newtailue */, + { 3, 8782, 7430, 7, 10, UNI_SOGO } /* script=oldsogdian */, + { 10, 8782, 9201, 7, 4, UNI_SC__TELU } /* script=telu */, + { 0, 9476, 3103, 3, 4, UNI_SC__COPT } /* sc=copt */, + { 10, 7467, 10319, 3, 3, 
UNI_IN__5_DOT_1 } /* in=v51 */, + { 0, 6057, 0, 13, 0, UNI_MISCTECHNICAL } /* misctechnical */, + { 1, 3690, 0, 17, 0, UNI_CYRILLICEXTC } /* cyrillicextendedc */, + { 0, 9763, 5830, 4, 5, UNI_WB__EB } /* gcb=ebase */, + { 5, 9979, 3826, 4, 10, UNI_MANI } /* scx=manichaean */, + { 1, 9979, 9284, 4, 5, UNI_BATK } /* scx=batak */, + { 0, 10352, 7898, 3, 9, UNI_WB__WSEGSPACE } /* wb=wsegspace */, + { 0, 3877, 8831, 17, 7, UNI_TGLG } /* scriptextensions=tagalog */, + { 1, 7682, 9454, 9, 5, -UNI_EXT } /* extender=false */, + { 1, 7230, 408, 10, 2, UNI_BC__ON } /* bidiclass=on */, + { 0, 8973, 6362, 6, 12, UNI_KHMERSYMBOLS } /* block=khmersymbols */, + { 0, 185, 1701, 2, 23, UNI_SHORTHANDFORMATCONTROLS } /* isshorthandformatcontrols */, + { 4, 6529, 7818, 3, 8, UNI_INOLDPERMIC } /* inoldpermic */, + { 3, 10247, 6398, 3, 12, UNI_JG__MALAYALAMBHA } /* jg=malayalambha */, + { 0, 5875, 3860, 13, 17, UNI_JG__MANICHAEANTHAMEDH } /* joininggroup=manichaeanthamedh */, + { 1, 8593, 0, 6, 0, UNI_COMPEX } /* compex */, + { 10, 4286, 0, 10, 0, UNI_SM } /* mathsymbol */, + { 1, 3157, 1, 18, 1, -UNI_EBASE } /* emojimodifierbase=n */, + { 0, 7908, 26, 8, 1, UNI_IDS } /* idstart=y */, + { 13, 9711, 8920, 4, 2, UNI_CCC__32 } /* ccc=32 */, + { 0, 8973, 8372, 6, 8, UNI_JAMOEXTA } /* block=jamoexta */, + { 0, 3365, 0, 8, 0, UNI_DINGBATS } /* dingbats */, + { 0, 10268, 7947, 3, 2, UNI_NV__21 } /* nv=21 */, + { 1, 3391, 0, 18, 0, UNI_patws_values_index } /* patternwhitespace= */, + { 11, 9735, 0, 4, 0, UNI_cwu_values_index } /* cwu= */, + { 1, 10268, 9579, 3, 4, UNI_NV__1_SLASH_80 } /* nv=1/80 */, + { 1, 21, 7745, 2, 9, UNI_LATINEXTF } /* inlatinextf */, + { 1, 9461, 50, 3, 2, UNI_SB__AT } /* sb=at */, + { 0, 185, 3068, 3, 17, UNI_HALFMARKS } /* iscombininghalfmarks */, + { 0, 8845, 0, 7, 0, UNI_TAVT } /* taiviet */, + { 0, 3553, 9454, 18, 5, -UNI_VS } /* variationselector=false */, + { 0, 10402, 436, 6, 5, UNI__PERL_NCHAR } /* _perl_nchar */, + { 1, 10244, 5810, 3, 13, UNI_ME } /* 
gc=enclosingmark */, + { 1, 3877, 9534, 17, 4, UNI_TAKR } /* scriptextensions=takr */, + { 0, 10268, 8108, 3, 8, UNI_NV__9_SLASH_2 } /* nv=4.50e+00 */, + { 24, 10217, 3814, 3, 3, UNI_BC__RLI } /* bc=rli */, + { 0, 7560, 0, 10, 0, UNI_upper_values_index } /* uppercase= */, + { 0, 21, 4170, 2, 16, UNI_LATIN1 } /* inlatin1supplement */, + { 0, 185, 6731, 3, 10, UNI_CPMN } /* iscyprominoan */, + { 0, 909, 0, 14, 0, UNI_PUA } /* privateusearea */, + { 1, 185, 1815, 3, 20, UNI_CWCM } /* ischangeswhencasemapped */, + { 0, 7160, 2333, 3, 20, UNI_YIJING } /* isyijinghexagramsymbols */, + { 9, 10516, 7845, 3, 8, UNI_PALM } /* ispalmyrene */, + { 9, 10109, 5062, 5, 12, UNI_INZANABAZARSQUARE } /* inzanabazarsquare */, + { 1, 9476, 8468, 3, 8, UNI_SC__TAGB } /* sc=tagbanwa */, + { 0, 9691, 2708, 4, 19, UNI_INEGYPTIANHIEROGLYPHS } /* blk=egyptianhieroglyphs */, + { 1, 9476, 6290, 3, 12, UNI_SC__GONG } /* sc=gunjalagondi */, + { 0, 952, 0, 28, 0, UNI_VSSUP } /* variationselectorssupplement */, + { 1, 21, 9093, 2, 6, UNI_INKAITHI } /* inkaithi */, + { 0, 7570, 0, 10, 0, UNI_WARA } /* warangciti */, + { 12, 1678, 0, 23, 0, UNI_LATINEXTADDITIONAL } /* latinextendedadditional */, + { 2, 10398, 0, 2, 0, UNI_ZP } /* zp */, + { 1, 9927, 3, 4, 1, -UNI_PCM } /* pcm=f */, + { 0, 9711, 8119, 4, 1, UNI_CCC__9 } /* ccc=9 */, + { 0, 5093, 26, 9, 1, UNI_XPOSIXXDIGIT } /* hexdigit=y */, + { 13, 6338, 1026, 12, 2, -UNI_JOINC } /* joincontrol=no */, + { 1, 9476, 7104, 3, 4, UNI_SC__SYLO } /* sc=sylo */, + { 0, 9647, 8119, 4, 1, UNI_AGE__9 } /* age=9 */, + { 3, 9979, 8656, 4, 7, UNI_KALI } /* scx=kayahli */, + { 2, 8702, 812, 4, 20, UNI_ENCLOSEDIDEOGRAPHICSUP } /* inenclosedideographicsup */, + { 0, 9711, 10145, 4, 3, UNI_CCC__BL } /* ccc=218 */, + { 0, 9979, 6972, 4, 11, UNI_NAND } /* scx=nandinagari */, + { 6, 9691, 6218, 4, 12, UNI_CYRILLICEXTC } /* blk=cyrillicextc */, + { 3, 9691, 2311, 4, 21, UNI_SINHALAARCHAICNUMBERS } /* blk=sinhalaarchaicnumbers */, + { 1, 10247, 7340, 3, 10, 
UNI_JG__KNOTTEDHEH } /* jg=knottedheh */, + { 1, 8782, 9679, 7, 4, UNI_AVST } /* script=avst */, + { 0, 3877, 8838, 17, 7, UNI_LANA } /* scriptextensions=taitham */, + { 13, 4699, 10355, 15, 3, UNI_ECOMP } /* emojicomponent=yes */, + { 1, 8859, 0, 7, 0, UNI_TIBT } /* tibetan */, + { 8, 5116, 3, 14, 1, -UNI_CI } /* caseignorable=f */, + { 9, 6340, 3657, 3, 16, UNI_CYRILLICEXTA } /* incyrillicextendeda */, + { 0, 8803, 0, 4, 0, UNI_SIDD } /* sidd */, + { 0, 10268, 8099, 3, 2, UNI_NV__14 } /* nv=14 */, + { 0, 8782, 9294, 7, 5, UNI_SC__BUHD } /* script=buhid */, + { 2, 1418, 2473, 24, 4, UNI_CCC__L } /* canonicalcombiningclass=left */, + { 0, 6340, 6219, 3, 11, UNI_CYRILLICEXTC } /* incyrillicextc */, + { 9, 2808, 1372, 4, 22, UNI_ARABICPFA } /* inarabicpresentationformsa */, + { 0, 5875, 6398, 13, 12, UNI_JG__MALAYALAMBHA } /* joininggroup=malayalambha */, + { 0, 8973, 479, 6, 31, UNI_MATHALPHANUM } /* block=mathematicalalphanumericsymbols */, + { 2, 3355, 0, 18, 0, UNI_ORNAMENTALDINGBATS } /* ornamentaldingbats */, + { 1, 7218, 1220, 3, 4, UNI_INBATAK } /* inbatak */, + { 0, 7460, 9600, 10, 3, UNI_IN__3 } /* presentin=3.0 */, + { 0, 3265, 0, 18, 0, UNI_GEORGIANSUP } /* georgiansupplement */, + { 6, 9459, 36, 5, 1, UNI_IDSB } /* idsb=t */, + { 11, 9979, 8508, 4, 8, UNI_VITH } /* scx=vithkuqi */, + { 4, 8782, 8979, 7, 4, UNI_CARI } /* script=cari */, + { 0, 8973, 4170, 6, 6, UNI_LATIN1 } /* block=latin1 */, + { 0, 9735, 1026, 4, 2, -UNI_CWU } /* cwu=no */, + { 0, 8782, 9529, 7, 5, UNI_SC__TALE } /* script=taile */, + { 0, 4972, 9196, 3, 5, UNI_TNSA } /* istangsa */, + { 1, 9691, 4170, 4, 9, UNI_LATIN1 } /* blk=latin1sup */, + { 0, 21, 7570, 2, 10, UNI_INWARANGCITI } /* inwarangciti */, + { 1, 6340, 3050, 3, 7, UNI_INCHEROKEE } /* incherokee */, + { 0, 6083, 8196, 13, 8, UNI_NV__15_SLASH_2 } /* numericvalue=7.50e+00 */, + { 0, 4074, 46, 16, 2, UNI_CO } /* generalcategory=co */, + { 6, 2553, 26, 20, 1, UNI_TERM } /* terminalpunctuation=y */, + { 2, 9691, 2879, 4, 19, 
UNI_MONGOLIANSUP } /* blk=mongoliansupplement */, + { 6, 185, 9863, 2, 4, UNI_MIAO } /* ismiao */, + { 13, 1770, 0, 23, 0, UNI_BPT__C } /* bidipairedbrackettype=c */, + { 0, 10352, 7763, 3, 9, UNI_WB__ML } /* wb=midletter */, + { 11, 9469, 2579, 5, 14, UNI_INPC__BOTTOMANDRIGHT } /* inpc=bottomandright */, + { 0, 9550, 1, 4, 1, -UNI_IDS } /* ids=n */, + { 2, 6340, 721, 3, 29, UNI_CUNEIFORMNUMBERS } /* incuneiformnumbersandpunctuation */, + { 14, 8973, 7781, 6, 9, UNI_INNABATAEAN } /* block=nabataean */, + { 0, 9691, 952, 4, 28, UNI_VSSUP } /* blk=variationselectorssupplement */, + { 0, 185, 8292, 2, 8, UNI_BUGI } /* isbuginese */, + { 11, 9476, 9723, 3, 4, UNI_SC__CPRT } /* sc=cprt */, + { 0, 10247, 9554, 3, 5, UNI_JG__ZHAIN } /* jg=zhain */, + { 0, 8973, 9831, 6, 3, UNI_INLAO } /* block=lao */, + { 0, 1418, 9010, 25, 5, UNI_CCC__129 } /* canonicalcombiningclass=ccc129 */, + { 0, 3945, 1, 17, 1, -UNI_UIDEO } /* unifiedideograph=n */, + { 2, 185, 3157, 2, 5, UNI_EMOJI } /* isemoji */, + { 8, 7467, 9599, 3, 4, UNI_IN__13 } /* in=13.0 */, + { 0, 8782, 3193, 7, 4, UNI_ETHI } /* script=ethi */, + { 0, 7360, 7250, 10, 10, UNI_LB__BA } /* linebreak=breakafter */, + { 0, 185, 2727, 2, 19, UNI_ENCLOSEDALPHANUMSUP } /* isenclosedalphanumsup */, + { 1, 9476, 9655, 3, 4, UNI_AHOM } /* sc=ahom */, + { 0, 3877, 9911, 17, 4, UNI_ORKH } /* scriptextensions=orkh */, + { 1, 3121, 3525, 18, 3, UNI_DT__MED } /* decompositiontype=med */, + { 0, 9691, 6752, 4, 6, UNI_DOMINO } /* blk=domino */, + { 10, 10402, 7908, 6, 7, UNI__PERL_IDSTART } /* _perl_idstart */, + { 2, 3448, 8493, 3, 6, UNI_UCASEXT } /* inucasext */, + { 3, 9691, 5059, 4, 15, UNI_INZANABAZARSQUARE } /* blk=zanabazarsquare */, + { 1, 2248, 925, 3, 27, UNI_SUPPUAB } /* insupplementaryprivateuseareab */, + { 4, 1528, 0, 9, 0, UNI__PERL_SURROGATE } /* surrogate */, + { 1, 9727, 9454, 4, 5, -UNI_CWL } /* cwl=false */, + { 5, 9691, 1935, 4, 11, UNI_NUMBERFORMS } /* blk=numberforms */, + { 2, 9647, 9587, 4, 4, UNI_AGE__11 } /* 
age=11.0 */, + { 0, 4699, 1, 15, 1, -UNI_ECOMP } /* emojicomponent=n */, + { 0, 10560, 8509, 3, 7, UNI_VITH } /* isvithkuqi */, + { 0, 8782, 8537, 7, 7, UNI_SC__BENG } /* script=bengali */, + { 0, 9691, 8663, 4, 7, UNI_INLINEARA } /* blk=lineara */, + { 1, 2242, 2494, 3, 19, UNI_INNYIAKENGPUACHUEHMONG } /* innyiakengpuachuehmong */, + { 0, 1990, 7470, 22, 10, UNI_INSC__PUREKILLER } /* indicsyllabiccategory=purekiller */, + { 2, 185, 6230, 2, 12, UNI_ETHIOPICEXTA } /* isethiopicexta */, + { 0, 9691, 8260, 4, 8, UNI_INARMENIAN } /* blk=armenian */, + { 0, 9691, 3571, 4, 17, UNI_ALCHEMICAL } /* blk=alchemicalsymbols */, + { 3, 1014, 0, 5, 0, UNI_GREK } /* greek */, + { 1, 10516, 0, 3, 0, UNI_P } /* isp */, + { 8, 10268, 5732, 3, 13, UNI_NV__1000000000000 } /* nv=1000000000000 */, + { 3, 8973, 8775, 6, 7, UNI_INPHAGSPA } /* block=phagspa */, + { 0, 1990, 2670, 22, 19, UNI_INSC__CONSONANTHEADLETTER } /* indicsyllabiccategory=consonantheadletter */, + { 8, 9474, 4458, 5, 16, UNI_INSC__VOWELINDEPENDENT } /* insc=vowelindependent */, + { 2, 9803, 6070, 4, 13, UNI_HST__NA } /* hst=notapplicable */, + { 1, 185, 4410, 2, 16, UNI_SYRIACSUP } /* issyriacsupplement */, + { 2, 1418, 7220, 24, 10, UNI_CCC__BR } /* canonicalcombiningclass=belowright */, + { 1, 185, 44, 3, 8, UNI_CJKCOMPAT } /* iscjkcompat */, + { 0, 7460, 7550, 10, 10, UNI_AGE__NA } /* presentin=unassigned */, + { 8, 7580, 3409, 10, 17, UNI_RI } /* wordbreak=regionalindicator */, + { 0, 9476, 7817, 3, 9, UNI_SC__PERM } /* sc=oldpermic */, + { 10, 9691, 4314, 4, 7, UNI_INMYANMAR } /* blk=myanmar */, + { 1, 5758, 3, 13, 1, -UNI_BIDIM } /* bidimirrored=f */, + { 3, 9476, 6593, 3, 4, UNI_HUNG } /* sc=hung */, + { 2, 8973, 8845, 6, 7, UNI_INTAIVIET } /* block=taiviet */, + { 0, 9979, 7072, 5, 10, UNI_SORA } /* scx=sorasompeng */, + { 9, 9647, 7995, 4, 2, UNI_AGE__12 } /* age=12 */, + { 0, 3826, 0, 4, 0, UNI_MANI } /* mani */, + { 2, 10217, 408, 3, 2, UNI_BC__ON } /* bc=on */, + { 1, 8955, 0, 6, 0, UNI_alpha_values_index 
} /* alpha= */, + { 0, 570, 0, 30, 0, UNI_CJKEXTC } /* cjkunifiedideographsextensionc */, + { 8, 3877, 4759, 17, 15, UNI_ARMI } /* scriptextensions=imperialaramaic */, + { 6, 9727, 1, 4, 1, -UNI_CWL } /* cwl=n */, + { 6, 7297, 5669, 3, 3, UNI_HEBR } /* ishebr */, + { 0, 6937, 4302, 6, 12, UNI_MISCMATHSYMBOLSB } /* inmiscmathsymbolsb */, + { 0, 9075, 9454, 6, 5, -UNI_GREXT } /* grext=false */, + { 6, 6083, 10133, 13, 3, UNI_NV__1_SLASH_9 } /* numericvalue=1/9 */, + { 0, 2312, 2767, 4, 17, UNI_JAMOEXTB } /* inhanguljamoextendedb */, + { 1, 3877, 8276, 17, 4, UNI_BALI } /* scriptextensions=bali */, + { 8, 5172, 1, 14, 1, -UNI_EMOD } /* emojimodifier=n */, + { 0, 3877, 9129, 17, 4, UNI_LYCI } /* scriptextensions=lyci */, + { 6, 9727, 10055, 4, 4, UNI_CWL } /* cwl=true */, + { 17, 9711, 8998, 5, 5, UNI_CCC__118 } /* ccc=ccc118 */, + { 4, 6083, 9575, 13, 4, UNI_NV__1_SLASH_64 } /* numericvalue=1/64 */, + { 0, 8782, 7826, 7, 9, UNI_ORKH } /* script=oldturkic */, + { 1, 1990, 6566, 22, 12, UNI_INSC__NUMBERJOINER } /* indicsyllabiccategory=numberjoiner */, + { 2, 1990, 2868, 22, 10, UNI_INSC__TONELETTER } /* indicsyllabiccategory=toneletter */, + { 0, 9711, 10160, 4, 3, UNI_CCC__A } /* ccc=230 */, + { 0, 185, 9706, 2, 2, UNI_MC } /* ismc */, + { 3, 8444, 10055, 8, 4, UNI_RADICAL } /* radical=true */, + { 12, 9476, 5227, 3, 4, UNI_CHAM } /* sc=cham */, + { 4, 9691, 8565, 4, 7, UNI_CJKEXTD } /* blk=cjkextd */, + { 0, 3481, 0, 18, 0, UNI_TAIXUANJING } /* taixuanjingsymbols */, + { 7, 9979, 7808, 4, 9, UNI_ITAL } /* scx=olditalic */, + { 0, 4074, 10396, 16, 2, UNI_ZL } /* generalcategory=zl */, + { 2, 10268, 8052, 3, 8, UNI_NV__1_SLASH_320 } /* nv=3.13e-03 */, + { 2, 7580, 8698, 10, 7, UNI_WB__NL } /* wordbreak=newline */, + { 2, 9987, 0, 4, 0, UNI_SGNW } /* sgnw */, + { 17, 3877, 7434, 18, 6, UNI_SOGD } /* scriptextensions=sogdian */, + { 0, 4157, 416, 3, 10, UNI_IDEO } /* isideographic */, + { 0, 3265, 0, 4, 0, UNI_GEOR } /* geor */, + { 24, 9476, 2493, 3, 20, UNI_HMNP } /* 
sc=nyiakengpuachuehmong */, + { 1, 9647, 7924, 4, 3, UNI_IN__1_DOT_1 } /* age=1.1 */, + { 0, 9525, 1184, 4, 3, UNI_ANY } /* unicode */, + { 1, 10087, 0, 4, 0, UNI_WCHO } /* wcho */, + { 1, 10229, 2593, 3, 8, UNI_DT__VERT } /* dt=vertical */, + { 4, 4154, 953, 3, 17, UNI_INVS } /* invariationselectors */, + { 6, 9476, 2584, 3, 4, UNI_SC__MAND } /* sc=mand */, + { 2, 9647, 10075, 4, 4, UNI_AGE__13 } /* age=v130 */, + { 0, 2803, 0, 4, 0, UNI_IDST } /* idst */, + { 0, 8973, 2433, 6, 10, UNI_INGLAGOLITIC } /* block=glagolitic */, + { 0, 10352, 1219, 3, 8, UNI_WB__KA } /* wb=katakana */, + { 1, 7218, 9295, 3, 4, UNI_INBUHID } /* inbuhid */, + { 10, 4699, 9454, 15, 5, -UNI_ECOMP } /* emojicomponent=false */, + { 3, 9545, 36, 4, 1, UNI_IDC } /* idc=t */, + { 16, 6083, 8119, 13, 1, UNI_NV__9 } /* numericvalue=9 */, + { 1, 6083, 10372, 13, 2, UNI_NV__49 } /* numericvalue=49 */, + { 0, 3877, 4426, 17, 4, UNI_TANG } /* scriptextensions=tang */, + { 1, 9474, 1245, 5, 9, UNI_INSC__CONSONANT } /* insc=consonant */, + { 0, 10268, 7950, 3, 1, UNI_NV__4 } /* nv=4 */, + { 0, 10250, 6, 3, 1, UNI_JT__D } /* jt=d */, + { 1, 7230, 25, 10, 1, UNI_BC__S } /* bidiclass=s */, + { 1, 9691, 8691, 4, 7, UNI_INMULTANI } /* blk=multani */, + { 0, 868, 0, 18, 0, UNI_PHONETICEXT } /* phoneticextensions */, + { 2, 8782, 7105, 8, 3, UNI_SC__SYLO } /* script=sylo */, + { 6, 9077, 9454, 4, 5, -UNI_EXT } /* ext=false */, + { 24, 10247, 8852, 3, 7, UNI_JG__THINYEH } /* jg=thinyeh */, + { 4, 8973, 6290, 6, 12, UNI_INGUNJALAGONDI } /* block=gunjalagondi */, + { 0, 185, 8677, 2, 7, UNI_MAND } /* ismandaic */, + { 4, 8340, 0, 8, 0, UNI_GUJR } /* gujarati */, + { 1, 9647, 9596, 4, 3, UNI_AGE__2_DOT_1 } /* age=2.1 */, + { 0, 185, 9444, 2, 5, UNI_DOGR } /* isdogra */, + { 0, 1553, 6994, 9, 11, UNI_NO } /* category=othernumber */, + { 0, 1418, 9387, 24, 2, UNI_CCC__31 } /* canonicalcombiningclass=31 */, + { 3, 9647, 10325, 4, 3, UNI_AGE__6 } /* age=v60 */, + { 10, 9461, 1195, 3, 2, UNI_LB__LF } /* sb=lf */, + { 
4, 7467, 10331, 3, 3, UNI_IN__6_DOT_2 } /* in=v62 */, + { 4, 10510, 468, 6, 5, UNI_XPOSIXPUNCT } /* xposixpunct */, + { 8, 3877, 7105, 18, 10, UNI_SYLO } /* scriptextensions=sylotinagri */, + { 1, 3877, 8811, 18, 6, UNI_SOYO } /* scriptextensions=soyombo */, + { 0, 3877, 9779, 17, 4, UNI_GUJR } /* scriptextensions=gujr */, + { 9, 6083, 9579, 13, 4, UNI_NV__1_SLASH_80 } /* numericvalue=1/80 */, + { 36, 8973, 4378, 6, 16, UNI_SUPMATHOPERATORS } /* block=supmathoperators */, + { 4, 750, 0, 30, 0, UNI_ENCLOSEDALPHANUMSUP } /* enclosedalphanumericsupplement */, + { 3, 8396, 0, 8, 0, UNI_KANAEXTA } /* kanaexta */, + { 0, 185, 4298, 2, 16, UNI_MISCMATHSYMBOLSB } /* ismiscmathsymbolsb */, + { 5, 1189, 8839, 3, 6, UNI_INTAITHAM } /* intaitham */, + { 9, 6937, 862, 6, 6, UNI_MISCARROWS } /* inmiscarrows */, + { 1, 9476, 9943, 3, 4, UNI_PRTI } /* sc=prti */, + { 3, 3877, 8420, 17, 8, UNI_MAHJ } /* scriptextensions=mahajani */, + { 1, 9476, 8420, 3, 8, UNI_SC__MAHJ } /* sc=mahajani */, + { 1, 9979, 4534, 4, 7, UNI_BRAI } /* scx=braille */, + { 4, 9691, 4505, 5, 14, UNI_BAMUMSUP } /* blk=bamumsupplement */, + { 3, 185, 44, 3, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* iscjkcompatibilityideographssupplement */, + { 2, 10229, 46, 3, 6, UNI_DT__COM } /* dt=compat */, + { 0, 185, 6518, 2, 4, UNI_MEND } /* ismend */, + { 0, 10253, 6170, 3, 12, UNI_LB__SY } /* lb=breaksymbols */, + { 0, 21, 9484, 2, 5, UNI_INLIMBU } /* inlimbu */, + { 32, 4170, 0, 16, 0, UNI_LATIN1 } /* latin1supplement */, + { 12, 10352, 5830, 3, 5, UNI_WB__EB } /* wb=ebase */, + { 0, 8854, 9239, 4, 4, UNI_INYEZIDI } /* inyezidi */, + { 1, 10268, 7995, 3, 2, UNI_NV__12 } /* nv=12 */, + { 5, 10508, 3403, 8, 5, UNI_XPOSIXSPACE } /* isxposixspace */, + { 0, 1538, 7312, 4, 8, UNI_INDIVESAKURU } /* indivesakuru */, + { 1, 9979, 2164, 4, 8, UNI_CYRL } /* scx=cyrillic */, + { 2, 8782, 6590, 7, 12, UNI_HUNG } /* script=oldhungarian */, + { 3, 7844, 0, 9, 0, UNI_PALM } /* palmyrene */, + { 0, 5823, 1, 13, 1, -UNI_GRBASE } /* 
graphemebase=n */, + { 1, 1592, 8615, 3, 6, UNI_INELYMAIC } /* inelymaic */, + { 10, 9269, 10355, 5, 3, UNI_POSIXXDIGIT } /* ahex=yes */, + { 0, 9691, 4138, 4, 16, UNI_HIGHPUSURROGATES } /* blk=highpusurrogates */, + { 3, 9979, 9819, 4, 4, UNI_KNDA } /* scx=knda */, + { 1, 7460, 8156, 10, 3, UNI_IN__6_DOT_2 } /* presentin=6.2 */, + { 0, 10217, 37, 3, 2, UNI_BC__EN } /* bc=en */, + { 0, 6518, 0, 4, 0, UNI_MEND } /* mend */, + { 1, 9476, 6928, 3, 11, UNI_MEDF } /* sc=medefaidrin */, + { 3, 185, 1172, 2, 2, UNI_TITLE } /* islt */, + { 0, 8838, 0, 7, 0, UNI_LANA } /* taitham */, + { 0, 10244, 401, 3, 6, UNI_CF } /* gc=format */, + { 0, 1553, 4286, 9, 10, UNI_SM } /* category=mathsymbol */, + { 0, 10553, 7105, 3, 3, UNI_SYLO } /* issylo */, + { 0, 5088, 0, 14, 0, UNI_ahex_values_index } /* asciihexdigit= */, + { 3, 10352, 5948, 3, 2, UNI_WB__ML } /* wb=ml */, + { 0, 4401, 0, 4, 0, UNI_EMOD } /* emod */, + { 0, 3877, 8670, 17, 4, UNI_MAKA } /* scriptextensions=maka */, + { 1, 9057, 26, 6, 1, UNI_EMOJI } /* emoji=y */, + { 1, 3877, 8866, 17, 7, UNI_TIRH } /* scriptextensions=tirhuta */, + { 7, 4074, 407, 16, 7, UNI_XPOSIXCNTRL } /* generalcategory=control */, + { 0, 9691, 8530, 4, 7, UNI_INAVESTAN } /* blk=avestan */, + { 0, 185, 2860, 2, 19, UNI_MODIFIERTONELETTERS } /* ismodifiertoneletters */, + { 8, 10244, 1187, 3, 2, UNI_PO } /* gc=po */, + { 1, 9919, 0, 4, 0, UNI_OSGE } /* osge */, + { 1, 10268, 8907, 3, 6, UNI_NV__300000 } /* nv=300000 */, + { 1, 8782, 4411, 8, 5, UNI_SC__SYRC } /* script=syriac */, + { 2, 9691, 5888, 4, 13, UNI_KANAEXTA } /* blk=kanaextendeda */, + { 0, 10268, 8937, 3, 4, UNI_NV__7000 } /* nv=7000 */, + { 1, 9979, 3103, 4, 6, UNI_COPT } /* scx=coptic */, + { 3, 9147, 0, 6, 0, UNI_nchar_values_index } /* nchar= */, + { 2, 4074, 38, 16, 2, UNI_XPOSIXDIGIT } /* generalcategory=nd */, + { 0, 3403, 1026, 6, 2, -UNI_XPOSIXSPACE } /* space=no */, + { 1, 9270, 1026, 4, 2, -UNI_XPOSIXXDIGIT } /* hex=no */, + { 4, 1553, 5096, 9, 5, UNI_XPOSIXDIGIT } /* 
category=digit */, + { 1, 5830, 0, 6, 0, UNI_ebase_values_index } /* ebase= */, + { 9, 5875, 7170, 13, 10, UNI_JG__AFRICANFEH } /* joininggroup=africanfeh */, + { 3, 7467, 8212, 3, 3, UNI_IN__8 } /* in=8.0 */, + { 0, 7159, 0, 11, 0, UNI_YISYLLABLES } /* yisyllables */, + { 4, 8881, 6123, 3, 11, UNI_ALPHABETICPF } /* isalphabeticpf */, + { 19, 9711, 9367, 4, 2, UNI_CCC__27 } /* ccc=27 */, + { 5, 10349, 3, 3, 1, -UNI_VS } /* vs=f */, + { 0, 1880, 3, 22, 1, -UNI_CWU } /* changeswhenuppercased=f */, + { 2, 7360, 341, 10, 2, UNI_LB__OP } /* linebreak=op */, + { 0, 7467, 10301, 3, 3, UNI_IN__3 } /* in=v30 */, + { 1, 79, 0, 35, 0, UNI_ARABICMATH } /* arabicmathematicalalphabeticsymbols */, + { 1, 10553, 45, 3, 1, UNI_SK } /* issk */, + { 0, 5875, 5480, 13, 14, UNI_JG__MANICHAEANRESH } /* joininggroup=manichaeanresh */, + { 2, 7460, 7950, 10, 1, UNI_IN__4 } /* presentin=4 */, + { 6, 9979, 2632, 4, 6, UNI_BRAH } /* scx=brahmi */, + { 6, 8973, 511, 7, 19, UNI_CJK } /* block=cjkunifiedideographs */, + { 0, 7300, 10355, 10, 3, UNI_DIA } /* diacritic=yes */, + { 1, 1586, 0, 23, 0, UNI_BYZANTINEMUSIC } /* byzantinemusicalsymbols */, + { 0, 7460, 10325, 10, 3, UNI_IN__6 } /* presentin=v60 */, + { 0, 9735, 36, 4, 1, UNI_CWU } /* cwu=t */, + { 1, 4684, 1205, 15, 9, UNI_EA__F } /* eastasianwidth=fullwidth */, + { 2, 9691, 9895, 4, 3, UNI_INNKO } /* blk=nko */, + { 1, 185, 1588, 2, 1, UNI_Z } /* isz */, + { 5, 9979, 4190, 5, 3, UNI_SARB } /* scx=sarb */, + { 1, 10253, 6287, 3, 3, UNI_LB__ZWJ } /* lb=zwj */, + { 1, 9476, 7655, 3, 9, UNI_BHKS } /* sc=bhaiksuki */, + { 2, 9476, 8292, 3, 4, UNI_SC__BUGI } /* sc=bugi */, + { 4, 9476, 10043, 3, 4, UNI_TIBT } /* sc=tibt */, + { 0, 10349, 9454, 3, 5, -UNI_VS } /* vs=false */, + { 2, 8782, 7434, 8, 6, UNI_SC__SOGD } /* script=sogdian */, + { 12, 630, 0, 30, 0, UNI_CJKEXTE } /* cjkunifiedideographsextensione */, + { 0, 185, 7520, 2, 10, UNI_SUPARROWSA } /* issuparrowsa */, + { 0, 4157, 2804, 3, 3, UNI_IDST } /* isidst */, + { 2, 8973, 868, 6, 
18, UNI_PHONETICEXT } /* block=phoneticextensions */, + { 0, 8782, 7817, 7, 9, UNI_SC__PERM } /* script=oldpermic */, + { 0, 7460, 10067, 10, 4, UNI_IN__12 } /* presentin=v120 */, + { 2, 3877, 9795, 17, 4, UNI_HMNG } /* scriptextensions=hmng */, + { 3, 6529, 7431, 3, 9, UNI_INOLDSOGDIAN } /* inoldsogdian */, + { 1, 9691, 3962, 4, 16, UNI_ARABICSUP } /* blk=arabicsupplement */, + { 2, 6083, 9619, 13, 4, UNI_NV__3_SLASH_16 } /* numericvalue=3/16 */, + { 2, 9691, 3724, 4, 17, UNI_ETHIOPICEXTB } /* blk=ethiopicextendedb */, + { 0, 9429, 26, 5, 1, UNI_CWCF } /* cwcf=y */, + { 0, 1553, 5677, 10, 13, UNI_ZS } /* category=spaceseparator */, + { 8, 8973, 7200, 6, 10, UNI_ARABICEXTB } /* block=arabicextb */, + { 3, 9819, 0, 4, 0, UNI_KNDA } /* knda */, + { 2, 10352, 34, 3, 6, UNI_WB__EXTEND } /* wb=extend */, + { 6, 185, 9683, 2, 4, UNI_BATK } /* isbatk */, + { 1, 10244, 5797, 3, 13, UNI_XPOSIXDIGIT } /* gc=decimalnumber */, + { 0, 5014, 0, 15, 0, UNI_UPPERCASELETTER } /* uppercaseletter */, + { 5, 9489, 10055, 5, 4, UNI_MATH } /* math=true */, + { 0, 5172, 36, 14, 1, UNI_EMOD } /* emojimodifier=t */, + { 1, 10268, 5732, 3, 4, UNI_NV__1000 } /* nv=1000 */, + { 0, 4894, 48, 15, 1, UNI_NFCQC__M } /* nfkcquickcheck=m */, + { 13, 10226, 36, 3, 1, UNI_DI } /* di=t */, + { 0, 8973, 2727, 6, 19, UNI_ENCLOSEDALPHANUMSUP } /* block=enclosedalphanumsup */, + { 2, 3877, 9751, 17, 4, UNI_DIAK } /* scriptextensions=diak */, + { 0, 1189, 4427, 3, 15, UNI_TANGUTCOMPONENTS } /* intangutcomponents */, + { 7, 1418, 8761, 24, 7, UNI_CCC__1 } /* canonicalcombiningclass=overlay */, + { 0, 1418, 8992, 25, 5, UNI_CCC__107 } /* canonicalcombiningclass=ccc107 */, + { 0, 8973, 3724, 6, 17, UNI_ETHIOPICEXTB } /* block=ethiopicextendedb */, + { 0, 1891, 0, 5, 0, UNI_XPOSIXUPPER } /* upper */, + { 0, 6350, 6884, 12, 11, UNI_JT__L } /* joiningtype=leftjoining */, + { 1, 7218, 7241, 3, 9, UNI_BOXDRAWING } /* inboxdrawing */, + { 2, 9476, 2311, 3, 4, UNI_SC__SINH } /* sc=sinh */, + { 0, 1814, 26, 22, 1, 
UNI_CWCM } /* changeswhencasemapped=y */, + { 1, 3877, 10051, 17, 4, UNI_TOTO } /* scriptextensions=toto */, + { 0, 10247, 5508, 3, 14, UNI_JG__MANICHAEANYODH } /* jg=manichaeanyodh */, + { 0, 10244, 4999, 3, 15, UNI_TITLE } /* gc=titlecaseletter */, + { 0, 1674, 0, 4, 0, UNI_JAMO } /* jamo */, + { 24, 9147, 10355, 6, 3, UNI__PERL_NCHAR } /* nchar=yes */, + { 0, 9767, 0, 4, 0, UNI_GONG } /* gong */, + { 0, 10031, 0, 4, 0, UNI_TFNG } /* tfng */, + { 2, 4157, 448, 3, 31, UNI_IDEOGRAPHICSYMBOLS } /* isideographicsymbolsandpunctuation */, + { 7, 10217, 2290, 3, 21, UNI_BC__PDI } /* bc=popdirectionalisolate */, + { 1, 10232, 1205, 3, 9, UNI_EA__F } /* ea=fullwidth */, + { 1, 7600, 0, 10, 0, UNI_YIRADICALS } /* yiradicals */, + { 0, 8973, 661, 7, 29, UNI_CJKEXTF } /* block=cjkunifiedideographsextensionf */, + { 0, 7580, 496, 10, 7, UNI_WB__NU } /* wordbreak=numeric */, + { 17, 6741, 9454, 11, 5, -UNI_DEP } /* deprecated=false */, + { 0, 9691, 7736, 4, 9, UNI_LATINEXTD } /* blk=latinextd */, + { 1, 9474, 5200, 5, 14, UNI_INSC__GEMINATIONMARK } /* insc=geminationmark */, + { 1, 9979, 8508, 4, 4, UNI_VITH } /* scx=vith */, + { 8, 8782, 2509, 7, 4, UNI_SC__MONG } /* script=mong */, + { 17, 2304, 7819, 4, 7, UNI_PERM } /* isoldpermic */, + { 0, 4157, 2454, 3, 19, UNI_PHLI } /* isinscriptionalpahlavi */, + { 12, 7218, 8539, 4, 5, UNI_INBENGALI } /* inbengali */, + { 2, 1990, 4969, 22, 15, UNI_INSC__REGISTERSHIFTER } /* indicsyllabiccategory=registershifter */, + { 1, 8754, 0, 4, 0, UNI_OSMA } /* osma */, + { 0, 10247, 5979, 3, 13, UNI_JG__MANICHAEANNUN } /* jg=manichaeannun */, + { 5, 4972, 4443, 3, 8, UNI_TANGUTSUP } /* istangutsup */, + { 4, 468, 0, 5, 0, UNI_P } /* punct */, + { 23, 10268, 7934, 3, 1, UNI_NV__2 } /* nv=2 */, + { 5, 2248, 7072, 3, 10, UNI_INSORASOMPENG } /* insorasompeng */, + { 6, 3877, 10019, 17, 4, UNI_TALU } /* scriptextensions=talu */, + { 6, 10247, 5235, 3, 3, UNI_JG__HEH } /* jg=heh */, + { 1, 4154, 953, 3, 27, UNI_VSSUP } /* 
invariationselectorssupplement */, + { 0, 4684, 8, 15, 1, UNI_EA__A } /* eastasianwidth=a */, + { 2, 1189, 9196, 3, 5, UNI_INTANGSA } /* intangsa */, + { 3, 9691, 9207, 4, 6, UNI_INTHAANA } /* blk=thaana */, + { 9, 3445, 0, 4, 0, UNI_RUMI } /* rumi */, + { 0, 8973, 5368, 6, 7, UNI_LISUSUP } /* block=lisusup */, + { 2, 6083, 7964, 13, 8, UNI_NV__3_SLASH_20 } /* numericvalue=1.50e-01 */, + { 14, 10253, 74, 3, 2, UNI_EMOD } /* lb=em */, + { 3, 8782, 9963, 7, 4, UNI_SC__ROHG } /* script=rohg */, + { 0, 1418, 7320, 24, 4, UNI_CCC__6 } /* canonicalcombiningclass=hanr */, + { 0, 9731, 26, 4, 1, UNI_CWT } /* cwt=y */, + { 0, 5875, 0, 13, 0, UNI_jg_values_index } /* joininggroup= */, + { 0, 9691, 9509, 4, 5, UNI_INOGHAM } /* blk=ogham */, + { 0, 10268, 10139, 3, 3, UNI_NV__2_SLASH_5 } /* nv=2/5 */, + { 9, 8973, 5901, 6, 13, UNI_KANAEXTB } /* block=kanaextendedb */, + { 0, 8973, 7736, 6, 9, UNI_LATINEXTD } /* block=latinextd */, + { 2, 185, 5368, 2, 14, UNI_LISUSUP } /* islisusupplement */, + { 17, 1418, 8028, 24, 3, UNI_WB__EB } /* canonicalcombiningclass=200 */, + { 0, 9691, 8670, 4, 7, UNI_INMAKASAR } /* blk=makasar */, + { 3, 2206, 10394, 21, 2, UNI_GCB__XX } /* graphemeclusterbreak=xx */, + { 8, 185, 1837, 3, 20, UNI_CWL } /* ischangeswhenlowercased */, + { 0, 5045, 7551, 3, 9, UNI_CN } /* isunassigned */, + { 2, 8881, 9656, 3, 3, UNI_AHOM } /* isahom */, + { 0, 8782, 3826, 7, 10, UNI_SC__MANI } /* script=manichaean */, + { 1, 9979, 8621, 4, 4, UNI_GRAN } /* scx=gran */, + { 5, 4847, 2362, 10, 11, UNI_MERO } /* inmeroitichieroglyphs */, + { 8, 1115, 1026, 26, 2, -UNI_CWKCF } /* changeswhennfkccasefolded=no */, + { 11, 0, 0, 34, 0, UNI_UCAS } /* unifiedcanadianaboriginalsyllabics */, + { 10, 9439, 1, 5, 1, -UNI_DASH } /* dash=n */, + { 3, 1189, 4985, 3, 7, UNI_TAMILSUP } /* intamilsup */, + { 8, 2227, 0, 14, 0, UNI_ROHG } /* hanifirohingya */, + { 6, 8782, 6302, 7, 6, UNI_HEBR } /* script=hebrew */, + { 5, 9803, 0, 4, 0, UNI_hst_values_index } /* hst= */, + { 2, 415, 0, 
11, 0, UNI_IDEO } /* ideographic */, + { 3, 9691, 4442, 4, 9, UNI_TANGUTSUP } /* blk=tangutsup */, + { 1, 21, 5284, 2, 14, UNI_LATINEXTB } /* inlatinextendedb */, + { 1, 9476, 4534, 3, 7, UNI_BRAI } /* sc=braille */, + { 4, 8973, 44, 7, 2, UNI_CJK } /* block=cjk */, + { 2, 9464, 26, 5, 1, UNI_IDST } /* idst=y */, + { 0, 10253, 23, 3, 2, UNI_LB__AL } /* lb=al */, + { 0, 1418, 10386, 24, 2, UNI_CCC__8 } /* canonicalcombiningclass=kv */, + { 0, 10268, 8211, 3, 2, UNI_NV__18 } /* nv=18 */, + { 0, 4157, 4760, 3, 14, UNI_ARMI } /* isimperialaramaic */, + { 11, 185, 5810, 2, 13, UNI_ME } /* isenclosingmark */, + { 2, 3877, 6518, 17, 12, UNI_MEND } /* scriptextensions=mendekikakui */, + { 2, 7360, 1466, 10, 13, UNI_LB__CM } /* linebreak=combiningmark */, + { 2, 9847, 1026, 4, 2, -UNI_LOE } /* loe=no */, + { 1, 9979, 8866, 4, 7, UNI_TIRH } /* scx=tirhuta */, + { 0, 3175, 1026, 18, 2, -UNI_EPRES } /* emojipresentation=no */, + { 3, 185, 3792, 2, 17, UNI_KITS } /* iskhitansmallscript */, + { 0, 8782, 2493, 7, 20, UNI_HMNP } /* script=nyiakengpuachuehmong */, + { 6, 9691, 184, 4, 20, UNI_MISCSYMBOLS } /* blk=miscellaneoussymbols */, + { 0, 9803, 6650, 4, 12, UNI_GCB__T } /* hst=trailingjamo */, + { 3, 10244, 342, 3, 2, UNI_PE } /* gc=pe */, + { 3, 8782, 8754, 7, 4, UNI_OSMA } /* script=osma */, + { 3, 9476, 9783, 3, 4, UNI_SC__GURU } /* sc=guru */, + { 3, 1538, 3367, 4, 6, UNI_DINGBATS } /* indingbats */, + { 0, 5116, 10055, 14, 4, UNI_CI } /* caseignorable=true */, + { 4, 8973, 4654, 6, 15, UNI_DIACRITICALSEXT } /* block=diacriticalsext */, + { 2, 6083, 8228, 13, 8, UNI_NV__1_SLASH_12 } /* numericvalue=8.33e-02 */, + { 1, 9979, 4984, 4, 5, UNI_TAML } /* scx=tamil */, + { 1, 7460, 7995, 10, 4, UNI_IN__12 } /* presentin=12.0 */, + { 6, 1770, 17, 22, 1, UNI_BPT__O } /* bidipairedbrackettype=o */, + { 1, 3157, 0, 5, 0, UNI_EMOJI } /* emoji */, + { 0, 185, 3193, 2, 8, UNI_ETHI } /* isethiopic */, + { 0, 4074, 599, 16, 2, UNI_XPOSIXCNTRL } /* generalcategory=cc */, + { 0, 9691, 
6182, 4, 12, UNI_CHESSSYMBOLS } /* blk=chesssymbols */, + { 3, 10247, 8324, 3, 8, UNI_JG__FARSIYEH } /* jg=farsiyeh */, + { 0, 1394, 0, 24, 0, UNI_ARABICPFB } /* arabicpresentationformsb */, + { 27, 10516, 8769, 3, 5, UNI_PATSYN } /* ispatsyn */, + { 0, 8973, 7637, 6, 9, UNI_ARABICPFA } /* block=arabicpfa */, + { 1, 3877, 10035, 17, 4, UNI_TGLG } /* scriptextensions=tglg */, + { 1, 8973, 1595, 6, 14, UNI_MUSIC } /* block=musicalsymbols */, + { 0, 7297, 1656, 3, 22, UNI_COMPATJAMO } /* ishangulcompatibilityjamo */, + { 1, 3398, 10055, 11, 4, UNI_XPOSIXSPACE } /* whitespace=true */, + { 2, 11, 0, 2, 0, UNI_DI } /* di */, + { 0, 10247, 6041, 3, 3, UNI_JG__WAW } /* jg=waw */, + { 0, 5875, 5438, 13, 14, UNI_JG__MANICHAEANHETH } /* joininggroup=manichaeanheth */, + { 6, 1792, 26, 22, 1, UNI_CWCF } /* changeswhencasefolded=y */, + { 2, 6314, 10055, 12, 4, UNI_IDEO } /* ideographic=true */, + { 0, 9476, 9767, 3, 4, UNI_SC__GONG } /* sc=gong */, + { 6, 10247, 1512, 3, 3, UNI_JG__HAH } /* jg=hah */, + { 13, 10508, 97, 8, 5, UNI_XPOSIXALPHA } /* isxposixalpha */, + { 0, 2003, 0, 11, 0, UNI_LO } /* category=lo */, + { 8, 4074, 4346, 16, 5, UNI_C } /* generalcategory=other */, + { 0, 9711, 7947, 4, 2, UNI_CCC__21 } /* ccc=21 */, + { 1, 9476, 8621, 3, 7, UNI_SC__GRAN } /* sc=grantha */, + { 4, 6675, 10055, 11, 4, UNI_IDC } /* idcontinue=true */, + { 4, 6350, 0, 12, 1, UNI_JT__U } /* joiningtype=u */, + { 10, 3877, 10043, 17, 4, UNI_TIBT } /* scriptextensions=tibt */, + { 5, 4154, 5030, 3, 7, UNI_VEDICEXT } /* invedicext */, + { 1, 185, 350, 2, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* issupplementalsymbolsandpictographs */, + { 2, 10268, 8901, 3, 6, UNI_NV__216000 } /* nv=216000 */, + { 1, 7460, 7934, 10, 1, UNI_IN__2 } /* presentin=2 */, + { 0, 3877, 3139, 17, 10, UNI_DEVA } /* scriptextensions=devanagari */, + { 1, 5326, 0, 14, 0, UNI_LATINEXTE } /* latinextendede */, + { 0, 6083, 7958, 13, 2, UNI_NV__50 } /* numericvalue=50 */, + { 0, 10553, 48, 3, 1, UNI_SM } /* issm */, + { 1, 
5875, 10241, 13, 3, UNI_JG__GAF } /* joininggroup=gaf */, + { 0, 9691, 4624, 4, 15, UNI_CURRENCYSYMBOLS } /* blk=currencysymbols */, + { 3, 6083, 8012, 13, 8, UNI_NV__1_SLASH_4 } /* numericvalue=2.50e-01 */, + { 2, 10247, 6458, 3, 12, UNI_JG__MALAYALAMSSA } /* jg=malayalamssa */, + { 4, 9711, 9355, 5, 4, UNI_CCC__25 } /* ccc=ccc25 */, + { 0, 9647, 9600, 4, 3, UNI_AGE__3 } /* age=3.0 */, + { 3, 8973, 1701, 6, 23, UNI_SHORTHANDFORMATCONTROLS } /* block=shorthandformatcontrols */, + { 7, 8782, 2164, 7, 8, UNI_SC__CYRL } /* script=cyrillic */, + { 8, 3139, 0, 13, 0, UNI_DEVANAGARIEXT } /* devanagariext */, + { 1, 1990, 5718, 22, 14, UNI_INSC__VOWELDEPENDENT } /* indicsyllabiccategory=voweldependent */, + { 0, 9899, 0, 4, 0, UNI_NSHU } /* nshu */, + { 15, 8973, 8587, 7, 6, UNI_CJKEXTG } /* block=cjkextg */, + { 1, 8973, 7420, 6, 10, UNI_INOLDPERSIAN } /* block=oldpersian */, + { 0, 2248, 1346, 3, 24, UNI_SYMBOLSFORLEGACYCOMPUTING } /* insymbolsforlegacycomputing */, + { 1, 1506, 1017, 5, 2, UNI_INGREEK } /* ingreek */, + { 1, 6122, 0, 12, 0, UNI_ALPHABETICPF } /* alphabeticpf */, + { 0, 9743, 10055, 4, 4, UNI_DEP } /* dep=true */, + { 0, 9979, 6518, 4, 4, UNI_MEND } /* scx=mend */, + { 0, 10247, 4829, 3, 3, UNI_JG__SAD } /* jg=sad */, + { 16, 6862, 0, 11, 0, UNI_KATAKANAEXT } /* katakanaext */, + { 0, 9979, 10123, 4, 4, UNI_ZZZZ } /* scx=zzzz */, + { 4, 10244, 729, 3, 6, UNI_N } /* gc=number */, + { 0, 21, 6862, 2, 11, UNI_KATAKANAEXT } /* inkatakanaext */, + { 1, 10553, 1529, 3, 8, UNI__PERL_SURROGATE } /* issurrogate */, + { 2, 7907, 10355, 9, 3, UNI_XIDS } /* xidstart=yes */, + { 2, 185, 1185, 2, 3, UNI_DEP } /* isdep */, + { 1, 3877, 8845, 17, 7, UNI_TAVT } /* scriptextensions=taiviet */, + { 16, 43, 0, 9, 0, UNI_CJKCOMPAT } /* cjkcompat */, + { 23, 8973, 2860, 6, 19, UNI_MODIFIERTONELETTERS } /* block=modifiertoneletters */, + { 4, 8973, 5270, 6, 14, UNI_KANGXI } /* block=kangxiradicals */, + { 0, 10268, 8140, 3, 8, UNI_NV__7_SLASH_12 } /* nv=5.83e-01 */, + { 17, 
7360, 203, 10, 2, UNI_LB__SA } /* linebreak=sa */, + { 0, 9476, 383, 3, 4, UNI_EGYP } /* sc=egyp */, + { 0, 9691, 510, 4, 20, UNI_CJK } /* blk=cjkunifiedideographs */, + { 0, 2304, 6592, 4, 10, UNI_HUNG } /* isoldhungarian */, + { 2, 9476, 4426, 3, 4, UNI_TANG } /* sc=tang */, + { 0, 7330, 0, 4, 0, UNI_KHAR } /* khar */, + { 1, 9979, 8804, 5, 6, UNI_SIDD } /* scx=siddham */, + { 3, 9711, 9000, 4, 3, UNI_CCC__118 } /* ccc=118 */, + { 0, 9691, 6961, 4, 11, UNI_MYANMAREXTB } /* blk=myanmarextb */, + { 0, 5875, 4234, 13, 16, UNI_JG__MANICHAEANLAMEDH } /* joininggroup=manichaeanlamedh */, + { 1, 5875, 5953, 13, 13, UNI_JG__MALAYALAMNNNA } /* joininggroup=malayalamnnna */, + { 1, 9647, 10343, 4, 3, UNI_AGE__9 } /* age=v90 */, + { 0, 9549, 3, 5, 1, -UNI_XIDS } /* xids=f */, + { 0, 9691, 8492, 4, 7, UNI_UCASEXT } /* blk=ucasext */, + { 0, 185, 2085, 2, 15, UNI_MODIFIERLETTERS } /* ismodifierletters */, + { 1, 8854, 7160, 3, 10, UNI_YISYLLABLES } /* inyisyllables */, + { 7, 1418, 24, 24, 1, UNI_CCC__L } /* canonicalcombiningclass=l */, + { 0, 6939, 0, 11, 0, UNI_MISCSYMBOLS } /* miscsymbols */, + { 1, 9270, 26, 4, 1, UNI_XPOSIXXDIGIT } /* hex=y */, + { 0, 1115, 9454, 26, 5, -UNI_CWKCF } /* changeswhennfkccasefolded=false */, + { 3, 185, 2974, 2, 19, UNI_SUPARROWSB } /* issupplementalarrowsb */, + { 4, 3877, 8677, 17, 7, UNI_MAND } /* scriptextensions=mandaic */, + { 0, 9691, 8684, 4, 7, UNI_INMARCHEN } /* blk=marchen */, + { 0, 9171, 1026, 6, 2, -UNI__PERL_PATWS } /* patws=no */, + { 1, 2164, 0, 11, 0, UNI_CYRILLICSUP } /* cyrillicsup */, + { 8, 10247, 2227, 3, 21, UNI_JG__HANIFIROHINGYAKINNAYA } /* jg=hanifirohingyakinnaya */, + { 0, 10268, 8937, 3, 2, UNI_NV__70 } /* nv=70 */, + { 2, 5771, 0, 13, 0, UNI_BLOCKELEMENTS } /* blockelements */, + { 1, 3877, 4190, 18, 3, UNI_SARB } /* scriptextensions=sarb */, + { 0, 8782, 3265, 7, 4, UNI_SC__GEOR } /* script=geor */, + { 3, 8973, 5059, 6, 15, UNI_INZANABAZARSQUARE } /* block=zanabazarsquare */, + { 0, 10508, 63, 8, 5, 
UNI_XPOSIXGRAPH } /* isxposixgraph */, + { 3, 10268, 10204, 3, 2, UNI_NV__37 } /* nv=37 */, + { 14, 10217, 1, 4, 1, UNI_BC__BN } /* bc=bn */, + { 17, 3121, 8364, 18, 8, UNI_DT__ISO } /* decompositiontype=isolated */, + { 0, 6083, 7995, 13, 2, UNI_NV__12 } /* numericvalue=12 */, + { 0, 9691, 7718, 4, 9, UNI_LATINEXTB } /* blk=latinextb */, + { 20, 6083, 8903, 13, 3, UNI_NV__600 } /* numericvalue=600 */, + { 5, 6529, 9510, 3, 4, UNI_INOGHAM } /* inogham */, + { 1, 2304, 4955, 3, 14, UNI_PS } /* isopenpunctuation */, + { 0, 3877, 9871, 17, 4, UNI_MRO } /* scriptextensions=mroo */, + { 0, 8973, 2879, 6, 9, UNI_INMONGOLIAN } /* block=mongolian */, + { 2, 1553, 108, 10, 5, UNI_S } /* category=symbol */, + { 1, 4774, 0, 15, 0, UNI_LOWERCASELETTER } /* lowercaseletter */, + { 0, 10247, 4250, 3, 16, UNI_JG__MANICHAEANSAMEKH } /* jg=manichaeansamekh */, + { 1, 2784, 912, 19, 1, UNI_GCB__V } /* hangulsyllabletype=v */, + { 78, 185, 7281, 3, 9, UNI_COMPATJAMO } /* iscompatjamo */, + { 0, 5172, 1026, 14, 2, -UNI_EMOD } /* emojimodifier=no */, + { 1, 8500, 0, 8, 0, UNI_UGAR } /* ugaritic */, + { 0, 7391, 3624, 4, 15, UNI_AGHB } /* iscaucasianalbanian */, + { 10, 8782, 4924, 7, 15, UNI_NARB } /* script=oldnortharabian */, + { 3, 9743, 1, 4, 1, -UNI_DEP } /* dep=n */, + { 9, 185, 3139, 2, 4, UNI_DEVA } /* isdeva */, + { 8, 8782, 9835, 7, 4, UNI_SC__LATN } /* script=latn */, + { 19, 9069, 0, 6, 0, UNI_GOTH } /* gothic */, + { 0, 4847, 2880, 3, 11, UNI_MONGOLIANSUP } /* inmongoliansup */, + { 2, 207, 0, 2, 0, UNI_PI } /* pi */, + { 0, 4074, 909, 16, 10, UNI_CO } /* generalcategory=privateuse */, + { 4, 9711, 2479, 4, 5, UNI_CCC__R } /* ccc=right */, + { 8, 8782, 4042, 7, 7, UNI_SC__CPRT } /* script=cypriot */, + { 2, 10566, 1183, 5, 4, UNI_ANY } /* isunicode */, + { 4, 9231, 0, 6, 0, UNI_WCHO } /* wancho */, + { 6, 8973, 3463, 6, 12, UNI_SMALLKANAEXT } /* block=smallkanaext */, + { 0, 1418, 10151, 24, 3, UNI_CCC__L } /* canonicalcombiningclass=224 */, + { 0, 3877, 2433, 17, 10, 
UNI_GLAG } /* scriptextensions=glagolitic */, + { 0, 9691, 3979, 5, 7, UNI_INBOPOMOFO } /* blk=bopomofo */, + { 0, 10083, 0, 3, 0, UNI_VAI } /* vai */, + { 64, 8782, 8356, 7, 4, UNI_SC__HIRA } /* script=hira */, + { 1, 10268, 8124, 3, 8, UNI_NV__1_SLASH_20 } /* nv=5.00e-02 */, + { 0, 10250, 6638, 3, 12, UNI_JT__R } /* jt=rightjoining */, + { 5, 9979, 9751, 4, 4, UNI_DIAK } /* scx=diak */, + { 16, 8782, 6730, 7, 11, UNI_SC__CPMN } /* script=cyprominoan */, + { 0, 9691, 3355, 4, 18, UNI_ORNAMENTALDINGBATS } /* blk=ornamentaldingbats */, + { 33, 10244, 6719, 3, 11, UNI_CASEDLETTER } /* gc=casedletter */, + { 9, 9476, 7711, 5, 7, UNI_SC__SIND } /* sc=khudawadi */, + { 0, 5862, 0, 13, 0, UNI_IPAEXT } /* ipaextensions */, + { 1, 10244, 3301, 3, 18, UNI_PI } /* gc=initialpunctuation */, + { 0, 2553, 3, 20, 1, -UNI_TERM } /* terminalpunctuation=f */, + { 0, 1553, 38, 9, 2, UNI_XPOSIXDIGIT } /* category=nd */, + { 2, 9979, 9967, 4, 4, UNI_RUNR } /* scx=runr */, + { 4, 6937, 2047, 6, 9, UNI_MISCTECHNICAL } /* inmisctechnical */, + { 0, 6674, 9454, 12, 5, -UNI_XIDC } /* xidcontinue=false */, + { 7, 9647, 10211, 4, 3, UNI_AGE__9 } /* age=9.0 */, + { 1, 7467, 10187, 3, 3, UNI_IN__5_DOT_1 } /* in=5.1 */, + { 0, 10268, 7972, 3, 8, UNI_NV__1_SLASH_64 } /* nv=1.56e-02 */, + { 11, 6083, 10358, 13, 2, UNI_NV__38 } /* numericvalue=38 */, + { 9, 9687, 0, 4, 0, UNI_BHKS } /* bhks */, + { 1, 8973, 0, 6, 34, UNI_UCAS } /* block=unifiedcanadianaboriginalsyllabics */, + { 0, 8782, 8804, 8, 6, UNI_SIDD } /* script=siddham */, + { 4, 4074, 134, 16, 4, UNI_M } /* generalcategory=mark */, + { 1, 3877, 8388, 17, 4, UNI_JAVA } /* scriptextensions=java */, + { 2, 9045, 1026, 6, 2, -UNI_CWKCF } /* cwkcf=no */, + { 0, 9476, 8614, 3, 4, UNI_ELYM } /* sc=elym */, + { 0, 8782, 9831, 7, 3, UNI_LAO } /* script=lao */, + { 2, 8782, 6928, 7, 11, UNI_MEDF } /* script=medefaidrin */, + { 0, 185, 8380, 2, 8, UNI_JAMOEXTB } /* isjamoextb */, + { 1, 3121, 7, 18, 3, UNI_DT__CAN } /* decompositiontype=can */, + { 
8, 9691, 184, 4, 34, UNI_MISCPICTOGRAPHS } /* blk=miscellaneoussymbolsandpictographs */, + { 0, 2808, 7192, 4, 8, UNI_ARABICEXTA } /* inarabicexta */, + { 8, 9979, 8614, 4, 4, UNI_ELYM } /* scx=elym */, + { 1, 185, 18, 2, 2, UNI_RI } /* isri */, + { 4, 1553, 5810, 9, 13, UNI_ME } /* category=enclosingmark */, + { 12, 10402, 10435, 6, 21, UNI__PERL_IS_IN_MULTI_CHAR_FOLD } /* _perl_is_in_multi_char_fold */, + { 0, 9691, 3445, 4, 18, UNI_RUMI } /* blk=ruminumeralsymbols */, + { 2, 9891, 0, 4, 0, UNI_NEWA } /* newa */, + { 1, 9057, 10355, 6, 3, UNI_EMOJI } /* emoji=yes */, + { 0, 9476, 9135, 3, 6, UNI_LYDI } /* sc=lydian */, + { 1, 10253, 6288, 3, 2, UNI_LB__WJ } /* lb=wj */, + { 0, 9219, 9454, 6, 5, -UNI_XPOSIXUPPER } /* upper=false */, + { 0, 2784, 0, 19, 0, UNI_hst_values_index } /* hangulsyllabletype= */, + { 2, 10250, 0, 3, 0, UNI_jt_values_index } /* jt= */, + { 8, 9647, 0, 4, 0, UNI_age_values_index } /* age= */, + { 0, 10510, 5802, 6, 5, UNI_XPOSIXALNUM } /* xposixalnum */, + { 0, 2784, 6895, 19, 3, UNI_LB__H3 } /* hangulsyllabletype=lvt */, + { 3, 8782, 9795, 7, 4, UNI_HMNG } /* script=hmng */, + { 0, 9545, 9454, 4, 5, -UNI_IDC } /* idc=false */, + { 3, 6578, 496, 12, 7, UNI_NT__NU } /* numerictype=numeric */, + { 0, 8782, 9129, 7, 4, UNI_LYCI } /* script=lyci */, + { 16, 9123, 36, 6, 1, UNI_XPOSIXLOWER } /* lower=t */, + { 0, 6083, 8943, 13, 5, UNI_NV__80000 } /* numericvalue=80000 */, + { 0, 3877, 494, 17, 3, UNI_HAN } /* scriptextensions=han */, + { 16, 10244, 1923, 3, 2, UNI_PC } /* gc=pc */, + { 16, 9979, 9081, 4, 4, UNI_HATR } /* scx=hatr */, + { 1, 3157, 9454, 18, 5, -UNI_EBASE } /* emojimodifierbase=false */, + { 12, 10244, 4639, 3, 15, UNI_PD } /* gc=dashpunctuation */, + { 17, 9691, 2143, 4, 14, UNI_CJKRADICALSSUP } /* blk=cjkradicalssup */, + { 13, 9715, 0, 4, 0, UNI_CHRS } /* chrs */, + { 1, 6083, 8028, 13, 2, UNI_NV__20 } /* numericvalue=20 */, + { 7, 9979, 9723, 4, 4, UNI_CPRT } /* scx=cprt */, + { 12, 10253, 10380, 3, 2, UNI_LB__H3 } /* lb=h3 
*/, + { 2, 9476, 3794, 5, 15, UNI_KITS } /* sc=khitansmallscript */, + { 0, 729, 0, 6, 0, UNI_N } /* number */, + { 2, 1858, 0, 22, 0, UNI_cwt_values_index } /* changeswhentitlecased= */, + { 2, 8782, 2937, 8, 8, UNI_SUND } /* script=sundanese */, + { 0, 9711, 23, 4, 2, UNI_CCC__AL } /* ccc=al */, + { 0, 7360, 6170, 10, 12, UNI_LB__SY } /* linebreak=breaksymbols */, + { 1, 1189, 8846, 3, 6, UNI_INTAIVIET } /* intaiviet */, + { 0, 8670, 0, 4, 0, UNI_MAKA } /* maka */, + { 1, 10217, 2473, 3, 11, UNI_BC__L } /* bc=lefttoright */, + { 0, 9691, 1724, 4, 23, UNI_SUPPUNCTUATION } /* blk=supplementalpunctuation */, + { 1, 7682, 36, 9, 1, UNI_EXT } /* extender=t */, + { 8, 7230, 10256, 10, 3, UNI_BC__LRE } /* bidiclass=lre */, + { 3, 185, 5606, 2, 14, UNI_PHONETICEXTSUP } /* isphoneticextsup */, + { 1, 3877, 8537, 17, 7, UNI_BENG } /* scriptextensions=bengali */, + { 1, 350, 0, 33, 0, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* supplementalsymbolsandpictographs */, + { 20, 1274, 10055, 21, 4, UNI_CE } /* compositionexclusion=true */, + { 1, 3877, 10023, 17, 4, UNI_TAML } /* scriptextensions=taml */, + { 1, 185, 8552, 3, 6, UNI_CJKEXTB } /* iscjkextb */, + { 0, 9461, 70, 3, 2, UNI_SB__UP } /* sb=up */, + { 1, 8705, 0, 8, 0, UNI_NFKCQC__N } /* nfkcqc=n */, + { 9, 4894, 9494, 15, 5, UNI_NFCQC__M } /* nfkcquickcheck=maybe */, + { 1, 1538, 3018, 24, 13, UNI_INPC__BOTTOMANDLEFT } /* indicpositionalcategory=bottomandleft */, + { 2, 3877, 2433, 17, 4, UNI_GLAG } /* scriptextensions=glag */, + { 0, 2100, 0, 22, 0, UNI_TRANSPORTANDMAP } /* transportandmapsymbols */, + { 0, 185, 2632, 2, 4, UNI_BRAH } /* isbrah */, + { 0, 185, 2144, 3, 13, UNI_CJKRADICALSSUP } /* iscjkradicalssup */, + { 6, 10250, 7126, 3, 11, UNI_JT__T } /* jt=transparent */, + { 3, 2433, 0, 4, 0, UNI_GLAG } /* glag */, + { 0, 9979, 6494, 4, 12, UNI_GONM } /* scx=masaramgondi */, + { 3, 3409, 1026, 18, 2, -UNI_RI } /* regionalindicator=no */, + { 0, 10103, 0, 4, 0, UNI_YI } /* yiii */, + { 13, 9895, 0, 4, 0, UNI_NKO } /* nkoo 
*/, + { 8, 7060, 9454, 11, 5, -UNI_SD } /* softdotted=false */, + { 2, 8881, 2338, 3, 3, UNI_POSIXXDIGIT } /* isahex */, + { 0, 9190, 10355, 5, 3, UNI_TERM } /* term=yes */, + { 0, 9711, 9675, 4, 4, UNI_WB__EB } /* ccc=atbl */, + { 9, 9534, 0, 5, 0, UNI_TAKR } /* takri */, + { 0, 8973, 4849, 6, 15, UNI_INMEROITICCURSIVE } /* block=meroiticcursive */, + { 1, 8782, 8508, 7, 8, UNI_VITH } /* script=vithkuqi */, + { 0, 9476, 9231, 3, 6, UNI_WCHO } /* sc=wancho */, + { 1, 10268, 10130, 3, 3, UNI_NV__1_SLASH_7 } /* nv=1/7 */, + { 1, 9476, 6925, 5, 2, UNI_KHMR } /* sc=khmr */, + { 1, 185, 9959, 2, 4, UNI_RJNG } /* isrjng */, + { 0, 10402, 1160, 33, 5, UNI__PERL_PROBLEMATIC_LOCALE_FOLDEDS_START } /* _perl_problematic_locale_foldeds_start */, + { 0, 185, 4330, 2, 16, UNI_MYANMAREXTB } /* ismyanmarextendedb */, + { 14, 9691, 924, 4, 28, UNI_SUPPUAB } /* blk=supplementaryprivateuseareab */, + { 2, 3157, 26, 18, 1, UNI_EBASE } /* emojimodifierbase=y */, + { 16, 9489, 26, 5, 1, UNI_MATH } /* math=y */, + { 1, 5830, 1, 6, 1, -UNI_EBASE } /* ebase=n */, + { 0, 9476, 8838, 3, 7, UNI_LANA } /* sc=taitham */, + { 0, 9476, 9935, 3, 4, UNI_PHNX } /* sc=phnx */, + { 0, 8973, 6195, 7, 11, UNI_CYRILLICEXTA } /* block=cyrillicexta */, + { 0, 9691, 4505, 5, 4, UNI_INBAMUM } /* blk=bamum */, + { 16, 185, 10087, 2, 4, UNI_WCHO } /* iswcho */, + { 1, 9691, 7071, 4, 11, UNI_INSORASOMPENG } /* blk=sorasompeng */, + { 0, 6961, 0, 11, 0, UNI_MYANMAREXTB } /* myanmarextb */, + { 0, 4849, 0, 15, 0, UNI_MERC } /* meroiticcursive */, + { 3, 10508, 1891, 8, 5, UNI_XPOSIXUPPER } /* isxposixupper */, + { 18, 9691, 7709, 4, 9, UNI_INKHUDAWADI } /* blk=khudawadi */, + { 0, 185, 7060, 2, 10, UNI_SD } /* issoftdotted */, + { 1, 7580, 4401, 10, 9, UNI_WB__EB } /* wordbreak=emodifier */, + { 6, 8973, 6614, 6, 8, UNI_PHAISTOS } /* block=phaistos */, + { 2, 7360, 3403, 10, 5, UNI_LB__SP } /* linebreak=space */, + { 0, 7808, 0, 9, 0, UNI_ITAL } /* olditalic */, + { 0, 7467, 8156, 3, 3, UNI_IN__6_DOT_2 } /* 
in=6.2 */, + { 0, 9979, 1538, 5, 3, UNI_SIND } /* scx=sind */, + { 3, 1553, 909, 9, 10, UNI_CO } /* category=privateuse */, + { 1, 10039, 0, 4, 0, UNI_THAI } /* thai */, + { 7, 3877, 9663, 17, 4, UNI_ARMI } /* scriptextensions=armi */, + { 13, 2803, 26, 19, 1, UNI_IDST } /* idstrinaryoperator=y */, + { 3, 185, 3657, 3, 16, UNI_CYRILLICEXTA } /* iscyrillicextendeda */, + { 1, 9979, 9707, 4, 4, UNI_CANS } /* scx=cans */, + { 0, 8973, 2501, 6, 3, UNI_PUA } /* block=pua */, + { 1, 185, 3978, 2, 16, UNI_BOPOMOFOEXT } /* isbopomofoextended */, + { 3, 5648, 9454, 14, 5, -UNI_QMARK } /* quotationmark=false */, + { 1, 3758, 7480, 17, 10, UNI_IDENTIFIERSTATUS__RESTRICTED } /* identifierstatus=restricted */, + { 10, 7460, 10063, 10, 4, UNI_IN__11 } /* presentin=v110 */, + { 8, 6314, 10355, 12, 3, UNI_IDEO } /* ideographic=yes */, + { 0, 9476, 4939, 3, 15, UNI_SARB } /* sc=oldsoutharabian */, + { 1, 10352, 3409, 3, 17, UNI_RI } /* wb=regionalindicator */, + { 0, 2808, 7639, 4, 7, UNI_ARABICPFA } /* inarabicpfa */, + { 7, 8782, 9887, 7, 4, UNI_NBAT } /* script=nbat */, + { 0, 862, 0, 6, 0, UNI_ARROWS } /* arrows */, + { 9, 8642, 10355, 7, 3, UNI_HYPHEN } /* hyphen=yes */, + { 3, 3622, 0, 17, 0, UNI_AGHB } /* caucasianalbanian */, + { 1, 3877, 8388, 17, 8, UNI_JAVA } /* scriptextensions=javanese */, + { 0, 4074, 1466, 16, 13, UNI_M } /* generalcategory=combiningmark */, + { 2, 9691, 4042, 4, 16, UNI_CYPRIOTSYLLABARY } /* blk=cypriotsyllabary */, + { 0, 1923, 0, 2, 0, UNI_PC } /* pc */, + { 0, 6741, 26, 11, 1, UNI_DEP } /* deprecated=y */, + { 3, 1418, 9370, 25, 4, UNI_CCC__28 } /* canonicalcombiningclass=ccc28 */, + { 1, 8973, 2269, 6, 21, UNI_MEETEIMAYEKEXT } /* block=meeteimayekextensions */, + { 6, 5875, 5235, 13, 3, UNI_JG__HEH } /* joininggroup=heh */, + { 1, 9691, 4864, 4, 15, UNI_MISCPICTOGRAPHS } /* blk=miscpictographs */, + { 8, 9691, 1562, 4, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* blk=supsymbolsandpictographs */, + { 1, 6741, 10355, 11, 3, UNI_DEP } /* deprecated=yes 
*/, + { 13, 8973, 3962, 6, 9, UNI_ARABICSUP } /* block=arabicsup */, + { 3, 9647, 8092, 4, 3, UNI_AGE__4 } /* age=4.0 */, + { 1, 8973, 8500, 6, 8, UNI_INUGARITIC } /* block=ugaritic */, + { 1, 6083, 7951, 13, 1, UNI_NV__3 } /* numericvalue=3 */, + { 1, 2248, 351, 3, 32, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* insupplementalsymbolsandpictographs */, + { 3, 8593, 10055, 7, 4, UNI_COMPEX } /* compex=true */, + { 32, 9979, 8649, 4, 7, UNI_KNDA } /* scx=kannada */, + { 0, 3391, 10055, 18, 4, UNI__PERL_PATWS } /* patternwhitespace=true */, + { 5, 9875, 0, 4, 0, UNI_MTEI } /* mtei */, + { 2, 9691, 2765, 4, 19, UNI_JAMOEXTB } /* blk=hanguljamoextendedb */, + { 0, 7218, 4505, 3, 4, UNI_INBAMUM } /* inbamum */, + { 0, 8782, 8691, 7, 7, UNI_SC__MULT } /* script=multani */, + { 2, 8782, 9135, 7, 4, UNI_LYDI } /* script=lydi */, + { 2, 8973, 7530, 6, 10, UNI_SUPARROWSB } /* block=suparrowsb */, + { 2, 9979, 9923, 4, 4, UNI_OUGR } /* scx=ougr */, + { 12, 10250, 18, 3, 1, UNI_JT__R } /* jt=r */, + { 2, 8712, 0, 9, 0, UNI_NFKDQC__N } /* nfkdqc=no */, + { 2, 2312, 8637, 4, 5, UNI_INHANUNOO } /* inhanunoo */, + { 0, 1418, 10148, 24, 3, UNI_CCC__BR } /* canonicalcombiningclass=222 */, + { 0, 7016, 0, 11, 0, UNI_HMNG } /* pahawhhmong */, + { 21, 4894, 17, 16, 1, UNI_NFKCQC__N } /* nfkcquickcheck=no */, + { 8, 10268, 10178, 3, 3, UNI_NV__3_SLASH_4 } /* nv=3/4 */, + { 0, 8973, 6518, 6, 12, UNI_INMENDEKIKAKUI } /* block=mendekikakui */, + { 4, 6314, 26, 12, 1, UNI_IDEO } /* ideographic=y */, + { 1, 8973, 8537, 6, 7, UNI_INBENGALI } /* block=bengali */, + { 0, 185, 340, 2, 2, UNI_LO } /* islo */, + { 8, 7908, 1026, 8, 2, -UNI_IDS } /* idstart=no */, + { 9, 9691, 2100, 4, 15, UNI_TRANSPORTANDMAP } /* blk=transportandmap */, + { 9, 8973, 3624, 6, 4, UNI_UCAS } /* block=ucas */, + { 0, 9476, 7790, 3, 9, UNI_TALU } /* sc=newtailue */, + { 11, 9979, 9839, 4, 4, UNI_LINA } /* scx=lina */, + { 0, 8782, 3103, 7, 6, UNI_SC__COPT } /* script=coptic */, + { 0, 2248, 4379, 3, 15, UNI_SUPMATHOPERATORS } /* 
insupmathoperators */, + { 35, 4598, 4092, 4, 9, UNI_GEORGIANEXT } /* ingeorgianext */, + { 0, 9979, 7310, 4, 10, UNI_DIAK } /* scx=divesakuru */, + { 3, 3877, 8614, 17, 7, UNI_ELYM } /* scriptextensions=elymaic */, + { 4, 1990, 2632, 22, 19, UNI_INSC__BRAHMIJOININGNUMBER } /* indicsyllabiccategory=brahmijoiningnumber */, + { 1, 6083, 8920, 13, 2, UNI_NV__32 } /* numericvalue=32 */, + { 22, 9979, 6302, 4, 4, UNI_HEBR } /* scx=hebr */, + { 0, 5875, 9955, 13, 4, UNI_JG__QAPH } /* joininggroup=qaph */, + { 1, 3877, 9231, 17, 6, UNI_WCHO } /* scriptextensions=wancho */, + { 1, 1172, 0, 2, 0, UNI_TITLE } /* lt */, + { 0, 9476, 9831, 3, 4, UNI_LAO } /* sc=laoo */, + { 0, 9979, 10023, 4, 4, UNI_TAML } /* scx=taml */, + { 2, 9979, 1014, 4, 5, UNI_GREK } /* scx=greek */, + { 3, 1418, 9380, 25, 4, UNI_CCC__30 } /* canonicalcombiningclass=ccc30 */, + { 0, 9691, 2974, 4, 19, UNI_SUPARROWSB } /* blk=supplementalarrowsb */, + { 3, 5875, 6015, 13, 3, UNI_JG__TAW } /* joininggroup=taw */, + { 1, 21, 8380, 2, 8, UNI_JAMOEXTB } /* injamoextb */, + { 0, 10247, 9983, 3, 4, UNI_JG__SEEN } /* jg=seen */, + { 6, 185, 2433, 2, 10, UNI_GLAG } /* isglagolitic */, + { 8, 5875, 4250, 13, 16, UNI_JG__MANICHAEANSAMEKH } /* joininggroup=manichaeansamekh */, + { 9, 185, 2, 3, 1, UNI_CI } /* isci */, + { 10, 9763, 3409, 4, 17, UNI_RI } /* gcb=regionalindicator */, + { 0, 1538, 7440, 24, 10, UNI_INPC__OVERSTRUCK } /* indicpositionalcategory=overstruck */, + { 0, 1418, 7934, 24, 2, UNI_CCC__25 } /* canonicalcombiningclass=25 */, + { 0, 8642, 0, 7, 0, UNI_hyphen_values_index } /* hyphen= */, + { 1, 3448, 1, 3, 41, UNI_UCASEXT } /* inunifiedcanadianaboriginalsyllabicsextended */, + { 1, 9691, 6928, 4, 11, UNI_INMEDEFAIDRIN } /* blk=medefaidrin */, + { 10, 9691, 1632, 4, 18, UNI_GEOMETRICSHAPESEXT } /* blk=geometricshapesext */, + { 0, 1934, 0, 2, 0, UNI_CN } /* cn */, + { 0, 185, 8614, 2, 7, UNI_ELYM } /* iselymaic */, + { 2, 8782, 8845, 7, 7, UNI_TAVT } /* script=taiviet */, + { 1, 10542, 3403, 5, 5, 
UNI_XPOSIXSPACE } /* xperlspace */, + { 2, 3553, 1026, 18, 2, -UNI_VS } /* variationselector=no */, + { 0, 10352, 34, 3, 2, UNI_WB__EX } /* wb=ex */, + { 2, 8973, 7835, 6, 9, UNI_INOLDUYGHUR } /* block=olduyghur */, + { 3, 2242, 16, 3, 1, UNI_NB } /* innb */, + { 2, 8973, 8740, 6, 7, UNI_OLCK } /* block=olchiki */, + { 1, 8973, 8838, 6, 7, UNI_INTAITHAM } /* block=taitham */, + { 0, 5242, 0, 14, 0, UNI_HIGHSURROGATES } /* highsurrogates */, + { 0, 9691, 4170, 4, 16, UNI_LATIN1 } /* blk=latin1supplement */, + { 1, 9691, 3103, 4, 6, UNI_INCOPTIC } /* blk=coptic */, + { 0, 1506, 3868, 4, 5, UNI_INGRANTHA } /* ingrantha */, + { 1, 9147, 9454, 6, 5, -UNI__PERL_NCHAR } /* nchar=false */, + { 0, 9647, 10310, 4, 3, UNI_AGE__4 } /* age=v40 */, + { 4, 6083, 8171, 13, 2, UNI_NV__26 } /* numericvalue=26 */, + { 5, 9550, 10055, 4, 4, UNI_IDS } /* ids=true */, + { 24, 9711, 7923, 4, 2, UNI_CCC__11 } /* ccc=11 */, + { 0, 4026, 0, 16, 0, UNI_PE } /* closepunctuation */, + { 2, 1418, 1180, 24, 2, UNI_CCC__BL } /* canonicalcombiningclass=bl */, + { 2, 9727, 26, 4, 1, UNI_CWL } /* cwl=y */, + { 4, 1880, 36, 22, 1, UNI_CWU } /* changeswhenuppercased=t */, + { 0, 9476, 8500, 3, 4, UNI_UGAR } /* sc=ugar */, + { 0, 8628, 10355, 7, 3, UNI_GRBASE } /* grbase=yes */, + { 4, 10229, 4588, 3, 6, UNI_DT__MED } /* dt=medial */, + { 0, 4972, 10032, 3, 3, UNI_TFNG } /* istfng */, + { 0, 5875, 9554, 13, 5, UNI_JG__ZHAIN } /* joininggroup=zhain */, + { 0, 7460, 10304, 10, 3, UNI_IN__3_DOT_1 } /* presentin=v31 */, + { 4, 9711, 9310, 5, 4, UNI_CCC__16 } /* ccc=ccc16 */, + { 2, 9476, 8866, 3, 7, UNI_SC__TIRH } /* sc=tirhuta */, + { 1, 8705, 10355, 7, 3, UNI_NFKCQC__Y } /* nfkcqc=yes */, + { 0, 5088, 1026, 14, 2, -UNI_POSIXXDIGIT } /* asciihexdigit=no */, + { 2, 8782, 4426, 7, 6, UNI_TANG } /* script=tangut */, + { 0, 9647, 9607, 4, 4, UNI_AGE__14 } /* age=14.0 */, + { 0, 185, 8566, 3, 6, UNI_CJKEXTD } /* iscjkextd */, + { 0, 9476, 10111, 3, 4, UNI_ZANB } /* sc=zanb */, + { 3, 185, 9231, 2, 6, UNI_WCHO 
} /* iswancho */, + { 8, 185, 2841, 2, 4, UNI_MERO } /* ismero */, + { 0, 9691, 5029, 4, 15, UNI_VEDICEXT } /* blk=vedicextensions */, + { 1, 9691, 868, 4, 28, UNI_PHONETICEXTSUP } /* blk=phoneticextensionssupplement */, + { 0, 3193, 0, 4, 0, UNI_ETHI } /* ethi */, + { 8, 4157, 3302, 3, 17, UNI_PI } /* isinitialpunctuation */, + { 2, 9731, 10355, 4, 3, UNI_CWT } /* cwt=yes */, + { 3, 9474, 5718, 5, 14, UNI_INSC__VOWELDEPENDENT } /* insc=voweldependent */, + { 3, 10229, 8726, 3, 7, UNI_DT__NB } /* dt=nobreak */, + { 1, 9991, 0, 4, 0, UNI_SHAW } /* shaw */, + { 3, 9123, 1, 6, 1, -UNI_XPOSIXLOWER } /* lower=n */, + { 1, 9691, 8476, 4, 8, UNI_INTIFINAGH } /* blk=tifinagh */, + { 6, 7907, 26, 9, 1, UNI_XIDS } /* xidstart=y */, + { 11, 1538, 2473, 24, 4, UNI_INPC__LEFT } /* indicpositionalcategory=left */, + { 3, 1553, 7, 10, 1, UNI_SC } /* category=sc */, + { 0, 4609, 0, 15, 0, UNI_CONTROLPICTURES } /* controlpictures */, + { 0, 4885, 2435, 4, 8, UNI_INGLAGOLITIC } /* inglagolitic */, + { 0, 185, 1903, 3, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* iscjkcompatideographssup */, + { 7, 9691, 1632, 4, 23, UNI_GEOMETRICSHAPESEXT } /* blk=geometricshapesextended */, + { 2, 3877, 9207, 17, 4, UNI_THAA } /* scriptextensions=thaa */, + { 0, 9979, 8797, 5, 6, UNI_SHAW } /* scx=shavian */, + { 48, 9461, 3382, 3, 3, UNI_SB__SE } /* sb=sep */, + { 0, 9063, 9454, 6, 5, -UNI_EPRES } /* epres=false */, + { 0, 8973, 1061, 7, 5, UNI_INCOPTIC } /* block=coptic */, + { 3, 9691, 9484, 4, 5, UNI_INLIMBU } /* blk=limbu */, + { 3, 185, 5096, 2, 5, UNI_XPOSIXDIGIT } /* isdigit */, + { 0, 185, 8719, 2, 7, UNI_NB } /* isnoblock */, + { 12, 7230, 866, 10, 2, UNI_BC__WS } /* bidiclass=ws */, + { 0, 8887, 1026, 7, 2, -UNI_XPOSIXSPACE } /* wspace=no */, + { 1, 7230, 6602, 10, 12, UNI_BC__ON } /* bidiclass=otherneutral */, + { 1, 7360, 10394, 10, 2, UNI_LB__XX } /* linebreak=xx */, + { 1, 8782, 6518, 7, 4, UNI_MEND } /* script=mend */, + { 4, 284, 0, 33, 0, UNI_MISCMATHSYMBOLSB } /* 
miscellaneousmathematicalsymbolsb */, + { 5, 7908, 36, 8, 1, UNI_IDS } /* idstart=t */, + { 1, 9979, 9444, 4, 5, UNI_DOGR } /* scx=dogra */, + { 9, 10226, 3, 3, 1, -UNI_DI } /* di=f */, + { 0, 10516, 469, 3, 4, UNI_P } /* ispunct */, + { 1, 9927, 10055, 4, 4, UNI_PCM } /* pcm=true */, + { 0, 9476, 9883, 3, 4, UNI_NARB } /* sc=narb */, + { 11, 8782, 1924, 7, 6, UNI_SC__ZYYY } /* script=common */, + { 2, 185, 1562, 2, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* issupsymbolsandpictographs */, + { 0, 9711, 8, 4, 1, UNI_CCC__A } /* ccc=a */, + { 0, 1946, 0, 12, 0, UNI_DIACRITICALS } /* diacriticals */, + { 1, 9691, 4282, 4, 16, UNI_MISCMATHSYMBOLSA } /* blk=miscmathsymbolsa */, + { 0, 1836, 9454, 22, 5, -UNI_CWL } /* changeswhenlowercased=false */, + { 3, 8881, 5075, 3, 13, UNI_ANCIENTSYMBOLS } /* isancientsymbols */, + { 21, 10253, 7664, 3, 9, UNI_LB__B2 } /* lb=breakboth */, + { 4, 9747, 36, 4, 1, UNI_DIA } /* dia=t */, + { 0, 185, 8300, 2, 8, UNI_DUPL } /* isduployan */, + { 0, 10516, 9940, 3, 3, UNI_MIAO } /* isplrd */, + { 8, 8782, 9823, 7, 4, UNI_SC__KTHI } /* script=kthi */, + { 8, 10508, 1847, 8, 5, UNI_XPOSIXLOWER } /* isxposixlower */, + { 2, 7230, 37, 10, 2, UNI_BC__EN } /* bidiclass=en */, + { 2, 9476, 9771, 3, 4, UNI_SC__GONM } /* sc=gonm */, + { 1, 3391, 10355, 18, 3, UNI__PERL_PATWS } /* patternwhitespace=yes */, + { 0, 1418, 7619, 24, 9, UNI_CCC__AL } /* canonicalcombiningclass=aboveleft */, + { 9, 4074, 4286, 16, 10, UNI_SM } /* generalcategory=mathsymbol */, + { 14, 9691, 630, 4, 30, UNI_CJKEXTE } /* blk=cjkunifiedideographsextensione */, + { 0, 4463, 3141, 4, 11, UNI_DEVANAGARIEXT } /* indevanagariext */, + { 1, 7297, 6594, 3, 3, UNI_HUNG } /* ishung */, + { 8, 3121, 9039, 18, 6, UNI_DT__ENC } /* decompositiontype=circle */, + { 17, 5116, 0, 13, 0, UNI_CI } /* caseignorable */, + { 3, 3928, 0, 17, 0, UNI_SUTTONSIGNWRITING } /* suttonsignwriting */, + { 0, 8782, 7863, 8, 8, UNI_SAMR } /* script=samaritan */, + { 0, 9691, 4474, 4, 15, UNI_ARABICEXTA } /* 
blk=arabicextendeda */, + { 0, 8782, 3265, 7, 8, UNI_SC__GEOR } /* script=georgian */, + { 2, 4074, 6132, 16, 2, UNI_PF } /* generalcategory=pf */, + { 1, 185, 9771, 2, 4, UNI_GONM } /* isgonm */, + { 13, 342, 0, 2, 0, UNI_PE } /* pe */, + { 0, 9979, 9683, 4, 4, UNI_BATK } /* scx=batk */, + { 3, 9979, 8276, 4, 4, UNI_BALI } /* scx=bali */, + { 1, 1418, 9320, 25, 4, UNI_CCC__18 } /* canonicalcombiningclass=ccc18 */, + { 0, 6529, 7836, 3, 8, UNI_INOLDUYGHUR } /* inolduyghur */, + { 0, 4972, 3482, 3, 17, UNI_TAIXUANJING } /* istaixuanjingsymbols */, + { 1, 9711, 9675, 4, 3, UNI_CCC__202 } /* ccc=atb */, + { 1, 9476, 8284, 3, 8, UNI_BASS } /* sc=bassavah */, + { 26, 3724, 0, 17, 0, UNI_ETHIOPICEXTB } /* ethiopicextendedb */, + { 0, 8973, 8824, 6, 7, UNI_SUPPUAB } /* block=suppuab */, + { 1, 8973, 3068, 7, 17, UNI_HALFMARKS } /* block=combininghalfmarks */, + { 4, 4684, 866, 15, 1, UNI_EA__W } /* eastasianwidth=w */, + { 42, 7811, 0, 4, 0, UNI_ITAL } /* ital */, + { 8, 4972, 2101, 3, 14, UNI_TRANSPORTANDMAP } /* istransportandmap */, + { 0, 4744, 9165, 15, 6, UNI_IDENTIFIERTYPE__NOTXID } /* identifiertype=notxid */, + { 25, 1553, 1, 9, 1, UNI_N } /* category=n */, + { 4, 9691, 9444, 4, 5, UNI_INDOGRA } /* blk=dogra */, + { 4, 4714, 0, 15, 0, UNI_grext_values_index } /* graphemeextend= */, + { 0, 10217, 6146, 3, 12, UNI_BC__AN } /* bc=arabicnumber */, + { 0, 9476, 7420, 3, 10, UNI_XPEO } /* sc=oldpersian */, + { 4, 10402, 25, 29, 1, UNI__PERL_PROBLEMATIC_LOCALE_FOLDS } /* _perl_problematic_locale_folds */, + { 9, 8973, 9871, 6, 3, UNI_INMRO } /* block=mro */, + { 0, 10253, 6829, 3, 11, UNI_LB__IN } /* lb=inseperable */, + { 16, 185, 3265, 2, 8, UNI_GEOR } /* isgeorgian */, + { 0, 10268, 8028, 3, 4, UNI_NV__2000 } /* nv=2000 */, + { 8, 1418, 9340, 25, 4, UNI_CCC__22 } /* canonicalcombiningclass=ccc22 */, + { 6, 1553, 48, 10, 1, UNI_SM } /* category=sm */, + { 3, 8881, 9680, 3, 3, UNI_AVST } /* isavst */, + { 0, 9264, 0, 5, 0, UNI_ADLM } /* adlam */, + { 0, 9691, 7450, 4, 
10, UNI_INPHOENICIAN } /* blk=phoenician */, + { 0, 1852, 26, 6, 1, UNI_CASED } /* cased=y */, + { 7, 9214, 3, 5, 1, -UNI_IDEO } /* ideo=f */, + { 10, 4074, 468, 16, 5, UNI_P } /* generalcategory=punct */, + { 1, 9711, 10392, 4, 2, UNI_CCC__9 } /* ccc=vr */, + { 1, 9747, 10055, 4, 4, UNI_DIA } /* dia=true */, + { 1, 21, 3319, 2, 18, UNI_LATINEXTADDITIONAL } /* inlatinextadditional */, + { 7, 185, 7736, 2, 9, UNI_LATINEXTD } /* islatinextd */, + { 18, 9476, 4410, 3, 6, UNI_SC__SYRC } /* sc=syriac */, + { 3, 185, 8628, 2, 6, UNI_GRBASE } /* isgrbase */, + { 2, 9207, 0, 6, 0, UNI_THAA } /* thaana */, + { 2, 8973, 1655, 6, 23, UNI_COMPATJAMO } /* block=hangulcompatibilityjamo */, + { 2, 2248, 7511, 3, 9, UNI_SMALLFORMS } /* insmallforms */, + { 1, 185, 6183, 3, 11, UNI_CHESSSYMBOLS } /* ischesssymbols */, + { 0, 3406, 9454, 3, 5, -UNI_CE } /* ce=false */, + { 0, 9647, 10067, 4, 4, UNI_AGE__12 } /* age=v120 */, + { 0, 10268, 9567, 3, 4, UNI_NV__1_SLASH_20 } /* nv=1/20 */, + { 1, 6842, 3607, 4, 15, UNI_UCAS } /* incanadiansyllabics */, + { 8, 9153, 9494, 6, 5, UNI_NFCQC__M } /* nfcqc=maybe */, + { 23, 5093, 10055, 9, 4, UNI_XPOSIXXDIGIT } /* hexdigit=true */, + { 8, 9979, 9294, 4, 5, UNI_BUHD } /* scx=buhid */, + { 0, 8973, 7790, 6, 9, UNI_INNEWTAILUE } /* block=newtailue */, + { 11, 9691, 4759, 4, 15, UNI_INIMPERIALARAMAIC } /* blk=imperialaramaic */, + { 0, 10268, 9627, 3, 4, UNI_NV__3_SLASH_64 } /* nv=3/64 */, + { 4, 1880, 10055, 22, 4, UNI_CWU } /* changeswhenuppercased=true */, + { 14, 9459, 10355, 5, 3, UNI_IDSB } /* idsb=yes */, + { 1, 8967, 26, 6, 1, UNI_BIDIM } /* bidim=y */, + { 24, 185, 1747, 2, 23, UNI_ZNAMENNYMUSIC } /* isznamennymusicalnotation */, + { 0, 3877, 2269, 17, 11, UNI_MTEI } /* scriptextensions=meeteimayek */, + { 0, 10253, 4401, 3, 9, UNI_EMOD } /* lb=emodifier */, + { 0, 1858, 10055, 22, 4, UNI_CWT } /* changeswhentitlecased=true */, + { 1, 8593, 0, 7, 0, UNI_compex_values_index } /* compex= */, + { 0, 3121, 4058, 18, 3, UNI_DT__FIN } /* 
decompositiontype=fin */, + { 7, 185, 6928, 2, 11, UNI_MEDF } /* ismedefaidrin */, + { 6, 7230, 32, 10, 2, UNI_BC__CS } /* bidiclass=cs */, + { 0, 1418, 9410, 25, 4, UNI_CCC__36 } /* canonicalcombiningclass=ccc36 */, + { 43, 9727, 0, 3, 0, UNI_CWL } /* cwl */, + { 3, 8782, 8614, 7, 4, UNI_ELYM } /* script=elym */, + { 4, 10217, 4520, 4, 14, UNI_BC__BN } /* bc=boundaryneutral */, + { 4, 1418, 8043, 24, 2, UNI_CCC__23 } /* canonicalcombiningclass=23 */, + { 3, 9979, 8356, 4, 4, UNI_HIRA } /* scx=hira */, + { 0, 9647, 10337, 4, 3, UNI_AGE__7 } /* age=v70 */, + { 1, 9711, 9012, 4, 3, UNI_CCC__129 } /* ccc=129 */, + { 36, 8782, 9117, 7, 4, UNI_LEPC } /* script=lepc */, + { 5, 9474, 0, 5, 0, UNI_insc_values_index } /* insc= */, + { 1, 1189, 2321, 3, 3, UNI_INTHAI } /* inthai */, + { 0, 7230, 2533, 10, 11, UNI_BC__R } /* bidiclass=righttoleft */, + { 0, 9476, 7808, 3, 9, UNI_ITAL } /* sc=olditalic */, + { 0, 3877, 3265, 17, 8, UNI_GEOR } /* scriptextensions=georgian */, + { 0, 6675, 1026, 11, 2, -UNI_IDC } /* idcontinue=no */, + { 0, 9691, 5927, 4, 13, UNI_LOWSURROGATES } /* blk=lowsurrogates */, + { 2, 2056, 10355, 22, 3, UNI__PERL_NCHAR } /* noncharactercodepoint=yes */, + { 1, 6083, 8060, 13, 8, UNI_NV__1_SLASH_3 } /* numericvalue=3.33e-01 */, + { 3, 6083, 8931, 13, 5, UNI_NV__60000 } /* numericvalue=60000 */, + { 1, 8782, 9947, 7, 4, UNI_SC__COPT } /* script=qaac */, + { 0, 8973, 8796, 6, 7, UNI_SHAW } /* block=shavian */, + { 0, 7467, 10079, 3, 4, UNI_IN__14 } /* in=v140 */, + { 9, 4074, 263, 16, 2, UNI_SM } /* generalcategory=sm */, + { 5, 3877, 9264, 17, 5, UNI_ADLM } /* scriptextensions=adlam */, + { 0, 6674, 0, 4, 0, UNI_XIDC } /* xidc */, + { 6, 8782, 8831, 7, 7, UNI_SC__TGLG } /* script=tagalog */, + { 0, 9979, 6362, 4, 5, UNI_KHMR } /* scx=khmer */, + { 2, 5550, 0, 15, 0, UNI_DT__CAN } /* nfdquickcheck=n */, + { 1, 10268, 9578, 3, 2, UNI_NV__41 } /* nv=41 */, + { 3, 9711, 9320, 5, 4, UNI_CCC__18 } /* ccc=ccc18 */, + { 4, 3121, 1254, 18, 4, UNI_DT__INIT } /* 
decompositiontype=init */, + { 0, 9691, 3193, 4, 8, UNI_INETHIOPIC } /* blk=ethiopic */, + { 0, 8782, 2248, 7, 21, UNI_PRTI } /* script=inscriptionalparthian */, + { 0, 10115, 0, 4, 0, UNI_QAAI } /* zinh */, + { 0, 2841, 0, 19, 0, UNI_MERO } /* meroitichieroglyphs */, + { 0, 9177, 26, 6, 1, UNI_QMARK } /* qmark=y */, + { 3, 7360, 10380, 10, 2, UNI_LB__H3 } /* linebreak=h3 */, + { 5, 8782, 4939, 7, 15, UNI_SARB } /* script=oldsoutharabian */, + { 0, 5875, 4819, 13, 15, UNI_JG__MANICHAEANSADHE } /* joininggroup=manichaeansadhe */, + { 0, 9449, 10055, 5, 4, UNI_EMOD } /* emod=true */, + { 1, 8782, 7811, 7, 4, UNI_ITAL } /* script=ital */, + { 0, 9691, 9195, 4, 6, UNI_INTANGSA } /* blk=tangsa */, + { 8, 4972, 10028, 3, 3, UNI_TAVT } /* istavt */, + { 1, 3398, 10355, 11, 3, UNI_XPOSIXSPACE } /* whitespace=yes */, + { 1, 3571, 0, 17, 0, UNI_ALCHEMICAL } /* alchemicalsymbols */, + { 0, 5875, 5966, 13, 13, UNI_JG__MANICHAEANMEM } /* joininggroup=manichaeanmem */, + { 2, 9711, 5461, 4, 2, UNI_CCC__7 } /* ccc=nk */, + { 6, 4074, 27, 16, 2, UNI_LOWERCASELETTER } /* generalcategory=ll */, + { 1, 8782, 3935, 8, 10, UNI_SGNW } /* script=signwriting */, + { 1, 10247, 7038, 3, 11, UNI_JG__ROHINGYAYEH } /* jg=rohingyayeh */, + { 1, 1553, 468, 9, 11, UNI_P } /* category=punctuation */, + { 3, 9476, 8508, 3, 8, UNI_VITH } /* sc=vithkuqi */, + { 0, 1655, 0, 23, 0, UNI_COMPATJAMO } /* hangulcompatibilityjamo */, + { 3, 4157, 6676, 3, 9, UNI_IDC } /* isidcontinue */, + { 1, 5875, 342, 13, 2, UNI_JG__PE } /* joininggroup=pe */, + { 0, 5875, 4789, 13, 15, UNI_JG__MANICHAEANALEPH } /* joininggroup=manichaeanaleph */, + { 0, 9979, 9093, 4, 6, UNI_KTHI } /* scx=kaithi */, + { 5, 3894, 10055, 17, 4, UNI_STERM } /* sentenceterminal=true */, + { 16, 8973, 1394, 6, 24, UNI_ARABICPFB } /* block=arabicpresentationformsb */, + { 0, 185, 4058, 2, 16, UNI_PF } /* isfinalpunctuation */, + { 3, 2248, 7863, 3, 8, UNI_INSAMARITAN } /* insamaritan */, + { 1, 9476, 7433, 3, 4, UNI_SC__SOGD } /* sc=sogd */, 
+ { 3, 8782, 8811, 8, 3, UNI_SOYO } /* script=soyo */, + { 0, 9476, 8537, 3, 7, UNI_SC__BENG } /* sc=bengali */, + { 17, 2955, 0, 19, 0, UNI_SUPARROWSA } /* supplementalarrowsa */, + { 2, 8782, 9195, 7, 6, UNI_TNSA } /* script=tangsa */, + { 0, 10229, 69, 3, 3, UNI_DT__SUP } /* dt=sup */, + { 1, 10280, 10355, 3, 3, UNI_RI } /* ri=yes */, + { 0, 9691, 5862, 4, 13, UNI_IPAEXT } /* blk=ipaextensions */, + { 4, 9763, 34, 4, 6, UNI_GCB__EX } /* gcb=extend */, + { 2, 8973, 1443, 7, 23, UNI_CJKSYMBOLS } /* block=cjksymbolsandpunctuation */, + { 2, 5875, 4218, 13, 16, UNI_JG__MANICHAEANDALETH } /* joininggroup=manichaeandaleth */, + { 12, 6340, 151, 4, 33, UNI_DIACRITICALSSUP } /* incombiningdiacriticalmarkssupplement */, + { 8, 9887, 0, 4, 0, UNI_NBAT } /* nbat */, + { 12, 9743, 26, 4, 1, UNI_DEP } /* dep=y */, + { 25, 9474, 2868, 5, 10, UNI_INSC__TONELETTER } /* insc=toneletter */, + { 3, 3877, 6302, 17, 6, UNI_HEBR } /* scriptextensions=hebrew */, + { 0, 8558, 0, 7, 0, UNI_CJKEXTC } /* cjkextc */, + { 0, 10268, 8235, 3, 2, UNI_NV__28 } /* nv=28 */, + { 1, 4074, 3301, 16, 18, UNI_PI } /* generalcategory=initialpunctuation */, + { 9, 6083, 7940, 13, 8, UNI_NV__1_SLASH_80 } /* numericvalue=1.25e-02 */, + { 0, 6083, 5732, 13, 11, UNI_NV__10000000000 } /* numericvalue=10000000000 */, + { 14, 3139, 0, 4, 0, UNI_DEVA } /* deva */, + { 15, 118, 5863, 3, 5, UNI_IPAEXT } /* inipaext */, + { 5, 5662, 1195, 14, 2, UNI_LB__LF } /* sentencebreak=lf */, + { 23, 1836, 1026, 22, 2, -UNI_CWL } /* changeswhenlowercased=no */, + { 1, 9751, 0, 4, 0, UNI_DIAK } /* diak */, + { 34, 9691, 2936, 4, 9, UNI_INSUNDANESE } /* blk=sundanese */, + { 7, 185, 3445, 2, 4, UNI_RUMI } /* isrumi */, + { 0, 10516, 9932, 3, 3, UNI_PHLP } /* isphlp */, + { 5, 3877, 8691, 17, 4, UNI_MULT } /* scriptextensions=mult */, + { 2, 21, 3445, 2, 18, UNI_RUMI } /* inruminumeralsymbols */, + { 2, 6340, 44, 3, 15, UNI_CJKCOMPAT } /* incjkcompatibility */, + { 0, 8782, 1655, 7, 6, UNI_SC__HANG } /* script=hangul */, + { 
0, 1274, 1026, 21, 2, -UNI_CE } /* compositionexclusion=no */, + { 26, 8973, 3193, 6, 18, UNI_ETHIOPICSUP } /* block=ethiopicsupplement */, + { 0, 9691, 3193, 4, 18, UNI_ETHIOPICSUP } /* blk=ethiopicsupplement */, + { 80, 7460, 10343, 10, 3, UNI_IN__9 } /* presentin=v90 */, + { 1, 9051, 36, 6, 1, UNI_ECOMP } /* ecomp=t */, + { 18, 6529, 7809, 3, 8, UNI_INOLDITALIC } /* inolditalic */, + { 3, 1858, 26, 22, 1, UNI_CWT } /* changeswhentitlecased=y */, + { 1, 8973, 6928, 6, 11, UNI_INMEDEFAIDRIN } /* block=medefaidrin */, + { 6, 9237, 0, 4, 0, UNI_YEZI } /* yezi */, + { 6, 9979, 7501, 5, 9, UNI_SAUR } /* scx=saurashtra */, + { 4, 6083, 10366, 13, 2, UNI_NV__46 } /* numericvalue=46 */, + { 0, 8973, 3978, 6, 8, UNI_INBOPOMOFO } /* block=bopomofo */, + { 0, 9695, 752, 4, 5, UNI_BPT__C } /* bpt=close */, + { 0, 2312, 4139, 3, 15, UNI_HIGHPUSURROGATES } /* inhighpusurrogates */, + { 0, 6937, 0, 13, 0, UNI_MISCSYMBOLS } /* inmiscsymbols */, + { 0, 185, 9767, 2, 4, UNI_GONG } /* isgong */, + { 0, 7297, 2228, 3, 3, UNI_HAN } /* ishani */, + { 1, 10247, 5953, 3, 13, UNI_JG__MALAYALAMNNNA } /* jg=malayalamnnna */, + { 1, 10511, 1847, 5, 5, UNI_POSIXLOWER } /* posixlower */, + { 1, 10516, 469, 3, 10, UNI_P } /* ispunctuation */, + { 3, 6083, 8044, 13, 8, UNI_NV__1_SLASH_32 } /* numericvalue=3.13e-02 */, + { 4, 5875, 4829, 13, 5, UNI_JG__SADHE } /* joininggroup=sadhe */, + { 0, 9474, 9225, 5, 6, UNI_INSC__VIRAMA } /* insc=virama */, + { 14, 8973, 0, 6, 43, UNI_UCASEXTA } /* block=unifiedcanadianaboriginalsyllabicsextendeda */, + { 1, 1418, 9004, 25, 4, UNI_CCC__12 } /* canonicalcombiningclass=ccc12 */, + { 2, 10352, 4912, 3, 2, UNI_WB__DQ } /* wb=dq */, + { 2, 1553, 401, 9, 6, UNI_CF } /* category=format */, + { 17, 9691, 5772, 5, 12, UNI_BLOCKELEMENTS } /* blk=blockelements */, + { 18, 10247, 6693, 3, 4, UNI_JG__NOON } /* jg=noon */, + { 8, 4157, 60, 3, 3, UNI_IDEO } /* isideo */, + { 16, 185, 1167, 2, 25, UNI_DI } /* isdefaultignorablecodepoint */, + { 1, 185, 7570, 2, 4, 
UNI_WARA } /* iswara */, + { 5, 1088, 3, 27, 1, -UNI_PCM } /* prependedconcatenationmark=f */, + { 2, 9476, 6302, 3, 6, UNI_HEBR } /* sc=hebrew */, + { 0, 8768, 26, 7, 1, UNI_PATSYN } /* patsyn=y */, + { 1, 5662, 1090, 15, 2, UNI_SB__SE } /* sentencebreak=sep */, + { 0, 1295, 0, 25, 0, UNI_SUPERANDSUB } /* superscriptsandsubscripts */, + { 2, 8782, 2085, 7, 4, UNI_SC__MODI } /* script=modi */, + { 7, 8782, 10019, 7, 4, UNI_TALU } /* script=talu */, + { 1, 868, 0, 28, 0, UNI_PHONETICEXTSUP } /* phoneticextensionssupplement */, + { 14, 7467, 7923, 3, 2, UNI_IN__11 } /* in=11 */, + { 10, 9474, 8268, 5, 8, UNI_INSC__AVAGRAHA } /* insc=avagraha */, + { 3, 10229, 8364, 3, 8, UNI_DT__ISO } /* dt=isolated */, + { 7, 4972, 9208, 3, 5, UNI_THAA } /* isthaana */, + { 1, 9549, 36, 5, 1, UNI_XIDS } /* xids=t */, + { 1, 9476, 9779, 3, 4, UNI_SC__GUJR } /* sc=gujr */, + { 0, 6529, 7827, 3, 8, UNI_INOLDTURKIC } /* inoldturkic */, + { 9, 8593, 9454, 7, 5, -UNI_COMPEX } /* compex=false */, + { 3, 9711, 9380, 5, 4, UNI_CCC__30 } /* ccc=ccc30 */, + { 0, 8712, 26, 7, 1, UNI_DT__NONE } /* nfkdqc=y */, + { 0, 6158, 1, 12, 1, -UNI_BIDIC } /* bidicontrol=n */, + { 4, 9647, 10298, 4, 3, UNI_AGE__2_DOT_1 } /* age=v21 */, + { 0, 9476, 8388, 3, 4, UNI_SC__JAVA } /* sc=java */, + { 2, 9691, 4426, 4, 16, UNI_TANGUTCOMPONENTS } /* blk=tangutcomponents */, + { 10, 2056, 36, 22, 1, UNI__PERL_NCHAR } /* noncharactercodepoint=t */, + { 0, 3877, 3049, 17, 4, UNI_CHER } /* scriptextensions=cher */, + { 0, 9057, 3, 6, 1, -UNI_EMOJI } /* emoji=f */, + { 0, 1538, 7115, 24, 11, UNI_INPC__TOPANDRIGHT } /* indicpositionalcategory=topandright */, + { 0, 1418, 8102, 24, 2, UNI_CCC__17 } /* canonicalcombiningclass=17 */, + { 0, 185, 251, 2, 33, UNI_MISCMATHSYMBOLSA } /* ismiscellaneousmathematicalsymbolsa */, + { 16, 10119, 0, 4, 0, UNI_ZYYY } /* zyyy */, + { 1, 8782, 9895, 7, 3, UNI_SC__NKO } /* script=nko */, + { 2, 185, 661, 3, 29, UNI_CJKEXTF } /* iscjkunifiedideographsextensionf */, + { 0, 7682, 10355, 9, 
3, UNI_EXT } /* extender=yes */, + { 0, 9550, 0, 4, 0, UNI_ids_values_index } /* ids= */, + { 0, 6674, 0, 12, 0, UNI_xidc_values_index } /* xidcontinue= */, + { 0, 9979, 8300, 4, 8, UNI_DUPL } /* scx=duployan */, + { 1, 9476, 7853, 3, 4, UNI_PAUC } /* sc=pauc */, + { 8, 107, 0, 6, 0, UNI_S } /* symbol */, + { 1, 1115, 10055, 26, 4, UNI_CWKCF } /* changeswhennfkccasefolded=true */, + { 2, 5823, 10355, 13, 3, UNI_GRBASE } /* graphemebase=yes */, + { 1, 9476, 9839, 3, 4, UNI_SC__LINA } /* sc=lina */, + { 0, 7297, 8, 3, 2, UNI_HAN } /* ishan */, + { 0, 10244, 46, 3, 2, UNI_CO } /* gc=co */, + { 8, 9469, 473, 3, 2, UNI_PUA } /* inpua */, + { 4, 9469, 2473, 5, 4, UNI_INPC__LEFT } /* inpc=left */, + { 3, 9469, 910, 3, 13, UNI_PUA } /* inprivateusearea */, + { 7, 8881, 98, 3, 9, UNI_XPOSIXALPHA } /* isalphabetic */, + { 5, 185, 2879, 2, 9, UNI_MONG } /* ismongolian */, + { 2, 7467, 9583, 3, 4, UNI_IN__10 } /* in=10.0 */, + { 8, 9979, 3103, 4, 4, UNI_COPT } /* scx=copt */, + { 1, 9213, 0, 6, 0, UNI_uideo_values_index } /* uideo= */, + { 1, 9057, 36, 6, 1, UNI_EMOJI } /* emoji=t */, + { 1, 10268, 8913, 3, 6, UNI_NV__400000 } /* nv=400000 */, + { 11, 9979, 79, 4, 6, UNI_ARAB } /* scx=arabic */, + { 0, 8508, 0, 4, 0, UNI_VITH } /* vith */, + { 0, 3894, 1, 17, 1, -UNI_STERM } /* sentenceterminal=n */, + { 8, 9979, 4849, 4, 15, UNI_MERC } /* scx=meroiticcursive */, + { 0, 9711, 9335, 5, 4, UNI_CCC__21 } /* ccc=ccc21 */, + { 2, 7071, 0, 4, 0, UNI_SORA } /* sora */, + { 1, 8782, 9891, 7, 4, UNI_NEWA } /* script=newa */, + { 0, 5408, 8686, 4, 5, UNI_INMARCHEN } /* inmarchen */, + { 4, 7218, 4535, 3, 6, UNI_BRAI } /* inbraille */, + { 2, 9476, 2227, 3, 14, UNI_SC__ROHG } /* sc=hanifirohingya */, + { 0, 10508, 7908, 3, 7, UNI_XIDS } /* isxidstart */, + { 0, 8973, 9069, 6, 6, UNI_INGOTHIC } /* block=gothic */, + { 11, 21, 5746, 3, 12, UNI_AEGEANNUMBERS } /* inaegeannumbers */, + { 0, 185, 3409, 2, 17, UNI_RI } /* isregionalindicator */, + { 1, 10560, 2423, 3, 3, UNI_VITH } /* isvith 
*/, + { 2, 9979, 8500, 4, 4, UNI_UGAR } /* scx=ugar */, + { 8, 6626, 0, 12, 0, UNI_PLAYINGCARDS } /* playingcards */, + { 0, 8782, 9951, 7, 4, UNI_SC__QAAI } /* script=qaai */, + { 3, 8973, 5862, 6, 6, UNI_IPAEXT } /* block=ipaext */, + { 2, 1990, 7799, 22, 9, UNI_INSC__NONJOINER } /* indicsyllabiccategory=nonjoiner */, + { 2, 5648, 0, 13, 0, UNI_QMARK } /* quotationmark */, + { 13, 10268, 5732, 3, 8, UNI_NV__10000000 } /* nv=10000000 */, + { 3, 6340, 8587, 3, 6, UNI_CJKEXTG } /* incjkextg */, + { 0, 9691, 8538, 5, 6, UNI_INBENGALI } /* blk=bengali */, + { 6, 9219, 10355, 6, 3, UNI_XPOSIXUPPER } /* upper=yes */, + { 5, 8973, 6614, 6, 12, UNI_PHAISTOS } /* block=phaistosdisc */, + { 1, 8973, 3792, 6, 17, UNI_INKHITANSMALLSCRIPT } /* block=khitansmallscript */, + { 0, 10553, 8804, 3, 3, UNI_SIDD } /* issidd */, + { 1, 9476, 9129, 3, 6, UNI_LYCI } /* sc=lycian */, + { 0, 9691, 7530, 4, 10, UNI_SUPARROWSB } /* blk=suparrowsb */, + { 1, 10217, 4362, 3, 16, UNI_BC__S } /* bc=segmentseparator */, + { 1, 9979, 9524, 4, 5, UNI_RUNR } /* scx=runic */, + { 12, 8973, 4330, 6, 16, UNI_MYANMAREXTB } /* block=myanmarextendedb */, + { 0, 9979, 10004, 5, 3, UNI_SOGO } /* scx=sogo */, + { 0, 6083, 5732, 13, 6, UNI_NV__100000 } /* numericvalue=100000 */, + { 7, 5088, 0, 5, 0, UNI_ASCII } /* ascii */, + { 0, 185, 5836, 2, 8, UNI_GREEKEXT } /* isgreekext */, + { 4, 10508, 10528, 8, 5, UNI_XPOSIXPRINT } /* isxposixprint */, + { 1, 5875, 5992, 13, 13, UNI_JG__MANICHAEANONE } /* joininggroup=manichaeanone */, + { 1, 1219, 0, 26, 0, UNI_KATAKANAEXT } /* katakanaphoneticextensions */, + { 1, 1836, 36, 22, 1, UNI_CWL } /* changeswhenlowercased=t */, + { 4, 5029, 0, 8, 0, UNI_VEDICEXT } /* vedicext */, + { 4, 5214, 0, 14, 0, UNI_INGREEK } /* greekandcoptic */, + { 4, 9544, 10355, 5, 3, UNI_XIDC } /* xidc=yes */, + { 0, 3877, 4924, 17, 15, UNI_NARB } /* scriptextensions=oldnortharabian */, + { 32, 8782, 8979, 7, 6, UNI_CARI } /* script=carian */, + { 17, 7790, 0, 9, 0, UNI_TALU } /* newtailue 
*/, + { 0, 9844, 5774, 5, 10, UNI_BLOCKELEMENTS } /* inblockelements */, + { 0, 9474, 3994, 5, 16, UNI_INSC__CANTILLATIONMARK } /* insc=cantillationmark */, + { 1, 1167, 0, 26, 0, UNI_di_values_index } /* defaultignorablecodepoint= */, + { 0, 185, 7330, 2, 4, UNI_KHAR } /* iskhar */, + { 9, 447, 0, 32, 0, UNI_IDEOGRAPHICSYMBOLS } /* ideographicsymbolsandpunctuation */, + { 2, 8973, 2311, 6, 7, UNI_INSINHALA } /* block=sinhala */, + { 7, 8782, 7330, 7, 10, UNI_KHAR } /* script=kharoshthi */, + { 0, 7433, 0, 7, 0, UNI_SOGD } /* sogdian */, + { 2, 8782, 9703, 7, 4, UNI_SC__CAKM } /* script=cakm */, + { 7, 7460, 5732, 10, 2, UNI_IN__10 } /* presentin=10 */, + { 4, 3121, 2809, 18, 3, UNI_DT__NAR } /* decompositiontype=nar */, + { 0, 3877, 3792, 17, 17, UNI_KITS } /* scriptextensions=khitansmallscript */, + { 1, 9647, 10063, 4, 3, UNI_IN__1_DOT_1 } /* age=v11 */, + { 5, 9711, 7320, 4, 4, UNI_CCC__6 } /* ccc=hanr */, + { 3, 8782, 7844, 7, 9, UNI_PALM } /* script=palmyrene */, + { 1, 3673, 0, 17, 0, UNI_CYRILLICEXTB } /* cyrillicextendedb */, + { 6, 10247, 5396, 3, 14, UNI_JG__MANICHAEANAYIN } /* jg=manichaeanayin */, + { 0, 8973, 3837, 7, 3, UNI_INCHAM } /* block=cham */, + { 3, 9691, 6614, 4, 8, UNI_PHAISTOS } /* blk=phaistos */, + { 9, 9691, 2727, 4, 19, UNI_ENCLOSEDALPHANUMSUP } /* blk=enclosedalphanumsup */, + { 1, 9476, 9875, 3, 4, UNI_MTEI } /* sc=mtei */, + { 1, 10247, 9243, 3, 6, UNI_JG__YUDHHE } /* jg=yudhhe */, + { 1, 9711, 10157, 4, 3, UNI_CCC__AL } /* ccc=228 */, + { 2, 10247, 3843, 3, 17, UNI_JG__MANICHAEANHUNDRED } /* jg=manichaeanhundred */, + { 2, 3877, 7781, 17, 9, UNI_NBAT } /* scriptextensions=nabataean */, + { 1, 10247, 5940, 3, 13, UNI_JG__MALAYALAMLLLA } /* jg=malayalamllla */, + { 23, 9923, 0, 4, 0, UNI_OUGR } /* ougr */, + { 1, 185, 5836, 2, 13, UNI_GREEKEXT } /* isgreekextended */, + { 35, 9711, 8059, 4, 2, UNI_CCC__33 } /* ccc=33 */, + { 0, 10109, 1748, 3, 22, UNI_ZNAMENNYMUSIC } /* inznamennymusicalnotation */, + { 1, 8782, 8649, 7, 7, 
UNI_SC__KNDA } /* script=kannada */, + { 2, 185, 2374, 3, 19, UNI_PC } /* isconnectorpunctuation */, + { 0, 10268, 8171, 3, 2, UNI_NV__26 } /* nv=26 */, + { 1, 8973, 7862, 6, 9, UNI_INSAMARITAN } /* block=samaritan */, + { 8, 10244, 7005, 3, 11, UNI_SO } /* gc=othersymbol */, + { 5, 9545, 1026, 4, 2, -UNI_IDC } /* idc=no */, + { 2, 6340, 3050, 3, 17, UNI_CHEROKEESUP } /* incherokeesupplement */, + { 6, 8955, 26, 6, 1, UNI_XPOSIXALPHA } /* alpha=y */, + { 36, 6083, 8913, 13, 2, UNI_NV__40 } /* numericvalue=40 */, + { 1, 9135, 0, 4, 0, UNI_LYDI } /* lydi */, + { 1, 10268, 8196, 3, 8, UNI_NV__15_SLASH_2 } /* nv=7.50e+00 */, + { 41, 21, 1678, 2, 9, UNI_LATINEXTE } /* inlatinexte */, + { 0, 9979, 6518, 4, 12, UNI_MEND } /* scx=mendekikakui */, + { 12, 185, 184, 2, 34, UNI_MISCPICTOGRAPHS } /* ismiscellaneoussymbolsandpictographs */, + { 1, 10560, 25, 3, 1, UNI_VS } /* isvs */, + { 0, 10510, 10528, 6, 5, UNI_XPOSIXPRINT } /* xposixprint */, + { 25, 1655, 0, 6, 0, UNI_HANG } /* hangul */, + { 0, 4972, 6091, 3, 3, UNI_TALU } /* istalu */, + { 3, 4847, 6520, 4, 10, UNI_INMENDEKIKAKUI } /* inmendekikakui */, + { 2, 3877, 8621, 17, 4, UNI_GRAN } /* scriptextensions=gran */, + { 0, 8614, 0, 4, 0, UNI_ELYM } /* elym */, + { 0, 9476, 5368, 3, 4, UNI_LISU } /* sc=lisu */, + { 5, 9691, 2936, 4, 19, UNI_SUNDANESESUP } /* blk=sundanesesupplement */, + { 2, 8782, 9444, 7, 5, UNI_SC__DOGR } /* script=dogra */, + { 0, 9434, 10055, 5, 4, UNI_CWCM } /* cwcm=true */, + { 0, 9711, 9018, 4, 3, UNI_CCC__130 } /* ccc=130 */, + { 0, 9461, 340, 3, 2, UNI_SB__LO } /* sb=lo */, + { 5, 8782, 8340, 7, 8, UNI_SC__GUJR } /* script=gujarati */, + { 4, 10253, 1528, 3, 9, UNI_LB__SG } /* lb=surrogate */, + { 2, 8973, 6862, 6, 11, UNI_KATAKANAEXT } /* block=katakanaext */, + { 0, 10268, 7956, 3, 8, UNI_NV__3_SLASH_2 } /* nv=1.50e+00 */, + { 1, 7297, 1419, 3, 3, UNI_HANO } /* ishano */, + { 8, 6083, 8937, 13, 3, UNI_NV__700 } /* numericvalue=700 */, + { 0, 9691, 2613, 4, 19, UNI_ANCIENTGREEKNUMBERS } /* 
blk=ancientgreeknumbers */, + { 16, 3877, 7072, 18, 10, UNI_SORA } /* scriptextensions=sorasompeng */, + { 3, 21, 9183, 2, 6, UNI_INREJANG } /* inrejang */, + { 1, 10047, 0, 4, 0, UNI_TNSA } /* tnsa */, + { 0, 9979, 9739, 4, 4, UNI_CYRL } /* scx=cyrl */, + { 0, 8973, 4924, 6, 15, UNI_NARB } /* block=oldnortharabian */, + { 1, 185, 4314, 2, 7, UNI_MYMR } /* ismyanmar */, + { 2, 8348, 0, 8, 0, UNI_GURU } /* gurmukhi */, + { 0, 9711, 7990, 4, 1, UNI_CCC__8 } /* ccc=8 */, + { 1, 1418, 9300, 25, 4, UNI_CCC__14 } /* canonicalcombiningclass=ccc14 */, + { 0, 2879, 0, 12, 0, UNI_MONGOLIANSUP } /* mongoliansup */, + { 2, 10253, 7410, 3, 10, UNI_LB__NS } /* lb=nonstarter */, + { 0, 9691, 6206, 4, 12, UNI_CYRILLICEXTB } /* blk=cyrillicextb */, + { 13, 5408, 331, 4, 19, UNI_MATHOPERATORS } /* inmathematicaloperators */, + { 12, 4972, 1870, 3, 8, UNI_TITLE } /* istitlecase */, + { 10, 1553, 1588, 9, 1, UNI_Z } /* category=z */, + { 0, 4074, 1934, 16, 2, UNI_CN } /* generalcategory=cn */, + { 1, 5648, 26, 14, 1, UNI_QMARK } /* quotationmark=y */, + { 2, 8782, 0, 14, 0, UNI_SC__SHRD } /* script=sharada */, + { 2, 10268, 8172, 3, 8, UNI_NV__1_SLASH_160 } /* nv=6.25e-03 */, + { 0, 5875, 10292, 13, 3, UNI_JG__TAH } /* joininggroup=tah */, + { 0, 8973, 383, 6, 32, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* block=egyptianhieroglyphformatcontrols */, + { 0, 10352, 1219, 3, 2, UNI_WB__KA } /* wb=ka */, + { 3, 720, 0, 30, 0, UNI_CUNEIFORMNUMBERS } /* cuneiformnumbersandpunctuation */, + { 2, 6083, 8907, 13, 3, UNI_NV__300 } /* numericvalue=300 */, + { 0, 8881, 864, 4, 4, UNI_ARROWS } /* isarrows */, + { 3, 4463, 3141, 4, 8, UNI_INDEVANAGARI } /* indevanagari */, + { 16, 185, 6961, 2, 11, UNI_MYANMAREXTB } /* ismyanmarextb */, + { 0, 9979, 10095, 4, 4, UNI_XPEO } /* scx=xpeo */, + { 0, 8782, 10004, 8, 3, UNI_SOGO } /* script=sogo */, + { 2, 9171, 10355, 6, 3, UNI__PERL_PATWS } /* patws=yes */, + { 0, 8973, 5029, 6, 8, UNI_VEDICEXT } /* block=vedicext */, + { 0, 896, 0, 28, 0, UNI_SUPPUAA } 
/* supplementaryprivateuseareaa */, + { 2, 1418, 9016, 25, 5, UNI_CCC__130 } /* canonicalcombiningclass=ccc130 */, + { 16, 6741, 0, 11, 0, UNI_dep_values_index } /* deprecated= */, + { 1, 2453, 0, 20, 0, UNI_PHLI } /* inscriptionalpahlavi */, + { 0, 3978, 0, 16, 0, UNI_BOPOMOFOEXT } /* bopomofoextended */, + { 8, 185, 1595, 2, 14, UNI_MUSIC } /* ismusicalsymbols */, + { 0, 9087, 26, 6, 1, UNI_JOINC } /* joinc=y */, + { 3, 9476, 2353, 3, 20, UNI_HLUW } /* sc=anatolianhieroglyphs */, + { 2, 7230, 10238, 10, 3, UNI_BC__FSI } /* bidiclass=fsi */, + { 4, 149, 0, 35, 0, UNI_DIACRITICALSSUP } /* combiningdiacriticalmarkssupplement */, + { 0, 9691, 5270, 4, 6, UNI_KANGXI } /* blk=kangxi */, + { 0, 9879, 0, 4, 0, UNI_MYMR } /* mymr */, + { 0, 185, 4186, 2, 16, UNI_LINEARBIDEOGRAMS } /* islinearbideograms */, + { 1, 7460, 10075, 10, 4, UNI_IN__13 } /* presentin=v130 */, + { 1, 7391, 534, 4, 2, UNI_CANS } /* iscans */, + { 2, 8881, 15, 4, 2, UNI_ARAB } /* isarab */, + { 0, 9201, 0, 6, 0, UNI_TELU } /* telugu */, + { 0, 1189, 9535, 3, 4, UNI_INTAKRI } /* intakri */, + { 0, 8973, 3624, 8, 15, UNI_INCAUCASIANALBANIAN } /* block=caucasianalbanian */, + { 0, 185, 9484, 2, 5, UNI_LIMB } /* islimbu */, + { 48, 6614, 0, 12, 0, UNI_PHAISTOS } /* phaistosdisc */, + { 0, 185, 9504, 2, 5, UNI_NSHU } /* isnushu */, + { 0, 10217, 8, 3, 2, UNI_BC__AN } /* bc=an */, + { 5, 9476, 9915, 3, 4, UNI_SC__ORYA } /* sc=orya */, + { 0, 8973, 7510, 6, 10, UNI_SMALLFORMS } /* block=smallforms */, + { 0, 2304, 3356, 3, 17, UNI_ORNAMENTALDINGBATS } /* isornamentaldingbats */, + { 1, 9476, 8691, 3, 7, UNI_SC__MULT } /* sc=multani */, + { 14, 8881, 3964, 4, 7, UNI_ARABICSUP } /* isarabicsup */, + { 0, 3945, 10355, 17, 3, UNI_UIDEO } /* unifiedideograph=yes */, + { 1, 9979, 4426, 4, 4, UNI_TANG } /* scx=tang */, + { 6, 5592, 10355, 14, 3, UNI_PATSYN } /* patternsyntax=yes */, + { 1, 9743, 10355, 4, 3, UNI_DEP } /* dep=yes */, + { 8, 3877, 8476, 17, 8, UNI_TFNG } /* scriptextensions=tifinagh */, + { 8, 1538, 
62, 3, 4, UNI_INDOGRA } /* indogra */, + { 0, 9691, 1019, 4, 5, UNI_MUSIC } /* blk=music */, + { 1, 2185, 26, 21, 1, UNI_EXTPICT } /* extendedpictographic=y */, + { 8, 8973, 9444, 6, 5, UNI_INDOGRA } /* block=dogra */, + { 0, 3877, 5940, 17, 9, UNI_MLYM } /* scriptextensions=malayalam */, + { 0, 7230, 3797, 10, 3, UNI_BC__NSM } /* bidiclass=nsm */, + { 1, 4972, 8469, 3, 7, UNI_TAGB } /* istagbanwa */, + { 2, 8973, 6752, 6, 6, UNI_DOMINO } /* block=domino */, + { 18, 3877, 7826, 17, 9, UNI_ORKH } /* scriptextensions=oldturkic */, + { 1, 8973, 7093, 6, 11, UNI_SUPERANDSUB } /* block=superandsub */, + { 3, 4157, 448, 3, 17, UNI_IDEOGRAPHICSYMBOLS } /* isideographicsymbols */, + { 0, 9979, 9201, 4, 6, UNI_TELU } /* scx=telugu */, + { 1, 9691, 6122, 4, 12, UNI_ALPHABETICPF } /* blk=alphabeticpf */, + { 19, 10268, 8228, 3, 8, UNI_NV__1_SLASH_12 } /* nv=8.33e-02 */, + { 0, 9979, 7570, 4, 10, UNI_WARA } /* scx=warangciti */, + { 1, 3877, 10047, 17, 4, UNI_TNSA } /* scriptextensions=tnsa */, + { 2, 185, 9129, 2, 4, UNI_LYCI } /* islyci */, + { 2, 8782, 1116, 7, 4, UNI_SC__HANG } /* script=hang */, + { 0, 10553, 0, 3, 0, UNI_S } /* iss */, + { 0, 7580, 139, 10, 2, UNI_WB__FO } /* wordbreak=fo */, + { 8, 5875, 5420, 13, 4, UNI_JG__BETH } /* joininggroup=beth */, + { 0, 6340, 6183, 3, 11, UNI_CHESSSYMBOLS } /* inchesssymbols */, + { 0, 9476, 9891, 3, 4, UNI_NEWA } /* sc=newa */, + { 0, 9691, 251, 4, 33, UNI_MISCMATHSYMBOLSA } /* blk=miscellaneousmathematicalsymbolsa */, + { 1, 9691, 3792, 4, 17, UNI_INKHITANSMALLSCRIPT } /* blk=khitansmallscript */, + { 1, 8782, 9519, 7, 5, UNI_OSGE } /* script=osage */, + { 0, 4972, 1870, 3, 4, UNI_TITLE } /* istitle */, + { 0, 9803, 912, 4, 1, UNI_GCB__V } /* hst=v */, + { 9, 7467, 0, 3, 0, UNI_in_values_index } /* in= */, + { 0, 8292, 0, 4, 0, UNI_BUGI } /* bugi */, + { 7, 9691, 3445, 4, 4, UNI_RUMI } /* blk=rumi */, + { 0, 3877, 1223, 17, 4, UNI_KANA } /* scriptextensions=kana */, + { 12, 8973, 9034, 7, 5, UNI_INCHAKMA } /* block=chakma 
*/, + { 1, 2034, 0, 22, 0, UNI_MISCTECHNICAL } /* miscellaneoustechnical */, + { 6, 9476, 9667, 3, 4, UNI_ARMN } /* sc=armn */, + { 0, 9647, 8046, 4, 2, UNI_AGE__13 } /* age=13 */, + { 3, 3877, 8607, 17, 4, UNI_ELBA } /* scriptextensions=elba */, + { 16, 10268, 8943, 3, 2, UNI_NV__80 } /* nv=80 */, + { 0, 8973, 8810, 6, 7, UNI_INSOYOMBO } /* block=soyombo */, + { 5, 21, 5075, 3, 13, UNI_ANCIENTSYMBOLS } /* inancientsymbols */, + { 3, 185, 3265, 2, 11, UNI_GEORGIANSUP } /* isgeorgiansup */, + { 0, 9691, 1747, 4, 23, UNI_ZNAMENNYMUSIC } /* blk=znamennymusicalnotation */, + { 4, 8782, 9667, 7, 4, UNI_ARMN } /* script=armn */, + { 1, 6937, 4286, 6, 12, UNI_MISCMATHSYMBOLSA } /* inmiscmathsymbolsa */, + { 10, 7381, 0, 2, 0, UNI_VS } /* vs */, + { 0, 9691, 5606, 4, 14, UNI_PHONETICEXTSUP } /* blk=phoneticextsup */, + { 7, 2312, 2748, 4, 17, UNI_JAMOEXTA } /* inhanguljamoextendeda */, + { 0, 1990, 9499, 22, 5, UNI_INSC__NUKTA } /* indicsyllabiccategory=nukta */, + { 0, 6083, 9612, 13, 3, UNI_NV__5_SLASH_2 } /* numericvalue=5/2 */, + { 0, 1990, 1609, 22, 23, UNI_INSC__CONSONANTPRECEDINGREPHA } /* indicsyllabiccategory=consonantprecedingrepha */, + { 0, 9979, 9879, 4, 4, UNI_MYMR } /* scx=mymr */, + { 28, 5830, 26, 6, 1, UNI_EBASE } /* ebase=y */, + { 8, 185, 9105, 2, 6, UNI_KHOJ } /* iskhojki */, + { 0, 8973, 6961, 6, 11, UNI_MYANMAREXTB } /* block=myanmarextb */, + { 3, 8973, 896, 6, 28, UNI_SUPPUAA } /* block=supplementaryprivateuseareaa */, + { 0, 1219, 0, 8, 0, UNI_KANA } /* katakana */, + { 4, 8973, 5836, 6, 13, UNI_GREEKEXT } /* block=greekextended */, + { 1, 5875, 5396, 13, 14, UNI_JG__MANICHAEANAYIN } /* joininggroup=manichaeanayin */, + { 0, 3877, 2509, 17, 4, UNI_MONG } /* scriptextensions=mong */, + { 8, 2803, 1, 19, 1, -UNI_IDST } /* idstrinaryoperator=n */, + { 0, 6083, 8212, 13, 8, UNI_NV__4_SLASH_5 } /* numericvalue=8.00e-01 */, + { 0, 6083, 9604, 13, 3, UNI_NV__3_SLASH_2 } /* numericvalue=3/2 */, + { 18, 1274, 3, 21, 1, -UNI_CE } /* compositionexclusion=f 
*/, + { 0, 9979, 9129, 4, 6, UNI_LYCI } /* scx=lycian */, + { 0, 9691, 8572, 4, 7, UNI_CJKEXTE } /* blk=cjkexte */, + { 0, 21, 1674, 2, 4, UNI_JAMO } /* injamo */, + { 0, 10268, 8044, 3, 8, UNI_NV__1_SLASH_32 } /* nv=3.13e-02 */, + { 3, 4894, 10355, 15, 3, UNI_NFKCQC__Y } /* nfkcquickcheck=yes */, + { 0, 9691, 8979, 4, 6, UNI_INCARIAN } /* blk=carian */, + { 0, 3157, 0, 13, 0, UNI_EMOD } /* emojimodifier */, + { 2, 8782, 8684, 7, 4, UNI_MARC } /* script=marc */, + { 0, 3319, 0, 9, 0, UNI_LATINEXTA } /* latinexta */, + { 0, 9979, 7016, 4, 11, UNI_HMNG } /* scx=pahawhhmong */, + { 2, 3978, 0, 4, 0, UNI_BOPO } /* bopo */, + { 16, 185, 6044, 2, 13, UNI_MAYANNUMERALS } /* ismayannumerals */, + { 0, 10217, 3229, 3, 18, UNI_BC__FSI } /* bc=firststrongisolate */, + { 0, 7370, 1, 10, 1, -UNI_XPOSIXLOWER } /* lowercase=n */, + { 2, 185, 1678, 2, 14, UNI_LATINEXTA } /* islatinextendeda */, + { 0, 3894, 26, 17, 1, UNI_STERM } /* sentenceterminal=y */, + { 49, 7908, 3, 8, 1, -UNI_IDS } /* idstart=f */, + { 0, 1115, 1, 26, 1, -UNI_CWKCF } /* changeswhennfkccasefolded=n */, + { 0, 10516, 0, 12, 0, UNI_POSIXBLANK } /* isposixblank */, + { 0, 3877, 4042, 17, 7, UNI_CPRT } /* scriptextensions=cypriot */, + { 2, 2248, 3464, 3, 11, UNI_SMALLKANAEXT } /* insmallkanaext */, + { 40, 185, 3050, 3, 3, UNI_CHER } /* ischer */, + { 1, 10511, 5095, 5, 6, UNI_POSIXXDIGIT } /* posixxdigit */, + { 0, 9691, 43, 4, 36, UNI_CJKCOMPATIDEOGRAPHSSUP } /* blk=cjkcompatibilityideographssupplement */, + { 8, 9691, 10039, 4, 4, UNI_INTHAI } /* blk=thai */, + { 12, 21, 7727, 2, 9, UNI_LATINEXTC } /* inlatinextc */, + { 20, 4744, 7137, 15, 11, UNI_IDENTIFIERTYPE__UNCOMMONUSE } /* identifiertype=uncommonuse */, + { 8, 1418, 0, 24, 0, UNI_ccc_values_index } /* canonicalcombiningclass= */, + { 2, 1418, 9024, 24, 3, UNI_CCC__132 } /* canonicalcombiningclass=132 */, + { 0, 9489, 1, 5, 1, -UNI_MATH } /* math=n */, + { 3, 10268, 7611, 3, 1, UNI_NV__5 } /* nv=5 */, + { 5, 9839, 0, 4, 0, UNI_LINA } /* lina */, + { 
0, 4684, 1, 15, 1, UNI_EA__N } /* eastasianwidth=n */, + { 4, 1990, 2413, 22, 20, UNI_INSC__CONSONANTWITHSTACKER } /* indicsyllabiccategory=consonantwithstacker */, + { 0, 8642, 3, 7, 1, -UNI_HYPHEN } /* hyphen=f */, + { 6, 7467, 10328, 3, 3, UNI_IN__6_DOT_1 } /* in=v61 */, + { 1, 3877, 9195, 17, 6, UNI_TNSA } /* scriptextensions=tangsa */, + { 0, 8782, 9687, 7, 4, UNI_BHKS } /* script=bhks */, + { 8, 8782, 9201, 7, 6, UNI_SC__TELU } /* script=telugu */, + { 18, 9474, 9499, 5, 5, UNI_INSC__NUKTA } /* insc=nukta */, + { 0, 1418, 8907, 24, 2, UNI_CCC__30 } /* canonicalcombiningclass=30 */, + { 1, 9691, 6614, 4, 12, UNI_PHAISTOS } /* blk=phaistosdisc */, + { 0, 3122, 0, 5, 0, UNI_ECOMP } /* ecomp */, + { 0, 6937, 288, 6, 29, UNI_MISCMATHSYMBOLSB } /* inmiscellaneousmathematicalsymbolsb */, + { 0, 4074, 4999, 16, 15, UNI_TITLE } /* generalcategory=titlecaseletter */, + { 0, 9979, 9795, 4, 4, UNI_HMNG } /* scx=hmng */, + { 11, 9691, 8508, 4, 8, UNI_INVITHKUQI } /* blk=vithkuqi */, + { 1, 4714, 0, 14, 0, UNI_GREXT } /* graphemeextend */, + { 1, 9695, 0, 4, 0, UNI_bpt_values_index } /* bpt= */, + { 0, 10244, 468, 3, 11, UNI_P } /* gc=punctuation */, + { 1, 1852, 0, 6, 0, UNI_cased_values_index } /* cased= */, + { 26, 8973, 1747, 6, 23, UNI_ZNAMENNYMUSIC } /* block=znamennymusicalnotation */, + { 1, 8967, 10055, 6, 4, UNI_BIDIM } /* bidim=true */, + { 0, 9474, 5158, 5, 14, UNI_INSC__CONSONANTFINAL } /* insc=consonantfinal */, + { 3, 3877, 4504, 17, 5, UNI_BAMU } /* scriptextensions=bamum */, + { 3, 10508, 2803, 3, 3, UNI_XIDS } /* isxids */, + { 13, 7460, 10202, 10, 3, UNI_IN__6_DOT_3 } /* presentin=6.3 */, + { 0, 9159, 0, 8, 0, UNI_DT__CAN } /* nfdqc=no */, + { 0, 8973, 3265, 6, 11, UNI_GEORGIANSUP } /* block=georgiansup */, + { 0, 9683, 0, 4, 0, UNI_BATK } /* batk */, + { 2, 9214, 9454, 5, 5, -UNI_IDEO } /* ideo=false */, + { 0, 9045, 36, 6, 1, UNI_CWKCF } /* cwkcf=t */, + { 6, 7230, 8, 10, 2, UNI_BC__AN } /* bidiclass=an */, + { 1, 9269, 10055, 5, 4, UNI_POSIXXDIGIT } 
/* ahex=true */, + { 0, 9647, 7996, 4, 3, UNI_AGE__2 } /* age=2.0 */, + { 8, 5823, 10055, 13, 4, UNI_GRBASE } /* graphemebase=true */, + { 0, 4684, 9, 15, 2, UNI_EA__NA } /* eastasianwidth=na */, + { 0, 7160, 2, 3, 1, UNI_YI } /* isyi */, + { 2, 10280, 10055, 3, 4, UNI_RI } /* ri=true */, + { 0, 8973, 3657, 7, 16, UNI_CYRILLICEXTA } /* block=cyrillicextendeda */, + { 0, 10268, 7923, 3, 2, UNI_NV__11 } /* nv=11 */, + { 10, 185, 9435, 3, 3, UNI_CWCM } /* iscwcm */, + { 3, 9476, 5634, 3, 14, UNI_SC__PHLP } /* sc=psalterpahlavi */, + { 0, 8782, 6972, 7, 11, UNI_SC__NAND } /* script=nandinagari */, + { 1, 9979, 8838, 4, 7, UNI_LANA } /* scx=taitham */, + { 0, 10247, 7082, 3, 11, UNI_JG__STRAIGHTWAW } /* jg=straightwaw */, + { 8, 10247, 757, 3, 3, UNI_JG__DAL } /* jg=dal */, + { 2, 9979, 9667, 4, 4, UNI_ARMN } /* scx=armn */, + { 1, 5408, 6496, 4, 10, UNI_INMASARAMGONDI } /* inmasaramgondi */, + { 1, 8973, 6302, 6, 6, UNI_INHEBREW } /* block=hebrew */, + { 2, 10511, 63, 5, 5, UNI_POSIXGRAPH } /* posixgraph */, + { 8, 9979, 4534, 4, 4, UNI_BRAI } /* scx=brai */, + { 4, 2003, 4776, 11, 13, UNI_LOWERCASELETTER } /* category=lowercaseletter */, + { 2, 7230, 5578, 10, 14, UNI_BC__NSM } /* bidiclass=nonspacingmark */, + { 1, 9711, 8171, 4, 2, UNI_CCC__26 } /* ccc=26 */, + { 5, 6386, 0, 4, 0, UNI_MAHJ } /* mahj */, + { 6, 2012, 1, 22, 1, -UNI_LOE } /* logicalorderexception=n */, + { 2, 185, 2269, 2, 11, UNI_MTEI } /* ismeeteimayek */, + { 2, 2689, 0, 19, 0, UNI_COUNTINGROD } /* countingrodnumerals */, + { 19, 9514, 0, 5, 0, UNI_ORYA } /* oriya */, + { 2, 2808, 81, 4, 33, UNI_ARABICMATH } /* inarabicmathematicalalphabeticsymbols */, + { 9, 3877, 6302, 17, 4, UNI_HEBR } /* scriptextensions=hebr */, + { 3, 9691, 7270, 4, 10, UNI_CJKSTROKES } /* blk=cjkstrokes */, + { 1, 8973, 1946, 6, 22, UNI_DIACRITICALSFORSYMBOLS } /* block=diacriticalsforsymbols */, + { 5, 10253, 6278, 3, 4, UNI_LB__GL } /* lb=glue */, + { 0, 9979, 9867, 4, 4, UNI_MLYM } /* scx=mlym */, + { 0, 6083, 7956, 13, 
8, UNI_NV__3_SLASH_2 } /* numericvalue=1.50e+00 */, + { 61, 3403, 3, 6, 1, -UNI_XPOSIXSPACE } /* space=f */, + { 0, 3283, 1026, 18, 2, -UNI_IDSB } /* idsbinaryoperator=no */, + { 2, 8782, 8500, 7, 8, UNI_UGAR } /* script=ugaritic */, + { 11, 9979, 9534, 4, 4, UNI_TAKR } /* scx=takr */, + { 0, 9691, 5836, 4, 8, UNI_GREEKEXT } /* blk=greekext */, + { 17, 8973, 7271, 7, 9, UNI_CJKSTROKES } /* block=cjkstrokes */, + { 0, 5875, 6410, 13, 12, UNI_JG__MALAYALAMLLA } /* joininggroup=malayalamlla */, + { 0, 8973, 1586, 6, 14, UNI_BYZANTINEMUSIC } /* block=byzantinemusic */, + { 0, 7467, 7983, 3, 1, UNI_IN__7 } /* in=7 */, + { 11, 3406, 1, 3, 1, -UNI_CE } /* ce=n */, + { 3, 1466, 0, 13, 0, UNI_M } /* combiningmark */, + { 0, 10523, 0, 5, 0, UNI_XPOSIXBLANK } /* blank */, + { 1, 9189, 9454, 6, 5, -UNI_STERM } /* sterm=false */, + { 0, 9189, 10355, 6, 3, UNI_STERM } /* sterm=yes */, + { 2, 184, 0, 20, 0, UNI_MISCSYMBOLS } /* miscellaneoussymbols */, + { 1, 9545, 10355, 4, 3, UNI_IDC } /* idc=yes */, + { 4, 6083, 8937, 13, 4, UNI_NV__7000 } /* numericvalue=7000 */, + { 0, 9979, 494, 4, 3, UNI_HAN } /* scx=han */, + { 0, 1553, 7550, 9, 10, UNI_CN } /* category=unassigned */, + { 3, 10553, 6, 3, 1, UNI_SD } /* issd */, + { 0, 10247, 5704, 3, 14, UNI_JG__HAMZAONHEHGOAL } /* jg=tehmarbutagoal */, + { 3, 7467, 10304, 3, 3, UNI_IN__3_DOT_1 } /* in=v31 */, + { 3, 10051, 0, 4, 0, UNI_TOTO } /* toto */, + { 0, 2248, 3464, 3, 17, UNI_SMALLKANAEXT } /* insmallkanaextension */, + { 3, 38, 0, 2, 0, UNI_XPOSIXDIGIT } /* nd */, + { 1, 9931, 0, 4, 0, UNI_PHLP } /* phlp */, + { 0, 9434, 36, 5, 1, UNI_CWCM } /* cwcm=t */, + { 1, 7460, 7611, 10, 1, UNI_IN__5 } /* presentin=5 */, + { 4, 10095, 0, 4, 0, UNI_XPEO } /* xpeo */, + { 1, 3877, 8684, 17, 4, UNI_MARC } /* scriptextensions=marc */, + { 1, 10268, 5732, 3, 6, UNI_NV__100000 } /* nv=100000 */, + { 13, 6242, 0, 12, 0, UNI_ETHIOPICEXTB } /* ethiopicextb */, + { 1, 2248, 4411, 3, 5, UNI_INSYRIAC } /* insyriac */, + { 3, 9779, 0, 4, 0, UNI_GUJR } 
/* gujr */, + { 0, 8702, 752, 4, 14, UNI_ENCLOSEDALPHANUM } /* inenclosedalphanum */, + { 5, 9691, 5836, 4, 13, UNI_GREEKEXT } /* blk=greekextended */, + { 0, 3605, 0, 17, 0, UNI_UCAS } /* canadiansyllabics */, + { 0, 9476, 8684, 3, 7, UNI_MARC } /* sc=marchen */, + { 0, 8973, 6122, 6, 12, UNI_ALPHABETICPF } /* block=alphabeticpf */, + { 0, 7460, 10328, 10, 3, UNI_IN__6_DOT_1 } /* presentin=v61 */, + { 7, 4024, 0, 18, 0, UNI_PE } /* isclosepunctuation */, + { 4, 3877, 7570, 17, 4, UNI_WARA } /* scriptextensions=wara */, + { 10, 9691, 9504, 4, 5, UNI_INNUSHU } /* blk=nushu */, + { 9, 185, 780, 2, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* issymbolsandpictographsextendeda */, + { 0, 10268, 8949, 3, 2, UNI_NV__90 } /* nv=90 */, + { 19, 9476, 860, 4, 3, UNI_SC__KNDA } /* sc=knda */, + { 7, 9979, 8831, 4, 7, UNI_TGLG } /* scx=tagalog */, + { 0, 9476, 9237, 3, 4, UNI_SC__YEZI } /* sc=yezi */, + { 1, 10244, 7, 3, 1, UNI_C } /* gc=c */, + { 1, 9461, 9279, 3, 5, UNI_SB__AT } /* sb=aterm */, + { 0, 21, 8396, 2, 8, UNI_KANAEXTA } /* inkanaexta */, + { 0, 7391, 6721, 4, 9, UNI_CASEDLETTER } /* iscasedletter */, + { 2, 9979, 3049, 4, 4, UNI_CHER } /* scx=cher */, + { 1, 7853, 0, 4, 0, UNI_PAUC } /* pauc */, + { 16, 6083, 10196, 13, 3, UNI_NV__5_SLASH_8 } /* numericvalue=5/8 */, + { 4, 185, 721, 3, 29, UNI_CUNEIFORMNUMBERS } /* iscuneiformnumbersandpunctuation */, + { 4, 10268, 10214, 3, 3, UNI_NV__9_SLASH_2 } /* nv=9/2 */, + { 2, 9691, 3707, 4, 17, UNI_ETHIOPICEXTA } /* blk=ethiopicextendeda */, + { 0, 6083, 8028, 13, 3, UNI_NV__200 } /* numericvalue=200 */, + { 0, 5536, 9494, 14, 5, UNI_NFCQC__M } /* nfcquickcheck=maybe */, + { 9, 660, 0, 30, 0, UNI_CJKEXTF } /* cjkunifiedideographsextensionf */, + { 8, 48, 0, 1, 0, UNI_M } /* m */, + { 7, 5592, 36, 14, 1, UNI_PATSYN } /* patternsyntax=t */, + { 0, 185, 3139, 2, 18, UNI_DEVANAGARIEXT } /* isdevanagariextended */, + { 4, 10268, 8020, 3, 8, UNI_NV__1_SLASH_40 } /* nv=2.50e-02 */, + { 33, 1345, 0, 25, 0, UNI_SYMBOLSFORLEGACYCOMPUTING 
} /* symbolsforlegacycomputing */, + { 4, 9484, 0, 4, 0, UNI_LIMB } /* limb */, + { 0, 9711, 8028, 4, 3, UNI_WB__EB } /* ccc=200 */, + { 2, 4624, 0, 15, 0, UNI_CURRENCYSYMBOLS } /* currencysymbols */, + { 6, 6730, 0, 11, 0, UNI_CPMN } /* cyprominoan */, + { 0, 185, 4654, 2, 15, UNI_DIACRITICALSEXT } /* isdiacriticalsext */, + { 3, 3877, 9823, 17, 4, UNI_KTHI } /* scriptextensions=kthi */, + { 41, 8973, 2269, 6, 11, UNI_INMEETEIMAYEK } /* block=meeteimayek */, + { 2, 9979, 9183, 4, 6, UNI_RJNG } /* scx=rejang */, + { 1, 1538, 3499, 24, 18, UNI_INPC__TOPANDLEFTANDRIGHT } /* indicpositionalcategory=topandleftandright */, + { 1, 3877, 8790, 18, 6, UNI_SHRD } /* scriptextensions=sharada */, + { 1, 2803, 36, 19, 1, UNI_IDST } /* idstrinaryoperator=t */, + { 0, 10268, 8937, 3, 5, UNI_NV__70000 } /* nv=70000 */, + { 1, 9691, 9655, 4, 4, UNI_INAHOM } /* blk=ahom */, + { 0, 6083, 10178, 13, 3, UNI_NV__3_SLASH_4 } /* numericvalue=3/4 */, + { 0, 4504, 0, 5, 0, UNI_BAMU } /* bamum */, + { 0, 9827, 0, 4, 0, UNI_LANA } /* lana */, + { 11, 9647, 10316, 4, 3, UNI_AGE__5 } /* age=v50 */, + { 0, 10229, 1310, 3, 3, UNI_DT__SUB } /* dt=sub */, + { 0, 7580, 7772, 10, 6, UNI_WB__MN } /* wordbreak=midnum */, + { 0, 9476, 8292, 3, 8, UNI_SC__BUGI } /* sc=buginese */, + { 1, 8782, 7260, 7, 10, UNI_CHRS } /* script=chorasmian */, + { 2, 10232, 4527, 3, 7, UNI_EA__N } /* ea=neutral */, + { 0, 9550, 1026, 4, 2, -UNI_IDS } /* ids=no */, + { 0, 10244, 38, 3, 2, UNI_XPOSIXDIGIT } /* gc=nd */, + { 0, 9979, 8468, 4, 4, UNI_TAGB } /* scx=tagb */, + { 0, 8782, 3139, 7, 10, UNI_SC__DEVA } /* script=devanagari */, + { 0, 4972, 8860, 3, 6, UNI_TIBT } /* istibetan */, + { 4, 2936, 0, 19, 0, UNI_SUNDANESESUP } /* sundanesesupplement */, + { 0, 2553, 10056, 21, 3, UNI_TERM } /* terminalpunctuation=true */, + { 0, 185, 4202, 2, 16, UNI_LINEARBSYLLABARY } /* islinearbsyllabary */, + { 3, 9691, 1678, 4, 9, UNI_LATINEXTE } /* blk=latinexte */, + { 0, 3945, 1026, 17, 2, -UNI_UIDEO } /* unifiedideograph=no */, + 
{ 0, 185, 1586, 2, 23, UNI_BYZANTINEMUSIC } /* isbyzantinemusicalsymbols */, + { 1, 3877, 9135, 17, 6, UNI_LYDI } /* scriptextensions=lydian */, + { 0, 185, 9867, 2, 4, UNI_MLYM } /* ismlym */, + { 6, 5830, 10355, 6, 3, UNI_EBASE } /* ebase=yes */, + { 0, 4598, 1634, 4, 21, UNI_GEOMETRICSHAPESEXT } /* ingeometricshapesextended */, + { 0, 3877, 9915, 17, 4, UNI_ORYA } /* scriptextensions=orya */, + { 1, 9476, 9895, 3, 3, UNI_SC__NKO } /* sc=nko */, + { 10, 6194, 0, 12, 0, UNI_CYRILLICEXTA } /* cyrillicexta */, + { 10, 10268, 7951, 3, 1, UNI_NV__3 } /* nv=3 */, + { 0, 9461, 126, 3, 2, UNI_LB__CR } /* sb=cr */, + { 18, 2746, 0, 19, 0, UNI_JAMOEXTA } /* hanguljamoextendeda */, + { 35, 8973, 3962, 6, 16, UNI_ARABICSUP } /* block=arabicsupplement */, + { 0, 21, 6362, 2, 12, UNI_KHMERSYMBOLS } /* inkhmersymbols */, + { 0, 4972, 1288, 4, 2, UNI_TELU } /* istelu */, + { 1, 3877, 9719, 17, 4, UNI_CPMN } /* scriptextensions=cpmn */, + { 7, 2304, 1783, 4, 2, UNI_OLCK } /* isolck */, + { 0, 7218, 1587, 3, 13, UNI_BYZANTINEMUSIC } /* inbyzantinemusic */, + { 0, 10268, 8943, 3, 3, UNI_NV__800 } /* nv=800 */, + { 0, 6340, 571, 3, 29, UNI_CJKEXTC } /* incjkunifiedideographsextensionc */, + { 8, 9476, 8803, 3, 7, UNI_SIDD } /* sc=siddham */, + { 59, 8973, 7450, 6, 10, UNI_INPHOENICIAN } /* block=phoenician */, + { 0, 3877, 8754, 17, 7, UNI_OSMA } /* scriptextensions=osmanya */, + { 2, 10283, 10355, 3, 3, UNI_SD } /* sd=yes */, + { 1, 10402, 6675, 6, 6, UNI__PERL_IDCONT } /* _perl_idcont */, + { 1, 3398, 3, 11, 1, -UNI_XPOSIXSPACE } /* whitespace=f */, + { 1, 3877, 10083, 17, 3, UNI_VAI } /* scriptextensions=vai */, + { 0, 7230, 3211, 10, 18, UNI_BC__ET } /* bidiclass=europeanterminator */, + { 1, 7218, 1587, 3, 22, UNI_BYZANTINEMUSIC } /* inbyzantinemusicalsymbols */, + { 0, 6697, 1, 11, 1, -UNI_XPOSIXALPHA } /* alphabetic=n */, + { 2, 7297, 34, 3, 2, UNI_XPOSIXXDIGIT } /* ishex */, + { 1, 10268, 9254, 3, 5, UNI_NV__1_SLASH_320 } /* nv=1/320 */, + { 0, 8973, 1678, 6, 9, 
UNI_LATINEXTE } /* block=latinexte */, + { 4, 9823, 0, 4, 0, UNI_KTHI } /* kthi */, + { 3, 5093, 1, 9, 1, -UNI_XPOSIXXDIGIT } /* hexdigit=n */, + { 0, 8973, 115, 7, 24, UNI_DIACRITICALS } /* block=combiningdiacriticalmarks */, + { 1, 7360, 8642, 10, 2, UNI_LB__HY } /* linebreak=hy */, + { 3, 9057, 1026, 6, 2, -UNI_EMOJI } /* emoji=no */, + { 14, 8782, 10051, 7, 4, UNI_TOTO } /* script=toto */, + { 6, 1553, 1026, 9, 2, UNI_NO } /* category=no */, + { 0, 9979, 7, 4, 18, UNI_CANS } /* scx=canadianaboriginal */, + { 0, 7580, 18, 10, 2, UNI_RI } /* wordbreak=ri */, + { 0, 21, 4186, 2, 16, UNI_LINEARBIDEOGRAMS } /* inlinearbideograms */, + { 1, 9476, 7820, 3, 4, UNI_SC__PERM } /* sc=perm */, + { 0, 1930, 0, 16, 0, UNI_INDICNUMBERFORMS } /* indicnumberforms */, + { 1, 8973, 1655, 6, 6, UNI_INHANGUL } /* block=hangul */, + { 0, 21, 3573, 4, 15, UNI_ALCHEMICAL } /* inalchemicalsymbols */, + { 9, 185, 6158, 2, 5, UNI_BIDIC } /* isbidic */, + { 3, 1088, 36, 27, 1, UNI_PCM } /* prependedconcatenationmark=t */, + { 0, 7300, 3, 10, 1, -UNI_DIA } /* diacritic=f */, + { 1, 21, 1678, 2, 14, UNI_LATINEXTA } /* inlatinextendeda */, + { 17, 5116, 26, 14, 1, UNI_CI } /* caseignorable=y */, + { 0, 10229, 10289, 3, 3, UNI_DT__SQR } /* dt=sqr */, + { 9, 10229, 2304, 3, 3, UNI_DT__ISO } /* dt=iso */, + { 2, 9979, 7790, 4, 9, UNI_TALU } /* scx=newtailue */, + { 1, 1067, 0, 2, 0, UNI_CASEDLETTER } /* lc */, + { 2, 2593, 3403, 4, 5, UNI_VERTSPACE } /* vertspace */, + { 0, 185, 10398, 2, 2, UNI_ZP } /* iszp */, + { 0, 1274, 0, 21, 0, UNI_ce_values_index } /* compositionexclusion= */, + { 0, 185, 5927, 2, 13, UNI_LOWSURROGATES } /* islowsurrogates */, + { 12, 9476, 8284, 3, 4, UNI_BASS } /* sc=bass */, + { 0, 10268, 9619, 3, 4, UNI_NV__3_SLASH_16 } /* nv=3/16 */, + { 3, 185, 2433, 2, 13, UNI_GLAGOLITICSUP } /* isglagoliticsup */, + { 0, 3481, 0, 11, 0, UNI_TAIXUANJING } /* taixuanjing */, + { 5, 3139, 0, 18, 0, UNI_DEVANAGARIEXT } /* devanagariextended */, + { 6, 2433, 0, 10, 0, UNI_GLAG } /* 
glagolitic */, + { 3, 8782, 2841, 7, 4, UNI_MERO } /* script=mero */, + { 22, 7230, 4521, 12, 13, UNI_BC__BN } /* bidiclass=boundaryneutral */, + { 4, 8782, 9135, 7, 6, UNI_LYDI } /* script=lydian */, + { 0, 2338, 0, 3, 0, UNI_XPOSIXXDIGIT } /* hex */, + { 0, 3175, 0, 17, 0, UNI_EPRES } /* emojipresentation */, + { 14, 2056, 3, 22, 1, -UNI__PERL_NCHAR } /* noncharactercodepoint=f */, + { 1, 10511, 1891, 5, 5, UNI_POSIXUPPER } /* posixupper */, + { 0, 4074, 1, 16, 1, UNI_N } /* generalcategory=n */, + { 6, 185, 44, 3, 15, UNI_CJKCOMPAT } /* iscjkcompatibility */, + { 0, 185, 9069, 2, 6, UNI_GOTH } /* isgothic */, + { 8, 7297, 8357, 3, 7, UNI_HIRA } /* ishiragana */, + { 64, 9691, 1655, 4, 23, UNI_COMPATJAMO } /* blk=hangulcompatibilityjamo */, + { 0, 5875, 9111, 13, 6, UNI_JG__LAMADH } /* joininggroup=lamadh */, + { 2, 5875, 9274, 13, 5, UNI_JG__ALAPH } /* joininggroup=alaph */, + { 12, 185, 9891, 2, 4, UNI_NEWA } /* isnewa */, + { 0, 8782, 9819, 7, 4, UNI_SC__KNDA } /* script=knda */, + { 2, 7360, 4898, 10, 2, UNI_LB__QU } /* linebreak=qu */, + { 0, 10253, 59, 3, 2, UNI_LB__ID } /* lb=id */, + { 3, 8782, 1678, 7, 5, UNI_SC__LATN } /* script=latin */, + { 4, 1592, 3708, 3, 15, UNI_ETHIOPICEXT } /* inethiopicextended */, + { 3, 8372, 0, 8, 0, UNI_JAMOEXTA } /* jamoexta */, + { 9, 9474, 3639, 5, 17, UNI_INSC__CONSONANTPREFIXED } /* insc=consonantprefixed */, + { 0, 1770, 1, 22, 1, UNI_BPT__N } /* bidipairedbrackettype=n */, + { 3, 9476, 3103, 3, 6, UNI_SC__COPT } /* sc=coptic */, + { 1, 5875, 9983, 13, 4, UNI_JG__SEEN } /* joininggroup=seen */, + { 13, 9219, 1, 6, 1, -UNI_XPOSIXUPPER } /* upper=n */, + { 1, 9691, 383, 4, 32, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* blk=egyptianhieroglyphformatcontrols */, + { 9, 383, 0, 32, 0, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* egyptianhieroglyphformatcontrols */, + { 0, 1990, 4879, 22, 15, UNI_INSC__MODIFYINGLETTER } /* indicsyllabiccategory=modifyingletter */, + { 4, 5875, 10220, 13, 3, UNI_JG__BEH } /* joininggroup=beh */, 
+ { 2, 6083, 7924, 13, 8, UNI_NV__1_SLASH_9 } /* numericvalue=1.11e-01 */, + { 1, 9691, 7510, 4, 10, UNI_SMALLFORMS } /* blk=smallforms */, + { 0, 8782, 9482, 7, 4, UNI_PHLI } /* script=phli */, + { 7, 7460, 7951, 10, 1, UNI_IN__3 } /* presentin=3 */, + { 5, 7060, 1026, 11, 2, -UNI_SD } /* softdotted=no */, + { 0, 6350, 18, 12, 1, UNI_JT__R } /* joiningtype=r */, + { 0, 6083, 8913, 13, 6, UNI_NV__400000 } /* numericvalue=400000 */, + { 1, 9711, 8028, 4, 2, UNI_CCC__20 } /* ccc=20 */, + { 0, 8973, 3571, 6, 10, UNI_ALCHEMICAL } /* block=alchemical */, + { 2, 2143, 0, 14, 0, UNI_CJKRADICALSSUP } /* cjkradicalssup */, + { 0, 3121, 10289, 18, 3, UNI_DT__SQR } /* decompositiontype=sqr */, + { 0, 9476, 9129, 3, 4, UNI_LYCI } /* sc=lyci */, + { 19, 8973, 2085, 6, 15, UNI_MODIFIERLETTERS } /* block=modifierletters */, + { 11, 185, 8340, 2, 8, UNI_GUJR } /* isgujarati */, + { 0, 8973, 5270, 6, 6, UNI_KANGXI } /* block=kangxi */, + { 8, 9647, 8036, 4, 3, UNI_AGE__3_DOT_1 } /* age=3.1 */, + { 2, 10553, 10000, 3, 3, UNI_SHRD } /* isshrd */, + { 6, 1218, 0, 2, 0, UNI_SK } /* sk */, + { 2, 4074, 10390, 16, 2, UNI_CASEDLETTER } /* generalcategory=l_ */, + { 16, 10253, 534, 3, 2, UNI_LB__NS } /* lb=ns */, + { 7, 9711, 9360, 5, 4, UNI_CCC__26 } /* ccc=ccc26 */, + { 0, 2312, 1657, 4, 21, UNI_COMPATJAMO } /* inhangulcompatibilityjamo */, + { 9, 10268, 0, 3, 0, UNI_nv_values_index } /* nv= */, + { 1, 185, 1847, 2, 9, UNI_XPOSIXLOWER } /* islowercase */, + { 5, 4972, 2321, 3, 3, UNI_THAI } /* isthai */, + { 9, 8782, 6386, 7, 4, UNI_SC__MAHJ } /* script=mahj */, + { 8, 4346, 0, 16, 0, UNI_PO } /* otherpunctuation */, + { 0, 9979, 8677, 4, 7, UNI_MAND } /* scx=mandaic */, + { 7, 8628, 26, 7, 1, UNI_GRBASE } /* grbase=y */, + { 0, 5093, 10355, 9, 3, UNI_XPOSIXXDIGIT } /* hexdigit=yes */, + { 0, 3877, 9859, 17, 4, UNI_MERC } /* scriptextensions=merc */, + { 0, 10268, 7610, 3, 9, UNI_NV___MINUS_1_SLASH_2 } /* nv=-5.00e-01 */, + { 0, 8881, 81, 4, 33, UNI_ARABICMATH } /* 
isarabicmathematicalalphabeticsymbols */, + { 8, 9979, 7811, 4, 4, UNI_ITAL } /* scx=ital */, + { 0, 1418, 1780, 24, 2, UNI_CCC__BR } /* canonicalcombiningclass=br */, + { 18, 10352, 18, 3, 2, UNI_RI } /* wb=ri */, + { 3, 185, 5522, 2, 14, UNI_SK } /* ismodifiersymbol */, + { 0, 8782, 8292, 7, 4, UNI_SC__BUGI } /* script=bugi */, + { 1, 5606, 0, 14, 0, UNI_PHONETICEXTSUP } /* phoneticextsup */, + { 9, 1792, 0, 21, 0, UNI_CWCF } /* changeswhencasefolded */, + { 0, 5284, 0, 14, 0, UNI_LATINEXTB } /* latinextendedb */, + { 2, 5648, 10355, 14, 3, UNI_QMARK } /* quotationmark=yes */, + { 4, 9474, 1490, 5, 24, UNI_INSC__CONSONANTSUCCEEDINGREPHA } /* insc=consonantsucceedingrepha */, + { 0, 185, 6386, 2, 7, UNI_MAHJONG } /* ismahjong */, + { 5, 8663, 0, 7, 0, UNI_LINA } /* lineara */, + { 0, 9979, 9534, 4, 5, UNI_TAKR } /* scx=takri */, + { 0, 10217, 2473, 3, 20, UNI_BC__LRE } /* bc=lefttorightembedding */, + { 0, 7310, 0, 10, 0, UNI_DIAK } /* divesakuru */, + { 32, 5592, 1, 14, 1, -UNI_PATSYN } /* patternsyntax=n */, + { 0, 6083, 9639, 13, 4, UNI_NV__7_SLASH_12 } /* numericvalue=7/12 */, + { 3, 6719, 0, 11, 0, UNI_CASEDLETTER } /* casedletter */, + { 0, 7360, 74, 10, 2, UNI_EMOD } /* linebreak=em */, + { 2, 1270, 9454, 25, 5, -UNI_COMPEX } /* fullcompositionexclusion=false */, + { 0, 9464, 0, 5, 0, UNI_idst_values_index } /* idst= */, + { 20, 9476, 10027, 3, 4, UNI_TAVT } /* sc=tavt */, + { 1, 4074, 1172, 16, 2, UNI_TITLE } /* generalcategory=lt */, + { 3, 185, 9129, 2, 6, UNI_LYCI } /* islycian */, + { 3, 8782, 6593, 7, 4, UNI_HUNG } /* script=hung */, + { 4, 10268, 8919, 3, 6, UNI_NV__432000 } /* nv=432000 */, + { 2, 185, 9699, 2, 4, UNI_BUHD } /* isbuhd */, + { 1, 10223, 10055, 3, 4, UNI_CI } /* ci=true */, + { 0, 9691, 79, 4, 6, UNI_INARABIC } /* blk=arabic */, + { 1, 185, 1467, 3, 12, UNI_M } /* iscombiningmark */, + { 3, 7360, 1846, 10, 2, UNI_LB__NL } /* linebreak=nl */, + { 9, 10268, 9249, 3, 5, UNI_NV__1_SLASH_160 } /* nv=1/160 */, + { 0, 10516, 1891, 7, 5, 
UNI_POSIXUPPER } /* isposixupper */, + { 0, 185, 511, 3, 19, UNI_CJK } /* iscjkunifiedideographs */, + { 4, 1814, 36, 22, 1, UNI_CWCM } /* changeswhencasemapped=t */, + { 0, 9469, 2479, 5, 5, UNI_INPC__RIGHT } /* inpc=right */, + { 1, 7580, 6278, 10, 12, UNI_WB__EB } /* wordbreak=glueafterzwj */, + { 1, 8656, 0, 7, 0, UNI_KALI } /* kayahli */, + { 2, 8782, 9783, 7, 4, UNI_SC__GURU } /* script=guru */, + { 0, 9691, 2898, 4, 19, UNI_OTTOMANSIYAQNUMBERS } /* blk=ottomansiyaqnumbers */, + { 0, 9476, 8677, 3, 7, UNI_SC__MAND } /* sc=mandaic */, + { 12, 8973, 511, 7, 29, UNI_CJKEXTA } /* block=cjkunifiedideographsextensiona */, + { 1, 5875, 5, 13, 1, UNI_JG__E } /* joininggroup=e */, + { 0, 5875, 2661, 13, 9, UNI_JG__YEHBARREE } /* joininggroup=yehbarree */, + { 2, 10352, 7772, 3, 9, UNI_WB__MB } /* wb=midnumlet */, + { 0, 6083, 7923, 13, 2, UNI_NV__11 } /* numericvalue=11 */, + { 0, 10268, 8179, 3, 2, UNI_NV__36 } /* nv=36 */, + { 1, 9691, 7727, 4, 9, UNI_LATINEXTC } /* blk=latinextc */, + { 2, 21, 3792, 2, 17, UNI_INKHITANSMALLSCRIPT } /* inkhitansmallscript */, + { 0, 9691, 114, 4, 35, UNI_DIACRITICALSFORSYMBOLS } /* blk=combiningdiacriticalmarksforsymbols */, + { 4, 9476, 9799, 3, 4, UNI_HMNP } /* sc=hmnp */, + { 13, 8702, 812, 4, 27, UNI_ENCLOSEDIDEOGRAPHICSUP } /* inenclosedideographicsupplement */, + { 0, 2206, 36, 21, 1, UNI_GCB__T } /* graphemeclusterbreak=t */, + { 2, 10547, 0, 4, 0, UNI_PE } /* ispe */, + { 0, 185, 8656, 2, 7, UNI_KALI } /* iskayahli */, + { 7, 8782, 1166, 9, 2, UNI_SC__SHRD } /* script=shrd */, + { 0, 9691, 1034, 4, 11, UNI_ENCLOSEDCJK } /* blk=enclosedcjk */, + { 0, 8973, 5340, 6, 14, UNI_LATINEXTF } /* block=latinextendedf */, + { 1, 1880, 0, 21, 0, UNI_CWU } /* changeswhenuppercased */, + { 0, 1553, 7, 9, 1, UNI_C } /* category=c */, + { 2, 4714, 3, 15, 1, -UNI_GREXT } /* graphemeextend=f */, + { 5, 7844, 0, 4, 0, UNI_PALM } /* palm */, + { 4, 3877, 9284, 17, 5, UNI_BATK } /* scriptextensions=batak */, + { 0, 9545, 26, 4, 1, UNI_IDC } /* 
idc=y */, + { 0, 9691, 2633, 5, 5, UNI_INBRAHMI } /* blk=brahmi */, + { 20, 6340, 631, 3, 29, UNI_CJKEXTE } /* incjkunifiedideographsextensione */, + { 2, 2593, 0, 20, 1, UNI_VO__U } /* verticalorientation=u */, + { 0, 9469, 6615, 3, 7, UNI_PHAISTOS } /* inphaistos */, + { 6, 8973, 4186, 6, 16, UNI_LINEARBIDEOGRAMS } /* block=linearbideograms */, + { 11, 185, 7862, 2, 9, UNI_SAMR } /* issamaritan */, + { 4, 2746, 0, 10, 0, UNI_JAMO } /* hanguljamo */, + { 16, 6338, 26, 12, 1, UNI_JOINC } /* joincontrol=y */, + { 5, 5875, 6432, 13, 5, UNI_JG__GAMAL } /* joininggroup=gamal */, + { 0, 4972, 4259, 3, 3, UNI_TNSA } /* istnsa */, + { 1, 9213, 36, 6, 1, UNI_UIDEO } /* uideo=t */, + { 2, 8973, 2993, 6, 19, UNI_SUPARROWSC } /* block=supplementalarrowsc */, + { 1, 9691, 9295, 5, 4, UNI_INBUHID } /* blk=buhid */, + { 0, 9979, 6290, 4, 12, UNI_GONG } /* scx=gunjalagondi */, + { 2, 3894, 9454, 17, 5, -UNI_STERM } /* sentenceterminal=false */, + { 0, 9476, 10015, 3, 4, UNI_SC__TALE } /* sc=tale */, + { 1, 9691, 7211, 5, 9, UNI_ASCII } /* blk=basiclatin */, + { 0, 7460, 10337, 10, 3, UNI_IN__7 } /* presentin=v70 */, + { 0, 21, 9135, 2, 6, UNI_INLYDIAN } /* inlydian */, + { 21, 4909, 10355, 15, 3, UNI_DT__NONE } /* nfkdquickcheck=yes */, + { 9, 10268, 7611, 3, 8, UNI_NV__1_SLASH_2 } /* nv=5.00e-01 */, + { 0, 9695, 6001, 4, 4, UNI_BPT__N } /* bpt=none */, + { 6, 185, 6752, 2, 6, UNI_DOMINO } /* isdomino */, + { 2, 9476, 9444, 3, 5, UNI_SC__DOGR } /* sc=dogra */, + { 3, 21, 9117, 2, 6, UNI_INLEPCHA } /* inlepcha */, + { 8, 9979, 9105, 4, 4, UNI_KHOJ } /* scx=khoj */, + { 0, 9907, 0, 4, 0, UNI_OLCK } /* olck */, + { 0, 9691, 1061, 4, 27, UNI_OCR } /* blk=opticalcharacterrecognition */, + { 3, 185, 4849, 2, 15, UNI_MERC } /* ismeroiticcursive */, + { 0, 9476, 498, 5, 3, UNI_KHMR } /* sc=khmer */, + { 1, 185, 2690, 3, 10, UNI_COUNTINGROD } /* iscountingrod */, + { 1, 9979, 9482, 4, 4, UNI_PHLI } /* scx=phli */, + { 0, 21, 5354, 2, 14, UNI_LATINEXTG } /* inlatinextendedg */, + { 2, 
9979, 2433, 4, 10, UNI_GLAG } /* scx=glagolitic */, + { 1, 9063, 1026, 6, 2, -UNI_EPRES } /* epres=no */, + { 1, 10247, 2661, 3, 3, UNI_JG__YEH } /* jg=yeh */, + { 2, 10253, 1775, 3, 2, UNI_LB__AI } /* lb=ai */, + { 0, 8782, 9081, 7, 4, UNI_HATR } /* script=hatr */, + { 6, 9979, 2879, 4, 9, UNI_MONG } /* scx=mongolian */, + { 1, 6578, 0, 12, 0, UNI_nt_values_index } /* numerictype= */, + { 0, 9691, 1946, 4, 22, UNI_DIACRITICALSFORSYMBOLS } /* blk=diacriticalsforsymbols */, + { 0, 7460, 10340, 10, 3, UNI_IN__8 } /* presentin=v80 */, + { 1, 133, 0, 2, 0, UNI_LM } /* lm */, + { 8, 5875, 6031, 13, 13, UNI_JG__MANICHAEANWAW } /* joininggroup=manichaeanwaw */, + { 21, 1990, 0, 22, 0, UNI_insc_values_index } /* indicsyllabiccategory= */, + { 1, 10244, 3382, 3, 9, UNI_Z } /* gc=separator */, + { 0, 2784, 5717, 19, 2, UNI_LB__H2 } /* hangulsyllabletype=lv */, + { 65, 9979, 7655, 4, 9, UNI_BHKS } /* scx=bhaiksuki */, + { 1, 10247, 4789, 3, 15, UNI_JG__MANICHAEANALEPH } /* jg=manichaeanaleph */, + { 13, 9691, 6626, 4, 12, UNI_PLAYINGCARDS } /* blk=playingcards */, + { 0, 9476, 9863, 3, 4, UNI_MIAO } /* sc=miao */, + { 16, 9979, 8866, 4, 4, UNI_TIRH } /* scx=tirh */, + { 3, 9123, 10055, 6, 4, UNI_XPOSIXLOWER } /* lower=true */, + { 1, 1167, 9454, 26, 5, -UNI_DI } /* defaultignorablecodepoint=false */, + { 1, 7460, 10190, 10, 3, UNI_IN__5_DOT_2 } /* presentin=5.2 */, + { 1, 3877, 9887, 17, 4, UNI_NBAT } /* scriptextensions=nbat */, + { 10, 1990, 4579, 22, 15, UNI_INSC__CONSONANTMEDIAL } /* indicsyllabiccategory=consonantmedial */, + { 10, 9979, 2085, 4, 4, UNI_MODI } /* scx=modi */, + { 0, 1418, 41, 24, 2, UNI_CCC__DA } /* canonicalcombiningclass=da */, + { 1, 187, 0, 2, 0, UNI_CE } /* ce */, + { 34, 8973, 79, 6, 35, UNI_ARABICMATH } /* block=arabicmathematicalalphabeticsymbols */, + { 1, 9935, 0, 4, 0, UNI_PHNX } /* phnx */, + { 1, 9711, 10154, 4, 3, UNI_CCC__R } /* ccc=226 */, + { 0, 9691, 2164, 4, 21, UNI_CYRILLICSUP } /* blk=cyrillicsupplementary */, + { 1, 185, 9755, 2, 4, 
UNI_DSRT } /* isdsrt */, + { 1, 9979, 10115, 4, 4, UNI_QAAI } /* scx=zinh */, + { 8, 6340, 2144, 3, 20, UNI_CJKRADICALSSUP } /* incjkradicalssupplement */, + { 81, 9763, 1088, 4, 7, UNI_GCB__PP } /* gcb=prepend */, + { 18, 4154, 25, 3, 1, UNI_INVS } /* invs */, + { 5, 21, 3809, 2, 17, UNI_LETTERLIKESYMBOLS } /* inletterlikesymbols */, + { 16, 9476, 6494, 3, 12, UNI_SC__GONM } /* sc=masaramgondi */, + { 0, 7360, 6096, 10, 13, UNI_LB__PR } /* linebreak=prefixnumeric */, + { 0, 5592, 9454, 14, 5, -UNI_PATSYN } /* patternsyntax=false */, + { 32, 185, 9034, 3, 5, UNI_CAKM } /* ischakma */, + { 37, 4330, 0, 16, 0, UNI_MYANMAREXTB } /* myanmarextendedb */, + { 1, 8782, 9484, 7, 4, UNI_SC__LIMB } /* script=limb */, + { 6, 9476, 9069, 3, 6, UNI_GOTH } /* sc=gothic */, + { 0, 6083, 7947, 13, 2, UNI_NV__21 } /* numericvalue=21 */, + { 3, 9979, 9679, 4, 4, UNI_AVST } /* scx=avst */, + { 12, 4074, 107, 16, 6, UNI_S } /* generalcategory=symbol */, + { 0, 3319, 0, 18, 0, UNI_LATINEXTADDITIONAL } /* latinextadditional */, + { 0, 8973, 4474, 6, 15, UNI_ARABICEXTA } /* block=arabicextendeda */, + { 2, 7467, 10190, 3, 3, UNI_IN__5_DOT_2 } /* in=5.2 */, + { 0, 10244, 75, 3, 2, UNI_ME } /* gc=me */, + { 10, 185, 2165, 3, 10, UNI_CYRILLICSUP } /* iscyrillicsup */, + { 0, 3553, 3, 18, 1, -UNI_VS } /* variationselector=f */, + { 0, 9474, 3085, 5, 18, UNI_INSC__CONSONANTSUBJOINED } /* insc=consonantsubjoined */, + { 2, 10223, 1, 3, 1, -UNI_CI } /* ci=n */, + { 9, 185, 8559, 3, 6, UNI_CJKEXTC } /* iscjkextc */, + { 4, 5797, 0, 13, 0, UNI_XPOSIXDIGIT } /* decimalnumber */, + { 17, 9979, 9835, 4, 4, UNI_LATN } /* scx=latn */, + { 4, 185, 3050, 3, 17, UNI_CHEROKEESUP } /* ischerokeesupplement */, + { 3, 9469, 869, 3, 10, UNI_PHONETICEXT } /* inphoneticext */, + { 2, 8973, 8284, 6, 8, UNI_INBASSAVAH } /* block=bassavah */, + { 1, 185, 2632, 2, 6, UNI_BRAH } /* isbrahmi */, + { 8, 185, 4534, 2, 4, UNI_BRAI } /* isbrai */, + { 32, 9469, 5607, 3, 13, UNI_PHONETICEXTSUP } /* inphoneticextsup */, + 
{ 0, 9469, 869, 3, 27, UNI_PHONETICEXTSUP } /* inphoneticextensionssupplement */, + { 4, 3121, 46, 18, 6, UNI_DT__COM } /* decompositiontype=compat */, + { 11, 9711, 9330, 5, 4, UNI_CCC__20 } /* ccc=ccc20 */, + { 4, 10253, 203, 3, 2, UNI_LB__SA } /* lb=sa */, + { 1, 9177, 3, 6, 1, -UNI_QMARK } /* qmark=f */, + { 1, 9051, 3, 6, 1, -UNI_ECOMP } /* ecomp=f */, + { 98, 10253, 867, 3, 2, UNI_LB__SP } /* lb=sp */, + { 0, 8782, 3978, 7, 4, UNI_SC__BOPO } /* script=bopo */, + { 0, 8782, 720, 7, 9, UNI_XSUX } /* script=cuneiform */, + { 5, 6675, 10355, 11, 3, UNI_IDC } /* idcontinue=yes */, + { 0, 9461, 752, 3, 2, UNI_SB__CL } /* sb=cl */, + { 34, 185, 7510, 2, 10, UNI_SMALLFORMS } /* issmallforms */, + { 23, 8973, 2690, 7, 10, UNI_COUNTINGROD } /* block=countingrod */, + { 1, 6083, 8949, 13, 6, UNI_NV__900000 } /* numericvalue=900000 */, + { 0, 10511, 97, 5, 5, UNI_POSIXALPHA } /* posixalpha */, + { 8, 4639, 0, 15, 0, UNI_PD } /* dashpunctuation */, + { 8, 9544, 0, 5, 0, UNI_xidc_values_index } /* xidc= */, + { 8, 1538, 6734, 3, 5, UNI_DOMINO } /* indomino */, + { 1, 9476, 9509, 3, 5, UNI_OGAM } /* sc=ogham */, + { 0, 185, 6219, 3, 11, UNI_CYRILLICEXTC } /* iscyrillicextc */, + { 19, 9979, 7330, 4, 4, UNI_KHAR } /* scx=khar */, + { 0, 10247, 6446, 3, 12, UNI_JG__MALAYALAMNYA } /* jg=malayalamnya */, + { 3, 9711, 3596, 4, 9, UNI_CCC__BL } /* ccc=belowleft */, + { 0, 7160, 10104, 3, 3, UNI_YI } /* isyiii */, + { 3, 5875, 6005, 13, 13, UNI_JG__MANICHAEANTAW } /* joininggroup=manichaeantaw */, + { 8, 185, 1219, 2, 26, UNI_KATAKANAEXT } /* iskatakanaphoneticextensions */, + { 0, 9691, 896, 4, 28, UNI_SUPPUAA } /* blk=supplementaryprivateuseareaa */, + { 0, 1190, 496, 3, 2, UNI_NT__NU } /* nt=nu */, + { 3, 185, 4314, 2, 16, UNI_MYANMAREXTA } /* ismyanmarextendeda */, + { 4, 9763, 1195, 4, 2, UNI_LB__LF } /* gcb=lf */, + { 17, 10268, 9571, 3, 3, UNI_NV__1_SLASH_4 } /* nv=1/4 */, + { 2, 8740, 0, 7, 0, UNI_OLCK } /* olchiki */, + { 0, 9711, 8992, 5, 5, UNI_CCC__107 } /* ccc=ccc107 
*/, + { 2, 185, 2936, 2, 19, UNI_SUNDANESESUP } /* issundanesesupplement */, + { 0, 185, 2269, 2, 21, UNI_MEETEIMAYEKEXT } /* ismeeteimayekextensions */, + { 4, 9691, 1678, 4, 14, UNI_LATINEXTA } /* blk=latinextendeda */, + { 3, 3877, 5634, 17, 14, UNI_PHLP } /* scriptextensions=psalterpahlavi */, + { 1, 6950, 0, 11, 0, UNI_MYANMAREXTA } /* myanmarexta */, + { 1, 8881, 1396, 4, 22, UNI_ARABICPFB } /* isarabicpresentationformsb */, + { 19, 185, 8684, 2, 7, UNI_MARC } /* ismarchen */, + { 11, 10253, 6302, 3, 12, UNI_LB__HL } /* lb=hebrewletter */, + { 2, 9691, 9524, 4, 5, UNI_INRUNIC } /* blk=runic */, + { 0, 9691, 8348, 4, 8, UNI_INGURMUKHI } /* blk=gurmukhi */, + { 2, 10268, 8903, 3, 2, UNI_NV__60 } /* nv=60 */, + { 3, 1814, 1, 22, 1, -UNI_CWCM } /* changeswhencasemapped=n */, + { 0, 9847, 0, 3, 0, UNI_LOE } /* loe */, + { 0, 21, 3445, 2, 4, UNI_RUMI } /* inrumi */, + { 9, 6937, 207, 6, 11, UNI_MISCPICTOGRAPHS } /* inmiscpictographs */, + { 4, 9171, 10055, 6, 4, UNI__PERL_PATWS } /* patws=true */, + { 3, 7467, 10199, 3, 3, UNI_IN__6_DOT_1 } /* in=6.1 */, + { 13, 2808, 7648, 4, 7, UNI_ARABICPFB } /* inarabicpfb */, + { 24, 9691, 9201, 4, 6, UNI_INTELUGU } /* blk=telugu */, + { 0, 9979, 8845, 4, 7, UNI_TAVT } /* scx=taiviet */, + { 0, 9979, 9129, 4, 4, UNI_LYCI } /* scx=lyci */, + { 1, 185, 1443, 3, 23, UNI_CJKSYMBOLS } /* iscjksymbolsandpunctuation */, + { 0, 4442, 0, 9, 0, UNI_TANGUTSUP } /* tangutsup */, + { 0, 9691, 3707, 4, 11, UNI_ETHIOPICEXT } /* blk=ethiopicext */, + { 1, 8444, 3, 8, 1, -UNI_RADICAL } /* radical=f */, + { 8, 2593, 472, 20, 2, UNI_VO__TU } /* verticalorientation=tu */, + { 2, 8782, 6972, 7, 4, UNI_SC__NAND } /* script=nand */, + { 50, 9711, 9415, 5, 4, UNI_CCC__84 } /* ccc=ccc84 */, + { 1, 185, 3319, 2, 18, UNI_LATINEXTADDITIONAL } /* islatinextadditional */, + { 8, 8973, 10083, 6, 3, UNI_INVAI } /* block=vai */, + { 0, 185, 5029, 2, 15, UNI_VEDICEXT } /* isvedicextensions */, + { 2, 9691, 5130, 4, 14, UNI_CJKCOMPATFORMS } /* 
blk=cjkcompatforms */, + { 2, 6083, 8102, 13, 2, UNI_NV__17 } /* numericvalue=17 */, + { 1, 34, 0, 3, 0, UNI_EXT } /* ext */, + { 1, 8593, 3, 7, 1, -UNI_COMPEX } /* compex=f */, + { 0, 8881, 728, 4, 2, UNI_ARMN } /* isarmn */, + { 0, 10456, 10440, 14, 11, UNI__PERL_FOLDS_TO_MULTI_CHAR } /* _perl_folds_to_multi_char */, + { 17, 7230, 0, 11, 0, UNI_BC__B } /* bidiclass=b */, + { 4, 9469, 7017, 3, 10, UNI_INPAHAWHHMONG } /* inpahawhhmong */, + { 2, 9691, 329, 4, 21, UNI_MATHOPERATORS } /* blk=mathematicaloperators */, + { 0, 2312, 8357, 3, 7, UNI_INHIRAGANA } /* inhiragana */, + { 0, 9691, 862, 4, 6, UNI_ARROWS } /* blk=arrows */, + { 1, 10229, 4058, 3, 3, UNI_DT__FIN } /* dt=fin */, + { 2, 6340, 721, 3, 8, UNI_INCUNEIFORM } /* incuneiform */, + { 3, 7218, 8285, 3, 7, UNI_INBASSAVAH } /* inbassavah */, + { 1, 9474, 4458, 5, 5, UNI_INSC__VOWEL } /* insc=vowel */, + { 1, 5875, 4834, 13, 15, UNI_JG__MANICHAEANZAYIN } /* joininggroup=manichaeanzayin */, + { 0, 9691, 4314, 4, 16, UNI_MYANMAREXTA } /* blk=myanmarextendeda */, + { 1, 7552, 0, 8, 0, UNI_ASSIGNED } /* assigned */, + { 1, 8973, 7520, 6, 10, UNI_SUPARROWSA } /* block=suparrowsa */, + { 1, 1418, 7320, 24, 10, UNI_CCC__6 } /* canonicalcombiningclass=hanreading */, + { 4, 6083, 5733, 13, 1, UNI_NV__0 } /* numericvalue=0 */, + { 0, 6340, 4625, 3, 14, UNI_CURRENCYSYMBOLS } /* incurrencysymbols */, + { 0, 10247, 6470, 3, 12, UNI_JG__MALAYALAMTTA } /* jg=malayalamtta */, + { 0, 5823, 36, 13, 1, UNI_GRBASE } /* graphemebase=t */, + { 1, 9731, 3, 4, 1, -UNI_CWT } /* cwt=f */, + { 1, 10516, 0, 4, 0, UNI_PO } /* ispo */, + { 0, 9549, 26, 5, 1, UNI_XIDS } /* xids=y */, + { 0, 8973, 691, 7, 29, UNI_CJKEXTG } /* block=cjkunifiedideographsextensiong */, + { 2, 185, 7580, 2, 4, UNI_XPOSIXWORD } /* isword */, + { 0, 9213, 1, 6, 1, -UNI_UIDEO } /* uideo=n */, + { 8, 5875, 5424, 13, 14, UNI_JG__MANICHAEANFIVE } /* joininggroup=manichaeanfive */, + { 1, 3571, 0, 10, 0, UNI_ALCHEMICAL } /* alchemical */, + { 10, 8973, 1678, 6, 14, 
UNI_LATINEXTA } /* block=latinextendeda */, + { 1, 4624, 0, 14, 0, UNI_SC } /* currencysymbol */, + { 0, 9979, 8607, 4, 4, UNI_ELBA } /* scx=elba */, + { 0, 9979, 9444, 4, 4, UNI_DOGR } /* scx=dogr */, + { 4, 720, 0, 16, 0, UNI_CUNEIFORMNUMBERS } /* cuneiformnumbers */, + { 2, 9747, 1026, 4, 2, -UNI_DIA } /* dia=no */, + { 0, 10268, 10181, 3, 3, UNI_NV__3_SLASH_5 } /* nv=3/5 */, + { 1, 185, 9967, 2, 4, UNI_RUNR } /* isrunr */, + { 1, 8973, 7727, 6, 9, UNI_LATINEXTC } /* block=latinextc */, + { 7, 317, 0, 33, 0, UNI_SUPMATHOPERATORS } /* supplementalmathematicaloperators */, + { 0, 8782, 9859, 7, 4, UNI_MERC } /* script=merc */, + { 5, 4744, 0, 15, 0, UNI_identifiertype_values_index } /* identifiertype= */, + { 3, 9711, 9417, 4, 2, UNI_CCC__84 } /* ccc=84 */, + { 0, 8782, 1223, 7, 4, UNI_SC__KANA } /* script=kana */, + { 10, 4847, 2271, 4, 9, UNI_INMEETEIMAYEK } /* inmeeteimayek */, + { 17, 6083, 9407, 13, 2, UNI_NV__35 } /* numericvalue=35 */, + { 1, 10247, 10107, 3, 4, UNI_JG__ZAIN } /* jg=zain */, + { 48, 185, 5823, 2, 12, UNI_GRBASE } /* isgraphemebase */, + { 10, 3283, 1, 18, 1, -UNI_IDSB } /* idsbinaryoperator=n */, + { 11, 8973, 2746, 6, 19, UNI_JAMOEXTA } /* block=hanguljamoextendeda */, + { 1, 6529, 3356, 3, 17, UNI_ORNAMENTALDINGBATS } /* inornamentaldingbats */, + { 2, 8979, 0, 6, 0, UNI_CARI } /* carian */, + { 41, 6083, 8937, 13, 2, UNI_NV__70 } /* numericvalue=70 */, + { 0, 6972, 0, 4, 0, UNI_NAND } /* nand */, + { 1, 8782, 2227, 7, 14, UNI_SC__ROHG } /* script=hanifirohingya */, + { 1, 9476, 8740, 3, 7, UNI_OLCK } /* sc=olchiki */, + { 8, 3175, 26, 18, 1, UNI_EPRES } /* emojipresentation=y */, + { 2, 4474, 0, 15, 0, UNI_ARABICEXTA } /* arabicextendeda */, + { 0, 4074, 7005, 16, 11, UNI_SO } /* generalcategory=othersymbol */, + { 1, 8973, 1632, 6, 23, UNI_GEOMETRICSHAPESEXT } /* block=geometricshapesextended */, + { 0, 3877, 8607, 17, 7, UNI_ELBA } /* scriptextensions=elbasan */, + { 1, 1418, 3596, 24, 9, UNI_CCC__BL } /* 
canonicalcombiningclass=belowleft */, + { 4, 7360, 396, 10, 2, UNI_LB__GL } /* linebreak=gl */, + { 1, 1418, 9385, 25, 4, UNI_CCC__31 } /* canonicalcombiningclass=ccc31 */, + { 5, 6083, 8925, 13, 5, UNI_NV__50000 } /* numericvalue=50000 */, + { 0, 10352, 2468, 3, 2, UNI_LB__HL } /* wb=hl */, + { 0, 7580, 6287, 10, 3, UNI_LB__ZWJ } /* wordbreak=zwj */, + { 3, 9691, 2955, 4, 19, UNI_SUPARROWSA } /* blk=supplementalarrowsa */, + { 1, 5045, 8493, 3, 7, UNI_UCASEXTA } /* isucasexta */, + { 0, 9691, 1295, 4, 25, UNI_SUPERANDSUB } /* blk=superscriptsandsubscripts */, + { 2, 4972, 4443, 3, 15, UNI_TANGUTSUP } /* istangutsupplement */, + { 0, 46, 0, 2, 0, UNI_CO } /* co */, + { 0, 18, 0, 2, 0, UNI_RI } /* ri */, + { 0, 3877, 9835, 17, 4, UNI_LATN } /* scriptextensions=latn */, + { 13, 5662, 0, 14, 0, UNI_sb_values_index } /* sentencebreak= */, + { 26, 8973, 868, 6, 11, UNI_PHONETICEXT } /* block=phoneticext */, + { 0, 6842, 3922, 4, 4, UNI_INCARIAN } /* incarian */, + { 0, 5875, 8324, 13, 8, UNI_JG__FARSIYEH } /* joininggroup=farsiyeh */, + { 0, 7460, 10211, 10, 3, UNI_IN__9 } /* presentin=9.0 */, + { 4, 2808, 864, 4, 4, UNI_ARROWS } /* inarrows */, + { 0, 8973, 9117, 6, 6, UNI_INLEPCHA } /* block=lepcha */, + { 2, 9971, 0, 4, 0, UNI_SAMR } /* samr */, + { 0, 185, 2123, 3, 20, UNI_CJKCOMPATFORMS } /* iscjkcompatibilityforms */, + { 2, 3877, 2312, 18, 3, UNI_SINH } /* scriptextensions=sinh */, + { 1, 2248, 2079, 3, 21, UNI_MODIFIERLETTERS } /* inspacingmodifierletters */, + { 1, 6340, 3837, 3, 3, UNI_INCHAM } /* incham */, + { 2, 9711, 7995, 4, 2, UNI_CCC__12 } /* ccc=12 */, + { 0, 9461, 401, 3, 6, UNI_SB__FO } /* sb=format */, + { 0, 8881, 7648, 4, 7, UNI_ARABICPFB } /* isarabicpfb */, + { 8, 10268, 10370, 3, 2, UNI_NV__48 } /* nv=48 */, + { 2, 6083, 9367, 13, 2, UNI_NV__27 } /* numericvalue=27 */, + { 2, 8973, 0, 6, 0, UNI_blk_values_index } /* block= */, + { 12, 8973, 7709, 6, 9, UNI_INKHUDAWADI } /* block=khudawadi */, + { 0, 9691, 1946, 4, 12, UNI_DIACRITICALS } /* 
blk=diacriticals */, + { 7, 32, 0, 2, 0, UNI__PERL_SURROGATE } /* cs */, + { 3, 9476, 7433, 3, 7, UNI_SC__SOGD } /* sc=sogdian */, + { 0, 2206, 1934, 21, 2, UNI_GCB__CN } /* graphemeclusterbreak=cn */, + { 20, 9711, 8998, 5, 4, UNI_CCC__11 } /* ccc=ccc11 */, + { 1, 9979, 4504, 4, 5, UNI_BAMU } /* scx=bamum */, + { 3, 10223, 36, 3, 1, UNI_CI } /* ci=t */, + { 0, 8782, 9867, 7, 4, UNI_SC__MLYM } /* script=mlym */, + { 2, 7460, 10301, 10, 3, UNI_IN__3 } /* presentin=v30 */, + { 0, 2100, 0, 15, 0, UNI_TRANSPORTANDMAP } /* transportandmap */, + { 1, 9476, 9207, 3, 4, UNI_SC__THAA } /* sc=thaa */, + { 0, 185, 5592, 2, 13, UNI_PATSYN } /* ispatternsyntax */, + { 16, 3877, 9931, 17, 4, UNI_PHLP } /* scriptextensions=phlp */, + { 0, 2185, 3, 21, 1, -UNI_EXTPICT } /* extendedpictographic=f */, + { 1, 7460, 7924, 10, 3, UNI_IN__1_DOT_1 } /* presentin=1.1 */, + { 12, 185, 8573, 3, 6, UNI_CJKEXTE } /* iscjkexte */, + { 0, 9691, 6362, 4, 5, UNI_INKHMER } /* blk=khmer */, + { 5, 185, 3707, 2, 11, UNI_ETHIOPICEXT } /* isethiopicext */, + { 11, 7190, 0, 10, 0, UNI_ARABICEXTA } /* arabicexta */, + { 5, 4074, 401, 16, 6, UNI_CF } /* generalcategory=format */, + { 0, 1418, 9499, 24, 5, UNI_CCC__7 } /* canonicalcombiningclass=nukta */, + { 0, 9476, 7310, 3, 10, UNI_DIAK } /* sc=divesakuru */, + { 2, 4847, 8692, 3, 6, UNI_INMULTANI } /* inmultani */, + { 3, 1990, 1245, 22, 9, UNI_INSC__CONSONANT } /* indicsyllabiccategory=consonant */, + { 8, 1418, 8, 24, 1, UNI_CCC__A } /* canonicalcombiningclass=a */, + { 2, 9189, 1, 6, 1, -UNI_STERM } /* sterm=n */, + { 0, 9979, 9264, 4, 5, UNI_ADLM } /* scx=adlam */, + { 0, 21, 9099, 2, 6, UNI_KANBUN } /* inkanbun */, + { 6, 5093, 0, 8, 0, UNI_XPOSIXXDIGIT } /* hexdigit */, + { 2, 5830, 10055, 6, 4, UNI_EBASE } /* ebase=true */, + { 33, 9476, 0, 3, 0, UNI_sc_values_index } /* sc= */, + { 4, 7460, 10079, 10, 4, UNI_IN__14 } /* presentin=v140 */, + { 8, 3403, 10055, 6, 4, UNI_XPOSIXSPACE } /* space=true */, + { 0, 9269, 1026, 5, 2, -UNI_POSIXXDIGIT } 
/* ahex=no */, + { 0, 9691, 1632, 4, 15, UNI_GEOMETRICSHAPES } /* blk=geometricshapes */, + { 2, 5172, 0, 14, 0, UNI_emod_values_index } /* emojimodifier= */, + { 0, 4598, 3250, 5, 15, UNI_INPUNCTUATION } /* ingeneralpunctuation */, + { 2, 1792, 36, 22, 1, UNI_CWCF } /* changeswhencasefolded=t */, + { 1, 21, 5368, 2, 14, UNI_LISUSUP } /* inlisusupplement */, + { 9, 8973, 4202, 6, 16, UNI_LINEARBSYLLABARY } /* block=linearbsyllabary */, + { 16, 9691, 5088, 4, 5, UNI_ASCII } /* blk=ascii */, + { 3, 728, 0, 2, 0, UNI_MN } /* mn */, + { 2, 7580, 34, 10, 6, UNI_WB__EXTEND } /* wordbreak=extend */, + { 0, 8973, 2269, 6, 14, UNI_MEETEIMAYEKEXT } /* block=meeteimayekext */, + { 1, 10516, 10529, 3, 4, UNI_XPOSIXPRINT } /* isprint */, + { 1, 6083, 10184, 13, 3, UNI_NV__4_SLASH_5 } /* numericvalue=4/5 */, + { 1, 3877, 7820, 17, 4, UNI_PERM } /* scriptextensions=perm */, + { 1, 9691, 4298, 4, 16, UNI_MISCMATHSYMBOLSB } /* blk=miscmathsymbolsb */, + { 0, 8973, 1586, 6, 23, UNI_BYZANTINEMUSIC } /* block=byzantinemusicalsymbols */, + { 2, 185, 7271, 3, 9, UNI_CJKSTROKES } /* iscjkstrokes */, + { 3, 2312, 2748, 4, 8, UNI_JAMO } /* inhanguljamo */, + { 1, 10247, 6015, 3, 3, UNI_JG__TAW } /* jg=taw */, + { 3, 4410, 0, 16, 0, UNI_SYRIACSUP } /* syriacsupplement */, + { 3, 9189, 0, 6, 0, UNI_sterm_values_index } /* sterm= */, + { 0, 9691, 2689, 4, 19, UNI_COUNTINGROD } /* blk=countingrodnumerals */, + { 0, 4074, 1045, 16, 6, UNI_L } /* generalcategory=letter */, + { 0, 10516, 7349, 3, 3, UNI_PHLI } /* isphli */, + { 3, 10253, 909, 3, 2, UNI_LB__PR } /* lb=pr */, + { 4, 185, 1116, 3, 24, UNI_CWKCF } /* ischangeswhennfkccasefolded */, + { 1, 2185, 9454, 21, 5, -UNI_EXTPICT } /* extendedpictographic=false */, + { 17, 9476, 4984, 3, 5, UNI_SC__TAML } /* sc=tamil */, + { 0, 9979, 6928, 4, 11, UNI_MEDF } /* scx=medefaidrin */, + { 0, 10244, 263, 3, 2, UNI_SM } /* gc=sm */, + { 0, 2808, 29, 4, 4, UNI_INARABIC } /* inarabic */, + { 6, 9979, 2248, 4, 21, UNI_PRTI } /* scx=inscriptionalparthian 
*/, + { 1, 6338, 3, 12, 1, -UNI_JOINC } /* joincontrol=f */, + { 0, 10268, 7988, 3, 8, UNI_NV__3_SLASH_16 } /* nv=1.88e-01 */, + { 4, 8782, 8420, 7, 8, UNI_SC__MAHJ } /* script=mahajani */, + { 2, 6697, 0, 11, 0, UNI_alpha_values_index } /* alphabetic= */, + { 2, 5088, 10055, 14, 4, UNI_POSIXXDIGIT } /* asciihexdigit=true */, + { 0, 9691, 7646, 4, 9, UNI_ARABICPFB } /* blk=arabicpfb */, + { 1, 9544, 3, 5, 1, -UNI_XIDC } /* xidc=f */, + { 0, 2553, 9454, 20, 5, -UNI_TERM } /* terminalpunctuation=false */, + { 0, 9691, 540, 4, 30, UNI_CJKEXTB } /* blk=cjkunifiedideographsextensionb */, + { 1, 5875, 5704, 13, 10, UNI_JG__TEHMARBUTA } /* joininggroup=tehmarbuta */, + { 2, 7370, 10055, 10, 4, UNI_XPOSIXLOWER } /* lowercase=true */, + { 1, 5045, 1892, 3, 4, UNI_XPOSIXUPPER } /* isupper */, + { 1, 3877, 720, 17, 9, UNI_XSUX } /* scriptextensions=cuneiform */, + { 0, 8973, 810, 6, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* block=enclosedideographicsup */, + { 0, 5634, 0, 14, 0, UNI_PHLP } /* psalterpahlavi */, + { 3, 9979, 2227, 4, 4, UNI_HAN } /* scx=hani */, + { 8, 3049, 0, 18, 0, UNI_CHEROKEESUP } /* cherokeesupplement */, + { 0, 9711, 1180, 4, 2, UNI_CCC__BL } /* ccc=bl */, + { 1, 9464, 3, 5, 1, -UNI_IDST } /* idst=f */, + { 1, 21, 5901, 2, 13, UNI_KANAEXTB } /* inkanaextendedb */, + { 0, 9979, 9484, 4, 4, UNI_LIMB } /* scx=limb */, + { 1, 9439, 36, 5, 1, UNI_DASH } /* dash=t */, + { 0, 9476, 3193, 3, 8, UNI_ETHI } /* sc=ethiopic */, + { 0, 3877, 9771, 17, 4, UNI_GONM } /* scriptextensions=gonm */, + { 0, 8712, 0, 7, 0, UNI_nfkdqc_values_index } /* nfkdqc= */, + { 8, 8973, 8817, 6, 7, UNI_SUPPUAA } /* block=suppuaa */, + { 3, 10516, 2, 3, 1, UNI_PI } /* ispi */, + { 0, 1418, 9325, 25, 4, UNI_CCC__19 } /* canonicalcombiningclass=ccc19 */, + { 4, 7230, 6134, 10, 12, UNI_BC__AL } /* bidiclass=arabicletter */, + { 0, 7297, 1656, 3, 5, UNI_HANG } /* ishangul */, + { 8, 8973, 8492, 6, 7, UNI_UCASEXT } /* block=ucasext */, + { 0, 2292, 0, 2, 0, UNI_PD } /* pd */, + { 29, 8782, 8292, 
7, 8, UNI_SC__BUGI } /* script=buginese */, + { 0, 8973, 3707, 6, 11, UNI_ETHIOPICEXT } /* block=ethiopicext */, + { 9, 6083, 8156, 13, 8, UNI_NV__5_SLASH_8 } /* numericvalue=6.25e-01 */, + { 2, 1061, 0, 27, 0, UNI_OCR } /* opticalcharacterrecognition */, + { 2, 9979, 9895, 4, 4, UNI_NKO } /* scx=nkoo */, + { 11, 7560, 1, 10, 1, -UNI_XPOSIXUPPER } /* uppercase=n */, + { 10, 6083, 7975, 13, 1, UNI_NV__6 } /* numericvalue=6 */, + { 4, 1418, 9355, 25, 4, UNI_CCC__25 } /* canonicalcombiningclass=ccc25 */, + { 2, 1553, 5578, 9, 14, UNI_MN } /* category=nonspacingmark */, + { 0, 3877, 9237, 17, 6, UNI_YEZI } /* scriptextensions=yezidi */, + { 1, 1538, 2579, 24, 14, UNI_INPC__BOTTOMANDRIGHT } /* indicpositionalcategory=bottomandright */, + { 4, 8973, 2936, 6, 19, UNI_SUNDANESESUP } /* block=sundanesesupplement */, + { 4, 9691, 1595, 4, 14, UNI_MUSIC } /* blk=musicalsymbols */, + { 2, 3877, 9081, 17, 6, UNI_HATR } /* scriptextensions=hatran */, + { 42, 9847, 10055, 4, 4, UNI_LOE } /* loe=true */, + { 0, 9691, 4202, 4, 16, UNI_LINEARBSYLLABARY } /* blk=linearbsyllabary */, + { 22, 2312, 4731, 4, 13, UNI_INHANGUL } /* inhangulsyllables */, + { 7, 9469, 469, 3, 10, UNI_INPUNCTUATION } /* inpunctuation */, + { 1, 5690, 0, 14, 0, UNI_SUPPUNCTUATION } /* suppunctuation */, + { 3, 1553, 4954, 9, 15, UNI_PS } /* category=openpunctuation */, + { 1, 1990, 3639, 22, 17, UNI_INSC__CONSONANTPREFIXED } /* indicsyllabiccategory=consonantprefixed */, + { 16, 9691, 6242, 4, 12, UNI_ETHIOPICEXTB } /* blk=ethiopicextb */, + { 0, 7580, 5948, 10, 2, UNI_WB__ML } /* wordbreak=ml */, + { 0, 2012, 26, 22, 1, UNI_LOE } /* logicalorderexception=y */, + { 16, 9691, 6494, 4, 12, UNI_INMASARAMGONDI } /* blk=masaramgondi */, + { 0, 7433, 0, 4, 0, UNI_SOGD } /* sogd */, + { 0, 7370, 9454, 10, 5, -UNI_XPOSIXLOWER } /* lowercase=false */, + { 1, 9459, 3, 5, 1, -UNI_IDSB } /* idsb=f */, + { 0, 9979, 8811, 5, 3, UNI_SOYO } /* scx=soyo */, + { 3, 9476, 2841, 3, 19, UNI_MERO } /* sc=meroitichieroglyphs */, + 
{ 0, 21, 5927, 2, 13, UNI_LOWSURROGATES } /* inlowsurrogates */, + { 1, 1418, 8994, 24, 3, UNI_CCC__107 } /* canonicalcombiningclass=107 */, + { 20, 9647, 10071, 4, 4, UNI_AGE__12_DOT_1 } /* age=v121 */, + { 1, 9691, 2332, 4, 6, UNI_YIJING } /* blk=yijing */, + { 3, 8973, 721, 7, 8, UNI_INCUNEIFORM } /* block=cuneiform */, + { 0, 2242, 1936, 3, 10, UNI_NUMBERFORMS } /* innumberforms */, + { 0, 3877, 9703, 17, 4, UNI_CAKM } /* scriptextensions=cakm */, + { 1, 185, 1678, 2, 9, UNI_LATINEXTE } /* islatinexte */, + { 7, 10247, 4819, 3, 15, UNI_JG__MANICHAEANSADHE } /* jg=manichaeansadhe */, + { 1, 1088, 10055, 27, 4, UNI_PCM } /* prependedconcatenationmark=true */, + { 1, 5270, 0, 14, 0, UNI_KANGXI } /* kangxiradicals */, + { 0, 3283, 36, 18, 1, UNI_IDSB } /* idsbinaryoperator=t */, + { 16, 9979, 9827, 4, 4, UNI_LANA } /* scx=lana */, + { 44, 3403, 26, 6, 1, UNI_XPOSIXSPACE } /* space=y */, + { 3, 4714, 9454, 15, 5, -UNI_GREXT } /* graphemeextend=false */, + { 8, 8973, 5690, 6, 14, UNI_SUPPUNCTUATION } /* block=suppunctuation */, + { 0, 185, 8691, 2, 7, UNI_MULT } /* ismultani */, + { 2, 10217, 2822, 3, 19, UNI_BC__LRO } /* bc=lefttorightoverride */, + { 3, 8973, 150, 7, 34, UNI_DIACRITICALSSUP } /* block=combiningdiacriticalmarkssupplement */, + { 3, 6338, 0, 5, 0, UNI_JOINC } /* joinc */, + { 9, 5536, 17, 15, 1, UNI_COMPEX } /* nfcquickcheck=no */, + { 3, 4984, 0, 8, 0, UNI_TAMILSUP } /* tamilsup */, + { 0, 8973, 44, 7, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* block=cjkcompatibilityideographssupplement */, + { 1, 8881, 1008, 3, 26, UNI_ANCIENTGREEKMUSIC } /* isancientgreekmusicalnotation */, + { 5, 1418, 8028, 24, 2, UNI_CCC__20 } /* canonicalcombiningclass=20 */, + { 1, 2185, 1026, 21, 2, -UNI_EXTPICT } /* extendedpictographic=no */, + { 1, 9763, 4401, 4, 9, UNI_WB__EB } /* gcb=emodifier */, + { 6, 9979, 8500, 4, 8, UNI_UGAR } /* scx=ugaritic */, + { 0, 1858, 10355, 22, 3, UNI_CWT } /* changeswhentitlecased=yes */, + { 0, 185, 5270, 2, 6, UNI_KANGXI } /* iskangxi */, + { 
9, 8782, 9895, 7, 4, UNI_SC__NKO } /* script=nkoo */, + { 1, 1009, 0, 2, 0, UNI_CI } /* ci */, + { 0, 185, 10390, 2, 2, UNI_CASEDLETTER } /* isl_ */, + { 12, 7360, 10378, 10, 2, UNI_LB__H2 } /* linebreak=h2 */, + { 1, 8973, 2248, 6, 21, UNI_ININSCRIPTIONALPARTHIAN } /* block=inscriptionalparthian */, + { 9, 9711, 8099, 4, 2, UNI_CCC__14 } /* ccc=14 */, + { 0, 6083, 8943, 13, 6, UNI_NV__800000 } /* numericvalue=800000 */, + { 2, 9979, 4186, 4, 7, UNI_LINB } /* scx=linearb */, + { 8, 8973, 6183, 7, 11, UNI_CHESSSYMBOLS } /* block=chesssymbols */, + { 0, 10516, 7451, 3, 9, UNI_PHNX } /* isphoenician */, + { 0, 7467, 10340, 3, 3, UNI_IN__8 } /* in=v80 */, + { 0, 7360, 3409, 10, 17, UNI_RI } /* linebreak=regionalindicator */, + { 10, 9691, 1587, 5, 13, UNI_BYZANTINEMUSIC } /* blk=byzantinemusic */, + { 1, 9476, 9947, 3, 4, UNI_SC__COPT } /* sc=qaac */, + { 10, 9461, 4346, 3, 5, UNI_SB__XX } /* sb=other */, + { 2, 9979, 8684, 4, 7, UNI_MARC } /* scx=marchen */, + { 0, 10268, 10153, 3, 2, UNI_NV__42 } /* nv=42 */, + { 3, 5875, 5704, 13, 14, UNI_JG__HAMZAONHEHGOAL } /* joininggroup=tehmarbutagoal */, + { 8, 3121, 2593, 18, 4, UNI_DT__VERT } /* decompositiontype=vert */, + { 56, 780, 0, 30, 0, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* symbolsandpictographsextendeda */, + { 3, 10253, 6708, 3, 11, UNI_LB__BB } /* lb=breakbefore */, + { 5, 8973, 7281, 7, 9, UNI_COMPATJAMO } /* block=compatjamo */, + { 8, 9461, 867, 3, 2, UNI_SB__SP } /* sb=sp */, + { 1, 3877, 7835, 17, 9, UNI_OUGR } /* scriptextensions=olduyghur */, + { 6, 8881, 3572, 3, 9, UNI_ALCHEMICAL } /* isalchemical */, + { 9, 3877, 7655, 17, 9, UNI_BHKS } /* scriptextensions=bhaiksuki */, + { 1, 7560, 1026, 10, 2, -UNI_XPOSIXUPPER } /* uppercase=no */, + { 0, 6617, 210, 4, 2, UNI_TOTO } /* istoto */, + { 10, 10268, 8084, 3, 8, UNI_NV__3_SLASH_80 } /* nv=3.75e-02 */, + { 3, 185, 6057, 2, 13, UNI_MISCTECHNICAL } /* ismisctechnical */, + { 0, 9476, 9931, 3, 4, UNI_SC__PHLP } /* sc=phlp */, + { 3, 1514, 0, 24, 0, 
UNI_HIGHPUSURROGATES } /* highprivateusesurrogates */, + { 0, 6350, 6, 12, 1, UNI_JT__D } /* joiningtype=d */, + { 6, 8973, 3355, 6, 18, UNI_ORNAMENTALDINGBATS } /* block=ornamentaldingbats */, + { 16, 1538, 2573, 24, 12, UNI_INPC__TOPANDBOTTOM } /* indicpositionalcategory=topandbottom */, + { 0, 9691, 9081, 4, 6, UNI_INHATRAN } /* blk=hatran */, + { 0, 10247, 9274, 3, 5, UNI_JG__ALAPH } /* jg=alaph */, + { 14, 4598, 4092, 4, 14, UNI_GEORGIANEXT } /* ingeorgianextended */, + { 1, 9476, 7071, 3, 11, UNI_SORA } /* sc=sorasompeng */, + { 3, 9269, 26, 5, 1, UNI_POSIXXDIGIT } /* ahex=y */, + { 39, 8973, 4864, 6, 15, UNI_MISCPICTOGRAPHS } /* block=miscpictographs */, + { 1, 4074, 133, 16, 2, UNI_LM } /* generalcategory=lm */, + { 24, 10510, 1891, 6, 5, UNI_XPOSIXUPPER } /* xposixupper */, + { 0, 2248, 318, 3, 32, UNI_SUPMATHOPERATORS } /* insupplementalmathematicaloperators */, + { 7, 9711, 7619, 4, 9, UNI_CCC__AL } /* ccc=aboveleft */, + { 1, 8854, 2333, 3, 5, UNI_YIJING } /* inyijing */, + { 0, 1792, 1026, 22, 2, -UNI_CWCF } /* changeswhencasefolded=no */, + { 0, 7580, 1195, 10, 2, UNI_LB__LF } /* wordbreak=lf */, + { 1, 8782, 9811, 7, 4, UNI_KHMR } /* script=khmr */, + { 0, 9691, 2122, 4, 21, UNI_CJKCOMPATFORMS } /* blk=cjkcompatibilityforms */, + { 1, 6083, 9249, 13, 5, UNI_NV__1_SLASH_160 } /* numericvalue=1/160 */, + { 0, 4074, 4058, 16, 16, UNI_PF } /* generalcategory=finalpunctuation */, + { 0, 185, 1045, 2, 6, UNI_L } /* isletter */, + { 3, 3877, 9919, 17, 4, UNI_OSGE } /* scriptextensions=osge */, + { 9, 9979, 7420, 4, 10, UNI_XPEO } /* scx=oldpersian */, + { 2, 9189, 0, 7, 0, UNI_STERM } /* sterm=t */, + { 0, 8782, 2841, 7, 19, UNI_MERO } /* script=meroitichieroglyphs */, + { 1, 10271, 0, 3, 0, UNI_OCR } /* ocr */, + { 0, 9476, 9534, 3, 4, UNI_SC__TAKR } /* sc=takr */, + { 0, 10232, 1, 3, 1, UNI_EA__N } /* ea=n */, + { 0, 6340, 4616, 9, 8, UNI_CONTROLPICTURES } /* incontrolpictures */, + { 0, 8961, 0, 6, 0, UNI_bidic_values_index } /* bidic= */, + { 1, 5045, 
1369, 3, 3, UNI_UGAR } /* isugar */, + { 1, 185, 9963, 2, 4, UNI_ROHG } /* isrohg */, + { 0, 10560, 3403, 6, 5, UNI_VERTSPACE } /* isvertspace */, + { 0, 8782, 7844, 7, 4, UNI_PALM } /* script=palm */, + { 0, 7360, 867, 10, 2, UNI_LB__SP } /* linebreak=sp */, + { 0, 8565, 0, 7, 0, UNI_CJKEXTD } /* cjkextd */, + { 0, 4744, 1285, 15, 9, UNI_IDENTIFIERTYPE__EXCLUSION } /* identifiertype=exclusion */, + { 32, 6314, 3, 12, 1, -UNI_IDEO } /* ideographic=f */, + { 6, 4972, 8867, 3, 6, UNI_TIRH } /* istirhuta */, + { 0, 3157, 3, 18, 1, -UNI_EBASE } /* emojimodifierbase=f */, + { 2, 8973, 9201, 6, 6, UNI_INTELUGU } /* block=telugu */, + { 6, 10268, 9013, 3, 2, UNI_NV__29 } /* nv=29 */, + { 0, 8973, 4410, 6, 6, UNI_INSYRIAC } /* block=syriac */, + { 0, 3877, 9509, 17, 5, UNI_OGAM } /* scriptextensions=ogham */, + { 8, 9799, 0, 4, 0, UNI_HMNP } /* hmnp */, + { 0, 6083, 10368, 13, 2, UNI_NV__47 } /* numericvalue=47 */, + { 0, 8782, 8677, 7, 7, UNI_SC__MAND } /* script=mandaic */, + { 3, 6675, 1, 11, 1, -UNI_IDC } /* idcontinue=n */, + { 4, 9476, 9504, 3, 5, UNI_NSHU } /* sc=nushu */, + { 34, 9270, 3, 4, 1, -UNI_XPOSIXXDIGIT } /* hex=f */, + { 4, 4714, 26, 15, 1, UNI_GREXT } /* graphemeextend=y */, + { 1, 185, 1946, 2, 22, UNI_DIACRITICALSFORSYMBOLS } /* isdiacriticalsforsymbols */, + { 0, 10244, 1218, 3, 2, UNI_SK } /* gc=sk */, + { 6, 3945, 10055, 17, 4, UNI_UIDEO } /* unifiedideograph=true */, + { 0, 7560, 10055, 10, 4, UNI_XPOSIXUPPER } /* uppercase=true */, + { 0, 9979, 9509, 4, 5, UNI_OGAM } /* scx=ogham */, + { 0, 10111, 0, 4, 0, UNI_ZANB } /* zanb */, + { 0, 9469, 6615, 3, 11, UNI_PHAISTOS } /* inphaistosdisc */, + { 0, 9691, 2689, 4, 11, UNI_COUNTINGROD } /* blk=countingrod */, + { 0, 9979, 1924, 4, 6, UNI_ZYYY } /* scx=common */, + { 0, 10346, 18, 3, 1, UNI_VO__R } /* vo=r */, + { 0, 10280, 3, 3, 1, -UNI_RI } /* ri=f */, + { 1, 1418, 9016, 25, 4, UNI_CCC__13 } /* canonicalcombiningclass=ccc13 */, + { 1, 3877, 4849, 17, 15, UNI_MERC } /* 
scriptextensions=meroiticcursive */, + { 3, 9077, 1, 4, 1, -UNI_EXT } /* ext=n */, + { 0, 9647, 10202, 4, 3, UNI_AGE__6_DOT_3 } /* age=6.3 */, + { 0, 7907, 36, 9, 1, UNI_XIDS } /* xidstart=t */, + { 0, 1553, 46, 9, 2, UNI_CO } /* category=co */, + { 2, 8973, 4534, 6, 7, UNI_BRAI } /* block=braille */, + { 0, 9927, 1, 4, 1, -UNI_PCM } /* pcm=n */, + { 0, 2242, 9896, 3, 2, UNI_INNKO } /* innko */, + { 0, 4074, 75, 16, 2, UNI_ME } /* generalcategory=me */, + { 0, 8973, 4138, 6, 16, UNI_HIGHPUSURROGATES } /* block=highpusurrogates */, + { 0, 7467, 7995, 3, 2, UNI_IN__12 } /* in=12 */, + { 0, 8476, 0, 8, 0, UNI_TFNG } /* tifinagh */, + { 0, 10268, 8907, 3, 5, UNI_NV__30000 } /* nv=30000 */, + { 1, 8768, 0, 6, 0, UNI_PATSYN } /* patsyn */, + { 1, 3877, 2937, 18, 8, UNI_SUND } /* scriptextensions=sundanese */, + { 0, 8973, 5940, 6, 9, UNI_INMALAYALAM } /* block=malayalam */, + { 6, 5758, 10055, 13, 4, UNI_BIDIM } /* bidimirrored=true */, + { 0, 9747, 0, 4, 0, UNI_dia_values_index } /* dia= */, + { 4, 9711, 4175, 4, 1, UNI_CCC__1 } /* ccc=1 */, + { 0, 8782, 3622, 7, 17, UNI_AGHB } /* script=caucasianalbanian */, + { 0, 9711, 8988, 4, 3, UNI_CCC__103 } /* ccc=103 */, + { 15, 9476, 9919, 3, 4, UNI_OSGE } /* sc=osge */, + { 0, 8973, 2165, 7, 7, UNI_INCYRILLIC } /* block=cyrillic */, + { 8, 4074, 6719, 16, 11, UNI_CASEDLETTER } /* generalcategory=casedletter */, + { 0, 3877, 9504, 17, 5, UNI_NSHU } /* scriptextensions=nushu */, + { 2, 9476, 9903, 3, 4, UNI_OGAM } /* sc=ogam */, + { 1, 2808, 4491, 4, 13, UNI_ARABICEXTB } /* inarabicextendedb */, + { 35, 9474, 9289, 5, 5, UNI_INSC__BINDU } /* insc=bindu */, + { 0, 9691, 3049, 4, 8, UNI_INCHEROKEE } /* blk=cherokee */, + { 0, 5116, 1, 14, 1, -UNI_CI } /* caseignorable=n */, + { 37, 5875, 5508, 13, 14, UNI_JG__MANICHAEANYODH } /* joininggroup=manichaeanyodh */, + { 0, 9691, 3319, 4, 18, UNI_LATINEXTADDITIONAL } /* blk=latinextadditional */, + { 16, 1088, 0, 26, 0, UNI_PCM } /* prependedconcatenationmark */, + { 1, 10352, 8516, 3, 
7, UNI_WB__LE } /* wb=aletter */, + { 0, 3792, 0, 17, 0, UNI_KITS } /* khitansmallscript */, + { 3, 185, 3247, 2, 18, UNI_INPUNCTUATION } /* isgeneralpunctuation */, + { 0, 6314, 36, 12, 1, UNI_IDEO } /* ideographic=t */, + { 2, 3877, 6518, 17, 4, UNI_MEND } /* scriptextensions=mend */, + { 0, 185, 1275, 3, 19, UNI_CE } /* iscompositionexclusion */, + { 1, 9647, 10295, 4, 3, UNI_AGE__2 } /* age=v20 */, + { 16, 8782, 9715, 7, 4, UNI_CHRS } /* script=chrs */, + { 0, 9979, 7330, 4, 10, UNI_KHAR } /* scx=kharoshthi */, + { 8, 8881, 7192, 4, 8, UNI_ARABICEXTA } /* isarabicexta */, + { 0, 9476, 8508, 3, 4, UNI_VITH } /* sc=vith */, + { 3, 3877, 9069, 17, 4, UNI_GOTH } /* scriptextensions=goth */, + { 7, 185, 284, 2, 33, UNI_MISCMATHSYMBOLSB } /* ismiscellaneousmathematicalsymbolsb */, + { 1, 6083, 9259, 13, 5, UNI_NV__11_SLASH_12 } /* numericvalue=11/12 */, + { 16, 1792, 9454, 22, 5, -UNI_CWCF } /* changeswhencasefolded=false */, + { 0, 5408, 8680, 5, 4, UNI_INMANDAIC } /* inmandaic */, + { 2, 9691, 9871, 4, 3, UNI_INMRO } /* blk=mro */, + { 10, 185, 691, 3, 29, UNI_CJKEXTG } /* iscjkunifiedideographsextensiong */, + { 26, 1632, 0, 15, 0, UNI_GEOMETRICSHAPES } /* geometricshapes */, + { 0, 1852, 1026, 6, 2, -UNI_CASED } /* cased=no */, + { 48, 8782, 7655, 7, 9, UNI_BHKS } /* script=bhaiksuki */, + { 1, 1418, 8147, 24, 2, UNI_CCC__16 } /* canonicalcombiningclass=16 */, + { 75, 9691, 8607, 4, 7, UNI_INELBASAN } /* blk=elbasan */, + { 5, 8388, 0, 4, 0, UNI_JAVA } /* java */, + { 10, 9449, 10355, 5, 3, UNI_EMOD } /* emod=yes */, + { 3, 185, 6338, 2, 5, UNI_JOINC } /* isjoinc */, + { 3, 10217, 2513, 3, 20, UNI_BC__PDF } /* bc=popdirectionalformat */, + { 0, 9691, 1034, 4, 27, UNI_ENCLOSEDCJK } /* blk=enclosedcjklettersandmonths */, + { 1, 9550, 3, 4, 1, -UNI_IDS } /* ids=f */, + { 0, 8973, 2332, 6, 6, UNI_YIJING } /* block=yijing */, + { 60, 9474, 7470, 5, 10, UNI_INSC__PUREKILLER } /* insc=purekiller */, + { 0, 9691, 8719, 4, 7, UNI_NB } /* blk=noblock */, + { 0, 3877, 7420, 
17, 10, UNI_XPEO } /* scriptextensions=oldpersian */, + { 0, 9691, 1747, 4, 13, UNI_ZNAMENNYMUSIC } /* blk=znamennymusic */, + { 1, 3945, 3, 17, 1, -UNI_UIDEO } /* unifiedideograph=f */, + { 4, 9647, 9599, 4, 4, UNI_AGE__13 } /* age=13.0 */, + { 5, 10253, 6287, 3, 2, UNI_LB__ZW } /* lb=zw */, + { 7, 185, 1586, 2, 14, UNI_BYZANTINEMUSIC } /* isbyzantinemusic */, + { 1, 10244, 10398, 3, 2, UNI_ZP } /* gc=zp */, + { 0, 10244, 1934, 3, 2, UNI_CN } /* gc=cn */, + { 12, 9711, 6554, 4, 12, UNI_CCC__0 } /* ccc=notreordered */, + { 4, 9474, 1609, 5, 23, UNI_INSC__CONSONANTPRECEDINGREPHA } /* insc=consonantprecedingrepha */, + { 0, 5862, 0, 6, 0, UNI_IPAEXT } /* ipaext */, + { 0, 9979, 8356, 4, 8, UNI_HIRA } /* scx=hiragana */, + { 1, 8782, 9919, 7, 4, UNI_OSGE } /* script=osge */, + { 1, 8973, 8789, 6, 7, UNI_SC__SHRD } /* block=sharada */, + { 8, 10268, 9259, 3, 5, UNI_NV__11_SLASH_12 } /* nv=11/12 */, + { 0, 1088, 9454, 27, 5, -UNI_PCM } /* prependedconcatenationmark=false */, + { 0, 8621, 0, 7, 0, UNI_GRAN } /* grantha */, + { 16, 10349, 10055, 3, 4, UNI_VS } /* vs=true */, + { 2, 6083, 8943, 13, 4, UNI_NV__8000 } /* numericvalue=8000 */, + { 0, 10268, 10362, 3, 2, UNI_NV__44 } /* nv=44 */, + { 10, 1852, 36, 6, 1, UNI_CASED } /* cased=t */, + { 0, 9691, 8500, 4, 8, UNI_INUGARITIC } /* blk=ugaritic */, + { 0, 9691, 4442, 4, 16, UNI_TANGUTSUP } /* blk=tangutsupplement */, + { 1, 5875, 8460, 13, 8, UNI_JG__SWASHKAF } /* joininggroup=swashkaf */, + { 18, 3877, 1538, 18, 3, UNI_SIND } /* scriptextensions=sind */, + { 2, 3877, 9871, 17, 3, UNI_MRO } /* scriptextensions=mro */, + { 0, 10352, 74, 3, 2, UNI_WB__EB } /* wb=em */, + { 0, 2269, 0, 11, 0, UNI_MTEI } /* meeteimayek */, + { 4, 9979, 7430, 4, 10, UNI_SOGO } /* scx=oldsogdian */, + { 10, 10268, 8903, 3, 4, UNI_NV__6000 } /* nv=6000 */, + { 34, 2304, 4926, 4, 13, UNI_NARB } /* isoldnortharabian */, + { 4, 7682, 0, 9, 0, UNI_ext_values_index } /* extender= */, + { 2, 6340, 3050, 3, 10, UNI_CHEROKEESUP } /* incherokeesup 
*/, + { 0, 6340, 8580, 3, 6, UNI_CJKEXTF } /* incjkextf */, + { 0, 6083, 5732, 13, 13, UNI_NV__1000000000000 } /* numericvalue=1000000000000 */, + { 0, 9691, 7390, 4, 10, UNI_MISCARROWS } /* blk=miscarrows */, + { 8, 1592, 6231, 3, 11, UNI_ETHIOPICEXTA } /* inethiopicexta */, + { 9, 7230, 2473, 10, 11, UNI_BC__L } /* bidiclass=lefttoright */, + { 0, 1189, 9530, 3, 4, UNI_INTAILE } /* intaile */, + { 33, 185, 63, 2, 5, UNI_XPOSIXGRAPH } /* isgraph */, + { 40, 8973, 4314, 6, 16, UNI_MYANMAREXTA } /* block=myanmarextendeda */, + { 1, 8973, 9135, 6, 6, UNI_INLYDIAN } /* block=lydian */, + { 29, 10217, 2533, 3, 11, UNI_BC__R } /* bc=righttoleft */, + { 4, 9177, 36, 6, 1, UNI_QMARK } /* qmark=t */, + { 0, 8782, 1014, 7, 5, UNI_SC__GREK } /* script=greek */, + { 0, 8782, 9875, 7, 4, UNI_MTEI } /* script=mtei */, + { 8, 9711, 3039, 4, 5, UNI_CCC__A } /* ccc=above */, + { 4, 9979, 9237, 4, 6, UNI_YEZI } /* scx=yezidi */, + { 1, 3877, 9867, 17, 4, UNI_MLYM } /* scriptextensions=mlym */, + { 0, 10268, 7980, 3, 8, UNI_NV__1_SLASH_6 } /* nv=1.67e-01 */, + { 3, 3877, 4939, 17, 15, UNI_SARB } /* scriptextensions=oldsoutharabian */, + { 58, 10244, 2085, 3, 14, UNI_LM } /* gc=modifierletter */, + { 43, 5227, 0, 4, 0, UNI_CHAM } /* cham */, + { 10, 8973, 317, 6, 33, UNI_SUPMATHOPERATORS } /* block=supplementalmathematicaloperators */, + { 27, 10253, 10382, 3, 2, UNI_GCB__L } /* lb=jl */, + { 1, 10283, 0, 3, 0, UNI_sd_values_index } /* sd= */, + { 0, 10253, 6818, 3, 11, UNI_LB__IN } /* lb=inseparable */, + { 0, 4639, 0, 4, 0, UNI_DASH } /* dash */, + { 0, 5172, 3, 14, 1, -UNI_EMOD } /* emojimodifier=f */, + { 1, 8973, 1219, 6, 26, UNI_KATAKANAEXT } /* block=katakanaphoneticextensions */, + { 0, 9763, 1934, 4, 2, UNI_GCB__CN } /* gcb=cn */, + { 4, 9691, 43, 4, 3, UNI_CJK } /* blk=cjk */, + { 1, 10244, 49, 3, 1, UNI_P } /* gc=p */, + { 1, 9476, 8388, 3, 8, UNI_SC__JAVA } /* sc=javanese */, + { 30, 5875, 66, 15, 2, UNI_JG__KAPH } /* joininggroup=kaph */, + { 4, 4847, 2880, 3, 8, 
UNI_INMONGOLIAN } /* inmongolian */, + { 2, 3877, 7434, 18, 3, UNI_SOGD } /* scriptextensions=sogd */, + { 3, 9979, 8684, 4, 4, UNI_MARC } /* scx=marc */, + { 1, 1418, 10160, 24, 3, UNI_CCC__A } /* canonicalcombiningclass=230 */, + { 4, 8973, 952, 6, 18, UNI_INVS } /* block=variationselectors */, + { 1, 8973, 9504, 6, 5, UNI_INNUSHU } /* block=nushu */, + { 0, 8973, 4043, 7, 15, UNI_CYPRIOTSYLLABARY } /* block=cypriotsyllabary */, + { 0, 9691, 3463, 4, 12, UNI_SMALLKANAEXT } /* blk=smallkanaext */, + { 1, 8782, 9767, 7, 4, UNI_SC__GONG } /* script=gong */, + { 0, 8973, 9484, 6, 5, UNI_INLIMBU } /* block=limbu */, + { 0, 8705, 17, 8, 1, UNI_NFKCQC__N } /* nfkcqc=no */, + { 5, 3877, 8754, 17, 4, UNI_OSMA } /* scriptextensions=osma */, + { 0, 2248, 8453, 3, 7, UNI_SPECIALS } /* inspecials */, + { 34, 10229, 10091, 3, 4, UNI_EA__F } /* dt=wide */, + { 1, 8782, 10119, 7, 4, UNI_SC__ZYYY } /* script=zyyy */, + { 6, 43, 0, 36, 0, UNI_CJKCOMPATIDEOGRAPHSSUP } /* cjkcompatibilityideographssupplement */, + { 0, 10232, 67, 3, 1, UNI_EA__H } /* ea=h */, + { 0, 8782, 8348, 7, 8, UNI_SC__GURU } /* script=gurmukhi */, + { 0, 3877, 8500, 17, 8, UNI_UGAR } /* scriptextensions=ugaritic */, + { 0, 4074, 5676, 16, 14, UNI_ZS } /* generalcategory=spaceseparator */, + { 0, 3911, 0, 17, 0, UNI_SMALLFORMS } /* smallformvariants */, + { 1, 9979, 3265, 4, 8, UNI_GEOR } /* scx=georgian */, + { 0, 8782, 9899, 7, 4, UNI_NSHU } /* script=nshu */, + { 0, 2304, 9520, 3, 4, UNI_OSGE } /* isosage */, + { 1, 8782, 10031, 7, 4, UNI_TFNG } /* script=tfng */, + { 1, 6083, 9260, 13, 4, UNI_NV__1_SLASH_12 } /* numericvalue=1/12 */, + { 1, 6083, 8949, 13, 2, UNI_NV__90 } /* numericvalue=90 */, + { 18, 10268, 9367, 3, 2, UNI_NV__27 } /* nv=27 */, + { 0, 9711, 8907, 4, 2, UNI_CCC__30 } /* ccc=30 */, + { 0, 9189, 10056, 7, 3, UNI_STERM } /* sterm=true */, + { 94, 7460, 10322, 10, 3, UNI_IN__5_DOT_2 } /* presentin=v52 */, + { 1, 2509, 0, 4, 0, UNI_MONG } /* mong */, + { 1, 21, 7736, 2, 9, UNI_LATINEXTD } /* 
inlatinextd */, + { 0, 6083, 9578, 13, 2, UNI_NV__41 } /* numericvalue=41 */, + { 0, 9476, 9444, 3, 4, UNI_SC__DOGR } /* sc=dogr */, + { 12, 10250, 0, 4, 0, UNI_JT__L } /* jt=l */, + { 2, 9469, 6627, 3, 11, UNI_PLAYINGCARDS } /* inplayingcards */, + { 0, 2227, 0, 4, 0, UNI_HAN } /* hani */, + { 0, 10268, 10208, 3, 3, UNI_NV__7_SLASH_8 } /* nv=7/8 */, + { 0, 7230, 2533, 10, 20, UNI_BC__RLE } /* bidiclass=righttoleftembedding */, + { 1, 9707, 0, 4, 0, UNI_CANS } /* cans */, + { 1, 185, 8663, 2, 7, UNI_LINA } /* islineara */, + { 24, 1418, 9675, 24, 3, UNI_CCC__202 } /* canonicalcombiningclass=atb */, + { 4, 185, 3445, 2, 18, UNI_RUMI } /* isruminumeralsymbols */, + { 17, 8444, 36, 8, 1, UNI_RADICAL } /* radical=t */, + { 64, 10352, 0, 3, 0, UNI_wb_values_index } /* wb= */, + { 7, 9691, 6194, 4, 12, UNI_CYRILLICEXTA } /* blk=cyrillicexta */, + { 7, 10349, 10355, 3, 3, UNI_VS } /* vs=yes */, + { 1, 10244, 4286, 3, 10, UNI_SM } /* gc=mathsymbol */, + { 2, 2012, 0, 21, 0, UNI_LOE } /* logicalorderexception */, + { 3, 6741, 3, 11, 1, -UNI_DEP } /* deprecated=f */, + { 2, 8973, 3193, 6, 11, UNI_ETHIOPICSUP } /* block=ethiopicsup */, + { 0, 7230, 2290, 10, 21, UNI_BC__PDI } /* bidiclass=popdirectionalisolate */, + { 0, 6290, 0, 12, 0, UNI_GONG } /* gunjalagondi */, + { 12, 6340, 116, 4, 33, UNI_DIACRITICALSFORSYMBOLS } /* incombiningdiacriticalmarksforsymbols */, + { 1, 9647, 9, 4, 2, UNI_AGE__NA } /* age=na */, + { 9, 185, 5888, 2, 13, UNI_KANAEXTA } /* iskanaextendeda */, + { 1, 1902, 0, 19, 0, UNI_CJKCOMPATIDEOGRAPHS } /* cjkcompatideographs */, + { 0, 9711, 7983, 4, 1, UNI_CCC__7 } /* ccc=7 */, + { 0, 4074, 25, 16, 1, UNI_S } /* generalcategory=s */, + { 16, 2206, 24, 21, 1, UNI_GCB__L } /* graphemeclusterbreak=l */, + { 1, 1418, 9305, 25, 4, UNI_CCC__15 } /* canonicalcombiningclass=ccc15 */, + { 0, 1990, 3994, 22, 16, UNI_INSC__CANTILLATIONMARK } /* indicsyllabiccategory=cantillationmark */, + { 3, 1088, 26, 27, 1, UNI_PCM } /* prependedconcatenationmark=y */, + { 1, 
4074, 1564, 16, 2, UNI_PS } /* generalcategory=ps */, + { 7, 9719, 0, 4, 0, UNI_CPMN } /* cpmn */, + { 1, 9476, 2227, 3, 4, UNI_SC__HAN } /* sc=hani */, + { 0, 7260, 0, 10, 0, UNI_CHRS } /* chorasmian */, + { 0, 8973, 0, 12, 0, UNI_INCARIAN } /* block=carian */, + { 1, 185, 8600, 2, 7, UNI_DSRT } /* isdeseret */, + { 5, 9270, 10055, 4, 4, UNI_XPOSIXXDIGIT } /* hex=true */, + { 8, 9177, 10055, 6, 4, UNI_QMARK } /* qmark=true */, + { 2, 9691, 810, 4, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* blk=enclosedideographicsup */, + { 38, 10516, 2595, 3, 3, UNI_PRTI } /* isprti */, + { 0, 2248, 0, 21, 0, UNI_PRTI } /* inscriptionalparthian */, + { 1, 6340, 2165, 3, 7, UNI_INCYRILLIC } /* incyrillic */, + { 5, 4074, 9706, 16, 2, UNI_MC } /* generalcategory=mc */, + { 0, 7360, 6288, 10, 2, UNI_LB__WJ } /* linebreak=wj */, + { 0, 10268, 8164, 3, 8, UNI_NV__1_SLASH_16 } /* nv=6.25e-02 */, + { 0, 185, 9815, 2, 4, UNI_KITS } /* iskits */, + { 0, 5823, 3, 13, 1, -UNI_GRBASE } /* graphemebase=f */, + { 8, 7853, 0, 9, 0, UNI_PAUC } /* paucinhau */, + { 1, 8782, 9207, 7, 6, UNI_SC__THAA } /* script=thaana */, + { 0, 185, 6950, 2, 11, UNI_MYANMAREXTA } /* ismyanmarexta */, + { 1, 9474, 6572, 5, 6, UNI_LB__ZWJ } /* insc=joiner */, + { 1, 3403, 0, 6, 0, UNI_wspace_values_index } /* space= */, + { 4, 9434, 10355, 5, 3, UNI_CWCM } /* cwcm=yes */, + { 0, 9691, 6057, 4, 13, UNI_MISCTECHNICAL } /* blk=misctechnical */, + { 0, 9643, 0, 4, 0, UNI_ADLM } /* adlm */, + { 1, 6674, 10055, 12, 4, UNI_XIDC } /* xidcontinue=true */, + { 14, 9979, 9484, 4, 5, UNI_LIMB } /* scx=limbu */, + { 1, 7360, 7628, 10, 9, UNI_LB__AI } /* linebreak=ambiguous */, + { 0, 9476, 9775, 3, 4, UNI_SC__GREK } /* sc=grek */, + { 3, 10346, 3546, 3, 7, UNI_VO__U } /* vo=upright */, + { 0, 9711, 24, 4, 1, UNI_CCC__L } /* ccc=l */, + { 1, 9123, 10355, 6, 3, UNI_XPOSIXLOWER } /* lower=yes */, + { 0, 3877, 3265, 17, 4, UNI_GEOR } /* scriptextensions=geor */, + { 0, 6940, 0, 4, 0, UNI__PERL_SURROGATE } /* iscs */, + { 1, 2269, 0, 21, 
0, UNI_MEETEIMAYEKEXT } /* meeteimayekextensions */, + { 0, 5662, 50, 14, 2, UNI_SB__AT } /* sentencebreak=at */, + { 2, 9476, 10099, 3, 4, UNI_XSUX } /* sc=xsux */, + { 1, 185, 9117, 2, 6, UNI_LEPC } /* islepcha */, + { 8, 9979, 2312, 5, 6, UNI_SINH } /* scx=sinhala */, + { 16, 9691, 5634, 4, 14, UNI_INPSALTERPAHLAVI } /* blk=psalterpahlavi */, + { 0, 10253, 185, 3, 2, UNI_LB__IS } /* lb=is */, + { 9, 1167, 0, 25, 0, UNI_DI } /* defaultignorablecodepoint */, + { 0, 6083, 9567, 13, 4, UNI_NV__1_SLASH_20 } /* numericvalue=1/20 */, + { 4, 9691, 4984, 4, 15, UNI_TAMILSUP } /* blk=tamilsupplement */, + { 0, 9474, 4579, 5, 15, UNI_INSC__CONSONANTMEDIAL } /* insc=consonantmedial */, + { 5, 185, 511, 3, 29, UNI_CJKEXTA } /* iscjkunifiedideographsextensiona */, + { 0, 10511, 3403, 5, 5, UNI_POSIXSPACE } /* posixspace */, + { 8, 3877, 7570, 17, 10, UNI_WARA } /* scriptextensions=warangciti */, + { 0, 3877, 6386, 17, 4, UNI_MAHJ } /* scriptextensions=mahj */, + { 0, 7230, 2292, 10, 3, UNI_BC__PDI } /* bidiclass=pdi */, + { 5, 5662, 401, 14, 6, UNI_SB__FO } /* sentencebreak=format */, + { 1, 10352, 5068, 3, 2, UNI_WB__SQ } /* wb=sq */, + { 1, 3553, 10055, 18, 4, UNI_VS } /* variationselector=true */, + { 7, 8782, 8468, 7, 4, UNI_SC__TAGB } /* script=tagb */, + { 9, 9979, 2841, 4, 19, UNI_MERO } /* scx=meroitichieroglyphs */, + { 64, 9647, 10205, 4, 3, UNI_AGE__7 } /* age=7.0 */, + { 0, 1880, 1, 22, 1, -UNI_CWU } /* changeswhenuppercased=n */, + { 22, 5875, 6271, 13, 7, UNI_JG__SEMKATH } /* joininggroup=semkath */, + { 0, 7467, 7924, 3, 3, UNI_IN__1_DOT_1 } /* in=1.1 */, + { 5, 9979, 10083, 4, 4, UNI_VAI } /* scx=vaii */, + { 0, 185, 3365, 2, 8, UNI_DINGBATS } /* isdingbats */, + { 0, 9711, 9016, 5, 5, UNI_CCC__130 } /* ccc=ccc130 */, + { 2, 3877, 3193, 17, 4, UNI_ETHI } /* scriptextensions=ethi */, + { 1, 10553, 7, 3, 1, UNI_SC } /* issc */, + { 12, 3877, 7811, 17, 4, UNI_ITAL } /* scriptextensions=ital */, + { 0, 3877, 3978, 17, 4, UNI_BOPO } /* scriptextensions=bopo */, + { 
4, 185, 3139, 2, 13, UNI_DEVANAGARIEXT } /* isdevanagariext */, + { 6, 9979, 1655, 4, 6, UNI_HANG } /* scx=hangul */, + { 8, 10283, 10055, 3, 4, UNI_SD } /* sd=true */, + { 5, 10511, 10528, 5, 5, UNI_POSIXPRINT } /* posixprint */, + { 0, 3391, 1026, 18, 2, -UNI__PERL_PATWS } /* patternwhitespace=no */, + { 2, 185, 7071, 2, 11, UNI_SORA } /* issorasompeng */, + { 1, 8973, 2433, 6, 20, UNI_GLAGOLITICSUP } /* block=glagoliticsupplement */, + { 0, 4972, 4985, 3, 7, UNI_TAMILSUP } /* istamilsup */, + { 1, 7580, 5068, 10, 2, UNI_WB__SQ } /* wordbreak=sq */, + { 11, 9691, 8452, 4, 8, UNI_SPECIALS } /* blk=specials */, + { 8, 9979, 8979, 4, 6, UNI_CARI } /* scx=carian */, + { 4, 9691, 7790, 4, 9, UNI_INNEWTAILUE } /* blk=newtailue */, + { 0, 8782, 3792, 7, 17, UNI_KITS } /* script=khitansmallscript */, + { 0, 3877, 8508, 17, 8, UNI_VITH } /* scriptextensions=vithkuqi */, + { 0, 9691, 2841, 4, 19, UNI_MERO } /* blk=meroitichieroglyphs */, + { 0, 4378, 0, 16, 0, UNI_SUPMATHOPERATORS } /* supmathoperators */, + { 2, 6158, 0, 12, 0, UNI_bidic_values_index } /* bidicontrol= */, + { 8, 3877, 9923, 17, 4, UNI_OUGR } /* scriptextensions=ougr */, + { 1, 9171, 0, 6, 0, UNI_patws_values_index } /* patws= */, + { 1, 6529, 1062, 3, 26, UNI_OCR } /* inopticalcharacterrecognition */, + { 0, 9270, 10355, 4, 3, UNI_XPOSIXXDIGIT } /* hex=yes */, + { 8, 9711, 9420, 5, 4, UNI_CCC__91 } /* ccc=ccc91 */, + { 5, 8873, 0, 7, 0, UNI_ZZZZ } /* unknown */, + { 2, 4847, 2271, 4, 12, UNI_MEETEIMAYEKEXT } /* inmeeteimayekext */, + { 0, 2206, 407, 21, 7, UNI_GCB__CN } /* graphemeclusterbreak=control */, + { 0, 9647, 8099, 4, 2, UNI_AGE__14 } /* age=14 */, + { 0, 9711, 3031, 4, 18, UNI_CCC__216 } /* ccc=attachedaboveright */, + { 0, 8973, 8276, 6, 8, UNI_INBALINESE } /* block=balinese */, + { 1, 3877, 7808, 17, 9, UNI_ITAL } /* scriptextensions=olditalic */, + { 2, 10217, 10262, 3, 3, UNI_BC__LRO } /* bc=lro */, + { 1, 9691, 3690, 4, 17, UNI_CYRILLICEXTC } /* blk=cyrillicextendedc */, + { 3, 10518, 0, 
10, 0, UNI_POSIXBLANK } /* posixblank */, + { 0, 3406, 10355, 3, 3, UNI_CE } /* ce=yes */, + { 0, 8973, 6950, 6, 11, UNI_MYANMAREXTA } /* block=myanmarexta */, + { 8, 8782, 9663, 7, 4, UNI_ARMI } /* script=armi */, + { 1, 9691, 1370, 4, 24, UNI_ARABICPFA } /* blk=arabicpresentationformsa */, + { 0, 3103, 0, 4, 0, UNI_COPT } /* copt */, + { 9, 9647, 7550, 4, 10, UNI_AGE__NA } /* age=unassigned */, + { 13, 9171, 9454, 6, 5, -UNI__PERL_PATWS } /* patws=false */, + { 17, 2185, 36, 21, 1, UNI_EXTPICT } /* extendedpictographic=t */, + { 0, 9147, 0, 7, 0, -UNI__PERL_NCHAR } /* nchar=n */, + { 0, 5045, 59, 3, 4, UNI_UIDEO } /* isuideo */, + { 33, 8768, 1, 7, 1, -UNI_PATSYN } /* patsyn=n */, + { 0, 9691, 9514, 4, 5, UNI_INORIYA } /* blk=oriya */, + { 1, 8782, 9771, 7, 4, UNI_SC__GONM } /* script=gonm */, + { 4, 1553, 1530, 11, 7, UNI__PERL_SURROGATE } /* category=surrogate */, + { 17, 9711, 10163, 4, 3, UNI_CCC__AR } /* ccc=232 */, + { 0, 9979, 10015, 4, 4, UNI_TALE } /* scx=tale */, + { 0, 9691, 8551, 4, 7, UNI_CJKEXTB } /* blk=cjkextb */, + { 0, 9711, 5849, 4, 13, UNI_CCC__IS } /* ccc=iotasubscript */, + { 2, 9075, 26, 6, 1, UNI_GREXT } /* grext=y */, + { 3, 9979, 9767, 4, 4, UNI_GONG } /* scx=gong */, + { 9, 9979, 9237, 4, 4, UNI_YEZI } /* scx=yezi */, + { 33, 9489, 10355, 5, 3, UNI_MATH } /* math=yes */, + { 0, 10247, 7880, 3, 9, UNI_JG__SYRIACWAW } /* jg=syriacwaw */, + { 0, 4744, 6741, 15, 10, UNI_DEP } /* identifiertype=deprecated */, + { 2, 3398, 9454, 11, 5, -UNI_XPOSIXSPACE } /* whitespace=false */, + { 0, 9691, 9529, 4, 5, UNI_INTAILE } /* blk=taile */, + { 1, 5172, 9454, 14, 5, -UNI_EMOD } /* emojimodifier=false */, + { 1, 6314, 1026, 12, 2, -UNI_IDEO } /* ideographic=no */, + { 10, 9213, 10055, 6, 4, UNI_UIDEO } /* uideo=true */, + { 9, 185, 5340, 2, 14, UNI_LATINEXTF } /* islatinextendedf */, + { 8, 9847, 0, 4, 0, UNI_loe_values_index } /* loe= */, + { 2, 7718, 0, 9, 0, UNI_LATINEXTB } /* latinextb */, + { 4, 9550, 36, 4, 1, UNI_IDS } /* ids=t */, + { 5, 9803, 
5717, 4, 2, UNI_LB__H2 } /* hst=lv */, + { 1, 9711, 8179, 4, 2, UNI_CCC__36 } /* ccc=36 */, + { 0, 8973, 2034, 6, 22, UNI_MISCTECHNICAL } /* block=miscellaneoustechnical */, + { 3, 2304, 6432, 3, 3, UNI_OGAM } /* isogam */, + { 1, 8316, 10355, 8, 3, UNI_EXTPICT } /* extpict=yes */, + { 3, 9743, 36, 4, 1, UNI_DEP } /* dep=t */, + { 0, 10268, 9254, 3, 4, UNI_NV__1_SLASH_32 } /* nv=1/32 */, + { 3, 2332, 0, 6, 0, UNI_YIJING } /* yijing */, + { 5, 1167, 1, 26, 1, -UNI_DI } /* defaultignorablecodepoint=n */, + { 1, 10244, 4624, 3, 14, UNI_SC } /* gc=currencysymbol */, + { 1, 1858, 36, 22, 1, UNI_CWT } /* changeswhentitlecased=t */, + { 2, 5093, 9454, 9, 5, -UNI_XPOSIXXDIGIT } /* hexdigit=false */, + { 9, 6083, 8903, 13, 4, UNI_NV__6000 } /* numericvalue=6000 */, + { 0, 10268, 8028, 3, 8, UNI_NV__20000000 } /* nv=20000000 */, + { 24, 21, 7718, 2, 9, UNI_LATINEXTB } /* inlatinextb */, + { 0, 2593, 3528, 20, 7, UNI_VO__R } /* verticalorientation=rotated */, + { 1, 7360, 1528, 10, 9, UNI_LB__SG } /* linebreak=surrogate */, + { 0, 1418, 9030, 24, 3, UNI_WB__EB } /* canonicalcombiningclass=133 */, + { 25, 5088, 1, 14, 1, -UNI_POSIXXDIGIT } /* asciihexdigit=n */, + { 1, 1553, 728, 9, 2, UNI_MN } /* category=mn */, + { 0, 8973, 7071, 6, 11, UNI_INSORASOMPENG } /* block=sorasompeng */, + { 2, 9476, 7862, 3, 9, UNI_SAMR } /* sc=samaritan */, + { 0, 9691, 7853, 4, 9, UNI_INPAUCINHAU } /* blk=paucinhau */, + { 10, 10508, 5096, 8, 5, UNI_XPOSIXDIGIT } /* isxposixdigit */, + { 4, 1418, 8059, 24, 2, UNI_CCC__33 } /* canonicalcombiningclass=33 */, + { 129, 3877, 9105, 17, 4, UNI_KHOJ } /* scriptextensions=khoj */, + { 8, 6937, 255, 6, 29, UNI_MISCMATHSYMBOLSA } /* inmiscellaneousmathematicalsymbolsa */, + { 0, 9476, 18, 6, 1, UNI_KHAR } /* sc=khar */, + { 0, 9213, 26, 6, 1, UNI_UIDEO } /* uideo=y */, + { 1, 3877, 9294, 17, 5, UNI_BUHD } /* scriptextensions=buhid */, + { 93, 6338, 36, 12, 1, UNI_JOINC } /* joincontrol=t */, + { 8, 9979, 6590, 4, 12, UNI_HUNG } /* scx=oldhungarian */, + { 
0, 7460, 8148, 10, 3, UNI_IN__6 } /* presentin=6.0 */, + { 19, 1553, 32, 9, 2, UNI__PERL_SURROGATE } /* category=cs */, + { 2, 6083, 10208, 13, 3, UNI_NV__7_SLASH_8 } /* numericvalue=7/8 */, + { 0, 8782, 8804, 8, 3, UNI_SIDD } /* script=sidd */, + { 0, 185, 4504, 2, 5, UNI_BAMU } /* isbamum */, + { 0, 185, 8594, 3, 5, UNI_COMPEX } /* iscompex */, + { 0, 6083, 7916, 13, 8, UNI_NV__1_SLASH_10 } /* numericvalue=1.00e-01 */, + { 0, 10217, 6602, 3, 12, UNI_BC__ON } /* bc=otherneutral */, + { 0, 2012, 10355, 22, 3, UNI_LOE } /* logicalorderexception=yes */, + { 2, 7467, 10325, 3, 3, UNI_IN__6 } /* in=v60 */, + { 4, 3049, 0, 11, 0, UNI_CHEROKEESUP } /* cherokeesup */, + { 1, 2557, 983, 5, 24, UNI_ALPHABETICPF } /* inalphabeticpresentationforms */, + { 5, 9439, 3, 5, 1, -UNI_DASH } /* dash=f */, + { 6, 9476, 7430, 3, 10, UNI_SOGO } /* sc=oldsogdian */, + { 13, 10510, 9424, 6, 5, UNI_XPOSIXCNTRL } /* xposixcntrl */, + { 0, 9647, 7983, 4, 1, UNI_AGE__7 } /* age=7 */, + { 0, 10253, 4594, 3, 15, UNI_LB__CB } /* lb=contingentbreak */, + { 0, 10396, 0, 2, 0, UNI_ZL } /* zl */, + { 0, 1990, 9225, 22, 6, UNI_INSC__VIRAMA } /* indicsyllabiccategory=virama */, + { 0, 6340, 511, 3, 19, UNI_CJK } /* incjkunifiedideographs */, + { 3, 9153, 26, 6, 1, UNI_NFCQC__Y } /* nfcqc=y */, + { 2, 118, 2250, 4, 19, UNI_ININSCRIPTIONALPARTHIAN } /* ininscriptionalparthian */, + { 0, 3877, 9879, 17, 4, UNI_MYMR } /* scriptextensions=mymr */, + { 1, 185, 6362, 2, 5, UNI_KHMR } /* iskhmer */, + { 0, 8961, 36, 6, 1, UNI_BIDIC } /* bidic=t */, + { 11, 10268, 5732, 3, 2, UNI_NV__10 } /* nv=10 */, + { 32, 9711, 9422, 4, 2, UNI_CCC__91 } /* ccc=91 */, + { 0, 9171, 0, 5, 0, UNI__PERL_PATWS } /* patws */, + { 0, 3877, 7863, 18, 8, UNI_SAMR } /* scriptextensions=samaritan */, + { 0, 1189, 2101, 3, 14, UNI_TRANSPORTANDMAP } /* intransportandmap */, + { 38, 5875, 4829, 13, 3, UNI_JG__SAD } /* joininggroup=sad */, + { 0, 7862, 0, 9, 0, UNI_SAMR } /* samaritan */, + { 0, 10553, 4411, 3, 5, UNI_SYRC } /* issyriac 
*/, + { 25, 21, 8531, 3, 6, UNI_INAVESTAN } /* inavestan */, + { 1, 2803, 0, 3, 0, UNI_IDS } /* ids */, + { 2, 6158, 26, 12, 1, UNI_BIDIC } /* bidicontrol=y */, + { 39, 1418, 3588, 24, 17, UNI_WB__EB } /* canonicalcombiningclass=attachedbelowleft */, + { 32, 5758, 1, 13, 1, -UNI_BIDIM } /* bidimirrored=n */, + { 34, 9691, 8817, 4, 7, UNI_SUPPUAA } /* blk=suppuaa */, + { 3, 9691, 8677, 4, 7, UNI_INMANDAIC } /* blk=mandaic */, + { 0, 10553, 10004, 3, 3, UNI_SOGO } /* issogo */, + { 0, 1418, 9407, 24, 2, UNI_CCC__35 } /* canonicalcombiningclass=35 */, + { 0, 2312, 1515, 3, 23, UNI_HIGHPUSURROGATES } /* inhighprivateusesurrogates */, + { 1, 8782, 7105, 8, 10, UNI_SC__SYLO } /* script=sylotinagri */, + { 17, 10229, 3463, 3, 5, UNI_DT__SML } /* dt=small */, + { 1, 8973, 7826, 6, 9, UNI_INOLDTURKIC } /* block=oldturkic */, + { 9, 9284, 0, 5, 0, UNI_BATK } /* batak */, + { 8, 9699, 0, 4, 0, UNI_BUHD } /* buhd */, + { 26, 6083, 8084, 13, 8, UNI_NV__3_SLASH_80 } /* numericvalue=3.75e-02 */, + { 1, 2012, 0, 22, 0, UNI_loe_values_index } /* logicalorderexception= */, + { 0, 9711, 9365, 5, 4, UNI_CCC__27 } /* ccc=ccc27 */, + { 0, 2185, 10055, 21, 4, UNI_EXTPICT } /* extendedpictographic=true */, + { 1, 2206, 1195, 21, 2, UNI_LB__LF } /* graphemeclusterbreak=lf */, + { 17, 120, 9070, 3, 5, UNI_INGOTHIC } /* ingothic */, + { 4, 9439, 0, 5, 0, UNI_dash_values_index } /* dash= */, + { 0, 10217, 0, 4, 0, UNI_BC__B } /* bc=b */, + { 1, 9476, 1678, 3, 5, UNI_SC__LATN } /* sc=latin */, + { 1, 9691, 3624, 4, 4, UNI_UCAS } /* blk=ucas */, + { 10, 7467, 10211, 3, 3, UNI_IN__9 } /* in=9.0 */, + { 0, 7467, 7975, 3, 1, UNI_IN__6 } /* in=6 */, + { 1, 8979, 0, 4, 0, UNI_CARI } /* cari */, + { 0, 6674, 1, 12, 1, -UNI_XIDC } /* xidcontinue=n */, + { 0, 9190, 1, 5, 1, -UNI_TERM } /* term=n */, + { 17, 8782, 7420, 7, 10, UNI_XPEO } /* script=oldpersian */, + { 32, 7218, 8293, 3, 7, UNI_INBUGINESE } /* inbuginese */, + { 12, 8967, 3, 6, 1, -UNI_BIDIM } /* bidim=f */, + { 27, 8782, 2269, 7, 11, 
UNI_MTEI } /* script=meeteimayek */, + { 0, 9979, 2632, 4, 4, UNI_BRAH } /* scx=brah */, + { 0, 5662, 70, 14, 2, UNI_SB__UP } /* sentencebreak=up */, + { 5, 1553, 3373, 9, 18, UNI_ZP } /* category=paragraphseparator */, + { 0, 10247, 7177, 3, 3, UNI_JG__FEH } /* jg=feh */, + { 1, 8973, 5256, 6, 7, UNI_KANASUP } /* block=kanasup */, + { 9, 1880, 10355, 22, 3, UNI_CWU } /* changeswhenuppercased=yes */, + { 169, 7467, 10307, 3, 3, UNI_IN__3_DOT_2 } /* in=v32 */, + { 4, 9476, 9524, 3, 5, UNI_RUNR } /* sc=runic */, + { 0, 185, 10119, 2, 4, UNI_ZYYY } /* iszyyy */, + { 1, 7467, 10175, 3, 3, UNI_IN__3_DOT_2 } /* in=3.2 */, + { 9, 6302, 0, 6, 0, UNI_HEBR } /* hebrew */, + { 34, 9979, 1177, 5, 3, UNI_SORA } /* scx=sora */, + { 0, 9763, 0, 4, 0, UNI_gcb_values_index } /* gcb= */, + { 0, 8973, 3481, 6, 11, UNI_TAIXUANJING } /* block=taixuanjing */, + { 0, 7682, 3, 9, 1, -UNI_EXT } /* extender=f */, + { 1, 185, 4170, 2, 6, UNI_LATIN1 } /* islatin1 */, + { 2, 10253, 5382, 3, 14, UNI_LB__BK } /* lb=mandatorybreak */, + { 0, 8782, 5227, 7, 4, UNI_CHAM } /* script=cham */, + { 14, 1553, 4026, 9, 16, UNI_PE } /* category=closepunctuation */, + { 0, 7391, 3607, 4, 15, UNI_UCAS } /* iscanadiansyllabics */, + { 6, 2206, 6895, 21, 3, UNI_LB__H3 } /* graphemeclusterbreak=lvt */, + { 0, 24, 0, 1, 0, UNI_L } /* l */, + { 34, 9691, 2879, 4, 9, UNI_INMONGOLIAN } /* blk=mongolian */, + { 1, 10232, 866, 3, 1, UNI_EA__W } /* ea=w */, + { 0, 185, 3382, 2, 9, UNI_Z } /* isseparator */, + { 1, 118, 416, 3, 31, UNI_INIDC } /* inideographicdescriptioncharacters */, + { 21, 1592, 3708, 3, 16, UNI_ETHIOPICEXTA } /* inethiopicextendeda */, + { 0, 3877, 58, 17, 2, UNI_YI } /* scriptextensions=yi */, + { 8, 7230, 427, 10, 2, UNI_BC__ES } /* bidiclass=es */, + { 49, 5045, 1, 3, 33, UNI_UCAS } /* isunifiedcanadianaboriginalsyllabics */, + { 31, 8973, 3050, 7, 17, UNI_CHEROKEESUP } /* block=cherokeesupplement */, + { 0, 2808, 81, 4, 8, UNI_ARABICMATH } /* inarabicmath */, + { 2, 1747, 0, 23, 0, 
UNI_ZNAMENNYMUSIC } /* znamennymusicalnotation */, + { 0, 3193, 0, 8, 0, UNI_ETHI } /* ethiopic */, + { 5, 3877, 8508, 17, 4, UNI_VITH } /* scriptextensions=vith */, + { 1, 6083, 8903, 13, 2, UNI_NV__60 } /* numericvalue=60 */, + { 1, 9476, 8300, 3, 8, UNI_SC__DUPL } /* sc=duployan */, + { 24, 9691, 5745, 4, 13, UNI_AEGEANNUMBERS } /* blk=aegeannumbers */, + { 14, 6083, 8901, 13, 6, UNI_NV__216000 } /* numericvalue=216000 */, + { 0, 21, 8404, 2, 8, UNI_KANAEXTB } /* inkanaextb */, + { 8, 7297, 9792, 3, 3, UNI_HLUW } /* ishluw */, + { 5, 3877, 10027, 17, 4, UNI_TAVT } /* scriptextensions=tavt */, + { 0, 7360, 6807, 10, 11, UNI_LB__EX } /* linebreak=exclamation */, + { 0, 8782, 8799, 10, 4, UNI_SHAW } /* script=shavian */, + { 4, 690, 0, 30, 0, UNI_CJKEXTG } /* cjkunifiedideographsextensiong */, + { 0, 10566, 8875, 4, 5, UNI_ZZZZ } /* isunknown */, + { 2, 9691, 7808, 4, 9, UNI_INOLDITALIC } /* blk=olditalic */, + { 0, 3103, 0, 6, 0, UNI_COPT } /* coptic */, + { 0, 10352, 6254, 3, 12, UNI_WB__EX } /* wb=extendnumlet */, + { 9, 7460, 10205, 10, 3, UNI_IN__7 } /* presentin=7.0 */, + { 1, 2808, 3964, 4, 7, UNI_ARABICSUP } /* inarabicsup */, + { 0, 9979, 9771, 4, 4, UNI_GONM } /* scx=gonm */, + { 0, 10217, 3427, 3, 18, UNI_BC__RLI } /* bc=righttoleftisolate */, + { 0, 9476, 2879, 3, 9, UNI_SC__MONG } /* sc=mongolian */, + { 0, 1418, 10142, 24, 3, UNI_CCC__202 } /* canonicalcombiningclass=202 */, + { 28, 5875, 6686, 13, 11, UNI_JG__AFRICANNOON } /* joininggroup=africannoon */, + { 14, 5875, 7490, 13, 10, UNI_JG__REVERSEDPE } /* joininggroup=reversedpe */, + { 0, 10247, 4122, 3, 16, UNI_JG__HANIFIROHINGYAPA } /* jg=hanifirohingyapa */, + { 0, 1553, 468, 9, 5, UNI_P } /* category=punct */, + { 0, 21, 7709, 2, 9, UNI_INKHUDAWADI } /* inkhudawadi */, + { 22, 6083, 10181, 13, 3, UNI_NV__3_SLASH_5 } /* numericvalue=3/5 */, + { 0, 8973, 8831, 6, 7, UNI_INTAGALOG } /* block=tagalog */, + { 0, 1167, 10355, 26, 3, UNI_DI } /* defaultignorablecodepoint=yes */, + { 0, 185, 3139, 2, 
10, UNI_DEVA } /* isdevanagari */, + { 25, 8782, 9183, 7, 6, UNI_RJNG } /* script=rejang */, + { 0, 7360, 496, 10, 2, UNI_LB__NU } /* linebreak=nu */, + { 15, 3406, 10055, 3, 4, UNI_CE } /* ce=true */, + { 0, 10283, 36, 3, 1, UNI_SD } /* sd=t */, + { 0, 7360, 9764, 10, 2, UNI_LB__CB } /* linebreak=cb */, + { 4, 8782, 2353, 7, 20, UNI_HLUW } /* script=anatolianhieroglyphs */, + { 68, 10516, 5095, 7, 6, UNI_POSIXXDIGIT } /* isposixxdigit */, + { 0, 9979, 8614, 4, 7, UNI_ELYM } /* scx=elymaic */, + { 1, 10352, 6287, 3, 3, UNI_LB__ZWJ } /* wb=zwj */, + { 1, 8782, 6290, 7, 12, UNI_SC__GONG } /* script=gunjalagondi */, + { 1, 10253, 6326, 3, 12, UNI_LB__IS } /* lb=infixnumeric */, + { 1, 7736, 0, 9, 0, UNI_LATINEXTD } /* latinextd */, + { 0, 9691, 4924, 4, 15, UNI_NARB } /* blk=oldnortharabian */, + { 21, 2593, 3535, 20, 18, UNI_VO__TU } /* verticalorientation=transformedupright */, + { 32, 4972, 9535, 3, 3, UNI_TAKR } /* istakr */, + { 1, 8705, 0, 7, 0, UNI_nfkcqc_values_index } /* nfkcqc= */, + { 8, 3877, 9815, 17, 4, UNI_KITS } /* scriptextensions=kits */, + { 0, 9691, 4186, 4, 16, UNI_LINEARBIDEOGRAMS } /* blk=linearbideograms */, + { 1, 185, 8420, 2, 8, UNI_MAHJ } /* ismahajani */, + { 49, 8782, 9237, 7, 4, UNI_SC__YEZI } /* script=yezi */, + { 48, 1847, 0, 9, 0, UNI_XPOSIXLOWER } /* lowercase */, + { 0, 10232, 10091, 3, 4, UNI_EA__W } /* ea=wide */, + { 2, 3877, 9839, 17, 4, UNI_LINA } /* scriptextensions=lina */, + { 0, 10553, 1538, 3, 3, UNI_SIND } /* issind */, + { 9, 9476, 4924, 3, 15, UNI_NARB } /* sc=oldnortharabian */, + { 0, 9979, 4939, 4, 15, UNI_SARB } /* scx=oldsoutharabian */, + { 47, 10247, 5452, 3, 14, UNI_JG__MANICHAEANKAPH } /* jg=manichaeankaph */, + { 0, 10229, 6530, 3, 8, UNI_DT__NONCANON } /* dt=noncanon */, + { 2, 10247, 7180, 3, 10, UNI_JG__AFRICANQAF } /* jg=africanqaf */, + { 6, 10268, 5733, 3, 1, UNI_NV__0 } /* nv=0 */, + { 10, 5662, 34, 14, 6, UNI_SB__EX } /* sentencebreak=extend */, + { 0, 10253, 3409, 3, 17, UNI_RI } /* 
lb=regionalindicator */, + { 0, 2765, 0, 19, 0, UNI_JAMOEXTB } /* hanguljamoextendedb */, + { 17, 7540, 0, 10, 0, UNI_SUPARROWSC } /* suparrowsc */, + { 0, 10268, 8949, 3, 5, UNI_NV__90000 } /* nv=90000 */, + { 16, 5875, 7177, 13, 2, UNI_JG__FE } /* joininggroup=fe */, + { 0, 9549, 1026, 5, 2, -UNI_XIDS } /* xids=no */, + { 1, 4170, 0, 9, 0, UNI_LATIN1 } /* latin1sup */, + { 0, 9476, 8979, 3, 4, UNI_CARI } /* sc=cari */, + { 0, 5676, 0, 14, 0, UNI_ZS } /* spaceseparator */, + { 9, 1836, 10055, 22, 4, UNI_CWL } /* changeswhenlowercased=true */, + { 0, 8705, 26, 7, 1, UNI_NFKCQC__Y } /* nfkcqc=y */, + { 1, 6340, 541, 3, 29, UNI_CJKEXTB } /* incjkunifiedideographsextensionb */, + { 1, 9979, 7434, 5, 6, UNI_SOGD } /* scx=sogdian */, + { 2, 6338, 10055, 12, 4, UNI_JOINC } /* joincontrol=true */, + { 0, 1115, 10355, 26, 3, UNI_CWKCF } /* changeswhennfkccasefolded=yes */, + { 1, 9647, 10319, 4, 3, UNI_AGE__5_DOT_1 } /* age=v51 */, + { 0, 8973, 7745, 6, 9, UNI_LATINEXTF } /* block=latinextf */, + { 5, 9476, 5059, 3, 15, UNI_ZANB } /* sc=zanabazarsquare */, + { 13, 6340, 721, 3, 15, UNI_CUNEIFORMNUMBERS } /* incuneiformnumbers */, + { 0, 6083, 9616, 13, 3, UNI_NV__7_SLASH_2 } /* numericvalue=7/2 */, + { 6, 4972, 9203, 4, 4, UNI_TELU } /* istelugu */, + { 8, 9691, 3049, 4, 18, UNI_CHEROKEESUP } /* blk=cherokeesupplement */, + { 0, 9711, 8761, 4, 7, UNI_CCC__1 } /* ccc=overlay */, + { 2, 8973, 9099, 6, 6, UNI_KANBUN } /* block=kanbun */, + { 3, 3934, 0, 11, 0, UNI_SGNW } /* signwriting */, + { 2, 3193, 0, 11, 0, UNI_ETHIOPICSUP } /* ethiopicsup */, + { 1, 9979, 9815, 4, 4, UNI_KITS } /* scx=kits */, + { 0, 9979, 9931, 4, 4, UNI_PHLP } /* scx=phlp */, + { 9, 1553, 1846, 9, 2, UNI_NL } /* category=nl */, + { 1, 10510, 3403, 6, 5, UNI_XPOSIXSPACE } /* xposixspace */, + { 0, 1814, 1026, 22, 2, -UNI_CWCM } /* changeswhencasemapped=no */, + { 0, 4864, 0, 15, 0, UNI_MISCPICTOGRAPHS } /* miscpictographs */, + { 6, 4157, 416, 3, 31, UNI_INIDC } /* isideographicdescriptioncharacters 
*/, + { 18, 9461, 113, 3, 2, UNI_SB__SC } /* sb=sc */, + { 2, 4972, 10036, 3, 3, UNI_TGLG } /* istglg */, + { 2, 9691, 8388, 4, 8, UNI_INJAVANESE } /* blk=javanese */, + { 0, 9763, 4346, 4, 5, UNI_GCB__XX } /* gcb=other */, + { 2, 185, 9851, 2, 4, UNI_MEDF } /* ismedf */, + { 1, 9691, 720, 4, 9, UNI_INCUNEIFORM } /* blk=cuneiform */, + { 2, 7160, 2333, 3, 5, UNI_YIJING } /* isyijing */, + { 1, 10516, 132, 3, 3, UNI_PALM } /* ispalm */, + { 0, 8782, 8838, 7, 7, UNI_LANA } /* script=taitham */, + { 0, 8973, 6044, 6, 13, UNI_MAYANNUMERALS } /* block=mayannumerals */, + { 9, 3175, 3, 18, 1, -UNI_EPRES } /* emojipresentation=f */, + { 0, 9691, 8845, 4, 7, UNI_INTAIVIET } /* blk=taiviet */, + { 1, 9123, 1026, 6, 2, -UNI_XPOSIXLOWER } /* lower=no */, + { 0, 6674, 36, 12, 1, UNI_XIDC } /* xidcontinue=t */, + { 0, 7360, 6287, 10, 3, UNI_LB__ZWJ } /* linebreak=zwj */, + { 0, 10508, 9424, 8, 5, UNI_XPOSIXCNTRL } /* isxposixcntrl */, + { 2, 9476, 8500, 3, 8, UNI_UGAR } /* sc=ugaritic */, + { 2, 2784, 6895, 19, 11, UNI_LB__H3 } /* hangulsyllabletype=lvtsyllable */, + { 0, 9476, 4426, 3, 6, UNI_TANG } /* sc=tangut */, + { 1, 185, 9895, 2, 4, UNI_NKO } /* isnkoo */, + { 10, 8866, 0, 4, 0, UNI_TIRH } /* tirh */, + { 0, 9444, 0, 5, 0, UNI_DOGR } /* dogra */, + { 1, 8782, 7434, 8, 3, UNI_SC__SOGD } /* script=sogd */, + { 2, 8973, 3775, 6, 17, UNI_INDICSIYAQNUMBERS } /* block=indicsiyaqnumbers */, + { 0, 9647, 9583, 4, 4, UNI_AGE__10 } /* age=10.0 */, + { 8, 8782, 7835, 7, 9, UNI_SC__OUGR } /* script=olduyghur */, + { 0, 8973, 4410, 6, 16, UNI_SYRIACSUP } /* block=syriacsupplement */, + { 1, 7360, 4026, 10, 16, UNI_LB__CL } /* linebreak=closepunctuation */, + { 96, 3877, 9947, 17, 4, UNI_COPT } /* scriptextensions=qaac */, + { 2, 10247, 4834, 3, 15, UNI_JG__MANICHAEANZAYIN } /* jg=manichaeanzayin */, + { 0, 5875, 7082, 13, 11, UNI_JG__STRAIGHTWAW } /* joininggroup=straightwaw */, + { 4, 10244, 3373, 3, 18, UNI_ZP } /* gc=paragraphseparator */, + { 11, 5536, 48, 14, 1, UNI_NFCQC__M } 
/* nfcquickcheck=m */, + { 64, 6083, 9254, 13, 4, UNI_NV__1_SLASH_32 } /* numericvalue=1/32 */, + { 2, 9691, 4410, 4, 16, UNI_SYRIACSUP } /* blk=syriacsupplement */, + { 3, 10553, 7018, 3, 3, UNI_SHAW } /* isshaw */, + { 0, 185, 5797, 2, 13, UNI_XPOSIXDIGIT } /* isdecimalnumber */, + { 0, 9469, 7845, 3, 8, UNI_PALM } /* inpalmyrene */, + { 10, 8628, 9454, 7, 5, -UNI_GRBASE } /* grbase=false */, + { 1, 9461, 8747, 3, 7, UNI_SB__LE } /* sb=oletter */, + { 0, 9691, 1320, 4, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* blk=symbolsandpictographsexta */, + { 0, 3391, 9454, 18, 5, -UNI__PERL_PATWS } /* patternwhitespace=false */, + { 1, 185, 4504, 2, 8, UNI_BAMUMSUP } /* isbamumsup */, + { 0, 9979, 9899, 4, 4, UNI_NSHU } /* scx=nshu */, + { 1, 7907, 10055, 9, 4, UNI_XIDS } /* xidstart=true */, + { 4, 8973, 2078, 6, 22, UNI_MODIFIERLETTERS } /* block=spacingmodifierletters */, + { 0, 10553, 4190, 3, 3, UNI_SARB } /* issarb */, + { 19, 2784, 6650, 19, 12, UNI_GCB__T } /* hangulsyllabletype=trailingjamo */, + { 1, 8973, 1007, 6, 17, UNI_ANCIENTGREEKMUSIC } /* block=ancientgreekmusic */, + { 4, 10247, 3860, 3, 17, UNI_JG__MANICHAEANTHAMEDH } /* jg=manichaeanthamedh */, + { 0, 185, 9135, 2, 6, UNI_LYDI } /* islydian */, + { 0, 185, 7781, 2, 9, UNI_NBAT } /* isnabataean */, + { 0, 5256, 0, 14, 0, UNI_KANASUP } /* kanasupplement */, + { 0, 9711, 8043, 4, 2, UNI_CCC__23 } /* ccc=23 */, + { 0, 4154, 6110, 3, 12, UNI_VERTICALFORMS } /* inverticalforms */, + { 0, 6614, 0, 8, 0, UNI_PHAISTOS } /* phaistos */, + { 2, 5298, 0, 14, 0, UNI_LATINEXTC } /* latinextendedc */, + { 0, 9691, 4535, 5, 14, UNI_BRAI } /* blk=braillepatterns */, + { 2, 6529, 4940, 3, 14, UNI_SARB } /* inoldsoutharabian */, + { 6, 8973, 6972, 6, 11, UNI_INNANDINAGARI } /* block=nandinagari */, + { 0, 9763, 5669, 4, 2, UNI_WB__EB } /* gcb=eb */, + { 64, 9549, 1, 5, 1, -UNI_XIDS } /* xids=n */, + { 0, 10253, 84, 3, 2, UNI_LB__CM } /* lb=cm */, + { 27, 185, 810, 2, 22, UNI_ENCLOSEDIDEOGRAPHICSUP } /* 
isenclosedideographicsup */, + { 0, 8973, 4170, 6, 9, UNI_LATIN1 } /* block=latin1sup */, + { 0, 9895, 0, 3, 0, UNI_NKO } /* nko */, + { 0, 10244, 0, 3, 0, UNI_gc_values_index } /* gc= */, + { 1, 3877, 8537, 17, 4, UNI_BENG } /* scriptextensions=beng */, + { 7, 6340, 2165, 3, 20, UNI_CYRILLICSUP } /* incyrillicsupplementary */, + { 2, 7391, 2, 5, 1, UNI_CARI } /* iscari */, + { 0, 4654, 0, 15, 0, UNI_DIACRITICALSEXT } /* diacriticalsext */, + { 0, 7297, 5275, 3, 3, UNI_HIRA } /* ishira */, + { 29, 8973, 8545, 7, 6, UNI_CJKEXTA } /* block=cjkexta */, + { 33, 10553, 17, 3, 1, UNI_SO } /* isso */, + { 2, 3121, 6530, 18, 12, UNI_DT__NONCANON } /* decompositiontype=noncanonical */, + { 3, 5875, 5466, 13, 14, UNI_JG__MANICHAEANQOPH } /* joininggroup=manichaeanqoph */, + { 0, 1553, 2292, 9, 2, UNI_PD } /* category=pd */, + { 0, 9075, 10355, 6, 3, UNI_GREXT } /* grext=yes */, + { 0, 5270, 0, 6, 0, UNI_KANGXI } /* kangxi */, + { 1, 9214, 1026, 5, 2, -UNI_IDEO } /* ideo=no */, + { 0, 185, 2269, 2, 14, UNI_MEETEIMAYEKEXT } /* ismeeteimayekext */, + { 0, 3409, 10355, 18, 3, UNI_RI } /* regionalindicator=yes */, + { 4, 9691, 3571, 4, 10, UNI_ALCHEMICAL } /* blk=alchemical */, + { 3, 5550, 26, 14, 1, UNI_NFDQC__Y } /* nfdquickcheck=y */, + { 5, 4074, 2373, 16, 20, UNI_PC } /* generalcategory=connectorpunctuation */, + { 7, 8782, 9699, 7, 4, UNI_SC__BUHD } /* script=buhd */, + { 0, 9476, 9895, 3, 4, UNI_SC__NKO } /* sc=nkoo */, + { 1, 10083, 0, 4, 0, UNI_VAI } /* vaii */, + { 43, 8973, 8803, 6, 7, UNI_INSIDDHAM } /* block=siddham */, + { 2, 10247, 6432, 3, 5, UNI_JG__GAMAL } /* jg=gamal */, + { 1, 185, 8276, 2, 4, UNI_BALI } /* isbali */, + { 10, 3877, 8804, 18, 6, UNI_SIDD } /* scriptextensions=siddham */, + { 0, 9691, 1902, 4, 19, UNI_CJKCOMPATIDEOGRAPHS } /* blk=cjkcompatideographs */, + { 23, 185, 8670, 2, 7, UNI_MAKA } /* ismakasar */, + { 2, 9691, 4729, 4, 15, UNI_INHANGUL } /* blk=hangulsyllables */, + { 0, 1891, 0, 9, 0, UNI_XPOSIXUPPER } /* uppercase */, + { 0, 5830, 3, 
6, 1, -UNI_EBASE } /* ebase=f */, + { 2, 185, 8348, 2, 8, UNI_GURU } /* isgurmukhi */, + { 6, 9476, 1537, 3, 4, UNI_SC__SIND } /* sc=sind */, + { 0, 4186, 0, 7, 0, UNI_LINB } /* linearb */, + { 1, 6083, 7996, 13, 8, UNI_NV__1_SLASH_5 } /* numericvalue=2.00e-01 */, + { 0, 10510, 1847, 6, 5, UNI_XPOSIXLOWER } /* xposixlower */, + { 0, 2784, 6873, 19, 11, UNI_GCB__L } /* hangulsyllabletype=leadingjamo */, + { 0, 7682, 1026, 9, 2, -UNI_EXT } /* extender=no */, + { 7, 9979, 7709, 4, 9, UNI_SIND } /* scx=khudawadi */, + { 0, 8973, 4298, 6, 16, UNI_MISCMATHSYMBOLSB } /* block=miscmathsymbolsb */, + { 1, 1442, 0, 10, 0, UNI_CJKSYMBOLS } /* cjksymbols */, + { 19, 4074, 1288, 16, 2, UNI_UPPERCASELETTER } /* generalcategory=lu */, + { 11, 6083, 5732, 13, 8, UNI_NV__10000000 } /* numericvalue=10000000 */, + { 8, 9691, 149, 4, 35, UNI_DIACRITICALSSUP } /* blk=combiningdiacriticalmarkssupplement */, + { 0, 1418, 18, 24, 1, UNI_CCC__R } /* canonicalcombiningclass=r */, + { 1, 7360, 534, 10, 2, UNI_LB__NS } /* linebreak=ns */, + { 4, 6578, 5096, 12, 5, UNI_NT__DI } /* numerictype=digit */, + { 7, 8831, 0, 7, 0, UNI_TGLG } /* tagalog */, + { 0, 10547, 7580, 6, 4, UNI_POSIXWORD } /* isperlword */, + { 1, 9979, 1219, 4, 8, UNI_KANA } /* scx=katakana */, + { 3, 5802, 0, 5, 0, UNI_XPOSIXALNUM } /* alnum */, + { 13, 2003, 1046, 10, 5, UNI_L } /* category=letter */, + { 2, 8973, 4534, 6, 15, UNI_BRAI } /* block=braillepatterns */, + { 4, 9691, 0, 4, 43, UNI_UCASEXTA } /* blk=unifiedcanadianaboriginalsyllabicsextendeda */, + { 0, 185, 1674, 2, 4, UNI_JAMO } /* isjamo */, + { 0, 7467, 10343, 3, 3, UNI_IN__9 } /* in=v90 */, + { 41, 8973, 4939, 6, 15, UNI_SARB } /* block=oldsoutharabian */, + { 3, 3877, 8859, 17, 7, UNI_TIBT } /* scriptextensions=tibetan */, + { 22, 10268, 9387, 3, 2, UNI_NV__31 } /* nv=31 */, + { 4, 6338, 0, 12, 0, UNI_joinc_values_index } /* joincontrol= */, + { 0, 6083, 5732, 13, 2, UNI_NV__10 } /* numericvalue=10 */, + { 0, 185, 924, 2, 28, UNI_SUPPUAB } /* 
issupplementaryprivateuseareab */, + { 0, 185, 4381, 2, 13, UNI_MATHOPERATORS } /* ismathoperators */, + { 69, 8973, 5354, 6, 14, UNI_LATINEXTG } /* block=latinextendedg */, + { 0, 10253, 8642, 3, 2, UNI_LB__HY } /* lb=hy */, + { 8, 9476, 9195, 3, 6, UNI_TNSA } /* sc=tangsa */, + { 0, 8881, 4476, 4, 13, UNI_ARABICEXTA } /* isarabicextendeda */, + { 12, 10244, 2373, 3, 20, UNI_PC } /* gc=connectorpunctuation */, + { 79, 8276, 0, 4, 0, UNI_BALI } /* bali */, + { 0, 8973, 8476, 6, 8, UNI_INTIFINAGH } /* block=tifinagh */, + { 12, 10247, 9659, 3, 4, UNI_JG__ALEF } /* jg=alef */, + { 1, 8887, 26, 7, 1, UNI_XPOSIXSPACE } /* wspace=y */, + { 0, 5550, 10355, 14, 3, UNI_NFDQC__Y } /* nfdquickcheck=yes */, + { 4, 10516, 6, 3, 1, UNI_PD } /* ispd */, + { 5, 2593, 18, 20, 1, UNI_VO__R } /* verticalorientation=r */, + { 1, 5045, 1, 3, 42, UNI_UCASEXTA } /* isunifiedcanadianaboriginalsyllabicsextendeda */, + { 3, 2248, 2975, 3, 18, UNI_SUPARROWSB } /* insupplementalarrowsb */, + { 3, 9691, 4090, 4, 11, UNI_GEORGIANEXT } /* blk=georgianext */, + { 1, 10253, 4026, 3, 16, UNI_LB__CL } /* lb=closepunctuation */, + { 41, 5875, 6917, 13, 11, UNI_JG__MALAYALAMRA } /* joininggroup=malayalamra */, + { 30, 8782, 8614, 7, 7, UNI_ELYM } /* script=elymaic */, + { 1, 185, 4170, 2, 16, UNI_LATIN1 } /* islatin1supplement */, + { 27, 10247, 5466, 3, 14, UNI_JG__MANICHAEANQOPH } /* jg=manichaeanqoph */, + { 1, 4298, 0, 16, 0, UNI_MISCMATHSYMBOLSB } /* miscmathsymbolsb */, + { 0, 10268, 8931, 3, 6, UNI_NV__600000 } /* nv=600000 */, + { 11, 8973, 780, 6, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* block=symbolsandpictographsextendeda */, + { 18, 10247, 4244, 3, 3, UNI_JG__LAM } /* jg=lam */, + { 10, 9269, 0, 5, 0, UNI_ahex_values_index } /* ahex= */, + { 0, 3409, 3, 18, 1, -UNI_RI } /* regionalindicator=f */, + { 16, 9474, 8484, 5, 8, UNI_INSC__TONEMARK } /* insc=tonemark */, + { 0, 9476, 8635, 3, 7, UNI_SC__HANO } /* sc=hanunoo */, + { 16, 85, 0, 4, 0, UNI_MATH } /* math */, + { 1, 8973, 2974, 6, 19, 
UNI_SUPARROWSB } /* block=supplementalarrowsb */, + { 7, 6340, 601, 3, 29, UNI_CJKEXTD } /* incjkunifiedideographsextensiond */, + { 0, 1858, 9454, 22, 5, -UNI_CWT } /* changeswhentitlecased=false */, + { 131, 185, 8887, 2, 6, UNI_XPOSIXSPACE } /* iswspace */, + { 0, 6340, 1443, 3, 9, UNI_CJKSYMBOLS } /* incjksymbols */, + { 0, 1990, 8268, 22, 8, UNI_INSC__AVAGRAHA } /* indicsyllabiccategory=avagraha */, + { 0, 8444, 10355, 8, 3, UNI_RADICAL } /* radical=yes */, + { 0, 8973, 721, 7, 29, UNI_CUNEIFORMNUMBERS } /* block=cuneiformnumbersandpunctuation */, + { 0, 8973, 7104, 6, 11, UNI_INSYLOTINAGRI } /* block=sylotinagri */, + { 2, 7580, 1219, 10, 8, UNI_WB__KA } /* wordbreak=katakana */, + { 36, 185, 1946, 2, 12, UNI_DIACRITICALS } /* isdiacriticals */, + { 0, 3877, 3139, 17, 4, UNI_DEVA } /* scriptextensions=deva */, + { 0, 21, 3573, 4, 8, UNI_ALCHEMICAL } /* inalchemical */, + { 0, 185, 5690, 2, 14, UNI_SUPPUNCTUATION } /* issuppunctuation */, + { 37, 9214, 36, 5, 1, UNI_IDEO } /* ideo=t */, + { 0, 185, 6109, 2, 13, UNI_VERTICALFORMS } /* isverticalforms */, + { 0, 4684, 4527, 15, 7, UNI_EA__N } /* eastasianwidth=neutral */, + { 0, 4157, 326, 3, 3, UNI_ITAL } /* isital */, + { 1, 10226, 9454, 3, 5, -UNI_DI } /* di=false */, + { 1, 9153, 48, 6, 1, UNI_NFCQC__M } /* nfcqc=m */, + { 1, 5093, 1026, 9, 2, -UNI_XPOSIXXDIGIT } /* hexdigit=no */, + { 6, 8854, 2333, 3, 20, UNI_YIJING } /* inyijinghexagramsymbols */, + { 96, 2248, 7434, 3, 6, UNI_INSOGDIAN } /* insogdian */, + { 4, 9045, 26, 6, 1, UNI_CWKCF } /* cwkcf=y */, + { 1, 21, 5340, 2, 14, UNI_LATINEXTF } /* inlatinextendedf */, + { 0, 7218, 7656, 3, 8, UNI_INBHAIKSUKI } /* inbhaiksuki */, + { 2, 10244, 32, 3, 2, UNI__PERL_SURROGATE } /* gc=cs */, + { 42, 27, 0, 2, 0, UNI_LOWERCASELETTER } /* ll */, + { 4, 9474, 4394, 5, 16, UNI_INSC__SYLLABLEMODIFIER } /* insc=syllablemodifier */, + { 29, 10109, 1748, 3, 12, UNI_ZNAMENNYMUSIC } /* inznamennymusic */, + { 0, 9081, 0, 4, 0, UNI_HATR } /* hatr */, + { 2, 9476, 10103, 
3, 4, UNI_SC__YI } /* sc=yiii */, + { 8, 3894, 1026, 17, 2, -UNI_STERM } /* sentenceterminal=no */, + { 4, 7460, 8092, 10, 3, UNI_IN__4 } /* presentin=4.0 */, + { 0, 8782, 3103, 7, 4, UNI_SC__COPT } /* script=copt */, + { 0, 10226, 0, 3, 0, UNI_di_values_index } /* di= */, + { 5, 8881, 9652, 3, 3, UNI_AGHB } /* isaghb */, + { 0, 9434, 1026, 5, 2, -UNI_CWCM } /* cwcm=no */, + { 33, 185, 9430, 3, 3, UNI_CWCF } /* iscwcf */, + { 18, 8973, 9183, 6, 6, UNI_INREJANG } /* block=rejang */, + { 33, 9476, 10023, 3, 4, UNI_SC__TAML } /* sc=taml */, + { 2, 8973, 5368, 6, 4, UNI_INLISU } /* block=lisu */, + { 0, 7390, 0, 10, 0, UNI_MISCARROWS } /* miscarrows */, + { 42, 2146, 0, 7, 0, UNI_RADICAL } /* radical */, + { 1, 9190, 9454, 5, 5, -UNI_TERM } /* term=false */, + { 51, 185, 6207, 3, 11, UNI_CYRILLICEXTB } /* iscyrillicextb */, + { 0, 7391, 12, 5, 3, UNI_CARI } /* iscarian */, + { 0, 7580, 1219, 10, 2, UNI_WB__KA } /* wordbreak=ka */, + { 1, 9048, 0, 2, 0, UNI_CF } /* cf */, + { 73, 1418, 1779, 24, 2, UNI_CCC__DB } /* canonicalcombiningclass=db */, + { 0, 1538, 1948, 4, 10, UNI_DIACRITICALS } /* indiacriticals */, + { 4, 8973, 3445, 6, 4, UNI_RUMI } /* block=rumi */, + { 0, 10217, 866, 3, 2, UNI_BC__WS } /* bc=ws */, + { 1, 9691, 952, 4, 18, UNI_INVS } /* blk=variationselectors */, + { 1, 9979, 7844, 4, 4, UNI_PALM } /* scx=palm */, + { 0, 5758, 1026, 13, 2, -UNI_BIDIM } /* bidimirrored=no */, + { 2, 9087, 1, 6, 1, -UNI_JOINC } /* joinc=n */, + { 1, 185, 6386, 2, 4, UNI_MAHJ } /* ismahj */, + { 1, 4314, 0, 16, 0, UNI_MYANMAREXTA } /* myanmarextendeda */, + { 7, 8973, 541, 7, 29, UNI_CJKEXTB } /* block=cjkunifiedideographsextensionb */, + { 1, 10280, 36, 3, 1, UNI_RI } /* ri=t */, + { 1, 118, 6, 3, 2, UNI_INIDC } /* inidc */, + { 0, 9979, 7501, 5, 3, UNI_SAUR } /* scx=saur */, + { 0, 185, 3463, 2, 18, UNI_SMALLKANAEXT } /* issmallkanaextension */, + { 0, 10516, 7580, 7, 4, UNI_POSIXWORD } /* isposixword */, + { 3, 9803, 24, 4, 1, UNI_GCB__L } /* hst=l */, + { 0, 6755, 2900, 
4, 17, UNI_OTTOMANSIYAQNUMBERS } /* inottomansiyaqnumbers */, + { 16, 21, 5368, 2, 4, UNI_INLISU } /* inlisu */, + { 1, 8782, 9534, 7, 4, UNI_SC__TAKR } /* script=takr */, + { 1, 9476, 7811, 3, 4, UNI_ITAL } /* sc=ital */, + { 3, 9153, 0, 6, 0, UNI_nfcqc_values_index } /* nfcqc= */, + { 0, 6083, 8244, 13, 8, UNI_NV__7_SLASH_8 } /* numericvalue=8.75e-01 */, + { 7, 185, 9135, 2, 4, UNI_LYDI } /* islydi */, + { 0, 9075, 0, 6, 0, UNI_grext_values_index } /* grext= */, + { 3, 8973, 4489, 6, 15, UNI_ARABICEXTB } /* block=arabicextendedb */, + { 0, 185, 4504, 2, 4, UNI_BAMU } /* isbamu */, + { 8, 9979, 4504, 4, 4, UNI_BAMU } /* scx=bamu */, + { 2, 10247, 5992, 3, 13, UNI_JG__MANICHAEANONE } /* jg=manichaeanone */, + { 0, 9647, 10301, 4, 3, UNI_AGE__3 } /* age=v30 */, + { 0, 9691, 3962, 4, 9, UNI_ARABICSUP } /* blk=arabicsup */, + { 8, 1836, 10355, 22, 3, UNI_CWL } /* changeswhenlowercased=yes */, + { 5, 8973, 6219, 7, 11, UNI_CYRILLICEXTC } /* block=cyrillicextc */, + { 0, 8973, 2123, 7, 20, UNI_CJKCOMPATFORMS } /* block=cjkcompatibilityforms */, + { 0, 8973, 5029, 6, 15, UNI_VEDICEXT } /* block=vedicextensions */, + { 4, 9476, 7781, 3, 9, UNI_NBAT } /* sc=nabataean */, + { 20, 9979, 8790, 5, 6, UNI_SHRD } /* scx=sharada */, + { 1, 9679, 0, 4, 0, UNI_AVST } /* avst */, + { 0, 3877, 8873, 17, 7, UNI_ZZZZ } /* scriptextensions=unknown */, + { 0, 9691, 2501, 4, 3, UNI_PUA } /* blk=pua */, + { 20, 9775, 0, 4, 0, UNI_GREK } /* grek */, + { 30, 9459, 1026, 5, 2, -UNI_IDSB } /* idsb=no */, + { 0, 8973, 1007, 6, 27, UNI_ANCIENTGREEKMUSIC } /* block=ancientgreekmusicalnotation */, + { 12, 10508, 7580, 8, 4, UNI_XPOSIXWORD } /* isxposixword */, + { 2, 7060, 36, 11, 1, UNI_SD } /* softdotted=t */, + { 111, 8973, 5927, 6, 13, UNI_LOWSURROGATES } /* block=lowsurrogates */, + { 0, 8973, 2433, 6, 13, UNI_GLAGOLITICSUP } /* block=glagoliticsup */, + { 4, 3877, 9033, 17, 6, UNI_CAKM } /* scriptextensions=chakma */, + { 1, 10268, 8913, 3, 3, UNI_NV__400 } /* nv=400 */, + { 2, 4074, 5096, 
16, 5, UNI_XPOSIXDIGIT } /* generalcategory=digit */, + { 1, 9979, 3935, 5, 10, UNI_SGNW } /* scx=signwriting */, + { 3, 9476, 3978, 3, 4, UNI_SC__BOPO } /* sc=bopo */, + { 0, 8537, 0, 7, 0, UNI_BENG } /* bengali */, + { 4, 4699, 26, 15, 1, UNI_ECOMP } /* emojicomponent=y */, + { 0, 7467, 10059, 3, 4, UNI_IN__10 } /* in=v100 */, + { 26, 9476, 9207, 3, 6, UNI_SC__THAA } /* sc=thaana */, + { 19, 3877, 8866, 17, 4, UNI_TIRH } /* scriptextensions=tirh */, + { 1, 185, 9284, 2, 5, UNI_BATK } /* isbatak */, + { 2, 2304, 4941, 4, 13, UNI_SARB } /* isoldsoutharabian */, + { 1, 4598, 1634, 4, 16, UNI_GEOMETRICSHAPESEXT } /* ingeometricshapesext */, + { 1, 8973, 5836, 6, 8, UNI_GREEKEXT } /* block=greekext */, + { 47, 185, 1724, 2, 23, UNI_SUPPUNCTUATION } /* issupplementalpunctuation */, + { 3, 185, 10123, 2, 4, UNI_ZZZZ } /* iszzzz */, + { 3, 4699, 10055, 15, 4, UNI_ECOMP } /* emojicomponent=true */, + { 10, 3877, 7016, 17, 11, UNI_HMNG } /* scriptextensions=pahawhhmong */, + { 2, 4074, 5014, 16, 15, UNI_UPPERCASELETTER } /* generalcategory=uppercaseletter */, + { 3, 4314, 0, 7, 0, UNI_MYMR } /* myanmar */, + { 1, 3877, 8621, 17, 7, UNI_GRAN } /* scriptextensions=grantha */, + { 0, 10268, 10127, 3, 3, UNI_NV__1_SLASH_5 } /* nv=1/5 */, + { 0, 8973, 7240, 6, 10, UNI_BOXDRAWING } /* block=boxdrawing */, + { 20, 10283, 1026, 3, 2, -UNI_SD } /* sd=no */, + { 2, 9691, 5284, 4, 14, UNI_LATINEXTB } /* blk=latinextendedb */, + { 0, 9691, 5862, 4, 6, UNI_IPAEXT } /* blk=ipaext */, + { 0, 6083, 8949, 13, 5, UNI_NV__90000 } /* numericvalue=90000 */, + { 0, 10226, 1, 3, 1, -UNI_DI } /* di=n */, + { 21, 5836, 0, 8, 0, UNI_GREEKEXT } /* greekext */, + { 0, 9476, 9999, 3, 4, UNI_SC__SHRD } /* sc=shrd */, + { 32, 2012, 1026, 22, 2, -UNI_LOE } /* logicalorderexception=no */, + { 2, 1442, 0, 24, 0, UNI_CJKSYMBOLS } /* cjksymbolsandpunctuation */, + { 1, 9691, 9099, 4, 6, UNI_KANBUN } /* blk=kanbun */, + { 0, 9763, 10394, 4, 2, UNI_GCB__XX } /* gcb=xx */, + { 0, 10560, 10084, 3, 3, UNI_VAI } 
/* isvaii */, + { 17, 1553, 729, 9, 6, UNI_N } /* category=number */, + { 8, 8973, 44, 7, 15, UNI_CJKCOMPAT } /* block=cjkcompatibility */, + { 2, 21, 5368, 2, 7, UNI_LISUSUP } /* inlisusup */, + { 1, 9763, 6279, 5, 11, UNI_WB__EB } /* gcb=glueafterzwj */, + { 1, 185, 3691, 3, 16, UNI_CYRILLICEXTC } /* iscyrillicextendedc */, + { 2, 9771, 0, 4, 0, UNI_GONM } /* gonm */, + { 1, 7467, 8148, 3, 3, UNI_IN__6 } /* in=6.0 */, + { 0, 8782, 9284, 7, 5, UNI_BATK } /* script=batak */, + { 11, 8782, 8388, 7, 8, UNI_SC__JAVA } /* script=javanese */, + { 0, 10268, 8925, 3, 4, UNI_NV__5000 } /* nv=5000 */, + { 0, 1418, 10392, 24, 2, UNI_CCC__9 } /* canonicalcombiningclass=vr */, + { 78, 2553, 0, 4, 0, UNI_TERM } /* term */, + { 24, 9763, 6287, 4, 3, UNI_LB__ZWJ } /* gcb=zwj */, + { 0, 9476, 7844, 3, 4, UNI_PALM } /* sc=palm */, + { 24, 4074, 4346, 16, 16, UNI_PO } /* generalcategory=otherpunctuation */, + { 99, 8782, 9863, 7, 4, UNI_MIAO } /* script=miao */, + { 0, 3877, 10008, 18, 3, UNI_SYRC } /* scriptextensions=syrc */, + { 1, 6083, 8147, 13, 2, UNI_NV__16 } /* numericvalue=16 */, + { 2, 9171, 1, 6, 1, -UNI__PERL_PATWS } /* patws=n */, + { 8, 9691, 8789, 4, 7, UNI_SC__SHRD } /* blk=sharada */, + { 1, 7580, 7763, 10, 9, UNI_WB__ML } /* wordbreak=midletter */, + { 22, 5536, 0, 14, 0, UNI_nfcqc_values_index } /* nfcquickcheck= */, + { 10, 8973, 8621, 6, 7, UNI_INGRANTHA } /* block=grantha */, + { 0, 10247, 6482, 3, 12, UNI_JG__MANICHAEANPE } /* jg=manichaeanpe */, + { 1, 3877, 8500, 17, 4, UNI_UGAR } /* scriptextensions=ugar */, + { 3, 10253, 10250, 3, 2, UNI_GCB__T } /* lb=jt */, + { 1, 3877, 1655, 17, 6, UNI_HANG } /* scriptextensions=hangul */, + { 0, 10217, 2533, 3, 20, UNI_BC__RLE } /* bc=righttoleftembedding */, + { 65, 8955, 1, 6, 1, -UNI_XPOSIXALPHA } /* alpha=n */, + { 4, 1418, 9422, 24, 2, UNI_CCC__91 } /* canonicalcombiningclass=91 */, + { 4, 2304, 4347, 3, 4, UNI_C } /* isother */, + { 0, 8973, 8508, 6, 8, UNI_INVITHKUQI } /* block=vithkuqi */, + { 1, 8782, 3978, 7, 
8, UNI_SC__BOPO } /* script=bopomofo */, + { 0, 6340, 44, 3, 2, UNI_CJK } /* incjk */, + { 0, 3283, 0, 17, 0, UNI_IDSB } /* idsbinaryoperator */, + { 0, 2003, 6375, 10, 11, UNI_NL } /* category=letternumber */, + { 41, 10250, 36, 3, 1, UNI_JT__T } /* jt=t */, + { 3, 2304, 8755, 3, 6, UNI_OSMA } /* isosmanya */, + { 42, 8881, 98, 3, 4, UNI_XPOSIXALPHA } /* isalpha */, + { 2, 8782, 6518, 7, 12, UNI_MEND } /* script=mendekikakui */, + { 6, 8642, 26, 7, 1, UNI_HYPHEN } /* hyphen=y */, + { 4, 4972, 4985, 3, 4, UNI_TAML } /* istamil */, + { 0, 9979, 8873, 4, 7, UNI_ZZZZ } /* scx=unknown */, + { 0, 10516, 84, 3, 2, UNI_PCM } /* ispcm */, + { 40, 2808, 8262, 4, 6, UNI_INARMENIAN } /* inarmenian */, + { 0, 9691, 7570, 4, 10, UNI_INWARANGCITI } /* blk=warangciti */, + { 3, 7370, 10355, 10, 3, UNI_XPOSIXLOWER } /* lowercase=yes */, + { 69, 6741, 10055, 11, 4, UNI_DEP } /* deprecated=true */, + { 25, 7297, 4730, 3, 14, UNI_INHANGUL } /* ishangulsyllables */, + { 4, 185, 4401, 2, 4, UNI_EMOD } /* isemod */, + { 1, 2433, 0, 20, 0, UNI_GLAGOLITICSUP } /* glagoliticsupplement */, + { 1, 1418, 8027, 24, 3, UNI_CCC__B } /* canonicalcombiningclass=220 */, + { 0, 9975, 0, 4, 0, UNI_SARB } /* sarb */, + { 0, 7360, 2468, 10, 2, UNI_LB__HL } /* linebreak=hl */, + { 1, 9214, 1, 5, 1, -UNI_IDEO } /* ideo=n */, + { 2, 9691, 3049, 4, 11, UNI_CHEROKEESUP } /* blk=cherokeesup */, + { 2, 10516, 97, 7, 5, UNI_POSIXALPHA } /* isposixalpha */, + { 1, 8973, 184, 6, 20, UNI_MISCSYMBOLS } /* block=miscellaneoussymbols */, + { 0, 3877, 1678, 17, 5, UNI_LATN } /* scriptextensions=latin */, + { 11, 185, 2085, 2, 4, UNI_MODI } /* ismodi */, + { 0, 10003, 0, 4, 0, UNI_SOGO } /* sogo */, + { 4, 3406, 36, 3, 1, UNI_CE } /* ce=t */, + { 2, 10560, 68, 3, 4, UNI_VSSUP } /* isvssup */, + { 0, 3877, 1629, 17, 4, UNI_PHAG } /* scriptextensions=phag */, + { 0, 3121, 4588, 18, 6, UNI_DT__MED } /* decompositiontype=medial */, + { 0, 9691, 6044, 4, 13, UNI_MAYANNUMERALS } /* blk=mayannumerals */, + { 2, 8973, 3050, 
7, 10, UNI_CHEROKEESUP } /* block=cherokeesup */, + { 1, 9979, 7105, 5, 3, UNI_SYLO } /* scx=sylo */, + { 2, 6083, 9402, 13, 2, UNI_NV__34 } /* numericvalue=34 */, + { 33, 4489, 0, 15, 0, UNI_ARABICEXTB } /* arabicextendedb */, + { 19, 6083, 8943, 13, 2, UNI_NV__80 } /* numericvalue=80 */, + { 8, 3877, 9651, 17, 4, UNI_AGHB } /* scriptextensions=aghb */, + { 8, 9476, 6972, 3, 11, UNI_SC__NAND } /* sc=nandinagari */, + { 1, 4074, 5578, 16, 14, UNI_MN } /* generalcategory=nonspacingmark */, + { 2, 9476, 9879, 3, 4, UNI_SC__MYMR } /* sc=mymr */, + { 0, 9711, 2473, 4, 4, UNI_CCC__L } /* ccc=left */, + { 0, 9476, 9816, 4, 3, UNI_KITS } /* sc=kits */, + { 3, 8973, 3247, 6, 18, UNI_INPUNCTUATION } /* block=generalpunctuation */, + { 0, 1418, 9675, 24, 4, UNI_WB__EB } /* canonicalcombiningclass=atbl */, + { 0, 8782, 8276, 7, 8, UNI_BALI } /* script=balinese */, + { 4, 10217, 6134, 3, 12, UNI_BC__AL } /* bc=arabicletter */, + { 0, 9449, 0, 5, 0, UNI_emod_values_index } /* emod= */, + { 29, 10283, 9454, 3, 5, -UNI_SD } /* sd=false */, + { 8, 6741, 0, 10, 0, UNI_DEP } /* deprecated */, + { 1, 7297, 8643, 3, 5, UNI_HYPHEN } /* ishyphen */, + { 0, 9476, 8810, 3, 4, UNI_SOYO } /* sc=soyo */, + { 0, 9691, 3481, 4, 18, UNI_TAIXUANJING } /* blk=taixuanjingsymbols */, + { 16, 10253, 5620, 3, 14, UNI_LB__PO } /* lb=postfixnumeric */, + { 6, 4074, 5522, 16, 14, UNI_SK } /* generalcategory=modifiersymbol */, + { 0, 10244, 728, 3, 2, UNI_MN } /* gc=mn */, + { 19, 6083, 8919, 13, 6, UNI_NV__432000 } /* numericvalue=432000 */, + { 0, 6158, 10355, 12, 3, UNI_BIDIC } /* bidicontrol=yes */, + { 11, 5536, 26, 14, 1, UNI_NFCQC__Y } /* nfcquickcheck=y */, + { 8, 9691, 79, 4, 10, UNI_ARABICMATH } /* blk=arabicmath */, + { 0, 1418, 5733, 24, 1, UNI_CCC__0 } /* canonicalcombiningclass=0 */, + { 1, 75, 0, 2, 0, UNI_ME } /* me */, + { 38, 6083, 7983, 13, 1, UNI_NV__7 } /* numericvalue=7 */, + { 3, 2056, 9454, 22, 5, -UNI__PERL_NCHAR } /* noncharactercodepoint=false */, + { 1, 9691, 43, 4, 9, 
UNI_CJKCOMPAT } /* blk=cjkcompat */, + { 6, 10229, 6001, 3, 4, UNI_DT__NONE } /* dt=none */, + { 1, 7, 0, 18, 0, UNI_CANS } /* canadianaboriginal */, + { 2, 9647, 10079, 4, 4, UNI_AGE__14 } /* age=v140 */, + { 130, 3877, 4314, 17, 7, UNI_MYMR } /* scriptextensions=myanmar */, + { 3, 10244, 1026, 3, 2, UNI_NO } /* gc=no */, + { 1, 185, 8404, 2, 8, UNI_KANAEXTB } /* iskanaextb */, + { 0, 185, 1846, 2, 2, UNI_NL } /* isnl */, + { 17, 8782, 7790, 7, 9, UNI_TALU } /* script=newtailue */, + { 54, 9711, 8046, 4, 2, UNI_CCC__13 } /* ccc=13 */, + { 6, 5875, 6455, 13, 3, UNI_JG__NYA } /* joininggroup=nya */, + { 0, 10268, 10372, 3, 2, UNI_NV__49 } /* nv=49 */, + { 8, 2304, 7828, 4, 7, UNI_ORKH } /* isoldturkic */, + { 5, 9434, 9454, 5, 5, -UNI_CWCM } /* cwcm=false */, + { 0, 9177, 1026, 6, 2, -UNI_QMARK } /* qmark=no */, + { 4, 8881, 7639, 4, 7, UNI_ARABICPFA } /* isarabicpfa */, + { 24, 4939, 0, 15, 0, UNI_SARB } /* oldsoutharabian */, + { 1, 9711, 8986, 5, 4, UNI_CCC__10 } /* ccc=ccc10 */, + { 9, 3049, 0, 8, 0, UNI_CHER } /* cherokee */, + { 0, 9476, 9237, 3, 6, UNI_SC__YEZI } /* sc=yezidi */, + { 24, 7230, 10259, 10, 3, UNI_BC__LRI } /* bidiclass=lri */, + { 6, 185, 2165, 3, 17, UNI_CYRILLICSUP } /* iscyrillicsupplement */, + { 0, 9449, 1, 5, 1, -UNI_EMOD } /* emod=n */, + { 1, 185, 4699, 2, 14, UNI_ECOMP } /* isemojicomponent */, + { 12, 9105, 0, 6, 0, UNI_KHOJ } /* khojki */, + { 0, 6314, 0, 12, 0, UNI_ideo_values_index } /* ideographic= */, + { 11, 8782, 8300, 7, 8, UNI_SC__DUPL } /* script=duployan */, + { 9, 5662, 34, 14, 2, UNI_SB__EX } /* sentencebreak=ex */, + { 6, 6083, 8091, 13, 2, UNI_NV__24 } /* numericvalue=24 */, + { 0, 5662, 6677, 15, 8, UNI_SB__SC } /* sentencebreak=scontinue */, + { 0, 185, 9847, 2, 3, UNI_LOE } /* isloe */, + { 2, 7467, 10063, 3, 4, UNI_IN__11 } /* in=v110 */, + { 3, 185, 8580, 3, 6, UNI_CJKEXTF } /* iscjkextf */, + { 0, 10247, 7177, 3, 2, UNI_JG__FE } /* jg=fe */, + { 0, 9147, 26, 6, 1, UNI__PERL_NCHAR } /* nchar=y */, + { 3, 9691, 
1514, 4, 24, UNI_HIGHPUSURROGATES } /* blk=highprivateusesurrogates */, + { 0, 3463, 0, 12, 0, UNI_SMALLKANAEXT } /* smallkanaext */, + { 0, 9476, 8831, 3, 7, UNI_SC__TGLG } /* sc=tagalog */, + { 19, 9783, 0, 4, 0, UNI_GURU } /* guru */, + { 0, 2803, 10355, 19, 3, UNI_IDST } /* idstrinaryoperator=yes */, + { 1, 9476, 7260, 3, 10, UNI_CHRS } /* sc=chorasmian */, + { 6, 3877, 8663, 17, 7, UNI_LINA } /* scriptextensions=lineara */, + { 0, 7230, 2917, 10, 19, UNI_BC__RLO } /* bidiclass=righttoleftoverride */, + { 0, 185, 4864, 2, 15, UNI_MISCPICTOGRAPHS } /* ismiscpictographs */, + { 0, 9979, 2937, 5, 3, UNI_SUND } /* scx=sund */, + { 34, 8881, 1753, 3, 2, UNI_ANY } /* isany */, + { 0, 1586, 0, 14, 0, UNI_BYZANTINEMUSIC } /* byzantinemusic */, + { 7, 7360, 1775, 10, 2, UNI_LB__AI } /* linebreak=ai */, + { 1, 118, 1932, 4, 14, UNI_INDICNUMBERFORMS } /* inindicnumberforms */, + { 1, 9647, 10063, 4, 4, UNI_AGE__11 } /* age=v110 */, + { 0, 9476, 8866, 3, 4, UNI_SC__TIRH } /* sc=tirh */, + { 0, 2164, 0, 21, 0, UNI_CYRILLICSUP } /* cyrillicsupplementary */, + { 0, 9045, 10355, 6, 3, UNI_CWKCF } /* cwkcf=yes */, + { 4, 9147, 10055, 6, 4, UNI__PERL_NCHAR } /* nchar=true */, + { 47, 8782, 2708, 7, 19, UNI_EGYP } /* script=egyptianhieroglyphs */, + { 0, 9691, 7016, 4, 11, UNI_INPAHAWHHMONG } /* blk=pahawhhmong */, + { 58, 1869, 0, 9, 0, UNI_TITLE } /* titlecase */, + { 0, 7230, 2513, 10, 20, UNI_BC__PDF } /* bidiclass=popdirectionalformat */, + { 7, 1588, 0, 1, 0, UNI_Z } /* z */, + { 3, 9711, 7220, 4, 10, UNI_CCC__BR } /* ccc=belowright */, + { 6, 10268, 8188, 3, 8, UNI_NV__2_SLASH_3 } /* nv=6.67e-01 */, + { 0, 10007, 0, 4, 0, UNI_SYRC } /* syrc */, + { 8, 9469, 7854, 3, 8, UNI_INPAUCINHAU } /* inpaucinhau */, + { 1, 5875, 5494, 13, 14, UNI_JG__MANICHAEANTETH } /* joininggroup=manichaeanteth */, + { 14, 3877, 9129, 17, 6, UNI_LYCI } /* scriptextensions=lycian */, + { 8, 9979, 8670, 4, 4, UNI_MAKA } /* scx=maka */, + { 0, 9045, 0, 6, 0, UNI_cwkcf_values_index } /* cwkcf= */, + { 
1, 9691, 5368, 4, 14, UNI_LISUSUP } /* blk=lisusupplement */, + { 33, 3877, 8740, 17, 7, UNI_OLCK } /* scriptextensions=olchiki */, + { 9, 1592, 384, 3, 31, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* inegyptianhieroglyphformatcontrols */, + { 168, 9691, 8285, 5, 7, UNI_INBASSAVAH } /* blk=bassavah */, + { 8, 9691, 5312, 4, 14, UNI_LATINEXTD } /* blk=latinextendedd */, + { 51, 8782, 9815, 7, 4, UNI_KITS } /* script=kits */, + { 29, 9439, 9454, 5, 5, -UNI_DASH } /* dash=false */, + { 0, 9763, 263, 4, 2, UNI_GCB__SM } /* gcb=sm */, + { 0, 9691, 5256, 4, 14, UNI_KANASUP } /* blk=kanasupplement */, + { 33, 6083, 8925, 13, 6, UNI_NV__500000 } /* numericvalue=500000 */, + { 0, 7908, 9454, 8, 5, -UNI_IDS } /* idstart=false */, + { 2, 9691, 3193, 4, 11, UNI_ETHIOPICSUP } /* blk=ethiopicsup */, + { 5, 6937, 2038, 6, 18, UNI_MISCTECHNICAL } /* inmiscellaneoustechnical */, + { 0, 1990, 4394, 22, 16, UNI_INSC__SYLLABLEMODIFIER } /* indicsyllabiccategory=syllablemodifier */, + { 0, 6340, 3069, 4, 16, UNI_HALFMARKS } /* incombininghalfmarks */, + { 13, 1034, 0, 11, 0, UNI_ENCLOSEDCJK } /* enclosedcjk */, + { 0, 10388, 0, 2, 0, UNI_CASEDLETTER } /* l& */, + { 1, 10268, 9623, 3, 4, UNI_NV__3_SLASH_20 } /* nv=3/20 */, + { 16, 9691, 570, 4, 30, UNI_CJKEXTC } /* blk=cjkunifiedideographsextensionc */, + { 71, 9476, 8348, 3, 8, UNI_SC__GURU } /* sc=gurmukhi */, + { 0, 9476, 8670, 3, 4, UNI_MAKA } /* sc=maka */, + { 0, 9545, 1, 4, 1, -UNI_IDC } /* idc=n */, + { 22, 8444, 26, 8, 1, UNI_RADICAL } /* radical=y */, + { 1, 7005, 0, 11, 0, UNI_SO } /* othersymbol */, + { 96, 5875, 6041, 13, 3, UNI_JG__WAW } /* joininggroup=waw */, + { 120, 9476, 2509, 3, 4, UNI_SC__MONG } /* sc=mong */, + { 35, 10229, 8332, 3, 8, UNI_DT__FRA } /* dt=fraction */, + { 64, 9476, 3049, 3, 8, UNI_CHER } /* sc=cherokee */, + { 4, 6697, 36, 11, 1, UNI_XPOSIXALPHA } /* alphabetic=t */, + { 5, 185, 11, 2, 3, UNI_DIA } /* isdia */, + { 0, 9979, 3049, 4, 8, UNI_CHER } /* scx=cherokee */, + { 3, 9691, 7656, 5, 8, 
UNI_INBHAIKSUKI } /* blk=bhaiksuki */, + { 10, 1115, 26, 26, 1, UNI_CWKCF } /* changeswhennfkccasefolded=y */, + { 0, 7370, 26, 10, 1, UNI_XPOSIXLOWER } /* lowercase=y */, + { 2, 2248, 7531, 3, 9, UNI_SUPARROWSB } /* insuparrowsb */, + { 0, 2003, 0, 10, 0, UNI_L } /* category=l */, + { 18, 3877, 8670, 17, 7, UNI_MAKA } /* scriptextensions=makasar */, + { 2, 5662, 1847, 14, 5, UNI_SB__LO } /* sentencebreak=lower */, + { 1, 185, 9099, 2, 6, UNI_KANBUN } /* iskanbun */, + { 0, 8782, 6302, 7, 4, UNI_HEBR } /* script=hebr */, + { 0, 9057, 1, 6, 1, -UNI_EMOJI } /* emoji=n */, + { 0, 1088, 1, 27, 1, -UNI_PCM } /* prependedconcatenationmark=n */, + { 0, 7560, 9454, 10, 5, -UNI_XPOSIXUPPER } /* uppercase=false */, + { 0, 185, 8284, 2, 4, UNI_BASS } /* isbass */, + { 8, 1880, 9454, 22, 5, -UNI_CWU } /* changeswhenuppercased=false */, + { 16, 9476, 7853, 3, 9, UNI_PAUC } /* sc=paucinhau */, + { 24, 1189, 9202, 3, 5, UNI_INTELUGU } /* intelugu */, + { 19, 2248, 7094, 3, 10, UNI_SUPERANDSUB } /* insuperandsub */, + { 6, 185, 3265, 2, 18, UNI_GEORGIANSUP } /* isgeorgiansupplement */, + { 0, 4106, 0, 16, 0, UNI_HALFANDFULLFORMS } /* halfandfullforms */, + { 1, 3877, 10015, 17, 4, UNI_TALE } /* scriptextensions=tale */, + { 5, 9476, 4504, 3, 5, UNI_BAMU } /* sc=bamum */, + { 0, 4847, 4331, 3, 15, UNI_MYANMAREXTB } /* inmyanmarextendedb */, + { 0, 9979, 9959, 4, 4, UNI_RJNG } /* scx=rjng */, + { 0, 1553, 17, 10, 1, UNI_SO } /* category=so */, + { 2, 8973, 3445, 6, 18, UNI_RUMI } /* block=ruminumeralsymbols */, + { 4, 4074, 728, 16, 2, UNI_MN } /* generalcategory=mn */, + { 2, 1418, 9350, 25, 4, UNI_CCC__24 } /* canonicalcombiningclass=ccc24 */, + { 3, 10346, 3528, 3, 7, UNI_VO__R } /* vo=rotated */, + { 2, 3877, 9093, 17, 6, UNI_KTHI } /* scriptextensions=kaithi */, + { 0, 4157, 2249, 3, 20, UNI_PRTI } /* isinscriptionalparthian */, + { 7, 7580, 126, 10, 2, UNI_LB__CR } /* wordbreak=cr */, + { 0, 10352, 1195, 3, 2, UNI_LB__LF } /* wb=lf */, + { 0, 185, 1067, 2, 2, UNI_CASEDLETTER } 
/* islc */, + { 0, 10217, 427, 3, 2, UNI_BC__ES } /* bc=es */, + { 0, 185, 9895, 2, 3, UNI_NKO } /* isnko */, + { 1, 5875, 2247, 13, 3, UNI_JG__AIN } /* joininggroup=ain */, + { 9, 9691, 4654, 4, 15, UNI_DIACRITICALSEXT } /* blk=diacriticalsext */, + { 6, 9979, 4426, 4, 6, UNI_TANG } /* scx=tangut */, + { 2, 9691, 6230, 4, 12, UNI_ETHIOPICEXTA } /* blk=ethiopicexta */, + { 1, 6752, 0, 11, 0, UNI_DOMINO } /* dominotiles */, + { 39, 185, 6338, 2, 11, UNI_JOINC } /* isjoincontrol */, + { 0, 3409, 0, 18, 0, UNI_ri_values_index } /* regionalindicator= */, + { 9, 5662, 10394, 14, 2, UNI_SB__XX } /* sentencebreak=xx */, + { 2, 4744, 1167, 15, 16, UNI_IDENTIFIERTYPE__DEFAULTIGNORABLE } /* identifiertype=defaultignorable */, + { 0, 4847, 2086, 3, 3, UNI_INMODI } /* inmodi */, + { 1, 9474, 4969, 5, 15, UNI_INSC__REGISTERSHIFTER } /* insc=registershifter */, + { 0, 10508, 5096, 3, 5, UNI_XPOSIXXDIGIT } /* isxdigit */, + { 0, 1418, 9225, 24, 6, UNI_CCC__9 } /* canonicalcombiningclass=virama */, + { 0, 2304, 126, 3, 2, UNI_OCR } /* isocr */, + { 9, 9476, 9081, 3, 6, UNI_HATR } /* sc=hatran */, + { 2, 185, 7745, 2, 9, UNI_LATINEXTF } /* islatinextf */, + { 0, 9190, 26, 5, 1, UNI_TERM } /* term=y */, + { 10, 8712, 10355, 7, 3, UNI_DT__NONE } /* nfkdqc=yes */, + { 1, 9476, 720, 3, 9, UNI_XSUX } /* sc=cuneiform */, + { 1, 8782, 9655, 7, 4, UNI_AHOM } /* script=ahom */, + { 0, 6083, 7972, 13, 8, UNI_NV__1_SLASH_64 } /* numericvalue=1.56e-02 */, + { 34, 185, 4170, 2, 9, UNI_LATIN1 } /* islatin1sup */, + { 6, 9213, 1026, 6, 2, -UNI_UIDEO } /* uideo=no */, + { 2, 3175, 36, 18, 1, UNI_EPRES } /* emojipresentation=t */, + { 2, 9711, 9671, 4, 4, UNI_CCC__216 } /* ccc=atar */, + { 25, 7700, 6304, 4, 4, UNI_INHEBREW } /* inhebrew */, + { 4, 3157, 0, 18, 0, UNI_ebase_values_index } /* emojimodifierbase= */, + { 16, 9449, 1026, 5, 2, -UNI_EMOD } /* emod=no */, + { 0, 1418, 9400, 25, 4, UNI_CCC__34 } /* canonicalcombiningclass=ccc34 */, + { 3, 43, 0, 3, 0, UNI_CJK } /* cjk */, + { 3, 6362, 0, 
12, 0, UNI_KHMERSYMBOLS } /* khmersymbols */, + { 3, 8881, 2354, 3, 19, UNI_HLUW } /* isanatolianhieroglyphs */, + { 0, 3877, 9081, 17, 4, UNI_HATR } /* scriptextensions=hatr */, + { 1, 407, 0, 7, 0, UNI_XPOSIXCNTRL } /* control */, + { 0, 21, 1219, 2, 26, UNI_KATAKANAEXT } /* inkatakanaphoneticextensions */, + { 1, 1418, 7947, 24, 2, UNI_CCC__21 } /* canonicalcombiningclass=21 */, + { 8, 7467, 10337, 3, 3, UNI_IN__7 } /* in=v70 */, + { 16, 10268, 9611, 3, 4, UNI_NV__15_SLASH_2 } /* nv=15/2 */, + { 0, 1088, 0, 27, 0, UNI_pcm_values_index } /* prependedconcatenationmark= */, + { 1, 8782, 8537, 7, 4, UNI_SC__BENG } /* script=beng */, + { 0, 3877, 9679, 17, 4, UNI_AVST } /* scriptextensions=avst */, + { 0, 4074, 32, 16, 2, UNI__PERL_SURROGATE } /* generalcategory=cs */, + { 0, 9219, 10055, 6, 4, UNI_XPOSIXUPPER } /* upper=true */, + { 0, 21, 5256, 2, 7, UNI_KANASUP } /* inkanasup */, + { 0, 5875, 3843, 13, 17, UNI_JG__MANICHAEANHUNDRED } /* joininggroup=manichaeanhundred */, + { 1, 9476, 1220, 4, 7, UNI_SC__KANA } /* sc=katakana */, + { 4, 10535, 3403, 5, 5, UNI_XPOSIXBLANK } /* horizspace */, + { 0, 6083, 8931, 13, 6, UNI_NV__600000 } /* numericvalue=600000 */, + { 1, 185, 2034, 2, 22, UNI_MISCTECHNICAL } /* ismiscellaneoustechnical */, + { 2, 1553, 4346, 9, 5, UNI_C } /* category=other */, + { 2, 8782, 7016, 7, 11, UNI_HMNG } /* script=pahawhhmong */, + { 8, 4074, 1060, 16, 2, UNI_SO } /* generalcategory=so */, + { 69, 2248, 1296, 3, 24, UNI_SUPERANDSUB } /* insuperscriptsandsubscripts */, + { 1, 8973, 7655, 6, 9, UNI_INBHAIKSUKI } /* block=bhaiksuki */, + { 0, 9691, 9069, 4, 6, UNI_INGOTHIC } /* blk=gothic */, + { 0, 9711, 9307, 4, 2, UNI_CCC__15 } /* ccc=15 */, + { 33, 3391, 36, 18, 1, UNI__PERL_PATWS } /* patternwhitespace=t */, + { 0, 9219, 26, 6, 1, UNI_XPOSIXUPPER } /* upper=y */, + { 0, 1190, 5797, 3, 7, UNI_XPOSIXDIGIT } /* nt=decimal */, + { 6, 3877, 9135, 17, 4, UNI_LYDI } /* scriptextensions=lydi */, + { 9, 8782, 7310, 7, 10, UNI_DIAK } /* 
script=divesakuru */, + { 0, 3877, 7501, 18, 9, UNI_SAUR } /* scriptextensions=saurashtra */, + { 1, 8782, 7709, 7, 9, UNI_SC__SIND } /* script=khudawadi */, + { 6, 185, 6862, 2, 11, UNI_KATAKANAEXT } /* iskatakanaext */, + { 0, 10268, 7950, 3, 2, UNI_NV__43 } /* nv=43 */, + { 0, 6674, 10355, 12, 3, UNI_XIDC } /* xidcontinue=yes */, + { 81, 185, 3707, 2, 17, UNI_ETHIOPICEXTA } /* isethiopicextendeda */, + { 27, 2164, 0, 8, 0, UNI_CYRL } /* cyrillic */, + { 2, 185, 3175, 2, 17, UNI_EPRES } /* isemojipresentation */, + { 3, 7230, 10262, 10, 3, UNI_BC__LRO } /* bidiclass=lro */, + { 0, 3624, 0, 4, 0, UNI_UCAS } /* ucas */, + { 0, 9979, 9231, 4, 6, UNI_WCHO } /* scx=wancho */, + { 18, 3877, 2248, 17, 21, UNI_PRTI } /* scriptextensions=inscriptionalparthian */, + { 0, 9476, 7570, 3, 4, UNI_WARA } /* sc=wara */, + { 0, 9735, 1, 4, 1, -UNI_CWU } /* cwu=n */, + { 2, 4847, 0, 17, 0, UNI_INMEROITICCURSIVE } /* inmeroiticcursive */, + { 29, 4598, 3267, 4, 16, UNI_GEORGIANSUP } /* ingeorgiansupplement */, + { 64, 8973, 3978, 6, 16, UNI_BOPOMOFOEXT } /* block=bopomofoextended */, + { 0, 5875, 9995, 13, 4, UNI_JG__SHIN } /* joininggroup=shin */, + { 0, 10247, 5504, 3, 4, UNI_JG__TETH } /* jg=teth */, + { 10, 1088, 1026, 27, 2, -UNI_PCM } /* prependedconcatenationmark=no */, + { 1, 8782, 10095, 7, 4, UNI_XPEO } /* script=xpeo */, + { 1, 9691, 2860, 4, 19, UNI_MODIFIERTONELETTERS } /* blk=modifiertoneletters */, + { 0, 3157, 1026, 18, 2, -UNI_EBASE } /* emojimodifierbase=no */, + { 3, 7230, 5186, 10, 14, UNI_BC__EN } /* bidiclass=europeannumber */, + { 3, 9476, 8621, 3, 4, UNI_SC__GRAN } /* sc=gran */, + { 0, 7580, 73, 10, 2, UNI_WB__LE } /* wordbreak=le */, + { 0, 4157, 3284, 3, 3, UNI_IDSB } /* isidsb */, + { 7, 185, 8372, 2, 8, UNI_JAMOEXTA } /* isjamoexta */, + { 0, 10346, 3517, 3, 18, UNI_VO__TR } /* vo=transformedrotated */, + { 17, 10229, 10286, 3, 3, UNI_DT__SML } /* dt=sml */, + { 2, 3707, 0, 11, 0, UNI_ETHIOPICEXT } /* ethiopicext */, + { 6, 9051, 0, 6, 0, 
UNI_ecomp_values_index } /* ecomp= */, + { 2, 9691, 3103, 4, 18, UNI_COPTICEPACTNUMBERS } /* blk=copticepactnumbers */, + { 1, 3121, 1254, 18, 7, UNI_DT__INIT } /* decompositiontype=initial */, + { 0, 10560, 5031, 4, 6, UNI_VEDICEXT } /* isvedicext */, + { 32, 2993, 0, 19, 0, UNI_SUPARROWSC } /* supplementalarrowsc */, + { 26, 9979, 7570, 4, 4, UNI_WARA } /* scx=wara */, + { 0, 3877, 6362, 17, 5, UNI_KHMR } /* scriptextensions=khmer */, + { 4, 720, 0, 9, 0, UNI_XSUX } /* cuneiform */, + { 1, 3121, 2304, 18, 3, UNI_DT__ISO } /* decompositiontype=iso */, + { 0, 2803, 0, 18, 0, UNI_IDST } /* idstrinaryoperator */, + { 0, 185, 3373, 2, 18, UNI_ZP } /* isparagraphseparator */, + { 0, 185, 839, 2, 29, UNI_MISCARROWS } /* ismiscellaneoussymbolsandarrows */, + { 29, 8973, 4170, 6, 16, UNI_LATIN1 } /* block=latin1supplement */, + { 21, 185, 7093, 2, 11, UNI_SUPERANDSUB } /* issuperandsub */, + { 1, 9711, 9225, 4, 6, UNI_CCC__9 } /* ccc=virama */, + { 3, 8782, 8388, 7, 4, UNI_SC__JAVA } /* script=java */, + { 0, 8572, 0, 7, 0, UNI_CJKEXTE } /* cjkexte */, + { 0, 9476, 3265, 3, 4, UNI_SC__GEOR } /* sc=geor */, + { 5, 3877, 7501, 18, 3, UNI_SAUR } /* scriptextensions=saur */, + { 19, 8782, 9907, 7, 4, UNI_OLCK } /* script=olck */, + { 10, 7370, 1026, 10, 2, -UNI_XPOSIXLOWER } /* lowercase=no */, + { 8, 9979, 9851, 4, 4, UNI_MEDF } /* scx=medf */, + { 0, 1506, 5217, 5, 11, UNI_INGREEK } /* ingreekandcoptic */, + { 0, 4984, 0, 15, 0, UNI_TAMILSUP } /* tamilsupplement */, + { 1, 10268, 8937, 3, 6, UNI_NV__700000 } /* nv=700000 */, + { 30, 185, 3809, 2, 17, UNI_LETTERLIKESYMBOLS } /* isletterlikesymbols */, + { 1, 2206, 5669, 21, 2, UNI_WB__EB } /* graphemeclusterbreak=eb */, + { 0, 9691, 8380, 4, 8, UNI_JAMOEXTB } /* blk=jamoextb */, + { 0, 8973, 3193, 6, 8, UNI_INETHIOPIC } /* block=ethiopic */, + { 0, 3877, 9831, 17, 3, UNI_LAO } /* scriptextensions=lao */, + { 0, 185, 1925, 3, 5, UNI_ZYYY } /* iscommon */, + { 50, 7908, 0, 7, 0, UNI_IDS } /* idstart */, + { 1, 3121, 3463, 18, 
5, UNI_DT__SML } /* decompositiontype=small */, + { 1, 7230, 3337, 10, 18, UNI_BC__LRI } /* bidiclass=lefttorightisolate */, + { 0, 2248, 7105, 3, 10, UNI_INSYLOTINAGRI } /* insylotinagri */, + { 0, 185, 9843, 2, 4, UNI_LINB } /* islinb */, + { 0, 1274, 36, 21, 1, UNI_CE } /* compositionexclusion=t */, + { 0, 4847, 1596, 3, 13, UNI_MUSIC } /* inmusicalsymbols */, + { 5, 9791, 0, 4, 0, UNI_HLUW } /* hluw */, + { 0, 10253, 34, 3, 2, UNI_LB__EX } /* lb=ex */, + { 1, 9647, 8156, 4, 3, UNI_AGE__6_DOT_2 } /* age=6.2 */, + { 27, 6083, 8907, 13, 5, UNI_NV__30000 } /* numericvalue=30000 */, + { 2, 9691, 1678, 4, 23, UNI_LATINEXTADDITIONAL } /* blk=latinextendedadditional */, + { 1, 6083, 10214, 13, 3, UNI_NV__9_SLASH_2 } /* numericvalue=9/2 */, + { 0, 1553, 1934, 9, 2, UNI_CN } /* category=cn */, + { 0, 8973, 5131, 7, 13, UNI_CJKCOMPATFORMS } /* block=cjkcompatforms */, + { 2, 3877, 7310, 17, 10, UNI_DIAK } /* scriptextensions=divesakuru */, + { 16, 9979, 9791, 4, 4, UNI_HLUW } /* scx=hluw */, + { 6, 3877, 9237, 17, 4, UNI_YEZI } /* scriptextensions=yezi */, + { 2, 6083, 9571, 13, 4, UNI_NV__1_SLASH_40 } /* numericvalue=1/40 */, + { 16, 9979, 5634, 4, 14, UNI_PHLP } /* scx=psalterpahlavi */, + { 0, 9476, 2632, 3, 6, UNI_BRAH } /* sc=brahmi */, + { 105, 6083, 8949, 13, 3, UNI_NV__900 } /* numericvalue=900 */, + { 22, 185, 1088, 2, 26, UNI_PCM } /* isprependedconcatenationmark */, + { 0, 7160, 5275, 3, 9, UNI_YIRADICALS } /* isyiradicals */, + { 1, 9476, 8873, 3, 7, UNI_ZZZZ } /* sc=unknown */, + { 1, 10244, 1466, 3, 13, UNI_M } /* gc=combiningmark */, + { 0, 4865, 728, 4, 2, UNI_CPMN } /* iscpmn */, + { 87, 9691, 7420, 4, 10, UNI_INOLDPERSIAN } /* blk=oldpersian */, + { 1, 9711, 5733, 4, 1, UNI_CCC__0 } /* ccc=0 */, + { 0, 9743, 1026, 4, 2, -UNI_DEP } /* dep=no */, + { 8, 4074, 1588, 16, 1, UNI_Z } /* generalcategory=z */, + { 0, 3121, 8726, 18, 7, UNI_DT__NB } /* decompositiontype=nobreak */, + { 3, 8973, 9519, 6, 5, UNI_INOSAGE } /* block=osage */, + { 1, 8973, 6057, 6, 
13, UNI_MISCTECHNICAL } /* block=misctechnical */, + { 1, 8316, 1, 8, 1, -UNI_EXTPICT } /* extpict=n */, + { 4, 10035, 0, 4, 0, UNI_TGLG } /* tglg */, + { 0, 2808, 4476, 4, 13, UNI_ARABICEXTA } /* inarabicextendeda */, + { 1, 7467, 8119, 3, 1, UNI_IN__9 } /* in=9 */, + { 0, 185, 8649, 2, 7, UNI_KNDA } /* iskannada */, + { 4, 3409, 36, 18, 1, UNI_RI } /* regionalindicator=t */, + { 4, 7467, 8046, 3, 2, UNI_IN__13 } /* in=13 */, + { 8, 1007, 0, 27, 0, UNI_ANCIENTGREEKMUSIC } /* ancientgreekmusicalnotation */, + { 2, 9476, 9679, 3, 4, UNI_AVST } /* sc=avst */, + { 4, 185, 10396, 2, 2, UNI_ZL } /* iszl */, + { 0, 5875, 7880, 13, 9, UNI_JG__SYRIACWAW } /* joininggroup=syriacwaw */, + { 34, 8973, 2165, 7, 20, UNI_CYRILLICSUP } /* block=cyrillicsupplementary */, + { 15, 9911, 0, 4, 0, UNI_ORKH } /* orkh */, + { 1, 9549, 9454, 5, 5, -UNI_XIDS } /* xids=false */, + { 2, 8967, 9454, 6, 5, -UNI_BIDIM } /* bidim=false */, + { 5, 8973, 8388, 6, 8, UNI_INJAVANESE } /* block=javanese */, + { 0, 9476, 10051, 3, 4, UNI_TOTO } /* sc=toto */, + { 16, 185, 9183, 2, 6, UNI_RJNG } /* isrejang */, + { 0, 9484, 0, 5, 0, UNI_LIMB } /* limbu */, + { 2, 9979, 10047, 4, 4, UNI_TNSA } /* scx=tnsa */, + { 0, 9711, 9410, 5, 4, UNI_CCC__36 } /* ccc=ccc36 */, + { 0, 9691, 8838, 4, 7, UNI_INTAITHAM } /* blk=taitham */, + { 1, 8782, 9755, 7, 4, UNI_DSRT } /* script=dsrt */, + { 48, 5408, 0, 12, 0, UNI_INMANICHAEAN } /* inmanichaean */, + { 7, 8768, 1026, 7, 2, -UNI_PATSYN } /* patsyn=no */, + { 0, 8782, 9939, 7, 4, UNI_MIAO } /* script=plrd */, + { 0, 3877, 8635, 17, 7, UNI_HANO } /* scriptextensions=hanunoo */, + { 0, 185, 9075, 2, 5, UNI_GREXT } /* isgrext */, + { 1, 4972, 2556, 5, 16, UNI_TERM } /* isterminalpunctuation */, + { 2, 9424, 0, 5, 0, UNI_XPOSIXCNTRL } /* cntrl */, + { 34, 10268, 5732, 3, 11, UNI_NV__10000000000 } /* nv=10000000000 */, + { 2, 3553, 36, 18, 1, UNI_VS } /* variationselector=t */, + { 0, 9691, 7835, 4, 9, UNI_INOLDUYGHUR } /* blk=olduyghur */, + { 0, 1418, 9307, 24, 2, 
UNI_CCC__15 } /* canonicalcombiningclass=15 */, + { 21, 8782, 8754, 7, 7, UNI_OSMA } /* script=osmanya */, + { 14, 3283, 26, 18, 1, UNI_IDSB } /* idsbinaryoperator=y */, + { 4, 9763, 5581, 4, 11, UNI_GCB__SM } /* gcb=spacingmark */, + { 0, 8782, 2453, 7, 20, UNI_PHLI } /* script=inscriptionalpahlavi */, + { 0, 1538, 9, 24, 2, UNI_INPC__NA } /* indicpositionalcategory=na */, + { 0, 3553, 1, 18, 1, -UNI_VS } /* variationselector=n */, + { 39, 9476, 8276, 3, 8, UNI_BALI } /* sc=balinese */, + { 8, 185, 1678, 2, 23, UNI_LATINEXTADDITIONAL } /* islatinextendedadditional */, + { 20, 8782, 7700, 7, 9, UNI_SC__QAAI } /* script=inherited */, + { 132, 3403, 36, 6, 1, UNI_XPOSIXSPACE } /* space=t */, + { 2, 2003, 5915, 10, 12, UNI_ZL } /* category=lineseparator */, + { 137, 9691, 9534, 4, 5, UNI_INTAKRI } /* blk=takri */, + { 0, 185, 8607, 2, 7, UNI_ELBA } /* iselbasan */, + { 0, 185, 6626, 2, 12, UNI_PLAYINGCARDS } /* isplayingcards */, + { 0, 2003, 36, 10, 1, UNI_TITLE } /* category=lt */, + { 0, 9691, 3622, 4, 17, UNI_INCAUCASIANALBANIAN } /* blk=caucasianalbanian */, + { 1, 10253, 9764, 3, 2, UNI_LB__CB } /* lb=cb */, + { 0, 8782, 2632, 7, 4, UNI_BRAH } /* script=brah */, + { 0, 185, 6494, 2, 12, UNI_GONM } /* ismasaramgondi */, + { 0, 3398, 0, 11, 0, UNI_wspace_values_index } /* whitespace= */, + { 0, 7218, 4505, 3, 7, UNI_BAMUMSUP } /* inbamumsup */, + { 9, 185, 4090, 2, 16, UNI_GEORGIANEXT } /* isgeorgianextended */, + { 0, 10268, 8212, 3, 8, UNI_NV__4_SLASH_5 } /* nv=8.00e-01 */, + { 0, 1724, 0, 23, 0, UNI_SUPPUNCTUATION } /* supplementalpunctuation */, + { 1, 9979, 8600, 4, 7, UNI_DSRT } /* scx=deseret */, + { 3, 10244, 6994, 3, 11, UNI_NO } /* gc=othernumber */, + { 1, 9476, 9971, 3, 4, UNI_SAMR } /* sc=samr */, + { 0, 5875, 6018, 13, 13, UNI_JG__MANICHAEANTEN } /* joininggroup=manichaeanten */, + { 0, 8866, 0, 7, 0, UNI_TIRH } /* tirhuta */, + { 4, 9461, 1847, 3, 5, UNI_SB__LO } /* sb=lower */, + { 0, 10352, 5669, 3, 2, UNI_WB__EB } /* wb=eb */, + { 88, 1592, 6243, 
3, 11, UNI_ETHIOPICEXTB } /* inethiopicextb */, + { 2, 8782, 9787, 7, 4, UNI_SC__HANO } /* script=hano */, + { 1, 7682, 10055, 9, 4, UNI_EXT } /* extender=true */, + { 112, 8973, 3607, 8, 15, UNI_UCAS } /* block=canadiansyllabics */, + { 1, 21, 9265, 3, 4, UNI_INADLAM } /* inadlam */, + { 2, 8973, 79, 6, 6, UNI_INARABIC } /* block=arabic */, + { 0, 4074, 6983, 16, 11, UNI_LO } /* generalcategory=otherletter */, + { 0, 9979, 9887, 4, 4, UNI_NBAT } /* scx=nbat */, + { 77, 185, 1061, 3, 5, UNI_COPT } /* iscoptic */, + { 1, 2304, 7837, 4, 7, UNI_OUGR } /* isolduyghur */, + { 20, 8782, 9931, 7, 4, UNI_SC__PHLP } /* script=phlp */, + { 1, 9476, 9201, 3, 6, UNI_SC__TELU } /* sc=telugu */, + { 0, 8973, 1724, 6, 23, UNI_SUPPUNCTUATION } /* block=supplementalpunctuation */, + { 0, 10268, 10364, 3, 2, UNI_NV__45 } /* nv=45 */, + { 2, 6340, 8573, 3, 6, UNI_CJKEXTE } /* incjkexte */, + { 1, 6083, 8124, 13, 8, UNI_NV__1_SLASH_20 } /* numericvalue=5.00e-02 */, + { 0, 8782, 4504, 7, 5, UNI_BAMU } /* script=bamum */, + { 1, 2311, 0, 4, 0, UNI_SINH } /* sinh */, + { 0, 10247, 342, 3, 2, UNI_JG__PE } /* jg=pe */, + { 20, 8782, 9484, 7, 5, UNI_SC__LIMB } /* script=limbu */, + { 1, 185, 2584, 2, 4, UNI_MAND } /* ismand */, + { 33, 1418, 2479, 24, 5, UNI_CCC__R } /* canonicalcombiningclass=right */, + { 9, 8782, 2312, 8, 3, UNI_SC__SINH } /* script=sinh */, + { 1, 9947, 0, 4, 0, UNI_COPT } /* qaac */, + { 0, 9979, 4042, 4, 7, UNI_CPRT } /* scx=cypriot */, + { 0, 750, 0, 21, 0, UNI_ENCLOSEDALPHANUM } /* enclosedalphanumerics */, + { 0, 9691, 4426, 4, 6, UNI_INTANGUT } /* blk=tangut */, + { 1, 8775, 0, 7, 0, UNI_PHAG } /* phagspa */, + { 0, 2206, 5581, 21, 11, UNI_GCB__SM } /* graphemeclusterbreak=spacingmark */, + { 98, 3877, 9117, 17, 6, UNI_LEPC } /* scriptextensions=lepcha */, + { 3, 6083, 9575, 13, 3, UNI_NV__1_SLASH_6 } /* numericvalue=1/6 */, + { 0, 8973, 6230, 6, 12, UNI_ETHIOPICEXTA } /* block=ethiopicexta */, + { 1, 4074, 9424, 16, 5, UNI_XPOSIXCNTRL } /* generalcategory=cntrl 
*/, + { 2, 10250, 6840, 3, 11, UNI_JT__C } /* jt=joincausing */, + { 7, 9469, 2579, 5, 6, UNI_INPC__BOTTOM } /* inpc=bottom */, + { 0, 4426, 0, 4, 0, UNI_TANG } /* tang */, + { 0, 9739, 0, 4, 0, UNI_CYRL } /* cyrl */, + { 0, 6340, 1903, 3, 21, UNI_CJKCOMPATIDEOGRAPHSSUP } /* incjkcompatideographssup */, + { 13, 8782, 4186, 7, 7, UNI_SC__LINB } /* script=linearb */, + { 51, 9269, 36, 5, 1, UNI_POSIXXDIGIT } /* ahex=t */, + { 8, 10223, 26, 3, 1, UNI_CI } /* ci=y */, + { 23, 7230, 3229, 10, 18, UNI_BC__FSI } /* bidiclass=firststrongisolate */, + { 4, 9213, 10355, 6, 3, UNI_UIDEO } /* uideo=yes */, + { 4, 5888, 0, 13, 0, UNI_KANAEXTA } /* kanaextendeda */, + { 1, 1418, 185, 24, 2, UNI_CCC__IS } /* canonicalcombiningclass=is */, + { 131, 1418, 10166, 24, 3, UNI_CCC__DB } /* canonicalcombiningclass=233 */, + { 0, 9691, 9033, 4, 6, UNI_INCHAKMA } /* blk=chakma */, + { 0, 9691, 468, 4, 11, UNI_INPUNCTUATION } /* blk=punctuation */, + { 0, 7580, 1846, 10, 2, UNI_WB__NL } /* wordbreak=nl */, + { 0, 3775, 0, 17, 0, UNI_INDICSIYAQNUMBERS } /* indicsiyaqnumbers */, + { 7, 9189, 26, 6, 1, UNI_STERM } /* sterm=y */, + { 0, 10253, 1846, 3, 2, UNI_LB__NL } /* lb=nl */, + { 5, 9979, 5940, 4, 9, UNI_MLYM } /* scx=malayalam */, + { 2, 9087, 10055, 6, 4, UNI_JOINC } /* joinc=true */, + { 0, 7071, 0, 11, 0, UNI_SORA } /* sorasompeng */, + { 3, 9927, 0, 4, 0, UNI_pcm_values_index } /* pcm= */, + { 17, 8973, 9891, 6, 4, UNI_INNEWA } /* block=newa */, + { 1, 9979, 6593, 4, 4, UNI_HUNG } /* scx=hung */, + { 2, 8973, 8380, 6, 8, UNI_JAMOEXTB } /* block=jamoextb */, + { 32, 8961, 10055, 6, 4, UNI_BIDIC } /* bidic=true */, + { 4, 5662, 139, 14, 2, UNI_SB__FO } /* sentencebreak=fo */, + { 1, 3877, 2841, 17, 19, UNI_MERO } /* scriptextensions=meroitichieroglyphs */, + { 1, 10553, 7434, 3, 6, UNI_SOGD } /* issogdian */, + { 10, 9711, 9387, 4, 2, UNI_CCC__31 } /* ccc=31 */, + { 10, 3877, 9819, 17, 4, UNI_KNDA } /* scriptextensions=knda */, + { 49, 7460, 10319, 10, 3, UNI_IN__5_DOT_1 } /* 
presentin=v51 */, + { 1, 7370, 3, 10, 1, -UNI_XPOSIXLOWER } /* lowercase=f */, + { 1, 10268, 8091, 3, 2, UNI_NV__24 } /* nv=24 */, + { 1, 3877, 9827, 17, 4, UNI_LANA } /* scriptextensions=lana */, + { 1, 2727, 0, 19, 0, UNI_ENCLOSEDALPHANUMSUP } /* enclosedalphanumsup */, + { 1, 6083, 10153, 13, 2, UNI_NV__42 } /* numericvalue=42 */, + { 6, 2304, 2899, 3, 18, UNI_OTTOMANSIYAQNUMBERS } /* isottomansiyaqnumbers */, + { 0, 7060, 3, 11, 1, -UNI_SD } /* softdotted=f */, + { 33, 10247, 2661, 3, 9, UNI_JG__YEHBARREE } /* jg=yehbarree */, + { 4, 5875, 4266, 13, 16, UNI_JG__MANICHAEANTWENTY } /* joininggroup=manichaeantwenty */, + { 0, 7104, 0, 4, 0, UNI_SYLO } /* sylo */, + { 0, 8702, 1036, 4, 25, UNI_ENCLOSEDCJK } /* inenclosedcjklettersandmonths */, + { 0, 185, 1034, 2, 27, UNI_ENCLOSEDCJK } /* isenclosedcjklettersandmonths */, + { 1, 6158, 9454, 12, 5, -UNI_BIDIC } /* bidicontrol=false */, + { 0, 2553, 1026, 20, 2, -UNI_TERM } /* terminalpunctuation=no */, + { 1, 1418, 1220, 24, 3, UNI_CCC__214 } /* canonicalcombiningclass=ata */, + { 0, 5408, 8422, 4, 6, UNI_INMAHAJANI } /* inmahajani */, + { 0, 2085, 0, 14, 0, UNI_LM } /* modifierletter */, + { 1, 9476, 8657, 4, 6, UNI_SC__KALI } /* sc=kayahli */, + { 2, 3877, 2453, 17, 20, UNI_PHLI } /* scriptextensions=inscriptionalpahlavi */, + { 70, 10253, 5669, 3, 2, UNI_EBASE } /* lb=eb */, + { 2, 9979, 9207, 4, 6, UNI_THAA } /* scx=thaana */, + { 74, 9476, 2841, 3, 4, UNI_MERO } /* sc=mero */, + { 1, 3398, 36, 11, 1, UNI_XPOSIXSPACE } /* whitespace=t */, + { 8, 9691, 1220, 5, 4, UNI_INBATAK } /* blk=batak */, + { 0, 9207, 0, 4, 0, UNI_THAA } /* thaa */, + { 0, 3877, 6290, 17, 12, UNI_GONG } /* scriptextensions=gunjalagondi */, + { 0, 4684, 7628, 15, 9, UNI_EA__A } /* eastasianwidth=ambiguous */, + { 0, 185, 4186, 2, 7, UNI_LINB } /* islinearb */, + { 1, 10247, 5228, 3, 14, UNI_JG__HAMZAONHEHGOAL } /* jg=hamzaonhehgoal */, + { 0, 9835, 0, 4, 0, UNI_LATN } /* latn */, + { 2, 4909, 1026, 15, 2, UNI_NFKDQC__N } /* nfkdquickcheck=no 
*/, + { 4, 8782, 8873, 7, 7, UNI_ZZZZ } /* script=unknown */, + { 0, 8973, 8677, 6, 7, UNI_INMANDAIC } /* block=mandaic */, + { 0, 7300, 36, 10, 1, UNI_DIA } /* diacritic=t */, + { 1, 185, 2078, 2, 22, UNI_MODIFIERLETTERS } /* isspacingmodifierletters */, + { 9, 9711, 3588, 4, 17, UNI_WB__EB } /* ccc=attachedbelowleft */, + { 1, 1595, 0, 14, 0, UNI_MUSIC } /* musicalsymbols */, + { 3, 1418, 9310, 25, 4, UNI_CCC__16 } /* canonicalcombiningclass=ccc16 */, + { 17, 10217, 24, 3, 1, UNI_BC__L } /* bc=l */, + { 0, 7467, 10322, 3, 3, UNI_IN__5_DOT_2 } /* in=v52 */, + { 132, 8642, 0, 6, 0, UNI_HYPHEN } /* hyphen */, + { 137, 185, 5758, 2, 5, UNI_BIDIM } /* isbidim */, + { 4, 9711, 7975, 4, 1, UNI_CCC__6 } /* ccc=6 */, + { 0, 185, 9811, 2, 4, UNI_KHMR } /* iskhmr */, + { 2, 4699, 1026, 15, 2, -UNI_ECOMP } /* emojicomponent=no */, + { 200, 4074, 49, 16, 1, UNI_P } /* generalcategory=p */, + { 0, 6697, 10355, 11, 3, UNI_XPOSIXALPHA } /* alphabetic=yes */, + { 0, 3877, 2632, 17, 4, UNI_BRAH } /* scriptextensions=brah */, + { 6, 8782, 10115, 7, 4, UNI_SC__QAAI } /* script=zinh */, + { 1, 6529, 6591, 3, 11, UNI_INOLDHUNGARIAN } /* inoldhungarian */, + { 0, 9189, 1026, 6, 2, -UNI_STERM } /* sterm=no */, + { 0, 3877, 9907, 17, 4, UNI_OLCK } /* scriptextensions=olck */, + { 50, 10253, 8642, 3, 6, UNI_LB__HY } /* lb=hyphen */, + { 107, 7580, 2468, 10, 2, UNI_LB__HL } /* wordbreak=hl */, + { 1, 6340, 8559, 3, 6, UNI_CJKEXTC } /* incjkextc */, + { 0, 10516, 25, 3, 1, UNI_PS } /* isps */, + { 2, 8973, 9081, 6, 6, UNI_INHATRAN } /* block=hatran */, + { 0, 9474, 2670, 5, 19, UNI_INSC__CONSONANTHEADLETTER } /* insc=consonantheadletter */, + { 26, 3877, 9687, 17, 4, UNI_BHKS } /* scriptextensions=bhks */, + { 0, 1990, 8880, 22, 7, UNI_INSC__VISARGA } /* indicsyllabiccategory=visarga */, + { 32, 7580, 8308, 10, 8, UNI_WB__EB } /* wordbreak=ebasegaz */, + { 0, 6083, 8028, 13, 4, UNI_NV__2000 } /* numericvalue=2000 */, + { 8, 185, 7240, 2, 10, UNI_BOXDRAWING } /* isboxdrawing */, + { 15, 
8973, 1935, 6, 11, UNI_NUMBERFORMS } /* block=numberforms */, + { 0, 9979, 7105, 5, 10, UNI_SYLO } /* scx=sylotinagri */, + { 5, 5581, 0, 11, 0, UNI_MC } /* spacingmark */, + { 1, 2248, 5691, 3, 13, UNI_SUPPUNCTUATION } /* insuppunctuation */, + { 0, 4074, 6374, 16, 12, UNI_NL } /* generalcategory=letternumber */, + { 67, 9545, 0, 4, 0, UNI_idc_values_index } /* idc= */, + { 1, 3121, 750, 18, 3, UNI_DT__ENC } /* decompositiontype=enc */, + { 0, 185, 541, 3, 29, UNI_CJKEXTB } /* iscjkunifiedideographsextensionb */, + { 1, 2012, 3, 22, 1, -UNI_LOE } /* logicalorderexception=f */, + { 0, 10268, 8100, 3, 8, UNI_NV__5_SLASH_12 } /* nv=4.17e-01 */, + { 2, 7360, 7664, 10, 9, UNI_LB__B2 } /* linebreak=breakboth */, + { 24, 10268, 7996, 3, 8, UNI_NV__1_SLASH_5 } /* nv=2.00e-01 */, + { 1, 3406, 3, 3, 1, -UNI_CE } /* ce=f */, + { 11, 10268, 9639, 3, 4, UNI_NV__7_SLASH_12 } /* nv=7/12 */, + { 1, 9469, 910, 3, 9, UNI_PUA } /* inprivateuse */, + { 177, 1418, 8046, 24, 2, UNI_CCC__13 } /* canonicalcombiningclass=13 */, + { 0, 3877, 2493, 17, 20, UNI_HMNP } /* scriptextensions=nyiakengpuachuehmong */, + { 36, 9476, 8663, 3, 7, UNI_SC__LINA } /* sc=lineara */, + { 0, 6158, 0, 5, 0, UNI_BIDIC } /* bidic */, + { 0, 9979, 9514, 4, 5, UNI_ORYA } /* scx=oriya */, + { 1, 9214, 0, 5, 0, UNI_ideo_values_index } /* ideo= */, + { 3, 5875, 6266, 13, 12, UNI_JG__FINALSEMKATH } /* joininggroup=finalsemkath */, + { 7, 185, 7790, 2, 9, UNI_TALU } /* isnewtailue */, + { 32, 79, 0, 4, 0, UNI_ARAB } /* arab */, + { 0, 3403, 1, 6, 1, -UNI_XPOSIXSPACE } /* space=n */, + { 10, 3877, 79, 17, 4, UNI_ARAB } /* scriptextensions=arab */, + { 2, 7060, 0, 11, 0, UNI_sd_values_index } /* softdotted= */, + { 169, 1747, 0, 13, 0, UNI_ZNAMENNYMUSIC } /* znamennymusic */, + { 3, 7360, 10384, 10, 2, UNI_GCB__V } /* linebreak=jv */, + { 3, 6083, 8148, 13, 8, UNI_NV__3_SLASH_5 } /* numericvalue=6.00e-01 */, + { 3, 7709, 0, 9, 0, UNI_SIND } /* khudawadi */, + { 0, 4074, 113, 16, 2, UNI_SC } /* generalcategory=sc */, + 
{ 1, 10268, 8132, 3, 8, UNI_NV__11_SLASH_2 } /* nv=5.50e+00 */, + { 0, 10346, 3535, 3, 18, UNI_VO__TU } /* vo=transformedupright */, + { 5, 10268, 10193, 3, 3, UNI_NV__5_SLASH_6 } /* nv=5/6 */, + { 14, 9153, 10355, 6, 3, UNI_NFCQC__Y } /* nfcqc=yes */, + { 4, 5875, 5564, 13, 14, UNI_JG__NOJOININGGROUP } /* joininggroup=nojoininggroup */, + { 0, 10268, 5732, 3, 3, UNI_NV__100 } /* nv=100 */, + { 16, 9476, 3622, 3, 17, UNI_AGHB } /* sc=caucasianalbanian */, + { 0, 9691, 8300, 4, 8, UNI_INDUPLOYAN } /* blk=duployan */, + { 32, 9476, 9911, 3, 4, UNI_ORKH } /* sc=orkh */, + { 3, 3076, 0, 9, 0, UNI_HALFMARKS } /* halfmarks */, + { 1, 9476, 10087, 3, 4, UNI_WCHO } /* sc=wcho */, + { 88, 6083, 8028, 13, 6, UNI_NV__200000 } /* numericvalue=200000 */, + { 66, 8782, 5059, 7, 15, UNI_ZANB } /* script=zanabazarsquare */, + { 0, 9461, 752, 3, 5, UNI_SB__CL } /* sb=close */, + { 6, 8973, 4504, 6, 5, UNI_INBAMUM } /* block=bamum */, + { 2, 9747, 1, 4, 1, -UNI_DIA } /* dia=n */, + { 42, 4684, 0, 15, 0, UNI_ea_values_index } /* eastasianwidth= */, + { 52, 185, 6242, 2, 12, UNI_ETHIOPICEXTB } /* isethiopicextb */, + { 1, 7460, 7996, 10, 3, UNI_IN__2 } /* presentin=2.0 */, + { 33, 10229, 46, 3, 3, UNI_DT__COM } /* dt=com */, + { 58, 3406, 0, 3, 0, UNI_ce_values_index } /* ce= */, + { 42, 8292, 0, 8, 0, UNI_BUGI } /* buginese */, + { 1, 9545, 10055, 4, 4, UNI_IDC } /* idc=true */, + { 35, 9979, 9903, 4, 4, UNI_OGAM } /* scx=ogam */, + { 0, 8782, 2227, 7, 4, UNI_SC__HAN } /* script=hani */, + { 0, 185, 48, 2, 1, UNI_M } /* ism */, + { 6, 7580, 6302, 10, 12, UNI_LB__HL } /* wordbreak=hebrewletter */, + { 0, 2312, 4109, 5, 13, UNI_HALFANDFULLFORMS } /* inhalfandfullforms */, + { 6, 8782, 8600, 7, 7, UNI_DSRT } /* script=deseret */, + { 0, 8973, 909, 6, 10, UNI_PUA } /* block=privateuse */, + { 0, 5758, 0, 13, 0, UNI_bidim_values_index } /* bidimirrored= */, + { 0, 10268, 9615, 3, 4, UNI_NV__17_SLASH_2 } /* nv=17/2 */, + { 5, 9711, 3031, 4, 13, UNI_CCC__214 } /* ccc=attachedabove */, + { 
0, 3877, 7, 17, 18, UNI_CANS } /* scriptextensions=canadianaboriginal */, + { 0, 185, 7390, 2, 10, UNI_MISCARROWS } /* ismiscarrows */, + { 0, 9711, 10166, 4, 3, UNI_CCC__DB } /* ccc=233 */, + { 26, 10268, 9571, 3, 4, UNI_NV__1_SLASH_40 } /* nv=1/40 */, + { 1, 9691, 3673, 4, 17, UNI_CYRILLICEXTB } /* blk=cyrillicextendedb */, + { 3, 10253, 9920, 3, 2, UNI_LB__SG } /* lb=sg */, + { 7, 7300, 9454, 10, 5, -UNI_DIA } /* diacritic=false */, + { 64, 10268, 8925, 3, 3, UNI_NV__500 } /* nv=500 */, + { 2, 9979, 9871, 4, 4, UNI_MRO } /* scx=mroo */, + { 8, 8973, 5256, 6, 14, UNI_KANASUP } /* block=kanasupplement */, + { 4, 4972, 8469, 3, 3, UNI_TAGB } /* istagb */, + { 0, 9476, 7844, 3, 9, UNI_PALM } /* sc=palmyrene */, + { 4, 9691, 3911, 4, 17, UNI_SMALLFORMS } /* blk=smallformvariants */, + { 0, 8973, 8396, 6, 8, UNI_KANAEXTA } /* block=kanaexta */, + { 0, 6083, 7988, 13, 8, UNI_NV__3_SLASH_16 } /* numericvalue=1.88e-01 */, + { 1, 9691, 1394, 4, 24, UNI_ARABICPFB } /* blk=arabicpresentationformsb */, + { 20, 9927, 10355, 4, 3, UNI_PCM } /* pcm=yes */, + { 1, 9723, 0, 4, 0, UNI_CPRT } /* cprt */, + { 4, 8782, 10123, 7, 4, UNI_ZZZZ } /* script=zzzz */, + { 0, 9979, 1223, 4, 4, UNI_KANA } /* scx=kana */, + { 1, 10247, 6018, 3, 13, UNI_JG__MANICHAEANTEN } /* jg=manichaeanten */, + { 17, 8973, 6362, 6, 5, UNI_INKHMER } /* block=khmer */, + { 2, 9695, 1, 4, 1, UNI_BPT__N } /* bpt=n */, + { 0, 7467, 7995, 3, 4, UNI_IN__12 } /* in=12.0 */, + { 2, 1924, 0, 6, 0, UNI_ZYYY } /* common */, + { 0, 9691, 8558, 4, 7, UNI_CJKEXTC } /* blk=cjkextc */, + { 2, 8782, 8284, 7, 8, UNI_BASS } /* script=bassavah */, + { 3, 4074, 4774, 16, 15, UNI_LOWERCASELETTER } /* generalcategory=lowercaseletter */, + { 2, 8782, 3049, 7, 4, UNI_CHER } /* script=cher */, + { 0, 21, 8656, 2, 7, UNI_KALI } /* inkayahli */, + { 5, 10268, 8148, 3, 8, UNI_NV__3_SLASH_5 } /* nv=6.00e-01 */, + { 0, 7727, 0, 9, 0, UNI_LATINEXTC } /* latinextc */, + { 0, 8887, 9454, 7, 5, -UNI_XPOSIXSPACE } /* wspace=false */, + { 0, 
10547, 48, 5, 1, UNI_PERM } /* isperm */, + { 2, 4744, 8436, 15, 8, UNI_IDENTIFIERTYPE__OBSOLETE } /* identifiertype=obsolete */, + { 0, 10247, 8460, 3, 8, UNI_JG__SWASHKAF } /* jg=swashkaf */, + { 1, 8973, 2144, 7, 20, UNI_CJKRADICALSSUP } /* block=cjkradicalssupplement */, + { 8, 185, 4043, 3, 6, UNI_CPRT } /* iscypriot */, + { 88, 4954, 0, 15, 0, UNI_PS } /* openpunctuation */, + { 0, 8973, 2227, 6, 14, UNI_INHANIFIROHINGYA } /* block=hanifirohingya */, + { 106, 7360, 10374, 10, 2, UNI_LB__B2 } /* linebreak=b2 */, + { 1, 9476, 8356, 3, 8, UNI_SC__HIRA } /* sc=hiragana */, + { 0, 1990, 4564, 22, 15, UNI_INSC__CONSONANTKILLER } /* indicsyllabiccategory=consonantkiller */, + { 206, 3877, 8260, 17, 8, UNI_ARMN } /* scriptextensions=armenian */, + { 0, 3877, 9899, 17, 4, UNI_NSHU } /* scriptextensions=nshu */, + { 0, 9159, 0, 6, 0, UNI_nfdqc_values_index } /* nfdqc= */, + { 0, 1418, 8920, 24, 2, UNI_CCC__32 } /* canonicalcombiningclass=32 */, + { 1, 6340, 2144, 3, 13, UNI_CJKRADICALSSUP } /* incjkradicalssup */, + { 0, 4714, 36, 15, 1, UNI_GREXT } /* graphemeextend=t */, + { 0, 185, 5354, 2, 14, UNI_LATINEXTG } /* islatinextendedg */, + { 0, 7460, 9607, 10, 4, UNI_IN__14 } /* presentin=14.0 */, + { 0, 3398, 1, 11, 1, -UNI_XPOSIXSPACE } /* whitespace=n */, + { 0, 3877, 8276, 17, 8, UNI_BALI } /* scriptextensions=balinese */, + { 0, 9476, 2708, 3, 19, UNI_EGYP } /* sc=egyptianhieroglyphs */, + { 32, 3945, 9454, 17, 5, -UNI_UIDEO } /* unifiedideograph=false */, + { 3, 1418, 9018, 24, 3, UNI_CCC__130 } /* canonicalcombiningclass=130 */, + { 4, 9476, 10047, 3, 4, UNI_TNSA } /* sc=tnsa */, + { 1, 21, 3319, 2, 9, UNI_LATINEXTA } /* inlatinexta */, + { 7, 10280, 1026, 3, 2, -UNI_RI } /* ri=no */, + { 0, 8973, 10011, 6, 4, UNI_TAGS } /* block=tags */, + { 0, 4684, 67, 15, 1, UNI_EA__H } /* eastasianwidth=h */, + { 0, 9063, 3, 6, 1, -UNI_EPRES } /* epres=f */, + { 16, 9117, 0, 6, 0, UNI_LEPC } /* lepcha */, + { 64, 9087, 1026, 6, 2, -UNI_JOINC } /* joinc=no */, + { 4, 2784, 
7889, 19, 9, UNI_GCB__V } /* hangulsyllabletype=voweljamo */, + { 0, 8782, 9093, 7, 6, UNI_SC__KTHI } /* script=kaithi */, + { 11, 8782, 10083, 7, 4, UNI_VAI } /* script=vaii */, + { 2, 9979, 720, 4, 9, UNI_XSUX } /* scx=cuneiform */, + { 3, 2078, 0, 22, 0, UNI_MODIFIERLETTERS } /* spacingmodifierletters */, + { 0, 9476, 10119, 3, 4, UNI_SC__ZYYY } /* sc=zyyy */, + { 2, 9807, 0, 4, 0, UNI_KALI } /* kali */, + { 8, 9691, 6362, 4, 12, UNI_KHMERSYMBOLS } /* blk=khmersymbols */, + { 24, 185, 5581, 2, 11, UNI_MC } /* isspacingmark */, + { 1, 8649, 0, 7, 0, UNI_KNDA } /* kannada */, + { 4, 185, 4282, 2, 16, UNI_MISCMATHSYMBOLSA } /* ismiscmathsymbolsa */, + { 0, 10400, 0, 2, 0, UNI_ZS } /* zs */, + { 2, 9979, 9895, 4, 3, UNI_NKO } /* scx=nko */, + { 0, 7580, 6785, 10, 11, UNI_WB__DQ } /* wordbreak=doublequote */, + { 3, 8782, 58, 7, 2, UNI_SC__YI } /* script=yi */, + { 2, 6697, 3, 11, 1, -UNI_XPOSIXALPHA } /* alphabetic=f */, + { 0, 8881, 5746, 3, 12, UNI_AEGEANNUMBERS } /* isaegeannumbers */, + { 8, 8300, 0, 4, 0, UNI_DUPL } /* dupl */, + { 0, 4154, 68, 3, 4, UNI_VSSUP } /* invssup */, + { 9, 7460, 10199, 10, 3, UNI_IN__6_DOT_1 } /* presentin=6.1 */, + { 0, 8404, 0, 8, 0, UNI_KANAEXTB } /* kanaextb */, + { 0, 5093, 3, 9, 1, -UNI_XPOSIXXDIGIT } /* hexdigit=f */, + { 0, 9979, 9504, 4, 5, UNI_NSHU } /* scx=nushu */, + { 0, 9476, 10083, 3, 3, UNI_VAI } /* sc=vai */, + { 1, 4426, 0, 6, 0, UNI_TANG } /* tangut */, + { 0, 6340, 6731, 3, 10, UNI_INCYPROMINOAN } /* incyprominoan */, + { 4, 1852, 9454, 6, 5, -UNI_CASED } /* cased=false */, + { 1, 6340, 1443, 3, 23, UNI_CJKSYMBOLS } /* incjksymbolsandpunctuation */, + { 0, 185, 3122, 2, 5, UNI_ECOMP } /* isecomp */, + { 2, 9647, 7975, 4, 1, UNI_AGE__6 } /* age=6 */, + { 8, 9815, 0, 4, 0, UNI_KITS } /* kits */, + { 1, 9979, 8621, 4, 7, UNI_GRAN } /* scx=grantha */, + { 24, 3877, 2227, 17, 4, UNI_HAN } /* scriptextensions=hani */, + { 17, 10268, 8102, 3, 2, UNI_NV__17 } /* nv=17 */, + { 3, 8782, 10043, 7, 4, UNI_TIBT } /* 
script=tibt */, + { 12, 9691, 2034, 4, 22, UNI_MISCTECHNICAL } /* blk=miscellaneoustechnical */, + { 0, 21, 5270, 2, 6, UNI_KANGXI } /* inkangxi */, + { 0, 8973, 3691, 7, 16, UNI_CYRILLICEXTC } /* block=cyrillicextendedc */, + { 0, 185, 9177, 2, 5, UNI_QMARK } /* isqmark */, + { 0, 8881, 8262, 4, 6, UNI_ARMN } /* isarmenian */, + { 0, 10244, 6374, 3, 12, UNI_NL } /* gc=letternumber */, + { 2, 5550, 0, 14, 0, UNI_nfdqc_values_index } /* nfdquickcheck= */, + { 4, 10510, 7580, 6, 4, UNI_XPOSIXWORD } /* xposixword */, + { 0, 7580, 74, 10, 2, UNI_WB__EB } /* wordbreak=em */, + { 1, 185, 9751, 2, 4, UNI_DIAK } /* isdiak */, + { 179, 6083, 8180, 13, 8, UNI_NV__13_SLASH_2 } /* numericvalue=6.50e+00 */, + { 1, 185, 4774, 2, 15, UNI_LOWERCASELETTER } /* islowercaseletter */, + { 4, 9459, 26, 5, 1, UNI_IDSB } /* idsb=y */, + { 3, 6928, 0, 11, 0, UNI_MEDF } /* medefaidrin */, + { 7, 10268, 8027, 3, 2, UNI_NV__22 } /* nv=22 */, + { 0, 9803, 6873, 4, 11, UNI_GCB__L } /* hst=leadingjamo */, + { 0, 6340, 3674, 3, 16, UNI_CYRILLICEXTB } /* incyrillicextendedb */, + { 1, 2936, 0, 9, 0, UNI_SUND } /* sundanese */, + { 33, 4157, 5863, 3, 5, UNI_IPAEXT } /* isipaext */, + { 0, 7297, 8636, 3, 6, UNI_HANO } /* ishanunoo */, + { 18, 3409, 0, 17, 0, UNI_RI } /* regionalindicator */, + { 82, 7297, 5094, 3, 7, UNI_XPOSIXXDIGIT } /* ishexdigit */, + { 8, 3877, 2937, 18, 3, UNI_SUND } /* scriptextensions=sund */, + { 117, 8881, 3572, 3, 16, UNI_ALCHEMICAL } /* isalchemicalsymbols */, + { 240, 185, 383, 2, 32, UNI_EGYPTIANHIEROGLYPHFORMATCONTROLS } /* isegyptianhieroglyphformatcontrols */, + { 25, 9803, 36, 4, 1, UNI_GCB__T } /* hst=t */, + { 0, 7460, 8100, 10, 3, UNI_IN__4_DOT_1 } /* presentin=4.1 */, + { 68, 7430, 0, 10, 0, UNI_SOGO } /* oldsogdian */, + { 1, 8782, 9779, 7, 4, UNI_SC__GUJR } /* script=gujr */, + { 58, 8628, 0, 6, 0, UNI_GRBASE } /* grbase */, + { 1, 1418, 8251, 24, 2, UNI_CCC__19 } /* canonicalcombiningclass=19 */, + { 0, 21, 1008, 3, 16, UNI_ANCIENTGREEKMUSIC } /* 
inancientgreekmusic */, + { 104, 9691, 7500, 4, 10, UNI_INSAURASHTRA } /* blk=saurashtra */, + { 4, 6972, 0, 11, 0, UNI_NAND } /* nandinagari */, + { 1, 9847, 1, 4, 1, -UNI_LOE } /* loe=n */, + { 1, 1946, 0, 22, 0, UNI_DIACRITICALSFORSYMBOLS } /* diacriticalsforsymbols */, + { 0, 10247, 2247, 3, 3, UNI_JG__AIN } /* jg=ain */, + { 0, 2613, 0, 19, 0, UNI_ANCIENTGREEKNUMBERS } /* ancientgreeknumbers */, + { 2, 7467, 7611, 3, 1, UNI_IN__5 } /* in=5 */, + { 0, 9129, 0, 6, 0, UNI_LYCI } /* lycian */, + { 4, 3877, 4426, 17, 6, UNI_TANG } /* scriptextensions=tangut */, + { 16, 2206, 126, 21, 2, UNI_LB__CR } /* graphemeclusterbreak=cr */, + { 1, 8973, 8300, 6, 8, UNI_INDUPLOYAN } /* block=duployan */, + { 1, 5875, 757, 13, 3, UNI_JG__DAL } /* joininggroup=dal */, + { 2, 952, 0, 18, 0, UNI_INVS } /* variationselectors */, + { 0, 185, 3911, 2, 17, UNI_SMALLFORMS } /* issmallformvariants */, + { 0, 21, 6362, 2, 5, UNI_INKHMER } /* inkhmer */, + { 7, 8973, 2898, 6, 19, UNI_OTTOMANSIYAQNUMBERS } /* block=ottomansiyaqnumbers */, + { 0, 5875, 7148, 13, 11, UNI_JG__YEHWITHTAIL } /* joininggroup=yehwithtail */, + { 36, 1190, 5096, 3, 5, UNI_NT__DI } /* nt=digit */, + { 12, 185, 115, 3, 24, UNI_DIACRITICALS } /* iscombiningdiacriticalmarks */, + { 0, 2304, 9920, 3, 3, UNI_OSGE } /* isosge */, + { 0, 8973, 219, 7, 32, UNI_DIACRITICALSEXT } /* block=combiningdiacriticalmarksextended */, + { 1, 9691, 114, 4, 25, UNI_DIACRITICALS } /* blk=combiningdiacriticalmarks */, + { 0, 8881, 5089, 3, 4, UNI_ASCII } /* isascii */, + { 1, 1270, 26, 25, 1, UNI_COMPEX } /* fullcompositionexclusion=y */, + { 1, 513, 0, 16, 0, UNI_UIDEO } /* unifiedideograph */, + { 0, 9476, 9703, 3, 4, UNI_SC__CAKM } /* sc=cakm */, + { 1, 10510, 10523, 6, 5, UNI_XPOSIXBLANK } /* xposixblank */, + { 4, 8782, 9514, 7, 5, UNI_SC__ORYA } /* script=oriya */, + { 3, 9691, 10051, 4, 4, UNI_INTOTO } /* blk=toto */, + { 0, 9429, 1026, 5, 2, -UNI_CWCF } /* cwcf=no */, + { 1, 568, 0, 2, 0, UNI_NB } /* nb */, + { 2, 9979, 10039, 4, 
4, UNI_THAI } /* scx=thai */, + { 0, 4157, 6, 3, 2, UNI_IDC } /* isidc */, + { 0, 9979, 8300, 4, 4, UNI_DUPL } /* scx=dupl */, + { 0, 9691, 2143, 4, 21, UNI_CJKRADICALSSUP } /* blk=cjkradicalssupplement */, + { 5, 10229, 3525, 3, 3, UNI_DT__MED } /* dt=med */, + { 0, 7060, 26, 11, 1, UNI_SD } /* softdotted=y */, + { 4, 9691, 4984, 4, 8, UNI_TAMILSUP } /* blk=tamilsup */, + { 0, 7907, 0, 4, 0, UNI_XIDS } /* xids */, + { 1, 1553, 1923, 9, 2, UNI_PC } /* category=pc */, + { 7, 1418, 9000, 24, 3, UNI_CCC__118 } /* canonicalcombiningclass=118 */, + { 0, 3877, 9655, 17, 4, UNI_AHOM } /* scriptextensions=ahom */, + { 1, 9859, 0, 4, 0, UNI_MERC } /* merc */, + { 0, 7370, 0, 10, 0, UNI_lower_values_index } /* lowercase= */, + { 0, 10229, 1295, 3, 5, UNI_DT__SUP } /* dt=super */, + { 1, 3391, 3, 18, 1, -UNI__PERL_PATWS } /* patternwhitespace=f */, + { 0, 8973, 4426, 6, 6, UNI_INTANGUT } /* block=tangut */, + { 65, 9057, 0, 6, 0, UNI_emoji_values_index } /* emoji= */, + { 0, 113, 0, 2, 0, UNI_SC } /* sc */, + { 16, 5875, 6422, 13, 12, UNI_JG__MALAYALAMNGA } /* joininggroup=malayalamnga */, + { 0, 8955, 10055, 6, 4, UNI_XPOSIXALPHA } /* alpha=true */, + { 0, 9534, 0, 4, 0, UNI_TAKR } /* takr */, + { 1, 185, 6362, 2, 12, UNI_KHMERSYMBOLS } /* iskhmersymbols */, + { 1, 2304, 9916, 3, 3, UNI_ORYA } /* isorya */, + { 9, 10253, 7590, 3, 10, UNI_LB__WJ } /* lb=wordjoiner */, + { 0, 8973, 7190, 6, 10, UNI_ARABICEXTA } /* block=arabicexta */, + { 11, 9711, 10142, 4, 3, UNI_CCC__202 } /* ccc=202 */, + { 8, 810, 0, 29, 0, UNI_ENCLOSEDIDEOGRAPHICSUP } /* enclosedideographicsupplement */, + { 0, 7580, 4346, 10, 5, UNI_WB__XX } /* wordbreak=other */, + { 4, 185, 7655, 2, 9, UNI_BHKS } /* isbhaiksuki */, + { 8, 9691, 10011, 4, 4, UNI_TAGS } /* blk=tags */, + { 1, 185, 2879, 2, 12, UNI_MONGOLIANSUP } /* ismongoliansup */, + { 2, 9461, 496, 3, 7, UNI_SB__NU } /* sb=numeric */, + { 131, 9691, 0, 4, 42, UNI_UCASEXT } /* blk=unifiedcanadianaboriginalsyllabicsextended */, + { 3, 6083, 10193, 13, 
3, UNI_NV__5_SLASH_6 } /* numericvalue=5/6 */, + { 8, 8973, 3265, 6, 8, UNI_INGEORGIAN } /* block=georgian */, + { 0, 8600, 0, 7, 0, UNI_DSRT } /* deseret */, + { 50, 8973, 2746, 6, 10, UNI_JAMO } /* block=hanguljamo */, + { 0, 185, 1632, 2, 18, UNI_GEOMETRICSHAPESEXT } /* isgeometricshapesext */, + { 0, 6675, 36, 11, 1, UNI_IDC } /* idcontinue=t */, + { 3, 8782, 1538, 8, 3, UNI_SC__SIND } /* script=sind */, + { 91, 9927, 26, 4, 1, UNI_PCM } /* pcm=y */, + { 0, 9691, 2078, 4, 22, UNI_MODIFIERLETTERS } /* blk=spacingmodifierletters */, + { 0, 8782, 8866, 7, 7, UNI_SC__TIRH } /* script=tirhuta */, + { 4, 4187, 1971, 5, 19, UNI_EARLYDYNASTICCUNEIFORM } /* inearlydynasticcuneiform */, + { 1, 185, 10523, 2, 5, UNI_XPOSIXBLANK } /* isblank */, + { 0, 7360, 5144, 10, 14, UNI_LB__SA } /* linebreak=complexcontext */, + { 7, 3877, 4411, 18, 5, UNI_SYRC } /* scriptextensions=syriac */, + { 16, 1538, 1948, 4, 20, UNI_DIACRITICALSFORSYMBOLS } /* indiacriticalsforsymbols */, + { 0, 8973, 1968, 6, 22, UNI_EARLYDYNASTICCUNEIFORM } /* block=earlydynasticcuneiform */, + { 1, 8356, 0, 4, 0, UNI_HIRA } /* hira */, + { 26, 9691, 3979, 5, 10, UNI_BOPOMOFOEXT } /* blk=bopomofoext */, + { 15, 5045, 1130, 3, 3, UNI_UCAS } /* isucas */, + { 1, 9077, 36, 4, 1, UNI_EXT } /* ext=t */, + { 0, 1190, 0, 3, 0, UNI_nt_values_index } /* nt= */, + { 0, 1678, 0, 9, 0, UNI_LATINEXTE } /* latinexte */, + { 2, 1189, 4985, 3, 14, UNI_TAMILSUP } /* intamilsupplement */, + { 126, 8691, 0, 4, 0, UNI_MULT } /* mult */, + { 0, 9691, 415, 4, 32, UNI_INIDC } /* blk=ideographicdescriptioncharacters */, + { 16, 114, 0, 35, 0, UNI_DIACRITICALSFORSYMBOLS } /* combiningdiacriticalmarksforsymbols */, + { 4, 9171, 26, 6, 1, UNI__PERL_PATWS } /* patws=y */, + { 0, 8973, 6590, 6, 12, UNI_INOLDHUNGARIAN } /* block=oldhungarian */, + { 0, 8782, 494, 7, 3, UNI_SC__HAN } /* script=han */, + { 0, 3121, 6530, 18, 8, UNI_DT__NONCANON } /* decompositiontype=noncanon */, + { 1, 8782, 4984, 7, 5, UNI_SC__TAML } /* script=tamil */, 
+ { 3, 185, 2433, 2, 20, UNI_GLAGOLITICSUP } /* isglagoliticsupplement */, + { 0, 10352, 6302, 3, 12, UNI_LB__HL } /* wb=hebrewletter */, + { 2, 6218, 0, 12, 0, UNI_CYRILLICEXTC } /* cyrillicextc */, + { 0, 9519, 0, 5, 0, UNI_OSGE } /* osage */, + { 0, 6083, 8251, 13, 2, UNI_NV__19 } /* numericvalue=19 */, + { 0, 8782, 8468, 7, 8, UNI_SC__TAGB } /* script=tagbanwa */, + { 1, 10268, 4175, 3, 1, UNI_NV__1 } /* nv=1 */, + { 0, 9979, 8476, 4, 8, UNI_TFNG } /* scx=tifinagh */, + { 0, 10247, 5, 3, 1, UNI_JG__E } /* jg=e */, + { 32, 4186, 0, 16, 0, UNI_LINEARBIDEOGRAMS } /* linearbideograms */, + { 4, 5045, 514, 3, 15, UNI_UIDEO } /* isunifiedideograph */, + { 96, 4714, 1, 15, 1, -UNI_GREXT } /* graphemeextend=n */, + { 2, 9735, 10055, 4, 4, UNI_CWU } /* cwu=true */, + { 0, 9476, 8789, 3, 7, UNI_SC__SHRD } /* sc=sharada */, + { 1, 3175, 10355, 18, 3, UNI_EPRES } /* emojipresentation=yes */, + { 3, 3877, 8979, 17, 4, UNI_CARI } /* scriptextensions=cari */, + { 0, 9476, 9651, 3, 4, UNI_AGHB } /* sc=aghb */, + { 15, 7530, 0, 10, 0, UNI_SUPARROWSB } /* suparrowsb */, + { 4, 9731, 36, 4, 1, UNI_CWT } /* cwt=t */, + { 0, 185, 1747, 2, 13, UNI_ZNAMENNYMUSIC } /* isznamennymusic */, + { 0, 9476, 9859, 3, 4, UNI_MERC } /* sc=merc */, + { 0, 1418, 9402, 24, 2, UNI_CCC__34 } /* canonicalcombiningclass=34 */, + { 0, 9461, 73, 3, 2, UNI_SB__LE } /* sb=le */, + { 33, 3978, 0, 11, 0, UNI_BOPOMOFOEXT } /* bopomofoext */, + { 100, 2206, 8308, 21, 8, UNI_WB__EB } /* graphemeclusterbreak=ebasegaz */, + { 2, 5662, 7, 15, 1, UNI_SB__SC } /* sentencebreak=sc */, + { 0, 8973, 7754, 6, 9, UNI_LATINEXTG } /* block=latinextg */, + { 0, 8973, 3481, 6, 18, UNI_TAIXUANJING } /* block=taixuanjingsymbols */, + { 272, 9711, 10172, 4, 3, UNI_CCC__IS } /* ccc=240 */, + { 2, 1189, 8832, 3, 6, UNI_INTAGALOG } /* intagalog */, + { 1, 4847, 4315, 3, 6, UNI_INMYANMAR } /* inmyanmar */, + { 0, 9219, 1026, 6, 2, -UNI_XPOSIXUPPER } /* upper=no */, + { 1, 8593, 36, 7, 1, UNI_COMPEX } /* compex=t */, + { 0, 9979, 
9863, 4, 4, UNI_MIAO } /* scx=miao */, + { 57, 4074, 24, 16, 1, UNI_L } /* generalcategory=l */, + { 0, 8973, 7210, 6, 10, UNI_ASCII } /* block=basiclatin */, + { 34, 9691, 8803, 4, 7, UNI_INSIDDHAM } /* blk=siddham */, + { 5, 6741, 1026, 11, 2, -UNI_DEP } /* deprecated=no */, + { 1, 3049, 0, 4, 0, UNI_CHER } /* cher */, + { 0, 9647, 10334, 4, 3, UNI_AGE__6_DOT_3 } /* age=v63 */, + { 1, 8973, 1678, 6, 23, UNI_LATINEXTADDITIONAL } /* block=latinextendedadditional */, + { 9, 8782, 3193, 7, 8, UNI_ETHI } /* script=ethiopic */, + { 0, 1592, 3194, 3, 10, UNI_ETHIOPICSUP } /* inethiopicsup */, + { 0, 10268, 8913, 3, 5, UNI_NV__40000 } /* nv=40000 */, + { 32, 1553, 7005, 9, 11, UNI_SO } /* category=othersymbol */, + { 0, 9979, 4411, 5, 5, UNI_SYRC } /* scx=syriac */, + { 3, 1562, 0, 24, 0, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* supsymbolsandpictographs */, + { 12, 9429, 10055, 5, 4, UNI_CWCF } /* cwcf=true */, + { 28, 8635, 0, 7, 0, UNI_HANO } /* hanunoo */, + { 5, 3877, 9787, 17, 4, UNI_HANO } /* scriptextensions=hano */, + { 0, 8782, 10015, 7, 4, UNI_SC__TALE } /* script=tale */, + { 0, 10530, 8861, 4, 5, UNI_INTIBETAN } /* intibetan */, + { 5, 9461, 139, 3, 2, UNI_SB__FO } /* sb=fo */, + { 0, 10268, 8252, 3, 8, UNI_NV__11_SLASH_12 } /* nv=9.17e-01 */, + { 0, 185, 6506, 2, 12, UNI_MATHALPHANUM } /* ismathalphanum */, + { 1, 8973, 9237, 6, 6, UNI_INYEZIDI } /* block=yezidi */, + { 1, 9476, 8796, 3, 7, UNI_SHAW } /* sc=shavian */, + { 0, 8881, 7553, 3, 7, UNI_ASSIGNED } /* isassigned */, + { 1, 5875, 3, 15, 1, UNI_JG__KAF } /* joininggroup=kaf */, + { 22, 3877, 7105, 18, 3, UNI_SYLO } /* scriptextensions=sylo */, + { 0, 3877, 8804, 18, 3, UNI_SIDD } /* scriptextensions=sidd */, + { 6, 7391, 1018, 4, 2, UNI_CAKM } /* iscakm */, + { 1, 10510, 97, 6, 5, UNI_XPOSIXALPHA } /* xposixalpha */, + { 141, 3877, 9105, 17, 6, UNI_KHOJ } /* scriptextensions=khojki */, + { 0, 6083, 8220, 13, 8, UNI_NV__5_SLASH_6 } /* numericvalue=8.33e-01 */, + { 1, 6083, 1250, 13, 3, UNI_NV__NAN } /* 
numericvalue=nan */, + { 1, 1418, 4968, 24, 2, UNI_CCC__0 } /* canonicalcombiningclass=nr */, + { 4, 8973, 7430, 6, 10, UNI_INOLDSOGDIAN } /* block=oldsogdian */, + { 3, 7240, 0, 10, 0, UNI_BOXDRAWING } /* boxdrawing */, + { 0, 5875, 6458, 13, 12, UNI_JG__MALAYALAMSSA } /* joininggroup=malayalamssa */, + { 1, 8973, 4090, 6, 16, UNI_GEORGIANEXT } /* block=georgianextended */, + { 7, 10540, 17, 5, 1, UNI_XPEO } /* isxpeo */, + { 170, 185, 11, 2, 2, UNI_DI } /* isdi */, + { 4, 10247, 6662, 3, 12, UNI_JG__VERTICALTAIL } /* jg=verticaltail */, + { 4, 3877, 9755, 17, 4, UNI_DSRT } /* scriptextensions=dsrt */, + { 1, 185, 4534, 2, 15, UNI_BRAI } /* isbraillepatterns */, + { 5, 9159, 10355, 6, 3, UNI_NFDQC__Y } /* nfdqc=yes */, + { 1, 9476, 3159, 5, 2, UNI_SC__KHOJ } /* sc=khoj */, + { 128, 10268, 8028, 3, 3, UNI_NV__200 } /* nv=200 */, + { 45, 6340, 2165, 3, 17, UNI_CYRILLICSUP } /* incyrillicsupplement */, + { 64, 9474, 4564, 5, 15, UNI_INSC__CONSONANTKILLER } /* insc=consonantkiller */, + { 0, 8881, 29, 4, 4, UNI_ARAB } /* isarabic */, + { 74, 9691, 3707, 4, 16, UNI_ETHIOPICEXT } /* blk=ethiopicextended */, + { 1, 1370, 0, 24, 0, UNI_ARABICPFA } /* arabicpresentationformsa */, + { 0, 9691, 3319, 4, 9, UNI_LATINEXTA } /* blk=latinexta */, + { 7, 9474, 5784, 5, 13, UNI_INSC__CONSONANTDEAD } /* insc=consonantdead */, + { 0, 2242, 9505, 3, 4, UNI_INNUSHU } /* innushu */, + { 27, 3463, 0, 18, 0, UNI_SMALLKANAEXT } /* smallkanaextension */, + { 2, 7230, 10274, 10, 3, UNI_BC__PDF } /* bidiclass=pdf */, + { 0, 7467, 7951, 3, 1, UNI_IN__3 } /* in=3 */, + { 2, 3877, 9775, 17, 4, UNI_GREK } /* scriptextensions=grek */, + { 0, 8782, 9879, 7, 4, UNI_SC__MYMR } /* script=mymr */, + { 0, 10244, 340, 3, 2, UNI_LO } /* gc=lo */, + { 0, 9691, 839, 4, 29, UNI_MISCARROWS } /* blk=miscellaneoussymbolsandarrows */, + { 9, 9469, 2573, 5, 20, UNI_INPC__TOPANDBOTTOMANDRIGHT } /* inpc=topandbottomandright */, + { 1, 6529, 7421, 3, 9, UNI_INOLDPERSIAN } /* inoldpersian */, + { 1, 9476, 9991, 3, 
4, UNI_SHAW } /* sc=shaw */, + { 2, 9476, 3978, 3, 8, UNI_SC__BOPO } /* sc=bopomofo */, + { 0, 10223, 3, 3, 1, -UNI_CI } /* ci=f */, + { 132, 9177, 1, 6, 1, -UNI_QMARK } /* qmark=n */, + { 0, 9711, 8027, 4, 2, UNI_CCC__22 } /* ccc=22 */, + { 0, 4999, 0, 15, 0, UNI_TITLE } /* titlecaseletter */, + { 1, 8967, 1026, 6, 2, -UNI_BIDIM } /* bidim=no */, + { 34, 10516, 8776, 3, 6, UNI_PHAG } /* isphagspa */, + { 0, 1553, 342, 9, 2, UNI_PE } /* category=pe */, + { 0, 1880, 0, 22, 0, UNI_cwu_values_index } /* changeswhenuppercased= */, + { 1, 10253, 752, 3, 2, UNI_LB__CL } /* lb=cl */, + { 0, 10511, 7580, 5, 4, UNI_POSIXWORD } /* posixword */, + { 0, 9691, 750, 4, 16, UNI_ENCLOSEDALPHANUM } /* blk=enclosedalphanum */, + { 106, 5408, 5942, 4, 7, UNI_INMALAYALAM } /* inmalayalam */, + { 0, 9711, 9370, 5, 4, UNI_CCC__28 } /* ccc=ccc28 */, + { 19, 3877, 7260, 17, 10, UNI_CHRS } /* scriptextensions=chorasmian */, + { 24, 185, 10388, 2, 2, UNI_CASEDLETTER } /* isl& */, + { 1, 7460, 10295, 10, 3, UNI_IN__2 } /* presentin=v20 */, + { 17, 3877, 7709, 17, 9, UNI_SIND } /* scriptextensions=khudawadi */, + { 0, 263, 0, 2, 0, UNI_SM } /* sm */, + { 33, 9550, 10355, 4, 3, UNI_IDS } /* ids=yes */, + { 0, 3121, 10091, 18, 4, UNI_EA__F } /* decompositiontype=wide */, + { 27, 4972, 8846, 3, 6, UNI_TAVT } /* istaiviet */, + { 0, 10253, 496, 3, 2, UNI_LB__NU } /* lb=nu */, + { 7, 4984, 0, 5, 0, UNI_TAML } /* tamil */, + { 0, 8973, 8552, 7, 6, UNI_CJKEXTB } /* block=cjkextb */, + { 0, 4074, 5581, 16, 11, UNI_MC } /* generalcategory=spacingmark */, + { 2, 10015, 0, 4, 0, UNI_TALE } /* tale */, + { 0, 4598, 3267, 4, 6, UNI_INGEORGIAN } /* ingeorgian */, + { 1, 9691, 7844, 4, 9, UNI_PALM } /* blk=palmyrene */, + { 3, 4699, 0, 14, 0, UNI_ECOMP } /* emojicomponent */, + { 4, 7391, 5118, 4, 11, UNI_CI } /* iscaseignorable */, + { 5, 9269, 3, 5, 1, -UNI_POSIXXDIGIT } /* ahex=f */, + { 56, 8881, 9265, 3, 4, UNI_ADLM } /* isadlam */, + { 1, 1847, 0, 5, 0, UNI_XPOSIXLOWER } /* lower */, + { 106, 3157, 
10355, 18, 3, UNI_EBASE } /* emojimodifierbase=yes */, + { 1, 1418, 6851, 24, 11, UNI_CCC__8 } /* canonicalcombiningclass=kanavoicing */, + { 0, 8887, 10055, 7, 4, UNI_XPOSIXSPACE } /* wspace=true */, + { 42, 10530, 8478, 4, 6, UNI_INTIFINAGH } /* intifinagh */, + { 0, 185, 9827, 2, 4, UNI_LANA } /* islana */, + { 1, 8782, 8656, 7, 7, UNI_SC__KALI } /* script=kayahli */, + { 12, 3877, 4534, 17, 7, UNI_BRAI } /* scriptextensions=braille */, + { 20, 185, 1019, 2, 5, UNI_MUSIC } /* ismusic */, + { 2, 9803, 7380, 4, 10, UNI_LB__H2 } /* hst=lvsyllable */, + { 0, 10268, 8949, 3, 4, UNI_NV__9000 } /* nv=9000 */, + { 0, 8782, 6362, 7, 5, UNI_KHMR } /* script=khmer */, + { 1, 8973, 952, 6, 28, UNI_VSSUP } /* block=variationselectorssupplement */, + { 2, 185, 3978, 2, 4, UNI_BOPO } /* isbopo */, + { 2, 1466, 0, 24, 0, UNI_DIACRITICALSFORSYMBOLS } /* combiningmarksforsymbols */, + { 1, 10508, 5802, 8, 5, UNI_XPOSIXALNUM } /* isxposixalnum */, + { 1, 6083, 10136, 13, 3, UNI_NV__2_SLASH_3 } /* numericvalue=2/3 */, + { 0, 7230, 1354, 10, 3, UNI_BC__RLE } /* bidiclass=rle */, + { 1, 185, 9819, 2, 4, UNI_KNDA } /* isknda */, + { 0, 3301, 0, 18, 0, UNI_PI } /* initialpunctuation */, + { 0, 185, 9069, 2, 4, UNI_GOTH } /* isgoth */, + { 12, 9979, 2937, 5, 8, UNI_SUND } /* scx=sundanese */, + { 243, 5875, 9243, 13, 6, UNI_JG__YUDHHE } /* joininggroup=yudhhe */, + { 16, 6340, 3105, 4, 16, UNI_COPTICEPACTNUMBERS } /* incopticepactnumbers */, + { 2, 8782, 8621, 7, 7, UNI_SC__GRAN } /* script=grantha */, + { 4, 185, 868, 2, 11, UNI_PHONETICEXT } /* isphoneticext */, + { 84, 4074, 468, 16, 11, UNI_P } /* generalcategory=punctuation */, + { 3, 1418, 6554, 24, 12, UNI_CCC__0 } /* canonicalcombiningclass=notreordered */, + { 9, 6083, 9631, 13, 3, UNI_NV__3_SLASH_8 } /* numericvalue=3/8 */, + { 26, 9691, 9093, 4, 6, UNI_INKAITHI } /* blk=kaithi */, + { 0, 5927, 0, 13, 0, UNI_LOWSURROGATES } /* lowsurrogates */, + { 5, 9544, 36, 5, 1, UNI_XIDC } /* xidc=t */, + { 1, 185, 4625, 3, 14, 
UNI_CURRENCYSYMBOLS } /* iscurrencysymbols */, + { 7, 8973, 8670, 6, 7, UNI_INMAKASAR } /* block=makasar */, + { 0, 9476, 7700, 3, 9, UNI_SC__QAAI } /* sc=inherited */, + { 0, 8973, 3707, 6, 17, UNI_ETHIOPICEXTA } /* block=ethiopicextendeda */, + { 1, 2248, 2994, 3, 18, UNI_SUPARROWSC } /* insupplementalarrowsc */, + { 3, 9979, 7826, 4, 9, UNI_ORKH } /* scx=oldturkic */, + { 20, 8973, 571, 7, 29, UNI_CJKEXTC } /* block=cjkunifiedideographsextensionc */, + { 0, 8782, 7450, 7, 10, UNI_PHNX } /* script=phoenician */, + { 2, 7300, 0, 10, 0, UNI_dia_values_index } /* diacritic= */, + { 347, 10268, 8907, 3, 2, UNI_NV__30 } /* nv=30 */, + { 0, 9476, 7333, 6, 7, UNI_KHAR } /* sc=kharoshthi */, + { 0, 8973, 5888, 6, 13, UNI_KANAEXTA } /* block=kanaextendeda */, + { 2, 9691, 9831, 4, 3, UNI_INLAO } /* blk=lao */, + { 56, 7370, 36, 10, 1, UNI_XPOSIXLOWER } /* lowercase=t */, + { 0, 8782, 9923, 7, 4, UNI_SC__OUGR } /* script=ougr */, + { 21, 9195, 0, 6, 0, UNI_TNSA } /* tangsa */, + { 101, 8973, 2353, 6, 20, UNI_INANATOLIANHIEROGLYPHS } /* block=anatolianhieroglyphs */, + { 22, 9691, 2164, 4, 18, UNI_CYRILLICSUP } /* blk=cyrillicsupplement */, + { 45, 9691, 1007, 4, 27, UNI_ANCIENTGREEKMUSIC } /* blk=ancientgreekmusicalnotation */, + { 21, 3175, 9454, 18, 5, -UNI_EPRES } /* emojipresentation=false */, + { 0, 3193, 0, 18, 0, UNI_ETHIOPICSUP } /* ethiopicsupplement */, + { 2, 8973, 5312, 6, 14, UNI_LATINEXTD } /* block=latinextendedd */, + { 82, 10253, 2664, 3, 2, UNI_LB__BA } /* lb=ba */, + { 0, 3877, 9524, 17, 5, UNI_RUNR } /* scriptextensions=runic */, + { 0, 8973, 10051, 6, 4, UNI_INTOTO } /* block=toto */, + { 129, 3157, 36, 18, 1, UNI_EBASE } /* emojimodifierbase=t */, + { 1, 10229, 4058, 3, 5, UNI_DT__FIN } /* dt=final */, + { 33, 8719, 0, 7, 0, UNI_NB } /* noblock */, + { 2, 1418, 10172, 24, 3, UNI_CCC__IS } /* canonicalcombiningclass=240 */, + { 1, 9464, 36, 5, 1, UNI_IDST } /* idst=t */, + { 14, 10268, 8028, 3, 5, UNI_NV__20000 } /* nv=20000 */, + { 43, 8300, 0, 8, 0, 
UNI_DUPL } /* duployan */, + { 4, 9461, 7871, 3, 9, UNI_SB__SC } /* sb=scontinue */, + { 0, 8973, 7808, 6, 9, UNI_INOLDITALIC } /* block=olditalic */, + { 0, 2056, 0, 21, 0, UNI__PERL_NCHAR } /* noncharactercodepoint */, + { 3, 8973, 2936, 6, 9, UNI_INSUNDANESE } /* block=sundanese */, + { 0, 9691, 7781, 4, 9, UNI_INNABATAEAN } /* blk=nabataean */, + { 1, 6340, 691, 3, 29, UNI_CJKEXTG } /* incjkunifiedideographsextensiong */, + { 65, 185, 750, 2, 16, UNI_ENCLOSEDALPHANUM } /* isenclosedalphanum */, + { 0, 7908, 0, 8, 0, UNI_ids_values_index } /* idstart= */, + { 14, 6340, 1062, 4, 4, UNI_INCOPTIC } /* incoptic */, + { 4, 5940, 0, 9, 0, UNI_MLYM } /* malayalam */, + { 10, 1968, 0, 22, 0, UNI_EARLYDYNASTICCUNEIFORM } /* earlydynasticcuneiform */, + { 138, 8973, 3319, 6, 9, UNI_LATINEXTA } /* block=latinexta */, + { 0, 2056, 0, 22, 0, UNI_nchar_values_index } /* noncharactercodepoint= */, + { 0, 7297, 9082, 3, 5, UNI_HATR } /* ishatran */, + { 0, 2593, 3546, 20, 7, UNI_VO__U } /* verticalorientation=upright */, + { 1, 5648, 1, 14, 1, -UNI_QMARK } /* quotationmark=n */, + { 1, 10268, 9575, 3, 4, UNI_NV__1_SLASH_64 } /* nv=1/64 */, + { 1, 6083, 8020, 13, 8, UNI_NV__1_SLASH_40 } /* numericvalue=2.50e-02 */, + { 0, 9691, 0, 4, 34, UNI_UCAS } /* blk=unifiedcanadianaboriginalsyllabics */, + { 1, 10516, 9424, 7, 5, UNI_POSIXCNTRL } /* isposixcntrl */, + { 0, 8973, 9284, 6, 5, UNI_INBATAK } /* block=batak */, + { 0, 9476, 8684, 3, 4, UNI_MARC } /* sc=marc */, + { 0, 10349, 0, 3, 0, UNI_vs_values_index } /* vs= */, + { 22, 3139, 0, 10, 0, UNI_DEVA } /* devanagari */, + { 36, 3283, 3, 18, 1, -UNI_IDSB } /* idsbinaryoperator=f */, + { 0, 185, 7016, 2, 11, UNI_HMNG } /* ispahawhhmong */, + { 6, 8973, 1295, 6, 25, UNI_SUPERANDSUB } /* block=superscriptsandsubscripts */, + { 5, 8973, 6207, 7, 11, UNI_CYRILLICEXTB } /* block=cyrillicextb */, + { 133, 7360, 4010, 10, 16, UNI_LB__CP } /* linebreak=closeparenthesis */, + { 4, 9063, 0, 5, 0, UNI_EPRES } /* epres */, + { 9, 7297, 6303, 
3, 5, UNI_HEBR } /* ishebrew */, + { 76, 21, 5326, 2, 14, UNI_LATINEXTE } /* inlatinextendede */, + { 2, 7300, 1026, 10, 2, -UNI_DIA } /* diacritic=no */, + { 0, 7580, 5830, 10, 5, UNI_WB__EB } /* wordbreak=ebase */, + { 4, 8973, 3265, 6, 18, UNI_GEORGIANSUP } /* block=georgiansupplement */, + { 3, 9691, 3809, 4, 17, UNI_LETTERLIKESYMBOLS } /* blk=letterlikesymbols */, + { 0, 9476, 8468, 3, 4, UNI_SC__TAGB } /* sc=tagb */, + { 0, 2553, 10355, 20, 3, UNI_TERM } /* terminalpunctuation=yes */, + { 4, 7218, 3979, 3, 10, UNI_BOPOMOFOEXT } /* inbopomofoext */, + { 168, 10508, 10100, 3, 3, UNI_XSUX } /* isxsux */, + { 2, 7230, 4549, 10, 15, UNI_BC__CS } /* bidiclass=commonseparator */, + { 1, 9476, 8859, 3, 7, UNI_TIBT } /* sc=tibetan */, + { 3, 1418, 8901, 24, 3, UNI_CCC__216 } /* canonicalcombiningclass=216 */, + { 0, 9711, 18, 4, 1, UNI_CCC__R } /* ccc=r */, + { 0, 10244, 5581, 3, 11, UNI_MC } /* gc=spacingmark */, + { 1, 9087, 10355, 6, 3, UNI_JOINC } /* joinc=yes */, + { 0, 2248, 4411, 3, 15, UNI_SYRIACSUP } /* insyriacsupplement */, + { 0, 8420, 0, 8, 0, UNI_MAHJ } /* mahajani */, + { 0, 8973, 4410, 6, 9, UNI_SYRIACSUP } /* block=syriacsup */, + { 1, 340, 0, 2, 0, UNI_LO } /* lo */, + { 13, 184, 0, 34, 0, UNI_MISCPICTOGRAPHS } /* miscellaneoussymbolsandpictographs */, + { 0, 9469, 0, 5, 0, UNI_inpc_values_index } /* inpc= */, + { 0, 6158, 36, 12, 1, UNI_BIDIC } /* bidicontrol=t */, + { 1, 1418, 6774, 24, 11, UNI_CCC__DB } /* canonicalcombiningclass=doublebelow */, + { 0, 9691, 2269, 4, 21, UNI_MEETEIMAYEKEXT } /* blk=meeteimayekextensions */, + { 0, 3067, 0, 18, 0, UNI_HALFMARKS } /* combininghalfmarks */, + { 2, 10553, 2937, 3, 3, UNI_SUND } /* issund */, + { 264, 3877, 10099, 17, 4, UNI_XSUX } /* scriptextensions=xsux */, + { 7, 4074, 10388, 16, 2, UNI_CASEDLETTER } /* generalcategory=l& */, + { 18, 9979, 7853, 4, 9, UNI_PAUC } /* scx=paucinhau */, + { 0, 8887, 10355, 7, 3, UNI_XPOSIXSPACE } /* wspace=yes */, + { 4, 4744, 7692, 16, 8, UNI_IDENTIFIERTYPE__INCLUSION 
} /* identifiertype=inclusion */, + { 256, 9711, 10151, 4, 3, UNI_CCC__L } /* ccc=224 */, + { 0, 8260, 0, 8, 0, UNI_ARMN } /* armenian */, + { 0, 8973, 8614, 6, 7, UNI_INELYMAIC } /* block=elymaic */, + { 3, 8782, 8866, 7, 4, UNI_SC__TIRH } /* script=tirh */, + { 6, 8782, 9534, 7, 5, UNI_SC__TAKR } /* script=takri */, + { 256, 185, 750, 2, 30, UNI_ENCLOSEDALPHANUMSUP } /* isenclosedalphanumericsupplement */, + { 7, 8782, 3139, 7, 4, UNI_SC__DEVA } /* script=deva */, + { 0, 7467, 10313, 3, 3, UNI_IN__4_DOT_1 } /* in=v41 */, + { 0, 8973, 1946, 6, 12, UNI_DIACRITICALS } /* block=diacriticals */, + { 1, 10244, 6132, 3, 2, UNI_PF } /* gc=pf */, + { 1, 4074, 1026, 16, 2, UNI_NO } /* generalcategory=no */, + { 8, 2557, 6125, 5, 9, UNI_ALPHABETICPF } /* inalphabeticpf */, + { 1, 3877, 7018, 18, 3, UNI_SHAW } /* scriptextensions=shaw */, + { 0, 10253, 126, 3, 2, UNI_LB__CR } /* lb=cr */, + { 0, 2003, 24, 10, 1, UNI_LOWERCASELETTER } /* category=ll */, + { 8, 9731, 0, 4, 0, UNI_cwt_values_index } /* cwt= */, + { 0, 9691, 2746, 4, 10, UNI_JAMO } /* blk=hanguljamo */, + { 92, 2206, 8313, 21, 3, UNI_WB__EB } /* graphemeclusterbreak=gaz */, + { 5, 9476, 9923, 3, 4, UNI_SC__OUGR } /* sc=ougr */, + { 67, 10099, 0, 4, 0, UNI_XSUX } /* xsux */, + { 8, 9177, 9454, 6, 5, -UNI_QMARK } /* qmark=false */, + { 0, 9979, 8804, 5, 3, UNI_SIDD } /* scx=sidd */, + { 8, 10247, 5966, 3, 13, UNI_JG__MANICHAEANMEM } /* jg=manichaeanmem */, + { 0, 9691, 9539, 4, 5, UNI_VSSUP } /* blk=vssup */, + { 0, 8973, 4729, 6, 15, UNI_INHANGUL } /* block=hangulsyllables */, + { 1, 185, 150, 3, 34, UNI_DIACRITICALSSUP } /* iscombiningdiacriticalmarkssupplement */, + { 28, 9647, 10304, 4, 3, UNI_AGE__3_DOT_1 } /* age=v31 */, + { 1, 2185, 1, 21, 1, -UNI_EXTPICT } /* extendedpictographic=n */, + { 1, 10268, 9631, 3, 4, UNI_NV__3_SLASH_80 } /* nv=3/80 */, + { 0, 21, 1219, 2, 8, UNI_INKATAKANA } /* inkatakana */, + { 0, 8973, 4984, 6, 5, UNI_INTAMIL } /* block=tamil */, + { 0, 8782, 8476, 7, 8, UNI_TFNG } /* 
script=tifinagh */, + { 32, 9711, 9340, 5, 4, UNI_CCC__22 } /* ccc=ccc22 */, + { 4, 5340, 0, 14, 0, UNI_LATINEXTF } /* latinextendedf */, + { 5, 1990, 4458, 22, 16, UNI_INSC__VOWELINDEPENDENT } /* indicsyllabiccategory=vowelindependent */, + { 0, 7391, 9, 4, 16, UNI_CANS } /* iscanadianaboriginal */, + { 3, 8782, 7570, 7, 10, UNI_WARA } /* script=warangciti */, + { 0, 5875, 9855, 13, 4, UNI_JG__MEEM } /* joininggroup=meem */, + { 2, 8973, 8566, 7, 6, UNI_CJKEXTD } /* block=cjkextd */, + { 5, 7360, 496, 10, 7, UNI_LB__NU } /* linebreak=numeric */, + { 2, 10229, 436, 4, 2, UNI_DT__ENC } /* dt=enc */, + { 99, 9189, 3, 6, 1, -UNI_STERM } /* sterm=f */, + { 87, 10244, 5914, 3, 13, UNI_ZL } /* gc=lineseparator */, + { 0, 2185, 0, 20, 0, UNI_EXTPICT } /* extendedpictographic */, + { 6, 8973, 7016, 6, 11, UNI_INPAHAWHHMONG } /* block=pahawhhmong */, + { 2, 8782, 9683, 7, 4, UNI_BATK } /* script=batk */, + { 256, 5836, 0, 13, 0, UNI_GREEKEXT } /* greekextended */, + { 0, 3877, 2841, 17, 4, UNI_MERO } /* scriptextensions=mero */, + { 0, 8973, 9539, 6, 5, UNI_VSSUP } /* block=vssup */, + { 22, 8973, 9863, 6, 4, UNI_INMIAO } /* block=miao */, + { 0, 3877, 10000, 18, 3, UNI_SHRD } /* scriptextensions=shrd */, + { 25, 1538, 2479, 24, 5, UNI_INPC__RIGHT } /* indicpositionalcategory=right */, + { 1, 9691, 2493, 4, 20, UNI_INNYIAKENGPUACHUEHMONG } /* blk=nyiakengpuachuehmong */, + { 1, 3877, 8292, 17, 8, UNI_BUGI } /* scriptextensions=buginese */, + { 11, 1553, 1187, 9, 2, UNI_PO } /* category=po */, + { 2, 3877, 9707, 17, 4, UNI_CANS } /* scriptextensions=cans */, + { 0, 8782, 8276, 7, 4, UNI_BALI } /* script=bali */, + { 0, 8782, 2312, 8, 6, UNI_SC__SINH } /* script=sinhala */, + { 0, 6083, 10139, 13, 3, UNI_NV__2_SLASH_5 } /* numericvalue=2/5 */, + { 1, 9691, 2248, 4, 21, UNI_ININSCRIPTIONALPARTHIAN } /* blk=inscriptionalparthian */, + { 0, 8973, 9514, 6, 5, UNI_INORIYA } /* block=oriya */, + { 1, 7, 0, 1, 0, UNI_C } /* c */, + { 306, 10253, 4954, 3, 15, UNI_LB__OP } /* 
lb=openpunctuation */, + { 0, 10268, 9560, 3, 3, UNI_NV__1_SLASH_2 } /* nv=1/2 */, + { 20, 2248, 1563, 3, 23, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* insupsymbolsandpictographs */, + { 15, 1836, 0, 21, 0, UNI_CWL } /* changeswhenlowercased */, + { 7, 9691, 5298, 4, 14, UNI_LATINEXTC } /* blk=latinextendedc */, + { 0, 1836, 1, 22, 1, -UNI_CWL } /* changeswhenlowercased=n */, + { 0, 2841, 0, 4, 0, UNI_MERO } /* mero */, + { 6, 3877, 9667, 17, 4, UNI_ARMN } /* scriptextensions=armn */, + { 0, 9711, 10148, 4, 3, UNI_CCC__BR } /* ccc=222 */, + { 73, 10268, 10196, 3, 3, UNI_NV__5_SLASH_8 } /* nv=5/8 */, + { 0, 9711, 0, 4, 0, UNI_ccc_values_index } /* ccc= */, + { 0, 9270, 36, 4, 1, UNI_XPOSIXXDIGIT } /* hex=t */, + { 0, 5059, 0, 15, 0, UNI_ZANB } /* zanabazarsquare */, + { 1, 6350, 0, 12, 0, UNI_jt_values_index } /* joiningtype= */, + { 33, 4669, 0, 15, 0, UNI_DIACRITICALSSUP } /* diacriticalssup */, + { 2, 185, 2955, 2, 19, UNI_SUPARROWSA } /* issupplementalarrowsa */, + { 1, 1418, 6763, 24, 11, UNI_CCC__DA } /* canonicalcombiningclass=doubleabove */, + { 462, 9544, 1, 5, 1, -UNI_XIDC } /* xidc=n */, + { 65, 185, 5131, 3, 13, UNI_CJKCOMPATFORMS } /* iscjkcompatforms */, + { 1, 9063, 26, 6, 1, UNI_EPRES } /* epres=y */, + { 0, 185, 34, 2, 3, UNI_EXT } /* isext */, + { 130, 2312, 2229, 4, 12, UNI_INHANIFIROHINGYA } /* inhanifirohingya */, + { 1, 7580, 6254, 10, 12, UNI_WB__EX } /* wordbreak=extendnumlet */, + { 1, 185, 9835, 2, 4, UNI_LATN } /* islatn */, + { 0, 10253, 10394, 3, 2, UNI_LB__XX } /* lb=xx */, + { 6, 97, 0, 10, 0, UNI_XPOSIXALPHA } /* alphabetic */, + { 3, 185, 3674, 3, 16, UNI_CYRILLICEXTB } /* iscyrillicextendedb */, + { 0, 9476, 3934, 3, 11, UNI_SGNW } /* sc=signwriting */, + { 16, 5875, 7177, 13, 3, UNI_JG__FEH } /* joininggroup=feh */, + { 71, 4074, 1187, 16, 2, UNI_PO } /* generalcategory=po */, + { 2, 9469, 8776, 3, 6, UNI_INPHAGSPA } /* inphagspa */, + { 27, 8468, 0, 4, 0, UNI_TAGB } /* tagb */, + { 3, 6083, 9307, 13, 2, UNI_NV__15 } /* numericvalue=15 */, 
+ { 9, 5875, 6906, 13, 11, UNI_JG__MALAYALAMJA } /* joininggroup=malayalamja */, + { 0, 6083, 8925, 13, 4, UNI_NV__5000 } /* numericvalue=5000 */, + { 37, 10516, 5096, 7, 5, UNI_POSIXDIGIT } /* isposixdigit */, + { 1, 9691, 8859, 4, 7, UNI_INTIBETAN } /* blk=tibetan */, + { 1, 1553, 3383, 10, 8, UNI_Z } /* category=separator */, + { 30, 9979, 10103, 4, 4, UNI_YI } /* scx=yiii */, + { 0, 10229, 1418, 3, 9, UNI_DT__CAN } /* dt=canonical */, + { 0, 8973, 8468, 6, 8, UNI_INTAGBANWA } /* block=tagbanwa */, + { 48, 9997, 8791, 4, 5, UNI_SC__SHRD } /* insharada */, + { 0, 185, 5368, 2, 7, UNI_LISUSUP } /* islisusup */, + { 100, 8955, 1026, 6, 2, -UNI_XPOSIXALPHA } /* alpha=no */, + { 39, 8782, 9911, 7, 4, UNI_ORKH } /* script=orkh */, + { 4, 1418, 9417, 24, 2, UNI_CCC__84 } /* canonicalcombiningclass=84 */, + { 33, 7297, 4107, 3, 15, UNI_HALFANDFULLFORMS } /* ishalfandfullforms */, + { 0, 9803, 6895, 4, 11, UNI_LB__H3 } /* hst=lvtsyllable */, + { 0, 10250, 0, 3, 1, UNI_JT__U } /* jt=u */, + { 0, 8782, 6494, 7, 12, UNI_SC__GONM } /* script=masaramgondi */, + { 33, 10516, 910, 3, 9, UNI_CO } /* isprivateuse */, + { 0, 8973, 5284, 6, 14, UNI_LATINEXTB } /* block=latinextendedb */, + { 16, 8782, 10099, 7, 4, UNI_XSUX } /* script=xsux */, + { 1, 10253, 10376, 3, 2, UNI_LB__BK } /* lb=bk */, + { 98, 10268, 8204, 3, 8, UNI_NV__3_SLASH_4 } /* nv=7.50e-01 */, + { 0, 9691, 2746, 4, 19, UNI_JAMOEXTA } /* blk=hanguljamoextendeda */, + { 1, 2206, 263, 21, 2, UNI_GCB__SM } /* graphemeclusterbreak=sm */, + { 0, 7460, 8212, 10, 3, UNI_IN__8 } /* presentin=8.0 */, + { 13, 3409, 26, 18, 1, UNI_RI } /* regionalindicator=y */, + { 10, 10268, 7964, 3, 8, UNI_NV__3_SLASH_20 } /* nv=1.50e-01 */, + { 4, 9763, 5064, 5, 2, UNI_WB__EB } /* gcb=gaz */, + { 1, 1592, 3194, 3, 17, UNI_ETHIOPICSUP } /* inethiopicsupplement */, + { 1, 3877, 8614, 17, 4, UNI_ELYM } /* scriptextensions=elym */, + { 0, 1852, 10055, 6, 4, UNI_CASED } /* cased=true */, + { 0, 10043, 0, 4, 0, UNI_TIBT } /* tibt */, + { 1, 
9476, 9081, 3, 4, UNI_HATR } /* sc=hatr */, + { 0, 2206, 74, 21, 2, UNI_WB__EB } /* graphemeclusterbreak=em */, + { 99, 10508, 6675, 3, 3, UNI_XIDC } /* isxidc */, + { 0, 3877, 10083, 17, 4, UNI_VAI } /* scriptextensions=vaii */, + { 0, 43, 0, 26, 0, UNI_CJKCOMPATIDEOGRAPHS } /* cjkcompatibilityideographs */, + { 2, 8782, 9935, 7, 4, UNI_PHNX } /* script=phnx */, + { 4, 8973, 8719, 6, 7, UNI_NB } /* block=noblock */, + { 0, 5045, 5015, 3, 14, UNI_UPPERCASELETTER } /* isuppercaseletter */, + { 34, 8782, 9827, 7, 4, UNI_LANA } /* script=lana */, + { 3, 5088, 10355, 14, 3, UNI_POSIXXDIGIT } /* asciihexdigit=yes */, + { 0, 8973, 3139, 6, 10, UNI_INDEVANAGARI } /* block=devanagari */, + { 0, 8782, 5368, 7, 4, UNI_LISU } /* script=lisu */, + { 12, 185, 9783, 2, 4, UNI_GURU } /* isguru */, + { 8, 9647, 7611, 4, 3, UNI_AGE__5 } /* age=5.0 */, + { 0, 9979, 9915, 4, 4, UNI_ORYA } /* scx=orya */, + { 3, 10244, 4774, 3, 15, UNI_LOWERCASELETTER } /* gc=lowercaseletter */, + { 3, 9476, 1924, 3, 6, UNI_SC__ZYYY } /* sc=common */, + { 0, 6083, 10204, 13, 2, UNI_NV__37 } /* numericvalue=37 */, + { 0, 3553, 26, 18, 1, UNI_VS } /* variationselector=y */, + { 0, 3978, 0, 8, 0, UNI_BOPO } /* bopomofo */, + { 0, 10244, 7550, 3, 10, UNI_CN } /* gc=unassigned */, + { 432, 9867, 0, 4, 0, UNI_MLYM } /* mlym */, + { 32, 8973, 329, 6, 21, UNI_MATHOPERATORS } /* block=mathematicaloperators */, + { 20, 2269, 0, 14, 0, UNI_MEETEIMAYEKEXT } /* meeteimayekext */, + { 32, 97, 0, 5, 0, UNI_XPOSIXALPHA } /* alpha */, + { 32, 9979, 9843, 4, 4, UNI_LINB } /* scx=linb */, + { 5, 3945, 36, 17, 1, UNI_UIDEO } /* unifiedideograph=t */, + { 4, 9747, 26, 4, 1, UNI_DIA } /* dia=y */, + { 0, 8782, 8775, 7, 7, UNI_SC__PHAG } /* script=phagspa */, + { 2, 10352, 401, 3, 6, UNI_WB__FO } /* wb=format */, + { 0, 185, 1678, 2, 5, UNI_LATN } /* islatin */, + { 0, 9711, 9006, 4, 3, UNI_CCC__122 } /* ccc=122 */, + { 118, 8388, 0, 8, 0, UNI_JAVA } /* javanese */, + { 3, 9691, 447, 4, 18, UNI_IDEOGRAPHICSYMBOLS } /* 
blk=ideographicsymbols */, + { 1, 9651, 0, 4, 0, UNI_AGHB } /* aghb */, + { 1, 1418, 8235, 24, 2, UNI_CCC__28 } /* canonicalcombiningclass=28 */, + { 0, 8973, 447, 6, 18, UNI_IDEOGRAPHICSYMBOLS } /* block=ideographicsymbols */, + { 9, 185, 3837, 3, 3, UNI_CHAM } /* ischam */, + { 9, 7646, 0, 9, 0, UNI_ARABICPFB } /* arabicpfb */, + { 1, 8973, 4381, 6, 13, UNI_MATHOPERATORS } /* block=mathoperators */, + { 35, 1553, 134, 9, 4, UNI_M } /* category=mark */, + { 0, 10253, 8894, 3, 7, UNI_LB__ZW } /* lb=zwspace */, + { 11, 5758, 26, 13, 1, UNI_BIDIM } /* bidimirrored=y */, + { 41, 10516, 3403, 7, 5, UNI_POSIXSPACE } /* isposixspace */, + { 9, 9539, 0, 5, 0, UNI_VSSUP } /* vssup */, + { 128, 1418, 4175, 24, 1, UNI_CCC__1 } /* canonicalcombiningclass=1 */, + { 1, 9979, 3139, 4, 10, UNI_DEVA } /* scx=devanagari */, + { 0, 9476, 79, 3, 6, UNI_SC__ARAB } /* sc=arabic */, + { 1, 9474, 1245, 5, 25, UNI_INSC__CONSONANTINITIALPOSTFIXED } /* insc=consonantinitialpostfixed */, + { 0, 1990, 9289, 22, 5, UNI_INSC__BINDU } /* indicsyllabiccategory=bindu */, + { 1, 10253, 5648, 3, 9, UNI_LB__QU } /* lb=quotation */, + { 4, 3877, 6972, 17, 11, UNI_NAND } /* scriptextensions=nandinagari */, + { 24, 7580, 10394, 10, 2, UNI_WB__XX } /* wordbreak=xx */, + { 0, 2248, 3912, 3, 16, UNI_SMALLFORMS } /* insmallformvariants */, + { 0, 8782, 5940, 7, 9, UNI_SC__MLYM } /* script=malayalam */, + { 4, 10244, 134, 3, 4, UNI_M } /* gc=mark */, + { 2, 3877, 10111, 17, 4, UNI_ZANB } /* scriptextensions=zanb */, + { 1, 5810, 0, 13, 0, UNI_ME } /* enclosingmark */, + { 0, 6842, 3625, 5, 14, UNI_INCAUCASIANALBANIAN } /* incaucasianalbanian */, + { 0, 1852, 10355, 6, 3, UNI_CASED } /* cased=yes */, + { 0, 8782, 4504, 7, 4, UNI_BAMU } /* script=bamu */, + { 0, 7360, 5830, 10, 5, UNI_EBASE } /* linebreak=ebase */, + { 0, 9476, 7, 3, 18, UNI_CANS } /* sc=canadianaboriginal */, + { 3, 2122, 0, 21, 0, UNI_CJKCOMPATFORMS } /* cjkcompatibilityforms */, + { 2, 4972, 4427, 3, 5, UNI_TANG } /* istangut */, + { 0, 
1538, 2579, 24, 6, UNI_INPC__BOTTOM } /* indicpositionalcategory=bottom */, + { 32, 6083, 7934, 13, 2, UNI_NV__25 } /* numericvalue=25 */, + { 0, 9691, 4381, 4, 13, UNI_MATHOPERATORS } /* blk=mathoperators */, + { 0, 8316, 0, 8, 0, UNI_extpict_values_index } /* extpict= */, + { 1, 9691, 1442, 4, 24, UNI_CJKSYMBOLS } /* blk=cjksymbolsandpunctuation */, + { 0, 9711, 9016, 5, 4, UNI_CCC__13 } /* ccc=ccc13 */, + { 193, 10232, 1193, 3, 9, UNI_EA__H } /* ea=halfwidth */, + { 364, 5875, 6693, 13, 4, UNI_JG__NOON } /* joininggroup=noon */, + { 170, 9550, 26, 4, 1, UNI_IDS } /* ids=y */, + { 0, 1418, 9004, 25, 5, UNI_CCC__122 } /* canonicalcombiningclass=ccc122 */, + { 3, 9711, 4968, 4, 2, UNI_CCC__0 } /* ccc=nr */, + { 0, 8973, 6109, 6, 13, UNI_VERTICALFORMS } /* block=verticalforms */, + { 3, 9691, 8340, 4, 8, UNI_INGUJARATI } /* blk=gujarati */, + { 0, 10232, 7628, 3, 9, UNI_EA__A } /* ea=ambiguous */, + { 0, 8887, 0, 6, 0, UNI_XPOSIXSPACE } /* wspace */, + { 2, 7907, 3, 9, 1, -UNI_XIDS } /* xidstart=f */, + { 0, 9476, 9739, 3, 4, UNI_SC__CYRL } /* sc=cyrl */, + { 0, 10352, 4346, 3, 5, UNI_WB__XX } /* wb=other */, + { 18, 3877, 9534, 17, 5, UNI_TAKR } /* scriptextensions=takri */, + { 2, 118, 5863, 3, 12, UNI_IPAEXT } /* inipaextensions */, + { 0, 4972, 5947, 3, 3, UNI_TAML } /* istaml */, + { 0, 2860, 0, 19, 0, UNI_MODIFIERTONELETTERS } /* modifiertoneletters */, + { 9, 1274, 10355, 21, 3, UNI_CE } /* compositionexclusion=yes */, + { 258, 6340, 44, 3, 35, UNI_CJKCOMPATIDEOGRAPHSSUP } /* incjkcompatibilityideographssupplement */, + { 256, 3877, 4186, 17, 7, UNI_LINB } /* scriptextensions=linearb */, + { 0, 9691, 3247, 4, 18, UNI_INPUNCTUATION } /* blk=generalpunctuation */, + { 42, 9045, 0, 5, 0, UNI_CWKCF } /* cwkcf */, + { 257, 1701, 0, 23, 0, UNI_SHORTHANDFORMATCONTROLS } /* shorthandformatcontrols */, + { 0, 9691, 7093, 4, 11, UNI_SUPERANDSUB } /* blk=superandsub */, + { 147, 9691, 3826, 4, 10, UNI_INMANICHAEAN } /* blk=manichaean */, + { 7, 9489, 0, 5, 0, 
UNI_math_values_index } /* math= */, + { 0, 8782, 8607, 7, 7, UNI_ELBA } /* script=elbasan */, + { 3, 1924, 0, 22, 0, UNI_INDICNUMBERFORMS } /* commonindicnumberforms */, + { 0, 9979, 10035, 4, 4, UNI_TGLG } /* scx=tglg */, + { 168, 9691, 10083, 4, 3, UNI_INVAI } /* blk=vai */, + { 2, 2185, 0, 21, 0, UNI_extpict_values_index } /* extendedpictographic= */, + { 67, 7360, 6326, 10, 12, UNI_LB__IS } /* linebreak=infixnumeric */, + { 0, 8782, 7853, 7, 9, UNI_PAUC } /* script=paucinhau */, + { 0, 10232, 3, 3, 1, UNI_EA__F } /* ea=f */, + { 33, 9691, 8866, 4, 7, UNI_INTIRHUTA } /* blk=tirhuta */, + { 0, 9476, 10003, 3, 4, UNI_SOGO } /* sc=sogo */, + { 0, 4714, 10355, 15, 3, UNI_GREXT } /* graphemeextend=yes */, + { 136, 185, 8587, 3, 6, UNI_CJKEXTG } /* iscjkextg */, + { 0, 10229, 9039, 3, 6, UNI_DT__ENC } /* dt=circle */, + { 17, 9691, 5214, 4, 14, UNI_INGREEK } /* blk=greekandcoptic */, + { 0, 3877, 8284, 17, 8, UNI_BASS } /* scriptextensions=bassavah */, + { 20, 185, 1219, 2, 8, UNI_KANA } /* iskatakana */, + { 0, 7460, 10307, 10, 3, UNI_IN__3_DOT_2 } /* presentin=v32 */, + { 13, 9691, 3481, 4, 11, UNI_TAIXUANJING } /* blk=taixuanjing */, + { 1, 8782, 10083, 7, 3, UNI_VAI } /* script=vai */, + { 0, 6675, 3, 11, 1, -UNI_IDC } /* idcontinue=f */, + { 2, 5522, 0, 14, 0, UNI_SK } /* modifiersymbol */, + { 0, 7360, 8642, 10, 6, UNI_LB__HY } /* linebreak=hyphen */, + { 0, 9711, 8986, 5, 5, UNI_CCC__103 } /* ccc=ccc103 */, + { 0, 5662, 340, 14, 2, UNI_SB__LO } /* sentencebreak=lo */, + { 79, 9915, 0, 4, 0, UNI_ORYA } /* orya */, + { 0, 3877, 9723, 17, 4, UNI_CPRT } /* scriptextensions=cprt */, + { 0, 3877, 9939, 17, 4, UNI_MIAO } /* scriptextensions=plrd */, + { 57, 9129, 0, 4, 0, UNI_LYCI } /* lyci */, + { 31, 2248, 7541, 3, 9, UNI_SUPARROWSC } /* insuparrowsc */, + { 0, 9979, 9951, 4, 4, UNI_QAAI } /* scx=qaai */, + { 7, 9270, 1, 4, 1, -UNI_XPOSIXXDIGIT } /* hex=n */, + { 1, 9075, 1, 6, 1, -UNI_GREXT } /* grext=n */, + { 0, 10247, 4234, 3, 16, UNI_JG__MANICHAEANLAMEDH } /* 
jg=manichaeanlamedh */, + { 2, 4410, 0, 9, 0, UNI_SYRIACSUP } /* syriacsup */, + { 11, 9691, 1655, 4, 6, UNI_INHANGUL } /* blk=hangul */, + { 0, 7907, 0, 8, 0, UNI_XIDS } /* xidstart */, + { 2, 4074, 5914, 16, 13, UNI_ZL } /* generalcategory=lineseparator */, + { 0, 1553, 5522, 9, 14, UNI_SK } /* category=modifiersymbol */, + { 0, 185, 721, 3, 15, UNI_CUNEIFORMNUMBERS } /* iscuneiformnumbers */, + { 0, 9979, 8754, 4, 7, UNI_OSMA } /* scx=osmanya */, + { 536, 9691, 6950, 4, 11, UNI_MYANMAREXTA } /* blk=myanmarexta */, + { 4, 4463, 3141, 4, 16, UNI_DEVANAGARIEXT } /* indevanagariextended */, + { 0, 7580, 34, 10, 2, UNI_WB__EX } /* wordbreak=ex */, + { 1, 9077, 3, 4, 1, -UNI_EXT } /* ext=f */, + { 2, 1792, 10355, 22, 3, UNI_CWCF } /* changeswhencasefolded=yes */, + { 14, 9979, 8388, 4, 4, UNI_JAVA } /* scx=java */, + { 4, 9979, 9655, 4, 4, UNI_AHOM } /* scx=ahom */, + { 8, 10244, 113, 3, 2, UNI_SC } /* gc=sc */, + { 0, 6340, 1926, 4, 20, UNI_INDICNUMBERFORMS } /* incommonindicnumberforms */, + { 0, 9464, 1026, 5, 2, -UNI_IDST } /* idst=no */, + { 1, 3877, 9811, 17, 4, UNI_KHMR } /* scriptextensions=khmr */, + { 1, 6350, 6638, 12, 12, UNI_JT__R } /* joiningtype=rightjoining */, + { 148, 9691, 8810, 4, 7, UNI_INSOYOMBO } /* blk=soyombo */, + { 2, 9051, 10055, 6, 4, UNI_ECOMP } /* ecomp=true */, + { 1, 9979, 9755, 4, 4, UNI_DSRT } /* scx=dsrt */, + { 9, 8492, 0, 8, 0, UNI_UCASEXTA } /* ucasexta */, + { 0, 10244, 9424, 3, 5, UNI_XPOSIXCNTRL } /* gc=cntrl */, + { 7, 9476, 8276, 3, 4, UNI_BALI } /* sc=bali */, + { 4, 185, 9740, 3, 3, UNI_CYRL } /* iscyrl */, + { 21, 9871, 0, 4, 0, UNI_MRO } /* mroo */, + { 0, 9476, 9107, 5, 4, UNI_SC__KHOJ } /* sc=khojki */, + { 0, 6132, 0, 2, 0, UNI_PF } /* pf */, + { 132, 6741, 36, 11, 1, UNI_DEP } /* deprecated=t */, + { 10, 1553, 48, 9, 1, UNI_M } /* category=m */, + { 0, 5088, 26, 14, 1, UNI_POSIXXDIGIT } /* asciihexdigit=y */, + { 1, 8782, 8635, 7, 7, UNI_SC__HANO } /* script=hanunoo */, + { 0, 6083, 8172, 13, 8, UNI_NV__1_SLASH_160 } 
/* numericvalue=6.25e-03 */, + { 0, 185, 123, 2, 9, UNI_DIA } /* isdiacritic */, + { 86, 9476, 2248, 3, 21, UNI_PRTI } /* sc=inscriptionalparthian */, + { 5, 6083, 7950, 13, 1, UNI_NV__4 } /* numericvalue=4 */, + { 48, 3894, 0, 17, 0, UNI_sterm_values_index } /* sentenceterminal= */, + { 0, 9691, 7104, 4, 11, UNI_INSYLOTINAGRI } /* blk=sylotinagri */, + { 0, 1418, 9365, 25, 4, UNI_CCC__27 } /* canonicalcombiningclass=ccc27 */, + { 153, 10268, 9579, 3, 3, UNI_NV__1_SLASH_8 } /* nv=1/8 */, + { 0, 9476, 9755, 3, 4, UNI_DSRT } /* sc=dsrt */, + { 12, 5130, 0, 14, 0, UNI_CJKCOMPATFORMS } /* cjkcompatforms */, + { 65, 7160, 9238, 3, 3, UNI_YEZI } /* isyezi */, + { 0, 2553, 0, 20, 0, UNI_term_values_index } /* terminalpunctuation= */, + { 0, 2003, 10389, 10, 1, UNI_CASEDLETTER } /* category=l& */, + { 2, 6083, 8100, 13, 8, UNI_NV__5_SLASH_12 } /* numericvalue=4.17e-01 */, + { 1, 9691, 5368, 4, 4, UNI_INLISU } /* blk=lisu */, + { 35, 185, 2433, 2, 4, UNI_GLAG } /* isglag */, + { 0, 4744, 7027, 15, 11, UNI_IDENTIFIERTYPE__RECOMMENDED } /* identifiertype=recommended */, + { 257, 5875, 5979, 13, 13, UNI_JG__MANICHAEANNUN } /* joininggroup=manichaeannun */, + { 0, 8973, 9093, 6, 6, UNI_INKAITHI } /* block=kaithi */, + { 1, 3809, 0, 17, 0, UNI_LETTERLIKESYMBOLS } /* letterlikesymbols */, + { 0, 1418, 5461, 24, 2, UNI_CCC__7 } /* canonicalcombiningclass=nk */, + { 1, 3877, 9514, 17, 5, UNI_ORYA } /* scriptextensions=oriya */, + { 65, 9183, 0, 6, 0, UNI_RJNG } /* rejang */, + { 12, 7580, 728, 10, 2, UNI_WB__MN } /* wordbreak=mn */, + { 0, 9763, 10235, 4, 3, UNI_WB__EB } /* gcb=ebg */, + { 0, 8973, 4504, 6, 15, UNI_BAMUMSUP } /* block=bamumsupplement */, + { 129, 7467, 7550, 3, 10, UNI_AGE__NA } /* in=unassigned */, + { 0, 8973, 1034, 6, 27, UNI_ENCLOSEDCJK } /* block=enclosedcjklettersandmonths */, + { 0, 9045, 1, 6, 1, -UNI_CWKCF } /* cwkcf=n */, + { 1, 9476, 9534, 3, 5, UNI_SC__TAKR } /* sc=takri */, + { 0, 9691, 6506, 4, 12, UNI_MATHALPHANUM } /* blk=mathalphanum */, + { 0, 
7297, 2747, 3, 9, UNI_JAMO } /* ishanguljamo */, + { 3, 6494, 0, 12, 0, UNI_GONM } /* masaramgondi */, + { 66, 185, 7754, 2, 9, UNI_LATINEXTG } /* islatinextg */, + { 0, 8702, 2729, 4, 17, UNI_ENCLOSEDALPHANUMSUP } /* inenclosedalphanumsup */, + { 1, 6083, 9387, 13, 2, UNI_NV__31 } /* numericvalue=31 */, + { 1, 9476, 2264, 4, 3, UNI_SC__KTHI } /* sc=kthi */, + { 3, 5875, 5228, 13, 14, UNI_JG__HAMZAONHEHGOAL } /* joininggroup=hamzaonhehgoal */, + { 1, 9711, 1220, 4, 3, UNI_CCC__214 } /* ccc=ata */, + { 0, 3877, 383, 17, 4, UNI_EGYP } /* scriptextensions=egyp */, + { 0, 4504, 0, 8, 0, UNI_BAMUMSUP } /* bamumsup */, + { 2, 2248, 1321, 3, 24, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* insymbolsandpictographsexta */, + { 1, 1270, 1, 25, 1, -UNI_COMPEX } /* fullcompositionexclusion=n */, + { 35, 1189, 4985, 3, 4, UNI_INTAMIL } /* intamil */, + { 32, 10244, 9048, 3, 2, UNI_CF } /* gc=cf */, + { 1, 185, 8292, 2, 4, UNI_BUGI } /* isbugi */, + { 0, 9476, 2936, 3, 4, UNI_SUND } /* sc=sund */, + { 0, 3398, 1026, 11, 2, -UNI_XPOSIXSPACE } /* whitespace=no */, + { 0, 185, 6972, 2, 4, UNI_NAND } /* isnand */, + { 1, 1418, 9405, 25, 4, UNI_CCC__35 } /* canonicalcombiningclass=ccc35 */, + { 144, 1418, 8171, 24, 2, UNI_CCC__26 } /* canonicalcombiningclass=26 */, + { 4, 7360, 5382, 10, 14, UNI_LB__BK } /* linebreak=mandatorybreak */, + { 0, 8642, 1026, 7, 2, -UNI_HYPHEN } /* hyphen=no */, + { 3, 5875, 8852, 13, 7, UNI_JG__THINYEH } /* joininggroup=thinyeh */, + { 1, 185, 1, 3, 1, UNI_CN } /* iscn */, + { 8, 9045, 10055, 6, 4, UNI_CWKCF } /* cwkcf=true */, + { 0, 9691, 3365, 4, 8, UNI_DINGBATS } /* blk=dingbats */, + { 1, 185, 184, 2, 20, UNI_MISCSYMBOLS } /* ismiscellaneoussymbols */, + { 19, 6083, 8937, 13, 5, UNI_NV__70000 } /* numericvalue=70000 */, + { 2, 1019, 0, 5, 0, UNI_MUSIC } /* music */, + { 294, 9691, 4090, 4, 16, UNI_GEORGIANEXT } /* blk=georgianextended */, + { 423, 3877, 2227, 17, 14, UNI_ROHG } /* scriptextensions=hanifirohingya */, + { 132, 8973, 3809, 6, 17, 
UNI_LETTERLIKESYMBOLS } /* block=letterlikesymbols */, + { 49, 10268, 9635, 3, 4, UNI_NV__5_SLASH_12 } /* nv=5/12 */, + { 1, 7360, 185, 10, 2, UNI_LB__IS } /* linebreak=is */, + { 1, 10268, 9260, 3, 4, UNI_NV__1_SLASH_12 } /* nv=1/12 */, + { 16, 9711, 8147, 4, 2, UNI_CCC__16 } /* ccc=16 */, + { 3, 185, 9775, 2, 4, UNI_GREK } /* isgrek */, + { 1, 9691, 3928, 4, 17, UNI_SUTTONSIGNWRITING } /* blk=suttonsignwriting */, + { 2, 9549, 10055, 5, 4, UNI_XIDS } /* xids=true */, + { 0, 8973, 9655, 6, 4, UNI_INAHOM } /* block=ahom */, + { 0, 185, 868, 2, 18, UNI_PHONETICEXT } /* isphoneticextensions */, + { 0, 185, 3193, 2, 11, UNI_ETHIOPICSUP } /* isethiopicsup */, + { 0, 9434, 1, 5, 1, -UNI_CWCM } /* cwcm=n */, + { 0, 185, 5256, 2, 14, UNI_KANASUP } /* iskanasupplement */, + { 262, 7218, 4505, 3, 14, UNI_BAMUMSUP } /* inbamumsupplement */, + { 2, 1990, 8484, 22, 8, UNI_INSC__TONEMARK } /* indicsyllabiccategory=tonemark */, + { 3, 9691, 8635, 4, 7, UNI_INHANUNOO } /* blk=hanunoo */, + { 313, 1770, 4954, 22, 4, UNI_BPT__O } /* bidipairedbrackettype=open */, + { 0, 9743, 9454, 4, 5, -UNI_DEP } /* dep=false */, + { 3, 3121, 6001, 18, 4, UNI_DT__NONE } /* decompositiontype=none */, + { 0, 9711, 9305, 5, 4, UNI_CCC__15 } /* ccc=ccc15 */, + { 1, 9691, 7600, 4, 10, UNI_YIRADICALS } /* blk=yiradicals */, + { 0, 9979, 10051, 4, 4, UNI_TOTO } /* scx=toto */, + { 9, 8642, 9454, 7, 5, -UNI_HYPHEN } /* hyphen=false */, + { 0, 3877, 10115, 17, 4, UNI_QAAI } /* scriptextensions=zinh */, + { 0, 7360, 8413, 11, 7, UNI_LB__LF } /* linebreak=linefeed */, + { 0, 7570, 0, 4, 0, UNI_WARA } /* wara */, + { 58, 185, 7210, 2, 10, UNI_ASCII } /* isbasiclatin */, + { 2, 9476, 3826, 3, 10, UNI_SC__MANI } /* sc=manichaean */, + { 3, 8973, 1370, 6, 24, UNI_ARABICPFA } /* block=arabicpresentationformsa */, + { 0, 9927, 1026, 4, 2, -UNI_PCM } /* pcm=no */, + { 9, 3877, 7330, 17, 10, UNI_KHAR } /* scriptextensions=kharoshthi */, + { 0, 6083, 9631, 13, 4, UNI_NV__3_SLASH_80 } /* numericvalue=3/80 */, + { 0, 
9727, 10355, 4, 3, UNI_CWL } /* cwl=yes */, + { 0, 8973, 3571, 6, 17, UNI_ALCHEMICAL } /* block=alchemicalsymbols */, + { 1, 9476, 9719, 3, 4, UNI_SC__CPMN } /* sc=cpmn */, + { 812, 9429, 0, 5, 0, UNI_cwcf_values_index } /* cwcf= */, + { 8, 1553, 10396, 9, 2, UNI_ZL } /* category=zl */, + { 4, 9755, 0, 4, 0, UNI_DSRT } /* dsrt */, + { 1, 7580, 496, 10, 2, UNI_WB__NU } /* wordbreak=nu */, + { 48, 21, 9524, 2, 5, UNI_INRUNIC } /* inrunic */, + { 0, 9476, 9687, 3, 4, UNI_BHKS } /* sc=bhks */, + { 0, 7360, 3, 11, 1, UNI_LB__LF } /* linebreak=lf */, + { 747, 9663, 0, 4, 0, UNI_ARMI } /* armi */, + { 101, 7297, 2228, 3, 13, UNI_ROHG } /* ishanifirohingya */, + { 38, 4074, 340, 16, 2, UNI_LO } /* generalcategory=lo */, + { 43, 185, 868, 2, 28, UNI_PHONETICEXTSUP } /* isphoneticextensionssupplement */, + { 129, 9469, 5044, 5, 15, UNI_LOE } /* inpc=visualorderleft */, + { 3, 10217, 0, 3, 0, UNI_bc_values_index } /* bc= */, + { 1, 8973, 8356, 6, 8, UNI_INHIRAGANA } /* block=hiragana */, + { 33, 6083, 8188, 13, 8, UNI_NV__2_SLASH_3 } /* numericvalue=6.67e-01 */, + { 24, 8810, 0, 4, 0, UNI_SOYO } /* soyo */, + { 68, 185, 44, 3, 2, UNI_CJK } /* iscjk */, + { 12, 118, 448, 3, 31, UNI_IDEOGRAPHICSYMBOLS } /* inideographicsymbolsandpunctuation */, + { 64, 8973, 3139, 6, 18, UNI_DEVANAGARIEXT } /* block=devanagariextended */, + { 13, 2304, 7432, 4, 8, UNI_SOGO } /* isoldsogdian */, + { 68, 8973, 3911, 6, 17, UNI_SMALLFORMS } /* block=smallformvariants */, + { 1, 10268, 8004, 3, 8, UNI_NV__5_SLASH_2 } /* nv=2.50e+00 */, + { 2, 1320, 0, 25, 0, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* symbolsandpictographsexta */, + { 2, 9979, 4759, 4, 15, UNI_ARMI } /* scx=imperialaramaic */, + { 0, 4865, 1163, 4, 2, UNI_CPRT } /* iscprt */, + { 1, 10352, 8313, 3, 3, UNI_WB__EB } /* wb=gaz */, + { 204, 2974, 0, 19, 0, UNI_SUPARROWSB } /* supplementalarrowsb */, + { 24, 2085, 0, 4, 0, UNI_MODI } /* modi */, + { 0, 3894, 3, 17, 1, -UNI_STERM } /* sentenceterminal=f */, + { 18, 9979, 4924, 4, 15, UNI_NARB } 
/* scx=oldnortharabian */, + { 0, 8579, 0, 7, 0, UNI_CJKEXTF } /* cjkextf */, + { 0, 2373, 0, 20, 0, UNI_PC } /* connectorpunctuation */, + { 4, 1858, 3, 22, 1, -UNI_CWT } /* changeswhentitlecased=f */, + { 2, 185, 2165, 3, 20, UNI_CYRILLICSUP } /* iscyrillicsupplementary */, + { 366, 9429, 1, 5, 1, -UNI_CWCF } /* cwcf=n */, + { 3, 8782, 9707, 7, 4, UNI_CANS } /* script=cans */, + { 392, 6386, 0, 7, 0, UNI_MAHJONG } /* mahjong */, + { 2, 868, 0, 11, 0, UNI_PHONETICEXT } /* phoneticext */, + { 0, 10280, 1, 3, 1, -UNI_RI } /* ri=n */, + { 0, 9476, 7570, 3, 10, UNI_WARA } /* sc=warangciti */, + { 27, 4202, 0, 16, 0, UNI_LINEARBSYLLABARY } /* linearbsyllabary */, + { 0, 8782, 9117, 7, 6, UNI_LEPC } /* script=lepcha */, + { 0, 10247, 5480, 3, 14, UNI_JG__MANICHAEANRESH } /* jg=manichaeanresh */, + { 0, 10508, 468, 8, 5, UNI_XPOSIXPUNCT } /* isxposixpunct */, + { 0, 2056, 1, 22, 1, -UNI__PERL_NCHAR } /* noncharactercodepoint=n */, + { 6, 9979, 2353, 4, 20, UNI_HLUW } /* scx=anatolianhieroglyphs */, + { 0, 1852, 3, 6, 1, -UNI_CASED } /* cased=f */, + { 2, 1553, 3301, 9, 18, UNI_PI } /* category=initialpunctuation */, + { 1, 9979, 5227, 4, 4, UNI_CHAM } /* scx=cham */, + { 0, 8782, 2879, 7, 9, UNI_SC__MONG } /* script=mongolian */, + { 8, 8973, 909, 6, 14, UNI_PUA } /* block=privateusearea */, + { 3, 3121, 1295, 18, 5, UNI_DT__SUP } /* decompositiontype=super */, + { 4, 7580, 5669, 10, 2, UNI_WB__EB } /* wordbreak=eb */, + { 36, 9711, 9499, 4, 5, UNI_CCC__7 } /* ccc=nukta */, + { 11, 2936, 0, 4, 0, UNI_SUND } /* sund */, + { 4, 9691, 660, 4, 30, UNI_CJKEXTF } /* blk=cjkunifiedideographsextensionf */, + { 0, 3877, 9967, 17, 4, UNI_RUNR } /* scriptextensions=runr */, + { 0, 5662, 36, 15, 1, UNI_SB__ST } /* sentencebreak=st */, + { 98, 8973, 1345, 6, 25, UNI_SYMBOLSFORLEGACYCOMPUTING } /* block=symbolsforlegacycomputing */, + { 0, 9476, 8979, 3, 6, UNI_CARI } /* sc=carian */, + { 706, 4157, 1931, 3, 15, UNI_INDICNUMBERFORMS } /* isindicnumberforms */, + { 0, 9691, 2085, 4, 4, 
UNI_INMODI } /* blk=modi */, + { 96, 6697, 26, 11, 1, UNI_XPOSIXALPHA } /* alphabetic=y */, + { 0, 9691, 4489, 4, 15, UNI_ARABICEXTB } /* blk=arabicextendedb */, + { 1, 9647, 10199, 4, 3, UNI_AGE__6_DOT_1 } /* age=6.1 */, + { 0, 3707, 0, 17, 0, UNI_ETHIOPICEXTA } /* ethiopicextendeda */, + { 0, 8782, 9739, 7, 4, UNI_SC__CYRL } /* script=cyrl */, + { 52, 6340, 2691, 4, 17, UNI_COUNTINGROD } /* incountingrodnumerals */, + { 2, 9871, 0, 3, 0, UNI_MRO } /* mro */, + { 2, 8887, 3, 7, 1, -UNI_XPOSIXSPACE } /* wspace=f */, + { 384, 9979, 6302, 4, 6, UNI_HEBR } /* scx=hebrew */, + { 18, 8973, 750, 6, 16, UNI_ENCLOSEDALPHANUM } /* block=enclosedalphanum */, + { 0, 9743, 0, 4, 0, UNI_dep_values_index } /* dep= */, + { 2, 185, 5771, 2, 13, UNI_BLOCKELEMENTS } /* isblockelements */, + { 3, 9449, 0, 10, 0, -UNI_EMOD } /* emod=false */, + { 5, 9979, 6386, 4, 4, UNI_MAHJ } /* scx=mahj */, + { 3, 7230, 3741, 10, 17, UNI_BC__ES } /* bidiclass=europeanseparator */, + { 9, 4074, 729, 16, 6, UNI_N } /* generalcategory=number */, + { 0, 9711, 8901, 4, 3, UNI_CCC__216 } /* ccc=216 */, + { 1, 10229, 2593, 3, 4, UNI_DT__VERT } /* dt=vert */, + { 65, 7467, 8099, 3, 2, UNI_IN__14 } /* in=14 */, + { 0, 6697, 9454, 11, 5, -UNI_XPOSIXALPHA } /* alphabetic=false */, + { 2, 2304, 4347, 3, 15, UNI_PO } /* isotherpunctuation */, + { 261, 8973, 4314, 6, 7, UNI_INMYANMAR } /* block=myanmar */, + { 2, 8973, 4442, 6, 16, UNI_TANGUTSUP } /* block=tangutsupplement */, + { 0, 8961, 3, 6, 1, -UNI_BIDIC } /* bidic=f */, + { 0, 10223, 10355, 3, 3, UNI_CI } /* ci=yes */, + { 1, 8973, 8340, 6, 8, UNI_INGUJARATI } /* block=gujarati */, + { 0, 185, 8537, 2, 7, UNI_BENG } /* isbengali */, + { 1, 1418, 9335, 25, 4, UNI_CCC__21 } /* canonicalcombiningclass=ccc21 */, + { 24, 10247, 5704, 3, 10, UNI_JG__TEHMARBUTA } /* jg=tehmarbuta */, + { 28, 6083, 5732, 13, 9, UNI_NV__100000000 } /* numericvalue=100000000 */, + { 1, 2248, 2312, 3, 6, UNI_INSINHALA } /* insinhala */, + { 4, 185, 7330, 2, 10, UNI_KHAR } /* 
iskharoshthi */, + { 0, 8973, 5242, 6, 14, UNI_HIGHSURROGATES } /* block=highsurrogates */, + { 0, 10247, 9995, 3, 4, UNI_JG__SHIN } /* jg=shin */, + { 0, 185, 1014, 2, 5, UNI_GREK } /* isgreek */, + { 2, 7218, 7211, 3, 9, UNI_ASCII } /* inbasiclatin */, + { 1, 21, 9656, 3, 3, UNI_INAHOM } /* inahom */, + { 7, 3877, 9791, 17, 4, UNI_HLUW } /* scriptextensions=hluw */, + { 0, 9711, 9405, 5, 4, UNI_CCC__35 } /* ccc=ccc35 */, + { 9, 2332, 0, 21, 0, UNI_YIJING } /* yijinghexagramsymbols */, + { 3, 185, 3104, 3, 17, UNI_COPTICEPACTNUMBERS } /* iscopticepactnumbers */, + { 3, 9691, 8796, 4, 7, UNI_SHAW } /* blk=shavian */, + { 733, 10253, 341, 3, 2, UNI_LB__OP } /* lb=op */, + { 2, 2304, 7810, 4, 7, UNI_ITAL } /* isolditalic */, + { 0, 185, 3050, 3, 7, UNI_CHER } /* ischerokee */, + { 0, 6741, 1, 11, 1, -UNI_DEP } /* deprecated=n */, + { 0, 1418, 8988, 24, 3, UNI_CCC__103 } /* canonicalcombiningclass=103 */, + { 22, 185, 8691, 2, 4, UNI_MULT } /* ismult */, + { 0, 1553, 0, 10, 0, UNI_S } /* category=s */, + { 32, 9691, 7241, 5, 9, UNI_BOXDRAWING } /* blk=boxdrawing */, + { 57, 185, 3319, 2, 9, UNI_LATINEXTA } /* islatinexta */, + { 0, 9464, 10355, 5, 3, UNI_IDST } /* idst=yes */, + { 0, 1418, 8099, 24, 2, UNI_CCC__14 } /* canonicalcombiningclass=14 */, + { 0, 10553, 2937, 3, 8, UNI_SUND } /* issundanese */, + { 6, 9290, 8302, 4, 6, UNI_INDUPLOYAN } /* induployan */, + { 3, 6529, 4925, 3, 14, UNI_NARB } /* inoldnortharabian */, + { 0, 9461, 496, 3, 2, UNI_SB__NU } /* sb=nu */, + { 7, 8782, 8607, 7, 4, UNI_ELBA } /* script=elba */, + { 9, 1270, 36, 25, 1, UNI_COMPEX } /* fullcompositionexclusion=t */, + { 0, 9476, 10083, 3, 4, UNI_VAI } /* sc=vaii */, + { 0, 10229, 0, 3, 0, UNI_dt_values_index } /* dt= */, + { 1, 8967, 36, 6, 1, UNI_BIDIM } /* bidim=t */, + { 2, 3877, 9963, 17, 4, UNI_ROHG } /* scriptextensions=rohg */, + { 128, 5875, 2651, 13, 19, UNI_JG__BURUSHASKIYEHBARREE } /* joininggroup=burushaskiyehbarree */, + { 11, 2003, 0, 10, 1, UNI_UPPERCASELETTER } /* 
category=lu */, + { 1, 9695, 4954, 4, 4, UNI_BPT__O } /* bpt=open */, + { 0, 9863, 0, 4, 0, UNI_MIAO } /* miao */, + { 7, 9927, 9454, 4, 5, -UNI_PCM } /* pcm=false */, + { 32, 9691, 1466, 4, 24, UNI_DIACRITICALSFORSYMBOLS } /* blk=combiningmarksforsymbols */, + { 1, 8782, 10103, 7, 4, UNI_SC__YI } /* script=yiii */, + { 0, 9979, 9081, 4, 6, UNI_HATR } /* scx=hatran */, + { 4, 1990, 1490, 22, 24, UNI_INSC__CONSONANTSUCCEEDINGREPHA } /* indicsyllabiccategory=consonantsucceedingrepha */, + { 0, 185, 1968, 2, 22, UNI_EARLYDYNASTICCUNEIFORM } /* isearlydynasticcuneiform */, + { 1, 5592, 1026, 14, 2, -UNI_PATSYN } /* patternsyntax=no */, + { 1, 185, 9524, 2, 5, UNI_RUNR } /* isrunic */, + { 0, 8782, 4534, 7, 4, UNI_BRAI } /* script=brai */, + { 0, 4972, 8839, 3, 6, UNI_LANA } /* istaitham */, + { 0, 9476, 9294, 3, 5, UNI_SC__BUHD } /* sc=buhid */, + { 11, 8782, 7781, 7, 9, UNI_NBAT } /* script=nabataean */, + { 10, 2304, 8742, 4, 5, UNI_OLCK } /* isolchiki */, + { 0, 1418, 10145, 24, 3, UNI_CCC__BL } /* canonicalcombiningclass=218 */, + { 2, 8782, 1219, 7, 8, UNI_SC__KANA } /* script=katakana */, + { 4, 2304, 263, 3, 3, UNI_OSMA } /* isosma */, + { 0, 9063, 10355, 6, 3, UNI_EPRES } /* epres=yes */, + { 263, 8961, 10355, 6, 3, UNI_BIDIC } /* bidic=yes */, + { 4, 6340, 8566, 3, 6, UNI_CJKEXTD } /* incjkextd */, + { 6, 9979, 9783, 4, 4, UNI_GURU } /* scx=guru */, + { 513, 21, 4170, 2, 9, UNI_LATIN1 } /* inlatin1sup */, + { 21, 5875, 7038, 13, 11, UNI_JG__ROHINGYAYEH } /* joininggroup=rohingyayeh */, + { 1, 5758, 0, 12, 0, UNI_BIDIM } /* bidimirrored */, + { 7, 10553, 4411, 3, 8, UNI_SYRIACSUP } /* issyriacsup */, + { 5, 10268, 8943, 3, 4, UNI_NV__8000 } /* nv=8000 */, + { 0, 9219, 36, 6, 1, UNI_XPOSIXUPPER } /* upper=t */, + { 72, 10268, 10366, 3, 2, UNI_NV__46 } /* nv=46 */, + { 1, 5408, 4383, 4, 11, UNI_MATHOPERATORS } /* inmathoperators */, + { 18, 9979, 7820, 4, 4, UNI_PERM } /* scx=perm */, + { 3, 9711, 8211, 4, 2, UNI_CCC__18 } /* ccc=18 */, + { 38, 7580, 4912, 10, 2, 
UNI_WB__DQ } /* wordbreak=dq */, + { 268, 6083, 7611, 13, 8, UNI_NV__1_SLASH_2 } /* numericvalue=5.00e-01 */, + { 88, 1792, 3, 22, 1, -UNI_CWCF } /* changeswhencasefolded=f */, + { 0, 6044, 0, 13, 0, UNI_MAYANNUMERALS } /* mayannumerals */, + { 41, 9979, 9831, 4, 4, UNI_LAO } /* scx=laoo */, + { 0, 4090, 0, 11, 0, UNI_GEORGIANEXT } /* georgianext */, + { 916, 5592, 0, 13, 0, UNI_PATSYN } /* patternsyntax */, + { 1, 3877, 9739, 17, 4, UNI_CYRL } /* scriptextensions=cyrl */, + { 25, 185, 7709, 2, 9, UNI_SIND } /* iskhudawadi */, + { 5, 9476, 9975, 3, 4, UNI_SARB } /* sc=sarb */, + { 0, 5875, 4244, 13, 3, UNI_JG__LAM } /* joininggroup=lam */, + { 2, 1418, 9671, 24, 4, UNI_CCC__216 } /* canonicalcombiningclass=atar */, + { 1, 8881, 4491, 4, 13, UNI_ARABICEXTB } /* isarabicextendedb */, + { 0, 9691, 317, 4, 33, UNI_SUPMATHOPERATORS } /* blk=supplementalmathematicaloperators */, + { 13, 8973, 6626, 6, 12, UNI_PLAYINGCARDS } /* block=playingcards */, + { 0, 1858, 0, 21, 0, UNI_CWT } /* changeswhentitlecased */, + { 0, 9469, 7115, 5, 11, UNI_INPC__TOPANDRIGHT } /* inpc=topandright */, + { 56, 118, 2455, 4, 18, UNI_ININSCRIPTIONALPAHLAVI } /* ininscriptionalpahlavi */, + { 0, 9979, 7844, 4, 9, UNI_PALM } /* scx=palmyrene */, + { 0, 9476, 8340, 3, 8, UNI_SC__GUJR } /* sc=gujarati */, + { 514, 8973, 721, 7, 15, UNI_CUNEIFORMNUMBERS } /* block=cuneiformnumbers */, + { 0, 185, 8316, 2, 7, UNI_EXTPICT } /* isextpict */, + { 4, 9147, 3, 6, 1, -UNI__PERL_NCHAR } /* nchar=f */, + { 65, 4074, 5797, 16, 13, UNI_XPOSIXDIGIT } /* generalcategory=decimalnumber */, + { 1, 6083, 10130, 13, 3, UNI_NV__1_SLASH_7 } /* numericvalue=1/7 */, + { 132, 2304, 1062, 3, 26, UNI_OCR } /* isopticalcharacterrecognition */, + { 0, 2553, 0, 19, 0, UNI_TERM } /* terminalpunctuation */, + { 1, 8973, 2311, 6, 21, UNI_SINHALAARCHAICNUMBERS } /* block=sinhalaarchaicnumbers */, + { 0, 8782, 8621, 7, 4, UNI_SC__GRAN } /* script=gran */, + { 0, 5592, 0, 14, 0, UNI_patsyn_values_index } /* patternsyntax= */, + { 
18, 10283, 3, 3, 1, -UNI_SD } /* sd=f */, + { 1, 1418, 10163, 24, 3, UNI_CCC__AR } /* canonicalcombiningclass=232 */, + { 18, 10268, 8943, 3, 6, UNI_NV__800000 } /* nv=800000 */, + { 0, 9691, 1930, 4, 16, UNI_INDICNUMBERFORMS } /* blk=indicnumberforms */, + { 0, 3409, 10055, 18, 4, UNI_RI } /* regionalindicator=true */, + { 11, 7360, 989, 10, 2, UNI_LB__CP } /* linebreak=cp */, + { 0, 9979, 8775, 4, 7, UNI_PHAG } /* scx=phagspa */, + { 1, 9883, 0, 4, 0, UNI_NARB } /* narb */, + { 32, 8702, 752, 4, 28, UNI_ENCLOSEDALPHANUMSUP } /* inenclosedalphanumericsupplement */, + { 74, 7297, 2747, 3, 18, UNI_JAMOEXTA } /* ishanguljamoextendeda */, + { 0, 9979, 8670, 4, 7, UNI_MAKA } /* scx=makasar */, + { 11, 8973, 350, 6, 33, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* block=supplementalsymbolsandpictographs */, + { 177, 9979, 1678, 4, 5, UNI_LATN } /* scx=latin */, + { 0, 185, 9716, 3, 3, UNI_CHRS } /* ischrs */, + { 67, 6083, 9563, 13, 4, UNI_NV__1_SLASH_10 } /* numericvalue=1/10 */, + { 0, 9439, 10055, 5, 4, UNI_DASH } /* dash=true */, + { 10, 1935, 0, 11, 0, UNI_NUMBERFORMS } /* numberforms */, + { 1, 9476, 9529, 3, 5, UNI_SC__TALE } /* sc=taile */, + { 0, 9171, 36, 6, 1, UNI__PERL_PATWS } /* patws=t */, + { 1, 8973, 4106, 6, 16, UNI_HALFANDFULLFORMS } /* block=halfandfullforms */, + { 341, 1189, 2101, 3, 21, UNI_TRANSPORTANDMAP } /* intransportandmapsymbols */, + { 264, 9763, 912, 4, 1, UNI_GCB__V } /* gcb=v */, + { 0, 10268, 7934, 3, 2, UNI_NV__25 } /* nv=25 */, + { 0, 9476, 9795, 3, 4, UNI_HMNG } /* sc=hmng */, + { 0, 9051, 10355, 6, 3, UNI_ECOMP } /* ecomp=yes */, + { 7, 3283, 9454, 18, 5, -UNI_IDSB } /* idsbinaryoperator=false */, + { 0, 6083, 8913, 13, 4, UNI_NV__4000 } /* numericvalue=4000 */, + { 0, 7682, 0, 8, 0, UNI_EXT } /* extender */, + { 1, 5875, 1512, 13, 3, UNI_JG__HAH } /* joininggroup=hah */, + { 48, 8955, 36, 6, 1, UNI_XPOSIXALPHA } /* alpha=t */, + { 0, 8973, 1632, 6, 18, UNI_GEOMETRICSHAPESEXT } /* block=geometricshapesext */, + { 21, 9476, 9831, 3, 3, UNI_LAO 
} /* sc=lao */, + { 7, 9691, 9135, 4, 6, UNI_INLYDIAN } /* blk=lydian */, + { 0, 6340, 116, 4, 23, UNI_DIACRITICALS } /* incombiningdiacriticalmarks */, + { 56, 9787, 0, 4, 0, UNI_HANO } /* hano */, + { 0, 9469, 7451, 3, 9, UNI_INPHOENICIAN } /* inphoenician */, + { 3, 9544, 9454, 5, 5, -UNI_XIDC } /* xidc=false */, + { 256, 9476, 9963, 3, 4, UNI_SC__ROHG } /* sc=rohg */, + { 2, 6083, 7950, 13, 2, UNI_NV__43 } /* numericvalue=43 */, + { 0, 5662, 126, 14, 2, UNI_LB__CR } /* sentencebreak=cr */, + { 21, 5088, 3, 14, 1, -UNI_POSIXXDIGIT } /* asciihexdigit=f */, + { 0, 10244, 5014, 3, 15, UNI_UPPERCASELETTER } /* gc=uppercaseletter */, + { 0, 9691, 868, 4, 11, UNI_PHONETICEXT } /* blk=phoneticext */, + { 1, 7460, 10316, 10, 3, UNI_IN__5 } /* presentin=v50 */, + { 640, 839, 0, 29, 0, UNI_MISCARROWS } /* miscellaneoussymbolsandarrows */, + { 0, 7460, 9587, 10, 4, UNI_IN__11 } /* presentin=11.0 */, + { 0, 9045, 9454, 6, 5, -UNI_CWKCF } /* cwkcf=false */, + { 2, 10553, 8825, 3, 6, UNI_SUPPUAB } /* issuppuab */, + { 113, 4972, 3482, 3, 10, UNI_TAIXUANJING } /* istaixuanjing */, + { 0, 9051, 26, 6, 1, UNI_ECOMP } /* ecomp=y */, + { 0, 8782, 0, 7, 0, UNI_sc_values_index } /* script= */, + { 3, 7467, 9596, 3, 3, UNI_IN__2_DOT_1 } /* in=2.1 */, + { 1, 10247, 10265, 3, 3, UNI_JG__MIM } /* jg=mim */, + { 0, 9979, 9519, 4, 5, UNI_OSGE } /* scx=osage */, + { 3, 9979, 1116, 4, 4, UNI_HANG } /* scx=hang */, + { 36, 1418, 9315, 25, 4, UNI_CCC__17 } /* canonicalcombiningclass=ccc17 */, + { 12, 8452, 0, 8, 0, UNI_SPECIALS } /* specials */, + { 1090, 9691, 3139, 4, 13, UNI_DEVANAGARIEXT } /* blk=devanagariext */, + { 1, 3121, 69, 18, 3, UNI_DT__SUP } /* decompositiontype=sup */, + { 0, 8973, 1562, 6, 24, UNI_SUPSYMBOLSANDPICTOGRAPHS } /* block=supsymbolsandpictographs */, + { 0, 9033, 0, 6, 0, UNI_CAKM } /* chakma */, + { 5, 10268, 8036, 3, 8, UNI_NV__1_SLASH_32 } /* nv=3.12e-02 */, + { 5, 9489, 9454, 5, 5, -UNI_MATH } /* math=false */, + { 2, 9711, 8994, 4, 3, UNI_CCC__107 } /* ccc=107 
*/, + { 522, 10547, 3403, 6, 5, UNI_POSIXSPACE } /* isperlspace */, + { 14, 4426, 0, 16, 0, UNI_TANGUTCOMPONENTS } /* tangutcomponents */, + { 2, 9691, 479, 4, 31, UNI_MATHALPHANUM } /* blk=mathematicalalphanumericsymbols */, + { 7, 3877, 8292, 17, 4, UNI_BUGI } /* scriptextensions=bugi */, + { 3, 9655, 0, 4, 0, UNI_AHOM } /* ahom */, + { 1034, 3877, 4534, 17, 4, UNI_BRAI } /* scriptextensions=brai */, + { 2, 185, 571, 3, 29, UNI_CJKEXTC } /* iscjkunifiedideographsextensionc */, + { 0, 10247, 7170, 3, 10, UNI_JG__AFRICANFEH } /* jg=africanfeh */, + { 11, 10402, 1528, 6, 9, UNI__PERL_SURROGATE } /* _perl_surrogate */, + { 0, 8677, 0, 7, 0, UNI_MAND } /* mandaic */, + { 0, 2803, 9454, 19, 5, -UNI_IDST } /* idstrinaryoperator=false */, + { 0, 9476, 8300, 3, 4, UNI_SC__DUPL } /* sc=dupl */, + { 0, 8782, 4759, 7, 15, UNI_ARMI } /* script=imperialaramaic */, + { 8, 8973, 8859, 6, 7, UNI_INTIBETAN } /* block=tibetan */, + { 4, 6674, 3, 12, 1, -UNI_XIDC } /* xidcontinue=f */, + { 7, 21, 5089, 3, 4, UNI_ASCII } /* inascii */, + { 0, 1852, 0, 5, 0, UNI_CASED } /* cased */, + { 0, 9731, 9454, 4, 5, -UNI_CWT } /* cwt=false */, + { 2, 1418, 5849, 24, 13, UNI_CCC__IS } /* canonicalcombiningclass=iotasubscript */, + { 0, 8782, 1177, 8, 3, UNI_SORA } /* script=sora */, + { 1, 8444, 1026, 8, 2, -UNI_RADICAL } /* radical=no */, + { 258, 924, 0, 28, 0, UNI_SUPPUAB } /* supplementaryprivateuseareab */, + { 528, 10511, 468, 5, 5, UNI_POSIXPUNCT } /* posixpunct */, + { 0, 8782, 10047, 7, 4, UNI_TNSA } /* script=tnsa */, + { 0, 9711, 9395, 5, 4, UNI_CCC__33 } /* ccc=ccc33 */, + { 0, 9476, 7500, 3, 10, UNI_SAUR } /* sc=saurashtra */, + { 17, 8973, 5634, 6, 14, UNI_INPSALTERPAHLAVI } /* block=psalterpahlavi */, + { 0, 10247, 7187, 3, 3, UNI_JG__QAF } /* jg=qaf */, + { 0, 1418, 7995, 24, 2, UNI_CCC__12 } /* canonicalcombiningclass=12 */, + { 0, 9691, 9231, 4, 6, UNI_INWANCHO } /* blk=wancho */, + { 3, 10352, 10394, 3, 2, UNI_WB__XX } /* wb=xx */, + { 1, 9691, 9129, 4, 6, UNI_INLYCIAN } /* 
blk=lycian */, + { 0, 6675, 9454, 11, 5, -UNI_IDC } /* idcontinue=false */, + { 0, 2501, 0, 3, 0, UNI_PUA } /* pua */, + { 512, 9476, 9843, 3, 4, UNI_SC__LINB } /* sc=linb */, + { 1, 7360, 5102, 10, 14, UNI_LB__CR } /* linebreak=carriagereturn */, + { 13, 9691, 3656, 4, 17, UNI_CYRILLICEXTA } /* blk=cyrillicextendeda */, + { 0, 1538, 3012, 24, 19, UNI_INPC__TOPANDBOTTOMANDLEFT } /* indicpositionalcategory=topandbottomandleft */, + { 180, 10349, 1026, 3, 2, -UNI_VS } /* vs=no */, + { 0, 9711, 9022, 5, 5, UNI_CCC__132 } /* ccc=ccc132 */, + { 0, 185, 4378, 2, 16, UNI_SUPMATHOPERATORS } /* issupmathoperators */, + { 3, 9190, 3, 5, 1, -UNI_TERM } /* term=f */, + { 35, 8684, 0, 4, 0, UNI_MARC } /* marc */, + { 1, 10352, 496, 3, 2, UNI_WB__NU } /* wb=nu */, + { 1, 185, 721, 3, 8, UNI_XSUX } /* iscuneiform */, + { 16, 9476, 9482, 3, 4, UNI_PHLI } /* sc=phli */, + { 4, 10253, 3, 4, 1, UNI_LB__LF } /* lb=lf */, + { 8, 8768, 10355, 7, 3, UNI_PATSYN } /* patsyn=yes */, + { 148, 6083, 8092, 13, 8, UNI_NV__2_SLASH_5 } /* numericvalue=4.00e-01 */, + { 1, 8702, 752, 4, 19, UNI_ENCLOSEDALPHANUM } /* inenclosedalphanumerics */, + { 0, 6083, 8252, 13, 8, UNI_NV__11_SLASH_12 } /* numericvalue=9.17e-01 */, + { 1, 9691, 2433, 4, 20, UNI_GLAGOLITICSUP } /* blk=glagoliticsupplement */, + { 17, 9735, 0, 3, 0, UNI_CWU } /* cwu */, + { 48, 8967, 1, 6, 1, -UNI_BIDIM } /* bidim=n */, + { 228, 10244, 10396, 3, 2, UNI_ZL } /* gc=zl */, + { 3, 10244, 407, 3, 7, UNI_XPOSIXCNTRL } /* gc=control */, + { 1, 10516, 473, 3, 2, UNI_PUA } /* ispua */, + { 5, 8782, 2937, 8, 3, UNI_SUND } /* script=sund */, + { 0, 7467, 10205, 3, 3, UNI_IN__7 } /* in=7.0 */, + { 2, 2206, 6278, 21, 12, UNI_WB__EB } /* graphemeclusterbreak=glueafterzwj */, + { 3, 2206, 1088, 21, 7, UNI_GCB__PP } /* graphemeclusterbreak=prepend */, + { 19, 1189, 4427, 3, 5, UNI_INTANGUT } /* intangut */, + { 0, 9476, 4504, 3, 4, UNI_BAMU } /* sc=bamu */, + { 0, 8782, 4426, 7, 4, UNI_TANG } /* script=tang */, + { 36, 10268, 8220, 3, 8, 
UNI_NV__5_SLASH_6 } /* nv=8.33e-01 */, + { 53, 7682, 1, 9, 1, -UNI_EXT } /* extender=n */, + { 0, 1553, 1466, 9, 13, UNI_M } /* category=combiningmark */, + { 0, 3877, 9863, 17, 4, UNI_MIAO } /* scriptextensions=miao */, + { 0, 7460, 9596, 10, 3, UNI_IN__2_DOT_1 } /* presentin=2.1 */, + { 13, 185, 2144, 3, 20, UNI_CJKRADICALSSUP } /* iscjkradicalssupplement */, + { 1, 5875, 6482, 13, 12, UNI_JG__MANICHAEANPE } /* joininggroup=manichaeanpe */, + { 802, 185, 24, 2, 1, UNI_L } /* isl */, + { 0, 10223, 0, 3, 0, UNI_ci_values_index } /* ci= */, + { 1, 8973, 7570, 6, 10, UNI_INWARANGCITI } /* block=warangciti */, + { 6, 8973, 3978, 6, 11, UNI_BOPOMOFOEXT } /* block=bopomofoext */, + { 8, 7360, 6818, 10, 11, UNI_LB__IN } /* linebreak=inseparable */, + { 18, 7580, 0, 4, 0, UNI_XPOSIXWORD } /* word */, + { 137, 9524, 0, 5, 0, UNI_RUNR } /* runic */, + { 24, 1553, 5582, 10, 10, UNI_MC } /* category=spacingmark */, + { 145, 8782, 9851, 7, 4, UNI_MEDF } /* script=medf */, + { 1, 185, 3707, 2, 16, UNI_ETHIOPICEXT } /* isethiopicextended */, + { 0, 6340, 8552, 3, 6, UNI_CJKEXTB } /* incjkextb */, + { 0, 3121, 9759, 18, 4, UNI_DT__FONT } /* decompositiontype=font */, + { 0, 9476, 2164, 3, 8, UNI_SC__CYRL } /* sc=cyrillic */, + { 2, 5648, 10055, 14, 4, UNI_QMARK } /* quotationmark=true */, + { 0, 9691, 7520, 4, 10, UNI_SUPARROWSA } /* blk=suparrowsa */, + { 1, 5592, 10055, 14, 4, UNI_PATSYN } /* patternsyntax=true */, + { 0, 6302, 0, 4, 0, UNI_HEBR } /* hebr */, + { 0, 6340, 1903, 3, 18, UNI_CJKCOMPATIDEOGRAPHS } /* incjkcompatideographs */, + { 297, 10244, 24, 3, 1, UNI_L } /* gc=l */, + { 3, 9703, 0, 4, 0, UNI_CAKM } /* cakm */, + { 2, 10217, 10259, 3, 3, UNI_BC__LRI } /* bc=lri */, + { 1, 9476, 9663, 3, 4, UNI_ARMI } /* sc=armi */, + { 803, 9979, 9911, 4, 4, UNI_ORKH } /* scx=orkh */, + { 398, 8537, 0, 4, 0, UNI_BENG } /* beng */, + { 1, 10217, 3373, 3, 18, UNI_BC__B } /* bc=paragraphseparator */, + { 16, 3894, 10355, 17, 3, UNI_STERM } /* sentenceterminal=yes */, + { 0, 1836, 
26, 22, 1, UNI_CWL } /* changeswhenlowercased=y */, + { 0, 8782, 8670, 7, 7, UNI_MAKA } /* script=makasar */, + { 1, 7907, 1026, 9, 2, -UNI_XIDS } /* xidstart=no */, + { 0, 7467, 9595, 3, 4, UNI_IN__12_DOT_1 } /* in=12.1 */, + { 0, 4074, 5810, 16, 13, UNI_ME } /* generalcategory=enclosingmark */, + { 1, 5662, 8747, 14, 7, UNI_SB__LE } /* sentencebreak=oletter */, + { 0, 4074, 1067, 16, 2, UNI_CASEDLETTER } /* generalcategory=lc */, + { 2, 8973, 924, 6, 28, UNI_SUPPUAB } /* block=supplementaryprivateuseareab */, + { 1, 9979, 8740, 4, 7, UNI_OLCK } /* scx=olchiki */, + { 3, 9711, 10169, 4, 3, UNI_CCC__DA } /* ccc=234 */, + { 0, 6340, 4043, 3, 15, UNI_CYPRIOTSYLLABARY } /* incypriotsyllabary */, + { 143, 9803, 9, 4, 2, UNI_HST__NA } /* hst=na */, + { 1, 1418, 10169, 24, 3, UNI_CCC__DA } /* canonicalcombiningclass=234 */, + { 0, 10352, 8308, 3, 8, UNI_WB__EB } /* wb=ebasegaz */, + { 33, 9544, 26, 5, 1, UNI_XIDC } /* xidc=y */, + { 0, 10352, 7772, 3, 6, UNI_WB__MN } /* wb=midnum */, + { 0, 7460, 8046, 10, 2, UNI_IN__13 } /* presentin=13 */, + { 0, 185, 6972, 2, 11, UNI_NAND } /* isnandinagari */, + { 0, 9979, 9195, 4, 6, UNI_TNSA } /* scx=tangsa */, + { 178, 8973, 4442, 6, 9, UNI_TANGUTSUP } /* block=tangutsup */, + { 18, 9695, 17, 4, 1, UNI_BPT__O } /* bpt=o */, + { 2, 3656, 0, 17, 0, UNI_CYRILLICEXTA } /* cyrillicextendeda */, + { 3, 9474, 2393, 5, 20, UNI_INSC__CONSONANTPLACEHOLDER } /* insc=consonantplaceholder */, + { 262, 9979, 6972, 4, 4, UNI_NAND } /* scx=nand */, + { 0, 10247, 9855, 3, 4, UNI_JG__MEEM } /* jg=meem */, + { 5, 7360, 43, 10, 2, UNI_LB__CJ } /* linebreak=cj */, + { 0, 9439, 1026, 5, 2, -UNI_DASH } /* dash=no */, + { 0, 185, 5312, 2, 14, UNI_LATINEXTD } /* islatinextendedd */, + { 10, 8973, 7817, 6, 9, UNI_INOLDPERMIC } /* block=oldpermic */, + { 7, 8973, 0, 6, 42, UNI_UCASEXT } /* block=unifiedcanadianaboriginalsyllabicsextended */, + { 0, 9189, 0, 5, 0, UNI_STERM } /* sterm */, + { 4, 6083, 8949, 13, 4, UNI_NV__9000 } /* numericvalue=9000 */, + { 
0, 1167, 3, 26, 1, -UNI_DI } /* defaultignorablecodepoint=f */, + { 170, 7460, 9599, 10, 4, UNI_IN__13 } /* presentin=13.0 */, + { 0, 9979, 9105, 4, 6, UNI_KHOJ } /* scx=khojki */, + { 118, 9711, 9402, 4, 2, UNI_CCC__34 } /* ccc=34 */, + { 4, 9979, 9117, 4, 4, UNI_LEPC } /* scx=lepc */, + { 2, 10244, 10388, 3, 2, UNI_CASEDLETTER } /* gc=l& */, + { 0, 1418, 8998, 25, 5, UNI_CCC__118 } /* canonicalcombiningclass=ccc118 */, + { 7, 10268, 8043, 3, 2, UNI_NV__23 } /* nv=23 */, + { 0, 9691, 3139, 4, 10, UNI_INDEVANAGARI } /* blk=devanagari */, + { 1, 8973, 8492, 6, 8, UNI_UCASEXTA } /* block=ucasexta */, + { 2, 8782, 10023, 7, 4, UNI_SC__TAML } /* script=taml */, + { 0, 3877, 2879, 17, 9, UNI_MONG } /* scriptextensions=mongolian */, + { 0, 10268, 7990, 3, 1, UNI_NV__8 } /* nv=8 */, + { 1, 3877, 9529, 17, 5, UNI_TALE } /* scriptextensions=taile */, + { 0, 8973, 3319, 6, 18, UNI_LATINEXTADDITIONAL } /* block=latinextadditional */, + { 0, 7391, 755, 4, 3, UNI_CASED } /* iscased */, + { 1042, 185, 9046, 3, 4, UNI_CWKCF } /* iscwkcf */, + { 129, 185, 6374, 2, 12, UNI_NL } /* isletternumber */, + { 24, 9979, 8691, 4, 4, UNI_MULT } /* scx=mult */, + { 1481, 3121, 8332, 18, 8, UNI_DT__FRA } /* decompositiontype=fraction */, + { 70, 8973, 1467, 7, 23, UNI_DIACRITICALSFORSYMBOLS } /* block=combiningmarksforsymbols */, + { 3, 1270, 10055, 25, 4, UNI_COMPEX } /* fullcompositionexclusion=true */, + { 0, 8973, 5088, 6, 5, UNI_ASCII } /* block=ascii */, + { 169, 2242, 6974, 4, 9, UNI_INNANDINAGARI } /* innandinagari */, + { 1, 1678, 0, 14, 0, UNI_LATINEXTA } /* latinextendeda */, + { 650, 5648, 36, 14, 1, UNI_QMARK } /* quotationmark=t */, + { 3, 8782, 9831, 7, 4, UNI_LAO } /* script=laoo */, + { 6, 185, 408, 3, 6, UNI_XPOSIXCNTRL } /* iscontrol */, + { 0, 9057, 10055, 6, 4, UNI_EMOJI } /* emoji=true */, + { 66, 3121, 9141, 18, 6, UNI_DT__NAR } /* decompositiontype=narrow */, + { 3, 7218, 4535, 3, 14, UNI_BRAI } /* inbraillepatterns */, + { 6, 9711, 9030, 4, 3, UNI_WB__EB } /* ccc=133 
*/, + { 0, 5172, 10055, 14, 4, UNI_EMOD } /* emojimodifier=true */, + { 4, 8973, 750, 6, 21, UNI_ENCLOSEDALPHANUM } /* block=enclosedalphanumerics */, + { 1, 8782, 79, 7, 6, UNI_SC__ARAB } /* script=arabic */, + { 89, 3945, 0, 17, 0, UNI_uideo_values_index } /* unifiedideograph= */, + { 520, 10510, 5095, 6, 6, UNI_XPOSIXXDIGIT } /* xposixxdigit */, + { 0, 3175, 1, 18, 1, -UNI_EPRES } /* emojipresentation=n */, + { 66, 185, 134, 2, 4, UNI_M } /* ismark */, + { 0, 5875, 2227, 13, 21, UNI_JG__HANIFIROHINGYAKINNAYA } /* joininggroup=hanifirohingyakinnaya */, + { 0, 2012, 10055, 22, 4, UNI_LOE } /* logicalorderexception=true */, + { 8, 9691, 9519, 4, 5, UNI_INOSAGE } /* blk=osage */, + { 292, 10280, 9454, 3, 5, -UNI_RI } /* ri=false */, + { 0, 9811, 0, 4, 0, UNI_KHMR } /* khmr */, + { 6, 4463, 8602, 4, 5, UNI_DSRT } /* indeseret */, + { 0, 3877, 7853, 17, 4, UNI_PAUC } /* scriptextensions=pauc */, + { 71, 6983, 0, 11, 0, UNI_LO } /* otherletter */, + { 136, 9979, 8979, 4, 4, UNI_CARI } /* scx=cari */, + { 1, 6340, 5131, 3, 13, UNI_CJKCOMPATFORMS } /* incjkcompatforms */, + { 1, 10247, 6005, 3, 13, UNI_JG__MANICHAEANTAW } /* jg=manichaeantaw */, + { 1, 10268, 8147, 3, 2, UNI_NV__16 } /* nv=16 */, + { 7, 7230, 0, 10, 0, UNI_bc_values_index } /* bidiclass= */, + { 692, 185, 5940, 2, 9, UNI_MLYM } /* ismalayalam */, + { 2, 6340, 44, 3, 8, UNI_CJKCOMPAT } /* incjkcompat */, + { 201, 8768, 3, 7, 1, -UNI_PATSYN } /* patsyn=f */, + { 144, 8973, 3674, 7, 16, UNI_CYRILLICEXTB } /* block=cyrillicextendedb */, + { 1, 8782, 9751, 7, 4, UNI_DIAK } /* script=diak */, + { 0, 185, 5648, 2, 13, UNI_QMARK } /* isquotationmark */, + { 0, 5088, 9454, 14, 5, -UNI_POSIXXDIGIT } /* asciihexdigit=false */, + { 26, 7210, 0, 10, 0, UNI_ASCII } /* basiclatin */, + { 128, 8973, 4669, 6, 15, UNI_DIACRITICALSSUP } /* block=diacriticalssup */, + { 9, 9476, 4849, 3, 15, UNI_MERC } /* sc=meroiticcursive */, + { 152, 9979, 8292, 4, 8, UNI_BUGI } /* scx=buginese */, + { 1, 4847, 1020, 3, 4, UNI_MUSIC } /* 
inmusic */, + { 19, 9691, 2164, 4, 11, UNI_CYRILLICSUP } /* blk=cyrillicsup */, + { 273, 447, 0, 18, 0, UNI_IDEOGRAPHICSYMBOLS } /* ideographicsymbols */, + { 0, 10232, 0, 3, 0, UNI_ea_values_index } /* ea= */, + { 26, 4157, 5863, 3, 12, UNI_IPAEXT } /* isipaextensions */, + { 2, 3877, 9807, 17, 4, UNI_KALI } /* scriptextensions=kali */, + { 0, 6340, 6195, 3, 11, UNI_CYRILLICEXTA } /* incyrillicexta */, + { 1, 9959, 0, 4, 0, UNI_RJNG } /* rjng */, + { 515, 5875, 9243, 13, 4, UNI_JG__YUDH } /* joininggroup=yudh */, + { 0, 1418, 9028, 25, 5, UNI_WB__EB } /* canonicalcombiningclass=ccc133 */, + { 2, 9691, 980, 4, 27, UNI_ALPHABETICPF } /* blk=alphabeticpresentationforms */, + { 96, 7460, 10175, 10, 3, UNI_IN__3_DOT_2 } /* presentin=3.2 */, + { 0, 9691, 9863, 4, 4, UNI_INMIAO } /* blk=miao */, + { 13, 8356, 0, 8, 0, UNI_HIRA } /* hiragana */, + { 2, 8468, 0, 8, 0, UNI_TAGB } /* tagbanwa */, + { 0, 7360, 5620, 10, 14, UNI_LB__PO } /* linebreak=postfixnumeric */, + { 0, 8973, 568, 6, 2, UNI_NB } /* block=nb */, + { 4, 9647, 7611, 4, 1, UNI_AGE__5 } /* age=5 */, + { 16, 5875, 7180, 13, 10, UNI_JG__AFRICANQAF } /* joininggroup=africanqaf */, + { 0, 9979, 2493, 4, 20, UNI_HMNP } /* scx=nyiakengpuachuehmong */, + { 260, 1274, 26, 21, 1, UNI_CE } /* compositionexclusion=y */, + { 0, 8782, 10039, 7, 4, UNI_THAI } /* script=thai */, + { 0, 8973, 8452, 6, 8, UNI_SPECIALS } /* block=specials */, + { 0, 10244, 1564, 3, 2, UNI_PS } /* gc=ps */, + { 2, 1418, 8211, 24, 2, UNI_CCC__18 } /* canonicalcombiningclass=18 */, + { 0, 10516, 6615, 3, 7, UNI_PHAISTOS } /* isphaistos */, + { 46, 3877, 9895, 17, 3, UNI_NKO } /* scriptextensions=nko */, + { 8, 7467, 7950, 3, 1, UNI_IN__4 } /* in=4 */, + { 0, 9979, 2509, 4, 4, UNI_MONG } /* scx=mong */, + { 11, 9147, 17, 7, 1, -UNI__PERL_NCHAR } /* nchar=no */, + { 0, 8628, 0, 7, 0, UNI_grbase_values_index } /* grbase= */, + { 2, 8782, 9069, 7, 4, UNI_GOTH } /* script=goth */, + { 0, 10268, 5732, 3, 9, UNI_NV__100000000 } /* nv=100000000 */, + { 
15, 8973, 7159, 6, 11, UNI_YISYLLABLES } /* block=yisyllables */, + { 0, 9979, 9663, 4, 4, UNI_ARMI } /* scx=armi */, + { 0, 8782, 9719, 7, 4, UNI_SC__CPMN } /* script=cpmn */, + { 0, 9474, 4879, 5, 15, UNI_INSC__MODIFYINGLETTER } /* insc=modifyingletter */, + { 1, 3877, 1014, 17, 5, UNI_GREK } /* scriptextensions=greek */, + { 5, 10403, 7580, 4, 4, UNI_POSIXWORD } /* perlword */, + { 0, 185, 6614, 2, 12, UNI_PHAISTOS } /* isphaistosdisc */, + { 9, 4744, 6542, 15, 12, UNI_IDENTIFIERTYPE__NOTCHARACTER } /* identifiertype=notcharacter */, + { 1027, 8628, 1, 7, 1, -UNI_GRBASE } /* grbase=n */, + { 3, 7467, 9600, 3, 3, UNI_IN__3 } /* in=3.0 */, + { 121, 9691, 1968, 4, 22, UNI_EARLYDYNASTICCUNEIFORM } /* blk=earlydynasticcuneiform */, + { 2, 5875, 5504, 13, 4, UNI_JG__TETH } /* joininggroup=teth */, + { 1, 8782, 1629, 7, 4, UNI_SC__PHAG } /* script=phag */, + { 1, 9449, 26, 5, 1, UNI_EMOD } /* emod=y */, + { 1029, 9691, 780, 4, 30, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* blk=symbolsandpictographsextendeda */, + { 0, 7460, 7990, 10, 1, UNI_IN__8 } /* presentin=8 */, + { 65, 185, 6741, 2, 10, UNI_DEP } /* isdeprecated */, + { 0, 8973, 447, 6, 32, UNI_IDEOGRAPHICSYMBOLS } /* block=ideographicsymbolsandpunctuation */, + { 2, 10247, 6434, 3, 12, UNI_JG__MALAYALAMNNA } /* jg=malayalamnna */, + { 5, 5045, 8501, 3, 7, UNI_UGAR } /* isugaritic */, + { 0, 9763, 8308, 4, 8, UNI_WB__EB } /* gcb=ebasegaz */, + { 365, 9190, 0, 5, 0, UNI_term_values_index } /* term= */, + { 0, 1814, 10355, 22, 3, UNI_CWCM } /* changeswhencasemapped=yes */, + { 2, 8955, 9454, 6, 5, -UNI_XPOSIXALPHA } /* alpha=false */, + { 6, 1945, 0, 2, 0, UNI_SD } /* sd */, + { 1, 9190, 10056, 6, 3, UNI_TERM } /* term=true */, + { 265, 1418, 2833, 24, 2, UNI_CCC__1 } /* canonicalcombiningclass=ov */, + { 0, 9691, 720, 4, 16, UNI_CUNEIFORMNUMBERS } /* blk=cuneiformnumbers */, + { 1, 185, 7104, 2, 11, UNI_SYLO } /* issylotinagri */, + { 2, 185, 4625, 3, 13, UNI_SC } /* iscurrencysymbol */, + { 0, 2304, 7006, 3, 10, UNI_SO } 
/* isothersymbol */, + { 0, 9476, 9707, 3, 4, UNI_CANS } /* sc=cans */, + { 0, 9979, 9871, 4, 3, UNI_MRO } /* scx=mro */, + { 0, 8973, 7600, 6, 10, UNI_YIRADICALS } /* block=yiradicals */, + { 720, 4058, 0, 16, 0, UNI_PF } /* finalpunctuation */, + { 0, 9647, 5732, 4, 2, UNI_AGE__10 } /* age=10 */, + { 1, 185, 8607, 2, 4, UNI_ELBA } /* iselba */, + { 352, 10247, 7148, 3, 11, UNI_JG__YEHWITHTAIL } /* jg=yehwithtail */, + { 1, 9979, 7434, 5, 3, UNI_SOGD } /* scx=sogd */, + { 1, 3373, 0, 18, 0, UNI_ZP } /* paragraphseparator */, + { 0, 510, 0, 30, 0, UNI_CJKEXTA } /* cjkunifiedideographsextensiona */, + { 1, 10511, 5802, 5, 5, UNI_POSIXALNUM } /* posixalnum */, + { 62, 10268, 8913, 3, 4, UNI_NV__4000 } /* nv=4000 */, + { 320, 9476, 2311, 3, 7, UNI_SC__SINH } /* sc=sinhala */, + { 0, 10510, 5096, 6, 5, UNI_XPOSIXDIGIT } /* xposixdigit */, + { 2, 7360, 415, 10, 11, UNI_LB__ID } /* linebreak=ideographic */, + { 340, 185, 9871, 2, 3, UNI_MRO } /* ismro */, + { 0, 118, 4760, 3, 14, UNI_INIMPERIALARAMAIC } /* inimperialaramaic */, + { 0, 8642, 10055, 7, 4, UNI_HYPHEN } /* hyphen=true */, + { 24, 9691, 7862, 4, 9, UNI_INSAMARITAN } /* blk=samaritan */, + { 0, 6937, 188, 6, 30, UNI_MISCPICTOGRAPHS } /* inmiscellaneoussymbolsandpictographs */, + { 1, 1553, 4058, 9, 16, UNI_PF } /* category=finalpunctuation */, + { 0, 3157, 10055, 18, 4, UNI_EBASE } /* emojimodifierbase=true */, + { 0, 3877, 3826, 17, 4, UNI_MANI } /* scriptextensions=mani */, + { 4, 5592, 26, 14, 1, UNI_PATSYN } /* patternsyntax=y */, + { 0, 4847, 6951, 3, 10, UNI_MYANMAREXTA } /* inmyanmarexta */, + { 6, 8593, 1026, 7, 2, -UNI_COMPEX } /* compex=no */, + { 1, 2898, 0, 19, 0, UNI_OTTOMANSIYAQNUMBERS } /* ottomansiyaqnumbers */, + { 0, 21, 9129, 2, 6, UNI_INLYCIAN } /* inlycian */, + { 4, 8782, 8740, 7, 7, UNI_OLCK } /* script=olchiki */, + { 3, 9979, 9907, 4, 4, UNI_OLCK } /* scx=olck */, + { 9, 1418, 8986, 25, 5, UNI_CCC__103 } /* canonicalcombiningclass=ccc103 */, + { 0, 9979, 3978, 4, 4, UNI_BOPO } /* 
scx=bopo */, + { 2, 8973, 6386, 6, 7, UNI_MAHJONG } /* block=mahjong */, + { 0, 9469, 2573, 5, 3, UNI_INPC__TOP } /* inpc=top */, + { 0, 2206, 71, 21, 2, UNI_GCB__PP } /* graphemeclusterbreak=pp */, + { 4, 185, 2936, 2, 12, UNI_SUNDANESESUP } /* issundanesesup */, + { 0, 9476, 9827, 3, 4, UNI_LANA } /* sc=lana */, + { 2, 10516, 1630, 3, 3, UNI_PHAG } /* isphag */, + { 8, 9691, 4984, 4, 5, UNI_INTAMIL } /* blk=tamil */, + { 3, 9476, 9907, 3, 4, UNI_OLCK } /* sc=olck */, + { 10, 9979, 2269, 4, 11, UNI_MTEI } /* scx=meeteimayek */, + { 1, 8881, 981, 3, 26, UNI_ALPHABETICPF } /* isalphabeticpresentationforms */, + { 74, 8284, 0, 8, 0, UNI_BASS } /* bassavah */, + { 0, 185, 5284, 2, 14, UNI_LATINEXTB } /* islatinextendedb */, + { 0, 1553, 9424, 9, 5, UNI_XPOSIXCNTRL } /* category=cntrl */, + { 30, 7360, 752, 10, 2, UNI_LB__CL } /* linebreak=cl */, + { 0, 8973, 1930, 6, 16, UNI_INDICNUMBERFORMS } /* block=indicnumberforms */, + { 2, 10268, 10360, 3, 2, UNI_NV__39 } /* nv=39 */, + { 32, 10253, 1187, 3, 2, UNI_LB__PO } /* lb=po */, + { 29, 9461, 9189, 3, 5, UNI_SB__ST } /* sb=sterm */, + { 67, 5914, 0, 13, 0, UNI_ZL } /* lineseparator */, + { 212, 6083, 8211, 13, 2, UNI_NV__18 } /* numericvalue=18 */, + { 608, 1814, 0, 22, 0, UNI_cwcm_values_index } /* changeswhencasemapped= */, + { 0, 7360, 5648, 10, 9, UNI_LB__QU } /* linebreak=quotation */, + { 0, 3894, 36, 17, 1, UNI_STERM } /* sentenceterminal=t */, + { 0, 5875, 10265, 13, 3, UNI_JG__MIM } /* joininggroup=mim */, + { 3, 1632, 0, 18, 0, UNI_GEOMETRICSHAPESEXT } /* geometricshapesext */, + { 0, 10244, 4954, 3, 15, UNI_PS } /* gc=openpunctuation */, + { 0, 7360, 4954, 10, 15, UNI_LB__OP } /* linebreak=openpunctuation */, + { 0, 5662, 752, 14, 5, UNI_SB__CL } /* sentencebreak=close */, + { 0, 8973, 4625, 7, 14, UNI_CURRENCYSYMBOLS } /* block=currencysymbols */, + { 1, 8973, 8656, 6, 7, UNI_KALI } /* block=kayahli */, + { 34, 9711, 2833, 4, 2, UNI_CCC__1 } /* ccc=ov */, + { 12, 10268, 7975, 3, 1, UNI_NV__6 } /* nv=6 */, + 
{ 0, 4972, 1117, 3, 3, UNI_TANG } /* istang */, + { 108, 7745, 0, 9, 0, UNI_LATINEXTF } /* latinextf */, + { 2, 6206, 0, 12, 0, UNI_CYRILLICEXTB } /* cyrillicextb */, + { 0, 1564, 0, 2, 0, UNI_PS } /* ps */, + { 136, 9476, 9514, 3, 5, UNI_SC__ORYA } /* sc=oriya */, + { 72, 3409, 1, 18, 1, -UNI_RI } /* regionalindicator=n */, + { 488, 9691, 568, 4, 2, UNI_NB } /* blk=nb */, + { 9, 9691, 810, 4, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* blk=enclosedideographicsupplement */, + { 2, 9691, 7817, 4, 9, UNI_INOLDPERMIC } /* blk=oldpermic */, + { 3, 8973, 2879, 6, 12, UNI_MONGOLIANSUP } /* block=mongoliansup */, + { 144, 7520, 0, 10, 0, UNI_SUPARROWSA } /* suparrowsa */, + { 320, 10352, 10235, 3, 3, UNI_WB__EB } /* wb=ebg */, + { 1, 3877, 3193, 17, 8, UNI_ETHI } /* scriptextensions=ethiopic */, + { 0, 3942, 8350, 4, 6, UNI_INGURMUKHI } /* ingurmukhi */, + { 527, 4074, 48, 16, 1, UNI_M } /* generalcategory=m */, + { 122, 6083, 9603, 13, 4, UNI_NV__13_SLASH_2 } /* numericvalue=13/2 */, + { 1, 1553, 6983, 9, 11, UNI_LO } /* category=otherletter */, + { 22, 9647, 10331, 4, 3, UNI_AGE__6_DOT_2 } /* age=v62 */, + { 75, 9691, 2332, 4, 21, UNI_YIJING } /* blk=yijinghexagramsymbols */, + { 2, 9711, 6851, 4, 11, UNI_CCC__8 } /* ccc=kanavoicing */, + { 0, 9691, 4535, 5, 6, UNI_BRAI } /* blk=braille */, + { 0, 9461, 0, 3, 0, UNI_sb_values_index } /* sb= */, + { 94, 8782, 9444, 7, 4, UNI_SC__DOGR } /* script=dogr */, + { 0, 383, 0, 4, 0, UNI_EGYP } /* egyp */, + { 0, 6083, 8913, 13, 5, UNI_NV__40000 } /* numericvalue=40000 */, + { 0, 5823, 1026, 13, 2, -UNI_GRBASE } /* graphemebase=no */, + { 2, 9979, 9699, 4, 4, UNI_BUHD } /* scx=buhd */, + { 0, 8973, 9264, 6, 5, UNI_INADLAM } /* block=adlam */, + { 22, 7300, 26, 10, 1, UNI_DIA } /* diacritic=y */, + { 1, 9691, 8579, 4, 7, UNI_CJKEXTF } /* blk=cjkextf */, + { 0, 2206, 34, 21, 2, UNI_GCB__EX } /* graphemeclusterbreak=ex */, + { 1, 9087, 3, 6, 1, -UNI_JOINC } /* joinc=f */, + { 0, 10352, 496, 3, 7, UNI_WB__NU } /* wb=numeric */, + { 66, 3877, 
3622, 17, 17, UNI_AGHB } /* scriptextensions=caucasianalbanian */, + { 10, 8782, 7330, 7, 4, UNI_KHAR } /* script=khar */, + { 1, 10352, 139, 3, 2, UNI_WB__FO } /* wb=fo */, + { 7, 9476, 1116, 3, 4, UNI_SC__HANG } /* sc=hang */, + { 24, 9647, 7951, 4, 1, UNI_AGE__3 } /* age=3 */, + { 7, 1538, 2573, 24, 3, UNI_INPC__TOP } /* indicpositionalcategory=top */, + { 0, 185, 1903, 3, 18, UNI_CJKCOMPATIDEOGRAPHS } /* iscjkcompatideographs */, + { 5, 7230, 3398, 10, 10, UNI_BC__WS } /* bidiclass=whitespace */, + { 0, 7093, 0, 11, 0, UNI_SUPERANDSUB } /* superandsub */, + { 1, 2248, 8818, 3, 6, UNI_SUPPUAA } /* insuppuaa */, + { 11, 909, 0, 10, 0, UNI_CO } /* privateuse */, + { 61, 8782, 9807, 7, 4, UNI_SC__KALI } /* script=kali */, + { 263, 9476, 10007, 3, 4, UNI_SC__SYRC } /* sc=syrc */, + { 15, 7560, 36, 10, 1, UNI_XPOSIXUPPER } /* uppercase=t */, + { 1, 9691, 5368, 4, 7, UNI_LISUSUP } /* blk=lisusup */, + { 2, 810, 0, 22, 0, UNI_ENCLOSEDIDEOGRAPHICSUP } /* enclosedideographicsup */, + { 1, 7360, 8428, 10, 8, UNI_LB__NL } /* linebreak=nextline */, + { 0, 8973, 5214, 6, 14, UNI_INGREEK } /* block=greekandcoptic */, + { 0, 185, 8670, 2, 4, UNI_MAKA } /* ismaka */, + { 32, 59, 0, 4, 0, UNI_IDEO } /* ideo */, + { 137, 185, 729, 2, 6, UNI_N } /* isnumber */, + { 48, 7230, 3373, 10, 18, UNI_BC__B } /* bidiclass=paragraphseparator */, + { 0, 9294, 0, 5, 0, UNI_BUHD } /* buhid */, + { 10, 1592, 2709, 3, 18, UNI_INEGYPTIANHIEROGLYPHS } /* inegyptianhieroglyphs */, + { 272, 10244, 207, 3, 2, UNI_PI } /* gc=pi */, + { 0, 9461, 33, 3, 2, UNI_SB__SE } /* sb=se */, + { 126, 9847, 9454, 4, 5, -UNI_LOE } /* loe=false */, + { 24, 4074, 3373, 16, 18, UNI_ZP } /* generalcategory=paragraphseparator */, + { 6, 8316, 1026, 8, 2, -UNI_EXTPICT } /* extpict=no */, + { 0, 9691, 6972, 4, 11, UNI_INNANDINAGARI } /* blk=nandinagari */, + { 26, 9476, 4759, 3, 15, UNI_ARMI } /* sc=imperialaramaic */, + { 6, 2803, 10055, 19, 4, UNI_IDST } /* idstrinaryoperator=true */, + { 16, 10352, 728, 3, 2, 
UNI_WB__MN } /* wb=mn */, + { 3, 9647, 8212, 4, 3, UNI_AGE__8 } /* age=8.0 */, + { 0, 9691, 284, 4, 33, UNI_MISCMATHSYMBOLSB } /* blk=miscellaneousmathematicalsymbolsb */, + { 160, 185, 8388, 2, 4, UNI_JAVA } /* isjava */, + { 3, 7360, 21, 10, 2, UNI_LB__IN } /* linebreak=in */, + { 91, 10268, 8949, 3, 6, UNI_NV__900000 } /* nv=900000 */, + { 1, 2248, 3929, 3, 16, UNI_SUTTONSIGNWRITING } /* insuttonsignwriting */, + { 0, 8961, 9454, 6, 5, -UNI_BIDIC } /* bidic=false */, + { 0, 9476, 9284, 3, 5, UNI_BATK } /* sc=batak */, + { 0, 3877, 2632, 17, 6, UNI_BRAH } /* scriptextensions=brahmi */, + { 0, 9979, 9135, 4, 6, UNI_LYDI } /* scx=lydian */, + { 0, 8380, 0, 8, 0, UNI_JAMOEXTB } /* jamoextb */, + { 0, 8973, 6506, 6, 12, UNI_MATHALPHANUM } /* block=mathalphanum */, + { 0, 10247, 2651, 3, 19, UNI_JG__BURUSHASKIYEHBARREE } /* jg=burushaskiyehbarree */, + { 12, 9077, 0, 4, 0, UNI_ext_values_index } /* ext= */, + { 25, 8973, 3076, 6, 9, UNI_HALFMARKS } /* block=halfmarks */, + { 1, 2242, 7783, 4, 7, UNI_INNABATAEAN } /* innabataean */, + { 0, 10553, 10008, 3, 3, UNI_SYRC } /* issyrc */, + { 288, 9177, 10355, 6, 3, UNI_QMARK } /* qmark=yes */, + { 0, 9476, 10123, 3, 4, UNI_ZZZZ } /* sc=zzzz */, + { 7, 7467, 7934, 3, 1, UNI_IN__2 } /* in=2 */, + { 0, 4157, 7909, 3, 6, UNI_IDS } /* isidstart */, + { 0, 8973, 5745, 6, 13, UNI_AEGEANNUMBERS } /* block=aegeannumbers */, + { 16, 185, 9444, 2, 4, UNI_DOGR } /* isdogr */, + { 0, 7467, 9587, 3, 4, UNI_IN__11 } /* in=11.0 */, + { 0, 9711, 7934, 4, 2, UNI_CCC__25 } /* ccc=25 */, + { 0, 9691, 4669, 4, 15, UNI_DIACRITICALSSUP } /* blk=diacriticalssup */, + { 26, 10346, 472, 3, 2, UNI_VO__TU } /* vo=tu */, + { 2, 5368, 0, 7, 0, UNI_LISUSUP } /* lisusup */, + { 1, 10244, 27, 3, 2, UNI_LOWERCASELETTER } /* gc=ll */, + { 9, 3877, 7853, 17, 9, UNI_PAUC } /* scriptextensions=paucinhau */, + { 2, 9476, 2433, 3, 10, UNI_SC__GLAG } /* sc=glagolitic */, + { 6, 9434, 26, 5, 1, UNI_CWCM } /* cwcm=y */, + { 1192, 7460, 7975, 10, 1, UNI_IN__6 } /* 
presentin=6 */, + { 11, 6230, 0, 12, 0, UNI_ETHIOPICEXTA } /* ethiopicexta */, + { 0, 185, 5830, 2, 5, UNI_EBASE } /* isebase */, + { 292, 8810, 0, 7, 0, UNI_SOYO } /* soyombo */, + { 1, 7460, 10298, 10, 3, UNI_IN__2_DOT_1 } /* presentin=v21 */, + { 0, 9979, 8284, 4, 4, UNI_BASS } /* scx=bass */, + { 68, 9711, 9375, 5, 4, UNI_CCC__29 } /* ccc=ccc29 */, + { 0, 9979, 9939, 4, 4, UNI_MIAO } /* scx=plrd */, + { 0, 7460, 10331, 10, 3, UNI_IN__6_DOT_2 } /* presentin=v62 */, + { 26, 8782, 4190, 8, 3, UNI_SARB } /* script=sarb */, + { 0, 3877, 9935, 17, 4, UNI_PHNX } /* scriptextensions=phnx */, + { 1, 10553, 8811, 3, 6, UNI_SOYO } /* issoyombo */, + { 0, 1990, 5200, 22, 14, UNI_INSC__GEMINATIONMARK } /* indicsyllabiccategory=geminationmark */, + { 9, 1553, 6132, 9, 2, UNI_PF } /* category=pf */, + { 0, 3962, 0, 16, 0, UNI_ARABICSUP } /* arabicsupplement */, + { 39, 9979, 5368, 4, 4, UNI_LISU } /* scx=lisu */, + { 44, 185, 7540, 2, 10, UNI_SUPARROWSC } /* issuparrowsc */, + { 0, 8973, 8559, 7, 6, UNI_CJKEXTC } /* block=cjkextc */, + { 86, 4074, 6994, 16, 11, UNI_NO } /* generalcategory=othernumber */, + { 1, 6675, 0, 10, 0, UNI_IDC } /* idcontinue */, + { 424, 5875, 88, 13, 2, UNI_JG__HE } /* joininggroup=he */, + { 1280, 8702, 1036, 4, 9, UNI_ENCLOSEDCJK } /* inenclosedcjk */, + { 176, 0, 0, 42, 0, UNI_UCASEXT } /* unifiedcanadianaboriginalsyllabicsextended */, + { 1, 185, 3050, 3, 10, UNI_CHEROKEESUP } /* ischerokeesup */, + { 10, 2003, 7, 10, 1, UNI_CASEDLETTER } /* category=lc */, + { 30, 8782, 8284, 7, 4, UNI_BASS } /* script=bass */, + { 4, 185, 810, 2, 29, UNI_ENCLOSEDIDEOGRAPHICSUP } /* isenclosedideographicsupplement */, + { 0, 9979, 0, 4, 0, UNI_scx_values_index } /* scx= */, + { 0, 9843, 0, 4, 0, UNI_LINB } /* linb */, + { 0, 4504, 0, 4, 0, UNI_BAMU } /* bamu */, + { 72, 185, 6386, 2, 12, UNI_MAHJONG } /* ismahjongtiles */, + { 26, 8973, 6731, 7, 10, UNI_INCYPROMINOAN } /* block=cyprominoan */, + { 1, 10217, 10256, 3, 3, UNI_BC__LRE } /* bc=lre */, + { 1313, 
9429, 9454, 5, 5, -UNI_CWCF } /* cwcf=false */, + { 5, 3877, 2312, 18, 6, UNI_SINH } /* scriptextensions=sinhala */, + { 97, 10268, 7932, 3, 8, UNI_NV__1_SLASH_8 } /* nv=1.25e-01 */, + { 28, 1553, 6719, 9, 11, UNI_CASEDLETTER } /* category=casedletter */, + { 256, 6590, 0, 12, 0, UNI_HUNG } /* oldhungarian */, + { 1, 10268, 8012, 3, 8, UNI_NV__1_SLASH_4 } /* nv=2.50e-01 */, + { 0, 6083, 5732, 13, 4, UNI_NV__1000 } /* numericvalue=1000 */, + { 11, 9476, 6590, 3, 12, UNI_HUNG } /* sc=oldhungarian */, + { 0, 1189, 8469, 3, 7, UNI_INTAGBANWA } /* intagbanwa */, + { 36, 9695, 7, 4, 1, UNI_BPT__C } /* bpt=c */, + { 79, 8973, 8292, 6, 8, UNI_INBUGINESE } /* block=buginese */, + { 1, 4170, 0, 6, 0, UNI_LATIN1 } /* latin1 */, + { 0, 4972, 9535, 3, 4, UNI_TAKR } /* istakri */, + { 2, 185, 9883, 2, 4, UNI_NARB } /* isnarb */, + { 0, 9691, 6675, 4, 3, UNI_INIDC } /* blk=idc */, + { 192, 7467, 8092, 3, 3, UNI_IN__4 } /* in=4.0 */, + { 6, 8628, 36, 7, 1, UNI_GRBASE } /* grbase=t */, + { 0, 9544, 10055, 5, 4, UNI_XIDC } /* xidc=true */, + { 1, 1553, 4639, 9, 15, UNI_PD } /* category=dashpunctuation */, + { 8, 9727, 3, 4, 1, -UNI_CWL } /* cwl=f */, + { 5, 8973, 8684, 6, 7, UNI_INMARCHEN } /* block=marchen */, + { 0, 1418, 3031, 24, 18, UNI_CCC__216 } /* canonicalcombiningclass=attachedaboveright */, + { 0, 5830, 9454, 6, 5, -UNI_EBASE } /* ebase=false */, + { 36, 185, 3193, 2, 18, UNI_ETHIOPICSUP } /* isethiopicsupplement */, + { 9, 8961, 1026, 6, 2, -UNI_BIDIC } /* bidic=no */, + { 0, 10516, 63, 7, 5, UNI_POSIXGRAPH } /* isposixgraph */, + { 512, 8973, 601, 7, 29, UNI_CJKEXTD } /* block=cjkunifiedideographsextensiond */, + { 357, 4154, 1775, 3, 2, UNI_INVAI } /* invai */, + { 4, 9077, 26, 4, 1, UNI_EXT } /* ext=y */, + { 0, 6340, 2123, 3, 20, UNI_CJKCOMPATFORMS } /* incjkcompatibilityforms */, + { 1, 3121, 568, 18, 2, UNI_DT__NB } /* decompositiontype=nb */, + { 0, 7467, 10075, 3, 4, UNI_IN__13 } /* in=v130 */, + { 290, 6083, 4175, 13, 1, UNI_NV__1 } /* numericvalue=1 */, + { 0, 
8782, 9264, 7, 5, UNI_SC__ADLM } /* script=adlam */, + { 0, 401, 0, 6, 0, UNI_CF } /* format */, + { 2, 9171, 3, 6, 1, -UNI__PERL_PATWS } /* patws=f */, + { 64, 4714, 1026, 15, 2, -UNI_GREXT } /* graphemeextend=no */, + { 0, 1538, 5044, 24, 15, UNI_LOE } /* indicpositionalcategory=visualorderleft */, + { 0, 9691, 7745, 4, 9, UNI_LATINEXTF } /* blk=latinextf */, + { 0, 10268, 8059, 3, 2, UNI_NV__33 } /* nv=33 */, + { 0, 3877, 7430, 17, 10, UNI_SOGO } /* scriptextensions=oldsogdian */, + { 300, 9476, 8607, 3, 4, UNI_ELBA } /* sc=elba */, + { 2, 10247, 5410, 3, 14, UNI_JG__MANICHAEANBETH } /* jg=manichaeanbeth */, + { 0, 8881, 27, 3, 2, UNI_ALL } /* isall */, + { 13, 10553, 2312, 3, 3, UNI_SINH } /* issinh */, + { 0, 10253, 4503, 3, 2, UNI_LB__BB } /* lb=bb */, + { 0, 9731, 1026, 4, 2, -UNI_CWT } /* cwt=no */, + { 0, 8614, 0, 7, 0, UNI_ELYM } /* elymaic */, + { 1, 5088, 36, 14, 1, UNI_POSIXXDIGIT } /* asciihexdigit=t */, + { 117, 10253, 97, 3, 10, UNI_LB__AL } /* lb=alphabetic */, + { 11, 10268, 8092, 3, 8, UNI_NV__2_SLASH_5 } /* nv=4.00e-01 */, + { 29, 10516, 3, 3, 1, UNI_PF } /* ispf */, + { 0, 8955, 3, 6, 1, -UNI_XPOSIXALPHA } /* alpha=f */, + { 4, 8782, 9651, 7, 4, UNI_AGHB } /* script=aghb */, + { 0, 9979, 4314, 4, 7, UNI_MYMR } /* scx=myanmar */, + { 0, 8824, 0, 7, 0, UNI_SUPPUAB } /* suppuab */, + { 12, 1418, 10157, 24, 3, UNI_CCC__AL } /* canonicalcombiningclass=228 */, + { 1, 6340, 661, 3, 29, UNI_CJKEXTF } /* incjkunifiedideographsextensionf */, + { 3, 10268, 10136, 3, 3, UNI_NV__2_SLASH_3 } /* nv=2/3 */, + { 9, 5662, 1891, 14, 5, UNI_SB__UP } /* sentencebreak=upper */, + { 0, 21, 1678, 2, 23, UNI_LATINEXTADDITIONAL } /* inlatinextendedadditional */, + { 2, 6697, 1026, 11, 2, -UNI_XPOSIXALPHA } /* alphabetic=no */, + { 0, 0, 0, 43, 0, UNI_UCASEXTA } /* unifiedcanadianaboriginalsyllabicsextendeda */, + { 1, 10247, 6906, 3, 11, UNI_JG__MALAYALAMJA } /* jg=malayalamja */, + { 56, 8973, 7718, 6, 9, UNI_LATINEXTB } /* block=latinextb */, + { 7, 9691, 8656, 4, 7, 
UNI_KALI } /* blk=kayahli */, + { 0, 8712, 0, 8, 0, UNI_NFKDQC__N } /* nfkdqc=n */, + { 11, 9476, 9715, 3, 4, UNI_CHRS } /* sc=chrs */, + { 0, 6340, 220, 4, 31, UNI_DIACRITICALSEXT } /* incombiningdiacriticalmarksextended */, + { 2, 9831, 0, 3, 0, UNI_LAO } /* lao */, + { 1, 1629, 0, 4, 0, UNI_PHAG } /* phag */, + { 9, 8973, 7390, 6, 10, UNI_MISCARROWS } /* block=miscarrows */, + { 281, 4847, 2086, 3, 14, UNI_MODIFIERLETTERS } /* inmodifierletters */, + { 2, 8973, 415, 6, 32, UNI_INIDC } /* block=ideographicdescriptioncharacters */, + { 4, 9691, 909, 4, 10, UNI_PUA } /* blk=privateuse */, + { 0, 10247, 6422, 3, 12, UNI_JG__MALAYALAMNGA } /* jg=malayalamnga */, + { 16, 6083, 7610, 13, 9, UNI_NV___MINUS_1_SLASH_2 } /* numericvalue=-5.00e-01 */, + { 0, 3877, 8356, 17, 8, UNI_HIRA } /* scriptextensions=hiragana */, + { 2, 9927, 36, 4, 1, UNI_PCM } /* pcm=t */, + { 1, 8973, 5326, 6, 14, UNI_LATINEXTE } /* block=latinextendede */, + { 1, 4442, 0, 16, 0, UNI_TANGUTSUP } /* tangutsupplement */, + { 0, 21, 5312, 2, 14, UNI_LATINEXTD } /* inlatinextendedd */, + { 384, 4074, 7, 16, 1, UNI_C } /* generalcategory=c */, + { 0, 4346, 0, 5, 0, UNI_C } /* other */, + { 0, 3877, 8656, 17, 7, UNI_KALI } /* scriptextensions=kayahli */, + { 4, 2304, 9515, 3, 4, UNI_ORYA } /* isoriya */, + { 0, 1418, 3588, 24, 13, UNI_CCC__202 } /* canonicalcombiningclass=attachedbelow */, + { 0, 9093, 0, 6, 0, UNI_KTHI } /* kaithi */, + { 1, 5875, 2661, 13, 3, UNI_JG__YEH } /* joininggroup=yeh */, + { 0, 5116, 36, 14, 1, UNI_CI } /* caseignorable=t */, + { 0, 10229, 1254, 3, 4, UNI_DT__INIT } /* dt=init */, + { 0, 185, 317, 2, 33, UNI_SUPMATHOPERATORS } /* issupplementalmathematicaloperators */, + { 0, 6083, 8116, 13, 8, UNI_NV__3_SLASH_64 } /* numericvalue=4.69e-02 */, + { 0, 3403, 9454, 6, 5, -UNI_XPOSIXSPACE } /* space=false */, + { 1, 1189, 4443, 3, 8, UNI_TANGUTSUP } /* intangutsup */, + { 2, 185, 4714, 2, 14, UNI_GREXT } /* isgraphemeextend */, + { 3, 4074, 1846, 16, 2, UNI_NL } /* 
generalcategory=nl */, + { 336, 185, 38, 2, 2, UNI_XPOSIXDIGIT } /* isnd */, + { 23, 1990, 1245, 22, 25, UNI_INSC__CONSONANTINITIALPOSTFIXED } /* indicsyllabiccategory=consonantinitialpostfixed */, + { 6, 9476, 8754, 3, 4, UNI_OSMA } /* sc=osma */, + { 345, 9691, 2353, 4, 20, UNI_INANATOLIANHIEROGLYPHS } /* blk=anatolianhieroglyphs */, + { 4, 185, 7, 3, 1, UNI_XPOSIXCNTRL } /* iscc */, + { 3, 7820, 0, 4, 0, UNI_PERM } /* perm */, + { 4, 185, 10400, 2, 2, UNI_ZS } /* iszs */, + { 0, 8973, 1747, 6, 13, UNI_ZNAMENNYMUSIC } /* block=znamennymusic */, + { 800, 5662, 2553, 15, 4, UNI_SB__ST } /* sentencebreak=sterm */, + { 7, 8782, 9504, 7, 5, UNI_NSHU } /* script=nushu */, + { 1, 9691, 7433, 4, 7, UNI_INSOGDIAN } /* blk=sogdian */, + { 35, 1418, 7990, 24, 1, UNI_CCC__8 } /* canonicalcombiningclass=8 */, + { 68, 9476, 9643, 3, 4, UNI_SC__ADLM } /* sc=adlm */, + { 3, 9476, 7450, 3, 10, UNI_PHNX } /* sc=phoenician */, + { 32, 10247, 9111, 3, 6, UNI_JG__LAMADH } /* jg=lamadh */, + { 18, 7360, 59, 10, 2, UNI_LB__ID } /* linebreak=id */, + { 6, 9979, 8388, 4, 8, UNI_JAVA } /* scx=javanese */, + { 0, 8973, 3707, 6, 16, UNI_ETHIOPICEXT } /* block=ethiopicextended */, + { 0, 3877, 8691, 17, 7, UNI_MULT } /* scriptextensions=multani */, + { 0, 3877, 9484, 17, 4, UNI_LIMB } /* scriptextensions=limb */, + { 5, 7467, 10310, 3, 3, UNI_IN__4 } /* in=v40 */, + { 0, 2248, 1725, 3, 22, UNI_SUPPUNCTUATION } /* insupplementalpunctuation */, + { 50, 9476, 8614, 3, 7, UNI_ELYM } /* sc=elymaic */, + { 0, 1990, 5158, 22, 14, UNI_INSC__CONSONANTFINAL } /* indicsyllabiccategory=consonantfinal */, + { 291, 4074, 3382, 16, 9, UNI_Z } /* generalcategory=separator */, + { 6, 9691, 1674, 4, 4, UNI_JAMO } /* blk=jamo */, + { 0, 185, 3978, 2, 8, UNI_BOPO } /* isbopomofo */, + { 0, 9476, 1655, 3, 6, UNI_SC__HANG } /* sc=hangul */, + { 0, 10247, 10277, 3, 3, UNI_JG__REH } /* jg=reh */, + { 130, 9803, 6895, 4, 3, UNI_LB__H3 } /* hst=lvt */, + { 0, 7467, 7990, 3, 1, UNI_IN__8 } /* in=8 */, + { 0, 8973, 
1903, 7, 18, UNI_CJKCOMPATIDEOGRAPHS } /* block=cjkcompatideographs */, + { 50, 9135, 0, 6, 0, UNI_LYDI } /* lydian */, + { 0, 7360, 18, 10, 2, UNI_RI } /* linebreak=ri */, + { 33, 8316, 36, 8, 1, UNI_EXTPICT } /* extpict=t */, + { 1, 7835, 0, 9, 0, UNI_OUGR } /* olduyghur */, + { 20, 1418, 9006, 24, 3, UNI_CCC__122 } /* canonicalcombiningclass=122 */, + { 0, 9979, 10083, 4, 3, UNI_VAI } /* scx=vai */, + { 1, 2003, 48, 10, 1, UNI_LM } /* category=lm */, + { 0, 9647, 10307, 4, 3, UNI_AGE__3_DOT_2 } /* age=v32 */, + { 0, 9943, 0, 4, 0, UNI_PRTI } /* prti */, + { 1, 10349, 1, 3, 1, -UNI_VS } /* vs=n */, + { 0, 9270, 9454, 4, 5, -UNI_XPOSIXXDIGIT } /* hex=false */, + { 0, 21, 1008, 3, 26, UNI_ANCIENTGREEKMUSIC } /* inancientgreekmusicalnotation */, + { 18, 4042, 0, 7, 0, UNI_CPRT } /* cypriot */, + { 0, 6529, 126, 3, 2, UNI_OCR } /* inocr */, + { 0, 9711, 9345, 5, 4, UNI_CCC__23 } /* ccc=ccc23 */, + { 0, 9979, 2433, 4, 4, UNI_GLAG } /* scx=glag */, + { 0, 9711, 3596, 4, 5, UNI_CCC__B } /* ccc=below */, + { 619, 9270, 0, 4, 0, UNI_hex_values_index } /* hex= */, + { 0, 10217, 3398, 3, 10, UNI_BC__WS } /* bc=whitespace */, + { 0, 8782, 9033, 7, 6, UNI_SC__CAKM } /* script=chakma */, + { 0, 9979, 9919, 4, 4, UNI_OSGE } /* scx=osge */, + { 417, 9476, 9867, 3, 4, UNI_SC__MLYM } /* sc=mlym */, + { 17, 9647, 10175, 4, 3, UNI_AGE__3_DOT_2 } /* age=3.2 */, + { 0, 9075, 0, 5, 0, UNI_GREXT } /* grext */, + { 1, 7230, 2822, 10, 19, UNI_BC__LRO } /* bidiclass=lefttorightoverride */, + { 0, 1189, 8777, 3, 3, UNI_TAGS } /* intags */, + { 0, 9476, 7826, 3, 9, UNI_ORKH } /* sc=oldturkic */, + { 12, 5875, 6470, 13, 12, UNI_JG__MALAYALAMTTA } /* joininggroup=malayalamtta */, + { 0, 1189, 3482, 3, 10, UNI_TAIXUANJING } /* intaixuanjing */, + { 10, 9967, 0, 4, 0, UNI_RUNR } /* runr */, + { 67, 9476, 9069, 3, 4, UNI_GOTH } /* sc=goth */, + { 2, 7360, 909, 10, 2, UNI_LB__PR } /* linebreak=pr */, + { 12, 3121, 1310, 18, 3, UNI_DT__SUB } /* decompositiontype=sub */, + { 1, 10268, 9591, 3, 4, 
UNI_NV__11_SLASH_2 } /* nv=11/2 */, + { 2, 7360, 97, 10, 10, UNI_LB__AL } /* linebreak=alphabetic */, + { 0, 9963, 0, 4, 0, UNI_ROHG } /* rohg */, + { 555, 8973, 251, 6, 33, UNI_MISCMATHSYMBOLSA } /* block=miscellaneousmathematicalsymbolsa */, + { 2, 6675, 26, 11, 1, UNI_IDC } /* idcontinue=y */, + { 4, 9691, 6290, 4, 12, UNI_INGUNJALAGONDI } /* blk=gunjalagondi */, + { 0, 10508, 5095, 8, 6, UNI_XPOSIXXDIGIT } /* isxposixxdigit */, + { 1103, 10268, 9254, 3, 3, UNI_NV__1_SLASH_3 } /* nv=1/3 */, + { 72, 3877, 8340, 17, 8, UNI_GUJR } /* scriptextensions=gujarati */, + { 0, 10247, 10220, 3, 3, UNI_JG__BEH } /* jg=beh */, + { 842, 10244, 4346, 3, 5, UNI_C } /* gc=other */, + { 90, 8973, 8573, 7, 6, UNI_CJKEXTE } /* block=cjkexte */, + { 1164, 10247, 9955, 3, 4, UNI_JG__QAPH } /* jg=qaph */, + { 1, 7360, 9920, 10, 2, UNI_LB__SG } /* linebreak=sg */, + { 0, 1506, 5839, 5, 10, UNI_GREEKEXT } /* ingreekextended */, + { 0, 10247, 10292, 3, 3, UNI_JG__TAH } /* jg=tah */, + { 138, 7297, 9800, 3, 3, UNI_HMNP } /* ishmnp */, + { 2, 2879, 0, 9, 0, UNI_MONG } /* mongolian */, + { 1, 9476, 8845, 3, 7, UNI_TAVT } /* sc=taiviet */, + { 0, 123, 0, 9, 0, UNI_DIA } /* diacritic */, + { 0, 9691, 6302, 4, 6, UNI_INHEBREW } /* blk=hebrew */, + { 0, 9691, 3139, 4, 18, UNI_DEVANAGARIEXT } /* blk=devanagariextended */, + { 3, 8881, 1372, 4, 22, UNI_ARABICPFA } /* isarabicpresentationformsa */, + { 1281, 8782, 7501, 8, 9, UNI_SAUR } /* script=saurashtra */, + { 2, 9476, 9484, 3, 4, UNI_SC__LIMB } /* sc=limb */, + { 2, 8973, 839, 6, 29, UNI_MISCARROWS } /* block=miscellaneoussymbolsandarrows */, + { 1, 10268, 8180, 3, 8, UNI_NV__13_SLASH_2 } /* nv=6.50e+00 */, + { 15, 9081, 0, 6, 0, UNI_HATR } /* hatran */, + { 1, 3448, 8493, 3, 7, UNI_UCASEXTA } /* inucasexta */, + { 0, 10244, 10390, 3, 2, UNI_CASEDLETTER } /* gc=l_ */, + { 0, 8782, 9959, 7, 4, UNI_RJNG } /* script=rjng */, + { 2, 10553, 2312, 3, 6, UNI_SINH } /* issinhala */, + { 0, 5408, 6046, 4, 11, UNI_MAYANNUMERALS } /* inmayannumerals 
*/, + { 2, 4909, 1, 15, 1, UNI_NFKDQC__N } /* nfkdquickcheck=n */, + { 1, 2312, 1196, 5, 23, UNI_HALFANDFULLFORMS } /* inhalfwidthandfullwidthforms */, + { 0, 3877, 9444, 17, 4, UNI_DOGR } /* scriptextensions=dogr */, + { 5, 6083, 8068, 13, 8, UNI_NV__7_SLASH_2 } /* numericvalue=3.50e+00 */, + { 0, 9979, 10019, 4, 4, UNI_TALU } /* scx=talu */, + { 0, 8782, 9943, 7, 4, UNI_PRTI } /* script=prti */, + { 0, 9691, 7190, 4, 10, UNI_ARABICEXTA } /* blk=arabicexta */, + { 1, 9269, 0, 4, 0, UNI_POSIXXDIGIT } /* ahex */, + { 5, 1553, 4624, 9, 14, UNI_SC } /* category=currencysymbol */, + { 39, 9691, 8831, 4, 7, UNI_INTAGALOG } /* blk=tagalog */, + { 10, 118, 3777, 4, 15, UNI_INDICSIYAQNUMBERS } /* inindicsiyaqnumbers */, + { 21, 2206, 10235, 21, 3, UNI_WB__EB } /* graphemeclusterbreak=ebg */, + { 3, 3942, 8342, 4, 6, UNI_INGUJARATI } /* ingujarati */, + { 0, 6083, 8099, 13, 2, UNI_NV__14 } /* numericvalue=14 */, + { 3, 1167, 36, 26, 1, UNI_DI } /* defaultignorablecodepoint=t */, + { 2, 10268, 9407, 3, 2, UNI_NV__35 } /* nv=35 */, + { 257, 7908, 10355, 8, 3, UNI_IDS } /* idstart=yes */, + { 0, 185, 7570, 2, 10, UNI_WARA } /* iswarangciti */, + { 26, 10229, 9759, 3, 4, UNI_DT__FONT } /* dt=font */, + { 3, 185, 329, 2, 21, UNI_MATHOPERATORS } /* ismathematicaloperators */, + { 32, 9979, 9703, 4, 4, UNI_CAKM } /* scx=cakm */, + { 0, 4972, 9530, 3, 4, UNI_TALE } /* istaile */, + { 0, 8593, 26, 7, 1, UNI_COMPEX } /* compex=y */, + { 0, 1034, 0, 27, 0, UNI_ENCLOSEDCJK } /* enclosedcjklettersandmonths */, + { 42, 9545, 3, 4, 1, -UNI_IDC } /* idc=f */, + { 0, 8782, 8530, 7, 7, UNI_AVST } /* script=avestan */, + { 16, 10253, 10384, 3, 2, UNI_GCB__V } /* lb=jv */, + { 0, 8973, 5298, 6, 14, UNI_LATINEXTC } /* block=latinextendedc */, + { 49, 436, 0, 5, 0, UNI__PERL_NCHAR } /* nchar */, + { 1025, 10253, 1141, 3, 26, UNI_LB__CJ } /* lb=conditionaljapanesestarter */, + { 2, 9439, 10355, 5, 3, UNI_DASH } /* dash=yes */, + { 1033, 1632, 0, 23, 0, UNI_GEOMETRICSHAPESEXT } /* 
geometricshapesextended */, + { 1328, 185, 909, 2, 14, UNI_PUA } /* isprivateusearea */, + { 257, 10247, 9479, 3, 5, UNI_JG__KHAPH } /* jg=khaph */, + { 1070, 1187, 0, 2, 0, UNI_PO } /* po */, + { 64, 7297, 5243, 3, 13, UNI_HIGHSURROGATES } /* ishighsurrogates */, + { 0, 8973, 4984, 6, 8, UNI_TAMILSUP } /* block=tamilsup */, + { 41, 10268, 9631, 3, 3, UNI_NV__3_SLASH_8 } /* nv=3/8 */, + { 3, 9979, 8754, 4, 4, UNI_OSMA } /* scx=osma */, + { 0, 2784, 36, 19, 1, UNI_GCB__T } /* hangulsyllabletype=t */, + { 4, 10268, 8060, 3, 8, UNI_NV__1_SLASH_3 } /* nv=3.33e-01 */, + { 0, 8782, 8684, 7, 7, UNI_MARC } /* script=marchen */, + { 0, 10247, 7254, 3, 3, UNI_JG__KAF } /* jg=kaf */, + { 0, 9691, 4330, 4, 16, UNI_MYANMAREXTB } /* blk=myanmarextendedb */, + { 0, 1418, 10154, 24, 3, UNI_CCC__R } /* canonicalcombiningclass=226 */, + { 7, 4972, 4985, 3, 14, UNI_TAMILSUP } /* istamilsupplement */, + { 0, 3877, 9851, 17, 4, UNI_MEDF } /* scriptextensions=medf */, + { 1, 9735, 9454, 4, 5, -UNI_CWU } /* cwu=false */, + { 16, 9691, 1587, 5, 22, UNI_BYZANTINEMUSIC } /* blk=byzantinemusicalsymbols */, + { 260, 9219, 0, 6, 0, UNI_upper_values_index } /* upper= */, + { 40, 9063, 0, 6, 0, UNI_epres_values_index } /* epres= */, + { 0, 9069, 0, 4, 0, UNI_GOTH } /* goth */, + { 0, 8782, 3826, 7, 4, UNI_SC__MANI } /* script=mani */, + { 1, 9691, 3265, 4, 11, UNI_GEORGIANSUP } /* blk=georgiansup */, + { 1, 9647, 10187, 4, 3, UNI_AGE__5_DOT_1 } /* age=5.1 */, + { 0, 8973, 7500, 6, 10, UNI_INSAURASHTRA } /* block=saurashtra */, + { 1, 9691, 5074, 4, 14, UNI_ANCIENTSYMBOLS } /* blk=ancientsymbols */, + { 38, 21, 9105, 2, 6, UNI_INKHOJKI } /* inkhojki */, + { 27, 6083, 8179, 13, 2, UNI_NV__36 } /* numericvalue=36 */, + { 0, 10217, 25, 3, 1, UNI_BC__S } /* bc=s */, + { 1, 10232, 9141, 3, 6, UNI_EA__NA } /* ea=narrow */, + { 1, 8782, 9509, 7, 5, UNI_OGAM } /* script=ogham */, + { 643, 10516, 1847, 7, 5, UNI_POSIXLOWER } /* isposixlower */, + { 0, 7230, 3427, 10, 18, UNI_BC__RLI } /* 
bidiclass=righttoleftisolate */, + { 17, 185, 9687, 2, 4, UNI_BHKS } /* isbhks */, + { 13, 8973, 3104, 7, 17, UNI_COPTICEPACTNUMBERS } /* block=copticepactnumbers */, + { 0, 5745, 0, 13, 0, UNI_AEGEANNUMBERS } /* aegeannumbers */, + { 1, 3877, 9207, 17, 6, UNI_THAA } /* scriptextensions=thaana */, + { 2053, 21, 4170, 2, 6, UNI_LATIN1 } /* inlatin1 */, + { 0, 7460, 10310, 10, 3, UNI_IN__4 } /* presentin=v40 */, + { 37, 8782, 2433, 7, 4, UNI_SC__GLAG } /* script=glag */, + { 0, 10268, 7948, 3, 8, UNI_NV__1_SLASH_7 } /* nv=1.43e-01 */, + { 5, 6350, 6840, 12, 11, UNI_JT__C } /* joiningtype=joincausing */, + { 674, 9691, 9237, 4, 6, UNI_INYEZIDI } /* blk=yezidi */, + { 1232, 7467, 8100, 3, 3, UNI_IN__4_DOT_1 } /* in=4.1 */, + { 14, 6340, 3691, 3, 16, UNI_CYRILLICEXTC } /* incyrillicextendedc */, + { 1357, 9847, 36, 4, 1, UNI_LOE } /* loe=t */, + { 48, 9691, 8404, 4, 8, UNI_KANAEXTB } /* blk=kanaextb */, + { 51, 2248, 7501, 3, 9, UNI_INSAURASHTRA } /* insaurashtra */, + { 1, 7460, 10187, 10, 3, UNI_IN__5_DOT_1 } /* presentin=5.1 */, + { 2, 9474, 4154, 5, 16, UNI_INSC__INVISIBLESTACKER } /* insc=invisiblestacker */, + { 340, 10244, 909, 3, 10, UNI_CO } /* gc=privateuse */, + { 15, 4972, 48, 5, 1, UNI_TERM } /* isterm */, + { 0, 5088, 0, 13, 0, UNI_POSIXXDIGIT } /* asciihexdigit */, + { 278, 3758, 8523, 17, 7, UNI_IDENTIFIERSTATUS__ALLOWED } /* identifierstatus=allowed */, + { 18, 8782, 8260, 7, 8, UNI_ARMN } /* script=armenian */, + { 0, 7637, 0, 9, 0, UNI_ARABICPFA } /* arabicpfa */, + { 0, 1418, 9013, 24, 2, UNI_CCC__29 } /* canonicalcombiningclass=29 */, + { 784, 4972, 5000, 3, 14, UNI_TITLE } /* istitlecaseletter */, + { 69, 1418, 7975, 24, 1, UNI_CCC__6 } /* canonicalcombiningclass=6 */, + { 269, 185, 0, 4, 0, UNI_CE } /* isce */, + { 2, 10229, 6530, 3, 12, UNI_DT__NONCANON } /* dt=noncanonical */, + { 0, 8973, 8691, 6, 7, UNI_INMULTANI } /* block=multani */, + { 0, 10352, 109, 3, 2, UNI_WB__MB } /* wb=mb */, + { 517, 9476, 8537, 3, 4, UNI_SC__BENG } /* sc=beng */, + 
{ 0, 2206, 5717, 21, 2, UNI_LB__H2 } /* graphemeclusterbreak=lv */, + { 1, 9691, 6939, 4, 11, UNI_MISCSYMBOLS } /* blk=miscsymbols */, + { 2, 8508, 0, 8, 0, UNI_VITH } /* vithkuqi */, + { 3, 9469, 3505, 5, 12, UNI_INPC__LEFTANDRIGHT } /* inpc=leftandright */, + { 1, 7580, 8313, 10, 3, UNI_WB__EB } /* wordbreak=gaz */, + { 4, 9691, 2085, 4, 15, UNI_MODIFIERLETTERS } /* blk=modifierletters */, + { 0, 1814, 0, 21, 0, UNI_CWCM } /* changeswhencasemapped */, + { 0, 185, 2056, 2, 21, UNI__PERL_NCHAR } /* isnoncharactercodepoint */, + { 0, 3877, 9951, 17, 4, UNI_QAAI } /* scriptextensions=qaai */, + { 0, 1538, 0, 24, 0, UNI_inpc_values_index } /* indicpositionalcategory= */, + { 1280, 9979, 8292, 4, 4, UNI_BUGI } /* scx=bugi */, + { 1078, 6083, 8027, 13, 2, UNI_NV__22 } /* numericvalue=22 */, + { 8, 9691, 8614, 4, 7, UNI_INELYMAIC } /* blk=elymaic */, + { 0, 2206, 18, 21, 2, UNI_RI } /* graphemeclusterbreak=ri */, + { 0, 1990, 6572, 22, 6, UNI_LB__ZWJ } /* indicsyllabiccategory=joiner */, + { 108, 8782, 9105, 7, 6, UNI_SC__KHOJ } /* script=khojki */, + { 6, 4090, 0, 16, 0, UNI_GEORGIANEXT } /* georgianextended */, + { 642, 10390, 0, 2, 0, UNI_CASEDLETTER } /* l_ */, + { 0, 8607, 0, 4, 0, UNI_ELBA } /* elba */, + { 27, 9997, 8798, 4, 5, UNI_SHAW } /* inshavian */, + { 0, 185, 568, 2, 2, UNI_NB } /* isnb */, + { 3, 9711, 9004, 5, 4, UNI_CCC__12 } /* ccc=ccc12 */, + { 3, 7907, 9454, 9, 5, -UNI_XIDS } /* xidstart=false */, + { 0, 2248, 781, 3, 29, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* insymbolsandpictographsextendeda */, + { 0, 9711, 9013, 4, 2, UNI_CCC__29 } /* ccc=29 */, + { 1, 9711, 79, 4, 2, UNI_CCC__AR } /* ccc=ar */, + { 6, 8782, 9791, 7, 4, UNI_HLUW } /* script=hluw */, + { 0, 7907, 0, 9, 0, UNI_xids_values_index } /* xidstart= */, + { 1, 9979, 8260, 4, 8, UNI_ARMN } /* scx=armenian */, + { 1, 9476, 10095, 3, 4, UNI_XPEO } /* sc=xpeo */, + { 1803, 9951, 0, 4, 0, UNI_QAAI } /* qaai */, + { 584, 8782, 8508, 7, 4, UNI_VITH } /* script=vith */, + { 0, 9691, 5270, 4, 14, 
UNI_KANGXI } /* blk=kangxiradicals */, + { 0, 7360, 23, 10, 2, UNI_LB__AL } /* linebreak=al */, + { 0, 9691, 10271, 4, 3, UNI_OCR } /* blk=ocr */, + { 2, 4074, 1528, 16, 9, UNI__PERL_SURROGATE } /* generalcategory=surrogate */, + { 2051, 9691, 5029, 4, 8, UNI_VEDICEXT } /* blk=vedicext */, + { 532, 185, 2708, 2, 19, UNI_EGYP } /* isegyptianhieroglyphs */, + { 1536, 9691, 8740, 4, 7, UNI_OLCK } /* blk=olchiki */, + { 0, 185, 8537, 2, 4, UNI_BENG } /* isbeng */, + { 0, 9735, 3, 4, 1, -UNI_CWU } /* cwu=f */, + { 1, 185, 4504, 2, 15, UNI_BAMUMSUP } /* isbamumsupplement */, + { 1, 6083, 5732, 13, 7, UNI_NV__1000000 } /* numericvalue=1000000 */, + { 0, 4074, 0, 16, 0, UNI_gc_values_index } /* generalcategory= */, + { 1024, 3877, 3935, 18, 10, UNI_SGNW } /* scriptextensions=signwriting */, + { 0, 185, 6752, 2, 11, UNI_DOMINO } /* isdominotiles */, + { 0, 10253, 8413, 4, 7, UNI_LB__LF } /* lb=linefeed */, + { 1, 8782, 4849, 7, 15, UNI_MERC } /* script=meroiticcursive */, + { 0, 5875, 3826, 13, 17, UNI_JG__MANICHAEANDHAMEDH } /* joininggroup=manichaeandhamedh */, + { 0, 9979, 8859, 4, 7, UNI_TIBT } /* scx=tibetan */, + { 1154, 9979, 2312, 5, 3, UNI_SINH } /* scx=sinh */, + { 4, 4729, 0, 15, 0, UNI_INHANGUL } /* hangulsyllables */, + { 258, 3877, 8979, 17, 6, UNI_CARI } /* scriptextensions=carian */, + { 0, 10226, 1026, 3, 2, -UNI_DI } /* di=no */, + { 0, 9979, 10031, 4, 4, UNI_TFNG } /* scx=tfng */, + { 148, 3877, 7450, 17, 10, UNI_PHNX } /* scriptextensions=phoenician */, + { 14, 3877, 1177, 18, 3, UNI_SORA } /* scriptextensions=sora */, + { 1873, 6083, 8913, 13, 3, UNI_NV__400 } /* numericvalue=400 */, + { 9, 7360, 25, 10, 2, UNI_LB__SY } /* linebreak=sy */, + { 10, 10516, 3623, 3, 3, UNI_PAUC } /* ispauc */, + { 67, 10268, 10133, 3, 3, UNI_NV__1_SLASH_9 } /* nv=1/9 */, + { 0, 8973, 1632, 6, 15, UNI_GEOMETRICSHAPES } /* block=geometricshapes */, + { 160, 10253, 415, 3, 11, UNI_LB__ID } /* lb=ideographic */, + { 4, 10253, 1466, 3, 13, UNI_LB__CM } /* lb=combiningmark */, + 
{ 2685, 8973, 3365, 6, 8, UNI_DINGBATS } /* block=dingbats */, + { 257, 9476, 9094, 4, 5, UNI_SC__KTHI } /* sc=kaithi */, + { 0, 10352, 7049, 3, 11, UNI_WB__SQ } /* wb=singlequote */, + { 0, 1167, 10055, 26, 4, UNI_DI } /* defaultignorablecodepoint=true */, + { 0, 9691, 8372, 4, 8, UNI_JAMOEXTA } /* blk=jamoexta */, + { 6, 185, 1270, 2, 24, UNI_COMPEX } /* isfullcompositionexclusion */, + { 16, 9691, 5340, 4, 14, UNI_LATINEXTF } /* blk=latinextendedf */, + { 268, 5823, 0, 13, 0, UNI_grbase_values_index } /* graphemebase= */, + { 10, 3877, 2164, 17, 8, UNI_CYRL } /* scriptextensions=cyrillic */, + { 0, 4972, 10044, 3, 3, UNI_TIBT } /* istibt */, + { 0, 6578, 11, 12, 2, UNI_NT__DI } /* numerictype=di */, + { 3, 185, 8388, 2, 8, UNI_JAVA } /* isjavanese */, + { 12, 4744, 8733, 15, 7, UNI_IDENTIFIERTYPE__NOTNFKC } /* identifiertype=notnfkc */, + { 2, 4972, 4229, 3, 3, UNI_TALE } /* istale */, + { 2, 5662, 9279, 14, 5, UNI_SB__AT } /* sentencebreak=aterm */, + { 0, 8782, 10111, 7, 4, UNI_ZANB } /* script=zanb */, + { 0, 8973, 750, 6, 30, UNI_ENCLOSEDALPHANUMSUP } /* block=enclosedalphanumericsupplement */, + { 0, 4972, 8867, 3, 3, UNI_TIRH } /* istirh */, + { 91, 6314, 9454, 12, 5, -UNI_IDEO } /* ideographic=false */, + { 0, 185, 9879, 2, 4, UNI_MYMR } /* ismymr */, + { 68, 185, 3826, 2, 10, UNI_MANI } /* ismanichaean */, + { 0, 7580, 0, 10, 0, UNI_wb_values_index } /* wordbreak= */, + { 4, 3157, 0, 17, 0, UNI_EBASE } /* emojimodifierbase */, + { 2, 21, 5888, 2, 13, UNI_KANAEXTA } /* inkanaextendeda */, + { 0, 9691, 510, 4, 30, UNI_CJKEXTA } /* blk=cjkunifiedideographsextensiona */, + { 0, 10247, 6031, 3, 13, UNI_JG__MANICHAEANWAW } /* jg=manichaeanwaw */, + { 128, 3877, 6928, 17, 11, UNI_MEDF } /* scriptextensions=medefaidrin */, + { 0, 10244, 107, 3, 6, UNI_S } /* gc=symbol */, + { 2, 8973, 1514, 6, 24, UNI_HIGHPUSURROGATES } /* block=highprivateusesurrogates */, + { 673, 8973, 8866, 6, 7, UNI_INTIRHUTA } /* block=tirhuta */, + { 0, 5536, 10355, 14, 3, UNI_NFCQC__Y } 
/* nfcquickcheck=yes */, + { 0, 3247, 0, 18, 0, UNI_INPUNCTUATION } /* generalpunctuation */, + { 531, 8881, 5803, 3, 4, UNI_XPOSIXALNUM } /* isalnum */, + { 0, 1553, 9048, 9, 2, UNI_CF } /* category=cf */, + { 0, 9476, 6730, 3, 11, UNI_SC__CPMN } /* sc=cyprominoan */, + { 0, 1274, 9454, 21, 5, -UNI_CE } /* compositionexclusion=false */, + { 0, 9449, 0, 6, 0, -UNI_EMOD } /* emod=f */, + { 8, 9476, 4534, 3, 4, UNI_BRAI } /* sc=brai */, + { 0, 9476, 58, 3, 2, UNI_SC__YI } /* sc=yi */, + { 0, 9979, 3139, 4, 4, UNI_DEVA } /* scx=deva */, + { 6, 8973, 1061, 6, 27, UNI_OCR } /* block=opticalcharacterrecognition */, + { 0, 3877, 8797, 18, 6, UNI_SHAW } /* scriptextensions=shavian */, + { 0, 5116, 9454, 14, 5, -UNI_CI } /* caseignorable=false */, + { 1, 1270, 0, 24, 0, UNI_COMPEX } /* fullcompositionexclusion */, + { 36, 8973, 9207, 6, 6, UNI_INTHAANA } /* block=thaana */, + { 0, 21, 8388, 2, 8, UNI_INJAVANESE } /* injavanese */, + { 3, 6083, 8164, 13, 8, UNI_NV__1_SLASH_16 } /* numericvalue=6.25e-02 */, + { 513, 9691, 218, 4, 33, UNI_DIACRITICALSEXT } /* blk=combiningdiacriticalmarksextended */, + { 67, 9979, 9069, 4, 4, UNI_GOTH } /* scx=goth */, + { 1, 1167, 26, 26, 1, UNI_DI } /* defaultignorablecodepoint=y */, + { 276, 9743, 3, 4, 1, -UNI_DEP } /* dep=f */, + { 273, 9476, 8810, 3, 7, UNI_SOYO } /* sc=soyombo */, + { 87, 9691, 4170, 4, 6, UNI_LATIN1 } /* blk=latin1 */, + { 0, 5875, 9480, 14, 4, UNI_JG__KHAPH } /* joininggroup=khaph */, + { 1233, 8973, 7261, 7, 9, UNI_INCHORASMIAN } /* block=chorasmian */, + { 77, 185, 5634, 2, 14, UNI_PHLP } /* ispsalterpahlavi */, + { 363, 6083, 7611, 13, 1, UNI_NV__5 } /* numericvalue=5 */, + { 0, 10268, 9604, 3, 3, UNI_NV__3_SLASH_2 } /* nv=3/2 */, + { 19, 7467, 10298, 3, 3, UNI_IN__2_DOT_1 } /* in=v21 */, + { 0, 8973, 6752, 6, 11, UNI_DOMINO } /* block=dominotiles */, + { 0, 1418, 9360, 25, 4, UNI_CCC__26 } /* canonicalcombiningclass=ccc26 */, + { 257, 5823, 26, 13, 1, UNI_GRBASE } /* graphemebase=y */, + { 264, 3283, 10355, 18, 3, 
UNI_IDSB } /* idsbinaryoperator=yes */, + { 292, 9711, 9010, 5, 5, UNI_CCC__129 } /* ccc=ccc129 */, + { 0, 3707, 0, 16, 0, UNI_ETHIOPICEXT } /* ethiopicextended */, + { 422, 4924, 0, 15, 0, UNI_NARB } /* oldnortharabian */, + { 657, 9691, 3775, 4, 17, UNI_INDICSIYAQNUMBERS } /* blk=indicsiyaqnumbers */, + { 0, 4684, 10091, 15, 4, UNI_EA__W } /* eastasianwidth=wide */, + { 148, 5758, 9454, 13, 5, -UNI_BIDIM } /* bidimirrored=false */, + { 1, 185, 44, 3, 25, UNI_CJKCOMPATIDEOGRAPHS } /* iscjkcompatibilityideographs */, + { 0, 2012, 36, 22, 1, UNI_LOE } /* logicalorderexception=t */, + { 3, 7360, 8894, 10, 7, UNI_LB__ZW } /* linebreak=zwspace */, + { 0, 185, 133, 2, 2, UNI_LM } /* islm */, + { 3, 6529, 9520, 3, 4, UNI_INOSAGE } /* inosage */, + { 2, 3877, 8300, 17, 4, UNI_DUPL } /* scriptextensions=dupl */, + { 0, 9903, 0, 4, 0, UNI_OGAM } /* ogam */, + { 2, 3175, 10055, 18, 4, UNI_EPRES } /* emojipresentation=true */, + { 0, 8973, 9231, 6, 6, UNI_INWANCHO } /* block=wancho */, + { 0, 185, 9823, 2, 4, UNI_KTHI } /* iskthi */, + { 105, 9691, 6109, 4, 13, UNI_VERTICALFORMS } /* blk=verticalforms */, + { 2400, 9469, 3018, 5, 13, UNI_INPC__BOTTOMANDLEFT } /* inpc=bottomandleft */, + { 560, 9691, 43, 4, 26, UNI_CJKCOMPATIDEOGRAPHS } /* blk=cjkcompatibilityideographs */, + { 704, 6083, 8907, 13, 2, UNI_NV__30 } /* numericvalue=30 */, + { 0, 8973, 1019, 6, 5, UNI_MUSIC } /* block=music */, + { 0, 8973, 4610, 7, 14, UNI_CONTROLPICTURES } /* block=controlpictures */, + { 1288, 8782, 9839, 7, 4, UNI_SC__LINA } /* script=lina */, + { 0, 9476, 3139, 3, 4, UNI_SC__DEVA } /* sc=deva */, + { 1040, 8796, 0, 7, 0, UNI_SHAW } /* shavian */, + { 0, 9711, 7320, 4, 10, UNI_CCC__6 } /* ccc=hanreading */, + { 565, 5045, 1, 3, 41, UNI_UCASEXT } /* isunifiedcanadianaboriginalsyllabicsextended */, + { 1056, 9979, 9963, 4, 4, UNI_ROHG } /* scx=rohg */, + { 122, 2553, 1, 20, 1, -UNI_TERM } /* terminalpunctuation=n */, + { 1, 6083, 9591, 13, 4, UNI_NV__11_SLASH_2 } /* numericvalue=11/2 */, + { 
583, 3945, 26, 17, 1, UNI_UIDEO } /* unifiedideograph=y */, + { 4, 1193, 0, 26, 0, UNI_HALFANDFULLFORMS } /* halfwidthandfullwidthforms */, + { 2196, 9549, 0, 5, 0, UNI_xids_values_index } /* xids= */, + { 21, 5875, 5448, 13, 4, UNI_JG__HETH } /* joininggroup=heth */, + { 1, 185, 5914, 2, 13, UNI_ZL } /* islineseparator */, + { 5, 9979, 10099, 4, 4, UNI_XSUX } /* scx=xsux */, + { 0, 8973, 8420, 6, 8, UNI_INMAHAJANI } /* block=mahajani */, + { 2, 185, 17, 3, 1, UNI_CO } /* isco */, + { 4, 10268, 8943, 3, 5, UNI_NV__80000 } /* nv=80000 */, + { 1, 9434, 0, 4, 0, UNI_CWCM } /* cwcm */, + { 3, 1045, 0, 6, 0, UNI_L } /* letter */, + { 137, 10247, 4829, 3, 5, UNI_JG__SADHE } /* jg=sadhe */, + { 412, 9979, 2227, 4, 14, UNI_ROHG } /* scx=hanifirohingya */, + { 10, 1418, 9367, 24, 2, UNI_CCC__27 } /* canonicalcombiningclass=27 */, + { 516, 10229, 8332, 3, 3, UNI_DT__FRA } /* dt=fra */, + { 1, 1814, 10055, 22, 4, UNI_CWCM } /* changeswhencasemapped=true */, + { 3, 1418, 9390, 25, 4, UNI_CCC__32 } /* canonicalcombiningclass=ccc32 */, + { 0, 9691, 2100, 4, 22, UNI_TRANSPORTANDMAP } /* blk=transportandmapsymbols */, + { 0, 3877, 9903, 17, 4, UNI_OGAM } /* scriptextensions=ogam */, + { 1073, 2304, 9510, 3, 4, UNI_OGAM } /* isogham */, + { 0, 9979, 3826, 4, 4, UNI_MANI } /* scx=mani */, + { 1041, 8782, 8691, 7, 4, UNI_SC__MULT } /* script=mult */, + { 1966, 5096, 0, 5, 0, UNI_XPOSIXDIGIT } /* digit */, + { 1, 10402, 10490, 6, 9, UNI__PERL_ANY_FOLDS } /* _perl_any_folds */, + { 7, 9237, 0, 6, 0, UNI_YEZI } /* yezidi */, + { 1, 185, 0, 3, 0, UNI_C } /* isc */, + { 9, 1553, 407, 9, 7, UNI_XPOSIXCNTRL } /* category=control */, + { 0, 10023, 0, 4, 0, UNI_TAML } /* taml */, + { 0, 5758, 36, 13, 1, UNI_BIDIM } /* bidimirrored=t */, + { 6, 9123, 0, 6, 0, UNI_lower_values_index } /* lower= */, + { 0, 8782, 9775, 7, 4, UNI_SC__GREK } /* script=grek */, + { 5, 4699, 3, 15, 1, -UNI_ECOMP } /* emojicomponent=f */, + { 0, 1190, 39, 3, 2, UNI_XPOSIXDIGIT } /* nt=de */, + { 0, 6083, 8235, 13, 2, 
UNI_NV__28 } /* numericvalue=28 */, + { 1553, 9711, 8102, 4, 2, UNI_CCC__17 } /* ccc=17 */, + { 0, 6386, 0, 12, 0, UNI_MAHJONG } /* mahjongtiles */, + { 1, 3121, 46, 18, 3, UNI_DT__COM } /* decompositiontype=com */, + { 2, 7460, 8036, 10, 3, UNI_IN__3_DOT_1 } /* presentin=3.1 */, + { 1, 10229, 1254, 3, 7, UNI_DT__INIT } /* dt=initial */, + { 0, 185, 383, 2, 4, UNI_EGYP } /* isegyp */, + { 1, 9476, 6972, 3, 4, UNI_SC__NAND } /* sc=nand */, + { 155, 8881, 2614, 3, 18, UNI_ANCIENTGREEKNUMBERS } /* isancientgreeknumbers */, + { 0, 8782, 9129, 7, 6, UNI_LYCI } /* script=lycian */, + { 1025, 9711, 9300, 5, 4, UNI_CCC__14 } /* ccc=ccc14 */, + { 1839, 8782, 9967, 7, 4, UNI_RUNR } /* script=runr */, + { 0, 7460, 9583, 10, 4, UNI_IN__10 } /* presentin=10.0 */, + { 0, 8973, 1014, 6, 5, UNI_INGREEK } /* block=greek */, + { 0, 6350, 7, 12, 1, UNI_JT__C } /* joiningtype=c */, + { 130, 10253, 25, 3, 2, UNI_LB__SY } /* lb=sy */, + { 0, 8782, 7853, 7, 4, UNI_PAUC } /* script=pauc */, + { 0, 10229, 2809, 3, 3, UNI_DT__NAR } /* dt=nar */, + { 0, 10247, 7290, 3, 10, UNI_JG__DALATHRISH } /* jg=dalathrish */, + { 1, 494, 0, 3, 0, UNI_HAN } /* han */, + { 0, 2803, 3, 19, 1, -UNI_IDST } /* idstrinaryoperator=f */, + { 0, 9727, 1026, 4, 2, -UNI_CWL } /* cwl=no */, + { 2822, 3877, 8811, 18, 3, UNI_SOYO } /* scriptextensions=soyo */, + { 0, 7297, 3077, 3, 8, UNI_HALFMARKS } /* ishalfmarks */, + { 2, 8316, 1966, 10, 3, -UNI_EXTPICT } /* extpict=false */, + { 4, 7200, 0, 10, 0, UNI_ARABICEXTB } /* arabicextb */, + { 0, 6675, 0, 3, 0, UNI_IDC } /* idc */, + { 269, 10352, 6278, 3, 12, UNI_WB__EB } /* wb=glueafterzwj */, + { 32, 7060, 1, 11, 1, -UNI_SD } /* softdotted=n */, + { 0, 9691, 79, 4, 35, UNI_ARABICMATH } /* blk=arabicmathematicalalphabeticsymbols */, + { 64, 1026, 0, 2, 0, UNI_NO } /* no */, + { 0, 185, 8300, 2, 4, UNI_DUPL } /* isdupl */, + { 3, 329, 0, 21, 0, UNI_MATHOPERATORS } /* mathematicaloperators */, + { 0, 9177, 0, 6, 0, UNI_qmark_values_index } /* qmark= */, + { 4, 9647, 
10059, 4, 4, UNI_AGE__10 } /* age=v100 */, + { 1, 6518, 0, 12, 0, UNI_MEND } /* mendekikakui */, + { 1238, 1814, 9454, 22, 5, -UNI_CWCM } /* changeswhencasemapped=false */, + { 29, 9429, 10355, 5, 3, UNI_CWCF } /* cwcf=yes */, + { 0, 1553, 2085, 9, 14, UNI_LM } /* category=modifierletter */, + { 284, 8967, 0, 6, 0, UNI_bidim_values_index } /* bidim= */, + { 16, 1592, 3708, 3, 10, UNI_ETHIOPICEXT } /* inethiopicext */, + { 1, 4894, 0, 15, 0, UNI_nfkcqc_values_index } /* nfkcquickcheck= */, + { 5, 9706, 0, 2, 0, UNI_MC } /* mc */, + { 0, 8782, 4534, 7, 7, UNI_BRAI } /* script=braille */, + { 0, 10232, 8, 3, 1, UNI_EA__A } /* ea=a */, + { 0, 4074, 2085, 16, 14, UNI_LM } /* generalcategory=modifierletter */, + { 1248, 8973, 2493, 6, 20, UNI_INNYIAKENGPUACHUEHMONG } /* block=nyiakengpuachuehmong */, + { 2354, 9691, 1924, 4, 22, UNI_INDICNUMBERFORMS } /* blk=commonindicnumberforms */, + { 1554, 1902, 0, 22, 0, UNI_CJKCOMPATIDEOGRAPHSSUP } /* cjkcompatideographssup */, + { 1127, 6937, 843, 6, 25, UNI_MISCARROWS } /* inmiscellaneoussymbolsandarrows */, + { 2, 9979, 3193, 4, 4, UNI_ETHI } /* scx=ethi */, + { 649, 8586, 0, 7, 0, UNI_CJKEXTG } /* cjkextg */, + { 336, 10247, 5462, 3, 4, UNI_JG__KAPH } /* jg=kaph */, + { 0, 9979, 3792, 4, 17, UNI_KITS } /* scx=khitansmallscript */, + { 135, 1418, 3031, 24, 13, UNI_CCC__214 } /* canonicalcombiningclass=attachedabove */, + { 8, 9691, 7430, 4, 10, UNI_INOLDSOGDIAN } /* blk=oldsogdian */, + { 1122, 185, 6158, 2, 11, UNI_BIDIC } /* isbidicontrol */, + { 0, 4894, 26, 15, 1, UNI_NFKCQC__Y } /* nfkcquickcheck=y */, + { 1, 9979, 10008, 5, 3, UNI_SYRC } /* scx=syrc */, + { 0, 9979, 10087, 4, 4, UNI_WCHO } /* scx=wcho */, + { 2, 7360, 6708, 10, 11, UNI_LB__BB } /* linebreak=breakbefore */, + { 19, 185, 9899, 2, 4, UNI_NSHU } /* isnshu */, + { 0, 3877, 6593, 17, 4, UNI_HUNG } /* scriptextensions=hung */, + { 1027, 8973, 4504, 6, 8, UNI_BAMUMSUP } /* block=bamumsup */, + { 2, 8973, 9524, 6, 5, UNI_INRUNIC } /* block=runic */, + { 0, 185, 
952, 2, 17, UNI_VS } /* isvariationselector */, + { 0, 10226, 10055, 3, 4, UNI_DI } /* di=true */, + { 0, 185, 2185, 2, 20, UNI_EXTPICT } /* isextendedpictographic */, + { 0, 21, 5256, 2, 14, UNI_KANASUP } /* inkanasupplement */, + { 28, 10247, 3826, 3, 17, UNI_JG__MANICHAEANDHAMEDH } /* jg=manichaeandhamedh */, + { 682, 9105, 0, 4, 0, UNI_KHOJ } /* khoj */, + { 0, 1418, 16, 24, 1, UNI_CCC__B } /* canonicalcombiningclass=b */, + { 25, 8973, 10039, 6, 4, UNI_INTHAI } /* block=thai */, + { 80, 9063, 36, 6, 1, UNI_EPRES } /* epres=t */, + { 0, 10508, 10523, 8, 5, UNI_XPOSIXBLANK } /* isxposixblank */, + { 0, 9691, 690, 4, 30, UNI_CJKEXTG } /* blk=cjkunifiedideographsextensiong */, + { 733, 4381, 0, 13, 0, UNI_MATHOPERATORS } /* mathoperators */, + { 6, 9691, 7637, 4, 9, UNI_ARABICPFA } /* blk=arabicpfa */, + { 1155, 9476, 9264, 3, 5, UNI_SC__ADLM } /* sc=adlam */, + { 6, 6350, 7126, 12, 11, UNI_JT__T } /* joiningtype=transparent */, + { 1321, 7500, 0, 4, 0, UNI_SAUR } /* saur */, + { 806, 9647, 8148, 4, 3, UNI_AGE__6 } /* age=6.0 */, + { 0, 8782, 79, 7, 4, UNI_SC__ARAB } /* script=arab */, + { 0, 5875, 5940, 13, 13, UNI_JG__MALAYALAMLLLA } /* joininggroup=malayalamllla */, + { 129, 8973, 8663, 6, 7, UNI_INLINEARA } /* block=lineara */, + { 1, 8973, 2708, 6, 19, UNI_INEGYPTIANHIEROGLYPHS } /* block=egyptianhieroglyphs */, + { 1, 3877, 8530, 17, 7, UNI_AVST } /* scriptextensions=avestan */, + { 0, 5823, 9454, 13, 5, -UNI_GRBASE } /* graphemebase=false */, + { 1, 9439, 26, 5, 1, UNI_DASH } /* dash=y */, + { 2345, 4157, 3284, 3, 16, UNI_IDSB } /* isidsbinaryoperator */, + { 2858, 7908, 10055, 8, 4, UNI_IDS } /* idstart=true */, + { 2564, 2248, 2937, 3, 18, UNI_SUNDANESESUP } /* insundanesesupplement */, + { 0, 4074, 2292, 16, 2, UNI_PD } /* generalcategory=pd */, + { 6, 9691, 868, 4, 18, UNI_PHONETICEXT } /* blk=phoneticextensions */, + { 80, 10217, 2292, 3, 3, UNI_BC__PDI } /* bc=pdi */, + { 0, 9075, 10055, 6, 4, UNI_GREXT } /* grext=true */, + { 0, 1538, 3505, 24, 12, 
UNI_INPC__LEFTANDRIGHT } /* indicpositionalcategory=leftandright */, + { 0, 10268, 5732, 3, 5, UNI_NV__10000 } /* nv=10000 */, + { 662, 10553, 2553, 3, 4, UNI_STERM } /* issterm */, + { 0, 9544, 1026, 5, 2, -UNI_XIDC } /* xidc=no */, + { 0, 1553, 49, 9, 1, UNI_P } /* category=p */, + { 0, 3877, 10103, 17, 4, UNI_YI } /* scriptextensions=yiii */, + { 0, 10247, 5438, 3, 14, UNI_JG__MANICHAEANHETH } /* jg=manichaeanheth */, + { 2492, 5648, 1026, 14, 2, -UNI_QMARK } /* quotationmark=no */, + { 0, 10553, 8811, 3, 3, UNI_SOYO } /* issoyo */, + { 3616, 185, 9859, 2, 4, UNI_MERC } /* ismerc */, + { 2304, 5093, 36, 9, 1, UNI_XPOSIXXDIGIT } /* hexdigit=t */, + { 17, 9979, 2841, 4, 4, UNI_MERO } /* scx=mero */, + { 10, 8782, 2632, 7, 6, UNI_BRAH } /* script=brahmi */, + { 0, 3877, 8684, 17, 7, UNI_MARC } /* scriptextensions=marchen */, + { 2, 1418, 9330, 25, 4, UNI_CCC__20 } /* canonicalcombiningclass=ccc20 */, + { 0, 2936, 0, 12, 0, UNI_SUNDANESESUP } /* sundanesesup */, + { 0, 1553, 45, 10, 1, UNI_SK } /* category=sk */, + { 2145, 3265, 0, 8, 0, UNI_GEOR } /* georgian */, + { 0, 10217, 10274, 3, 3, UNI_BC__PDF } /* bc=pdf */, + { 69, 8973, 8600, 6, 7, UNI_DSRT } /* block=deseret */, + { 128, 5095, 0, 6, 0, UNI_XPOSIXXDIGIT } /* xdigit */, + { 277, 2206, 4346, 21, 5, UNI_GCB__XX } /* graphemeclusterbreak=other */, + { 84, 10247, 5235, 3, 7, UNI_JG__HEHGOAL } /* jg=hehgoal */, + { 2, 10268, 1250, 3, 3, UNI_NV__NAN } /* nv=nan */, + { 1081, 9711, 9400, 5, 4, UNI_CCC__34 } /* ccc=ccc34 */, + { 0, 9476, 9787, 3, 4, UNI_SC__HANO } /* sc=hano */, + { 9, 9077, 10055, 4, 4, UNI_EXT } /* ext=true */, + { 528, 3409, 9454, 18, 5, -UNI_RI } /* regionalindicator=false */, + { 0, 5875, 9659, 13, 4, UNI_JG__ALEF } /* joininggroup=alef */, + { 0, 8973, 1320, 6, 25, UNI_SYMBOLSANDPICTOGRAPHSEXTA } /* block=symbolsandpictographsexta */, + { 0, 9691, 2879, 4, 12, UNI_MONGOLIANSUP } /* blk=mongoliansup */, + { 0, 9476, 3049, 3, 4, UNI_CHER } /* sc=cher */, + { 17, 3877, 9891, 17, 4, UNI_NEWA } 
/* scriptextensions=newa */, + { 2697, 2553, 0, 21, 0, UNI_TERM } /* terminalpunctuation=t */, + { 0, 4714, 10055, 15, 4, UNI_GREXT } /* graphemeextend=true */, + { 0, 8881, 5089, 3, 12, UNI_POSIXXDIGIT } /* isasciihexdigit */, + { 1, 185, 1467, 3, 23, UNI_DIACRITICALSFORSYMBOLS } /* iscombiningmarksforsymbols */, + { 6, 10268, 8903, 3, 3, UNI_NV__600 } /* nv=600 */, + { 0, 185, 8396, 2, 8, UNI_KANAEXTA } /* iskanaexta */, + { 9, 8973, 8348, 6, 8, UNI_INGURMUKHI } /* block=gurmukhi */, + { 4, 185, 7718, 2, 9, UNI_LATINEXTB } /* islatinextb */, + { 0, 9691, 3463, 4, 18, UNI_SMALLKANAEXT } /* blk=smallkanaextension */, + { 2258, 2784, 24, 19, 1, UNI_GCB__L } /* hangulsyllabletype=l */, + { 0, 9469, 7440, 5, 10, UNI_INPC__OVERSTRUCK } /* inpc=overstruck */, + { 0, 3877, 3978, 17, 8, UNI_BOPO } /* scriptextensions=bopomofo */, + { 0, 6083, 9611, 13, 4, UNI_NV__15_SLASH_2 } /* numericvalue=15/2 */, + { 137, 7550, 0, 10, 0, UNI_CN } /* unassigned */, + { 6, 185, 3157, 2, 13, UNI_EMOD } /* isemojimodifier */, + { 2, 10268, 8949, 3, 3, UNI_NV__900 } /* nv=900 */, + { 51, 10244, 599, 3, 2, UNI_XPOSIXCNTRL } /* gc=cc */, + { 10, 1852, 1, 6, 1, -UNI_CASED } /* cased=n */, + { 8, 9747, 3, 4, 1, -UNI_DIA } /* dia=f */, + { 5, 6374, 0, 12, 0, UNI_NL } /* letternumber */, + { 0, 1418, 3039, 24, 5, UNI_CCC__A } /* canonicalcombiningclass=above */, + { 47, 9476, 9871, 3, 3, UNI_MRO } /* sc=mro */, + { 1144, 10244, 10400, 3, 2, UNI_ZS } /* gc=zs */, + { 2217, 1418, 8986, 25, 4, UNI_CCC__10 } /* canonicalcombiningclass=ccc10 */, + { 0, 9979, 9719, 4, 4, UNI_CPMN } /* scx=cpmn */, + { 0, 185, 2311, 2, 21, UNI_SINHALAARCHAICNUMBERS } /* issinhalaarchaicnumbers */, + { 229, 7360, 5669, 10, 2, UNI_EBASE } /* linebreak=eb */, + { 0, 8621, 0, 4, 0, UNI_GRAN } /* gran */, + { 0, 9474, 2413, 5, 20, UNI_INSC__CONSONANTWITHSTACKER } /* insc=consonantwithstacker */, + { 2609, 8973, 862, 6, 6, UNI_ARROWS } /* block=arrows */, + { 0, 5354, 0, 14, 0, UNI_LATINEXTG } /* latinextendedg */, + { 233, 
6083, 10362, 13, 2, UNI_NV__44 } /* numericvalue=44 */, + { 12, 6994, 0, 11, 0, UNI_NO } /* othernumber */, + { 22, 8881, 184, 4, 2, UNI_ARMI } /* isarmi */, + { 0, 9711, 8251, 4, 2, UNI_CCC__19 } /* ccc=19 */, + { 0, 9939, 0, 4, 0, UNI_MIAO } /* plrd */, + { 0, 3877, 9069, 17, 6, UNI_GOTH } /* scriptextensions=gothic */, + { 0, 9691, 6862, 4, 11, UNI_KATAKANAEXT } /* blk=katakanaext */, + { 556, 3877, 9519, 17, 5, UNI_OSGE } /* scriptextensions=osage */, + { 1311, 9979, 8663, 4, 7, UNI_LINA } /* scx=lineara */, + { 1, 9711, 6774, 4, 11, UNI_CCC__DB } /* ccc=doublebelow */, + { 0, 4598, 1634, 4, 13, UNI_GEOMETRICSHAPES } /* ingeometricshapes */, + { 11, 3877, 2584, 17, 4, UNI_MAND } /* scriptextensions=mand */, + { 1427, 8782, 7, 7, 18, UNI_CANS } /* script=canadianaboriginal */, + { 0, 4074, 1218, 16, 2, UNI_SK } /* generalcategory=sk */, + { 5, 8782, 866, 10, 1, UNI_SHAW } /* script=shaw */, + { 462, 9269, 9454, 5, 5, -UNI_POSIXXDIGIT } /* ahex=false */, + { 585, 10244, 25, 3, 1, UNI_S } /* gc=s */, + { 0, 7218, 8277, 3, 7, UNI_INBALINESE } /* inbalinese */, + { 8, 10268, 10368, 3, 2, UNI_NV__47 } /* nv=47 */, + { 0, 8316, 0, 9, 0, -UNI_EXTPICT } /* extpict=f */, + { 0, 3398, 0, 10, 0, UNI_XPOSIXSPACE } /* whitespace */, + { 2870, 2242, 9892, 3, 3, UNI_INNEWA } /* innewa */, + { 0, 9691, 4378, 4, 16, UNI_SUPMATHOPERATORS } /* blk=supmathoperators */, + { 1, 9123, 9454, 6, 5, -UNI_XPOSIXLOWER } /* lower=false */, + { 1128, 3121, 4058, 18, 5, UNI_DT__FIN } /* decompositiontype=final */, + { 0, 9449, 36, 5, 1, UNI_EMOD } /* emod=t */, + { 3091, 9476, 8260, 3, 8, UNI_ARMN } /* sc=armenian */, + { 0, 185, 728, 2, 2, UNI_MN } /* ismn */, + { 1800, 1167, 1026, 26, 2, -UNI_DI } /* defaultignorablecodepoint=no */, + { 1, 9979, 7450, 4, 10, UNI_PHNX } /* scx=phoenician */, + { 47, 7467, 9607, 3, 4, UNI_IN__14 } /* in=14.0 */, + { 0, 10268, 8076, 3, 8, UNI_NV__3_SLASH_8 } /* nv=3.75e-01 */, + { 83, 8782, 9081, 7, 6, UNI_HATR } /* script=hatran */, + { 5, 9735, 10355, 4, 3, 
UNI_CWU } /* cwu=yes */, + { 0, 1869, 0, 5, 0, UNI_TITLE } /* title */, + { 2, 9063, 10055, 6, 4, UNI_EPRES } /* epres=true */, + { 138, 10244, 1172, 3, 2, UNI_TITLE } /* gc=lt */, + { 1089, 9763, 34, 4, 2, UNI_GCB__EX } /* gcb=ex */, + { 8, 3942, 6293, 5, 9, UNI_INGUNJALAGONDI } /* ingunjalagondi */, + { 2, 3877, 9482, 17, 4, UNI_PHLI } /* scriptextensions=phli */, + { 0, 9979, 8420, 4, 8, UNI_MAHJ } /* scx=mahajani */, + { 0, 9979, 6730, 4, 11, UNI_CPMN } /* scx=cyprominoan */, + { 0, 9123, 3, 6, 1, -UNI_XPOSIXLOWER } /* lower=f */, + { 2374, 8782, 3936, 8, 3, UNI_SGNW } /* script=sgnw */, + { 0, 9476, 7500, 3, 4, UNI_SAUR } /* sc=saur */, + { 0, 185, 9294, 2, 5, UNI_BUHD } /* isbuhid */, + { 0, 7460, 8099, 10, 2, UNI_IN__14 } /* presentin=14 */, + { 0, 185, 1935, 2, 11, UNI_NUMBERFORMS } /* isnumberforms */, + { 0, 1553, 10400, 9, 2, UNI_ZS } /* category=zs */, + { 50, 9691, 3076, 4, 9, UNI_HALFMARKS } /* blk=halfmarks */, + { 0, 2143, 0, 21, 0, UNI_CJKRADICALSSUP } /* cjkradicalssupplement */, + { 4, 185, 2879, 2, 19, UNI_MONGOLIANSUP } /* ismongoliansupplement */, + { 0, 9647, 7995, 4, 4, UNI_AGE__12 } /* age=12.0 */, + { 526, 9691, 2269, 4, 11, UNI_INMEETEIMAYEK } /* blk=meeteimayek */, + { 23, 9979, 10000, 5, 3, UNI_SHRD } /* scx=shrd */, + { 1149, 185, 9736, 3, 2, UNI_CWU } /* iscwu */, + { 0, 10268, 8907, 3, 3, UNI_NV__300 } /* nv=300 */, + { 0, 21, 8649, 2, 7, UNI_INKANNADA } /* inkannada */, + { 1163, 185, 1881, 3, 20, UNI_CWU } /* ischangeswhenuppercased */, + { 1, 6083, 9571, 13, 3, UNI_NV__1_SLASH_4 } /* numericvalue=1/4 */, + { 6, 4074, 10400, 16, 2, UNI_ZS } /* generalcategory=zs */, + { 1, 3877, 10039, 17, 4, UNI_THAI } /* scriptextensions=thai */, + { 0, 3877, 5368, 17, 4, UNI_LISU } /* scriptextensions=lisu */, + { 3901, 9549, 10355, 5, 3, UNI_XIDS } /* xids=yes */, + { 135, 2632, 0, 4, 0, UNI_BRAH } /* brah */, + { 0, 3877, 5059, 17, 15, UNI_ZANB } /* scriptextensions=zanabazarsquare */, + { 2625, 3877, 0, 17, 0, UNI_scx_values_index } /* 
scriptextensions= */, + { 9, 7297, 2766, 3, 18, UNI_JAMOEXTB } /* ishanguljamoextendedb */, + { 2309, 10217, 5186, 3, 14, UNI_BC__EN } /* bc=europeannumber */, + { 0, 510, 0, 20, 0, UNI_CJK } /* cjkunifiedideographs */, + { 2, 8544, 0, 7, 0, UNI_CJKEXTA } /* cjkexta */, + { 1541, 49, 0, 1, 0, UNI_P } /* p */, + { 3, 9711, 1779, 4, 2, UNI_CCC__DB } /* ccc=db */, + { 2, 5830, 36, 6, 1, UNI_EBASE } /* ebase=t */, + { 4, 185, 3398, 2, 10, UNI_XPOSIXSPACE } /* iswhitespace */, + { 0, 3877, 3049, 17, 8, UNI_CHER } /* scriptextensions=cherokee */, + { 0, 9691, 750, 4, 30, UNI_ENCLOSEDALPHANUMSUP } /* blk=enclosedalphanumericsupplement */, + { 5, 185, 3928, 2, 17, UNI_SUTTONSIGNWRITING } /* issuttonsignwriting */, + { 3, 9667, 0, 4, 0, UNI_ARMN } /* armn */, + { 7, 10253, 8873, 3, 7, UNI_LB__XX } /* lb=unknown */, + { 577, 8973, 2613, 6, 19, UNI_ANCIENTGREEKNUMBERS } /* block=ancientgreeknumbers */, + { 14, 6578, 39, 12, 2, UNI_XPOSIXDIGIT } /* numerictype=de */, + { 0, 1418, 3596, 24, 5, UNI_CCC__B } /* canonicalcombiningclass=below */, + { 1, 10516, 10528, 7, 5, UNI_POSIXPRINT } /* isposixprint */, + { 0, 9711, 3039, 4, 10, UNI_CCC__AR } /* ccc=aboveright */, + { 1, 5758, 10355, 13, 3, UNI_BIDIM } /* bidimirrored=yes */, + { 3622, 185, 4286, 2, 10, UNI_SM } /* ismathsymbol */, + { 3358, 10346, 0, 3, 1, UNI_VO__U } /* vo=u */, + { 2, 10553, 6924, 3, 3, UNI_SAMR } /* issamr */, + { 24, 9691, 720, 4, 30, UNI_CUNEIFORMNUMBERS } /* blk=cuneiformnumbersandpunctuation */, + { 0, 1553, 75, 9, 2, UNI_ME } /* category=me */, + { 1113, 9063, 1, 6, 1, -UNI_EPRES } /* epres=n */, + { 3, 9979, 8537, 4, 7, UNI_BENG } /* scx=bengali */, + { 832, 10268, 8937, 3, 3, UNI_NV__700 } /* nv=700 */, + { 0, 3877, 8600, 17, 7, UNI_DSRT } /* scriptextensions=deseret */, + { 1, 9979, 9883, 4, 4, UNI_NARB } /* scx=narb */, + { 394, 10253, 7250, 3, 10, UNI_LB__BA } /* lb=breakafter */, + { 3717, 3877, 9959, 17, 4, UNI_RJNG } /* scriptextensions=rjng */, + { 2923, 10553, 8818, 3, 6, UNI_SUPPUAA } /* 
issuppuaa */, + { 1, 8973, 9105, 6, 6, UNI_INKHOJKI } /* block=khojki */, + { 3824, 8881, 8531, 3, 6, UNI_AVST } /* isavestan */, + { 452, 5578, 0, 14, 0, UNI_MN } /* nonspacingmark */, + { 0, 8782, 9871, 7, 3, UNI_MRO } /* script=mro */, + { 0, 4684, 1193, 15, 9, UNI_EA__H } /* eastasianwidth=halfwidth */, + { 11, 10247, 5494, 3, 14, UNI_JG__MANICHAEANTETH } /* jg=manichaeanteth */, + { 4085, 21, 4202, 2, 16, UNI_LINEARBSYLLABARY } /* inlinearbsyllabary */, + { 4, 2784, 9, 19, 2, UNI_HST__NA } /* hangulsyllabletype=na */, + { 1074, 9691, 600, 4, 30, UNI_CJKEXTD } /* blk=cjkunifiedideographsextensiond */, + { 1235, 1, 0, 1, 0, UNI_N } /* n */, + { 0, 3382, 0, 9, 0, UNI_Z } /* separator */, + { 2100, 7467, 7996, 3, 3, UNI_IN__2 } /* in=2.0 */, + { 21, 5172, 10355, 14, 3, UNI_EMOD } /* emojimodifier=yes */, + { 1, 7360, 34, 10, 2, UNI_LB__EX } /* linebreak=ex */, + { 15, 1189, 9208, 3, 5, UNI_INTHAANA } /* inthaana */, + { 3104, 9691, 7159, 4, 11, UNI_YISYLLABLES } /* blk=yisyllables */, + { 20, 9087, 0, 6, 0, UNI_joinc_values_index } /* joinc= */, + { 2945, 5045, 8493, 3, 6, UNI_UCASEXT } /* isucasext */, + { 3, 2248, 2312, 3, 20, UNI_SINHALAARCHAICNUMBERS } /* insinhalaarchaicnumbers */, + { 4, 8973, 980, 6, 27, UNI_ALPHABETICPF } /* block=alphabeticpresentationforms */, + { 3984, 185, 5214, 2, 14, UNI_INGREEK } /* isgreekandcoptic */, + { 2688, 5875, 7187, 13, 3, UNI_JG__QAF } /* joininggroup=qaf */, + { 0, 6083, 8036, 13, 8, UNI_NV__1_SLASH_32 } /* numericvalue=3.12e-02 */, + { 9, 79, 0, 6, 0, UNI_ARAB } /* arabic */, + { 0, 9476, 7016, 3, 11, UNI_HMNG } /* sc=pahawhhmong */, + { 473, 8444, 0, 8, 0, UNI_radical_values_index } /* radical= */, + { 48, 9979, 8635, 4, 7, UNI_HANO } /* scx=hanunoo */, + { 10, 8768, 36, 7, 1, UNI_PATSYN } /* patsyn=t */, + { 304, 7560, 26, 10, 1, UNI_XPOSIXUPPER } /* uppercase=y */, + { 9, 10244, 1045, 3, 6, UNI_L } /* gc=letter */, + { 1732, 185, 1847, 2, 5, UNI_XPOSIXLOWER } /* islower */, + { 2625, 9763, 18, 4, 2, UNI_RI } /* gcb=ri 
*/, + { 0, 10268, 9603, 3, 4, UNI_NV__13_SLASH_2 } /* nv=13/2 */, + { 1861, 9711, 9350, 5, 4, UNI_CCC__24 } /* ccc=ccc24 */, + { 3456, 185, 1859, 3, 20, UNI_CWT } /* ischangeswhentitlecased */, + { 4, 58, 0, 2, 0, UNI_YI } /* yi */, + { 8, 6529, 8755, 3, 6, UNI_INOSMANYA } /* inosmanya */, + { 0, 9469, 869, 3, 17, UNI_PHONETICEXT } /* inphoneticextensions */, + { 576, 9429, 36, 5, 1, UNI_CWCF } /* cwcf=t */, + { 0, 8881, 7202, 4, 8, UNI_ARABICEXTB } /* isarabicextb */, + { 4240, 118, 448, 3, 17, UNI_IDEOGRAPHICSYMBOLS } /* inideographicsymbols */, + { 13, 9711, 9390, 5, 4, UNI_CCC__32 } /* ccc=ccc32 */, + { 1836, 7467, 10067, 3, 4, UNI_IN__12 } /* in=v120 */, + { 0, 2206, 6287, 21, 3, UNI_LB__ZWJ } /* graphemeclusterbreak=zwj */, + { 3, 185, 9807, 2, 4, UNI_KALI } /* iskali */, + { 0, 8973, 7310, 6, 10, UNI_INDIVESAKURU } /* block=divesakuru */, + { 10, 185, 2509, 2, 4, UNI_MONG } /* ismong */, + { 6266, 7297, 2531, 3, 3, UNI_HATR } /* ishatr */, + { 0, 8782, 7501, 8, 3, UNI_SAUR } /* script=saur */, + { 3, 2312, 2100, 4, 4, UNI_INHATRAN } /* inhatran */, + { 0, 9711, 3588, 4, 13, UNI_CCC__202 } /* ccc=attachedbelow */, + { 1631, 10247, 6271, 3, 7, UNI_JG__SEMKATH } /* jg=semkath */, + { 2402, 185, 3157, 2, 17, UNI_EBASE } /* isemojimodifierbase */, + { 264, 4847, 2271, 4, 19, UNI_MEETEIMAYEKEXT } /* inmeeteimayekextensions */, + { 684, 1418, 7923, 24, 2, UNI_CCC__11 } /* canonicalcombiningclass=11 */, + { 0, 3877, 9895, 17, 4, UNI_NKO } /* scriptextensions=nkoo */, + { 0, 7360, 4503, 10, 2, UNI_LB__BB } /* linebreak=bb */, + { 4670, 185, 601, 3, 29, UNI_CJKEXTD } /* iscjkunifiedideographsextensiond */, + { 0, 8628, 1026, 7, 2, -UNI_GRBASE } /* grbase=no */, + { 0, 9691, 5256, 4, 7, UNI_KANASUP } /* blk=kanasup */, + { 19, 9691, 6518, 4, 12, UNI_INMENDEKIKAKUI } /* blk=mendekikakui */, + { 0, 9469, 3012, 5, 19, UNI_INPC__TOPANDBOTTOMANDLEFT } /* inpc=topandbottomandleft */, + { 0, 1990, 4346, 22, 5, UNI_INSC__OTHER } /* indicsyllabiccategory=other */, + { 4, 9847, 
3, 4, 1, -UNI_LOE } /* loe=f */, + { 1890, 9691, 7280, 4, 10, UNI_COMPATJAMO } /* blk=compatjamo */, + { 0, 7360, 10250, 10, 2, UNI_GCB__T } /* linebreak=jt */, + { 0, 10253, 7628, 3, 9, UNI_LB__AI } /* lb=ambiguous */, + { 4669, 5074, 0, 14, 0, UNI_ANCIENTSYMBOLS } /* ancientsymbols */, + { 0, 9476, 8607, 3, 7, UNI_ELBA } /* sc=elbasan */ }; MPH_VALt match_uniprop( const unsigned char * const key, const U16 key_len ) { @@ -7495,57 +7650,57 @@ MPH_VALt match_uniprop( const unsigned char * const key, const U16 key_len ) { /* Generated from: * 688d673ec947f7ccf898b4eae9848139d4d33676b688dee54f449f8bf9d3bbd2 lib/Unicode/UCD.pm - * ce96627d4fc91b4fd886c409caeb9b76cf7bd345e12f05c6701add7f233f6437 lib/unicore/ArabicShaping.txt - * 0e69eef3da722cc104522d8372e86d5b86bb7afcc761b0c991e39e832294946d lib/unicore/BidiBrackets.txt - * a00d9d21585106a52113fb7b1d3d0373a5835be72e76862fb559ebddd474d70e lib/unicore/BidiMirroring.txt - * 81a82b6a9fcf1a9c12f588d7a1decd73a9afdc4cac95b0eb7e576e7942d6c19f lib/unicore/Blocks.txt - * 99d231d7c91688bbe8ca8ccebcc2f46b5b222f844babe4827295bae11e2abe5f lib/unicore/CaseFolding.txt - * 38badafd818d8405324fe298c0676be0c95186368c84b5368375fd871a645144 lib/unicore/CompositionExclusions.txt - * e779a443d3aa2a3166a15becaa2b737c922480e32c0453d5956093633555078f lib/unicore/DAge.txt - * a5d45f59b39deaab3c72ce8c1a2e212a5e086dff11b1f9d5bb0e352642e82248 lib/unicore/DCoreProperties.txt - * 3ac44e11c84bdaf6b207d2c2c20eed857ae17052393fc7f71b0fe951186ba906 lib/unicore/DNormalizationProps.txt - * 4f822ec7a9ebbb3138ad29bade8b9688d25b39c7a3c0b7431f01e7229e4fcb6e lib/unicore/EastAsianWidth.txt - * fc535aa1047a70105ab9a22c2b4c3f363a2ff02fe48ebbc5eeb9873b2752ff0b lib/unicore/EquivalentUnifiedIdeograph.txt - * b9c5158ce944d2fec57e0e4ecb716bdabfc3bdde73525f1772fe03f61a30d473 lib/unicore/HangulSyllableType.txt - * 36c1b2a626ff1fb23b8b21e6ea8712698f8ce668dded1cb48b8ddf6a6a1b04e9 lib/unicore/IdStatus.txt - * 4857c4ffa3898e6128b2d46b0a02e499a663fb91464a69ef3611096f01293acc 
lib/unicore/IdType.txt - * 69197b019fa5f2fb0d8c6ed1ed8acb9f2e8b5b8f45a947953ffa652f3bf54983 lib/unicore/IndicPositionalCategory.txt - * 6604e2f0fde7428675364aa0006bc686b79488dcc60ae8cb29800af2be3352e8 lib/unicore/IndicSyllabicCategory.txt - * 84ead63924aaa74b988b2eaf254a8733276ed108633ce2ef77a9ee1de7818162 lib/unicore/Jamo.txt - * d5abcd8f54c8a2aa912924c485ccf7f968ad98feaa303d8e9a29ad89172f1faf lib/unicore/LineBreak.txt - * 985128e8c8b2540233331d9b27d897d2c23bd5bcf1d05da960befce6efc59542 lib/unicore/NameAliases.txt - * 27282b8aa01d4d0c44aef436cb74195ae8639ffa187aeee4e6247af76febea76 lib/unicore/NamedSequences.txt - * 485b5a3ed25dbf1f94dfa5a9b69d8b4550ffd0c33045ccc55ccfd7c80b2a40cf lib/unicore/PropList.txt - * 6b3902e9268cd843fe65cbdea992108c9528343ec0679f800b96f356bb553e5a lib/unicore/PropValueAliases.txt - * 2bd5777847e3d6add3c7e5c0d1393ddcab89e5a0ac3ff498cb0c53041f0b86e4 lib/unicore/PropertyAliases.txt - * 03a61dc89422e44cc2b73e8e893321007880ab69e2a4d281c0f1bc29c602b9d0 lib/unicore/ScriptExtensions.txt - * 9a5ed1ec9b5f0d7147e9371ad792ab39203611af7637cff2aa4a5c663b172cde lib/unicore/Scripts.txt - * 6424312f1dc39b22e0ff9c0ffb13dfad424d9b03e6a6dc6bca941f6bf5ef1ffd lib/unicore/SpecialCasing.txt - * bdbffbbfc8ad4d3a6d01b5891510458f3d36f7170422af4ea2bed3211a73e8bb lib/unicore/UnicodeData.txt - * 160f41816234addb511901d5f21febd69574578dd93de6ef8153e35693325575 lib/unicore/VerticalOrientation.txt - * 32dfb37d21db530529a6ec3dc13d96f21f8e7c7faf7ff3db8a9760cd76cec81d lib/unicore/auxiliary/GCBTest.txt - * 2bd3c5e2d62701ff81fb3ec318e179a4618cabb1493b1e0dd2b4e7e56c5437c4 lib/unicore/auxiliary/GraphemeBreakProperty.txt - * c51fbebfa82a0f36473b44bfd71d5ef6cb6a1f81fb313375dc9a1910d79bb2b6 lib/unicore/auxiliary/LBTest.txt - * 80b0107750818d8f370bd120b6fe56b6855b60581f72affe8b60409a469b4b65 lib/unicore/auxiliary/SBTest.txt - * 09e3166ebab166ac630a227f77f4e794ebd433271abd5588f5a67e7f199c71ee lib/unicore/auxiliary/SentenceBreakProperty.txt - * 
bf5373ce28a5df06796c93dc159dd15a997bb2950c92704b40ae8190cfc3716d lib/unicore/auxiliary/WBTest.txt - * a2b7373cf2fe3fa3b26dbb53405ca849985f771ff47f1c61743978003ff80499 lib/unicore/auxiliary/WordBreakProperty.txt - * d2686f400a638c80775d7c662556fb8fa8dd3bbe4aa548d9d31624264c6e1bb1 lib/unicore/emoji/emoji.txt - * b827ae5da8c2b08947cc9a120a7b7fd2f1676fb160b508df78075381635b127c lib/unicore/extracted/DBidiClass.txt - * 6fdc5b5ef40444a8f0c772e6b67c00498d4216fe0c0fdf76744ce338f2ad3810 lib/unicore/extracted/DBinaryProperties.txt - * e14928a5bf6ad5958a80332bd42e96e14420080a95c660e5da29384e496755d0 lib/unicore/extracted/DCombiningClass.txt - * 579a03281fbe87b78d5d9a8523de4d255edd7e4ca6eab0e4c7729de97e9b89b1 lib/unicore/extracted/DDecompositionType.txt - * ad83c59b257e9d480ffd3001d4ac240c5fed7cb1919453e1c4e8877035256bcd lib/unicore/extracted/DEastAsianWidth.txt - * 4502f0969e4e6558c4b4c6ca4c23dad70b863d61dd3d5eed1a62a6c3c99fd570 lib/unicore/extracted/DGeneralCategory.txt - * 00bb88b89e2adb646f3177f9444e2d3192386b81a5de9556104b338274b253e1 lib/unicore/extracted/DJoinGroup.txt - * ac835b6e11a60c9820d3cf2d1cb0558dd68efb8f53f404a51632e4726690a6d7 lib/unicore/extracted/DJoinType.txt - * baba9dfc133e3cb770a89aaf0973b1341fa61c2da6c176baf6428898b3b568d8 lib/unicore/extracted/DLineBreak.txt - * 6d4a8c945dd7db83ed617cbb7d937de7f4ecf016ff22970d846e996a7c9a2a5d lib/unicore/extracted/DNumType.txt - * 5b7c14380d5cceeaffcfbc18db1ed936391d2af2d51f5a41f1a17b692c77e59b lib/unicore/extracted/DNumValues.txt - * 4e169849b96b76987a8fc443ef421b44d2dcebbd981bb457f6a13e8af77cdbe2 lib/unicore/mktables - * 50b85a67451145545a65cea370dab8d3444fbfe07e9c34cef560c5b7da9d3eef lib/unicore/version + * c7698811e9adb6cc98fb996a7de4be2b6532f2ac67e76055cc8afdbf6ee18af3 lib/unicore/ArabicShaping.txt + * 24a74555f918bbe99f5b3f1b83cf36fc0e205bb8a600a6a3aa539c710a3dcf27 lib/unicore/BidiBrackets.txt + * 7a5c74cedc1616a9af0a9d22e108ae592d86fe93649c144ae6ba49f193a44122 lib/unicore/BidiMirroring.txt + * 
598870dddef7b34b5a972916528c456aff2765b79cd4f9647fb58ceb767e7f17 lib/unicore/Blocks.txt + * a566cd48687b2cd897e02501118b2413c14ae86d318f9abbbba97feb84189f0f lib/unicore/CaseFolding.txt + * 3360762fc3295cea54ab251c31df621d05ba4b94d46c60eaac29aa16d70ad1e0 lib/unicore/CompositionExclusions.txt + * 7e058dec02147098bc9c28d86209f0f251bba0538f3b5a705ad02ea3bb709fe0 lib/unicore/DAge.txt + * e3eddd7d469cd1b0feed7528defad1a1cc7c6a9ceb0ae4446a6d10921ed2e7bc lib/unicore/DCoreProperties.txt + * b2c444c20730b097787fdf50bd7d6dd3fc5256ab8084f5b35b11c8776eca674c lib/unicore/DNormalizationProps.txt + * f901ac011aa32a09224d6555da71e2532c59c1d3381322829de0e3b880507250 lib/unicore/EastAsianWidth.txt + * 5995522f01633073911dad1edb74d13aa832f42862c0392a79627b85d52f2391 lib/unicore/EquivalentUnifiedIdeograph.txt + * cd1c9367cba438afa965fcb5edc6ed3ec6e685fd5dd21c0cc20c026f04beb0e5 lib/unicore/HangulSyllableType.txt + * 3f3f368fccdb37f350ecedc20b37fa71ab31c04e847884c77780d34283539f73 lib/unicore/IdStatus.txt + * 45a150c23961b58d7784704af6c4daccd6517d97b6489e53d13bbdbf9e4f065f lib/unicore/IdType.txt + * d8704c8725568813a947ff2ef38bcf1f05e2a6fbea6876ba384890f187a8bf61 lib/unicore/IndicPositionalCategory.txt + * c7b969b653dc278fb66ab4136223d320e30ad19367eb791ae60dcc6d92071b16 lib/unicore/IndicSyllabicCategory.txt + * 39ff89e0a329e1ccce6d54fad8cf82e90926901928c0ca9b9a2ad5681f330dd9 lib/unicore/Jamo.txt + * 9e06e9f35c6959fb91dcc7993f90d58523c3079bc62c6b25f828b4cdebc5d70c lib/unicore/LineBreak.txt + * 14b3b677d33f95c51423dce6eef4a6a28b4b160451ecedee4b91edb6745cf4a3 lib/unicore/NameAliases.txt + * db5745688affcdc0c3927a1ee0667018a96a7b24513f866d5235e98fef6c2436 lib/unicore/NamedSequences.txt + * 6bddfdb850417a5bee6deff19290fd1b138589909afb50f5a049f343bf2c6722 lib/unicore/PropList.txt + * eb755757e20b72b330b2948df3cf2ff7adb0e31bb060140dc09dafb132ace2cd lib/unicore/PropValueAliases.txt + * 859d7225f2d2a460b3ccb1d61a7945f8cc219acdf5aa53b66b7a1e4bf6ebfc87 lib/unicore/PropertyAliases.txt + * 
d37eedf63ff9c48bac863d5f76862373d6cf5269fd21253d499e2430d638c01d lib/unicore/ScriptExtensions.txt + * 52db475c4ec445e73b0b16915448c357614946ad7062843c563e00d7535c6510 lib/unicore/Scripts.txt + * c667b45908fd269af25fd55d2fc5bbc157fb1b77675936e25c513ce32e080334 lib/unicore/SpecialCasing.txt + * 36018e68657fdcb3485f636630ffe8c8532e01c977703d2803f5b89d6c5feafb lib/unicore/UnicodeData.txt + * 869ff43dd012f924d03c89fc268c88f0e7eea72f0228b91ca30455afdb84f8fd lib/unicore/VerticalOrientation.txt + * ddc7d4d1f3838573b94fc5d83ff7217e63c47b22ae1cd40c5fe1a54efc15589b lib/unicore/auxiliary/GCBTest.txt + * 97e79f1f8d9cd76d120f2420381a01abc00a7c78a2aa583fa3f9627264a99742 lib/unicore/auxiliary/GraphemeBreakProperty.txt + * 488dbb6a7e1d0070d4aa7c175352c818ff6425172850d1b40c6177726658cb05 lib/unicore/auxiliary/LBTest.txt + * 7e42dd749dbb94aa44b13faf9df6319d9a16ce2ea09a3a094fcfbb5962168040 lib/unicore/auxiliary/SBTest.txt + * 7092ca4117cec891c25c7724132efc519e1dece01ae9fd6068035a9db04d526e lib/unicore/auxiliary/SentenceBreakProperty.txt + * 8094b544ec1580c7e41ac0187805cc1aeb330a90301ec7505563e1a59318284e lib/unicore/auxiliary/WBTest.txt + * 7716752aad296d4ab23ff4ed0a2746fc5328750ff84e9e7d6f3828ee9eaef742 lib/unicore/auxiliary/WordBreakProperty.txt + * b597836124298b8f7fa076273802840cfc3271a25f5c397a082e120954b82c3c lib/unicore/emoji/emoji.txt + * e5fe51acc74e3e83b4fb4c7b25f3c34491d6eb8095c9955d0712dafbca7b3c2b lib/unicore/extracted/DBidiClass.txt + * cd0a14176d93bf440b77a582a0d678190fc0688b15442d4cfb250bf2e27956af lib/unicore/extracted/DBinaryProperties.txt + * 12b0c3af9b600b49488d66545a3e7844ea980809627201bf9afeebe1c9f16f4e lib/unicore/extracted/DCombiningClass.txt + * f76064b298cfbd715ba542e7894f7a507d32da2f011070d1d01df95cad9817d6 lib/unicore/extracted/DDecompositionType.txt + * f9bef074cc916db57fece99d54a4505f8e7c7b17481619e3f0005211f7717d4b lib/unicore/extracted/DEastAsianWidth.txt + * cde679c8461976ed40d7edf61ae98cbb947540831f06f5bc7da7decbf91a1420 
lib/unicore/extracted/DGeneralCategory.txt + * 9bb891831328713603a486a4a03df7f7987c3e1e8144a6d1ac71fd061ef3f732 lib/unicore/extracted/DJoinGroup.txt + * e97c65bbea0a69d2fae6ec4182b09e519e13232e20bd804b3004edc0f36bb0d4 lib/unicore/extracted/DJoinType.txt + * 43f6df50e4878f501b417e366b0ee097ae5ccb2d4ce942026bed3d62d78e7887 lib/unicore/extracted/DLineBreak.txt + * a04502ebb36a45d83cbe48a7d8132ea8143edb7b3d34d0aa6afe4a9685049741 lib/unicore/extracted/DNumType.txt + * 11075771b112e8e7ccf6ffa637c4c91eadc3ef3db0517b24e605df8fd3624239 lib/unicore/extracted/DNumValues.txt + * 24b7b7bda1a2ab4684ba53355d82ad227c1624b337b37c3b96f2e4b902eea1f2 lib/unicore/mktables + * c72bbdeda99714db1c8024d3311da4aef3c0db3b9b9f11455a7cfe10d5e9aba3 lib/unicore/version * 0a6b5ab33bb1026531f816efe81aea1a8ffcd34a27cbea37dd6a70a63d73c844 regen/charset_translations.pl * 5f8520d3a17ade6317fc0c423f5091470924b1ef425bca0c41ce8e4a9f8460fe regen/mk_PL_charclass.pl - * 04a5294218c412e5ee2e0d9f8d22af1d95bbfd2cafae3935cbb6b5871e9f9704 regen/mk_invlists.pl + * 6defb8383a69034f8279fea4ff66e09bf58049c4cbecf2331b9b245c45d4f2d5 regen/mk_invlists.pl * cf1d68efb7d919d302c4005641eae8d36da6d7850816ad374b0c00b45e609f43 regen/mph.pl * ex: set ro: */ diff --git a/unicode_constants.h b/unicode_constants.h index eea66f6ba4..56933b8f11 100644 --- a/unicode_constants.h +++ b/unicode_constants.h @@ -45,7 +45,7 @@ bytes. =cut */ -#define UNICODE_MAJOR_VERSION 13 +#define UNICODE_MAJOR_VERSION 14 #define UNICODE_DOT_VERSION 0 #define UNICODE_DOT_DOT_VERSION 0 @@ -190,7 +190,7 @@ bytes. /* The number of code points not matching \pC */ #ifdef PERL_IN_REGCOMP_C -# define NON_OTHER_COUNT 143698 +# define NON_OTHER_COUNT 144534 #endif /* The highest code point that has any type of case change */ -- cgit v1.2.1