diff options
author | Karl Williamson <khw@cpan.org> | 2020-02-03 16:20:03 -0700 |
---|---|---|
committer | Karl Williamson <khw@cpan.org> | 2020-02-03 16:34:56 -0700 |
commit | f9c633636bbfa6e7a869340ac7e4ed3244172e5d (patch) | |
tree | bc682921241bd19e35abc65afb655b8b1825a170 /lib | |
parent | ac92cca2aeae8ca2e2b1306a5a9547c186077cfd (diff) | |
download | perl-f9c633636bbfa6e7a869340ac7e4ed3244172e5d.tar.gz |
Support Unicode properties Identifier_(Status|Type)
The Unicode regular expression specification, UTS #18, now asks that
these non-UCD properties be supported.
Their data files give the version in the header using a slightly
different syntax than UCD files do. In this commit, I modify the file
headers to fit the UCD form, but the parsing of versions in mktables
will probably have to be generalized at some point.
Diffstat (limited to 'lib')
-rw-r--r-- | lib/unicore/IdStatus.txt | 2 | ||||
-rw-r--r-- | lib/unicore/IdType.txt | 2 | ||||
-rw-r--r-- | lib/unicore/mktables | 40 | ||||
-rw-r--r-- | lib/unicore/uni_keywords.pl | 1857 |
4 files changed, 978 insertions, 923 deletions
diff --git a/lib/unicore/IdStatus.txt b/lib/unicore/IdStatus.txt index 6fa8e0d4a0..4837df0a28 100644 --- a/lib/unicore/IdStatus.txt +++ b/lib/unicore/IdStatus.txt @@ -1,4 +1,4 @@ -# IdentifierStatus.txt +# IdentifierStatus-13.0.0.txt # Date: 2019-10-22, 13:05:26 GMT # © 2019 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. diff --git a/lib/unicore/IdType.txt b/lib/unicore/IdType.txt index 74893b67ce..df79a86421 100644 --- a/lib/unicore/IdType.txt +++ b/lib/unicore/IdType.txt @@ -1,4 +1,4 @@ -# IdentifierType.txt +# IdentifierType-13.0.0.txt # Date: 2019-11-05, 08:05:20 GMT # © 2019 Unicode®, Inc. # Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries. diff --git a/lib/unicore/mktables b/lib/unicore/mktables index f11e466823..40ac545bc7 100644 --- a/lib/unicore/mktables +++ b/lib/unicore/mktables @@ -1468,6 +1468,7 @@ my $DI; # Default_Ignorable_Code_Point property my $NChar; # Noncharacter_Code_Point property my $script; my $scx; # Script_Extensions property +my $idt; # Identifier_Type property # Are there conflicting names because of beginning with 'In_', or 'Is_' my $has_In_conflicts = 0; @@ -13546,6 +13547,36 @@ sub filter_emojidata_line { return; } +sub setup_IdStatus { + my $ids = Property->new('Identifier_Status', + Match_SubDir => 'IdStatus', + Default_Map => 'Restricted', + ); + $ids->add_match_table('Allowed'); +} + +sub setup_IdType { + $idt = Property->new('Identifier_Type', + Match_SubDir => 'IdType', + Default_Map => 'Not_Character', + Format => $STRING_WHITE_SPACE_LIST, + ); +} + +sub filter_IdType_line { + + # Some code points have more than one type, separated by spaces on the + # input. For now, we just add everything as a property value. 
Later when + # we look for properties with format $STRING_WHITE_SPACE_LIST, we resolve + # things + + my @fields = split /\s*;\s*/; + my $types = $fields[1]; + $idt->add_match_table($types) unless defined $idt->table($types); + + return; +} + sub generate_hst { # Populates the Hangul Syllable Type property from first principles @@ -20133,6 +20164,15 @@ my @input_file_objects = ( Input_file->new("$EMOJI/emoji.txt", v13.0.0, Has_Missings_Defaults => $NOT_IGNORED, ), + Input_file->new('IdStatus.txt', v13.0.0, + Pre_Handler => \&setup_IdStatus, + Property => 'Identifier_Status', + ), + Input_file->new('IdType.txt', v13.0.0, + Pre_Handler => \&setup_IdType, + Each_Line_Handler => \&filter_IdType_line, + Property => 'Identifier_Type', + ), ); # End of all the preliminaries. diff --git a/lib/unicore/uni_keywords.pl b/lib/unicore/uni_keywords.pl index 894ede5df4..649cc07fac 100644 --- a/lib/unicore/uni_keywords.pl +++ b/lib/unicore/uni_keywords.pl @@ -4,19 +4,19 @@ # Any changes made here will be lost! 
%Unicode::UCD::uni_prop_ptrs_indices = ( - '_perl_any_folds' => 1174, - '_perl_charname_begin' => 1175, - '_perl_charname_continue' => 1176, - '_perl_folds_to_multi_char' => 1177, - '_perl_idcont' => 1178, - '_perl_idstart' => 1179, - '_perl_is_in_multi_char_fold' => 1180, - '_perl_nchar' => 1181, - '_perl_patws' => 1182, - '_perl_problematic_locale_foldeds_start' => 1183, - '_perl_problematic_locale_folds' => 1184, - '_perl_quotemeta' => 1185, - '_perl_surrogate' => 1186, + '_perl_any_folds' => 1187, + '_perl_charname_begin' => 1188, + '_perl_charname_continue' => 1189, + '_perl_folds_to_multi_char' => 1190, + '_perl_idcont' => 1191, + '_perl_idstart' => 1192, + '_perl_is_in_multi_char_fold' => 1193, + '_perl_nchar' => 1194, + '_perl_patws' => 1195, + '_perl_problematic_locale_foldeds_start' => 1196, + '_perl_problematic_locale_folds' => 1197, + '_perl_quotemeta' => 1198, + '_perl_surrogate' => 1199, 'adlm' => 1, 'aegeannumbers' => 2, 'age=10' => 3, @@ -43,13 +43,13 @@ 'age=9' => 24, 'age=na' => 25, 'aghb' => 26, - 'ahex' => 957, + 'ahex' => 970, 'ahom' => 27, 'alchemical' => 28, 'all' => 29, - 'alnum' => 1148, - 'alpha' => 1149, - 'alphabetic' => 1149, + 'alnum' => 1161, + 'alpha' => 1162, + 'alphabetic' => 1162, 'alphabeticpf' => 30, 'ancientgreekmusic' => 31, 'ancientgreeknumbers' => 32, @@ -65,7 +65,7 @@ 'armn' => 42, 'arrows' => 43, 'ascii' => 44, - 'asciihexdigit' => 957, + 'asciihexdigit' => 970, 'assigned' => 45, 'avst' => 46, 'bali' => 47, @@ -101,7 +101,7 @@ 'bhks' => 76, 'bidic' => 77, 'bidim' => 78, - 'blank' => 1150, + 'blank' => 1163, 'blockelements' => 79, 'bopo' => 80, 'bopomofoext' => 81, @@ -120,7 +120,7 @@ 'cari' => 94, 'cased' => 95, 'casedletter' => 96, - 'cc' => 1151, + 'cc' => 1164, 'ccc=0' => 97, 'ccc=1' => 98, 'ccc=10' => 99, @@ -201,11 +201,11 @@ 'cjkstrokes' => 174, 'cjksymbols' => 175, 'cn' => 176, - 'cntrl' => 1151, + 'cntrl' => 1164, 'co' => 177, 'compatjamo' => 178, 'compex' => 179, - 'control' => 1151, + 'control' => 1164, 
'controlpictures' => 180, 'copt' => 181, 'copticepactnumbers' => 182, @@ -226,7 +226,7 @@ 'cyrillicsup' => 197, 'cyrl' => 198, 'dash' => 199, - 'decimalnumber' => 1152, + 'decimalnumber' => 1165, 'dep' => 200, 'deva' => 201, 'devanagariext' => 202, @@ -237,7 +237,7 @@ 'diacriticalsforsymbols' => 207, 'diacriticalssup' => 208, 'diak' => 209, - 'digit' => 1152, + 'digit' => 1165, 'dingbats' => 210, 'dogr' => 211, 'domino' => 212, @@ -307,7 +307,7 @@ 'gonm' => 276, 'goth' => 277, 'gran' => 278, - 'graph' => 1153, + 'graph' => 1166, 'grbase' => 279, 'greekext' => 280, 'grek' => 281, @@ -321,914 +321,927 @@ 'hano' => 289, 'hatr' => 290, 'hebr' => 291, - 'hex' => 1160, - 'hexdigit' => 1160, + 'hex' => 1173, + 'hexdigit' => 1173, 'highpusurrogates' => 292, 'highsurrogates' => 293, 'hira' => 294, 'hluw' => 295, 'hmng' => 296, 'hmnp' => 297, - 'horizspace' => 1150, + 'horizspace' => 1163, 'hst=na' => 298, 'hung' => 299, 'hyphen_perl_aux' => 300, 'idc' => 301, - 'ideo' => 302, - 'ideographicsymbols' => 303, - 'ids' => 304, - 'idsb' => 305, - 'idst' => 306, - 'in=1.1' => 504, - 'in=10' => 499, - 'in=11' => 500, - 'in=12' => 501, - 'in=12.1' => 502, - 'in=13' => 503, - 'in=2' => 505, - 'in=2.1' => 506, - 'in=3' => 507, - 'in=3.1' => 508, - 'in=3.2' => 509, - 'in=4' => 510, - 'in=4.1' => 511, - 'in=5' => 512, - 'in=5.1' => 513, - 'in=5.2' => 514, - 'in=6' => 515, - 'in=6.1' => 516, - 'in=6.2' => 517, - 'in=6.3' => 518, - 'in=7' => 519, - 'in=8' => 520, - 'in=9' => 521, - 'inadlam' => 307, - 'inahom' => 308, - 'inanatolianhieroglyphs' => 309, - 'inarabic' => 310, - 'inarmenian' => 311, - 'inavestan' => 312, - 'inbalinese' => 313, - 'inbamum' => 314, - 'inbassavah' => 315, - 'inbatak' => 316, - 'inbengali' => 317, - 'inbhaiksuki' => 318, - 'inbopomofo' => 319, - 'inbrahmi' => 320, - 'inbuginese' => 321, - 'inbuhid' => 322, - 'incarian' => 323, - 'incaucasianalbanian' => 324, - 'inchakma' => 325, - 'incham' => 326, - 'incherokee' => 327, - 'inchorasmian' => 328, - 'incoptic' => 
329, - 'incuneiform' => 330, - 'incyrillic' => 331, - 'indevanagari' => 332, - 'indicnumberforms' => 333, - 'indicsiyaqnumbers' => 334, - 'indivesakuru' => 335, - 'indogra' => 336, - 'induployan' => 337, - 'inegyptianhieroglyphs' => 338, - 'inelbasan' => 339, - 'inelymaic' => 340, - 'inethiopic' => 341, - 'ingeorgian' => 342, - 'inglagolitic' => 343, - 'ingothic' => 344, - 'ingrantha' => 345, - 'ingreek' => 346, - 'ingujarati' => 347, - 'ingunjalagondi' => 348, - 'ingurmukhi' => 349, - 'inhangul' => 350, - 'inhanifirohingya' => 351, - 'inhanunoo' => 352, - 'inhatran' => 353, - 'inhebrew' => 354, - 'inhiragana' => 355, - 'inidc' => 356, - 'inimperialaramaic' => 357, - 'ininscriptionalpahlavi' => 358, - 'ininscriptionalparthian' => 359, - 'injavanese' => 360, - 'inkaithi' => 361, - 'inkannada' => 362, - 'inkatakana' => 363, - 'inkharoshthi' => 364, - 'inkhitansmallscript' => 365, - 'inkhmer' => 366, - 'inkhojki' => 367, - 'inkhudawadi' => 368, - 'inlao' => 369, - 'inlepcha' => 370, - 'inlimbu' => 371, - 'inlineara' => 372, - 'inlisu' => 373, - 'inlycian' => 374, - 'inlydian' => 375, - 'inmahajani' => 376, - 'inmakasar' => 377, - 'inmalayalam' => 378, - 'inmandaic' => 379, - 'inmanichaean' => 380, - 'inmarchen' => 381, - 'inmasaramgondi' => 382, - 'inmedefaidrin' => 383, - 'inmeeteimayek' => 384, - 'inmendekikakui' => 385, - 'inmeroiticcursive' => 386, - 'inmiao' => 387, - 'inmodi' => 388, - 'inmongolian' => 389, - 'inmro' => 390, - 'inmultani' => 391, - 'inmyanmar' => 392, - 'innabataean' => 393, - 'innandinagari' => 394, - 'innewa' => 395, - 'innewtailue' => 396, - 'innko' => 397, - 'innushu' => 398, - 'innyiakengpuachuehmong' => 399, - 'inogham' => 400, - 'inoldhungarian' => 401, - 'inolditalic' => 402, - 'inoldpermic' => 403, - 'inoldpersian' => 404, - 'inoldsogdian' => 405, - 'inoldturkic' => 406, - 'inoriya' => 407, - 'inosage' => 408, - 'inosmanya' => 409, - 'inpahawhhmong' => 410, - 'inpaucinhau' => 411, - 'inpc=bottom' => 412, - 'inpc=bottomandleft' => 413, - 
'inpc=bottomandright' => 414, - 'inpc=left' => 415, - 'inpc=leftandright' => 416, - 'inpc=na' => 417, - 'inpc=overstruck' => 418, - 'inpc=right' => 419, - 'inpc=top' => 420, - 'inpc=topandbottom' => 421, - 'inpc=topandbottomandleft' => 422, - 'inpc=topandbottomandright' => 423, - 'inpc=topandleft' => 424, - 'inpc=topandleftandright' => 425, - 'inpc=topandright' => 426, - 'inphagspa' => 427, - 'inphoenician' => 428, - 'inpsalterpahlavi' => 429, - 'inpunctuation' => 430, - 'inrejang' => 431, - 'inrunic' => 432, - 'insamaritan' => 433, - 'insaurashtra' => 434, - 'insc=avagraha' => 435, - 'insc=bindu' => 436, - 'insc=brahmijoiningnumber' => 437, - 'insc=cantillationmark' => 438, - 'insc=consonant' => 439, - 'insc=consonantdead' => 440, - 'insc=consonantfinal' => 441, - 'insc=consonantheadletter' => 442, - 'insc=consonantinitialpostfixed' => 443, - 'insc=consonantkiller' => 444, - 'insc=consonantmedial' => 445, - 'insc=consonantplaceholder' => 446, - 'insc=consonantprecedingrepha' => 447, - 'insc=consonantprefixed' => 448, - 'insc=consonantsubjoined' => 449, - 'insc=consonantsucceedingrepha' => 450, - 'insc=consonantwithstacker' => 451, - 'insc=geminationmark' => 452, - 'insc=invisiblestacker' => 453, - 'insc=modifyingletter' => 454, - 'insc=nonjoiner' => 455, - 'insc=nukta' => 456, - 'insc=number' => 457, - 'insc=numberjoiner' => 458, - 'insc=other' => 459, - 'insc=purekiller' => 460, - 'insc=registershifter' => 461, - 'insc=syllablemodifier' => 462, - 'insc=toneletter' => 463, - 'insc=tonemark' => 464, - 'insc=virama' => 465, - 'insc=visarga' => 466, - 'insc=vowel' => 467, - 'insc=voweldependent' => 468, - 'insc=vowelindependent' => 469, - 'insiddham' => 470, - 'insinhala' => 471, - 'insogdian' => 472, - 'insorasompeng' => 473, - 'insoyombo' => 474, - 'insundanese' => 475, - 'insylotinagri' => 476, - 'insyriac' => 477, - 'intagalog' => 478, - 'intagbanwa' => 479, - 'intaile' => 480, - 'intaitham' => 481, - 'intaiviet' => 482, - 'intakri' => 483, - 'intamil' => 484, - 
'intangut' => 485, - 'intelugu' => 486, - 'inthaana' => 487, - 'inthai' => 488, - 'intibetan' => 489, - 'intifinagh' => 490, - 'intirhuta' => 491, - 'inugaritic' => 492, - 'invai' => 493, - 'invs' => 494, - 'inwancho' => 495, - 'inwarangciti' => 496, - 'inyezidi' => 497, - 'inzanabazarsquare' => 498, - 'ipaext' => 522, - 'ital' => 523, - 'jamo' => 524, - 'jamoexta' => 525, - 'jamoextb' => 526, - 'java' => 527, - 'jg=africanfeh' => 528, - 'jg=africannoon' => 529, - 'jg=africanqaf' => 530, - 'jg=ain' => 531, - 'jg=alaph' => 532, - 'jg=alef' => 533, - 'jg=beh' => 534, - 'jg=beth' => 535, - 'jg=burushaskiyehbarree' => 536, - 'jg=dal' => 537, - 'jg=dalathrish' => 538, - 'jg=e' => 539, - 'jg=farsiyeh' => 540, - 'jg=fe' => 541, - 'jg=feh' => 542, - 'jg=finalsemkath' => 543, - 'jg=gaf' => 544, - 'jg=gamal' => 545, - 'jg=hah' => 546, - 'jg=hamzaonhehgoal' => 547, - 'jg=hanifirohingyakinnaya' => 548, - 'jg=hanifirohingyapa' => 549, - 'jg=he' => 550, - 'jg=heh' => 551, - 'jg=hehgoal' => 552, - 'jg=heth' => 553, - 'jg=kaf' => 554, - 'jg=kaph' => 555, - 'jg=khaph' => 556, - 'jg=knottedheh' => 557, - 'jg=lam' => 558, - 'jg=lamadh' => 559, - 'jg=malayalambha' => 560, - 'jg=malayalamja' => 561, - 'jg=malayalamlla' => 562, - 'jg=malayalamllla' => 563, - 'jg=malayalamnga' => 564, - 'jg=malayalamnna' => 565, - 'jg=malayalamnnna' => 566, - 'jg=malayalamnya' => 567, - 'jg=malayalamra' => 568, - 'jg=malayalamssa' => 569, - 'jg=malayalamtta' => 570, - 'jg=manichaeanaleph' => 571, - 'jg=manichaeanayin' => 572, - 'jg=manichaeanbeth' => 573, - 'jg=manichaeandaleth' => 574, - 'jg=manichaeandhamedh' => 575, - 'jg=manichaeanfive' => 576, - 'jg=manichaeangimel' => 577, - 'jg=manichaeanheth' => 578, - 'jg=manichaeanhundred' => 579, - 'jg=manichaeankaph' => 580, - 'jg=manichaeanlamedh' => 581, - 'jg=manichaeanmem' => 582, - 'jg=manichaeannun' => 583, - 'jg=manichaeanone' => 584, - 'jg=manichaeanpe' => 585, - 'jg=manichaeanqoph' => 586, - 'jg=manichaeanresh' => 587, - 'jg=manichaeansadhe' => 588, 
- 'jg=manichaeansamekh' => 589, - 'jg=manichaeantaw' => 590, - 'jg=manichaeanten' => 591, - 'jg=manichaeanteth' => 592, - 'jg=manichaeanthamedh' => 593, - 'jg=manichaeantwenty' => 594, - 'jg=manichaeanwaw' => 595, - 'jg=manichaeanyodh' => 596, - 'jg=manichaeanzayin' => 597, - 'jg=meem' => 598, - 'jg=mim' => 599, - 'jg=nojoininggroup' => 600, - 'jg=noon' => 601, - 'jg=nun' => 602, - 'jg=nya' => 603, - 'jg=pe' => 604, - 'jg=qaf' => 605, - 'jg=qaph' => 606, - 'jg=reh' => 607, - 'jg=reversedpe' => 608, - 'jg=rohingyayeh' => 609, - 'jg=sad' => 610, - 'jg=sadhe' => 611, - 'jg=seen' => 612, - 'jg=semkath' => 613, - 'jg=shin' => 614, - 'jg=straightwaw' => 615, - 'jg=swashkaf' => 616, - 'jg=syriacwaw' => 617, - 'jg=tah' => 618, - 'jg=taw' => 619, - 'jg=tehmarbuta' => 620, - 'jg=teth' => 621, - 'jg=waw' => 622, - 'jg=yeh' => 623, - 'jg=yehbarree' => 624, - 'jg=yehwithtail' => 625, - 'jg=yudh' => 626, - 'jg=yudhhe' => 627, - 'jg=zain' => 628, - 'jg=zhain' => 629, - 'joinc' => 630, - 'jt=c' => 631, - 'jt=d' => 632, - 'jt=l' => 633, - 'jt=r' => 634, - 'jt=t' => 635, - 'jt=u' => 636, - 'kali' => 637, - 'kana' => 638, - 'kanaexta' => 639, - 'kanasup' => 640, - 'kanbun' => 641, - 'kangxi' => 642, - 'katakanaext' => 643, - 'khar' => 644, - 'khmersymbols' => 645, - 'khmr' => 646, - 'khoj' => 647, - 'kits' => 648, - 'knda' => 649, - 'kthi' => 650, - 'l' => 651, + 'identifierstatus=allowed' => 302, + 'identifierstatus=restricted' => 303, + 'identifiertype=defaultignorable' => 304, + 'identifiertype=exclusion' => 305, + 'identifiertype=inclusion' => 306, + 'identifiertype=limiteduse' => 307, + 'identifiertype=notcharacter' => 308, + 'identifiertype=notnfkc' => 309, + 'identifiertype=notxid' => 310, + 'identifiertype=obsolete' => 311, + 'identifiertype=recommended' => 312, + 'identifiertype=technical' => 313, + 'identifiertype=uncommonuse' => 314, + 'ideo' => 315, + 'ideographicsymbols' => 316, + 'ids' => 317, + 'idsb' => 318, + 'idst' => 319, + 'in=1.1' => 517, + 'in=10' => 512, + 
'in=11' => 513, + 'in=12' => 514, + 'in=12.1' => 515, + 'in=13' => 516, + 'in=2' => 518, + 'in=2.1' => 519, + 'in=3' => 520, + 'in=3.1' => 521, + 'in=3.2' => 522, + 'in=4' => 523, + 'in=4.1' => 524, + 'in=5' => 525, + 'in=5.1' => 526, + 'in=5.2' => 527, + 'in=6' => 528, + 'in=6.1' => 529, + 'in=6.2' => 530, + 'in=6.3' => 531, + 'in=7' => 532, + 'in=8' => 533, + 'in=9' => 534, + 'inadlam' => 320, + 'inahom' => 321, + 'inanatolianhieroglyphs' => 322, + 'inarabic' => 323, + 'inarmenian' => 324, + 'inavestan' => 325, + 'inbalinese' => 326, + 'inbamum' => 327, + 'inbassavah' => 328, + 'inbatak' => 329, + 'inbengali' => 330, + 'inbhaiksuki' => 331, + 'inbopomofo' => 332, + 'inbrahmi' => 333, + 'inbuginese' => 334, + 'inbuhid' => 335, + 'incarian' => 336, + 'incaucasianalbanian' => 337, + 'inchakma' => 338, + 'incham' => 339, + 'incherokee' => 340, + 'inchorasmian' => 341, + 'incoptic' => 342, + 'incuneiform' => 343, + 'incyrillic' => 344, + 'indevanagari' => 345, + 'indicnumberforms' => 346, + 'indicsiyaqnumbers' => 347, + 'indivesakuru' => 348, + 'indogra' => 349, + 'induployan' => 350, + 'inegyptianhieroglyphs' => 351, + 'inelbasan' => 352, + 'inelymaic' => 353, + 'inethiopic' => 354, + 'ingeorgian' => 355, + 'inglagolitic' => 356, + 'ingothic' => 357, + 'ingrantha' => 358, + 'ingreek' => 359, + 'ingujarati' => 360, + 'ingunjalagondi' => 361, + 'ingurmukhi' => 362, + 'inhangul' => 363, + 'inhanifirohingya' => 364, + 'inhanunoo' => 365, + 'inhatran' => 366, + 'inhebrew' => 367, + 'inhiragana' => 368, + 'inidc' => 369, + 'inimperialaramaic' => 370, + 'ininscriptionalpahlavi' => 371, + 'ininscriptionalparthian' => 372, + 'injavanese' => 373, + 'inkaithi' => 374, + 'inkannada' => 375, + 'inkatakana' => 376, + 'inkharoshthi' => 377, + 'inkhitansmallscript' => 378, + 'inkhmer' => 379, + 'inkhojki' => 380, + 'inkhudawadi' => 381, + 'inlao' => 382, + 'inlepcha' => 383, + 'inlimbu' => 384, + 'inlineara' => 385, + 'inlisu' => 386, + 'inlycian' => 387, + 'inlydian' => 388, + 
'inmahajani' => 389, + 'inmakasar' => 390, + 'inmalayalam' => 391, + 'inmandaic' => 392, + 'inmanichaean' => 393, + 'inmarchen' => 394, + 'inmasaramgondi' => 395, + 'inmedefaidrin' => 396, + 'inmeeteimayek' => 397, + 'inmendekikakui' => 398, + 'inmeroiticcursive' => 399, + 'inmiao' => 400, + 'inmodi' => 401, + 'inmongolian' => 402, + 'inmro' => 403, + 'inmultani' => 404, + 'inmyanmar' => 405, + 'innabataean' => 406, + 'innandinagari' => 407, + 'innewa' => 408, + 'innewtailue' => 409, + 'innko' => 410, + 'innushu' => 411, + 'innyiakengpuachuehmong' => 412, + 'inogham' => 413, + 'inoldhungarian' => 414, + 'inolditalic' => 415, + 'inoldpermic' => 416, + 'inoldpersian' => 417, + 'inoldsogdian' => 418, + 'inoldturkic' => 419, + 'inoriya' => 420, + 'inosage' => 421, + 'inosmanya' => 422, + 'inpahawhhmong' => 423, + 'inpaucinhau' => 424, + 'inpc=bottom' => 425, + 'inpc=bottomandleft' => 426, + 'inpc=bottomandright' => 427, + 'inpc=left' => 428, + 'inpc=leftandright' => 429, + 'inpc=na' => 430, + 'inpc=overstruck' => 431, + 'inpc=right' => 432, + 'inpc=top' => 433, + 'inpc=topandbottom' => 434, + 'inpc=topandbottomandleft' => 435, + 'inpc=topandbottomandright' => 436, + 'inpc=topandleft' => 437, + 'inpc=topandleftandright' => 438, + 'inpc=topandright' => 439, + 'inphagspa' => 440, + 'inphoenician' => 441, + 'inpsalterpahlavi' => 442, + 'inpunctuation' => 443, + 'inrejang' => 444, + 'inrunic' => 445, + 'insamaritan' => 446, + 'insaurashtra' => 447, + 'insc=avagraha' => 448, + 'insc=bindu' => 449, + 'insc=brahmijoiningnumber' => 450, + 'insc=cantillationmark' => 451, + 'insc=consonant' => 452, + 'insc=consonantdead' => 453, + 'insc=consonantfinal' => 454, + 'insc=consonantheadletter' => 455, + 'insc=consonantinitialpostfixed' => 456, + 'insc=consonantkiller' => 457, + 'insc=consonantmedial' => 458, + 'insc=consonantplaceholder' => 459, + 'insc=consonantprecedingrepha' => 460, + 'insc=consonantprefixed' => 461, + 'insc=consonantsubjoined' => 462, + 
'insc=consonantsucceedingrepha' => 463, + 'insc=consonantwithstacker' => 464, + 'insc=geminationmark' => 465, + 'insc=invisiblestacker' => 466, + 'insc=modifyingletter' => 467, + 'insc=nonjoiner' => 468, + 'insc=nukta' => 469, + 'insc=number' => 470, + 'insc=numberjoiner' => 471, + 'insc=other' => 472, + 'insc=purekiller' => 473, + 'insc=registershifter' => 474, + 'insc=syllablemodifier' => 475, + 'insc=toneletter' => 476, + 'insc=tonemark' => 477, + 'insc=virama' => 478, + 'insc=visarga' => 479, + 'insc=vowel' => 480, + 'insc=voweldependent' => 481, + 'insc=vowelindependent' => 482, + 'insiddham' => 483, + 'insinhala' => 484, + 'insogdian' => 485, + 'insorasompeng' => 486, + 'insoyombo' => 487, + 'insundanese' => 488, + 'insylotinagri' => 489, + 'insyriac' => 490, + 'intagalog' => 491, + 'intagbanwa' => 492, + 'intaile' => 493, + 'intaitham' => 494, + 'intaiviet' => 495, + 'intakri' => 496, + 'intamil' => 497, + 'intangut' => 498, + 'intelugu' => 499, + 'inthaana' => 500, + 'inthai' => 501, + 'intibetan' => 502, + 'intifinagh' => 503, + 'intirhuta' => 504, + 'inugaritic' => 505, + 'invai' => 506, + 'invs' => 507, + 'inwancho' => 508, + 'inwarangciti' => 509, + 'inyezidi' => 510, + 'inzanabazarsquare' => 511, + 'ipaext' => 535, + 'ital' => 536, + 'jamo' => 537, + 'jamoexta' => 538, + 'jamoextb' => 539, + 'java' => 540, + 'jg=africanfeh' => 541, + 'jg=africannoon' => 542, + 'jg=africanqaf' => 543, + 'jg=ain' => 544, + 'jg=alaph' => 545, + 'jg=alef' => 546, + 'jg=beh' => 547, + 'jg=beth' => 548, + 'jg=burushaskiyehbarree' => 549, + 'jg=dal' => 550, + 'jg=dalathrish' => 551, + 'jg=e' => 552, + 'jg=farsiyeh' => 553, + 'jg=fe' => 554, + 'jg=feh' => 555, + 'jg=finalsemkath' => 556, + 'jg=gaf' => 557, + 'jg=gamal' => 558, + 'jg=hah' => 559, + 'jg=hamzaonhehgoal' => 560, + 'jg=hanifirohingyakinnaya' => 561, + 'jg=hanifirohingyapa' => 562, + 'jg=he' => 563, + 'jg=heh' => 564, + 'jg=hehgoal' => 565, + 'jg=heth' => 566, + 'jg=kaf' => 567, + 'jg=kaph' => 568, + 'jg=khaph' => 
569, + 'jg=knottedheh' => 570, + 'jg=lam' => 571, + 'jg=lamadh' => 572, + 'jg=malayalambha' => 573, + 'jg=malayalamja' => 574, + 'jg=malayalamlla' => 575, + 'jg=malayalamllla' => 576, + 'jg=malayalamnga' => 577, + 'jg=malayalamnna' => 578, + 'jg=malayalamnnna' => 579, + 'jg=malayalamnya' => 580, + 'jg=malayalamra' => 581, + 'jg=malayalamssa' => 582, + 'jg=malayalamtta' => 583, + 'jg=manichaeanaleph' => 584, + 'jg=manichaeanayin' => 585, + 'jg=manichaeanbeth' => 586, + 'jg=manichaeandaleth' => 587, + 'jg=manichaeandhamedh' => 588, + 'jg=manichaeanfive' => 589, + 'jg=manichaeangimel' => 590, + 'jg=manichaeanheth' => 591, + 'jg=manichaeanhundred' => 592, + 'jg=manichaeankaph' => 593, + 'jg=manichaeanlamedh' => 594, + 'jg=manichaeanmem' => 595, + 'jg=manichaeannun' => 596, + 'jg=manichaeanone' => 597, + 'jg=manichaeanpe' => 598, + 'jg=manichaeanqoph' => 599, + 'jg=manichaeanresh' => 600, + 'jg=manichaeansadhe' => 601, + 'jg=manichaeansamekh' => 602, + 'jg=manichaeantaw' => 603, + 'jg=manichaeanten' => 604, + 'jg=manichaeanteth' => 605, + 'jg=manichaeanthamedh' => 606, + 'jg=manichaeantwenty' => 607, + 'jg=manichaeanwaw' => 608, + 'jg=manichaeanyodh' => 609, + 'jg=manichaeanzayin' => 610, + 'jg=meem' => 611, + 'jg=mim' => 612, + 'jg=nojoininggroup' => 613, + 'jg=noon' => 614, + 'jg=nun' => 615, + 'jg=nya' => 616, + 'jg=pe' => 617, + 'jg=qaf' => 618, + 'jg=qaph' => 619, + 'jg=reh' => 620, + 'jg=reversedpe' => 621, + 'jg=rohingyayeh' => 622, + 'jg=sad' => 623, + 'jg=sadhe' => 624, + 'jg=seen' => 625, + 'jg=semkath' => 626, + 'jg=shin' => 627, + 'jg=straightwaw' => 628, + 'jg=swashkaf' => 629, + 'jg=syriacwaw' => 630, + 'jg=tah' => 631, + 'jg=taw' => 632, + 'jg=tehmarbuta' => 633, + 'jg=teth' => 634, + 'jg=waw' => 635, + 'jg=yeh' => 636, + 'jg=yehbarree' => 637, + 'jg=yehwithtail' => 638, + 'jg=yudh' => 639, + 'jg=yudhhe' => 640, + 'jg=zain' => 641, + 'jg=zhain' => 642, + 'joinc' => 643, + 'jt=c' => 644, + 'jt=d' => 645, + 'jt=l' => 646, + 'jt=r' => 647, + 'jt=t' => 648, + 
'jt=u' => 649, + 'kali' => 650, + 'kana' => 651, + 'kanaexta' => 652, + 'kanasup' => 653, + 'kanbun' => 654, + 'kangxi' => 655, + 'katakanaext' => 656, + 'khar' => 657, + 'khmersymbols' => 658, + 'khmr' => 659, + 'khoj' => 660, + 'kits' => 661, + 'knda' => 662, + 'kthi' => 663, + 'l' => 664, 'l_' => 96, 'l_amp_' => 96, - 'lana' => 652, - 'lao' => 653, - 'latin1' => 654, - 'latinexta' => 655, - 'latinextadditional' => 656, - 'latinextb' => 657, - 'latinextc' => 658, - 'latinextd' => 659, - 'latinexte' => 660, - 'latn' => 661, - 'lb=ai' => 662, - 'lb=al' => 663, - 'lb=b2' => 664, - 'lb=ba' => 665, - 'lb=bb' => 666, - 'lb=bk' => 667, - 'lb=cb' => 668, - 'lb=cj' => 669, - 'lb=cl' => 670, - 'lb=cm' => 671, - 'lb=cp' => 672, - 'lb=cr' => 673, - 'lb=ex' => 674, - 'lb=gl' => 675, - 'lb=h2' => 676, - 'lb=h3' => 677, - 'lb=hl' => 678, - 'lb=hy' => 679, - 'lb=id' => 680, - 'lb=in' => 681, - 'lb=is' => 682, - 'lb=lf' => 683, - 'lb=nl' => 684, - 'lb=ns' => 685, - 'lb=nu' => 686, - 'lb=op' => 687, - 'lb=po' => 688, - 'lb=pr' => 689, - 'lb=qu' => 690, - 'lb=sa' => 691, - 'lb=sg_perl_aux' => 692, - 'lb=sp' => 693, - 'lb=sy' => 694, - 'lb=wj' => 695, - 'lb=xx' => 696, - 'lb=zw' => 697, - 'lb=zwj' => 698, + 'lana' => 665, + 'lao' => 666, + 'latin1' => 667, + 'latinexta' => 668, + 'latinextadditional' => 669, + 'latinextb' => 670, + 'latinextc' => 671, + 'latinextd' => 672, + 'latinexte' => 673, + 'latn' => 674, + 'lb=ai' => 675, + 'lb=al' => 676, + 'lb=b2' => 677, + 'lb=ba' => 678, + 'lb=bb' => 679, + 'lb=bk' => 680, + 'lb=cb' => 681, + 'lb=cj' => 682, + 'lb=cl' => 683, + 'lb=cm' => 684, + 'lb=cp' => 685, + 'lb=cr' => 686, + 'lb=ex' => 687, + 'lb=gl' => 688, + 'lb=h2' => 689, + 'lb=h3' => 690, + 'lb=hl' => 691, + 'lb=hy' => 692, + 'lb=id' => 693, + 'lb=in' => 694, + 'lb=is' => 695, + 'lb=lf' => 696, + 'lb=nl' => 697, + 'lb=ns' => 698, + 'lb=nu' => 699, + 'lb=op' => 700, + 'lb=po' => 701, + 'lb=pr' => 702, + 'lb=qu' => 703, + 'lb=sa' => 704, + 'lb=sg_perl_aux' => 705, + 'lb=sp' => 
706, + 'lb=sy' => 707, + 'lb=wj' => 708, + 'lb=xx' => 709, + 'lb=zw' => 710, + 'lb=zwj' => 711, 'lc' => 96, - 'lepc' => 699, - 'letterlikesymbols' => 700, - 'limb' => 701, - 'lina' => 702, - 'linb' => 703, - 'linearbideograms' => 704, - 'linearbsyllabary' => 705, - 'lisu' => 706, - 'lisusup' => 707, - 'll' => 711, - 'lm' => 708, - 'lo' => 709, - 'loe' => 710, - 'lower' => 1154, - 'lowercase' => 1154, - 'lowercaseletter' => 711, - 'lowsurrogates' => 712, - 'lt' => 1111, - 'lu' => 1117, - 'lyci' => 713, - 'lydi' => 714, - 'm' => 715, - 'mahj' => 716, - 'mahjong' => 717, - 'maka' => 718, - 'mand' => 719, - 'mani' => 720, - 'marc' => 721, - 'math' => 722, - 'mathalphanum' => 723, - 'mathoperators' => 724, - 'mayannumerals' => 725, - 'mc' => 726, - 'me' => 727, - 'medf' => 728, - 'meeteimayekext' => 729, - 'mend' => 730, - 'merc' => 731, - 'mero' => 732, - 'miao' => 733, - 'miscarrows' => 734, - 'miscmathsymbolsa' => 735, - 'miscmathsymbolsb' => 736, - 'miscpictographs' => 737, - 'miscsymbols' => 738, - 'misctechnical' => 739, - 'mlym' => 740, - 'mn' => 741, - 'modi' => 742, - 'modifierletters' => 743, - 'modifiertoneletters' => 744, - 'mong' => 745, - 'mongoliansup' => 746, - 'mro' => 747, - 'mtei' => 748, - 'mult' => 749, - 'music' => 750, - 'myanmarexta' => 751, - 'myanmarextb' => 752, - 'mymr' => 753, - 'n' => 754, - 'nand' => 755, - 'narb' => 756, - 'nb' => 757, - 'nbat' => 758, - 'nd' => 1152, - 'newa' => 759, - 'nfcqc=m' => 760, - 'nfcqc=y' => 761, - 'nfdqc=y' => 762, - 'nfkcqc=n' => 763, - 'nfkcqc=y' => 764, - 'nfkdqc=n' => 765, - 'nko' => 766, - 'nl' => 767, - 'no' => 768, - 'nshu' => 769, - 'nt=di' => 770, - 'nt=nu' => 771, - 'numberforms' => 772, - 'nv=0' => 773, - 'nv=1' => 774, - 'nv=1/10' => 799, - 'nv=1/12' => 800, - 'nv=1/16' => 801, - 'nv=1/160' => 802, - 'nv=1/2' => 803, - 'nv=1/20' => 804, - 'nv=1/3' => 805, - 'nv=1/32' => 806, - 'nv=1/320' => 807, - 'nv=1/4' => 808, - 'nv=1/40' => 809, - 'nv=1/5' => 810, - 'nv=1/6' => 811, - 'nv=1/64' => 812, - 
'nv=1/7' => 813, - 'nv=1/8' => 814, - 'nv=1/80' => 815, - 'nv=1/9' => 816, - 'nv=10' => 775, - 'nv=100' => 776, - 'nv=1000' => 777, - 'nv=10000' => 778, - 'nv=100000' => 779, - 'nv=1000000' => 780, - 'nv=10000000' => 781, - 'nv=100000000' => 782, - 'nv=10000000000' => 783, - 'nv=1000000000000' => 784, - 'nv=11' => 785, - 'nv=11/12' => 786, - 'nv=11/2' => 787, - 'nv=12' => 788, - 'nv=13' => 789, - 'nv=13/2' => 790, - 'nv=14' => 791, - 'nv=15' => 792, - 'nv=15/2' => 793, - 'nv=16' => 794, - 'nv=17' => 795, - 'nv=17/2' => 796, - 'nv=18' => 797, - 'nv=19' => 798, - 'nv=2' => 817, - 'nv=2/3' => 834, - 'nv=2/5' => 835, - 'nv=20' => 818, - 'nv=200' => 819, - 'nv=2000' => 820, - 'nv=20000' => 821, - 'nv=200000' => 822, - 'nv=20000000' => 823, - 'nv=21' => 824, - 'nv=216000' => 825, - 'nv=22' => 826, - 'nv=23' => 827, - 'nv=24' => 828, - 'nv=25' => 829, - 'nv=26' => 830, - 'nv=27' => 831, - 'nv=28' => 832, - 'nv=29' => 833, - 'nv=3' => 836, - 'nv=3/16' => 851, - 'nv=3/2' => 852, - 'nv=3/20' => 853, - 'nv=3/4' => 854, - 'nv=3/5' => 855, - 'nv=3/64' => 856, - 'nv=3/8' => 857, - 'nv=3/80' => 858, - 'nv=30' => 837, - 'nv=300' => 838, - 'nv=3000' => 839, - 'nv=30000' => 840, - 'nv=300000' => 841, - 'nv=31' => 842, - 'nv=32' => 843, - 'nv=33' => 844, - 'nv=34' => 845, - 'nv=35' => 846, - 'nv=36' => 847, - 'nv=37' => 848, - 'nv=38' => 849, - 'nv=39' => 850, - 'nv=4' => 859, - 'nv=4/5' => 875, - 'nv=40' => 860, - 'nv=400' => 861, - 'nv=4000' => 862, - 'nv=40000' => 863, - 'nv=400000' => 864, - 'nv=41' => 865, - 'nv=42' => 866, - 'nv=43' => 867, - 'nv=432000' => 868, - 'nv=44' => 869, - 'nv=45' => 870, - 'nv=46' => 871, - 'nv=47' => 872, - 'nv=48' => 873, - 'nv=49' => 874, - 'nv=5' => 876, - 'nv=5/12' => 882, - 'nv=5/2' => 883, - 'nv=5/6' => 884, - 'nv=5/8' => 885, - 'nv=50' => 877, - 'nv=500' => 878, - 'nv=5000' => 879, - 'nv=50000' => 880, - 'nv=500000' => 881, - 'nv=6' => 886, - 'nv=60' => 887, - 'nv=600' => 888, - 'nv=6000' => 889, - 'nv=60000' => 890, - 'nv=600000' => 891, - 
'nv=7' => 892, - 'nv=7/12' => 898, - 'nv=7/2' => 899, - 'nv=7/8' => 900, - 'nv=70' => 893, - 'nv=700' => 894, - 'nv=7000' => 895, - 'nv=70000' => 896, - 'nv=700000' => 897, - 'nv=8' => 901, - 'nv=80' => 902, - 'nv=800' => 903, - 'nv=8000' => 904, - 'nv=80000' => 905, - 'nv=800000' => 906, - 'nv=9' => 907, - 'nv=9/2' => 913, - 'nv=90' => 908, - 'nv=900' => 909, - 'nv=9000' => 910, - 'nv=90000' => 911, - 'nv=900000' => 912, - 'nv=_minus_1/2' => 915, - 'nv=nan' => 914, - 'ocr' => 916, - 'ogam' => 917, - 'olck' => 918, - 'orkh' => 919, - 'ornamentaldingbats' => 920, - 'orya' => 921, - 'osge' => 922, - 'osma' => 923, - 'ottomansiyaqnumbers' => 924, - 'p' => 925, - 'palm' => 926, - 'patsyn' => 927, - 'pauc' => 928, - 'pc' => 929, - 'pcm' => 930, - 'pd' => 931, - 'pe' => 932, - 'perlspace' => 954, - 'perlword' => 956, - 'perm' => 933, - 'pf' => 934, - 'phag' => 935, - 'phaistos' => 936, - 'phli' => 937, - 'phlp' => 938, - 'phnx' => 939, - 'phoneticext' => 940, - 'phoneticextsup' => 941, - 'pi' => 942, - 'playingcards' => 943, - 'po' => 944, - 'posixalnum' => 945, - 'posixalpha' => 946, - 'posixblank' => 947, - 'posixcntrl' => 948, - 'posixdigit' => 949, - 'posixgraph' => 950, - 'posixlower' => 951, - 'posixprint' => 952, - 'posixpunct' => 953, - 'posixspace' => 954, - 'posixupper' => 955, - 'posixword' => 956, - 'posixxdigit' => 957, - 'print' => 1155, - 'prti' => 958, - 'ps' => 959, - 'pua' => 960, - 'qaai' => 961, - 'qmark' => 962, - 'radical' => 963, - 'ri' => 964, - 'rjng' => 965, - 'rohg' => 966, - 'rumi' => 967, - 'runr' => 968, - 's' => 969, - 'samr' => 970, - 'sarb' => 971, - 'saur' => 972, - 'sb=at' => 973, - 'sb=cl' => 974, - 'sb=ex' => 975, - 'sb=fo' => 976, - 'sb=le' => 977, - 'sb=lo' => 978, - 'sb=nu' => 979, - 'sb=sc' => 980, - 'sb=se' => 981, - 'sb=sp' => 982, - 'sb=st' => 983, - 'sb=up' => 984, - 'sb=xx' => 985, - 'sc' => 986, - 'sc=adlm' => 987, - 'sc=arab' => 988, - 'sc=beng' => 989, - 'sc=bopo' => 990, - 'sc=bugi' => 991, - 'sc=buhd' => 992, - 'sc=cakm' 
=> 993, - 'sc=copt' => 994, - 'sc=cprt' => 995, - 'sc=cyrl' => 996, - 'sc=deva' => 997, - 'sc=dogr' => 998, - 'sc=dupl' => 999, - 'sc=geor' => 1000, - 'sc=glag' => 1001, - 'sc=gong' => 1002, - 'sc=gonm' => 1003, - 'sc=gran' => 1004, - 'sc=grek' => 1005, - 'sc=gujr' => 1006, - 'sc=guru' => 1007, - 'sc=han' => 1008, - 'sc=hang' => 1009, - 'sc=hano' => 1010, - 'sc=hira' => 1011, - 'sc=java' => 1012, - 'sc=kali' => 1013, - 'sc=kana' => 1014, - 'sc=khoj' => 1015, - 'sc=knda' => 1016, - 'sc=kthi' => 1017, - 'sc=latn' => 1018, - 'sc=limb' => 1019, - 'sc=lina' => 1020, - 'sc=linb' => 1021, - 'sc=mahj' => 1022, - 'sc=mand' => 1023, - 'sc=mani' => 1024, - 'sc=mlym' => 1025, - 'sc=modi' => 1026, - 'sc=mong' => 1027, - 'sc=mult' => 1028, - 'sc=mymr' => 1029, - 'sc=nand' => 1030, - 'sc=orya' => 1031, - 'sc=perm' => 1032, - 'sc=phag' => 1033, - 'sc=phlp' => 1034, - 'sc=qaai' => 1035, - 'sc=rohg' => 1036, - 'sc=shrd' => 1037, - 'sc=sind' => 1038, - 'sc=sinh' => 1039, - 'sc=sogd' => 1040, - 'sc=sylo' => 1041, - 'sc=syrc' => 1042, - 'sc=tagb' => 1043, - 'sc=takr' => 1044, - 'sc=tale' => 1045, - 'sc=taml' => 1046, - 'sc=telu' => 1047, - 'sc=tglg' => 1048, - 'sc=thaa' => 1049, - 'sc=tirh' => 1050, - 'sc=yezi' => 1051, - 'sc=yi' => 1052, - 'sc=zyyy' => 1053, - 'sd' => 1054, - 'sgnw' => 1055, - 'shaw' => 1056, - 'shorthandformatcontrols' => 1057, - 'shrd' => 1058, - 'sidd' => 1059, - 'sind' => 1060, - 'sinh' => 1061, - 'sinhalaarchaicnumbers' => 1062, - 'sk' => 1063, - 'sm' => 1064, - 'smallforms' => 1065, - 'smallkanaext' => 1066, - 'so' => 1067, - 'sogd' => 1068, - 'sogo' => 1069, - 'sora' => 1070, - 'soyo' => 1071, - 'space' => 1157, - 'spaceperl' => 1157, - 'specials' => 1072, - 'sterm' => 1073, - 'sund' => 1074, - 'sundanesesup' => 1075, - 'suparrowsa' => 1076, - 'suparrowsb' => 1077, - 'suparrowsc' => 1078, - 'superandsub' => 1079, - 'supmathoperators' => 1080, - 'suppuaa' => 1081, - 'suppuab' => 1082, - 'suppunctuation' => 1083, - 'supsymbolsandpictographs' => 1084, - 
'suttonsignwriting' => 1085, - 'sylo' => 1086, - 'symbolsandpictographsexta' => 1087, - 'symbolsforlegacycomputing' => 1088, - 'syrc' => 1089, - 'syriacsup' => 1090, - 'tagb' => 1091, - 'tags' => 1092, - 'taixuanjing' => 1093, - 'takr' => 1094, - 'tale' => 1095, - 'talu' => 1096, - 'tamilsup' => 1097, - 'taml' => 1098, - 'tang' => 1099, - 'tangutcomponents' => 1100, - 'tangutsup' => 1101, - 'tavt' => 1102, - 'telu' => 1103, - 'term' => 1104, - 'tfng' => 1105, - 'tglg' => 1106, - 'thaa' => 1107, - 'thai' => 1108, - 'tibt' => 1109, - 'tirh' => 1110, - 'title' => 1111, - 'titlecase' => 1111, - 'titlecaseletter' => 1111, - 'transportandmap' => 1112, - 'ucas' => 1113, - 'ucasext' => 1114, - 'ugar' => 1115, - 'uideo' => 1116, - 'upper' => 1158, - 'uppercase' => 1158, - 'uppercaseletter' => 1117, - 'vai' => 1118, - 'vedicext' => 1119, - 'verticalforms' => 1120, - 'vertspace' => 1121, - 'vo=r' => 1122, - 'vo=tr' => 1123, - 'vo=tu' => 1124, - 'vo=u' => 1125, - 'vs' => 1126, - 'vssup' => 1127, - 'wara' => 1128, - 'wb=dq' => 1129, - 'wb=eb' => 1130, - 'wb=ex' => 1131, - 'wb=extend' => 1132, - 'wb=fo' => 1133, - 'wb=ka' => 1134, - 'wb=le' => 1135, - 'wb=mb' => 1136, - 'wb=ml' => 1137, - 'wb=mn' => 1138, - 'wb=nl' => 1139, - 'wb=nu' => 1140, - 'wb=sq' => 1141, - 'wb=wsegspace' => 1142, - 'wb=xx' => 1143, - 'wcho' => 1144, - 'whitespace' => 1157, - 'word' => 1159, - 'wspace' => 1157, - 'xdigit' => 1160, - 'xidc' => 1145, - 'xids' => 1146, - 'xpeo' => 1147, - 'xperlspace' => 1157, - 'xposixalnum' => 1148, - 'xposixalpha' => 1149, - 'xposixblank' => 1150, - 'xposixcntrl' => 1151, - 'xposixdigit' => 1152, - 'xposixgraph' => 1153, - 'xposixlower' => 1154, - 'xposixprint' => 1155, - 'xposixpunct' => 1156, - 'xposixspace' => 1157, - 'xposixupper' => 1158, - 'xposixword' => 1159, - 'xposixxdigit' => 1160, - 'xsux' => 1161, - 'yezi' => 1162, - 'yi' => 1163, - 'yijing' => 1164, - 'yiradicals' => 1165, - 'yisyllables' => 1166, - 'z' => 1167, - 'zanb' => 1168, - 'zl' => 1169, - 'zp' => 
1170, - 'zs' => 1171, - 'zyyy' => 1172, - 'zzzz' => 1173, + 'lepc' => 712, + 'letterlikesymbols' => 713, + 'limb' => 714, + 'lina' => 715, + 'linb' => 716, + 'linearbideograms' => 717, + 'linearbsyllabary' => 718, + 'lisu' => 719, + 'lisusup' => 720, + 'll' => 724, + 'lm' => 721, + 'lo' => 722, + 'loe' => 723, + 'lower' => 1167, + 'lowercase' => 1167, + 'lowercaseletter' => 724, + 'lowsurrogates' => 725, + 'lt' => 1124, + 'lu' => 1130, + 'lyci' => 726, + 'lydi' => 727, + 'm' => 728, + 'mahj' => 729, + 'mahjong' => 730, + 'maka' => 731, + 'mand' => 732, + 'mani' => 733, + 'marc' => 734, + 'math' => 735, + 'mathalphanum' => 736, + 'mathoperators' => 737, + 'mayannumerals' => 738, + 'mc' => 739, + 'me' => 740, + 'medf' => 741, + 'meeteimayekext' => 742, + 'mend' => 743, + 'merc' => 744, + 'mero' => 745, + 'miao' => 746, + 'miscarrows' => 747, + 'miscmathsymbolsa' => 748, + 'miscmathsymbolsb' => 749, + 'miscpictographs' => 750, + 'miscsymbols' => 751, + 'misctechnical' => 752, + 'mlym' => 753, + 'mn' => 754, + 'modi' => 755, + 'modifierletters' => 756, + 'modifiertoneletters' => 757, + 'mong' => 758, + 'mongoliansup' => 759, + 'mro' => 760, + 'mtei' => 761, + 'mult' => 762, + 'music' => 763, + 'myanmarexta' => 764, + 'myanmarextb' => 765, + 'mymr' => 766, + 'n' => 767, + 'nand' => 768, + 'narb' => 769, + 'nb' => 770, + 'nbat' => 771, + 'nd' => 1165, + 'newa' => 772, + 'nfcqc=m' => 773, + 'nfcqc=y' => 774, + 'nfdqc=y' => 775, + 'nfkcqc=n' => 776, + 'nfkcqc=y' => 777, + 'nfkdqc=n' => 778, + 'nko' => 779, + 'nl' => 780, + 'no' => 781, + 'nshu' => 782, + 'nt=di' => 783, + 'nt=nu' => 784, + 'numberforms' => 785, + 'nv=0' => 786, + 'nv=1' => 787, + 'nv=1/10' => 812, + 'nv=1/12' => 813, + 'nv=1/16' => 814, + 'nv=1/160' => 815, + 'nv=1/2' => 816, + 'nv=1/20' => 817, + 'nv=1/3' => 818, + 'nv=1/32' => 819, + 'nv=1/320' => 820, + 'nv=1/4' => 821, + 'nv=1/40' => 822, + 'nv=1/5' => 823, + 'nv=1/6' => 824, + 'nv=1/64' => 825, + 'nv=1/7' => 826, + 'nv=1/8' => 827, + 'nv=1/80' => 828, 
+ 'nv=1/9' => 829, + 'nv=10' => 788, + 'nv=100' => 789, + 'nv=1000' => 790, + 'nv=10000' => 791, + 'nv=100000' => 792, + 'nv=1000000' => 793, + 'nv=10000000' => 794, + 'nv=100000000' => 795, + 'nv=10000000000' => 796, + 'nv=1000000000000' => 797, + 'nv=11' => 798, + 'nv=11/12' => 799, + 'nv=11/2' => 800, + 'nv=12' => 801, + 'nv=13' => 802, + 'nv=13/2' => 803, + 'nv=14' => 804, + 'nv=15' => 805, + 'nv=15/2' => 806, + 'nv=16' => 807, + 'nv=17' => 808, + 'nv=17/2' => 809, + 'nv=18' => 810, + 'nv=19' => 811, + 'nv=2' => 830, + 'nv=2/3' => 847, + 'nv=2/5' => 848, + 'nv=20' => 831, + 'nv=200' => 832, + 'nv=2000' => 833, + 'nv=20000' => 834, + 'nv=200000' => 835, + 'nv=20000000' => 836, + 'nv=21' => 837, + 'nv=216000' => 838, + 'nv=22' => 839, + 'nv=23' => 840, + 'nv=24' => 841, + 'nv=25' => 842, + 'nv=26' => 843, + 'nv=27' => 844, + 'nv=28' => 845, + 'nv=29' => 846, + 'nv=3' => 849, + 'nv=3/16' => 864, + 'nv=3/2' => 865, + 'nv=3/20' => 866, + 'nv=3/4' => 867, + 'nv=3/5' => 868, + 'nv=3/64' => 869, + 'nv=3/8' => 870, + 'nv=3/80' => 871, + 'nv=30' => 850, + 'nv=300' => 851, + 'nv=3000' => 852, + 'nv=30000' => 853, + 'nv=300000' => 854, + 'nv=31' => 855, + 'nv=32' => 856, + 'nv=33' => 857, + 'nv=34' => 858, + 'nv=35' => 859, + 'nv=36' => 860, + 'nv=37' => 861, + 'nv=38' => 862, + 'nv=39' => 863, + 'nv=4' => 872, + 'nv=4/5' => 888, + 'nv=40' => 873, + 'nv=400' => 874, + 'nv=4000' => 875, + 'nv=40000' => 876, + 'nv=400000' => 877, + 'nv=41' => 878, + 'nv=42' => 879, + 'nv=43' => 880, + 'nv=432000' => 881, + 'nv=44' => 882, + 'nv=45' => 883, + 'nv=46' => 884, + 'nv=47' => 885, + 'nv=48' => 886, + 'nv=49' => 887, + 'nv=5' => 889, + 'nv=5/12' => 895, + 'nv=5/2' => 896, + 'nv=5/6' => 897, + 'nv=5/8' => 898, + 'nv=50' => 890, + 'nv=500' => 891, + 'nv=5000' => 892, + 'nv=50000' => 893, + 'nv=500000' => 894, + 'nv=6' => 899, + 'nv=60' => 900, + 'nv=600' => 901, + 'nv=6000' => 902, + 'nv=60000' => 903, + 'nv=600000' => 904, + 'nv=7' => 905, + 'nv=7/12' => 911, + 'nv=7/2' => 912, + 
'nv=7/8' => 913, + 'nv=70' => 906, + 'nv=700' => 907, + 'nv=7000' => 908, + 'nv=70000' => 909, + 'nv=700000' => 910, + 'nv=8' => 914, + 'nv=80' => 915, + 'nv=800' => 916, + 'nv=8000' => 917, + 'nv=80000' => 918, + 'nv=800000' => 919, + 'nv=9' => 920, + 'nv=9/2' => 926, + 'nv=90' => 921, + 'nv=900' => 922, + 'nv=9000' => 923, + 'nv=90000' => 924, + 'nv=900000' => 925, + 'nv=_minus_1/2' => 928, + 'nv=nan' => 927, + 'ocr' => 929, + 'ogam' => 930, + 'olck' => 931, + 'orkh' => 932, + 'ornamentaldingbats' => 933, + 'orya' => 934, + 'osge' => 935, + 'osma' => 936, + 'ottomansiyaqnumbers' => 937, + 'p' => 938, + 'palm' => 939, + 'patsyn' => 940, + 'pauc' => 941, + 'pc' => 942, + 'pcm' => 943, + 'pd' => 944, + 'pe' => 945, + 'perlspace' => 967, + 'perlword' => 969, + 'perm' => 946, + 'pf' => 947, + 'phag' => 948, + 'phaistos' => 949, + 'phli' => 950, + 'phlp' => 951, + 'phnx' => 952, + 'phoneticext' => 953, + 'phoneticextsup' => 954, + 'pi' => 955, + 'playingcards' => 956, + 'po' => 957, + 'posixalnum' => 958, + 'posixalpha' => 959, + 'posixblank' => 960, + 'posixcntrl' => 961, + 'posixdigit' => 962, + 'posixgraph' => 963, + 'posixlower' => 964, + 'posixprint' => 965, + 'posixpunct' => 966, + 'posixspace' => 967, + 'posixupper' => 968, + 'posixword' => 969, + 'posixxdigit' => 970, + 'print' => 1168, + 'prti' => 971, + 'ps' => 972, + 'pua' => 973, + 'qaai' => 974, + 'qmark' => 975, + 'radical' => 976, + 'ri' => 977, + 'rjng' => 978, + 'rohg' => 979, + 'rumi' => 980, + 'runr' => 981, + 's' => 982, + 'samr' => 983, + 'sarb' => 984, + 'saur' => 985, + 'sb=at' => 986, + 'sb=cl' => 987, + 'sb=ex' => 988, + 'sb=fo' => 989, + 'sb=le' => 990, + 'sb=lo' => 991, + 'sb=nu' => 992, + 'sb=sc' => 993, + 'sb=se' => 994, + 'sb=sp' => 995, + 'sb=st' => 996, + 'sb=up' => 997, + 'sb=xx' => 998, + 'sc' => 999, + 'sc=adlm' => 1000, + 'sc=arab' => 1001, + 'sc=beng' => 1002, + 'sc=bopo' => 1003, + 'sc=bugi' => 1004, + 'sc=buhd' => 1005, + 'sc=cakm' => 1006, + 'sc=copt' => 1007, + 'sc=cprt' => 
1008, + 'sc=cyrl' => 1009, + 'sc=deva' => 1010, + 'sc=dogr' => 1011, + 'sc=dupl' => 1012, + 'sc=geor' => 1013, + 'sc=glag' => 1014, + 'sc=gong' => 1015, + 'sc=gonm' => 1016, + 'sc=gran' => 1017, + 'sc=grek' => 1018, + 'sc=gujr' => 1019, + 'sc=guru' => 1020, + 'sc=han' => 1021, + 'sc=hang' => 1022, + 'sc=hano' => 1023, + 'sc=hira' => 1024, + 'sc=java' => 1025, + 'sc=kali' => 1026, + 'sc=kana' => 1027, + 'sc=khoj' => 1028, + 'sc=knda' => 1029, + 'sc=kthi' => 1030, + 'sc=latn' => 1031, + 'sc=limb' => 1032, + 'sc=lina' => 1033, + 'sc=linb' => 1034, + 'sc=mahj' => 1035, + 'sc=mand' => 1036, + 'sc=mani' => 1037, + 'sc=mlym' => 1038, + 'sc=modi' => 1039, + 'sc=mong' => 1040, + 'sc=mult' => 1041, + 'sc=mymr' => 1042, + 'sc=nand' => 1043, + 'sc=orya' => 1044, + 'sc=perm' => 1045, + 'sc=phag' => 1046, + 'sc=phlp' => 1047, + 'sc=qaai' => 1048, + 'sc=rohg' => 1049, + 'sc=shrd' => 1050, + 'sc=sind' => 1051, + 'sc=sinh' => 1052, + 'sc=sogd' => 1053, + 'sc=sylo' => 1054, + 'sc=syrc' => 1055, + 'sc=tagb' => 1056, + 'sc=takr' => 1057, + 'sc=tale' => 1058, + 'sc=taml' => 1059, + 'sc=telu' => 1060, + 'sc=tglg' => 1061, + 'sc=thaa' => 1062, + 'sc=tirh' => 1063, + 'sc=yezi' => 1064, + 'sc=yi' => 1065, + 'sc=zyyy' => 1066, + 'sd' => 1067, + 'sgnw' => 1068, + 'shaw' => 1069, + 'shorthandformatcontrols' => 1070, + 'shrd' => 1071, + 'sidd' => 1072, + 'sind' => 1073, + 'sinh' => 1074, + 'sinhalaarchaicnumbers' => 1075, + 'sk' => 1076, + 'sm' => 1077, + 'smallforms' => 1078, + 'smallkanaext' => 1079, + 'so' => 1080, + 'sogd' => 1081, + 'sogo' => 1082, + 'sora' => 1083, + 'soyo' => 1084, + 'space' => 1170, + 'spaceperl' => 1170, + 'specials' => 1085, + 'sterm' => 1086, + 'sund' => 1087, + 'sundanesesup' => 1088, + 'suparrowsa' => 1089, + 'suparrowsb' => 1090, + 'suparrowsc' => 1091, + 'superandsub' => 1092, + 'supmathoperators' => 1093, + 'suppuaa' => 1094, + 'suppuab' => 1095, + 'suppunctuation' => 1096, + 'supsymbolsandpictographs' => 1097, + 'suttonsignwriting' => 1098, + 'sylo' => 1099, + 
'symbolsandpictographsexta' => 1100, + 'symbolsforlegacycomputing' => 1101, + 'syrc' => 1102, + 'syriacsup' => 1103, + 'tagb' => 1104, + 'tags' => 1105, + 'taixuanjing' => 1106, + 'takr' => 1107, + 'tale' => 1108, + 'talu' => 1109, + 'tamilsup' => 1110, + 'taml' => 1111, + 'tang' => 1112, + 'tangutcomponents' => 1113, + 'tangutsup' => 1114, + 'tavt' => 1115, + 'telu' => 1116, + 'term' => 1117, + 'tfng' => 1118, + 'tglg' => 1119, + 'thaa' => 1120, + 'thai' => 1121, + 'tibt' => 1122, + 'tirh' => 1123, + 'title' => 1124, + 'titlecase' => 1124, + 'titlecaseletter' => 1124, + 'transportandmap' => 1125, + 'ucas' => 1126, + 'ucasext' => 1127, + 'ugar' => 1128, + 'uideo' => 1129, + 'upper' => 1171, + 'uppercase' => 1171, + 'uppercaseletter' => 1130, + 'vai' => 1131, + 'vedicext' => 1132, + 'verticalforms' => 1133, + 'vertspace' => 1134, + 'vo=r' => 1135, + 'vo=tr' => 1136, + 'vo=tu' => 1137, + 'vo=u' => 1138, + 'vs' => 1139, + 'vssup' => 1140, + 'wara' => 1141, + 'wb=dq' => 1142, + 'wb=eb' => 1143, + 'wb=ex' => 1144, + 'wb=extend' => 1145, + 'wb=fo' => 1146, + 'wb=ka' => 1147, + 'wb=le' => 1148, + 'wb=mb' => 1149, + 'wb=ml' => 1150, + 'wb=mn' => 1151, + 'wb=nl' => 1152, + 'wb=nu' => 1153, + 'wb=sq' => 1154, + 'wb=wsegspace' => 1155, + 'wb=xx' => 1156, + 'wcho' => 1157, + 'whitespace' => 1170, + 'word' => 1172, + 'wspace' => 1170, + 'xdigit' => 1173, + 'xidc' => 1158, + 'xids' => 1159, + 'xpeo' => 1160, + 'xperlspace' => 1170, + 'xposixalnum' => 1161, + 'xposixalpha' => 1162, + 'xposixblank' => 1163, + 'xposixcntrl' => 1164, + 'xposixdigit' => 1165, + 'xposixgraph' => 1166, + 'xposixlower' => 1167, + 'xposixprint' => 1168, + 'xposixpunct' => 1169, + 'xposixspace' => 1170, + 'xposixupper' => 1171, + 'xposixword' => 1172, + 'xposixxdigit' => 1173, + 'xsux' => 1174, + 'yezi' => 1175, + 'yi' => 1176, + 'yijing' => 1177, + 'yiradicals' => 1178, + 'yisyllables' => 1179, + 'z' => 1180, + 'zanb' => 1181, + 'zl' => 1182, + 'zp' => 1183, + 'zs' => 1184, + 'zyyy' => 1185, + 'zzzz' => 
1186, ); 1; @@ -1247,6 +1260,8 @@ # 4f822ec7a9ebbb3138ad29bade8b9688d25b39c7a3c0b7431f01e7229e4fcb6e lib/unicore/EastAsianWidth.txt # fc535aa1047a70105ab9a22c2b4c3f363a2ff02fe48ebbc5eeb9873b2752ff0b lib/unicore/EquivalentUnifiedIdeograph.txt # b9c5158ce944d2fec57e0e4ecb716bdabfc3bdde73525f1772fe03f61a30d473 lib/unicore/HangulSyllableType.txt +# a8a51d020f05b3fdb5e05413acbf106bef49de2d5715f9725f9350d52373c544 lib/unicore/IdStatus.txt +# 48f6f91216cc9f9d5c3cd2b55d768b48dd6696400e1f4290eccd1ec81f5958da lib/unicore/IdType.txt # 69197b019fa5f2fb0d8c6ed1ed8acb9f2e8b5b8f45a947953ffa652f3bf54983 lib/unicore/IndicPositionalCategory.txt # 6604e2f0fde7428675364aa0006bc686b79488dcc60ae8cb29800af2be3352e8 lib/unicore/IndicSyllabicCategory.txt # 84ead63924aaa74b988b2eaf254a8733276ed108633ce2ef77a9ee1de7818162 lib/unicore/Jamo.txt @@ -1280,7 +1295,7 @@ # 0fea35394151afefbb4121b6380db1b480be6f9bafb4eba3382dc292dcf68526 lib/unicore/extracted/DLineBreak.txt # 6d4a8c945dd7db83ed617cbb7d937de7f4ecf016ff22970d846e996a7c9a2a5d lib/unicore/extracted/DNumType.txt # 5b7c14380d5cceeaffcfbc18db1ed936391d2af2d51f5a41f1a17b692c77e59b lib/unicore/extracted/DNumValues.txt -# eefd34f5f03191cb297d62f66273ca68efc972703f5323543427a9b285f28657 lib/unicore/mktables +# b546595bd9f4946e2997179652ff9a0d3ceef7833fbcc37524c1abf74363e73d lib/unicore/mktables # 50b85a67451145545a65cea370dab8d3444fbfe07e9c34cef560c5b7da9d3eef lib/unicore/version # 2680b9254eb236c5c090f11b149605043e8c8433661b96efc4a42fb4709342a5 regen/charset_translations.pl # 6bbad21de0848e0236b02f34f5fa0edd3cdae9ba8173cc9469a5513936b9e728 regen/mk_PL_charclass.pl |