diff options
author | Karl Williamson <khw@cpan.org> | 2017-11-18 09:35:25 -0700 |
---|---|---|
committer | Karl Williamson <khw@cpan.org> | 2017-11-18 09:47:16 -0700 |
commit | 9b79e9e3431d11e79a4f85268f70130b7b4369f6 (patch) | |
tree | a3f683a13b8f98680f9e5be0903b622e05ba3c16 | |
parent | 04f89ea7f30fbde4ccaefee940117aa6a27d5fd0 (diff) | |
download | perl-9b79e9e3431d11e79a4f85268f70130b7b4369f6.tar.gz |
PATCH: [perl #132463] perluniprops for \p{Word}
perluniprops was not updated to reflect the changes made to what
\p{Word} matches as of 5.18. What was added were the code points that
have the Join_Control property, which, so far, are only U+200C and
U+200D. This commit describes them as \p{Join_Control} instead of using
hard-coded code point numbers, so that if Unicode ever changes which code
points have that property, the description will automatically remain valid.
Thanks for spotting this.
-rw-r--r-- | charclass_invlists.h | 2 | ||||
-rw-r--r-- | lib/unicore/mktables | 3 | ||||
-rw-r--r-- | regcharclass.h | 2 |
3 files changed, 4 insertions, 3 deletions
diff --git a/charclass_invlists.h b/charclass_invlists.h index 1ae981214c..4eb26efa91 100644 --- a/charclass_invlists.h +++ b/charclass_invlists.h @@ -97454,7 +97454,7 @@ static const U8 WB_table[24][24] = { * be0f129691d479aa38646e4ca0ec1ee576ae7f75b0300a5624a7fa862fa8abba lib/unicore/extracted/DLineBreak.txt * 92449d354d9f6b6f2f97a292ebb59f6344ffdeb83d120d7d23e569c43ba67cd5 lib/unicore/extracted/DNumType.txt * e3a319527153b0c6c0c549b40fc6f3a01a7a0dcd6620784391db25901df3b154 lib/unicore/extracted/DNumValues.txt - * 409910af8e9ad2cba213c70f936a6c716494029a8346e8b55dd44275cc51d35d lib/unicore/mktables + * d905c655c0cc448f19894613ce87026dea667bb66c65937667424fc0afdc90c4 lib/unicore/mktables * 21653d2744fdd071f9ef138c805393901bb9547cf3e777ebf50215a191f986ea lib/unicore/version * 913d2f93f3cb6cdf1664db888bf840bc4eb074eef824e082fceda24a9445e60c regen/charset_translations.pl * 48418cbf454eb9ef35c73468ed5ef72ad8603490eabe74181ce4fae42ec72579 regen/mk_invlists.pl diff --git a/lib/unicore/mktables b/lib/unicore/mktables index 1386735e2f..200ae46d30 100644 --- a/lib/unicore/mktables +++ b/lib/unicore/mktables @@ -14499,7 +14499,8 @@ sub compile_perl() { my $Word = $perl->add_match_table('Word', Full_Name => 'XPosixWord', Description => '\w, including beyond ASCII;' - . ' = \p{Alnum} + \pM + \p{Pc}', + . ' = \p{Alnum} + \pM + \p{Pc}' + . 
' + \p{Join_Control}', Initialize => $Alnum + $gc->table('Mark'), ); my $Pc = $gc->table('Connector_Punctuation'); # 'Pc' Not in release 1 diff --git a/regcharclass.h b/regcharclass.h index 6b3e846aaa..38ddd84c55 100644 --- a/regcharclass.h +++ b/regcharclass.h @@ -1898,7 +1898,7 @@ * be0f129691d479aa38646e4ca0ec1ee576ae7f75b0300a5624a7fa862fa8abba lib/unicore/extracted/DLineBreak.txt * 92449d354d9f6b6f2f97a292ebb59f6344ffdeb83d120d7d23e569c43ba67cd5 lib/unicore/extracted/DNumType.txt * e3a319527153b0c6c0c549b40fc6f3a01a7a0dcd6620784391db25901df3b154 lib/unicore/extracted/DNumValues.txt - * 409910af8e9ad2cba213c70f936a6c716494029a8346e8b55dd44275cc51d35d lib/unicore/mktables + * d905c655c0cc448f19894613ce87026dea667bb66c65937667424fc0afdc90c4 lib/unicore/mktables * 21653d2744fdd071f9ef138c805393901bb9547cf3e777ebf50215a191f986ea lib/unicore/version * 913d2f93f3cb6cdf1664db888bf840bc4eb074eef824e082fceda24a9445e60c regen/charset_translations.pl * 9ea6338945a7d70e5ea4b31ac7856c0b521df96be002e94b4b3b7d31debbf3ab regen/regcharclass.pl |