diff options
author | Karl Williamson <khw@cpan.org> | 2015-05-15 14:23:12 -0600 |
---|---|---|
committer | Karl Williamson <khw@cpan.org> | 2015-09-04 10:21:17 -0600 |
commit | 073c22b3d2738ecdd785352b16b62ca94ab7074c (patch) | |
tree | 0c802b7f46a2505fd37ea1ef1993e0d09e622c97 /handy.h | |
parent | c93ea49efa21178588f8f466fb74da0fb52cdc41 (diff) | |
download | perl-073c22b3d2738ecdd785352b16b62ca94ab7074c.tar.gz |
l1_char_class_tab.h: Add bits for UTF-EBCDIC
This is for the next commit.
Diffstat (limited to 'handy.h')
-rw-r--r-- | handy.h | 12 |
1 files changed, 10 insertions, 2 deletions
```diff
@@ -962,14 +962,22 @@ patched there. The file as of this writing is cpan/Devel-PPPort/parts/inc/misc
 # define _CC_NON_FINAL_FOLD 21
 # define _CC_IS_IN_SOME_FOLD 22
 # define _CC_MNEMONIC_CNTRL 23
-/* Unused: 24-31
+
+/* This next group is only used on EBCDIC platforms, so theoretically could be
+ * shared with something entirely different that's only on ASCII platforms */
+# define _CC_UTF8_IS_START 29
+# define _CC_UTF8_IS_DOWNGRADEABLE_START 30
+# define _CC_UTF8_IS_CONTINUATION 31
+/* Unused: 24-28
  * If more bits are needed, one could add a second word for non-64bit
  * QUAD_IS_INT systems, using some #ifdefs to distinguish between having a 2nd
  * word or not. The IS_IN_SOME_FOLD bit is the most easily expendable, as it
  * is used only for optimization (as of this writing), and differs in the
  * Latin1 range from the ALPHA bit only in two relatively unimportant
  * characters: the masculine and feminine ordinal indicators, so removing it
- * would just cause /i regexes which match them to run less efficiently */
+ * would just cause /i regexes which match them to run less efficiently.
+ * Similarly the EBCDIC-only bits are used just for speed, and could be
+ * replaced by other means */
 
 #if defined(PERL_CORE) || defined(PERL_EXT)
 /* An enum version of the character class numbers, to help compilers
```