summary refs log tree commit diff
path: root/handy.h
diff options
context:
space:
mode:
author Karl Williamson <khw@cpan.org> 2015-05-15 14:23:12 -0600
committer Karl Williamson <khw@cpan.org> 2015-09-04 10:21:17 -0600
commit 073c22b3d2738ecdd785352b16b62ca94ab7074c (patch)
tree 0c802b7f46a2505fd37ea1ef1993e0d09e622c97 /handy.h
parent c93ea49efa21178588f8f466fb74da0fb52cdc41 (diff)
download perl-073c22b3d2738ecdd785352b16b62ca94ab7074c.tar.gz
l1_char_class_tab.h: Add bits for UTF-EBCDIC
This is for the next commit.
Diffstat (limited to 'handy.h')
-rw-r--r-- handy.h 12
1 files changed, 10 insertions, 2 deletions
diff --git a/handy.h b/handy.h
index c3fd77d456..6691e3ff76 100644
--- a/handy.h
+++ b/handy.h
@@ -962,14 +962,22 @@ patched there. The file as of this writing is cpan/Devel-PPPort/parts/inc/misc
# define _CC_NON_FINAL_FOLD 21
# define _CC_IS_IN_SOME_FOLD 22
# define _CC_MNEMONIC_CNTRL 23
-/* Unused: 24-31
+
+/* This next group is only used on EBCDIC platforms, so theoretically could be
+ * shared with something entirely different that's only on ASCII platforms */
+# define _CC_UTF8_IS_START 29
+# define _CC_UTF8_IS_DOWNGRADEABLE_START 30
+# define _CC_UTF8_IS_CONTINUATION 31
+/* Unused: 24-28
* If more bits are needed, one could add a second word for non-64bit
* QUAD_IS_INT systems, using some #ifdefs to distinguish between having a 2nd
* word or not. The IS_IN_SOME_FOLD bit is the most easily expendable, as it
* is used only for optimization (as of this writing), and differs in the
* Latin1 range from the ALPHA bit only in two relatively unimportant
* characters: the masculine and feminine ordinal indicators, so removing it
- * would just cause /i regexes which match them to run less efficiently */
+ * would just cause /i regexes which match them to run less efficiently.
+ * Similarly the EBCDIC-only bits are used just for speed, and could be
+ * replaced by other means */
#if defined(PERL_CORE) || defined(PERL_EXT)
/* An enum version of the character class numbers, to help compilers