summary | refs | log | tree | commit | diff
path: root/utfebcdic.h
diff options
context:
space:
mode:
author Karl Williamson <khw@cpan.org> 2019-10-02 20:37:17 -0600
committer Karl Williamson <khw@cpan.org> 2019-10-06 11:07:09 -0600
commit ab2e28c2f2b8f2edf930448a1c0182a8bd4f469f (patch)
tree 16c1c3220b88f335af9a3d93b43815dcfe1c43ac /utfebcdic.h
parent 2dc97505e86018c7ceba8c96fd84f477c8dd45d3 (diff)
download perl-ab2e28c2f2b8f2edf930448a1c0182a8bd4f469f.tar.gz
Make defn of UVCHR_IS_INVARIANT common
This can be derived from other values, removing an EBCDIC dependency
Diffstat (limited to 'utfebcdic.h')
-rw-r--r-- utfebcdic.h 12
1 files changed, 1 insertions, 11 deletions
diff --git a/utfebcdic.h b/utfebcdic.h
index 99a5bad5c3..d52d54a43f 100644
--- a/utfebcdic.h
+++ b/utfebcdic.h
@@ -202,17 +202,7 @@ possible to UTF-8-encode a single code point in different ways, but that is
explicitly forbidden, and the shortest possible encoding should always be used
(and that is what Perl does). */
-/* It turns out that on EBCDIC platforms, the invariants are the characters
- * that have ASCII equivalents, plus the C1 controls. Since the C0 controls
- * and DELETE are ASCII, this is the same as: (isASCII(uv) || isCNTRL_L1(uv))
- * */
-#define UVCHR_IS_INVARIANT(uv) cBOOL(FITS_IN_8_BITS(uv) \
- && (PL_charclass[(U8) (uv)] & (_CC_mask(_CC_ASCII) | _CC_mask(_CC_CNTRL))))
-
-/* UTF-EBCDIC semantic macros - We used to transform back into I8 and then
- * compare, but now only have to do a single lookup by using a bit in
- * l1_char_class_tab.h.
- * Comments as to the meaning of each are given at their corresponding utf8.h
+/* Comments as to the meaning of each are given at their corresponding utf8.h
* definitions. */
/* Equivalent to ! UVCHR_IS_INVARIANT(c) */
#define UTF8_IS_CONTINUED(c) cBOOL(FITS_IN_8_BITS(c) \