summaryrefslogtreecommitdiff
path: root/utfebcdic.h
diff options
context:
space:
mode:
authorKarl Williamson <khw@cpan.org>2021-06-14 12:32:41 -0600
committerKarl Williamson <khw@cpan.org>2021-08-07 05:14:43 -0600
commitfcd03d925b4b3a67a6162b516b3ea4194e92bc92 (patch)
treec3fceba9a87467207809454f8bb38f6cb8455855 /utfebcdic.h
parent36da1e17a35eb23f0d666ee29dbff5c7823cad4c (diff)
downloadperl-fcd03d925b4b3a67a6162b516b3ea4194e92bc92.tar.gz
utf8.h: Make a bit of EBCDIC known to ASCII
This info is needed in one other place; doing it here means only specifying it once.
Diffstat (limited to 'utfebcdic.h')
-rw-r--r--utfebcdic.h6
1 files changed, 1 insertions, 5 deletions
diff --git a/utfebcdic.h b/utfebcdic.h
index 56e268f302..1b9b35acf1 100644
--- a/utfebcdic.h
+++ b/utfebcdic.h
@@ -202,12 +202,8 @@ possible to UTF-8-encode a single code point in different ways, but that is
explicitly forbidden, and the shortest possible encoding should always be used
(and that is what Perl does). */
-/* It turns out that just this one number is sufficient to derive all the basic
- * macros for UTF-8 and UTF-EBCDIC. Everything follows from the fact that
- * there are 6 bits of real information in a UTF-8 continuation byte vs. 5 bits
- * in a UTF-EBCDIC one. */
+#define UTF_CONTINUATION_BYTE_INFO_BITS UTF_EBCDIC_CONTINUATION_BYTE_INFO_BITS
-#define UTF_CONTINUATION_BYTE_INFO_BITS 5
/* Also needed is how perl handles a start byte of 8 one bits. The decision
* was made to just append the minimal number of bytes after that so that code
* points up to 64 bits wide could be represented. In UTF-8, that was an extra