summary | refs | log | tree | commit | diff
path: root/utf8.h
diff options
context:
space:
mode:
author: Jarkko Hietaniemi <jhi@iki.fi> 2000-10-25 18:52:30 +0000
committer: Jarkko Hietaniemi <jhi@iki.fi> 2000-10-25 18:52:30 +0000
commit: fcc8fcf67e5ea5f08178c9ac86509bc972ef38ff (patch)
tree: c1e1979344ade58a2413d5700ea4ecba54b6afbe /utf8.h
parent: 5bbb0b5ac8fdf0a5cc17b4f7b9199f9e3d7db4b6 (diff)
download: perl-fcc8fcf67e5ea5f08178c9ac86509bc972ef38ff.tar.gz
Allow poking holes at the UTF-8 decoding strictness.
p4raw-id: //depot/perl@7438
Diffstat (limited to 'utf8.h')
-rw-r--r-- utf8.h 13
1 files changed, 12 insertions, 1 deletions
diff --git a/utf8.h b/utf8.h
index 548d8212f5..dc93e95aa9 100644
--- a/utf8.h
+++ b/utf8.h
@@ -29,10 +29,21 @@ END_EXTERN_C
#define UTF8_MAXLEN 13 /* how wide can a single UTF8 encoded character become */
-#define IN_UTF8 (PL_curcop->op_private & HINT_UTF8)
+/* #define IN_UTF8 (PL_curcop->op_private & HINT_UTF8) */
#define IN_BYTE (PL_curcop->op_private & HINT_BYTE)
#define DO_UTF8(sv) (SvUTF8(sv) && !IN_BYTE)
+#define UTF8_ALLOW_CONTINUATION 0x0001
+#define UTF8_ALLOW_NON_CONTINUATION 0x0002
+#define UTF8_ALLOW_FE_FF 0x0004
+#define UTF8_ALLOW_SHORT 0x0008
+#define UTF8_ALLOW_SURROGATE 0x0010
+#define UTF8_ALLOW_BOM 0x0020
+#define UTF8_ALLOW_FFFF 0x0040
+#define UTF8_ALLOW_LONG 0x0080
+#define UTF8_ALLOW_ANY 0x00ff
+#define UTF8_CHECK_ONLY 0x0100
+
#define UTF8SKIP(s) PL_utf8skip[*(U8*)s]
#ifdef HAS_QUAD