summary | refs | log | tree | commit | diff
path: root/utf8.h
diff options
context:
space:
mode:
author: Karl Williamson <khw@cpan.org> 2014-06-28 21:43:02 -0600
committer: Karl Williamson <khw@cpan.org> 2014-07-09 08:04:52 -0600
commit: a17767184dd91d4cb8e0f020584a315c581d7b7a (patch)
tree: 12dbcf18fc35dd70760a43346e22c4c1d47ea9e5 /utf8.h
parent: cdf175f7f80eedf9ecae198d41dded383592465d (diff)
download: perl-a17767184dd91d4cb8e0f020584a315c581d7b7a.tar.gz
utf8.h: Add comment
Diffstat (limited to 'utf8.h')
-rw-r--r-- utf8.h 4
1 files changed, 3 insertions, 1 deletions
diff --git a/utf8.h b/utf8.h
index 2357fb009c..613389cc49 100644
--- a/utf8.h
+++ b/utf8.h
@@ -485,7 +485,9 @@ Perl's extended UTF-8 means we can have start bytes up to FF.
* U+10FFFF: \xF4\x8F\xBF\xBF \xF9\xA1\xBF\xBF\xBF max legal Unicode
* U+110000: \xF4\x90\x80\x80 \xF9\xA2\xA0\xA0\xA0
* U+110001: \xF4\x90\x80\x81 \xF9\xA2\xA0\xA0\xA1
- */
+ *
+ * BE AWARE that this test doesn't rule out malformed code points, in
+ * particular overlongs */
#ifdef EBCDIC /* Both versions assume well-formed UTF8 */
# define UTF8_IS_SUPER(s) (NATIVE_UTF8_TO_I8(* (U8*) (s)) >= 0xF9 \
&& (NATIVE_UTF8_TO_I8(* (U8*) (s)) > 0xF9 \