summary refs log tree commit diff
path: root/utf8.c
diff options
context:
space:
mode:
author Karl Williamson <public@khwilliamson.com> 2013-04-30 09:13:35 -0600
committer Karl Williamson <public@khwilliamson.com> 2013-08-29 09:56:08 -0600
commit bcb1a2d416c144271685cdf48af52ebbc3f267f8 (patch)
tree a00af5ea832eda3750b8cf4773a9a0ac5a02e44e /utf8.c
parent 2ae25f5c60ad0e9dc97213915f719f4f1b9053f1 (diff)
download perl-bcb1a2d416c144271685cdf48af52ebbc3f267f8.tar.gz
perlapi vis utf8.c: Nits
Diffstat (limited to 'utf8.c')
-rw-r--r-- utf8.c 9
1 files changed, 4 insertions, 5 deletions
diff --git a/utf8.c b/utf8.c
index e738801e13..3c9fc61c1c 100644
--- a/utf8.c
+++ b/utf8.c
@@ -125,7 +125,7 @@ UNICODE_WARN_SUPER and UNICODE_DISALLOW_SUPER flags, affect the handling of
code points that are
above the Unicode maximum of 0x10FFFF. Code points above 0x7FFF_FFFF (which are
even less portable) can be warned and/or disallowed even if other above-Unicode
-code points are accepted by the UNICODE_WARN_FE_FF and UNICODE_DISALLOW_FE_FF
+code points are accepted, by the UNICODE_WARN_FE_FF and UNICODE_DISALLOW_FE_FF
flags.
And finally, the flag UNICODE_WARN_ILLEGAL_INTERCHANGE selects all four of the
@@ -262,11 +262,10 @@ Perl_uvoffuni_to_utf8_flags(pTHX_ U8 *d, UV uv, UV flags)
#endif
#endif /* Non loop style */
}
-
/*
=for apidoc uvchr_to_utf8
-Adds the UTF-8 representation of the Native code point C<uv> to the end
+Adds the UTF-8 representation of the native code point C<uv> to the end
of the string C<d>; C<d> should have at least C<UTF8_MAXBYTES+1> free
bytes available. The return value is the pointer to the byte after the
end of the new character. In other words,
@@ -302,8 +301,8 @@ Perl_uvchr_to_utf8_flags(pTHX_ U8 *d, UV uv, UV flags)
/*
Tests if the first C<len> bytes of string C<s> form a valid UTF-8
-character. Note that an INVARIANT (i.e. ASCII) character is a valid
-UTF-8 character. The number of bytes in the UTF-8 character
+character. Note that an INVARIANT (i.e. ASCII on non-EBCDIC) character is a
+valid UTF-8 character. The number of bytes in the UTF-8 character
will be returned if it is valid, otherwise 0.
This is the "slow" version as opposed to the "fast" version which is