handy.h: Add bounds checking to case change arrays

This makes sure that the index into the arrays used to change between lower and upper case will fit into their bounds; returning an error character if not. The check is likely to be optimized out if the index is stored in 8 bits.
author: Karl Williamson <public@khwilliamson.com> 2010-08-31 20:20:01 -0600
committer: Rafael Garcia-Suarez <rgs@consttype.org> 2010-09-13 13:56:03 +0200
commit: 4125141464884619e852c7b0986a51eba8fe1636 (patch)
tree: d4393940bde6463ba49617a14b9900ac0e1a0998 /handy.h
parent: cf301eb7d17e4d58d25337e997b1c7b0133e3c91 (diff)
download: perl-4125141464884619e852c7b0986a51eba8fe1636.tar.gz
1 files changed, 13 insertions, 7 deletions
diff --git a/handy.h b/handy.h
index b46b844dba..a1d753dea8 100644
--- a/handy.h
+++ b/handy.h
@@ -528,9 +528,7 @@ patched there.  The file as of this writing is cpan/Devel-PPPort/parts/inc/misc
 #   define isPUNCT(c)	ispunct(c)
 #   define isXDIGIT(c)	isxdigit(c)
 #   define toUPPER(c)	toupper(c)
-#   define toUPPER_LATIN1_MOD(c)    UNI_TO_NATIVE(PL_mod_latin1_uc[(U8) NATIVE_TO_UNI(c)])
 #   define toLOWER(c)	tolower(c)
-#   define toLOWER_LATIN1(c)	UNI_TO_NATIVE(PL_latin1_lc[(U8) NATIVE_TO_UNI(c)])
 #else
 #   define isUPPER(c)	((c) >= 'A' && (c) <= 'Z')
 #   define isLOWER(c)	((c) >= 'a' && (c) <= 'z')
@@ -542,12 +540,20 @@ patched there.  The file as of this writing is cpan/Devel-PPPort/parts/inc/misc
 #   define isPUNCT(c)	(((c) >= 33 && (c) <= 47) || ((c) >= 58 && (c) <= 64)  || ((c) >= 91 && (c) <= 96) || ((c) >= 123 && (c) <= 126))
 #   define isXDIGIT(c)  (isDIGIT(c) || ((c) >= 'a' && (c) <= 'f') || ((c) >= 'A' && (c) <= 'F'))
 
-/* Use table lookup for speed */
-#   define toLOWER_LATIN1(c)	(PL_latin1_lc[(U8) c])
 
-/* Modified uc.  Is correct uc except for three non-ascii chars which are
- * all mapped to one of them, and these need special handling */
-#   define toUPPER_LATIN1_MOD(c)    (PL_mod_latin1_uc[(U8) c])
+    /* Use table lookup for speed; return error character for input
+     * out-of-range */
+#   define toLOWER_LATIN1(c)    (FITS_IN_8_BITS(c)                            \
+                                ? UNI_TO_NATIVE(PL_latin1_lc[                 \
+                                                  NATIVE_TO_UNI( (U8) (c)) ]) \
+                                : UNICODE_REPLACEMENT)
+    /* Modified uc.  Is correct uc except for three non-ascii chars which are
+     * all mapped to one of them, and these need special handling; error
+     * character for input out-of-range */
+#   define toUPPER_LATIN1_MOD(c) (FITS_IN_8_BITS(c)                           \
+                                 ? UNI_TO_NATIVE(PL_mod_latin1_uc[            \
+                                                  NATIVE_TO_UNI( (U8) (c)) ]) \
+                                 : UNICODE_REPLACEMENT)
 
 /* ASCII casing. */
 #   define toUPPER(c)	(isLOWER(c) ? (c) - ('a' - 'A') : (c))
author	Karl Williamson <public@khwilliamson.com>	2010-08-31 20:20:01 -0600
committer	Rafael Garcia-Suarez <rgs@consttype.org>	2010-09-13 13:56:03 +0200
commit	4125141464884619e852c7b0986a51eba8fe1636 (patch)
tree	d4393940bde6463ba49617a14b9900ac0e1a0998 /handy.h
parent	cf301eb7d17e4d58d25337e997b1c7b0133e3c91 (diff)
download	perl-4125141464884619e852c7b0986a51eba8fe1636.tar.gz