summary | refs | log | tree | commit | diff
path: root/unicode_constants.h
diff options
context:
space:
mode:
author: Karl Williamson <public@khwilliamson.com> 2012-10-03 16:35:00 -0600
committer: Karl Williamson <public@khwilliamson.com> 2012-10-09 11:16:05 -0600
commit: 0a982f06581f440016dd643d5e2c5585b9320c43 (patch)
tree: fb6550bd9cdd6b15ed9d124cad13bf16683607c2 /unicode_constants.h
parent: 8769f413b9f20a6cc3b610fc5fa588e3593b5295 (diff)
download: perl-0a982f06581f440016dd643d5e2c5585b9320c43.tar.gz
regcomp.c: Refactor join_exact() to handle all multi-char folds
Prior to this commit, join_exact() returned a delta for 3 problematic sequences, indicating that the minimum length they match is less than their nominal length. It turns out that this is needed for all multi-character fold sequences; our test suite just did not have the tests in it to show that. Tests that do show this will be added in a future commit, but code elsewhere must be fixed before they pass. regcomp.c
Diffstat (limited to 'unicode_constants.h')
-rw-r--r-- unicode_constants.h | 6
1 files changed, 2 insertions, 4 deletions
diff --git a/unicode_constants.h b/unicode_constants.h
index f28a7b727c..f4d3172b53 100644
--- a/unicode_constants.h
+++ b/unicode_constants.h
@@ -24,11 +24,9 @@
#define COMBINING_ACUTE_ACCENT_UTF8 "\xCC\x81" /* U+0301 */
#define COMBINING_DIAERESIS_UTF8 "\xCC\x88" /* U+0308 */
-#define GREEK_SMALL_LETTER_IOTA_UTF8_FIRST_BYTE 0xCE /* U+03B9 */
-#define GREEK_SMALL_LETTER_IOTA_UTF8_TAIL "\xB9" /* U+03B9 */
+#define GREEK_SMALL_LETTER_IOTA_UTF8 "\xCE\xB9" /* U+03B9 */
-#define GREEK_SMALL_LETTER_UPSILON_UTF8_FIRST_BYTE 0xCF /* U+03C5 */
-#define GREEK_SMALL_LETTER_UPSILON_UTF8_TAIL "\x85" /* U+03C5 */
+#define GREEK_SMALL_LETTER_UPSILON_UTF8 "\xCF\x85" /* U+03C5 */
#define HYPHEN_UTF8 "\xE2\x80\x90" /* U+2010 */
#define FIRST_SURROGATE_UTF8_FIRST_BYTE 0xED /* U+D800 */