diff options
Diffstat (limited to 'testdata/testinput14')
-rw-r--r-- | testdata/testinput14 | 50 |
1 files changed, 47 insertions, 3 deletions
diff --git a/testdata/testinput14 b/testdata/testinput14 index f97f3ec..8a17ae7 100644 --- a/testdata/testinput14 +++ b/testdata/testinput14 @@ -1,9 +1,12 @@ -# These test special (mostly error) UTF features of DFA matching. They are a -# selection of the more comprehensive tests that are run for non-DFA matching. -# The output is different for the different widths. +# These test special UTF and UCP features of DFA matching. The output is +# different for the different widths. #subject dfa +# ---------------------------------------------------- +# These are a selection of the more comprehensive tests that are run for +# non-DFA matching. + /X/utf XX\x{d800} XX\x{d800}\=offset=3 @@ -33,5 +36,46 @@ XX\xef\x80\=ph \xf7\=ph \xf7\x80\=ph + +# ---------------------------------------------------- +# UCP and casing tests - except for the first two, these will all fail in 8-bit +# mode because they are testing UCP without UTF and use characters > 255. + +/\x{c1}/i,no_start_optimize +\= Expect no match + \x{e1} + +/\x{c1}+\x{e1}/iB,ucp + \x{c1}\x{c1}\x{c1} + \x{e1}\x{e1}\x{e1} + +/\x{120}\x{c1}/i,ucp,no_start_optimize + \x{121}\x{e1} + +/\x{120}\x{c1}/i,ucp + \x{121}\x{e1} + +/[^\x{120}]/i,no_start_optimize + \x{121} + +/[^\x{120}]/i,ucp,no_start_optimize +\= Expect no match + \x{121} + +/[^\x{120}]/i + \x{121} + +/[^\x{120}]/i,ucp +\= Expect no match + \x{121} + +/\x{120}{2}/i,ucp + \x{121}\x{121} + +/[^\x{120}]{2}/i,ucp +\= Expect no match + \x{121}\x{121} + +# ---------------------------------------------------- # End of testinput14 |