summaryrefslogtreecommitdiff
path: root/testdata/testinput14
blob: 8a17ae733e01fc457732f88b799e6d0ca67a46fc (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# These test special UTF and UCP features of DFA matching. The output is
# different for the different widths.

#subject dfa

# ---------------------------------------------------- 
# These are a selection of the more comprehensive tests that are run for
# non-DFA matching.

/X/utf
    XX\x{d800}
    XX\x{d800}\=offset=3
    XX\x{d800}\=no_utf_check
    XX\x{da00}
    XX\x{da00}\=no_utf_check
    XX\x{dc00}
    XX\x{dc00}\=no_utf_check
    XX\x{de00}
    XX\x{de00}\=no_utf_check
    XX\x{dfff}
    XX\x{dfff}\=no_utf_check
    XX\x{110000}
    XX\x{d800}\x{1234}
          
/badutf/utf
    X\xdf
    XX\xef
    XXX\xef\x80
    X\xf7
    XX\xf7\x80
    XXX\xf7\x80\x80

/shortutf/utf
    XX\xdf\=ph
    XX\xef\=ph
    XX\xef\x80\=ph
    \xf7\=ph
    \xf7\x80\=ph
    
# ---------------------------------------------------- 
# UCP and casing tests - except for the first two, these will all fail in 8-bit
# mode because they are testing UCP without UTF and use characters > 255.

/\x{c1}/i,no_start_optimize
\= Expect no match
    \x{e1}

/\x{c1}+\x{e1}/iB,ucp
    \x{c1}\x{c1}\x{c1}
    \x{e1}\x{e1}\x{e1} 

/\x{120}\x{c1}/i,ucp,no_start_optimize
    \x{121}\x{e1}

/\x{120}\x{c1}/i,ucp
    \x{121}\x{e1}

/[^\x{120}]/i,no_start_optimize
    \x{121}

/[^\x{120}]/i,ucp,no_start_optimize
\= Expect no match
    \x{121}

/[^\x{120}]/i
    \x{121}

/[^\x{120}]/i,ucp
\= Expect no match
    \x{121}
    
/\x{120}{2}/i,ucp
    \x{121}\x{121}

/[^\x{120}]{2}/i,ucp
\= Expect no match
    \x{121}\x{121}

# ---------------------------------------------------- 

# End of testinput14