diff options
author | Larry Wall <larry@wall.org> | 1998-07-24 05:44:33 +0000 |
---|---|---|
committer | Larry Wall <larry@wall.org> | 1998-07-24 05:44:33 +0000 |
commit | a0ed51b321531af4b47cce24205ab9656f043f0f (patch) | |
tree | 610356407b37a4041ea8bcaf44571579b2da5613 /regcomp.h | |
parent | 9332a1c1d80ded85a2b1f32b1c8968a35e3b0fbb (diff) | |
download | perl-a0ed51b321531af4b47cce24205ab9656f043f0f.tar.gz |
Here are the long-expected Unicode/UTF-8 modifications.
p4raw-id: //depot/utfperl@1651
Diffstat (limited to 'regcomp.h')
-rw-r--r-- | regcomp.h | 13 |
1 files changed, 8 insertions, 5 deletions
@@ -204,19 +204,22 @@ EXTCONST char varies[]; #else EXTCONST char varies[] = { BRANCH, BACK, STAR, PLUS, CURLY, CURLYX, REF, REFF, REFFL, - WHILEM, CURLYM, CURLYN, BRANCHJ, IFTHEN, SUSPEND, 0 + WHILEM, CURLYM, CURLYN, BRANCHJ, IFTHEN, SUSPEND, CLUMP, 0 }; #endif /* The following always have a length of 1. char* since we do strchr on it. */ +/* (Note that length 1 means "one character" under UTF8, not "one octet".) */ #ifndef DOINIT EXTCONST char simple[]; #else EXTCONST char simple[] = { - ANY, SANY, ANYOF, - ALNUM, ALNUML, NALNUM, NALNUML, - SPACE, SPACEL, NSPACE, NSPACEL, - DIGIT, NDIGIT, 0 + ANY, ANYUTF8, SANY, SANYUTF8, ANYOF, ANYOFUTF8, + ALNUM, ALNUMUTF8, ALNUML, ALNUMLUTF8, + NALNUM, NALNUMUTF8, NALNUML, NALNUMLUTF8, + SPACE, SPACEUTF8, SPACEL, SPACELUTF8, + NSPACE, NSPACEUTF8, NSPACEL, NSPACELUTF8, + DIGIT, DIGITUTF8, NDIGIT, NDIGITUTF8, 0 }; #endif |