diff options
author | Nick Ing-Simmons <nik@tiuk.ti.com> | 2001-03-28 14:38:24 +0000 |
---|---|---|
committer | Nick Ing-Simmons <nik@tiuk.ti.com> | 2001-03-28 14:38:24 +0000 |
commit | daf0f78e031c718c75590ef9ef573756f805776e (patch) | |
tree | ef46cd2cf7cc422e43d555f69d103115c21cfce8 /t/op/utf8decode.t | |
parent | 30ff31546a6570f575cb35e80f834c872c5abdb1 (diff) | |
download | perl-daf0f78e031c718c75590ef9ef573756f805776e.tar.gz |
More EBCDIC tweaks:
- one more swash issue &~(0xA0-1) did not do the right thing,
for UTF-EBCDIC where &~(0x80-1) does for UTF-8.
- add "use re 'asciirange'" to make [!-~] etc. work
use it in MIME::QuotedPrint and t/op/regexp.t and t/op/pat.t
- Choose a key for t/op/each.t test which gets encoded.
- Skip utf8decode if this is UTF-EBCDIC.
p4raw-id: //depot/perlio@9400
Diffstat (limited to 't/op/utf8decode.t')
-rw-r--r-- | t/op/utf8decode.t | 20 |
1 files changed, 17 insertions, 3 deletions
diff --git a/t/op/utf8decode.t b/t/op/utf8decode.t index 4d05a6b8d3..824805d5df 100644 --- a/t/op/utf8decode.t +++ b/t/op/utf8decode.t @@ -3,6 +3,20 @@ BEGIN { chdir 't' if -d 't'; @INC = '../lib'; + +} + +{ + my $wide = v256; + use bytes; + print STDERR ord($wide),"\n"; + if (ord($wide) == 140) { + print "1..0 # Skip: UTF-EBCDIC (not UTF-8) used here\n"; + exit 0; + } + elsif (ord($wide) != 196) { + warn sprintf("v256 starts with %02X\n",ord($wide)); + } } no utf8; @@ -13,7 +27,7 @@ my $test = 1; # This table is based on Markus Kuhn's UTF-8 Decode Stress Tester, # http://www.cl.cam.ac.uk/~mgk25/ucs/examples/UTF-8-test.txt, -# version dated 2000-09-02. +# version dated 2000-09-02. # We use the \x notation instead of raw binary bytes for \x00-\x1f\x7f-\xff # because e.g. many patch programs have issues with binary data. @@ -21,7 +35,7 @@ my $test = 1; my @MK = split(/\n/, <<__EOMK__); 1 Correct UTF-8 1.1.1 y "\xce\xba\xe1\xbd\xb9\xcf\x83\xce\xbc\xce\xb5" - 11 ce:ba:e1:bd:b9:cf:83:ce:bc:ce:b5 5 -2 Boundary conditions +2 Boundary conditions 2.1 First possible sequence of certain length 2.1.1 y "\x00" 0 1 00 1 2.1.2 y "\xc2\x80" 80 2 c2:80 1 @@ -135,7 +149,7 @@ __EOMK__ sub moan { print "$id: @_"; } - + sub test_unpack_U { $WARNCNT = 0; $WARNMSG = ""; |