diff options
author | Lorry Tar Creator <lorry-tar-importer@lorry> | 2016-04-22 04:38:07 +0000 |
---|---|---|
committer | Lorry Tar Creator <lorry-tar-importer@lorry> | 2016-04-22 04:38:07 +0000 |
commit | 28ef1abc10cfbc2c3d2747c008eb2300858d0426 (patch) | |
tree | 41208fb8f393e6cb6cc8f939623ad47a0db17876 /tests/pcre-utf8 | |
download | grep-tarball-master.tar.gz |
Diffstat (limited to 'tests/pcre-utf8')
-rwxr-xr-x | tests/pcre-utf8 | 40 |
1 files changed, 40 insertions, 0 deletions
diff --git a/tests/pcre-utf8 b/tests/pcre-utf8 new file mode 100755 index 0000000..a29b412 --- /dev/null +++ b/tests/pcre-utf8 @@ -0,0 +1,40 @@ +#! /bin/sh +# Ensure that, with -P, Unicode \p{} symbols are correctly matched. +# +# Copyright (C) 2012-2016 Free Software Foundation, Inc. +# +# Copying and distribution of this file, with or without modification, +# are permitted in any medium without royalty provided the copyright +# notice and this notice are preserved. + +. "${srcdir=.}/init.sh"; path_prepend_ ../src +require_en_utf8_locale_ +LC_ALL=en_US.UTF-8 require_pcre_ + +fail=0 + +echo '$' | LC_ALL=en_US.UTF-8 grep -qP '\p{S}' \ + || skip_ 'PCRE support is compiled out, or it does not support properties' + +euro='\342\202\254 euro' +printf "$euro\\n" > in || framework_failure_ + +# The euro sign has the unicode "Symbol" property, so this must match: +LC_ALL=en_US.UTF-8 grep -P '^\p{S}' in > out || fail=1 +compare in out || fail=1 + +# This RE must *not* match in the C locale, because the first +# byte is not a "Symbol". +LC_ALL=C grep -P '^\p{S}' in > out && fail=1 +compare /dev/null out || fail=1 + +LC_ALL=en_US.UTF-8 grep -P '^. euro$' in > out2 || fail=1 +compare in out2 || fail=1 + +LC_ALL=en_US.UTF-8 grep -oP '. euro' in > out3 || fail=1 +compare in out3 || fail=1 + +LC_ALL=en_US.UTF-8 grep -P '^\P{S}' in > out4 +compare /dev/null out4 || fail=1 + +Exit $fail |