From 8ebfab32803787379c8201fb9f650fcb35e33ecc Mon Sep 17 00:00:00 2001
From: Bruno Haible <bruno@clisp.org>
Date: Thu, 4 May 2023 23:27:16 +0200
Subject: c32swidth: Add tests.

* tests/test-c32swidth.c: New file, based on tests/test-c32width.c.
* modules/c32swidth-tests: New file.
---
 ChangeLog               |   4 ++
 modules/c32swidth-tests |  15 ++++++
 tests/test-c32swidth.c  | 128 ++++++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 147 insertions(+)
 create mode 100644 modules/c32swidth-tests
 create mode 100644 tests/test-c32swidth.c

diff --git a/ChangeLog b/ChangeLog
index d55b5e5120..aaffe12fc1 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,5 +1,9 @@
 2023-05-04  Bruno Haible  <bruno@clisp.org>
 
+	c32swidth: Add tests.
+	* tests/test-c32swidth.c: New file, based on tests/test-c32width.c.
+	* modules/c32swidth-tests: New file.
+
 	c32swidth: New module.
 	* lib/uchar.in.h (c32swidth): New declaration.
 	* lib/wcswidth-impl.h: Use macros FUNC, UNIT, CHARACTER_WIDTH.
diff --git a/modules/c32swidth-tests b/modules/c32swidth-tests
new file mode 100644
index 0000000000..e591b9109f
--- /dev/null
+++ b/modules/c32swidth-tests
@@ -0,0 +1,15 @@
+Files:
+tests/test-c32swidth.c
+tests/signature.h
+tests/macros.h
+
+Depends-on:
+localcharset
+setlocale
+
+configure.ac:
+
+Makefile.am:
+TESTS += test-c32swidth
+check_PROGRAMS += test-c32swidth
+test_c32swidth_LDADD = $(LDADD) $(SETLOCALE_LIB) $(LIBUNISTRING)
diff --git a/tests/test-c32swidth.c b/tests/test-c32swidth.c
new file mode 100644
index 0000000000..8bf19afec9
--- /dev/null
+++ b/tests/test-c32swidth.c
@@ -0,0 +1,128 @@
+/* Test of c32swidth() function.
+   Copyright (C) 2023 Free Software Foundation, Inc.
+
+   This program is free software: you can redistribute it and/or modify
+   it under the terms of the GNU General Public License as published by
+   the Free Software Foundation, either version 3 of the License, or
+   (at your option) any later version.
+
+   This program is distributed in the hope that it will be useful,
+   but WITHOUT ANY WARRANTY; without even the implied warranty of
+   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+   GNU General Public License for more details.
+
+   You should have received a copy of the GNU General Public License
+   along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
+
+/* Written by Bruno Haible <bruno@clisp.org>, 2023.  */
+
+#include <config.h>
+
+#include <uchar.h>
+
+#include "signature.h"
+SIGNATURE_CHECK (c32swidth, int, (const char32_t *, size_t));
+
+#include <locale.h>
+#include <string.h>
+
+#include "localcharset.h"
+#include "macros.h"
+
+int
+main (void)
+{
+  int w;
+
+  /* Switch to a UTF-8 locale.  */
+  if (!((setlocale (LC_ALL, "fr_FR.UTF-8") != NULL
+         || setlocale (LC_ALL, "de_DE.UTF-8") != NULL
+         || setlocale (LC_ALL, "es_ES.UTF-8") != NULL
+         || setlocale (LC_ALL, "en_US.UTF-8") != NULL)
+        /* Check whether it's really a UTF-8 locale.
+           On native Windows, these setlocale calls succeed but the encoding
+           of this locale is CP1252, not UTF-8.  */
+        && strcmp (locale_charset (), "UTF-8") == 0))
+    {
+      fprintf (stderr, "Skipping test: No common Unicode locale is installed\n");
+      return 77; /* Exit status 77: the test was skipped.  */
+    }
+
+  {
+    char32_t s[] = { 'f', 'p', 0, 'x' };
+    w = c32swidth (s, 0);
+    ASSERT (w == 0);
+    w = c32swidth (s, 1);
+    ASSERT (w == 1);
+    w = c32swidth (s, 2);
+    ASSERT (w == 2);
+    w = c32swidth (s, 3);
+    ASSERT (w == 2); /* The NUL at s[2] contributes no width.  */
+    w = c32swidth (s, 4);
+    ASSERT (w == 2); /* The 'x' after the NUL is not counted.  */
+    w = c32swidth (s, (size_t)(-1)); /* Largest possible n.  */
+    ASSERT (w == 2);
+  }
+
+  {
+    char32_t s[] = { 'f', 'p', '\n', 'x' };
+    w = c32swidth (s, 0);
+    ASSERT (w == 0);
+    w = c32swidth (s, 1);
+    ASSERT (w == 1);
+    w = c32swidth (s, 2);
+    ASSERT (w == 2);
+    w = c32swidth (s, 3);
+    ASSERT (w == -1); /* '\n' is not printable, hence -1.  */
+    w = c32swidth (s, 4);
+    ASSERT (w == -1);
+  }
+
+  /* A non-spacing character (U+0301 COMBINING ACUTE ACCENT) adds no width.  */
+  {
+    char32_t s[] = { 'a', 0x0301 };
+    w = c32swidth (s, 2);
+    ASSERT (w == 1);
+  }
+
+  /* A zero width character (U+200B ZERO WIDTH SPACE) adds no width.  */
+  {
+    char32_t s[] = { 'i', 0x200B, 'j' };
+    w = c32swidth (s, 3);
+    ASSERT (w == 2);
+  }
+
+  /* Test width of some math symbols.
+     U+2202 is marked as having ambiguous width (A) in EastAsianWidth.txt
+     (see <https://www.unicode.org/Public/UCD/latest/ucd/EastAsianWidth.txt>).
+     The Unicode Standard Annex 11
+     <https://www.unicode.org/reports/tr11/>
+     says
+       "Ambiguous characters behave like wide or narrow characters
+        depending on the context (language tag, script identification,
+        associated font, source of data, or explicit markup; all can
+        provide the context). If the context cannot be established
+        reliably, they should be treated as narrow characters by default."
+     For c32swidth(), the only available context information is the locale.
+     The chosen locale above is a Western locale, not an East Asian locale,
+     therefore U+2202 should be treated like a narrow character.  */
+  {
+    char32_t s[] = { 0x2202 };
+    w = c32swidth (s, 1);
+    ASSERT (w == 1);
+  }
+
+  /* CJK characters, in and beyond the BMP, occupy two columns each.  */
+  {
+    char32_t s[] = { 0x4E2D, 0x6587 };
+    w = c32swidth (s, 2);
+    ASSERT (w == 4);
+  }
+  {
+    char32_t s[] = { 0x20369, 0x2F876 };
+    w = c32swidth (s, 2);
+    ASSERT (w == 4);
+  }
+
+  return 0;
+}
-- 
cgit v1.2.1