summary | refs | log | tree | commit | diff
path: root/tests/unictype/test-categ_Lo.c
diff options
context:
space:
mode:
author: Bruno Haible <bruno@clisp.org>, 2021-12-31 12:20:27 +0100
committer: Bruno Haible <bruno@clisp.org>, 2021-12-31 12:20:27 +0100
commit: f2e9cd38b97c58bcd66b804e08186503e00a3e8e (patch)
tree: 712f545d28aab410fe12b9ac93efca3bc682d8de /tests/unictype/test-categ_Lo.c
parent: 09cf5f3ac960dc7f413186bbda1c8aa2d43944df (diff)
download: gnulib-f2e9cd38b97c58bcd66b804e08186503e00a3e8e.tar.gz
Update to Unicode 13.0.0.
* lib/gen-uni-tables.c (is_WBP_MIDLETTER): Add character 0x055F. (get_wbp): Assign value WBP_ALETTER to the characters 0x02E5..0x02EB, 0x055A, 0x058A, 0xA708..0xA716. * lib/gen-uni-tables.c (LBP_CP1, LBP_CP2, LBP_OP1, LBP_OP2): New enum values. (LBP_OP, LBP_CP): Assign artificial values. (get_lbp): Use the unicode_width[] table to assign LBP_CP1, LBP_CP2 instead of LBP_CP, and LBP_OP1, LBP_OP2 instead of LBP_OP. Update such that unilbrk/lbrkprop.txt comes out as expected. (debug_output_lbp): Print either LBP_CP1 or LBP_CP2 as LBP_CP. Print either LBP_OP1 or LBP_OP2 as LBP_OP. (lbp_value_to_string): Handle LBP_CP1, LBP_CP2, LBP_OP1, LBP_OP2 instead of LBP_CP, LBP_OP. (output_lbrk_rules_as_tables): Treat LBP_CP and LBP_OP as macros that map to two table rows/columns. In rule LB30, use only LBP_OP1 instead of LBP_OP, and only LBP_CP1 instead of LBP_CP. Simplify rule LB22. * lib/unilbrk/lbrktables.h (LBP_CP1, LBP_CP2, LBP_OP1, LBP_OP2): New enum values. (LBP_OP, LBP_CP): Remove enum values. (unilbrk_table): Update declaration. * lib/unilbrk/u8-possible-linebreaks.c (u8_possible_linebreaks_loop): Add a test for East Asian opening parenthesis. * lib/unilbrk/u16-possible-linebreaks.c (u16_possible_linebreaks_loop): Likewise. * lib/unilbrk/u32-possible-linebreaks.c (u32_possible_linebreaks_loop): Likewise. * lib/uniwidth/width.c (nonspacing_table_data, nonspacing_table_ind): Update. (uc_width): Assign width 2 to the characters 0x16FF0..0x16FF1, 0x18AF3..0x18CD5, 0x18D00..0x18D08, 0x1F6D6..0x1F6D7, 0x1F6FB..0x1F6FC, 0x1F90C, 0x1FA74, 0x1FA83..0x1FA86, 0x1FA96..0x1FAA8, 0x1FAB0..0x1FAB6, 0x1FAC0..0x1FAC2, 0x1FAD0..0x1FAD6. Assign width 1 to the characters 0x1F93B, 0x1F946. * tests/uniwidth/test-uc_width2.sh: Expect width 0 for the characters 0x0B55, 0x0D81, 0x1ABF..0x1AC0, 0xA82C, 0x10EAB..0x10EAC, 0x111CF, 0x1193B..0x1193C, 0x1193E, 0x11943, 0x16FE4. 
Expect width 2 for the characters 0x16FF0..0x16FF1, 0x18AF3..0x18CD5, 0x18D00..0x18D08, 0x1F6D6..0x1F6D7, 0x1F6FB..0x1F6FC, 0x1F90C, 0x1FA74, 0x1FA83..0x1FA86, 0x1FA96..0x1FAA8, 0x1FAB0..0x1FAB6, 0x1FAC0..0x1FAC2, 0x1FAD0..0x1FAD6. Expect width 1 for the characters 0x1F93B, 0x1F946. * All generated files under lib/uni* and tests/uni*: Regenerate. * tests/uniname/NameAliases.txt: Update. * tests/uniname/UnicodeData.txt: Update. * tests/uninorm/NormalizationTest.txt: Update. * tests/unigbrk/GraphemeBreakTest.txt: Update. * tests/uniwbrk/WordBreakTest.txt: Update. * All the affected modules: Bump required libunistring version.
Diffstat (limited to 'tests/unictype/test-categ_Lo.c')
-rw-r--r-- tests/unictype/test-categ_Lo.c 33
1 files changed, 23 insertions, 10 deletions
diff --git a/tests/unictype/test-categ_Lo.c b/tests/unictype/test-categ_Lo.c
index d0553234aa..38a059c461 100644
--- a/tests/unictype/test-categ_Lo.c
+++ b/tests/unictype/test-categ_Lo.c
@@ -41,7 +41,7 @@
{ 0x0840, 0x0858 },
{ 0x0860, 0x086A },
{ 0x08A0, 0x08B4 },
- { 0x08B6, 0x08BD },
+ { 0x08B6, 0x08C7 },
{ 0x0904, 0x0939 },
{ 0x093D, 0x093D },
{ 0x0950, 0x0950 },
@@ -117,7 +117,7 @@
{ 0x0CDE, 0x0CDE },
{ 0x0CE0, 0x0CE1 },
{ 0x0CF1, 0x0CF2 },
- { 0x0D05, 0x0D0C },
+ { 0x0D04, 0x0D0C },
{ 0x0D0E, 0x0D10 },
{ 0x0D12, 0x0D3A },
{ 0x0D3D, 0x0D3D },
@@ -230,10 +230,10 @@
{ 0x30FF, 0x30FF },
{ 0x3105, 0x312F },
{ 0x3131, 0x318E },
- { 0x31A0, 0x31BA },
+ { 0x31A0, 0x31BF },
{ 0x31F0, 0x31FF },
- { 0x3400, 0x4DB5 },
- { 0x4E00, 0x9FEF },
+ { 0x3400, 0x4DBF },
+ { 0x4E00, 0x9FFC },
{ 0xA000, 0xA014 },
{ 0xA016, 0xA48C },
{ 0xA4D0, 0xA4F7 },
@@ -357,15 +357,19 @@
{ 0x10B80, 0x10B91 },
{ 0x10C00, 0x10C48 },
{ 0x10D00, 0x10D23 },
+ { 0x10E80, 0x10EA9 },
+ { 0x10EB0, 0x10EB1 },
{ 0x10F00, 0x10F1C },
{ 0x10F27, 0x10F27 },
{ 0x10F30, 0x10F45 },
+ { 0x10FB0, 0x10FC4 },
{ 0x10FE0, 0x10FF6 },
{ 0x11003, 0x11037 },
{ 0x11083, 0x110AF },
{ 0x110D0, 0x110E8 },
{ 0x11103, 0x11126 },
{ 0x11144, 0x11144 },
+ { 0x11147, 0x11147 },
{ 0x11150, 0x11172 },
{ 0x11176, 0x11176 },
{ 0x11183, 0x111B2 },
@@ -391,7 +395,7 @@
{ 0x1135D, 0x11361 },
{ 0x11400, 0x11434 },
{ 0x11447, 0x1144A },
- { 0x1145F, 0x1145F },
+ { 0x1145F, 0x11461 },
{ 0x11480, 0x114AF },
{ 0x114C4, 0x114C5 },
{ 0x114C7, 0x114C7 },
@@ -403,7 +407,13 @@
{ 0x116B8, 0x116B8 },
{ 0x11700, 0x1171A },
{ 0x11800, 0x1182B },
- { 0x118FF, 0x118FF },
+ { 0x118FF, 0x11906 },
+ { 0x11909, 0x11909 },
+ { 0x1190C, 0x11913 },
+ { 0x11915, 0x11916 },
+ { 0x11918, 0x1192F },
+ { 0x1193F, 0x1193F },
+ { 0x11941, 0x11941 },
{ 0x119A0, 0x119A7 },
{ 0x119AA, 0x119D0 },
{ 0x119E1, 0x119E1 },
@@ -428,6 +438,7 @@
{ 0x11D6A, 0x11D89 },
{ 0x11D98, 0x11D98 },
{ 0x11EE0, 0x11EF2 },
+ { 0x11FB0, 0x11FB0 },
{ 0x12000, 0x12399 },
{ 0x12480, 0x12543 },
{ 0x13000, 0x1342E },
@@ -441,7 +452,8 @@
{ 0x16F00, 0x16F4A },
{ 0x16F50, 0x16F50 },
{ 0x17000, 0x187F7 },
- { 0x18800, 0x18AF2 },
+ { 0x18800, 0x18CD5 },
+ { 0x18D00, 0x18D08 },
{ 0x1B000, 0x1B11E },
{ 0x1B150, 0x1B152 },
{ 0x1B164, 0x1B167 },
@@ -487,12 +499,13 @@
{ 0x1EEA1, 0x1EEA3 },
{ 0x1EEA5, 0x1EEA9 },
{ 0x1EEAB, 0x1EEBB },
- { 0x20000, 0x2A6D6 },
+ { 0x20000, 0x2A6DD },
{ 0x2A700, 0x2B734 },
{ 0x2B740, 0x2B81D },
{ 0x2B820, 0x2CEA1 },
{ 0x2CEB0, 0x2EBE0 },
- { 0x2F800, 0x2FA1D }
+ { 0x2F800, 0x2FA1D },
+ { 0x30000, 0x3134A }
#define PREDICATE(c) uc_is_general_category (c, UC_CATEGORY_Lo)
#include "test-predicate-part2.h"