From de524f25f5a90dad63fa962cb8585acd86c62a88 Mon Sep 17 00:00:00 2001 From: Karl Williamson Date: Wed, 15 Sep 2021 07:36:41 -0600 Subject: mktables: Split a Line Break equivalence class This is used for the \b{lb}, and the rule is changing in Unicode 14.0 --- regen/mk_invlists.pl | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) (limited to 'regen') diff --git a/regen/mk_invlists.pl b/regen/mk_invlists.pl index d58e63cba9..cdddbc5e08 100644 --- a/regen/mk_invlists.pl +++ b/regen/mk_invlists.pl @@ -1783,6 +1783,9 @@ sub output_LB_table() { # PR × (ID | EB | EM) $lb_table[$lb_enums{'Prefix_Numeric'}][$lb_enums{'Ideographic'}] = $lb_actions{'LB_NOBREAK'}; + $lb_table[$lb_enums{'Prefix_Numeric'}] + [$lb_enums{'Unassigned_Extended_Pictographic_Ideographic'}] + = $lb_actions{'LB_NOBREAK'}; $lb_table[$lb_enums{'Prefix_Numeric'}][$lb_enums{'E_Base'}] = $lb_actions{'LB_NOBREAK'}; $lb_table[$lb_enums{'Prefix_Numeric'}][$lb_enums{'E_Modifier'}] @@ -1791,6 +1794,8 @@ sub output_LB_table() { # (ID | EB | EM) × PO $lb_table[$lb_enums{'Ideographic'}][$lb_enums{'Postfix_Numeric'}] = $lb_actions{'LB_NOBREAK'}; + $lb_table[$lb_enums{'Unassigned_Extended_Pictographic_Ideographic'}] + [$lb_enums{'Postfix_Numeric'}] = $lb_actions{'LB_NOBREAK'}; $lb_table[$lb_enums{'E_Base'}][$lb_enums{'Postfix_Numeric'}] = $lb_actions{'LB_NOBREAK'}; $lb_table[$lb_enums{'E_Modifier'}][$lb_enums{'Postfix_Numeric'}] @@ -2462,7 +2467,7 @@ my @props; push @props, sort { prop_name_for_cmp($a) cmp prop_name_for_cmp($b) } qw( &UpperLatin1 _Perl_GCB,EDGE,E_Base,E_Base_GAZ,E_Modifier,Glue_After_Zwj,LV,Prepend,Regional_Indicator,SpacingMark,ZWJ,ExtPict_XX - _Perl_LB,EDGE,Close_Parenthesis,Hebrew_Letter,Next_Line,Regional_Indicator,ZWJ,Contingent_Break,E_Base,E_Modifier,H2,H3,JL,JT,JV,Word_Joiner,East_Asian_CP,East_Asian_OP + _Perl_LB,EDGE,Close_Parenthesis,Hebrew_Letter,Next_Line,Regional_Indicator,ZWJ,Contingent_Break,E_Base,E_Modifier,H2,H3,JL,JT,JV,Word_Joiner,East_Asian_CP,East_Asian_OP,Unassigned_Extended_Pictographic_Ideographic _Perl_SB,EDGE,SContinue,CR,Extend,LF _Perl_WB,Perl_Tailored_HSpace,EDGE,UNKNOWN,CR,Double_Quote,E_Base,E_Base_GAZ,E_Modifier,Extend,Glue_After_Zwj,Hebrew_Letter,LF,MidNumLet,Newline,Regional_Indicator,Single_Quote,ZWJ,ExtPict_XX,ExtPict_LE _Perl_SCX,Latin,Inherited,Unknown,Kore,Jpan,Hanb,INVALID -- cgit v1.2.1