diff options
-rw-r--r-- | lib/unicore/mktables | 6 |
-rw-r--r-- | pod/perldelta.pod | 5 |
-rw-r--r-- | t/uni/class.t | 14 |
3 files changed, 16 insertions, 9 deletions
diff --git a/lib/unicore/mktables b/lib/unicore/mktables index a8209cf748..042fb94834 100644 --- a/lib/unicore/mktables +++ b/lib/unicore/mktables @@ -10153,12 +10153,16 @@ END # allow the BELL name for U+1F514, so that the old usage can be # deprecated for one cycle. - return if $_ !~ /^(?:0007|1F514);/; + return if $_ !~ /^(?:0007|1F514|070F);/; my ($code_point, @fields) = split /\s*;\s*/, $_, -1; if ($code_point eq '0007') { $fields[$CHARNAME] = "ALERT"; } + elsif ($code_point eq '070F') { # Unicode Corrigendum #8; see + # http://www.unicode.org/versions/corrigendum8.html + $fields[$BIDI] = "AL"; + } elsif ($^V lt v5.15.0) { # For 5.16 will convert to use Unicode's name $fields[$CHARNAME] = ""; } diff --git a/pod/perldelta.pod b/pod/perldelta.pod index 9b1b6f4f0a..f3f5dbfe9b 100644 --- a/pod/perldelta.pod +++ b/pod/perldelta.pod @@ -139,8 +139,9 @@ L<perlmod/"BEGIN, UNITCHECK, CHECK, INIT and END">. =head2 Unicode Version 6.0 is now supported (mostly) -Perl comes with the Unicode 6.0 data base, with one exception noted -below. +Perl comes with the Unicode 6.0 data base updated with +L<Corrigendum #8|http://www.unicode.org/versions/corrigendum8.html>, +with one exception noted below. See L<http://unicode.org/versions/Unicode6.0.0> for details on the new release. 
Perl does not support any Unicode provisional properties, including the new ones for this release, but their database files are diff --git a/t/uni/class.t b/t/uni/class.t index 107a20274d..fedec4cdfe 100644 --- a/t/uni/class.t +++ b/t/uni/class.t @@ -65,12 +65,14 @@ is(($str =~ /(\p{Other::Class}+)/)[0], '@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]^_'); # make sure it finds class in other OTHER package is(($str =~ /(\p{A::B::Intersection}+)/)[0], '@ABCDEFGHIJKLMNO'); -# lib/unicore/Bc/AL.pl -$str = "\x{070D}\x{070E}\x{070F}\x{0710}\x{0711}"; -is(($str =~ /(\P{BidiClass: ArabicLetter}+)/)[0], "\x{070F}"); -is(($str =~ /(\P{BidiClass: AL}+)/)[0], "\x{070F}"); -is(($str =~ /(\P{BC :ArabicLetter}+)/)[0], "\x{070F}"); -is(($str =~ /(\P{bc=AL}+)/)[0], "\x{070F}"); +# lib/unicore/lib/Bc/AL.pl. U+070E is unassigned, currently, but still has +# bidi class AL. The first one in the sequence that doesn't is 0711, which is +# BC=NSM. +$str = "\x{070D}\x{070E}\x{070F}\x{0710}\x{0711}\x{0712}"; +is(($str =~ /(\P{BidiClass: ArabicLetter}+)/)[0], "\x{0711}"); +is(($str =~ /(\P{BidiClass: AL}+)/)[0], "\x{0711}"); +is(($str =~ /(\P{BC :ArabicLetter}+)/)[0], "\x{0711}"); +is(($str =~ /(\P{bc=AL}+)/)[0], "\x{0711}"); # make sure InGreek works $str = "[\x{038B}\x{038C}\x{038D}]"; |