summaryrefslogtreecommitdiff
path: root/lib/unicore
diff options
context:
space:
mode:
author: Hugo van der Sanden <hv@crypt.org>, 2002-12-11 09:59:31 +0000
committer: hv <hv@crypt.org>, 2002-12-11 09:59:31 +0000
commit: 9c3dc5877366a4b76c59e7e1b537358b0b2bc2f8 (patch)
tree: 1c355bde2e89cc80c6e45dbf250069fe28912dfc /lib/unicore
parent: 3a2263fe90d1c0e6c8f9368f10e6672379a975a2 (diff)
download: perl-9c3dc5877366a4b76c59e7e1b537358b0b2bc2f8.tar.gz
Integrate from maint-5.8 #18156, #18218.
p4raw-id: //depot/perl@18281
p4raw-integrated: from //depot/maint-5.8/perl@18280 'copy in' lib/unicore/Category.pl lib/unicore/SpecialCasing.txt lib/unicore/UnicodeData.txt lib/unicore/lib/C.pl lib/unicore/lib/Cf.pl lib/unicore/lib/Cntrl.pl lib/unicore/lib/Graph.pl lib/unicore/lib/P.pl lib/unicore/lib/Pd.pl lib/unicore/lib/Print.pl lib/unicore/lib/Punct.pl (@17645..) t/op/pack.t (@18080..)
p4raw-integrated: from //depot/maint-5.8/perl@18156 'merge in' lib/Unicode/UCD.t (@17645..)
Diffstat (limited to 'lib/unicore')
-rw-r--r-- lib/unicore/Category.pl | 2
-rw-r--r-- lib/unicore/SpecialCasing.txt | 12
-rw-r--r-- lib/unicore/UnicodeData.txt | 2
-rw-r--r-- lib/unicore/lib/C.pl | 1
-rw-r--r-- lib/unicore/lib/Cf.pl | 1
-rw-r--r-- lib/unicore/lib/Cntrl.pl | 1
-rw-r--r-- lib/unicore/lib/Graph.pl | 3
-rw-r--r-- lib/unicore/lib/P.pl | 1
-rw-r--r-- lib/unicore/lib/Pd.pl | 1
-rw-r--r-- lib/unicore/lib/Print.pl | 3
-rw-r--r-- lib/unicore/lib/Punct.pl | 1
11 files changed, 17 insertions, 11 deletions
diff --git a/lib/unicore/Category.pl b/lib/unicore/Category.pl
index dba6ad9afc..e374f06df1 100644
--- a/lib/unicore/Category.pl
+++ b/lib/unicore/Category.pl
@@ -41,7 +41,7 @@ return <<'END';
00AA Ll
00AB Pi
00AC Sm
-00AD Pd
+00AD Cf
00AE So
00AF Sk
00B0 So
diff --git a/lib/unicore/SpecialCasing.txt b/lib/unicore/SpecialCasing.txt
index f25ac9b1b8..87740c7cd0 100644
--- a/lib/unicore/SpecialCasing.txt
+++ b/lib/unicore/SpecialCasing.txt
@@ -231,14 +231,18 @@ FB17; FB17; 0544 056D; 0544 053D; # ARMENIAN SMALL LIGATURE MEN XEH
# I and i-dotless; I-dot and i are case pairs in Turkish and Azeri
# The following rules handle those cases.
-0130; 0069; 0130; 0130; tr # LATIN CAPITAL LETTER I WITH DOT ABOVE
-0130; 0069; 0130; 0130; az # LATIN CAPITAL LETTER I WITH DOT ABOVE
+0130; 0069; 0130; 0130; tr; # LATIN CAPITAL LETTER I WITH DOT ABOVE
+0130; 0069; 0130; 0130; az; # LATIN CAPITAL LETTER I WITH DOT ABOVE
# When lowercasing, remove dot_above in the sequence I + dot_above, which will turn into i.
# This matches the behavior of the canonically equivalent I-dot_above
-0307; ; 0307; 0307; tr After_Soft_Dotted; # COMBINING DOT ABOVE
-0307; ; 0307; 0307; az After_Soft_Dotted; # COMBINING DOT ABOVE
+0307; ; 0307; 0307; tr After_I; # COMBINING DOT ABOVE
+0307; ; 0307; 0307; az After_I; # COMBINING DOT ABOVE
+
+# After_I: The last preceding base character was an uppercase I, and
+# there is no intervening combining character class 230 (ABOVE).
+# (from Unicode 3.2 Errata 2002 October 31)
# When lowercasing, unless an I is before a dot_above, it turns into a dotless i.
diff --git a/lib/unicore/UnicodeData.txt b/lib/unicore/UnicodeData.txt
index 125a6920dc..088fdb4fb6 100644
--- a/lib/unicore/UnicodeData.txt
+++ b/lib/unicore/UnicodeData.txt
@@ -171,7 +171,7 @@
00AA;FEMININE ORDINAL INDICATOR;Ll;0;L;<super> 0061;;;;N;;;;;
00AB;LEFT-POINTING DOUBLE ANGLE QUOTATION MARK;Pi;0;ON;;;;;Y;LEFT POINTING GUILLEMET;*;;;
00AC;NOT SIGN;Sm;0;ON;;;;;N;;;;;
-00AD;SOFT HYPHEN;Pd;0;ON;;;;;N;;;;;
+00AD;SOFT HYPHEN;Cf;0;ON;;;;;N;;;;;
00AE;REGISTERED SIGN;So;0;ON;;;;;N;REGISTERED TRADE MARK SIGN;;;;
00AF;MACRON;Sk;0;ON;<compat> 0020 0304;;;;N;SPACING MACRON;;;;
00B0;DEGREE SIGN;So;0;ET;;;;;N;;;;;
diff --git a/lib/unicore/lib/C.pl b/lib/unicore/lib/C.pl
index bbe5b39e48..b098c869f6 100644
--- a/lib/unicore/lib/C.pl
+++ b/lib/unicore/lib/C.pl
@@ -12,6 +12,7 @@
return <<'END';
0000 001F
007F 009F
+00AD
0221
0234 024F
02AE 02AF
diff --git a/lib/unicore/lib/Cf.pl b/lib/unicore/lib/Cf.pl
index 9012824ee4..1179ccbe88 100644
--- a/lib/unicore/lib/Cf.pl
+++ b/lib/unicore/lib/Cf.pl
@@ -10,6 +10,7 @@
# Meaning: General Category 'Cf'
#
return <<'END';
+00AD
06DD
070F
180E
diff --git a/lib/unicore/lib/Cntrl.pl b/lib/unicore/lib/Cntrl.pl
index b794776699..13327fd3a1 100644
--- a/lib/unicore/lib/Cntrl.pl
+++ b/lib/unicore/lib/Cntrl.pl
@@ -11,6 +11,7 @@
return <<'END';
0000 001F
007F 009F
+00AD
06DD
070F
180E
diff --git a/lib/unicore/lib/Graph.pl b/lib/unicore/lib/Graph.pl
index e3e98b518d..212c4c637f 100644
--- a/lib/unicore/lib/Graph.pl
+++ b/lib/unicore/lib/Graph.pl
@@ -10,7 +10,8 @@
#
return <<'END';
0021 007E
-00A1 0220
+00A1 00AC
+00AE 0220
0222 0233
0250 02AD
02B0 02EE
diff --git a/lib/unicore/lib/P.pl b/lib/unicore/lib/P.pl
index 1302e8d8f9..6ad7119ee0 100644
--- a/lib/unicore/lib/P.pl
+++ b/lib/unicore/lib/P.pl
@@ -21,7 +21,6 @@ return <<'END';
007D
00A1
00AB
-00AD
00B7
00BB
00BF
diff --git a/lib/unicore/lib/Pd.pl b/lib/unicore/lib/Pd.pl
index e32f88fe50..545e454b51 100644
--- a/lib/unicore/lib/Pd.pl
+++ b/lib/unicore/lib/Pd.pl
@@ -11,7 +11,6 @@
#
return <<'END';
002D
-00AD
058A
1806
2010 2015
diff --git a/lib/unicore/lib/Print.pl b/lib/unicore/lib/Print.pl
index 01ac6f10d4..d1eb1e23c2 100644
--- a/lib/unicore/lib/Print.pl
+++ b/lib/unicore/lib/Print.pl
@@ -10,7 +10,8 @@
#
return <<'END';
0020 007E
-00A0 0220
+00A0 00AC
+00AE 0220
0222 0233
0250 02AD
02B0 02EE
diff --git a/lib/unicore/lib/Punct.pl b/lib/unicore/lib/Punct.pl
index ca68b6ab49..70b8a2929c 100644
--- a/lib/unicore/lib/Punct.pl
+++ b/lib/unicore/lib/Punct.pl
@@ -20,7 +20,6 @@ return <<'END';
007D
00A1
00AB
-00AD
00B7
00BB
00BF