diff options
Diffstat (limited to 'cpan/Unicode-Collate/Collate')
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale.pm | 24 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/az.pl | 50 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/da.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/et.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/fi.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/fil.pl | 11 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/fo.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/ha.pl | 13 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/is.pl | 4 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/kl.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/lt.pl | 22 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/mt.pl | 29 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/nn.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/sk.pl | 2 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/sv.pl | 12 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/tr.pl | 45 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/wo.pl | 25 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/yo.pl | 19 |
18 files changed, 324 insertions, 4 deletions
diff --git a/cpan/Unicode-Collate/Collate/Locale.pm b/cpan/Unicode-Collate/Collate/Locale.pm index 4aeef1f582..4803df98c7 100644 --- a/cpan/Unicode-Collate/Collate/Locale.pm +++ b/cpan/Unicode-Collate/Collate/Locale.pm @@ -4,7 +4,7 @@ use strict; use Carp; use base qw(Unicode::Collate); -our $VERSION = '0.58'; +our $VERSION = '0.59'; use File::Spec; @@ -13,7 +13,8 @@ my $KeyPath = File::Spec->catfile('allkeys.txt'); my $PL_EXT = '.pl'; my %LocaleFile = map { ($_, $_) } qw( - af ca cs cy da eo es et fi fo fr haw is kl lv nn pl ro sk sl sv sw + af az ca cs cy da eo es et fi fil fo fr ha haw + is kl lt lv mt nn pl ro sk sl sv sw tr wo yo ); $LocaleFile{'default'} = ''; $LocaleFile{'es__traditional'} = 'es_trad'; @@ -39,7 +40,7 @@ sub getlocale { return shift->{accepted_locale}; } -sub _fetch_locale { +sub _fetchpl { my $accepted = shift; my $f = $LocaleFile{$accepted}; return if !$f; @@ -60,7 +61,7 @@ sub new { } $hash{table} = $KeyPath; - my $href = _fetch_locale($hash{accepted_locale}); + my $href = _fetchpl($hash{accepted_locale}); while (my($k,$v) = each %$href) { if (exists $hash{$k}) { croak "$k is reserved by $hash{locale}, can't be overwritten"; @@ -153,6 +154,7 @@ this method returns a string C<'default'> meaning no special tailoring. locale name description ---------------------------------------------------------- af Afrikaans + az Azerbaijani (Azeri) ca Catalan cs Czech cy Welsh @@ -162,12 +164,16 @@ this method returns a string C<'default'> meaning no special tailoring. es__traditional Spanish ('ch' and 'll' as a grapheme) et Estonian fi Finnish + fil Filipino fo Faroese fr French + ha Hausa haw Hawaiian is Icelandic kl Kalaallisut + lt Lithuanian lv Latvian + mt Maltese nb Norwegian Bokmal nn Norwegian Nynorsk pl Polish @@ -176,6 +182,16 @@ this method returns a string C<'default'> meaning no special tailoring. sl Slovenian sv Swedish sw Swahili + tr Turkish + wo Wolof + yo Yoruba + +=head1 INSTALL + +Installation of Unicode::Collate::Locale requires F<Collate/Locale.pm>, +F<Collate/Locale/*.pm> and F<Collate/allkeys.txt>. On building, +Unicode::Collate::Locale doesn't require F<data/*.txt> and F<mklocale>. +Tests for Unicode::Collate::Locale are named F<t/loc_*.t>. =head1 AUTHOR diff --git a/cpan/Unicode-Collate/Collate/Locale/az.pl b/cpan/Unicode-Collate/Collate/Locale/az.pl new file mode 100644 index 0000000000..b9ed54b644 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/az.pl @@ -0,0 +1,50 @@ ++{ +# schwa doesn't require tailoring + entry => <<'ENTRY', # for DUCET v5.2.0 +00E7 ; [.123E.0020.0002.00E7] # LATIN SMALL LETTER C WITH CEDILLA +0063 0327 ; [.123E.0020.0002.00E7] # LATIN SMALL LETTER C WITH CEDILLA +00C7 ; [.123E.0020.0008.00C7] # LATIN CAPITAL LETTER C WITH CEDILLA +0043 0327 ; [.123E.0020.0008.00C7] # LATIN CAPITAL LETTER C WITH CEDILLA +011F ; [.12B1.0020.0002.011F] # LATIN SMALL LETTER G WITH BREVE +0067 0306 ; [.12B1.0020.0002.011F] # LATIN SMALL LETTER G WITH BREVE +011E ; [.12B1.0020.0008.011E] # LATIN CAPITAL LETTER G WITH BREVE +0047 0306 ; [.12B1.0020.0008.011E] # LATIN CAPITAL LETTER G WITH BREVE +0131 ; [.12EB.0020.0002.0131] # LATIN SMALL LETTER DOTLESS I +0049 ; [.12EB.0020.0008.0049] # LATIN CAPITAL LETTER I +00CC ; [.12EB.0020.0008.0049][.0000.0035.0002.0300] # LATIN CAPITAL LETTER I WITH GRAVE +00CD ; [.12EB.0020.0008.0049][.0000.0032.0002.0301] # LATIN CAPITAL LETTER I WITH ACUTE +00CE ; [.12EB.0020.0008.0049][.0000.003C.0002.0302] # LATIN CAPITAL LETTER I WITH CIRCUMFLEX +00CF ; [.12EB.0020.0008.0049][.0000.0047.0002.0308] # LATIN CAPITAL LETTER I WITH DIAERESIS +012A ; [.12EB.0020.0008.0049][.0000.005B.0002.0304] # LATIN CAPITAL LETTER I WITH MACRON +012C ; [.12EB.0020.0008.0049][.0000.0037.0002.0306] # LATIN CAPITAL LETTER I WITH BREVE +012E ; [.12EB.0020.0008.0049][.0000.0059.0002.0328] # LATIN CAPITAL LETTER I WITH OGONEK +0130 ; [.12EC.0020.0008.0130] # LATIN CAPITAL LETTER I WITH DOT ABOVE +0049 0307 ; [.12EC.0020.0008.0130] # LATIN CAPITAL LETTER I WITH DOT ABOVE +00F6 ; [.138F.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +006F 0308 ; [.138F.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +00D6 ; [.138F.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +004F 0308 ; [.138F.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.138F.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.138F.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON +015F ; [.1411.0020.0002.015F] # LATIN SMALL LETTER S WITH CEDILLA +0073 0327 ; [.1411.0020.0002.015F] # LATIN SMALL LETTER S WITH CEDILLA +015E ; [.1411.0020.0008.015E] # LATIN CAPITAL LETTER S WITH CEDILLA +0053 0327 ; [.1411.0020.0008.015E] # LATIN CAPITAL LETTER S WITH CEDILLA +00FC ; [.1454.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +0075 0308 ; [.1454.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +00DC ; [.1454.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +0055 0308 ; [.1454.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.1454.0020.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.1454.0020.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.1454.0020.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.1454.0020.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.1454.0020.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.1454.0020.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.1454.0020.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.1454.0020.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON +0071 ; [.131F.0020.0002.0071] # LATIN SMALL LETTER Q +0051 ; [.131F.0020.0008.0051] # LATIN CAPITAL LETTER Q +0078 ; [.12D4.0020.0002.0078] # LATIN SMALL LETTER X +0058 ; [.12D4.0020.0008.0058] # LATIN CAPITAL LETTER X +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/da.pl b/cpan/Unicode-Collate/Collate/Locale/da.pl index e680df11b9..6b707f17d6 100644 --- a/cpan/Unicode-Collate/Collate/Locale/da.pl +++ b/cpan/Unicode-Collate/Collate/Locale/da.pl @@ -13,6 +13,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0171 ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0075 030B ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0170 ; [.149C.0022.0008.0170] # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE @@ -28,6 +36,8 @@ 0061 0308 ; [.14AE.0021.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AE.0021.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AE.0021.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 0119 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0065 0328 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0118 ; [.14AE.0022.0008.0118] # LATIN CAPITAL LETTER E WITH OGONEK @@ -42,6 +52,8 @@ 006F 0308 ; [.14AF.0021.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14AF.0021.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14AF.0021.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 0151 ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 006F 030B ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 0150 ; [.14AF.0022.0008.0150] # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE diff --git a/cpan/Unicode-Collate/Collate/Locale/et.pl b/cpan/Unicode-Collate/Collate/Locale/et.pl index 15a24198d0..0ee593f8da 100644 --- a/cpan/Unicode-Collate/Collate/Locale/et.pl +++ b/cpan/Unicode-Collate/Collate/Locale/et.pl @@ -20,13 +20,25 @@ 0061 0308 ; [.1494.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.1494.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.1494.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.1494.0020.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.1494.0020.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 00F6 ; [.1495.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 006F 0308 ; [.1495.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.1495.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.1495.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.1495.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.1495.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 00FC ; [.1496.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 0075 0308 ; [.1496.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.1496.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.1496.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.1496.0020.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.1496.0020.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.1496.0020.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.1496.0020.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.1496.0020.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.1496.0020.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.1496.0020.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.1496.0020.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON ENTRY }; diff --git a/cpan/Unicode-Collate/Collate/Locale/fi.pl b/cpan/Unicode-Collate/Collate/Locale/fi.pl index 96e3491db1..7d0faf63b3 100644 --- a/cpan/Unicode-Collate/Collate/Locale/fi.pl +++ b/cpan/Unicode-Collate/Collate/Locale/fi.pl @@ -15,6 +15,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0292 ; [.14AD.0021.0002.0292][.0000.007D.0002.0335] # LATIN SMALL LETTER EZH 01B7 ; [.14AD.0021.0008.01B7][.0000.007D.0002.0335] # LATIN CAPITAL LETTER EZH 01EF ; [.14AD.0021.0002.0292][.0000.007D.0002.0335][.0000.0041.0002.030C] # LATIN SMALL LETTER EZH WITH CARON @@ -30,6 +38,8 @@ 0061 0308 ; [.14AF.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AF.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AF.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AF.0020.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AF.0020.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 00E6 ; [.14AF.0021.0002.00E6] # LATIN SMALL LETTER AE 00C6 ; [.14AF.0021.0008.00C6] # LATIN CAPITAL LETTER AE 1D2D ; [.14AF.0021.0014.1D2D] # MODIFIER LETTER CAPITAL AE @@ -41,6 +51,8 @@ 006F 0308 ; [.14B0.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14B0.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14B0.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14B0.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14B0.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 00F8 ; [.14B0.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 006F 0338 ; [.14B0.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 00D8 ; [.14B0.0021.0008.00D8] # LATIN CAPITAL LETTER O WITH STROKE diff --git a/cpan/Unicode-Collate/Collate/Locale/fil.pl b/cpan/Unicode-Collate/Collate/Locale/fil.pl new file mode 100644 index 0000000000..bb6f7a34ca --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/fil.pl @@ -0,0 +1,11 @@ ++{ + entry => <<'ENTRY', # for DUCET v5.2.0 +00F1 ; [.136E.0020.0002.00F1] # LATIN SMALL LETTER N WITH TILDE +006E 0303 ; [.136E.0020.0002.00F1] # LATIN SMALL LETTER N WITH TILDE +00D1 ; [.136E.0020.0008.00D1] # LATIN CAPITAL LETTER N WITH TILDE +004E 0303 ; [.136E.0020.0008.00D1] # LATIN CAPITAL LETTER N WITH TILDE +006E 0067 ; [.136F.0020.0002.006E] # <LATIN SMALL LETTER N, LATIN SMALL LETTER G> +004E 0067 ; [.136F.0020.0007.004E] # <LATIN CAPITAL LETTER N, LATIN SMALL LETTER G> +004E 0047 ; [.136F.0020.0008.004E] # <LATIN CAPITAL LETTER N, LATIN CAPITAL LETTER G> +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/fo.pl b/cpan/Unicode-Collate/Collate/Locale/fo.pl index 48066f2b8c..b759203614 100644 --- a/cpan/Unicode-Collate/Collate/Locale/fo.pl +++ b/cpan/Unicode-Collate/Collate/Locale/fo.pl @@ -12,6 +12,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0171 ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0075 030B ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0170 ; [.149C.0022.0008.0170] # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE @@ -27,6 +35,8 @@ 0061 0308 ; [.14AE.0021.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AE.0021.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AE.0021.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 0119 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0065 0328 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0118 ; [.14AE.0022.0008.0118] # LATIN CAPITAL LETTER E WITH OGONEK @@ -41,6 +51,8 @@ 006F 0308 ; [.14AF.0021.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14AF.0021.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14AF.0021.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 0151 ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 006F 030B ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 0150 ; [.14AF.0022.0008.0150] # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE diff --git a/cpan/Unicode-Collate/Collate/Locale/ha.pl b/cpan/Unicode-Collate/Collate/Locale/ha.pl new file mode 100644 index 0000000000..d531c1118b --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/ha.pl @@ -0,0 +1,13 @@ ++{ +# b-hook, d-hook, k-hook, y-hook don't require tailoring + entry => <<'ENTRY', # for DUCET v5.2.0 +0073 0068 ; [.1411.0020.0002.0073] # <LATIN SMALL LETTER S, LATIN SMALL LETTER H> +0053 0068 ; [.1411.0020.0007.0053] # <LATIN CAPITAL LETTER S, LATIN SMALL LETTER H> +0053 0048 ; [.1411.0020.0008.0053] # <LATIN CAPITAL LETTER S, LATIN CAPITAL LETTER H> +0074 0073 ; [.1434.0020.0002.0074] # <LATIN SMALL LETTER T, LATIN SMALL LETTER S> +0054 0073 ; [.1434.0020.0007.0054] # <LATIN CAPITAL LETTER T, LATIN SMALL LETTER S> +0054 0053 ; [.1434.0020.0008.0054] # <LATIN CAPITAL LETTER T, LATIN CAPITAL LETTER S> +0027 0079 ; [.14A8.0020.0002.01B4] # <APOSTROPHE, LATIN SMALL LETTER Y> +0027 0059 ; [.14A8.0020.0008.01B3] # <APOSTROPHE, LATIN CAPITAL LETTER Y> +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/is.pl b/cpan/Unicode-Collate/Collate/Locale/is.pl index ec48689df5..b6c93a9c01 100644 --- a/cpan/Unicode-Collate/Collate/Locale/is.pl +++ b/cpan/Unicode-Collate/Collate/Locale/is.pl @@ -41,10 +41,14 @@ 0061 0308 ; [.1522.0021.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.1522.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.1522.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.1522.0021.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.1522.0021.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 00F6 ; [.1523.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 006F 0308 ; [.1523.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.1523.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.1523.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.1523.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.1523.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 00F8 ; [.1523.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 006F 0338 ; [.1523.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 00D8 ; [.1523.0021.0008.00D8] # LATIN CAPITAL LETTER O WITH STROKE diff --git a/cpan/Unicode-Collate/Collate/Locale/kl.pl b/cpan/Unicode-Collate/Collate/Locale/kl.pl index 5c525b8536..a69c1016ec 100644 --- a/cpan/Unicode-Collate/Collate/Locale/kl.pl +++ b/cpan/Unicode-Collate/Collate/Locale/kl.pl @@ -14,6 +14,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0171 ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0075 030B ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0170 ; [.149C.0022.0008.0170] # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE @@ -29,6 +37,8 @@ 0061 0308 ; [.14AE.0021.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AE.0021.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AE.0021.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 0119 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0065 0328 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0118 ; [.14AE.0022.0008.0118] # LATIN CAPITAL LETTER E WITH OGONEK @@ -43,6 +53,8 @@ 006F 0308 ; [.14AF.0021.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14AF.0021.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14AF.0021.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 0151 ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 006F 030B ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 0150 ; [.14AF.0022.0008.0150] # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE diff --git a/cpan/Unicode-Collate/Collate/Locale/lt.pl b/cpan/Unicode-Collate/Collate/Locale/lt.pl new file mode 100644 index 0000000000..b1dbc082fb --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/lt.pl @@ -0,0 +1,22 @@ ++{ + entry => <<'ENTRY', # for DUCET v5.2.0 +0307 ; [.0000.005A.0002.0307] # COMBINING DOT ABOVE +010D ; [.124F.0020.0002.010D] # LATIN SMALL LETTER C WITH CARON +0063 030C ; [.124F.0020.0002.010D] # LATIN SMALL LETTER C WITH CARON +010C ; [.124F.0020.0008.010C] # LATIN CAPITAL LETTER C WITH CARON +0043 030C ; [.124F.0020.0008.010C] # LATIN CAPITAL LETTER C WITH CARON +0079 ; [.12EC.0021.0002.0079] # LATIN SMALL LETTER Y +0059 ; [.12EC.0021.0008.0059] # LATIN CAPITAL LETTER Y +0161 ; [.1432.0020.0002.0161] # LATIN SMALL LETTER S WITH CARON +0073 030C ; [.1432.0020.0002.0161] # LATIN SMALL LETTER S WITH CARON +0160 ; [.1432.0020.0008.0160] # LATIN CAPITAL LETTER S WITH CARON +0053 030C ; [.1432.0020.0008.0160] # LATIN CAPITAL LETTER S WITH CARON +017E ; [.14C9.0020.0002.017E] # LATIN SMALL LETTER Z WITH CARON +007A 030C ; [.14C9.0020.0002.017E] # LATIN SMALL LETTER Z WITH CARON +017D ; [.14C9.0020.0008.017D] # LATIN CAPITAL LETTER Z WITH CARON +005A 030C ; [.14C9.0020.0008.017D] # LATIN CAPITAL LETTER Z WITH CARON +0117 ; [.126B.0020.0002.0065][.0000.005A.0002.0307] # LATIN SMALL LETTER E WITH DOT ABOVE +0116 ; [.126B.0020.0008.0045][.0000.005A.0002.0307] # LATIN CAPITAL LETTER E WITH DOT ABOVE +0130 ; [.12EC.0020.0008.0049][.0000.005A.0002.0307] # LATIN CAPITAL LETTER I WITH DOT ABOVE +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/mt.pl b/cpan/Unicode-Collate/Collate/Locale/mt.pl new file mode 100644 index 0000000000..08aa5aebf4 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/mt.pl @@ -0,0 +1,29 @@ ++{ + upper_before_lower => 1, + entry => <<'ENTRY', # for DUCET v5.2.0 +010B ; [.124F.0020.0002.010B] # LATIN SMALL LETTER C WITH DOT ABOVE +0063 0307 ; [.124F.0020.0002.010B] # LATIN SMALL LETTER C WITH DOT ABOVE +010A ; [.124F.0020.0008.010A] # LATIN CAPITAL LETTER C WITH DOT ABOVE +0043 0307 ; [.124F.0020.0008.010A] # LATIN CAPITAL LETTER C WITH DOT ABOVE +0121 ; [.12AF.0020.0002.0121] # LATIN SMALL LETTER G WITH DOT ABOVE +0067 0307 ; [.12AF.0020.0002.0121] # LATIN SMALL LETTER G WITH DOT ABOVE +0120 ; [.12AF.0020.0008.0120] # LATIN CAPITAL LETTER G WITH DOT ABOVE +0047 0307 ; [.12AF.0020.0008.0120] # LATIN CAPITAL LETTER G WITH DOT ABOVE +0067 0127 ; [.12D2.0020.0002.0067] # <LATIN SMALL LETTER G, LATIN SMALL LETTER H WITH STROKE> +0067 0126 ; [.12D2.0020.0007.0067][0.0.2.0] # <LATIN SMALL LETTER G, LATIN CAPITAL LETTER H WITH STROKE> +0047 0127 ; [.12D2.0020.0007.0047][0.0.8.0] # <LATIN CAPITAL LETTER G, LATIN SMALL LETTER H WITH STROKE> +0047 0126 ; [.12D2.0020.0008.0047] # <LATIN CAPITAL LETTER G, LATIN CAPITAL LETTER H WITH STROKE> +0067 0068 0335 ; [.12D2.0020.0002.0067] # <LATIN SMALL LETTER G, LATIN SMALL LETTER H, COMBINING SHORT STROKE OVERLAY> +0067 0048 0335 ; [.12D2.0020.0007.0067][0.0.2.0] # <LATIN SMALL LETTER G, LATIN CAPITAL LETTER H, COMBINING SHORT STROKE OVERLAY> +0047 0068 0335 ; [.12D2.0020.0007.0047][0.0.8.0] # <LATIN CAPITAL LETTER G, LATIN SMALL LETTER H, COMBINING SHORT STROKE OVERLAY> +0047 0048 0335 ; [.12D2.0020.0008.0047] # <LATIN CAPITAL LETTER G, LATIN CAPITAL LETTER H, COMBINING SHORT STROKE OVERLAY> +0127 ; [.12EB.0020.0002.0127] # LATIN SMALL LETTER H WITH STROKE +0068 0335 ; [.12EB.0020.0002.0127] # LATIN SMALL LETTER H WITH STROKE +0126 ; [.12EB.0020.0008.0126] # LATIN CAPITAL LETTER H WITH STROKE +0048 0335 ; [.12EB.0020.0008.0126] # LATIN CAPITAL LETTER H WITH STROKE +017C ; [.14AC.0020.0002.017C] # LATIN SMALL LETTER Z WITH DOT ABOVE +007A 0307 ; [.14AC.0020.0002.017C] # LATIN SMALL LETTER Z WITH DOT ABOVE +017B ; [.14AC.0020.0008.017B] # LATIN CAPITAL LETTER Z WITH DOT ABOVE +005A 0307 ; [.14AC.0020.0008.017B] # LATIN CAPITAL LETTER Z WITH DOT ABOVE +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/nn.pl b/cpan/Unicode-Collate/Collate/Locale/nn.pl index 1c836f1711..6f6a286b08 100644 --- a/cpan/Unicode-Collate/Collate/Locale/nn.pl +++ b/cpan/Unicode-Collate/Collate/Locale/nn.pl @@ -12,6 +12,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0171 ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0075 030B ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0170 ; [.149C.0022.0008.0170] # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE @@ -27,6 +35,8 @@ 0061 0308 ; [.14AE.0021.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AE.0021.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AE.0021.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AE.0021.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 0119 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0065 0328 ; [.14AE.0022.0002.0119] # LATIN SMALL LETTER E WITH OGONEK 0118 ; [.14AE.0022.0008.0118] # LATIN CAPITAL LETTER E WITH OGONEK @@ -41,6 +51,8 @@ 006F 0308 ; [.14AF.0021.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14AF.0021.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14AF.0021.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14AF.0021.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 0151 ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 006F 030B ; [.14AF.0022.0002.0151] # LATIN SMALL LETTER O WITH DOUBLE ACUTE 0150 ; [.14AF.0022.0008.0150] # LATIN CAPITAL LETTER O WITH DOUBLE ACUTE diff --git a/cpan/Unicode-Collate/Collate/Locale/sk.pl b/cpan/Unicode-Collate/Collate/Locale/sk.pl index f248d1b20c..dc42f44acd 100644 --- a/cpan/Unicode-Collate/Collate/Locale/sk.pl +++ b/cpan/Unicode-Collate/Collate/Locale/sk.pl @@ -4,6 +4,8 @@ 0061 0308 ; [.1210.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.1210.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.1210.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.1210.0020.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.1210.0020.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 010D ; [.123E.0020.0002.010D] # LATIN SMALL LETTER C WITH CARON 0063 030C ; [.123E.0020.0002.010D] # LATIN SMALL LETTER C WITH CARON 010C ; [.123E.0020.0008.010C] # LATIN CAPITAL LETTER C WITH CARON diff --git a/cpan/Unicode-Collate/Collate/Locale/sv.pl b/cpan/Unicode-Collate/Collate/Locale/sv.pl index e8324d1a13..a039152cde 100644 --- a/cpan/Unicode-Collate/Collate/Locale/sv.pl +++ b/cpan/Unicode-Collate/Collate/Locale/sv.pl @@ -14,6 +14,14 @@ 0075 0308 ; [.149C.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS 00DC ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS 0055 0308 ; [.149C.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.149C.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.149C.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.149C.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.149C.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.149C.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.149C.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.149C.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.149C.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON 0171 ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0075 030B ; [.149C.0022.0002.0171] # LATIN SMALL LETTER U WITH DOUBLE ACUTE 0170 ; [.149C.0022.0008.0170] # LATIN CAPITAL LETTER U WITH DOUBLE ACUTE @@ -29,6 +37,8 @@ 0061 0308 ; [.14AF.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS 00C4 ; [.14AF.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS 0041 0308 ; [.14AF.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.14AF.0020.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.14AF.0020.0008.00C4][.0000.005B.0002.0304] # LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON 00E6 ; [.14AF.0021.0002.00E6] # LATIN SMALL LETTER AE 00C6 ; [.14AF.0021.0008.00C6] # LATIN CAPITAL LETTER AE 1D2D ; [.14AF.0021.0014.1D2D] # MODIFIER LETTER CAPITAL AE @@ -44,6 +54,8 @@ 006F 0308 ; [.14B0.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS 00D6 ; [.14B0.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS 004F 0308 ; [.14B0.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.14B0.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.14B0.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON 00F8 ; [.14B0.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 006F 0338 ; [.14B0.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE 00D8 ; [.14B0.0021.0008.00D8] # LATIN CAPITAL LETTER O WITH STROKE diff --git a/cpan/Unicode-Collate/Collate/Locale/tr.pl b/cpan/Unicode-Collate/Collate/Locale/tr.pl new file mode 100644 index 0000000000..250a0efcb5 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/tr.pl @@ -0,0 +1,45 @@ ++{ + entry => <<'ENTRY', # for DUCET v5.2.0 +00E7 ; [.123E.0020.0002.00E7] # LATIN SMALL LETTER C WITH CEDILLA +0063 0327 ; [.123E.0020.0002.00E7] # LATIN SMALL LETTER C WITH CEDILLA +00C7 ; [.123E.0020.0008.00C7] # LATIN CAPITAL LETTER C WITH CEDILLA +0043 0327 ; [.123E.0020.0008.00C7] # LATIN CAPITAL LETTER C WITH CEDILLA +011F ; [.12B1.0020.0002.011F] # LATIN SMALL LETTER G WITH BREVE +0067 0306 ; [.12B1.0020.0002.011F] # LATIN SMALL LETTER G WITH BREVE +011E ; [.12B1.0020.0008.011E] # LATIN CAPITAL LETTER G WITH BREVE +0047 0306 ; [.12B1.0020.0008.011E] # LATIN CAPITAL LETTER G WITH BREVE +0131 ; [.12EB.0020.0002.0131] # LATIN SMALL LETTER DOTLESS I +0049 ; [.12EB.0020.0008.0049] # LATIN CAPITAL LETTER I +00CC ; [.12EB.0020.0008.0049][.0000.0035.0002.0300] # LATIN CAPITAL LETTER I WITH GRAVE +00CD ; [.12EB.0020.0008.0049][.0000.0032.0002.0301] # LATIN CAPITAL LETTER I WITH ACUTE +00CE ; [.12EB.0020.0008.0049][.0000.003C.0002.0302] # LATIN CAPITAL LETTER I WITH CIRCUMFLEX +00CF ; [.12EB.0020.0008.0049][.0000.0047.0002.0308] # LATIN CAPITAL LETTER I WITH DIAERESIS +012A ; [.12EB.0020.0008.0049][.0000.005B.0002.0304] # LATIN CAPITAL LETTER I WITH MACRON +012C ; [.12EB.0020.0008.0049][.0000.0037.0002.0306] # LATIN CAPITAL LETTER I WITH BREVE +012E ; [.12EB.0020.0008.0049][.0000.0059.0002.0328] # LATIN CAPITAL LETTER I WITH OGONEK +0130 ; [.12EC.0020.0008.0130] # LATIN CAPITAL LETTER I WITH DOT ABOVE +0049 0307 ; [.12EC.0020.0008.0130] # LATIN CAPITAL LETTER I WITH DOT ABOVE +00F6 ; [.138F.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +006F 0308 ; [.138F.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +00D6 ; [.138F.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +004F 0308 ; [.138F.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.138F.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.138F.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON +015F ; [.1411.0020.0002.015F] # LATIN SMALL LETTER S WITH CEDILLA +0073 0327 ; [.1411.0020.0002.015F] # LATIN SMALL LETTER S WITH CEDILLA +015E ; [.1411.0020.0008.015E] # LATIN CAPITAL LETTER S WITH CEDILLA +0053 0327 ; [.1411.0020.0008.015E] # LATIN CAPITAL LETTER S WITH CEDILLA +00FC ; [.1454.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +0075 0308 ; [.1454.0020.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +00DC ; [.1454.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +0055 0308 ; [.1454.0020.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.1454.0020.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.1454.0020.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS AND GRAVE +01D8 ; [.1454.0020.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.1454.0020.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.1454.0020.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.1454.0020.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.1454.0020.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.1454.0020.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/wo.pl b/cpan/Unicode-Collate/Collate/Locale/wo.pl new file mode 100644 index 0000000000..941260cf7f --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/wo.pl @@ -0,0 +1,25 @@ ++{ +# eng doesn't require tailoring + entry => <<'ENTRY', # for DUCET v5.2.0 +00E0 ; [.1210.0020.0002.00E0] # LATIN SMALL LETTER A WITH GRAVE +0061 0300 ; [.1210.0020.0002.00E0] # LATIN SMALL LETTER A WITH GRAVE +00C0 ; [.1210.0020.0008.00C0] # LATIN CAPITAL LETTER A WITH GRAVE +0041 0300 ; [.1210.0020.0008.00C0] # LATIN CAPITAL LETTER A WITH GRAVE +00E9 ; [.126C.0020.0002.00E9] # LATIN SMALL LETTER E WITH ACUTE +0065 0301 ; [.126C.0020.0002.00E9] # LATIN SMALL LETTER E WITH ACUTE +00C9 ; [.126C.0020.0008.00C9] # LATIN CAPITAL LETTER E WITH ACUTE +0045 0301 ; [.126C.0020.0008.00C9] # LATIN CAPITAL LETTER E WITH ACUTE +00EB ; [.126D.0020.0002.00EB] # LATIN SMALL LETTER E WITH DIAERESIS +0065 0308 ; [.126D.0020.0002.00EB] # LATIN SMALL LETTER E WITH DIAERESIS +00CB ; [.126D.0020.0008.00CB] # LATIN CAPITAL LETTER E WITH DIAERESIS +0045 0308 ; [.126D.0020.0008.00CB] # LATIN CAPITAL LETTER E WITH DIAERESIS +00F1 ; [.136E.0020.0002.00F1] # LATIN SMALL LETTER N WITH TILDE +006E 0303 ; [.136E.0020.0002.00F1] # LATIN SMALL LETTER N WITH TILDE +00D1 ; [.136E.0020.0008.00D1] # LATIN CAPITAL LETTER N WITH TILDE +004E 0303 ; [.136E.0020.0008.00D1] # LATIN CAPITAL LETTER N WITH TILDE +00F3 ; [.138F.0020.0002.00F3] # LATIN SMALL LETTER O WITH ACUTE +006F 0301 ; [.138F.0020.0002.00F3] # LATIN SMALL LETTER O WITH ACUTE +00D3 ; [.138F.0020.0008.00D3] # LATIN CAPITAL LETTER O WITH ACUTE +004F 0301 ; [.138F.0020.0008.00D3] # LATIN CAPITAL LETTER O WITH ACUTE +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/yo.pl b/cpan/Unicode-Collate/Collate/Locale/yo.pl new file mode 100644 index 0000000000..884d83fb7c --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/yo.pl @@ -0,0 +1,19 @@ ++{ + entry => <<'ENTRY', # for DUCET v5.2.0 +1EB9 ; [.126C.0020.0002.1EB9] # LATIN SMALL LETTER E WITH DOT BELOW +0065 0323 ; [.126C.0020.0002.1EB9] # LATIN SMALL LETTER E WITH DOT BELOW +1EB8 ; [.126C.0020.0008.1EB8] # LATIN CAPITAL LETTER E WITH DOT BELOW +0045 0323 ; [.126C.0020.0008.1EB8] # LATIN CAPITAL LETTER E WITH DOT BELOW +0067 0062 ; [.12B1.0020.0002.0067] # <LATIN SMALL LETTER G, LATIN SMALL LETTER B> +0047 0062 ; [.12B1.0020.0007.0047] # <LATIN CAPITAL LETTER G, LATIN SMALL LETTER B> +0047 0042 ; [.12B1.0020.0008.0047] # <LATIN CAPITAL LETTER G, LATIN CAPITAL LETTER B> +1ECD ; [.138F.0020.0002.1ECD] # LATIN SMALL LETTER O WITH DOT BELOW +006F 0323 ; [.138F.0020.0002.1ECD] # LATIN SMALL LETTER O WITH DOT BELOW +1ECC ; [.138F.0020.0008.1ECC] # LATIN CAPITAL LETTER O WITH DOT BELOW +004F 0323 ; [.138F.0020.0008.1ECC] # LATIN CAPITAL LETTER O WITH DOT BELOW +1E63 ; [.1411.0020.0002.1E63] # LATIN SMALL LETTER S WITH DOT BELOW +0073 0323 ; [.1411.0020.0002.1E63] # LATIN SMALL LETTER S WITH DOT BELOW +1E62 ; [.1411.0020.0008.1E62] # LATIN CAPITAL LETTER S WITH DOT BELOW +0053 0323 ; [.1411.0020.0008.1E62] # LATIN CAPITAL LETTER S WITH DOT BELOW +ENTRY +}; |