diff options
author | Chris 'BinGOs' Williams <chris@bingosnet.co.uk> | 2011-10-02 19:36:35 +0100 |
---|---|---|
committer | Chris 'BinGOs' Williams <chris@bingosnet.co.uk> | 2011-10-02 19:36:35 +0100 |
commit | bd65daabad8a8b02a5d670456ceb2ca31f9d26cd (patch) | |
tree | 6d30b6e06e393e3fd587c55c259aea45a77cf631 /cpan/Unicode-Collate/Collate | |
parent | a2fa999d41c94d622051667d897fedca90be1828 (diff) | |
download | perl-bd65daabad8a8b02a5d670456ceb2ca31f9d26cd.tar.gz |
Update Unicode-Collate to CPAN version 0.79
[DELTA]
0.79 Sun Oct 2 20:31:01 2011
- pod: [rt.cpan.org #70241] Fix minor grammar error in manpage
by Harlan Lieberman-Berg.
- 'suppress' no longer affects contractions via 'entry'.
- U::C::Locale newly supports locales: as, fi__phonebook, gu.
- added loc_as.t, loc_fiph.t, loc_gu.t in t.
- updated some locales to CLDR 2.0 : ar, be, bg.
Diffstat (limited to 'cpan/Unicode-Collate/Collate')
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale.pm | 83 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/ar.pl | 13 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/as.pl | 9 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/be.pl | 42 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/bg.pl | 44 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/fi_phone.pl | 61 | ||||
-rw-r--r-- | cpan/Unicode-Collate/Collate/Locale/gu.pl | 7 |
7 files changed, 249 insertions, 10 deletions
diff --git a/cpan/Unicode-Collate/Collate/Locale.pm b/cpan/Unicode-Collate/Collate/Locale.pm index 749c64c23b..92bdf249cb 100644 --- a/cpan/Unicode-Collate/Collate/Locale.pm +++ b/cpan/Unicode-Collate/Collate/Locale.pm @@ -4,7 +4,7 @@ use strict; use Carp; use base qw(Unicode::Collate); -our $VERSION = '0.76'; +our $VERSION = '0.79'; use File::Spec; @@ -12,15 +12,14 @@ use File::Spec; my $PL_EXT = '.pl'; my %LocaleFile = map { ($_, $_) } qw( - af ar az ca cs cy da eo es et fi fil fo fr ha haw - hr hu hy ig is ja kk kl ko lt lv mt nb nn nso om pl ro ru - se sk sl sq sv tn to tr uk vi wo yo zh + af ar as az be bg ca cs cy da eo es et fi fil fo fr gu + ha haw hr hu hy ig is ja kk kl ko lt lv mt nb nn nso om + pl ro ru se sk sl sq sv tn to tr uk vi wo yo zh ); $LocaleFile{'default'} = ''; $LocaleFile{'de__phonebook'} = 'de_phone'; $LocaleFile{'es__traditional'} = 'es_trad'; - $LocaleFile{'be'} = 'ru'; - $LocaleFile{'bg'} = 'ru'; + $LocaleFile{'fi__phonebook'} = 'fi_phone'; $LocaleFile{'mk'} = 'ru'; $LocaleFile{'sr'} = 'ru'; $LocaleFile{'zh__big5han'} = 'zh_big5'; @@ -84,6 +83,73 @@ sub new { 1; __END__ +MEMORANDA for developing + +locale based CLDR +---------------------------------------------------------------------------- +af 2.0 = 1.8.1 +ar 2.0 +as 2.0 = 1.8.1 +az 2.0 = 1.8.1 +be 2.0 +bg 2.0 +ca 2.0 = 1.8.1 (alt="proposed" type="standard") +cs 2.0 = 1.8.1 (type="standard") +cy 2.0 = 1.8.1 +da 2.0 = 1.8.1 (type="standard") [AA's to pass CLDR tests] +de__phonebook 2.0 (type="phonebook") +eo 2.0 = 1.8.1 +es 2.0 (type="standard") +es__traditional 2.0 = 1.8.1 (type="traditional") +et 2.0 = 1.8.1 +fi 2.0 = 1.8.1 (type="standard" alt="proposed") +fi__phonebook 2.0 = 1.8.1 (type="phonebook") +fil 2.0 (type="standard") = 1.8.1 +fo 2.0 = 1.8.1 (alt="proposed" type="standard") +fr 2.0 (fr_CA, backwards="on") +gu 2.0 (type="standard") +ha +haw +hr +hu +hy +ig +is +ja +kk +kl +ko +lt +lv +mk +mt +nb +nn +nso +om +pl +ro +ru +se +sk +sl +sq +sr +sv +tn +to +tr +uk +vi +wo +yo 
+zh +zh__big5han +zh__gb2312han +zh__pinyin +zh__stroke +---------------------------------------------------------------------------- + =head1 NAME Unicode::Collate::Locale - Linguistic tailoring for DUCET via Unicode::Collate @@ -190,6 +256,7 @@ this method returns a string C<'default'> meaning no special tailoring. ---------------------------------------------------------- af Afrikaans ar Arabic + as Assamese az Azerbaijani (Azeri) be Belarusian bg Bulgarian @@ -202,10 +269,12 @@ this method returns a string C<'default'> meaning no special tailoring. es Spanish es__traditional Spanish ('ch' and 'll' as a grapheme) et Estonian - fi Finnish + fi Finnish (v and w are primary equal) + fi__phonebook Finnish (v and w as separate characters) fil Filipino fo Faroese fr French + gu Gujarati ha Hausa haw Hawaiian hr Croatian diff --git a/cpan/Unicode-Collate/Collate/Locale/ar.pl b/cpan/Unicode-Collate/Collate/Locale/ar.pl index 516e02dfd2..bd71ba234c 100644 --- a/cpan/Unicode-Collate/Collate/Locale/ar.pl +++ b/cpan/Unicode-Collate/Collate/Locale/ar.pl @@ -1,7 +1,14 @@ +{ entry => <<'ENTRY', # for DUCET v6.0.0 -0629 ; [.1C54.0020.0002.062A] # ARABIC LETTER TEH MARBUTA -FE93 ; [.1C54.0020.0002.062A] # ARABIC LETTER TEH MARBUTA ISOLATED FORM -FE94 ; [.1C54.0020.0002.062A] # ARABIC LETTER TEH MARBUTA FINAL FORM +0629 ; [.1C54.0021.0002.0629] # ARABIC LETTER TEH MARBUTA +FE94 ; [.1C54.0021.0019.FE94] # ARABIC LETTER TEH MARBUTA FINAL FORM +FE93 ; [.1C54.0021.001A.FE93] # ARABIC LETTER TEH MARBUTA ISOLATED FORM +0649 ; [.1CE9.0021.0002.0649] # ARABIC LETTER ALEF MAKSURA +FBE8 ; [.1CE9.0021.0017.FBE8] # ARABIC LETTER UIGHUR KAZAKH KIRGHIZ ALEF MAKSURA INITIAL FORM +FBE9 ; [.1CE9.0021.0018.FBE9] # ARABIC LETTER UIGHUR KAZAKH KIRGHIZ ALEF MAKSURA MEDIAL FORM +FEF0 ; [.1CE9.0021.0019.FEF0] # ARABIC LETTER ALEF MAKSURA FINAL FORM +FEEF ; [.1CE9.0021.001A.FEEF] # ARABIC LETTER ALEF MAKSURA ISOLATED FORM +FC90 ; [.1CE9.0021.001B.FC90] # ARABIC LIGATURE ALEF MAKSURA WITH SUPERSCRIPT 
ALEF FINAL FORM +FC5D ; [.1CE9.0021.001C.FC5D] # ARABIC LIGATURE ALEF MAKSURA WITH SUPERSCRIPT ALEF ISOLATED FORM ENTRY }; diff --git a/cpan/Unicode-Collate/Collate/Locale/as.pl b/cpan/Unicode-Collate/Collate/Locale/as.pl new file mode 100644 index 0000000000..b9a51de160 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/as.pl @@ -0,0 +1,9 @@ ++{ + entry => <<'ENTRY', # for DUCET v6.0.0 +0982 ; [.1FE8.0020.0002.0982][.FFF1.0000.0000.0000] # BENGALI SIGN ANUSVARA +0981 ; [.1FE8.0020.0002.0981][.FFF2.0000.0000.0000] # BENGALI SIGN CANDRABINDU +0983 ; [.1FE8.0020.0002.0983][.FFF3.0000.0000.0000] # BENGALI SIGN VISARGA +09A4 09CD 200D ; [.1FF7.0020.0002.09A4][.FFF1.0000.0000.0000] # <BENGALI LETTER TA, BENGALI SIGN VIRAMA, ZERO WIDTH JOINER> +0995 09CD 09B7 ; [.200A.0020.0002.0995][.FFF1.0000.0000.0000] # <BENGALI LETTER KA, BENGALI SIGN VIRAMA, BENGALI LETTER SSA> +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/be.pl b/cpan/Unicode-Collate/Collate/Locale/be.pl new file mode 100644 index 0000000000..3e7684f900 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/be.pl @@ -0,0 +1,42 @@ ++{ + suppress => [0x0410, 0x0430, 0x04D8, 0x04D9, 0x0413, 0x0433, 0x0415, 0x0435, + 0x0416, 0x0436, 0x0417, 0x0437, 0x0406, 0x0456, 0x041E, 0x043E, + 0x04E8, 0x04E9, 0x041A, 0x043A, 0x0427, 0x0447, 0x042B, 0x044B, + 0x042D, 0x044D, 0x0474, 0x0475], + entry => <<'ENTRY', # for DUCET v6.0.0 +0451 ; [.198C.0020.0002.0451] # CYRILLIC SMALL LETTER IO +0435 0308 ; [.198C.0020.0002.0451] # CYRILLIC SMALL LETTER IO +0401 ; [.198C.0020.0008.0401] # CYRILLIC CAPITAL LETTER IO +0415 0308 ; [.198C.0020.0008.0401] # CYRILLIC CAPITAL LETTER IO +04D1 ; [.1943.0020.0002.0430][.0000.0037.0002.0306] # CYRILLIC SMALL LETTER A WITH BREVE +04D0 ; [.1943.0020.0008.0410][.0000.0037.0002.0306] # CYRILLIC CAPITAL LETTER A WITH BREVE +04D3 ; [.1943.0020.0002.0430][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER A WITH DIAERESIS +04D2 ; [.1943.0020.0008.0410][.0000.0047.0002.0308] # CYRILLIC 
CAPITAL LETTER A WITH DIAERESIS +04DB ; [.194F.0020.0002.04D9][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER SCHWA WITH DIAERESIS +04DA ; [.194F.0020.0008.04D8][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER SCHWA WITH DIAERESIS +0453 ; [.1963.0020.0002.0433][.0000.0032.0002.0301] # CYRILLIC SMALL LETTER GJE +0403 ; [.1963.0020.0008.0413][.0000.0032.0002.0301] # CYRILLIC CAPITAL LETTER GJE +04D7 ; [.198B.0020.0002.0435][.0000.0037.0002.0306] # CYRILLIC SMALL LETTER IE WITH BREVE +04D6 ; [.198B.0020.0008.0415][.0000.0037.0002.0306] # CYRILLIC CAPITAL LETTER IE WITH BREVE +04DD ; [.1997.0020.0002.0436][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER ZHE WITH DIAERESIS +04DC ; [.1997.0020.0008.0416][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER ZHE WITH DIAERESIS +04DF ; [.19A4.0020.0002.0437][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER ZE WITH DIAERESIS +04DE ; [.19A4.0020.0008.0417][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER ZE WITH DIAERESIS +0457 ; [.19C8.0020.0002.0456][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER YI +0407 ; [.19C8.0020.0008.0406][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER YI +04E7 ; [.1A29.0020.0002.043E][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER O WITH DIAERESIS +04E6 ; [.1A29.0020.0008.041E][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER O WITH DIAERESIS +04EB ; [.1A31.0020.0002.04E9][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER BARRED O WITH DIAERESIS +04EA ; [.1A31.0020.0008.04E8][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER BARRED O WITH DIAERESIS +045C ; [.19DA.0020.0002.043A][.0000.0032.0002.0301] # CYRILLIC SMALL LETTER KJE +040C ; [.19DA.0020.0008.041A][.0000.0032.0002.0301] # CYRILLIC CAPITAL LETTER KJE +04F5 ; [.1ABE.0020.0002.0447][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER CHE WITH DIAERESIS +04F4 ; [.1ABE.0020.0008.0427][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER CHE WITH DIAERESIS +04F9 ; [.1AF1.0020.0002.044B][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER YERU WITH DIAERESIS +04F8 ; 
[.1AF1.0020.0008.042B][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER YERU WITH DIAERESIS +04ED ; [.1B06.0020.0002.044D][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER E WITH DIAERESIS +04EC ; [.1B06.0020.0008.042D][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER E WITH DIAERESIS +0477 ; [.1B3C.0020.0002.0475][.0000.0065.0002.030F] # CYRILLIC SMALL LETTER IZHITSA WITH DOUBLE GRAVE ACCENT +0476 ; [.1B3C.0020.0008.0474][.0000.0065.0002.030F] # CYRILLIC CAPITAL LETTER IZHITSA WITH DOUBLE GRAVE ACCENT +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/bg.pl b/cpan/Unicode-Collate/Collate/Locale/bg.pl new file mode 100644 index 0000000000..8b4c808371 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/bg.pl @@ -0,0 +1,44 @@ ++{ + suppress => [0x0410, 0x0430, 0x04D8, 0x04D9, 0x0413, 0x0433, 0x0415, 0x0435, + 0x0416, 0x0436, 0x0417, 0x0437, 0x0406, 0x0456, 0x041E, 0x043E, + 0x04E8, 0x04E9, 0x041A, 0x043A, 0x0423, 0x0443, 0x0427, 0x0447, + 0x042B, 0x044B, 0x042D, 0x044D, 0x0474, 0x0475], + entry => <<'ENTRY', # for DUCET v6.0.0 +04D1 ; [.1943.0020.0002.0430][.0000.0037.0002.0306] # CYRILLIC SMALL LETTER A WITH BREVE +04D0 ; [.1943.0020.0008.0410][.0000.0037.0002.0306] # CYRILLIC CAPITAL LETTER A WITH BREVE +04D3 ; [.1943.0020.0002.0430][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER A WITH DIAERESIS +04D2 ; [.1943.0020.0008.0410][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER A WITH DIAERESIS +04DB ; [.194F.0020.0002.04D9][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER SCHWA WITH DIAERESIS +04DA ; [.194F.0020.0008.04D8][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER SCHWA WITH DIAERESIS +0453 ; [.1963.0020.0002.0433][.0000.0032.0002.0301] # CYRILLIC SMALL LETTER GJE +0403 ; [.1963.0020.0008.0413][.0000.0032.0002.0301] # CYRILLIC CAPITAL LETTER GJE +04D7 ; [.198B.0020.0002.0435][.0000.0037.0002.0306] # CYRILLIC SMALL LETTER IE WITH BREVE +04D6 ; [.198B.0020.0008.0415][.0000.0037.0002.0306] # CYRILLIC CAPITAL LETTER IE WITH BREVE +04DD ; 
[.1997.0020.0002.0436][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER ZHE WITH DIAERESIS +04DC ; [.1997.0020.0008.0416][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER ZHE WITH DIAERESIS +04DF ; [.19A4.0020.0002.0437][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER ZE WITH DIAERESIS +04DE ; [.19A4.0020.0008.0417][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER ZE WITH DIAERESIS +0457 ; [.19C8.0020.0002.0456][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER YI +0407 ; [.19C8.0020.0008.0406][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER YI +04E7 ; [.1A29.0020.0002.043E][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER O WITH DIAERESIS +04E6 ; [.1A29.0020.0008.041E][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER O WITH DIAERESIS +04EB ; [.1A31.0020.0002.04E9][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER BARRED O WITH DIAERESIS +04EA ; [.1A31.0020.0008.04E8][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER BARRED O WITH DIAERESIS +045C ; [.19DA.0020.0002.043A][.0000.0032.0002.0301] # CYRILLIC SMALL LETTER KJE +040C ; [.19DA.0020.0008.041A][.0000.0032.0002.0301] # CYRILLIC CAPITAL LETTER KJE +045E ; [.1A6B.0020.0002.0443][.0000.0037.0002.0306] # CYRILLIC SMALL LETTER SHORT U +040E ; [.1A6B.0020.0008.0423][.0000.0037.0002.0306] # CYRILLIC CAPITAL LETTER SHORT U +04F1 ; [.1A6B.0020.0002.0443][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER U WITH DIAERESIS +04F0 ; [.1A6B.0020.0008.0423][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER U WITH DIAERESIS +04F3 ; [.1A6B.0020.0002.0443][.0000.004D.0002.030B] # CYRILLIC SMALL LETTER U WITH DOUBLE ACUTE +04F2 ; [.1A6B.0020.0008.0423][.0000.004D.0002.030B] # CYRILLIC CAPITAL LETTER U WITH DOUBLE ACUTE +04F5 ; [.1ABE.0020.0002.0447][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER CHE WITH DIAERESIS +04F4 ; [.1ABE.0020.0008.0427][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER CHE WITH DIAERESIS +04F9 ; [.1AF1.0020.0002.044B][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER YERU WITH DIAERESIS +04F8 ; [.1AF1.0020.0008.042B][.0000.0047.0002.0308] 
# CYRILLIC CAPITAL LETTER YERU WITH DIAERESIS +04ED ; [.1B06.0020.0002.044D][.0000.0047.0002.0308] # CYRILLIC SMALL LETTER E WITH DIAERESIS +04EC ; [.1B06.0020.0008.042D][.0000.0047.0002.0308] # CYRILLIC CAPITAL LETTER E WITH DIAERESIS +0477 ; [.1B3C.0020.0002.0475][.0000.0065.0002.030F] # CYRILLIC SMALL LETTER IZHITSA WITH DOUBLE GRAVE ACCENT +0476 ; [.1B3C.0020.0008.0474][.0000.0065.0002.030F] # CYRILLIC CAPITAL LETTER IZHITSA WITH DOUBLE GRAVE ACCENT +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/fi_phone.pl b/cpan/Unicode-Collate/Collate/Locale/fi_phone.pl new file mode 100644 index 0000000000..850ddd7f48 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/fi_phone.pl @@ -0,0 +1,61 @@ ++{ +# in cldr test/fi.xml why x{110}x < xdx though xd < x{110} ? + entry => <<'ENTRY', # for DUCET v6.0.0 +0111 ; [.15E4.0021.0002.0111][.0000.007D.0002.0335] # LATIN SMALL LETTER D WITH STROKE +0110 ; [.15E4.0021.0008.0110][.0000.007D.0002.0335] # LATIN CAPITAL LETTER D WITH STROKE +01E5 ; [.1644.0021.0002.01E5][.0000.007D.0002.0335] # LATIN SMALL LETTER G WITH STROKE +01E4 ; [.1644.0021.0008.01E4][.0000.007D.0002.0335] # LATIN CAPITAL LETTER G WITH STROKE +014B ; [.1702.0021.0002.014B][.0000.007D.0002.0335] # LATIN SMALL LETTER ENG +014A ; [.1702.0021.0008.014A][.0000.007D.0002.0335] # LATIN CAPITAL LETTER ENG +0167 ; [.17C9.0021.0002.0167][.0000.007D.0002.0335] # LATIN SMALL LETTER T WITH STROKE +0166 ; [.17C9.0021.0008.0166][.0000.007D.0002.0335] # LATIN CAPITAL LETTER T WITH STROKE +00FC ; [.1833.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +0075 0308 ; [.1833.0021.0002.00FC] # LATIN SMALL LETTER U WITH DIAERESIS +00DC ; [.1833.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +0055 0308 ; [.1833.0021.0008.00DC] # LATIN CAPITAL LETTER U WITH DIAERESIS +01DC ; [.1833.0021.0002.00FC][.0000.0035.0002.0300] # LATIN SMALL LETTER U WITH DIAERESIS AND GRAVE +01DB ; [.1833.0021.0008.00DC][.0000.0035.0002.0300] # LATIN CAPITAL LETTER U WITH DIAERESIS 
AND GRAVE +01D8 ; [.1833.0021.0002.00FC][.0000.0032.0002.0301] # LATIN SMALL LETTER U WITH DIAERESIS AND ACUTE +01D7 ; [.1833.0021.0008.00DC][.0000.0032.0002.0301] # LATIN CAPITAL LETTER U WITH DIAERESIS AND ACUTE +01D6 ; [.1833.0021.0002.00FC][.0000.005B.0002.0304] # LATIN SMALL LETTER U WITH DIAERESIS AND MACRON +01D5 ; [.1833.0021.0008.00DC][.0000.005B.0002.0304] # LATIN CAPITAL LETTER U WITH DIAERESIS AND MACRON +01DA ; [.1833.0021.0002.00FC][.0000.0041.0002.030C] # LATIN SMALL LETTER U WITH DIAERESIS AND CARON +01D9 ; [.1833.0021.0008.00DC][.0000.0041.0002.030C] # LATIN CAPITAL LETTER U WITH DIAERESIS AND CARON +0292 ; [.1844.0021.0002.0292][.0000.007D.0002.0335] # LATIN SMALL LETTER EZH +01B7 ; [.1844.0021.0008.01B7][.0000.007D.0002.0335] # LATIN CAPITAL LETTER EZH +01EF ; [.1844.0021.0002.0292][.0000.007D.0002.0335][.0000.0041.0002.030C] # LATIN SMALL LETTER EZH WITH CARON +01EE ; [.1844.0021.0008.01B7][.0000.007D.0002.0335][.0000.0041.0002.030C] # LATIN CAPITAL LETTER EZH WITH CARON +00E5 ; [.18B9.0020.0002.00E5] # LATIN SMALL LETTER A WITH RING ABOVE +0061 030A ; [.18B9.0020.0002.00E5] # LATIN SMALL LETTER A WITH RING ABOVE +00C5 ; [.18B9.0020.0008.00C5] # LATIN CAPITAL LETTER A WITH RING ABOVE +0041 030A ; [.18B9.0020.0008.00C5] # LATIN CAPITAL LETTER A WITH RING ABOVE +212B ; [.18B9.0020.0008.00C5] # ANGSTROM SIGN +01FB ; [.18B9.0020.0002.00E5][.0000.0032.0002.0301] # LATIN SMALL LETTER A WITH RING ABOVE AND ACUTE +01FA ; [.18B9.0020.0008.00C5][.0000.0032.0002.0301] # LATIN CAPITAL LETTER A WITH RING ABOVE AND ACUTE +00E4 ; [.18BA.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS +0061 0308 ; [.18BA.0020.0002.00E4] # LATIN SMALL LETTER A WITH DIAERESIS +00C4 ; [.18BA.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +0041 0308 ; [.18BA.0020.0008.00C4] # LATIN CAPITAL LETTER A WITH DIAERESIS +01DF ; [.18BA.0020.0002.00E4][.0000.005B.0002.0304] # LATIN SMALL LETTER A WITH DIAERESIS AND MACRON +01DE ; [.18BA.0020.0008.00C4][.0000.005B.0002.0304] # 
LATIN CAPITAL LETTER A WITH DIAERESIS AND MACRON +00E6 ; [.18BA.0021.0002.00E6] # LATIN SMALL LETTER AE +00C6 ; [.18BA.0021.0008.00C6] # LATIN CAPITAL LETTER AE +1D2D ; [.18BA.0021.0014.1D2D] # MODIFIER LETTER CAPITAL AE +01FD ; [.18BA.0021.0002.00E6][.0000.0032.0002.0301] # LATIN SMALL LETTER AE WITH ACUTE +01FC ; [.18BA.0021.0008.00C6][.0000.0032.0002.0301] # LATIN CAPITAL LETTER AE WITH ACUTE +01E3 ; [.18BA.0021.0002.00E6][.0000.005B.0002.0304] # LATIN SMALL LETTER AE WITH MACRON +01E2 ; [.18BA.0021.0008.00C6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER AE WITH MACRON +00F6 ; [.18BB.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +006F 0308 ; [.18BB.0020.0002.00F6] # LATIN SMALL LETTER O WITH DIAERESIS +00D6 ; [.18BB.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +004F 0308 ; [.18BB.0020.0008.00D6] # LATIN CAPITAL LETTER O WITH DIAERESIS +022B ; [.18BB.0020.0002.00F6][.0000.005B.0002.0304] # LATIN SMALL LETTER O WITH DIAERESIS AND MACRON +022A ; [.18BB.0020.0008.00D6][.0000.005B.0002.0304] # LATIN CAPITAL LETTER O WITH DIAERESIS AND MACRON +00F8 ; [.18BB.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE +006F 0338 ; [.18BB.0021.0002.00F8] # LATIN SMALL LETTER O WITH STROKE +00D8 ; [.18BB.0021.0008.00D8] # LATIN CAPITAL LETTER O WITH STROKE +004F 0338 ; [.18BB.0021.0008.00D8] # LATIN CAPITAL LETTER O WITH STROKE +01FF ; [.18BB.0021.0002.00F8][.0000.0032.0002.0301] # LATIN SMALL LETTER O WITH STROKE AND ACUTE +01FE ; [.18BB.0021.0008.00D8][.0000.0032.0002.0301] # LATIN CAPITAL LETTER O WITH STROKE AND ACUTE +ENTRY +}; diff --git a/cpan/Unicode-Collate/Collate/Locale/gu.pl b/cpan/Unicode-Collate/Collate/Locale/gu.pl new file mode 100644 index 0000000000..0f630c8336 --- /dev/null +++ b/cpan/Unicode-Collate/Collate/Locale/gu.pl @@ -0,0 +1,7 @@ ++{ + entry => <<'ENTRY', # for DUCET v6.0.0 +0A82 ; [.2054.0020.0002.0A82][.FFF1.0000.0000.0000] # GUJARATI SIGN ANUSVARA +0A81 ; [.2054.0021.0002.0A81][.FFF1.0000.0000.0A81] # GUJARATI SIGN CANDRABINDU +0A83 
; [.2054.0020.0002.0A83][.FFF2.0000.0000.0000] # GUJARATI SIGN VISARGA +ENTRY +}; |