UCD.pm: Don't use NamedSequences.txt, saves disk

This changes UCD to not use this file. Instead it takes advantage of the recent addition of named sequences being accessible through the \N{} construct. In one case where it returns a hash of all the named sequences, it uses the same .pl file that \N{} does. My guess is that this routine's usefulness is now past, as named sequences are now incorporated into the core.
author: Karl Williamson <public@khwilliamson.com> 2010-11-19 11:59:05 -0700
committer: Father Chrysostomos <sprout@cpan.org> 2010-11-20 18:15:14 -0800
commit: 98ef7649bc2d994db925c45a7d2fdce7dff098b3 (patch)
tree: 3a64d9622b37c8a89ce0c0b41586e109bede8565 /lib/Unicode
parent: afdbe55d0c4f11409419f813c4360c8ab300a779 (diff)
download: perl-98ef7649bc2d994db925c45a7d2fdce7dff098b3.tar.gz
1 files changed, 22 insertions, 8 deletions
diff --git a/lib/Unicode/UCD.pm b/lib/Unicode/UCD.pm
index 2c1f0e55c1..eb4de2882d 100644
--- a/lib/Unicode/UCD.pm
+++ b/lib/Unicode/UCD.pm
@@ -2,6 +2,7 @@ package Unicode::UCD;
 
 use strict;
 use warnings;
+use charnames ();
 
 our $VERSION = '0.29';
 
@@ -1129,13 +1130,14 @@ my %NAMEDSEQ;
 
 sub _namedseq {
     unless (%NAMEDSEQ) {
-	if (openunicode(\$NAMEDSEQFH, "NamedSequences.txt")) {
+	if (openunicode(\$NAMEDSEQFH, "Name.pl")) {
 	    local $_;
 	    while (<$NAMEDSEQFH>) {
-		if (/^(.+)\s*;\s*([0-9A-F]+(?: [0-9A-F]+)*)$/) {
-		    my ($n, $s) = ($1, $2);
-		    my @s = map { chr(hex($_)) } split(' ', $s);
-		    $NAMEDSEQ{$n} = join("", @s);
+		if (/^ [0-9A-F]+ \  /x) {
+                    chomp;
+                    my ($sequence, $name) = split /\t/;
+		    my @s = map { chr(hex($_)) } split(' ', $sequence);
+		    $NAMEDSEQ{$name} = join("", @s);
 		}
 	    }
 	    close($NAMEDSEQFH);
@@ -1144,18 +1146,30 @@ sub _namedseq {
 }
 
 sub namedseq {
-    _namedseq() unless %NAMEDSEQ;
+
+    # Use charnames::string_vianame() which now returns this information,
+    # unless the caller wants the hash returned, in which case we read it in,
+    # and thereafter use it instead of calling charnames, as it is faster.
+
     my $wantarray = wantarray();
     if (defined $wantarray) {
 	if ($wantarray) {
 	    if (@_ == 0) {
+                _namedseq() unless %NAMEDSEQ;
 		return %NAMEDSEQ;
 	    } elsif (@_ == 1) {
-		my $s = $NAMEDSEQ{ $_[0] };
+		my $s;
+                if (%NAMEDSEQ) {
+                    $s = $NAMEDSEQ{ $_[0] };
+                }
+                else {
+                    $s = charnames::string_vianame($_[0]);
+                }
 		return defined $s ? map { ord($_) } split('', $s) : ();
 	    }
 	} elsif (@_ == 1) {
-	    return $NAMEDSEQ{ $_[0] };
+            return $NAMEDSEQ{ $_[0] } if %NAMEDSEQ;
+            return charnames::string_vianame($_[0]);
 	}
     }
     return;
author	Karl Williamson <public@khwilliamson.com>	2010-11-19 11:59:05 -0700
committer	Father Chrysostomos <sprout@cpan.org>	2010-11-20 18:15:14 -0800
commit	98ef7649bc2d994db925c45a7d2fdce7dff098b3 (patch)
tree	3a64d9622b37c8a89ce0c0b41586e109bede8565 /lib/Unicode
parent	afdbe55d0c4f11409419f813c4360c8ab300a779 (diff)
download	perl-98ef7649bc2d994db925c45a7d2fdce7dff098b3.tar.gz