summaryrefslogtreecommitdiff
path: root/lib/Search/Dict.pm
diff options
context:
space:
mode:
Diffstat (limited to 'lib/Search/Dict.pm')
-rw-r--r--lib/Search/Dict.pm52
1 files changed, 52 insertions, 0 deletions
diff --git a/lib/Search/Dict.pm b/lib/Search/Dict.pm
new file mode 100644
index 0000000000..10aa4ff583
--- /dev/null
+++ b/lib/Search/Dict.pm
@@ -0,0 +1,52 @@
+package Search::Dict;
+require 5.000;
+require Exporter;
+
+@ISA = qw(Exporter);
+@EXPORT = qw(look);
+
+# Usage: look(*FILEHANDLE,$key,$dict,$fold)
+
+# Sets file position in FILEHANDLE to be first line greater than or equal
+# (stringwise) to $key. Pass flags for dictionary order and case folding.
+
+sub look {
+ local(*FH,$key,$dict,$fold) = @_;
+ local($max,$min,$mid,$_);
+ local($dev,$ino,$mode,$nlink,$uid,$gid,$rdev,$size,$atime,$mtime,$ctime,
+ $blksize,$blocks) = stat(FH);
+ $blksize = 8192 unless $blksize;
+ $key =~ s/[^\w\s]//g if $dict;
+ $key =~ tr/A-Z/a-z/ if $fold;
+ $max = int($size / $blksize);
+ while ($max - $min > 1) {
+ $mid = int(($max + $min) / 2);
+ seek(FH,$mid * $blksize,0);
+ $_ = <FH> if $mid; # probably a partial line
+ $_ = <FH>;
+ chop;
+ s/[^\w\s]//g if $dict;
+ tr/A-Z/a-z/ if $fold;
+ if ($_ lt $key) {
+ $min = $mid;
+ }
+ else {
+ $max = $mid;
+ }
+ }
+ $min *= $blksize;
+ seek(FH,$min,0);
+ <FH> if $min;
+ while (<FH>) {
+ chop;
+ s/[^\w\s]//g if $dict;
+ y/A-Z/a-z/ if $fold;
+ last if $_ ge $key;
+ $min = tell(FH);
+ }
+ seek(FH,$min,0);
+ $min;
+}
+
+1;
+