X-Git-Url: http://www.dxcluster.org/gitweb/gitweb.cgi?a=blobdiff_plain;f=perl%2FBadWords.pm;h=e7d1169e3a390abd5845f5922bb299eaa79cefdc;hb=17f0b57add792391822d38116e89b33c1df4e2dd;hp=2336bb0468e22b1b95e3b517f5750c6397dd9fc2;hpb=428e91daacae4fddcabc7e6279c1fbd40edbbe91;p=spider.git diff --git a/perl/BadWords.pm b/perl/BadWords.pm index 2336bb04..e7d1169e 100644 --- a/perl/BadWords.pm +++ b/perl/BadWords.pm @@ -12,12 +12,13 @@ use strict; use DXUtil; use DXVars; +use DXHash; use IO::File; -use vars qw(%badwords $fn); +use vars qw($badword); -$fn = "$main::data/badwords"; -%badwords = (); +my $oldfn = "$main::data/badwords"; +$badword = new DXHash "badword"; use vars qw($VERSION $BRANCH); $VERSION = sprintf( "%d.%03d", q$Revision$ =~ /(\d+)\.(\d+)/ ); @@ -29,23 +30,24 @@ $main::branch += $BRANCH; sub load { my @out; - return unless -e $fn; - my $fh = new IO::File $fn; + return unless -e $oldfn; + my $fh = new IO::File $oldfn; if ($fh) { - %badwords = (); while (<$fh>) { chomp; next if /^\s*\#/; my @list = split " "; for (@list) { - $badwords{lc $_}++; + $badword->add($_); } } $fh->close; + $badword->put; + unlink $oldfn; } else { - my $l = "can't open $fn $!"; - dbg('err', $l); + my $l = "can't open $oldfn $!"; + dbg($l); push @out, $l; } return @out; @@ -54,7 +56,7 @@ sub load # check the text against the badwords list sub check { - return grep { $badwords{$_} } split(/\b/, lc shift); + return grep { $badword->in($_) } split(/\b/, lc shift); } 1;