projects
/
spider.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
and also in sh/db0sdx.pl
[spider.git]
/
perl
/
DXDupe.pm
diff --git
a/perl/DXDupe.pm
b/perl/DXDupe.pm
index cd4272c787530d24473dc821fcd7b724596762c9..5b288d1f87b1b3f1d04f8f99caf8c485d3d0127f 100644
(file)
--- a/
perl/DXDupe.pm
+++ b/
perl/DXDupe.pm
@@
-21,24
+21,39
@@
$fn = "$main::data/dupefile";
sub init
{
sub init
{
- $dbm = tie (%d, 'DB_File', $fn) or confess "can't open dupe file: $fn ($!)";
+ unlink $fn;
+ $dbm = tie (%d, 'DB_File', $fn);
+ confess "cannot open $fn $!" unless $dbm;
}
sub finish
{
undef $dbm;
untie %d;
}
sub finish
{
undef $dbm;
untie %d;
+ undef %d;
+ unlink $fn;
}
sub check
{
}
sub check
{
- my ($s, $t) = @_;
- return 1 if exists $d{$s};
- $t = $main::systime + $default unless $t;
- $d{$s} = $t;
+ my $s = shift;
+ return 1 if find($s);
+ add($s, shift);
return 0;
}
return 0;
}
+sub find
+{
+ return $d{$_[0]};
+}
+
+sub add
+{
+ my $s = shift;
+ my $t = shift || $main::systime + $default;
+ $d{$s} = $t;
+}
+
sub del
{
my $s = shift;
sub del
{
my $s = shift;
@@
-49,9
+64,11
@@
sub process
{
# once an hour
if ($main::systime - $lasttime >= 3600) {
{
# once an hour
if ($main::systime - $lasttime >= 3600) {
+ my @del;
while (($k, $v) = each %d) {
while (($k, $v) = each %d) {
-
delete $d{$k}
if $main::systime >= $v;
+
push @del, $k
if $main::systime >= $v;
}
}
+ delete $d{$_} for @del;
$lasttime = $main::systime;
}
}
$lasttime = $main::systime;
}
}
@@
-78,7
+95,7
@@
sub listdups
my @out;
for (sort { $d{$a} <=> $d{$b} } grep { m{$regex}i } keys %d) {
my ($dum, $key) = unpack "a1a*", $_;
my @out;
for (sort { $d{$a} <=> $d{$b} } grep { m{$regex}i } keys %d) {
my ($dum, $key) = unpack "a1a*", $_;
- push @out, "$key = " . cldatetime($d{$_} - $dupage);
+ push @out, "$key = " . cldatetime($d{$_} - $dupage)
. " expires " . cldatetime($d{$_})
;
}
return @out;
}
}
return @out;
}