--- trunk/scripts/est-spider 2006/08/25 11:59:04 179 +++ trunk/scripts/est-spider 2006/08/26 22:33:34 181 @@ -61,7 +61,7 @@ my $filter; foreach my $f (qw/pdftotext pstotext/) { my $w = which($f); - if ($f) { + if ($w) { $filter->{$f} = $w; print STDERR "using $f filter at $w\n" if ($verbose); } @@ -237,6 +237,7 @@ if ($contents) { # html2text + $contents =~ s###gis; $contents =~ s#<[^>]+/*>##gs; $contents =~ s#\s\s+# #gs;