--- bin/reindex.pl 2007/04/29 11:37:28 129
+++ bin/reindex.pl 2007/05/08 14:11:38 144
@@ -11,8 +11,13 @@
 use Data::Dump qw/dump/;
 use Text::DeDuper;
 use Encode;
+use Getopt::Long;
 
-my $remove_duplicates = 1;
+my $keep_duplicates = 0;	# set by --duplicates; while false, duplicate items are removed
+
+GetOptions(
+	'duplicates!' => \$keep_duplicates,	# linkage must be a reference so the flag can be stored
+) or die "usage: $0 [--duplicates]\n";	# stop on unknown options instead of reindexing anyway
 
 $|=1;
 
@@ -22,9 +27,9 @@
 my $coll = Grep::Model::ItemCollection->new( results_are_readable => 1, current_user => $system_user );
 $coll->unlimit;
 
-print "indexing ", $coll->count, " items ";
+print "indexing ", $coll->count, " items ", $keep_duplicates ? "" : "removing duplicates ";
 
-my $search = Grep::Search->new();
+my $search = Grep::Search->new({ create => 1 });
 my $deduper = Text::DeDuper->new();
 
 my ( $total, $duplicates ) = ( 0, 0 );
@@ -33,7 +38,7 @@
 
 	print $i->id;
 
-	if ( $remove_duplicates ) {
+	if ( ! $keep_duplicates ) {
 
 		my $c = encode('utf-8', $i->content);
 
@@ -59,6 +64,6 @@
 	$total++;
 }
 
-print "$total records indexed", $remove_duplicates ? " ($duplicates duplicates)" : "", "\n";
+print "$total records indexed", $duplicates ? " ($duplicates duplicates)" : "", "\n";	# leading space separates the count from the text before it
 
 $search->finish;