/[Search-Estraier]/trunk/scripts/estcp.pl
This is repository of my old source code which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Diff of /trunk/scripts/estcp.pl

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 80 by dpavlin, Mon Jan 16 23:08:07 2006 UTC revision 141 by dpavlin, Wed May 10 14:52:28 2006 UTC
# Line 1  Line 1 
1  #!/usr/bin/perl -w  #!/usr/bin/perl -w
2    
3  use strict;  use strict;
4  use Search::Estraier;  use Search::Estraier 0.06;
5  use URI::Escape qw/uri_escape/;  use URI::Escape qw/uri_escape/;
6    use Time::HiRes;
7    use POSIX qw/strftime/;
8    
9  =head1 NAME  =head1 NAME
10    
# Line 15  my ($from,$to) = @ARGV; Line 17  my ($from,$to) = @ARGV;
17  die "usage: $0 http://localhost:1978/node/from http://remote.example.com:1978/node/to\n" unless ($from && $to);  die "usage: $0 http://localhost:1978/node/from http://remote.example.com:1978/node/to\n" unless ($from && $to);
18    
19  my $debug = 0;  my $debug = 0;
20    my $max = 256;
21    
22  # create and configure node  # create and configure node
23  my $from_n = new Search::Estraier::Node(  my $from_n = new Search::Estraier::Node(
24          url => $from,          url => $from,
25          croak_on_error => 1,          croak_on_error => 1,
26          debug => $debug,          debug => $debug,
27            user => 'admin',
28            passwd => 'admin',
29  );  );
30  my $to_n = new Search::Estraier::Node(  my $to_n = new Search::Estraier::Node(
31          url => $to,          url => $to,
32          croak_on_error => 1,          croak_on_error => 1,
33          debug => $debug,          debug => $debug,
34            user => 'admin',
35            passwd => 'admin',
36            create => 1,
37            label => $from_n->label,
38  );  );
39    
40  print "Copy from ",$from_n->name," (",$from_n->label,") to ",$to_n->name," (",$to_n->label,") - ",$from_n->doc_num," documents (",$from_n->word_num," words, ",$from_n->size," bytes)\n";  print "Copy from ",$from_n->name," (",$from_n->label,") to ",$to_n->name," (",$to_n->label,") - ",$from_n->doc_num," documents (",$from_n->word_num," words, ",$from_n->size," bytes)\n";
41    
42  my $tick = int($from_n->doc_num / 78);  my $doc_num = $from_n->doc_num || 1;
43    
 print "[";  
 my $res;  
44  my $prev;  my $prev;
45  my $i = 0;  my $i = 0;
46    my $more = 1;
47    
48  do {  my $t = time();
49    
50    while($more) {
51            my $res;
52          $from_n->shuttle_url( $from_n->{url} . '/list',          $from_n->shuttle_url( $from_n->{url} . '/list',
53                  'application/x-www-form-urlencoded',                  'application/x-www-form-urlencoded',
54                  'max=256' . ( $prev ? '&prev=' . uri_escape( $prev ) : '' ),                  'max=' . $max . ( $prev ? '&prev=' . uri_escape( $prev ) : '' ),
55                  \$res,                  \$res,
56          );          );
57          last unless ($res);          if (! $res || $res eq '') {
58                    $more = 0;
59                    last;
60            }
61          foreach my $l (split(/\n/,$res)) {          foreach my $l (split(/\n/,$res)) {
62                  (my $id, $prev) = split(/\t/,$l, 2);                  (my $id, $prev) = split(/\t/,$l, 2);
63                  $to_n->put_doc( $from_n->get_doc( $id ));  
64                    #$to_n->put_doc( $from_n->get_doc( $id ));
65    
66                    my $doc_draft = $from_n->_fetch_doc( id => $id, chomp_resbody => 1 );
67                    $to_n->shuttle_url( $to_n->{url} . '/put_doc', 'text/x-estraier-draft', $doc_draft, undef) == 200 or die "can't insert $doc_draft\n";
68    
69                    $i++;
70          }          }
71          print "$prev\n";          warn "$prev\n" if ($debug);
72          print "." if ($i++ % $tick == 0);  
73  } while ($res);          my $rate = ( $i / (time() - $t) );
74            printf("%d records, %1.2f%% [%1.2f rec/s] estimated finish: %s\n",
75                    $i,
76                    ($i * 100 / $doc_num),
77                    $rate,
78                    strftime("%Y-%m-%d %H:%M:%S", localtime( time() + int(($doc_num-$i) / $rate))),
79            );
80    
81    }
82    
83    print "Copy completed.\n";
84    
 print "]\n";  

Legend:
Removed from v.80  
changed lines
  Added in v.141

  ViewVC Help
Powered by ViewVC 1.1.26