/[couchdb]/scripts/reblog2couchdb.pl
This is a repository of my old source code, which is no longer updated. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /scripts/reblog2couchdb.pl

Parent Directory | Revision Log


Revision 6 - (hide annotations)
Tue Aug 5 16:22:43 2008 UTC (15 years, 10 months ago) by dpavlin
File MIME type: text/plain
File size: 2335 byte(s)
keep last synced row within couchdb for easy stop/resume of
import
1 dpavlin 2 #!/usr/bin/perl -w
2    
3     use strict;
4     use DBI;
5     use CouchDB::Client;
6     use Data::Dump qw/dump/;
7    
# Unbuffer STDOUT so progress output appears immediately.
$| = 1;

# Name shared by the MySQL source database and the CouchDB target database.
my $database = 'reblog';

# DBI data source name; host/port point at a local forwarded port.
my $dbi = join ';',
    "DBI:mysql:database=$database",
    "host=127.0.0.1",
    "port=13306"; # XXX over ssh

# One batch of items newer than the bound id (the single placeholder),
# joined with their feed metadata. items.id is additionally exposed as _id
# so it can be used directly as the CouchDB document id.
my $sql = qq{
    select
        items.id as _id,
        items.*,
        feeds.url as feed_url,
        feeds.title as feed_title,
        feeds.link as feed_link,
        feeds.description as feed_description
    from items
    join items_userdata on items.id = item_id
    join feeds on items.feed_id = feeds.id
    where items.id > ?
    order by items.id asc
    limit 1000
};


# Connect to the local CouchDB server and make sure the target database exists.
my $c = CouchDB::Client->new( uri => 'http://localhost:5984/' );

die "The server cannot be reached" unless $c->testConnection;
print "CouchDB version ", $c->serverInfo->{version}, "\n";

my $db = $c->newDB( $database );
if ( !$c->dbExists( $database ) ) {
    $db->create;
}

# The '_sync' document carries the resume position between runs.
# If it cannot be retrieved it is created.
my $status = $db->newDoc( '_sync' );
eval { $status->retrieve };
if ( $@ ) {
    $status->create;
}

print "status " . dump( $status->{data} ) . "\n";

# Resume after the last recorded row id, or from the beginning when none is stored.
my $last_row = $status->{data}{last_row_id};
$last_row ||= 0;

my $dbh = DBI->connect( $dbi, "", "" )
    or die $DBI::errstr;

print "Fetching items from $dbi id > $last_row\n";

my $sth = $dbh->prepare( $sql )
    or die $dbh->errstr();
$sth->execute( $last_row )
    or die $sth->errstr();

# Debug output: column names of the result set.
warn dump( $sth->{NAME} );

# NOTE(review): DBI documents rows() as reliable only for non-SELECT
# statements; the number printed here depends on the driver -- confirm.
print "found " . $sth->rows . " items to process...";
57    
# Column of the SQL result whose value is stored as the resume checkpoint.
my $pk = 'id';

# Number of rows stored in CouchDB during this run.
my $count = 0;

# A checkpoint is written to the status document after this many stored rows.
my $checkpoint_every = 100;

# Set when a row could not be stored; the import stops at that row.
my $failure;

# row2doc( $row, $doc )
#
# Fill a CouchDB document from one SQL row.
#
#   $row - hash reference for one fetched row; it is NOT modified
#   $doc - document object to fill
#
# The 'xml' and 'content' columns are stored as attachments ('item.xml' and
# 'content.html') when they are non-empty; all remaining columns become the
# document data. Returns $doc so that calls can be chained.
sub row2doc {
    my ( $row, $doc ) = @_;

    # Work on a shallow copy: the same row is converted a second time on the
    # update path, and that call must still see the attachment columns.
    my %data = %$row;

    my $xml = delete $data{xml};
    $doc->addAttachment( 'item.xml', 'application/xhtml+xml', $xml )
        if defined $xml && length $xml;

    my $content = delete $data{content};
    $doc->addAttachment( 'content.html', 'text/html', $content )
        if defined $content && length $content;

    $doc->{data} = \%data;
    return $doc;
}

ROW: while ( my $row = $sth->fetchrow_hashref() ) {
    my $_id = $row->{_id} || die "row needs _id";
    my $doc = row2doc( $row, $db->newDoc( $_id ) );

    eval { $doc->create };
    if ( $@ ) {
        # create failed -- presumably because the document already exists.
        # Load the stored revision and overwrite it with the current row.
        # This runs in its own eval so that $@ reflects this attempt and
        # not the failed create above.
        my $updated = eval {
            $doc->retrieve;
            row2doc( $row, $doc )->update;
            1;
        };
        if ( !$updated ) {
            # Stop here without advancing the checkpoint, so the failing
            # row is retried on the next run.
            $failure = "ERROR $_id " . ( $@ || 'unknown error' );
            last ROW;
        }
        warn "updated $_id\n";
    } else {
        warn "created ", dump( $doc->{data} ), "\n";
    }

    # This row is now stored; remember it as the resume position.
    $last_row = $row->{$pk};
    $count++;

    if ( $count % $checkpoint_every == 0 ) { # periodic checkpoint
        $status->{data}->{last_row_id} = $last_row;
        $status->update;
    }
}

# end checkpoint: record the last row that was actually stored
$status->{data}->{last_row_id} = $last_row;
$status->update;

die $failure if defined $failure;
98    
99 dpavlin 2 __END__
100    
101     $sql = qq{
102     update items_userdata
103     set value_numeric = 1
104     where label = 'read' and item_id in ($ids)
105     };
106    
107     $dbh->do( $sql );
108    

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26