/[socialtext-import]/tamtam/tamtam2socialtext.pl
This is repository of my old source code which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /tamtam/tamtam2socialtext.pl

Parent Directory Parent Directory | Revision Log Revision Log


Revision 13 - (hide annotations)
Wed Dec 12 17:14:58 2007 UTC (16 years, 2 months ago) by dpavlin
File MIME type: text/plain
File size: 2902 byte(s)
added original link at end of page
1 dpavlin 5 #!/usr/bin/perl
2    
3     use warnings;
4     use strict;
5    
6     use XML::Simple;
7     use File::Find;
8     use Regexp::Common qw/balanced/;
9     use Socialtext::Resting;
10     use Encode;
11 dpavlin 6 use HTTP::Date;
12 dpavlin 5 use Data::Dump qw/dump/;
13    
14 dpavlin 11 my $max = 999;
15 dpavlin 6
16 dpavlin 5 my $page;
17 dpavlin 6 my $page_date;
18 dpavlin 5
19 dpavlin 9 my @page_names;
20    
21 dpavlin 5 find({
22     wanted => sub {
23     my $path = $File::Find::name;
24     return unless -f $path;
25 dpavlin 6
26 dpavlin 5 warn "# $path\n";
27     my $ref = XMLin( $path ) || die "can't open $path: $!";
28 dpavlin 6
29     my $name = $ref->{name} || die "no name in $path";
30 dpavlin 8
31     return if $name =~ m/^TamSystem/;
32    
33 dpavlin 6 my $date = $ref->{meta}->{LastModified};
34     if ( ! $date ) {
35     warn "SKIP: no LastModified in $path $name";
36     return;
37     }
38     my $data =
39     $ref->{widgets}->{widget}->{data} ||
40     $ref->{widgets}->{widget}->{Body}->{data} ||
41     die "no data in $path ",dump( $ref );
42    
43 dpavlin 13 $data .= qq{
44     ----
45    
46     Original: http://www.razmjenavjestina.org/$path
47     };
48    
49 dpavlin 6 $page->{ $name } = [ $data, $date ];
50    
51 dpavlin 11 # strip path from page name
52     $name =~ s,^.+/([^/]+)$,$1,;
53     push @page_names, $name;
54    
55 dpavlin 13 # warn dump( $ref );
56 dpavlin 5 },
57     }, shift @ARGV || '.');
58    
59 dpavlin 6 my @pages = ( keys %$page );
60 dpavlin 5
61 dpavlin 11 warn "found following pages: ", join(", ", @page_names),"\n";
62 dpavlin 5
63 dpavlin 11 my $page_link_re = '\b(' . join('|', @page_names) . ')\b';
64    
65 dpavlin 5 my $Rester = Socialtext::Resting->new(
66     username => 'tamtam',
67     password => 'import',
68     server => 'http://saturn.ffzg.hr/',
69     );
70     $Rester->workspace('razmjenavjestina');
71     $Rester->put_workspacetag('TamTam');
72    
73     sub header {
74     my $h = shift;
75     if ( $h =~ m/^(=+)\s+(.+?)\s+\1$/ ) {
76     my $level = length($1);
77     return "\n" . ( '^' x $level ) . " $2\n";
78     } else {
79 dpavlin 11 return $h;
80 dpavlin 5 }
81     }
82    
83     sub surround {
84     my ( $with, $what ) = @_;
85     return $with . $what . $with;
86     }
87    
88 dpavlin 12 sub pre {
89     my $text = shift;
90     $text =~ s/^{{{//;
91     $text =~ s/}}}$//;
92     return '.pre' . $text . '.pre';
93     }
94    
95 dpavlin 6 my $count = 0;
96    
97 dpavlin 5 foreach my $name ( keys %$page ) {
98 dpavlin 6 last if $count++ == $max;
99 dpavlin 5
100 dpavlin 6 my ( $body, $date ) = @{ $page->{$name} };
101     $date = time2str( $date );
102    
103 dpavlin 5 $body =~ s/\Q[[TableOfContents]]\E/{toc}/gs;
104     $body =~ s/\Q[[BR]]\E/\n/gs;
105     $body =~ s/$RE{balanced}{-begin => "= |== |=== |==== |===== |===== "}{-end => " =| ==| ===| ====| ====="}{-keep}/header($1)/gse;
106     $body =~ s/''''(.+?)''''/surround('`',$1)/gse;
107     $body =~ s/'''(.+?)'''/surround('*',$1)/gse;
108     $body =~ s/''(.+?)''/surround('_',$1)/gse;
109 dpavlin 12 $body =~ s/$RE{balanced}{-begin => "{{{"}{-end => "}}}"}{-keep}/pre($1)/gse;
110 dpavlin 5
111 dpavlin 9 # fix bullets
112 dpavlin 7 $body =~ s/^\s+([\*])/$1/gm;
113    
114 dpavlin 9 # fix links
115     $body =~ s/\["([^"]+)"\]/[$1]/gs;
116 dpavlin 10 $body =~ s,\[(http://\S+)\s+([^\]]+)\],"$2"<$1>,gs;
117     $body =~ s,\[(http://[^\]]+)\],$1,gs;
118 dpavlin 11 $body =~ s,$page_link_re,[$1],gs;
119 dpavlin 9
120 dpavlin 5 Encode::_utf8_off( $body );
121    
122 dpavlin 6 my @tags = ( 'TamTam' );
123 dpavlin 5
124 dpavlin 6 if ( $name =~ m!/! ) {
125     my @page_tags = split(m!/!, $name);
126 dpavlin 8 $name = pop @page_tags; # remove page name
127 dpavlin 6 push @tags, @page_tags;
128     }
129    
130     $Rester->put_page( $name, {
131     content => $body,
132     date => $date,
133     });
134 dpavlin 5 print "+ $name\n";
135 dpavlin 6 foreach ( @tags ) {
136     $Rester->put_pagetag( $name, $_ );
137     print "+ $name [$_]\n";
138     }
139    
140 dpavlin 5 }
141    

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26