/[socialtext-import]/tamtam/tamtam2socialtext.pl
This is repository of my old source code which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /tamtam/tamtam2socialtext.pl

Parent Directory Parent Directory | Revision Log Revision Log


Revision 11 - (hide annotations)
Wed Dec 12 14:04:11 2007 UTC (16 years, 3 months ago) by dpavlin
File MIME type: text/plain
File size: 2646 byte(s)
- don't die on invalid header, leave it as-is
- make links from names of pages
1 dpavlin 5 #!/usr/bin/perl
2    
3     use warnings;
4     use strict;
5    
6     use XML::Simple;
7     use File::Find;
8     use Regexp::Common qw/balanced/;
9     use Socialtext::Resting;
10     use Encode;
11 dpavlin 6 use HTTP::Date;
12 dpavlin 5 use Data::Dump qw/dump/;
13    
14 dpavlin 11 my $max = 999;
15 dpavlin 6
16 dpavlin 5 my $page;
17 dpavlin 6 my $page_date;
18 dpavlin 5
19 dpavlin 9 my @page_names;
20    
21 dpavlin 5 find({
22     wanted => sub {
23     my $path = $File::Find::name;
24     return unless -f $path;
25 dpavlin 6
26 dpavlin 5 warn "# $path\n";
27     my $ref = XMLin( $path ) || die "can't open $path: $!";
28 dpavlin 6
29     my $name = $ref->{name} || die "no name in $path";
30 dpavlin 8
31     return if $name =~ m/^TamSystem/;
32    
33 dpavlin 6 my $date = $ref->{meta}->{LastModified};
34     if ( ! $date ) {
35     warn "SKIP: no LastModified in $path $name";
36     return;
37     }
38     my $data =
39     $ref->{widgets}->{widget}->{data} ||
40     $ref->{widgets}->{widget}->{Body}->{data} ||
41     die "no data in $path ",dump( $ref );
42    
43     $page->{ $name } = [ $data, $date ];
44    
45 dpavlin 11 # strip path from page name
46     $name =~ s,^.+/([^/]+)$,$1,;
47     push @page_names, $name;
48    
49 dpavlin 6 #warn dump( $ref );
50 dpavlin 5 },
51     }, shift @ARGV || '.');
52    
53 dpavlin 6 my @pages = ( keys %$page );
54 dpavlin 5
55 dpavlin 11 warn "found following pages: ", join(", ", @page_names),"\n";
56 dpavlin 5
57 dpavlin 11 my $page_link_re = '\b(' . join('|', @page_names) . ')\b';
58    
59 dpavlin 5 my $Rester = Socialtext::Resting->new(
60     username => 'tamtam',
61     password => 'import',
62     server => 'http://saturn.ffzg.hr/',
63     );
64     $Rester->workspace('razmjenavjestina');
65     $Rester->put_workspacetag('TamTam');
66    
67     sub header {
68     my $h = shift;
69     if ( $h =~ m/^(=+)\s+(.+?)\s+\1$/ ) {
70     my $level = length($1);
71     return "\n" . ( '^' x $level ) . " $2\n";
72     } else {
73 dpavlin 11 return $h;
74 dpavlin 5 }
75     }
76    
77     sub surround {
78     my ( $with, $what ) = @_;
79     return $with . $what . $with;
80     }
81    
82 dpavlin 6 my $count = 0;
83    
84 dpavlin 5 foreach my $name ( keys %$page ) {
85 dpavlin 6 last if $count++ == $max;
86 dpavlin 5
87 dpavlin 6 my ( $body, $date ) = @{ $page->{$name} };
88     $date = time2str( $date );
89    
90 dpavlin 5 $body =~ s/\Q[[TableOfContents]]\E/{toc}/gs;
91     $body =~ s/\Q[[BR]]\E/\n/gs;
92     $body =~ s/$RE{balanced}{-begin => "= |== |=== |==== |===== |===== "}{-end => " =| ==| ===| ====| ====="}{-keep}/header($1)/gse;
93     $body =~ s/''''(.+?)''''/surround('`',$1)/gse;
94     $body =~ s/'''(.+?)'''/surround('*',$1)/gse;
95     $body =~ s/''(.+?)''/surround('_',$1)/gse;
96    
97 dpavlin 9 # fix bullets
98 dpavlin 7 $body =~ s/^\s+([\*])/$1/gm;
99    
100 dpavlin 9 # fix links
101     $body =~ s/\["([^"]+)"\]/[$1]/gs;
102 dpavlin 10 $body =~ s,\[(http://\S+)\s+([^\]]+)\],"$2"<$1>,gs;
103     $body =~ s,\[(http://[^\]]+)\],$1,gs;
104 dpavlin 11 $body =~ s,$page_link_re,[$1],gs;
105 dpavlin 9
106 dpavlin 5 Encode::_utf8_off( $body );
107    
108 dpavlin 6 my @tags = ( 'TamTam' );
109 dpavlin 5
110 dpavlin 6 if ( $name =~ m!/! ) {
111     my @page_tags = split(m!/!, $name);
112 dpavlin 8 $name = pop @page_tags; # remove page name
113 dpavlin 6 push @tags, @page_tags;
114     }
115    
116     $Rester->put_page( $name, {
117     content => $body,
118     date => $date,
119     });
120 dpavlin 5 print "+ $name\n";
121 dpavlin 6 foreach ( @tags ) {
122     $Rester->put_pagetag( $name, $_ );
123     print "+ $name [$_]\n";
124     }
125    
126 dpavlin 5 }
127    

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26