/[Search-Estraier]/trunk/lib/Search/Estraier.pm
This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Diff of /trunk/lib/Search/Estraier.pm

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 47 by dpavlin, Fri Jan 6 01:51:28 2006 UTC revision 49 by dpavlin, Fri Jan 6 12:40:23 2006 UTC
# Line 692  use Carp qw/carp croak confess/; Line 692  use Carp qw/carp croak confess/;
692  use URI;  use URI;
693  use MIME::Base64;  use MIME::Base64;
694  use IO::Socket::INET;  use IO::Socket::INET;
695    use URI::Escape qw/uri_escape/;
696    
697  =head1 Search::Estraier::Node  =head1 Search::Estraier::Node
698    
# Line 928  sub get_doc_by_uri { Line 929  sub get_doc_by_uri {
929  }  }
930    
931    
932    =head2 get_doc_attr
933    
934    Retrieve the value of an attribute from the document with the given id
935    
936      my $val = $node->get_doc_attr( document_id, 'attribute_name' ) or
937            die "can't get document attribute";
938    
939    =cut
940    
941    sub get_doc_attr {
942            my $self = shift;
943            my ($id,$name) = @_;
944            return unless ($id && $name);
945            return $self->_fetch_doc( id => $id, attr => $name );
946    }
947    
948    
949    =head2 get_doc_attr_by_uri
950    
951    Retrieve the value of an attribute from the document with the given URI
952    
953      my $val = $node->get_doc_attr_by_uri( document_uri, 'attribute_name' ) or
954            die "can't get document attribute";
955    
956    =cut
957    
958    sub get_doc_attr_by_uri {
959            my $self = shift;
960            my ($uri,$name) = @_;
961            return unless ($uri && $name);
962            return $self->_fetch_doc( uri => $uri, attr => $name );
963    }
964    
965    
966  =head2 etch_doc  =head2 etch_doc
967    
968  Extract document keywords  Extract document keywords
# Line 936  Extract document keywords Line 971  Extract document keywords
971    
972  =cut  =cut
973    
974  sub erch_doc {  sub etch_doc {
975          my $self = shift;          my $self = shift;
976          my $id = shift || return;          my $id = shift || return;
977          return $self->_fetch_doc( id => $id, etch => 1 );          return $self->_fetch_doc( id => $id, etch => 1 );
# Line 987  C<etch_doc>, C<etch_doc_by_uri>. Line 1022  C<etch_doc>, C<etch_doc_by_uri>.
1022   my $doc = $node->_fetch_doc( id => 42, etch => 1 );   my $doc = $node->_fetch_doc( id => 42, etch => 1 );
1023   my $doc = $node->_fetch_doc( uri => 'file:///document/uri/42', etch => 1 );   my $doc = $node->_fetch_doc( uri => 'file:///document/uri/42', etch => 1 );
1024    
1025     # to get a document attribute, add attr
1026     my $doc = $node->_fetch_doc( id => 42, attr => '@mdate' );
1027     my $doc = $node->_fetch_doc( uri => 'file:///document/uri/42', attr => '@mdate' );
1028    
1029   # more general form which allows implementation of   # more general form which allows implementation of
1030   # uri_to_id   # uri_to_id
1031   my $id = $node->_fetch_doc(   my $id = $node->_fetch_doc(
# Line 1016  sub _fetch_doc { Line 1055  sub _fetch_doc {
1055                  confess "unhandled argument. Need id or uri.";                  confess "unhandled argument. Need id or uri.";
1056          }          }
1057    
1058            if ($a->{attr}) {
1059                    $path = '/get_doc_attr';
1060                    $arg .= '&attr=' . uri_escape($a->{attr});
1061                    $a->{chomp_resbody} = 1;
1062            }
1063    
1064          my $rv = $self->shuttle_url( $self->{url} . $path,          my $rv = $self->shuttle_url( $self->{url} . $path,
1065                  'application/x-www-form-urlencoded',                  'application/x-www-form-urlencoded',
1066                  $arg,                  $arg,
# Line 1042  sub _fetch_doc { Line 1087  sub _fetch_doc {
1087  }  }
1088    
1089    
1090    =head2 name
1091    
1092      my $node_name = $node->name;
1093    
1094    =cut
1095    
1096    sub name {
1097            my $self = shift;
1098            $self->set_info unless ($self->{name});
1099            return $self->{name};
1100    }
1101    
1102    
1103    =head2 label
1104    
1105      my $node_label = $node->label;
1106    
1107    =cut
1108    
1109    sub label {
1110            my $self = shift;
1111            $self->set_info unless ($self->{label});
1112            return $self->{label};
1113    }
1114    
1115    
1116    =head2 doc_num
1117    
1118      my $documents_in_node = $node->doc_num;
1119    
1120    =cut
1121    
1122    sub doc_num {
1123            my $self = shift;
1124            $self->set_info if ($self->{dnum} < 0);
1125            return $self->{dnum};
1126    }
1127    
1128    
1129    =head2 word_num
1130    
1131      my $words_in_node = $node->word_num;
1132    
1133    =cut
1134    
1135    sub word_num {
1136            my $self = shift;
1137            $self->set_info if ($self->{wnum} < 0);
1138            return $self->{wnum};
1139    }
1140    
1141    
1142    =head2 size
1143    
1144      my $node_size = $node->size;
1145    
1146    =cut
1147    
1148    sub size {
1149            my $self = shift;
1150            $self->set_info if ($self->{size} < 0);
1151            return $self->{size};
1152    }
1153    
1154    
1155    
1156  =head2 shuttle_url  =head2 shuttle_url
# Line 1155  sub shuttle_url { Line 1264  sub shuttle_url {
1264          return $self->{status};          return $self->{status};
1265  }  }
1266    
1267    
1268    =head2 set_info
1269    
1270    Set information for node
1271    
1272      $node->set_info;
1273    
1274    =cut
1275    
1276    sub set_info {
1277            my $self = shift;
1278    
1279            $self->{status} = -1;
1280            return unless ($self->{url});
1281    
1282            my $resbody;
1283            my $rv = $self->shuttle_url( $self->{url} . '/inform',
1284                    'text/plain',
1285                    undef,
1286                    \$resbody,
1287            );
1288    
1289            return if ($rv != 200 || !$resbody);
1290    
1291            chomp($resbody);
1292    
1293            ( $self->{name}, $self->{label}, $self->{dnum}, $self->{wnum}, $self->{size} ) =
1294                    split(/\t/, $resbody, 5);
1295    
1296    }
1297    
1298  ###  ###
1299    
1300  =head1 EXPORT  =head1 EXPORT

Legend:
Removed from v.47  
changed lines
  Added in v.49

  ViewVC Help
Powered by ViewVC 1.1.26