/[webpac2]/trunk/lib/WebPAC/Parser.pm

This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!

Diff of /trunk/lib/WebPAC/Parser.pm

Parent Directory | Revision Log | View Patch Patch

-revision 712 by dpavlin,
Tue Sep 26 10:23:04 2006 UTC
+revision 800 by dpavlin,
Sun Feb  4 23:10:18 2007 UTC
 Line 13 
 use base qw/WebPAC::Common/;
  =head1 NAME
- WebPAC::Parser - parse perl normalization configuration files and mungle it
+ WebPAC::Parser - parse perl normalization configuration files (rules) and mungle it
  =head1 VERSION
- Version 0.05
+ Version 0.08
  =cut
- our $VERSION = '0.05';
+ our $VERSION = '0.08';
  =head1 SYNOPSIS
  This module will parse L<WebPAC::Normalize/lookup> directives and generate source
- to produce lookups and normalization.
+ to produce lookups and normalization. It will also parse other parts of
+ the source to produce some DWIM (I<Do What I Mean>) magic
+ (like producing MARC output using L<WebPAC::Output::MARC> if there are C<marc_*>
+ rules in the normalisation).
  It's written using L<PPI>, pure-perl parser for perl and heavily influenced by
  reading about LISP. It might be a bit over-the board, but at least it removed
-Line 148 
 sub lookup_create_rules {
+Line 151 
 sub lookup_create_rules {
          return $self->{_lookup_create}->{ _q($database) }->{ _q($input) };
  }
+ =head2 normalize_rules
+   my $source = $parser->normalize_rules($database, $input);
+ =cut
+ sub normalize_rules {
+         my ($self, $database, $input) = @_;
+         # canonicalise the input name before it is used as a hash key
+         my $input_name = _input_name($input);
+         # first level: everything stored for this database
+         my $per_database = $self->{_normalize_source}->{ _q($database) };
+         return unless defined( $per_database );
+         # second level: normalize source stored for this particular input
+         my $rules_source = $per_database->{ _q($input_name) };
+         return unless defined( $rules_source );
+         return $rules_source;
+ }
+ =head2 have_rules
+   my $do_marc = $parser->have_rules('marc', $database, $input);
+   my $do_index = $parser->have_rules('search', $database);
+ This function returns a hash reference containing the count of each found
+ C<marc_*> or C<search> directive. The input name is optional.
+ =cut
+ sub have_rules {
+         my $self = shift;
+         my $log = $self->_get_logger();
+         # type and database are mandatory, input is optional
+         my $type = shift @_ || $log->logconfess("need at least type");
+         my $database = shift @_ || $log->logconfess("database is required");
+         my $input = shift @_;
+         # NOTE(review): _input_name is called even when no input was passed;
+         # the code below relies on it returning undef in that case -- confirm
+         $input = _input_name($input);
+         # counts are stored as {database}->{input}->{type}->{directive}
+         my $database_rules = $self->{_have_rules}->{ _q($database) };
+         return unless defined( $database_rules );
+         if (defined($input)) {
+                 # single input requested: hand back its per-directive counts
+                 my $input_rules = $database_rules->{ _q($input) };
+                 return unless (
+                         defined( $input_rules ) &&
+                         defined( $input_rules->{ $type } )
+                 );
+                 return $input_rules->{ $type };
+         }
+         # no input given: sum per-directive counts over all inputs of database;
+         # $usage stays undef if no input has rules of this type
+         my $usage;
+         foreach my $i (keys %{ $database_rules }) {
+                 my $type_rules = $database_rules->{ $i }->{ $type };
+                 next unless defined( $type_rules );
+                 foreach my $t (keys %{ $type_rules }) {
+                         # counts live below the type level; reading
+                         # $database_rules->{$i}->{$t} would always be undef
+                         $usage->{ $t } += $type_rules->{ $t };
+                 }
+         }
+         return $usage;
+ }
  =head1 PRIVATE
  =head2 _read_sources
-Line 165 
 sub _read_sources {
+Line 236 
 sub _read_sources {
          my $nr = 0;
-         my @lookups;
+         my @sources;
+         my $lookup_src_cache;
          $self->{config}->iterate_inputs( sub {
                  my ($input, $database) = @_;
-Line 188 
 sub _read_sources {
+Line 261 
 sub _read_sources {
                          $self->{valid_inputs}->{$database}->{$input_name}++;
-                         push @lookups, sub {
+                         push @sources, sub {
-                                 $self->_parse_lookups( $database, $input_name, $full, $s );
+                                 warn "### $database $input_name, $full ###\n";
+                                 $self->_parse_source( $database, $input_name, $full, $s );
                          };
                          $nr++;
-Line 198 
 sub _read_sources {
+Line 272 
 sub _read_sources {
          $log->debug("found $nr source files");
-         # parse all lookups
+         # parse all sources
-         $_->() foreach (@lookups);
+         $_->() foreach (@sources);
          return $nr;
  }
- =head2 _parse_lookups
+ =head2 _parse_source
-   $parser->_parse_lookups($database,$input,$path,$source);
+   $parser->_parse_source($database,$input,$path,$source);
  Called for each normalize source (rules) in each input by L</_read_sources>
-Line 214 
 It will report invalid databases and inp
+Line 288 
 It will report invalid databases and inp
  =cut
- sub _parse_lookups {
+ sub _parse_source {
          my $self = shift;
          my ($database, $input, $path, $source) = @_;
-Line 232 
 sub _parse_lookups {
+Line 306 
 sub _parse_lookups {
          my $Document = PPI::Document->new( \$source ) || $log->logdie("can't parse source:\n", $self->{source});
          $Document->prune('PPI::Token::Whitespace');
+         $Document->prune('PPI::Token::Comment');
          #$Document->prune('PPI::Token::Operator');
          # Find all the named subroutines
-Line 335 
 sub _parse_lookups {
+Line 410 
 sub _parse_lookups {
          $log->debug("create: ", dump($self->{_lookup_create}) );
          $log->debug("normalize: $normalize_source");
-         $self->{_normalize_source}->{$database}->{$input} = $normalize_source;
+         $self->{_normalize_source}->{$database}->{$input} .= $normalize_source;
          if ($self->{debug}) {
                  my $Dumper = PPI::Dumper->new( $Document );
-Line 344 
 sub _parse_lookups {
+Line 419 
 sub _parse_lookups {
          $log->error("Parser errors:\n", join("\n",@{ $self->{_lookup_errors} }) ) if ($self->{_lookup_errors});
+         $Document->find( sub {
+                         my ($Document,$Element) = @_;
+                         $Element->isa('PPI::Token::Word') or return '';
+                         if ($Element->content =~ m/^(marc|search)/) {
+                                 my $what = $1;
+                                 $log->debug("found $what rules in $database/$input");
+                                 $self->{_have_rules}->{ $database }->{ $input }->{ $what }->{ $Element->content }++;
+                         } else {
+                                 return '';
+                         }
+         });
          return 1;
  }

 Legend:



Removed from v.712
 


changed lines


 
Added in v.800
 Legend:



Removed from v.712
 


changed lines


 
Added in v.800
-Removed from v.712
+Added in v.800

	ViewVC Help
Powered by ViewVC 1.1.26