/[Biblio-Isis]/trunk/lib/Biblio/Isis.pm

This is a repository of my old source code, which is no longer updated. Go to git.rot13.org for current projects!

Diff of /trunk/lib/Biblio/Isis.pm

Parent Directory | Revision Log | View Patch Patch

-revision 62 by dpavlin,
Mon Jul 10 12:01:04 2006 UTC
+revision 70 by dpavlin,
Fri May 18 20:26:01 2007 UTC
 Line 7 
 use File::Glob qw(:globally :nocase);
  BEGIN {
          use Exporter ();
          use vars qw ($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);
-         $VERSION     = 0.22_2;
+         $VERSION     = 0.24_1;
          @ISA         = qw (Exporter);
          #Give a hoot don't pollute, do not export more than needed by default
          @EXPORT      = qw ();
 Line 84 
 Open ISIS database
          read_fdt => 1,
          include_deleted => 1,
          hash_filter => sub {
-                 my $v = shift;
+                 my ($v,$field_number) = @_;
                  $v =~ s#foo#bar#g;
          },
          debug => 1,
          join_subfields_with => ' ; ',
-         regexps => [
-                 's/something/else/g',
-         ],
   );
  Options are described below:
-Line 117 
 Don't skip logically deleted records in
+Line 114 
 Don't skip logically deleted records in
  =item hash_filter
- Filter code ref which will be used before data is converted to hash.
+ Filter code ref which will be used before data is converted to hash. It will
+ receive two arguments, whole line from current field (in C<< $_[0] >>) and
+ field number (in C<< $_[1] >>).
  =item debug
-Line 129 
 Define delimiter which will be used to j
+Line 128 
 Define delimiter which will be used to j
  option is included to support legacy applications written against versions
  older than 0.21 of this module. By default, it is disabled. See L</to_hash>.
- =item regexpes
+ =item ignore_empty_subfields
- Define (any number) of regexpes to apply at field values before they are
+ Remove all empty subfields while reading from ISIS file.
- splitted into subfield. This is great place to split subfields in input to
- mulitple subfields if needed or rename subfields.
  =back
-Line 146 
 sub new {
+Line 143 
 sub new {
          croak "new needs database name (isisdb) as argument!" unless ({@_}->{isisdb});
-         foreach my $v (qw{isisdb debug include_deleted hash_filter}) {
+         foreach my $v (qw{isisdb debug include_deleted hash_filter join_subfields_with ignore_empty_subfields}) {
-                 $self->{$v} = {@_}->{$v};
+                 $self->{$v} = {@_}->{$v} if defined({@_}->{$v});
          }
          my @isis_files = grep(/\.(FDT|MST|XRF|CNT)$/i,glob($self->{isisdb}."*"));
-Line 391 
 sub fetch {
+Line 388 
 sub fetch {
                  # skip zero-sized fields
                  next if ($FieldLEN[$i] == 0);
-                 push @{$self->{record}->{$FieldTAG[$i]}}, substr($buff,$FieldPOS[$i],$FieldLEN[$i]);
+                 my $v = substr($buff,$FieldPOS[$i],$FieldLEN[$i]);
+                 if ( $self->{ignore_empty_subfields} ) {
+                         $v =~ s/(\^\w)+(\^\w)/$2/g;
+                         $v =~ s/\^\w$//;                        # last on line?
+                         next if ($v eq '');
+                 }
+                 push @{$self->{record}->{$FieldTAG[$i]}}, $v;
          }
          $self->{'current_mfn'} = $mfn;
-Line 528 
 There is also more elaborative way to ca
+Line 533 
 There is also more elaborative way to ca
    my $hash = $isis->to_hash({
          mfn => 42,
          include_subfields => 1,
-         regexps => [
-                 's/something/else/g',
-         ],
    });
  Each option controls creation of the hash:
-Line 558 
 have original record subfield order and
+Line 560 
 have original record subfield order and
  Define the delimiter which will be used to join repeatable subfields. You can
  specify this option here instead of in L</new> if you want per-record control.
- =item regexpes
+ =item hash_filter
- Override C<regexpes> specified in L</new>.
+ You can override C<hash_filter> defined in L</new> using this option.
  =back
-Line 573 
 sub to_hash {
+Line 575 
 sub to_hash {
          my $mfn = shift || confess "need mfn!";
          my $arg;
+         my $hash_filter = $self->{hash_filter};
          if (ref($mfn) eq 'HASH') {
                  $arg = $mfn;
                  $mfn = $arg->{mfn} || confess "need mfn in arguments";
+                 $hash_filter = $arg->{hash_filter} if ($arg->{hash_filter});
          }
-         $arg->{regexpes} ||= $self->{regexpes};
-         confess "regexps must be HASH" if ($arg->{regexps} && ref($arg->{regexps}) ne 'HASH');
          # init record to include MFN as field 000
          my $rec = { '000' => [ $mfn ] };
          my $row = $self->fetch($mfn) || return;
-         my $j_rs = $arg->{join_subfields_with};
+         my $j_rs = $arg->{join_subfields_with} || $self->{join_subfields_with};
          $j_rs = $self->{join_subfields_with} unless(defined($j_rs));
          my $i_sf = $arg->{include_subfields};
-Line 595 
 sub to_hash {
+Line 596 
 sub to_hash {
                  foreach my $l (@{$row->{$f_nr}}) {
                          # filter output
-                         if ($self->{'hash_filter'}) {
+                         $l = $hash_filter->($l, $f_nr) if ($hash_filter);
-                                 $l = $self->{'hash_filter'}->($l);
+                         next unless defined($l);
-                                 next unless defined($l);
-                         }
-                         # apply regexps
-                         if ($arg->{regexps} && defined($arg->{regexps}->{$f_nr})) {
-                                 confess "regexps->{$f_nr} must be ARRAY" if (ref($arg->{regexps}->{$f_nr}) ne 'ARRAY');
-                                 my $c = 0;
-                                 foreach my $r (@{ $arg->{regexps}->{$f_nr} }) {
-                                         while ( eval '$l =~ ' . $r ) { $c++ };
-                                 }
-                                 warn "## field $f_nr triggered $c regexpes\n" if ($c && $self->{debug});
-                         }
                          my $val;
                          my $r_sf;       # repeatable subfields in this record
-Line 622 
 sub to_hash {
+Line 611 
 sub to_hash {
                                          next if (! $t);
                                          my ($sf,$v) = (substr($t,0,1), substr($t,1));
                                          # XXX this might be option, but why?
-                                         next unless ($v);
+                                         next unless (defined($v) && $v ne '');
  #                                       warn "### $f_nr^$sf:$v",$/ if ($self->{debug} > 1);
                                          if (ref( $val->{$sf} ) eq 'ARRAY') {
-Line 774 
 know any details about it's version.
+Line 763 
 know any details about it's version.
  As this is a young module, new features are added in subsequent versions. It's
  a good idea to specify a version when using this module, like this:
-   use Biblio::Isis 0.21
+   use Biblio::Isis 0.23
  Below is a list of changes in specific versions of the module (so you can target
  older versions if you really have to):
  =over 8
+ =item 0.24
+ Added C<ignore_empty_subfields>
+ =item 0.23
+ Added C<hash_filter> to L</to_hash>
+ Fixed bug with documented C<join_subfields_with> in L</new> which wasn't
+ implemented
+ =item 0.22
+ Added field number when calling C<hash_filter>
  =item 0.21
  Added C<join_subfields_with> to L</new> and L</to_hash>.

 Legend:



Removed from v.62
 


changed lines


 
Added in v.70
 Legend:



Removed from v.62
 


changed lines


 
Added in v.70
-Removed from v.62
+Added in v.70

	ViewVC Help
Powered by ViewVC 1.1.26