/[wait]/trunk/lib/WAIT/Table.pm

This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!

Diff of /trunk/lib/WAIT/Table.pm

Parent Directory | Revision Log | View Patch

-cvs-head/lib/WAIT/Table.pm
revision 20 by cvs2svn,
Tue May  9 11:29:45 2000 UTC
+trunk/lib/WAIT/Table.pm
revision 108 by dpavlin,
Tue Jul 13 17:41:12 2004 UTC
 Line 4
  # Author          : Ulrich Pfeifer
  # Created On      : Thu Aug  8 13:05:10 1996
  # Last Modified By: Ulrich Pfeifer
- # Last Modified On: Mon May  8 20:20:58 2000
+ # Last Modified On: Wed Jan 23 14:15:15 2002
  # Language        : CPerl
- # Update Count    : 131
+ # Update Count    : 152
  # Status          : Unknown, Use with caution!
  #
  # Copyright (c) 1996-1997, Ulrich Pfeifer
 Line 25 
 WAIT::Table -- Module for maintaining Ta
  =cut
  package WAIT::Table;
+ our $VERSION = "2.000";
  use WAIT::Table::Handle ();
  require WAIT::Parse::Base;
-Line 32 
 require WAIT::Parse::Base;
+Line 33 
 require WAIT::Parse::Base;
  use strict;
  use Carp;
  # use autouse Carp => qw( croak($) );
- use DB_File;
+ use BerkeleyDB;
  use Fcntl;
- use LockFile::Simple ();
- my $USE_RECNO = 0;
  =head2 Creating a Table.
-Line 133 
 sub new {
+Line 131 
 sub new {
    my $self = {};
    # Check for mandatory attrs early
-   $self->{name}     = $parm{name}     or croak "No name specified";
+   for my $x (qw(name attr env maindbfile tablename)) {
-   $self->{attr}     = $parm{attr}     or croak "No attributes specified";
+     $self->{$x}     = $parm{$x}     or croak "No $x specified";
+   }
    # Do that before we eventually add '_weight' to attributes.
    $self->{keyset}   = $parm{keyset}   || [[@{$parm{attr}}]];
-Line 158 
 sub new {
+Line 157 
 sub new {
      unshift @{$parm{attr}}, '_weight' unless $attr{'_weight'};
    }
-   $self->{file}     = $parm{file}     or croak "No file specified";
+   $self->{path}     = $parm{path}     or croak "No path specified";
-   if (-d  $self->{file}){
+   bless $self, $type;
-     warn "Warning: Directory '$self->{file}' already exists\n";
-   } elsif (!mkdir($self->{file}, 0775)) {
-     croak "Could not 'mkdir $self->{file}': $!\n";
-   }
-   my $lockmgr = LockFile::Simple->make(-autoclean => 1);
-   # aquire a write lock
-   $self->{write_lock} = $lockmgr->lock($self->{file} . '/write')
-     or die "Can't lock '$self->{file}/write'";
    $self->{djk}      = $parm{djk}      if defined $parm{djk};
    $self->{layout}   = $parm{layout} || new WAIT::Parse::Base;
-Line 177 
 sub new {
+Line 167 
 sub new {
    $self->{deleted}  = {};       # no deleted records yet
    $self->{indexes}  = {};
-   bless $self, $type;
+   # Checking for readers is not necessary, but let's go with the
+   # generic method.
    # Call create_index() and create_index() for compatibility
    for (@{$self->{keyset}||[]}) {
      #carp "Specification of indexes at table create time is deprecated";
-Line 187 
 sub new {
+Line 179 
 sub new {
      # carp "Specification of inverted indexes at table create time is deprecated";
      my $att  = shift @{$parm{invindex}};
      my @spec = @{shift @{$parm{invindex}}};
-     my @opt;
+     my @opt  = ();
      if (ref($spec[0])) {
-       carp "Secondary pipelines are deprecated\n";
+       warn "Secondary pipelines are deprecated";
        @opt = %{shift @spec};
      }
-     $self->create_inverted_index(attribute => $att, pipeline  => \@spec, @opt);
+     $self->create_inverted_index(attribute => $att,
+                                  pipeline  => \@spec,
+                                  @opt);
    }
    $self;
    # end of backwarn compatibility stuff
  }
+ for my $accessor (qw(maindbfile tablename)) {
+   no strict 'refs';
+   *{$accessor} = sub {
+     my($self) = @_;
+     return $self->{$accessor} if $self->{$accessor};
+     require Carp;
+     Carp::confess("accessor $accessor not there");
+   }
+ }
  =head2 Creating an index
    $tb->create_index('docid');
-Line 222 
 sub create_index {
+Line 226 
 sub create_index {
    require WAIT::Index;
    my $name = join '-', @_;
+   #### warn "WARNING: Suspect use of \$_ in method create_index. name[$name]_[$_]";
    $self->{indexes}->{$name} =
-     new WAIT::Index file => $self->{file}.'/'.$name, attr => $_;
+     WAIT::Index->new(
+                      file => $self->file.'/'.$name,
+                      subname => $name,
+                      env  => $self->{env},
+                      maindbfile => $self->maindbfile,
+                      tablename => $self->tablename,
+                      attr => $_,
+                     );
  }
  =head2 Creating an inverted index
-Line 284 
 sub create_inverted_index {
+Line 296 
 sub create_inverted_index {
    }
    my $name = join '_', ($parm{attribute}, @{$parm{pipeline}});
-   my $idx = new WAIT::InvertedIndex(file   => $self->{file}.'/'.$name,
+   my $idx = WAIT::InvertedIndex->new(file   => $self->file.'/'.$name,
-                                     filter => [@{$parm{pipeline}}], # clone
+                                      subname=> $name,
-                                     name   => $name,
+                                      env    => $self->{env},
-                                     attr   => $parm{attribute},
+                                      maindbfile => $self->maindbfile,
-                                     %opt, # backward compatibility stuff
+                                      tablename => $self->tablename,
-                                    );
+                                      filter => [@{$parm{pipeline}}], # clone
+                                      name   => $name,
+                                      attr   => $parm{attribute},
+                                      %opt, # backward compatibility stuff
+                                     );
    # We will have to use $parm{predicate} here
    push @{$self->{inverted}->{$parm{attribute}}}, $idx;
  }
  sub dir {
-   $_[0]->{file};
+   $_[0]->file;
  }
  =head2 C<$tb-E<gt>layout>
-Line 323 
 Must be called via C<WAIT::Database::dro
+Line 339 
 Must be called via C<WAIT::Database::dro
  sub drop {
    my $self = shift;
    if ((caller)[0] eq 'WAIT::Database') { # database knows about this
      $self->close;               # just make sure
-     my $file = $self->{file};
+     my $file = $self->file;
      for (values %{$self->{indexes}}) {
        $_->drop;
      }
      unlink "$file/records";
-     # $self->unlock;
+     rmdir "$file/read" or warn "Could not rmdir '$file/read'";
-     ! (!-e $file or rmdir $file);
    } else {
      croak ref($self)."::drop called directly";
    }
-Line 346 
 sub mrequire ($) {
+Line 364 
 sub mrequire ($) {
    require $module;
  }
+ sub path {
+   my($self) = @_;
+   return $self->{path} if $self->{path};
+   require Data::Dumper; print STDERR "Line " . __LINE__ . ", File: " . __FILE__ . "\n" . Data::Dumper->new([$self],[qw(self)])->Indent(1)->Useqq(1)->Dump; # XXX
+   require Carp;
+   Carp::confess("NO file attr");
+ }
  sub open {
    my $self = shift;
-   my $file = $self->{file} . '/records';
+   my $file = $self->file . '/records';
    mrequire ref($self);           # that's tricky eh?
    if (defined $self->{'layout'}) {
-Line 359 
 sub open {
+Line 385 
 sub open {
    }
    if (exists $self->{indexes}) {
      require WAIT::Index;
-     for (values %{$self->{indexes}}) {
+     for my $Ind (values %{$self->{indexes}}) {
-       $_->{mode} = $self->{mode};
+       for my $x (qw(mode env maindbfile)) {
+         $Ind->{$x} = $self->{$x};
+       }
      }
    }
    if (exists $self->{inverted}) {
      my ($att, $idx);
      for $att (keys %{$self->{inverted}}) {
        for $idx (@{$self->{inverted}->{$att}}) {
-         $idx->{mode} = $self->{mode};
+         for my $x (qw(mode env maindbfile)) {
+           $idx->{$x} = $self->{$x};
+         }
        }
      }
      require WAIT::InvertedIndex;
    }
-   unless (defined $self->{dbh}) {
-     if ($USE_RECNO) {
-       $self->{dbh} = tie(@{$self->{db}}, 'DB_File', $file,
-                          $self->{mode}, 0664, $DB_RECNO);
-     } else {
-       $self->{dbh} =
-         tie(%{$self->{db}}, 'DB_File', $file,
-                          $self->{mode}, 0664, $DB_BTREE);
-     }
-   }
-   # Locking
-   #
-   # We allow multiple readers to coexists.  But write access excludes
-   # all read access vice versa.  In practice read access on tables
-   # open for writing will mostly work ;-)
-   my $lockmgr = LockFile::Simple->make(-autoclean => 1);
+   # CONFUSION: WAIT knows two *modes*: read-only or read-write.
+   # BerkeleyDB means file permissions when talking about Mode.
-   # aquire a write lock. We might hold one acquired in create() already
+   # BerkeleyDB has the "Flags" attribute to specify
-   $self->{write_lock} ||= $lockmgr->lock($self->{file} . '/write')
+   # read/write/lock/etc subsystems.
-     or die "Can't lock '$self->{file}/write'";
-   my $lockdir = $self->{file} . '/read';
-   unless (-d $lockdir) {
-     mkdir $lockdir, 0755 or die "Could not mkdir $lockdir: $!";
-   }
+   my $flags;
    if ($self->{mode} & O_RDWR) {
-     # this is a hack.  We do not check for reopening ...
+     $flags = DB_CREATE; # | DB_INIT_MPOOL | DB_PRIVATE | DB_INIT_CDB;
-     return $self if $self->{write_lock};
+     warn "Flags on table $file set to 'writing'";
-     # If we actually want to write we must check if there are any readers
-     opendir DIR, $lockdir or
-       die "Could not opendir '$lockdir': $!";
-     for my $lockfile (grep { -f "$lockdir/$_" } readdir DIR) {
-       # check if the locks are still valid.
-       # Since we are protected by a write lock, we could use a pline file.
-       # But we want to use the stale testing from LockFile::Simple.
-       if (my $lck = $lockmgr->trylock("$lockdir/$lockfile")) {
-         warn "Removing stale lockfile '$lockdir/$lockfile'";
-         $lck->release;
-       } else {
-         $self->{write_lock}->release;
-         die "Cannot write table '$file' while it's in use";
-       }
-     }
    } else {
-     # this is a hack.  We do not check for reopening ...
+     $flags = DB_RDONLY;
-     return $self if $self->{read_lock};
+     # warn "Flags on table $file set to 'readonly'";
+   }
-     # We are a reader. So we release the write lock
+   unless (defined $self->{dbh}) {
-     my $id = time;
+     my $subname = $self->tablename . "/records";
-     while (-f "$lockdir/$id.lock") { # here assume ".lock" format!
+     $self->{dbh} =
-       $id++;
+         tie(%{$self->{db}}, 'BerkeleyDB::Btree',
-     }
+             $self->{env} ? (Env => $self->{env}) : (),
-     $self->{read_lock} = $lockmgr->lock("$lockdir/$id");
+             # Filename => $file,
-     $self->{write_lock}->release;
+             Filename => $self->maindbfile,
-     delete $self->{write_lock};
+             Subname => $subname,
+             Mode => 0664,
+             Flags => $flags,
+             $WAIT::Database::Cachesize?(Cachesize => $WAIT::Database::Cachesize):(),
+             $WAIT::Database::Pagesize?(Pagesize => $WAIT::Database::Pagesize):(),
+            )
+             or die "Cannot tie: $BerkeleyDB::Error;
+  DEBUG: Filename[$self->{maindbfile}]subname[$subname]Mode[0664]Flags[$flags]";
    }
    $self;
  }
-Line 510 
 sub insert {
+Line 509 
 sub insert {
    unless ($gotkey) {
      $key = $self->{nextk}++;
    }
-   if ($USE_RECNO) {
+   $self->{db}->{$key} = $tuple;
-     $self->{db}->[$key] = $tuple;
-   } else {
-     $self->{db}->{$key} = $tuple;
-   }
    for (values %{$self->{indexes}}) {
      unless ($_->insert($key, %parm)) {
        # duplicate key, undo changes
-Line 565 
 sub fetch {
+Line 560 
 sub fetch {
    return () if exists $self->{deleted}->{$key};
    defined $self->{db} or $self->open;
-   if ($USE_RECNO) {
+   $self->unpack($self->{db}->{$key});
-     $self->unpack($self->{db}->[$key]);
-   } else {
-     $self->unpack($self->{db}->{$key});
-   }
  }
  sub delete_by_key {
-Line 609 
 sub delete {
+Line 600 
 sub delete {
  }
  sub unpack {
-   my $self = shift;
+   my($self, $tuple) = @_;
-   my $tuple = shift;
-   return unless defined $tuple;
+   unless (defined $tuple){
+     # require Carp; # unfortunately gives us "bizarre copy...." :-(((((
+     warn("Debug: somebody called unpack without argument tuple!");
+     return;
+   }
    my $att;
    my @result;
-Line 625 
 sub unpack {
+Line 620 
 sub unpack {
  sub set {
    my ($self, $iattr, $value) = @_;
+   # in the rare case that they haven't written a single record yet, we
-   return unless $self->{write_lock};
+   # make sure, the inverted inherits our $self->{mode}:
+   defined $self->{db} or $self->open;
    for my $att (keys %{$self->{inverted}}) {
      if ($] > 5.003) {         # avoid bug in perl up to 5.003_05
        my $idx;
-Line 644 
 sub set {
+Line 641 
 sub set {
  sub close {
    my $self = shift;
+   require Carp; Carp::cluck("------->Closing A Table<-------");
    if (exists $self->{'access'}) {
      eval {$self->{'access'}->close}; # dont bother if not opened
    }
-   for (values %{$self->{indexes}}) {
+   if ($WAIT::Index::VERSION) {
-     require WAIT::Index;
+     for (values %{$self->{indexes}}) {
-     $_->close();
+       $_->close();
+     }
    }
-   if (defined $self->{inverted}) {
+   if (defined $self->{inverted} && $WAIT::InvertedIndex::VERSION) {
+     # require WAIT::InvertedIndex; Uli: we can avoid closing indexes:
+     # if WAIT::InvertedIndex has not been loaded, they cannot have
+     # been altered so far
      my $att;
      for $att (keys %{$self->{inverted}}) {
        if ($] > 5.003) {         # avoid bug in perl up to 5.003_05
-Line 666 
 sub close {
+Line 669 
 sub close {
    }
    if ($self->{dbh}) {
      delete $self->{dbh};
+   }
-     if ($USE_RECNO) {
+   untie %{$self->{db}};
-       untie @{$self->{db}};
+   for my $att (qw(env db file maindbfile)) {
-     } else {
+     delete $self->{$att};
-       untie %{$self->{db}};
+     warn "----->Deleted att $att<-----";
-     }
-     delete $self->{db};
    }
-   $self->unlock;
 ;
  }
- sub unlock {
+ sub DESTROY {
    my $self = shift;
-   # Either we have a read or a write lock (or we close the table already)
+   delete $self->{env};
-   # unless ($self->{read_lock} || $self->{write_lock}) {
-   #   warn "WAIT::Table::unlock: Table aparently hold's no lock"
-   # }
-   if ($self->{write_lock}) {
-     $self->{write_lock}->release();
-     delete $self->{write_lock};
-   }
-   if ($self->{read_lock}) {
-     $self->{read_lock}->release();
-     delete $self->{read_lock};
-   }
- }
- sub DESTROY {
+   # require Data::Dumper; print STDERR "Line " . __LINE__ . ", File: " . __FILE__ . "\n" . Data::Dumper->new([$self],[qw(self)])->Indent(1)->Useqq(1)->Dump; # XXX
-   my $self = shift;
-   warn "Table handle destroyed without closing it first"
-     if $self->{write_lock} || $self->{read_lock};
  }
  sub open_scan {
-Line 759 
 sub intervall {
+Line 742 
 sub intervall {
    bless \%result, 'WAIT::Query::Raw';
  }
- sub search {
+ sub search_ref {
    my $self  = shift;
    my ($query, $attr, $cont, $raw);
    if (ref $_[0]) {
      $query = shift;
+     # require Data::Dumper; print STDERR "Line " . __LINE__ . ", File: " . __FILE__ . "\n" . Data::Dumper->new([$query],[qw()])->Indent(1)->Useqq(1)->Dump; # XXX
      $attr = $query->{attr};
      $cont = $query->{cont};
      $raw  = $query->{raw};
-Line 804 
 sub search {
+Line 788 
 sub search {
    }
    if (defined $cont and $cont ne '') {
      for (@{$self->{inverted}->{$attr}}) {
-       my %r = $_->search($query, $cont);
+       my $r = $_->search_ref($query, $cont);
        my ($key, $val);
-       while (($key, $val) = each %r) {
+       while (($key, $val) = each %$r) {
          if (exists $result{$key}) {
            $result{$key} += $val;
          } else {
-Line 820 
 sub search {
+Line 804 
 sub search {
    for (keys %result) {
      delete $result{$_} if $self->{deleted}->{$_}
    }
-   %result;
+   \%result;
+ }
+ sub parse_query {
+   my($self, $attr, $query) = @_;
+   return unless defined $query && length $query;
+   my %qt;
+   for (@{$self->{inverted}->{$attr}}) {
+     grep $qt{$_}++, $_->parse($query);
+   }
+   [keys %qt];
  }
  sub hilight_positions {

 Legend:



Removed from v.20
 


changed lines


 
Added in v.108
 Legend:



Removed from v.20
 


changed lines


 
Added in v.108
-Removed from v.20
+Added in v.108

	ViewVC Help
Powered by ViewVC 1.1.26