/[Biblio-Isis]/trunk/t/2_isis.t
This is a repository of my old source code, which is no longer updated. Go to git.rot13.org for current projects!
ViewVC logotype

Annotation of /trunk/t/2_isis.t

Parent Directory | Revision Log


Revision 61 - (hide annotations)
Sun Jul 9 21:36:33 2006 UTC (17 years, 8 months ago) by dpavlin
File MIME type: application/x-troff
File size: 8238 byte(s)
initial implementation of split_on_delimiters functionality needed for
Webpac. It adds just regexpes hash to to_hash, but I'm still not quite
satisfied with it.
1 dpavlin 19 #!/usr/bin/perl -w
2    
3     use strict;
4     use blib;
5    
# Plan: 1 (use_ok) + 2 x 66 (two test_data runs) + 18 top-level checks.
# The count no longer depends on which database lacks a .CNT file, because
# the SKIP block in test_data now skips exactly as many tests as it holds.
use Test::More tests => 151;
use File::Spec;

BEGIN {
    use_ok( 'Biblio::Isis' );

    # Prefer Data::Dump for debug output and fall back to Data::Dumper.
    # The modules are loaded with require because a "use" statement runs at
    # compile time no matter which branch of an if/else it is written in.
    if ( eval { require Data::Dump; 1 } ) {
        no warnings 'once';
        *Dumper = \&Data::Dump::dump;
    }
    else {
        require Data::Dumper;
        Data::Dumper->import;
    }
}


# Debug level is the length of the first command-line argument
# (0 when the argument is missing or false).
my $debug = length( shift(@ARGV) || '' );

# Database object under test; test_data() reads it from file scope.
my $isis;

my $path_winisis = File::Spec->catfile('data', 'winisis', 'BIBL');
my $path_isismarc = File::Spec->catfile('data', 'isismarc', 'BIBL');

# test_data( %args )
#
# Runs the shared checks against the database currently held in $isis:
# object class, record count, .CNT contents, the fields of every record and
# the MD5 digest of each record's to_ascii() output.
#
# Named arguments:
#   no_ident  - when true, two leading characters out of '0', '1', '#' and
#               space are stripped from every expected value before it is
#               compared with the fetched one
#   md5_ascii - array ref with the expected MD5 hex digest for each MFN
#
# With the five-record fixtures this produces 66 results per call:
# 2 (class, count) + 20 (.CNT) + 39 (fetch loop) + 5 (MD5).
sub test_data {

    my $args = {@_};

    isa_ok($isis, 'Biblio::Isis');

    cmp_ok($isis->count, '==', 5, "count is 5");

    # test .CNT data

    SKIP: {
        # 20 = read_cnt + element count + 2 blocks x 9 counters below.
        skip "no CNT file for this database", 20 unless $isis->{cnt_file};

        ok(my $isis_cnt = $isis->read_cnt, "read_cnt");

        cmp_ok(scalar keys %{$isis_cnt}, '==', 2, "returns 2 elements");

        my $cnt = {
            '1' => {
                'N' => 15,
                'K' => 5,
                'FMAXPOS' => 8,
                'POSRX' => 1,
                'ABNORMAL' => 1,
                'ORDN' => 5,
                'LIV' => 0,
                'ORDF' => 5,
                'NMAXPOS' => 1
            },
            '2' => {
                'N' => 15,
                'K' => 5,
                'FMAXPOS' => 4,
                'POSRX' => 1,
                'ABNORMAL' => 0,
                'ORDN' => 5,
                'LIV' => 0,
                'ORDF' => 5,
                'NMAXPOS' => 1
            }
        };

        foreach my $c (keys %{$cnt}) {
            foreach my $kn (keys %{$cnt->{$c}}) {
                cmp_ok($isis_cnt->{$c}->{$kn}, '==', $cnt->{$c}->{$kn}, "cnt $c $kn same");
            }
        }
    }

    # test fetch

    # Expected field values, one hash per MFN (index = MFN - 1). Built anew
    # on every call because the no_ident substitution edits it in place.
    my $data = [ {
        '801' => [ '^aFFZG' ],
        '702' => [ '^aHolder^bElizabeth' ],
        '990' => [ '2140', '88', 'HAY' ],
        '675' => [ '^a159.9' ],
        '210' => [ '^aNew York^cNew York University press^dcop. 1988' ],
    }, {
        '210' => [ '^aNew York^cUniversity press^d1989' ],
        '700' => [ '^aFrosh^bStephen' ],
        '990' => [ '2140', '89', 'FRO' ],
        '200' => [ '^aPsychoanalysis and psychology^eminding the gap^fStephen Frosh' ],
        '215' => [ '^aIX, 275 str.^d23 cm' ],
    }, {
        '210' => [ '^aLondon^cFree Associoation Books^d1992' ],
        '700' => [ '^aTurkle^bShirlie' ],
        '990' => [ '2140', '92', 'LAC' ],
        '200' => [ '^aPsychoanalitic politics^eJacques Lacan and Freud\'s French Revolution^fSherry Turkle' ],
        '686' => [ '^a2140', '^a2140' ],

    }, {
        '700' => [ '^aGross^bRichard' ],
        '200' => [ '^aKey studies in psychology^fRichard D. Gross' ],
        '210' => [ '^aLondon^cHodder & Stoughton^d1994' ],
        '10' => [ '^a0-340-59691-0' ],
    }, {
        # identifier test
        '200' => [ '1#^aPsychology^fCamille B. Wortman, Elizabeth F. Loftus, Mary E. Marshal' ],
        225 => ["1#^aMcGraw-Hill series in Psychology"],
        205 => ["^a4th ed"],
    } ];

    foreach my $mfn (1 .. $isis->count) {

        my $rec;
        ok($rec = $isis->fetch($mfn), "fetch $mfn");

        diag "<<<<< rec = ",Dumper( $rec ), "\n>>>>> data = ", Dumper( $data->[$mfn-1] ) if ($debug);

        foreach my $f (keys %{$data->[$mfn-1]}) {
            my $i = 0;
            foreach my $v (@{$data->[$mfn-1]->{$f}}) {
                # $v aliases the element of $data, so this edits the
                # expected value itself.
                $v =~ s/^[01# ][01# ]// if ($args->{no_ident});
                diag "compare '", $rec->{$f}->[$i], "' eq '$v'" if ($debug);
                cmp_ok($rec->{$f}->[$i], 'eq', $v, "MFN $mfn field: $f offset: $i");
                $i++;
            }
        }

        cmp_ok($isis->mfn, '==', $mfn, 'mfn');

    }

    # test to_ascii

    SKIP: {
        # Block eval + require instead of a string eval; md5_hex is called
        # by its full name, so nothing needs to be imported.
        skip "no Digest::MD5 module", 5
            unless eval { require Digest::MD5; 1 };

        foreach my $mfn (1 .. $isis->count) {
            my $md5 = Digest::MD5::md5_hex($isis->to_ascii($mfn));
            cmp_ok($md5, 'eq', $args->{md5_ascii}[$mfn - 1], "md5 $mfn");
        }
    }

}
144    
# First run: the WinISIS database. Deleted records are included and the
# library gets a debug level one below the script's own (never below 0).
my $library_debug = $debug > 1 ? ($debug - 1) : 0;

my @md5_winisis = qw(
    a369eff702307ba12eb81656ee0587fe
    4fb38537a94f3f5954e40d9536b942b0
    579a7c6901c654bdeac10547a98e5b71
    7d2adf1675c83283aa9b82bf343e3d85
    4cc1f798bbcf36862f7aa78c3410801a
);

$isis = Biblio::Isis->new(
    isisdb          => $path_winisis,
    include_deleted => 1,
    debug           => $library_debug,
);

if ($debug) {
    diag "new Biblio::Isis = ", Dumper($isis);
}

# no_ident makes test_data strip the two-character identifier from the
# expected values before comparing them.
test_data(
    no_ident  => 1,
    md5_ascii => \@md5_winisis,
);

# Second run: the IsisMarc database, compared with identifiers left in.
my @md5_isismarc = qw(
    f5587d9bcaa54257a98fe27d3c17a0b6
    3be9a049f686f2a36af93a856dcae0f2
    3961be5e3ba8fb274c89c08d18df4bcc
    5f73ec00d08af044a2c4105f7d889e24
    843b9ebccf16a498fba623c78f21b6c0
);

$isis = Biblio::Isis->new(
    isisdb          => $path_isismarc,
    include_deleted => 1,
);

test_data( md5_ascii => \@md5_isismarc );
178 dpavlin 25
# check logically deleted
#
# MFN 3 of the WinISIS database is expected to be flagged as deleted. It is
# fetched twice: once with include_deleted set and once without.
my $deleted_mfn = 3;

# With include_deleted the record is returned and kept in the object.
$isis = Biblio::Isis->new(
    isisdb          => $path_winisis,
    include_deleted => 1,
);

ok($isis->fetch($deleted_mfn), "deleted found");
cmp_ok($isis->{deleted}, '==', $deleted_mfn, "MFN 3 is deleted");
ok($isis->{record}, "record exists");

if ($debug) {
    diag "record = ",Dumper($isis->{record});
}

# Without include_deleted the fetch must fail, while the object still
# reports which MFN was deleted.
$isis = Biblio::Isis->new(
    isisdb => $path_winisis,
    debug  => $debug,
);

ok(! $isis->fetch($deleted_mfn), "deleted not found");
cmp_ok($isis->{deleted}, '==', $deleted_mfn, "MFN 3 is deleted");
ok(! $isis->{record}, 'no record');
200 dpavlin 25
# Install a hand-built record directly in the object so that the output
# formats can be compared with known values. Field 902 repeats subfields
# a and b inside a single occurrence.
$isis->{record} = {
    900 => [ '^a900a^b900b^c900c' ],
    901 => [
        '^a901a-1^b901b-1^c901c-1',
        '^a901a-2^b901b-2',
        '^a901a-3',
    ],
    902 => [
        '^aa1^aa2^aa3^bb1^aa4^bb2^cc1^aa5',
    ],
};
$isis->{current_mfn} = 42;

# to_hash called with a plain MFN: repeated subfields come back as arrays.
my $expected_plain = {
    "000" => [42],
    900 => [{ a => "900a", b => "900b", c => "900c" }],
    901 => [
        { a => "901a-1", b => "901b-1", c => "901c-1" },
        { a => "901a-2", b => "901b-2" },
        { a => "901a-3" },
    ],
    902 => [
        { a => ["a1", "a2", "a3", "a4", "a5"], b => ["b1", "b2"], c => "c1" },
    ],
};

ok(my $hash = $isis->to_hash( $isis->mfn ), 'to_hash');
if ($debug) {
    diag "to_hash = ",Dumper( $hash );
}
is_deeply( $hash, $expected_plain, 'hash is_deeply');

# to_ascii: one "tag value" line per field occurrence, MFN first as tag 0.
# NOTE(review): the whitespace between tag and value is copied as a single
# space from the rendered page; the page may have collapsed a tab, so
# confirm it against the real to_ascii output.
my $expected_ascii = <<'__END_OF_ASCII__';
0 42
900 ^a900a^b900b^c900c
901 ^a901a-1^b901b-1^c901c-1
901 ^a901a-2^b901b-2
901 ^a901a-3
902 ^aa1^aa2^aa3^bb1^aa4^bb2^cc1^aa5
__END_OF_ASCII__

ok(my $ascii_out = $isis->to_ascii( $isis->mfn ), 'to_ascii');
if ($debug) {
    diag "to_ascii = \n", $ascii_out;
}
cmp_ok($ascii_out, 'eq', $expected_ascii, 'to_ascii output');

# The hash-ref calling form must give the same result as the plain MFN form.
ok(my $hash_by_name = $isis->to_hash({ mfn => $isis->mfn }), 'to_hash(mfn)');
is_deeply( $hash_by_name, $hash, 'same hash' );

# include_subfields adds a "subfields" list of (name, index) pairs that
# records the order in which the subfields appeared.
my $expected_with_subfields = {
    "000" => [42],
    900 => [
        { a => "900a", b => "900b", c => "900c", subfields => ["a", 0, "b", 0, "c", 0] },
    ],
    901 => [
        { a => "901a-1", b => "901b-1", c => "901c-1", subfields => ["a", 0, "b", 0, "c", 0] },
        { a => "901a-2", b => "901b-2", subfields => ["a", 0, "b", 0] },
        { a => "901a-3", subfields => ["a", 0] },
    ],
    902 => [
        { a => ["a1", "a2", "a3", "a4", "a5"], b => ["b1", "b2"], c => "c1",
            subfields => ["a", 0, "a", 1, "a", 2, "b", 0, "a", 3, "b", 1, "c", 0, "a", 4],
        },
    ],
};

ok($hash = $isis->to_hash({ mfn => $isis->mfn, include_subfields => 1 }), 'to_hash(mfn,include_subfields)');
if ($debug) {
    diag "to_hash = ",Dumper( $hash );
}
is_deeply( $hash, $expected_with_subfields, 'hash is_deeply');

# join_subfields_with turns repeated subfields into one joined string.
my $expected_joined = {
    "000" => [42],
    900 => [{ a => "900a", b => "900b", c => "900c" }],
    901 => [
        { a => "901a-1", b => "901b-1", c => "901c-1" },
        { a => "901a-2", b => "901b-2" },
        { a => "901a-3" },
    ],
    902 => [{ a => "a1 ; a2 ; a3 ; a4 ; a5", b => "b1 ; b2", c => "c1" }],
};

ok($hash = $isis->to_hash({ mfn => $isis->mfn, join_subfields_with => ' ; ' }), 'to_hash(mfn,join_subfields_with)');
if ($debug) {
    diag "to_hash = ",Dumper( $hash );
}
is_deeply( $hash, $expected_joined, 'hash is_deeply');
274 dpavlin 61
# split_on_delimiters
#
# Values here carry plain-text delimiters inside one subfield. For every
# field/subfield/delimiter triple in $split_on_delimiters a substitution is
# generated (as a string) that turns "<delimiter>text" into "^<new subfield>text";
# the list is handed to to_hash through its regexps option.

$isis->{record} = {
    900 => [ '^a900a : 900b ; 900c' ],
    901 => [
        '^a901a-1 x 901b-1 y 901c-1',
        '^b901b-2 x 901b-2',
        '^c901c-3 y 901c-3',
    ],
};

# field => { subfield => { delimiter => subfield that starts after it } }
my $split_on_delimiters = {
    900 => { a => { ' : ' => 'b', ' ; ' => 'c' } },
    901 => {
        a => { ' x ' => 'b', ' y ' => 'c' },
        b => { ' x ' => 'b' },
        c => { ' y ' => 'c' }
    },
};

# Diagnostics are gated on $debug like everywhere else in this file.
diag "split_on_delimiters = ", Dumper($split_on_delimiters) if ($debug);

my $regexpes;

# Keys are sorted so that the generated list is the same on every run.
foreach my $f (sort keys %$split_on_delimiters) {
    diag "--- f: $f" if ($debug);
    foreach my $sf (sort keys %{ $split_on_delimiters->{$f} }) {
        diag "---- sf: $sf" if ($debug);

        # Each substitution only matches while no '^' sits between the
        # subfield marker and the delimiter, so a delimiter further right in
        # the value has to be rewritten first. Reverse sorted order gives
        # that sequence for the delimiters used here (' ; ' before ' : ',
        # ' y ' before ' x ').
        # NOTE(review): assumes to_hash applies the list in array order --
        # confirm against Biblio::Isis::to_hash.
        foreach my $patt (reverse sort keys %{ $split_on_delimiters->{$f}->{$sf} }) {
            my $new_sf = $split_on_delimiters->{$f}->{$sf}->{$patt} || die "no field?";
            diag "----- patt: $patt -> $new_sf" if ($debug);

            # fool-proof spaces in pattern: any run of whitespace in the
            # delimiter becomes \s+ in the generated regex
            $patt =~ s/\s+/\\s\+/g;

            push @{ $regexpes->{$f} },
                's/\^' . $sf . '([^\^]+)' . $patt . '([^\^]+)/^' . $sf . '$1^' . $new_sf . '$2/g';
        }
    }
}

diag "generated regexpes = ", Dumper( $regexpes ) if ($debug);


ok($hash = $isis->to_hash({ mfn => $isis->mfn, regexps => $regexpes, }), 'to_hash(mfn,regexpes)');
diag "to_hash = ",Dumper( $hash ) if ($debug);
is_deeply( $hash, {
    "000" => [42],
    900 => [{ a => "900a", b => "900b", c => "900c" }],
    901 => [
        { a => "901a-1", b => "901b-1", c => "901c-1" },
        { b => ["901b-2", "901b-2"] },
        { c => ["901c-3", "901c-3"] },
    ],
}, 'hash is_deeply');

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26