23 |
F 686 10 CC |
F 686 10 CC |
24 |
F 990 11 Signatura |
F 990 11 Signatura |
25 |
F 991 12 Inventarni broj |
F 991 12 Inventarni broj |
26 |
F 10 13 ISBN |
F ISN 13 ISBN, ISSN |
27 |
F MFN 14 MFN |
F MFN 14 MFN |
28 |
F 215+ 15 Materijalni opis |
F 215+ 15 Materijalni opis |
29 |
|
F 101 16 Jezik |
30 |
|
F tip 17 Tip graπe |
31 |
"; |
"; |
32 |
|
|
33 |
|
# Set the package variable $common::database_cf to an absolute path.
# NOTE(review): presumably the databases configuration file consumed by code
# outside this chunk -- confirm against the reader of this variable.
$common::database_cf="/local/search/databases.cf"; |
34 |
|
|
35 |
#-------------------------------------------------------------------- |
#-------------------------------------------------------------------- |
36 |
# |
# |
37 |
# mps_expand(nr,"space separated string"); |
# mps_expand(nr,"space separated string"); |
42 |
my $out = ""; |
my $out = ""; |
43 |
while (my $fld = shift @_) { |
while (my $fld = shift @_) { |
44 |
if ($fld =~ s/\s*[,;\.!?'"<>\[\]]*\s+/ /g) { |
if ($fld =~ s/\s*[,;\.!?'"<>\[\]]*\s+/ /g) { |
45 |
|
$fld =~ s/></ /g; |
46 |
foreach my $w (split(/\s+/,$fld)) { |
foreach my $w (split(/\s+/,$fld)) { |
47 |
# FIX: this should be replaced by stemmer! |
# FIX: this should be replaced by stemmer! |
48 |
$out .= "W $w $nr\n"; |
# remove chars from beginning of word |
49 |
|
$w =~ s/^['"<(\[]//g; |
50 |
|
# remove chars from end of word |
51 |
|
$w =~ s/[,;\.!?'">)\]]$//g; |
52 |
|
# umlauts öÖäÄüÜ -> oe, ae, ue |
53 |
|
if ($w =~ m/[]/) { |
54 |
|
$out .= "W $w $nr\n"; |
55 |
|
$w =~ s/[]/oe/g; |
56 |
|
$w =~ s/[]/ae/g; |
57 |
|
$w =~ s/[]/ue/g; |
58 |
|
$out .= "W $w $nr\n"; |
59 |
|
# Irish Last names |
60 |
|
} elsif (($nr == 1 || $nr == 2 || $nr == 3 || $nr == 6 || $nr == 7 || $nr == 8) && $w =~ m/^Ma?c([A-Z].+)/) { |
61 |
|
$out .= "W Mc$1 $nr\n"; |
62 |
|
$out .= "W Mac$1 $nr\n"; |
63 |
|
} else { |
64 |
|
$out .= "W $w $nr\n"; |
65 |
|
} |
66 |
} |
} |
67 |
} else { |
} else { |
68 |
$out .= "W $fld $nr\n"; |
$out .= "W $fld $nr\n"; |