--- trunk/conf/mjesec.yml 2006/09/06 19:25:22 636 +++ trunk/conf/mjesec.yml 2006/11/03 20:41:12 773 @@ -226,9 +226,7 @@ credit: 10000 - to: ffsk credit: 10000 - - to: ffsfb - credit: 10000 - - to: ffsfm + - to: ffsf credit: 10000 - to: ffso credit: 10000 @@ -308,34 +306,42 @@ type: isis path: '/backup/isis_backup/A105-1/ISIS/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis.pm' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffar: name: 'Arheologija, Filozofski fakultet u Zagrebu' input: - name: libri - type: isis - path: '/backup/isis_backup/A018-2/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' + - name: libri + type: isis + path: '/backup/isis_backup/A018-2/isisdata/latest/LIBRI/LIBRI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' + - name: peri + type: isis + path: '/backup/isis_backup/A018-2/isisdata/latest/PERI/PERI' + encoding: 'cp852' + #limit: 10 + #modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' ffet: name: 'Etnologija, Filozofski fakultet u Zagrebu' input: name: libri type: isis - path: '/backup/isis_backup/A203-2/ISISDATA/latest/LIBRI/LIBRI' + path: '/backup/isis_backup/A203-3/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' fffi: name: 'Filozofija, Filozofski fakultet u Zagrebu' @@ -344,10 +350,10 @@ type: isis path: '/backup/isis_backup/A102-1B/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' fffo: name: 'Fonetika, Filozofski fakultet u Zagrebu' @@ -356,18 +362,18 @@ type: isis path: '/backup/isis_backup/novi-40162/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' - name: arti type: isis path: '/backup/isis_backup/novi-40162/ISISDATA/latest/ARTI/ARTI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-arti.pl' ffge: @@ -377,10 +383,10 @@ type: isis path: '/backup/isis_backup/A106-1/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffhu: name: 'Hungarologija, Filozofski fakultet u Zagrebu' @@ -389,10 +395,10 @@ type: isis path: '/backup/isis_backup/B001-2/winisis/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-libri.pl' ffiz: name: 'Informacijske znanosti, Filozofski fakultet u Zagrebu' @@ -401,10 +407,10 @@ type: isis path: '/backup/isis_backup/A129-2/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffkf: name: 'Klasièna filologija, Filozofski fakultet u Zagrebu' @@ -413,34 +419,40 @@ type: isis path: '/backup/isis_backup/A209-2/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffkk: name: 'Komparativna knji¾evnost, Filozofski fakultet u Zagrebu' input: - name: libri type: isis +# path: '/home/mglavica/mnt/LIBRI/LIBRI' path: '/backup/isis_backup/A207-3/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' + - name: peri + type: isis + path: '/backup/isis_backup/A207-3/isisdata/latest/PERI/PERI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-libri.pl' - name: arti type: isis +# path: '/home/mglavica/mnt/ARTI/ARTI' path: '/backup/isis_backup/A207-3/isisdata/latest/ARTI/ARTI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 - modify_records: - 200: - '^f': - '; ': '^x' + modify_file: 'conf/modify/ffkk-arti.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-arti.pl' fflo: name: 'Lingvistika, Filozofski fakultet u Zagrebu' @@ -449,42 +461,10 @@ type: isis path: '/backup/isis_backup/A108-1/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 modify_file: 'conf/modify/common.pl' - modify_records: - 200: - '^k': - '^e': ' : ' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '^k': ' ; ' - '*': - '^g': ' ; ' - '^a': - ' : ': '^e' - ' = ': '^d' - ' ; ': '^k' - 210: - '^a': - '^c': '^b' - '^b': - ' ; ': '^a' - ' : ': '^b' - '^d': '^c' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' fftu: name: 'Turkologija, Filozofski fakultet u Zagrebu' @@ -493,10 +473,10 @@ type: isis path: '/backup/isis_backup/B025-2/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffpe: name: 'Pedagogija, Filozofski fakultet u Zagrebu' @@ -505,10 +485,10 @@ type: isis path: '/backup/isis_backup/A226-1/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffpo: name: 'Povijest, Filozofski fakultet u Zagrebu' @@ -517,10 +497,9 @@ type: isis path: '/backup/isis_backup/A-201-1/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffpu: name: 'Povijest umjetnosti, Filozofski fakultet u Zagrebu' @@ -529,10 +508,10 @@ type: isis path: '/backup/isis_backup/C124-3/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffps: # all variables here will be available as config variables in template @@ -555,45 +534,19 @@ encoding: 'cp852' # lookup - lookup: 'conf/lookup/isis_ffzg.yml' + # lookup: 'conf/lookup/isis_ffzg.yml' # limit number of records to read from database #limit: 10 - modify_records: - 200: - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - '^c': '. ' - 210: - '^a': - '^c': '^b' - '^b': - ' : ': '^b' - '^d': '^c' - '*': - '. (': '. (^e' - '^e': - ' : ': ' ^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' + modify_file: 'conf/modify/common.pl' + # define normalisation for that source normalize: # which tag to use in normalize xml for data? # tag: 'isis' # path to normalization xml - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-libri.pl' #path: 'conf/normalize/isis_ffzg.yml' # another input database @@ -601,10 +554,10 @@ type: isis path: '/backup/isis_backup/sunce2/isisdata/latest/PERI/PERI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + # modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-peri.pl' ffro: name: 'Romanistika, Filozofski fakultet u Zagrebu' @@ -613,10 +566,10 @@ type: isis path: '/backup/isis_backup/A224-6/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffsk: name: 'Skandinavistika, Filozofski fakultet u Zagrebu' @@ -625,90 +578,40 @@ type: isis path: '/backup/isis_backup/B009-2/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' - ffsfb: - name: 'Slavenska filologija (B), Filozofski fakulteti u Zagrebu' + ffsf: + name: 'Slavenska filologija, Filozofski fakulteti u Zagrebu' input: - name: libri - type: isis - path: '/data/isis_data/sfb/LIBRI/LIBRI' -# path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' : ': '^e' - ' = ': '^d' - '^k': - '^e': ' : ' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '^k': ' ; ' - '*': - '^g': ' ; ' - 210: - '^a': - '^c': '^b' - '^b': - ' ; ': '^a' - ' : ': '^b' - '^d': '^c' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - ffsfm: - name: 'Slavenska filologija (M), Filozofski fakulteti u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' + - name: blibri + type: isis +# path: '/data/isis_data/sfb/LIBRI/LIBRI' + path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/ff-libri.pl' + - name: mlibri + type: isis + path: '/data/isis_data/sfm/LIBRI/LIBRI' +# path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' + - name: peri + type: isis + path: '/backup/isis_backup/A125-2/ISISDATA/latest/PERI/PERI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' ffso: name: 'Sociologija, Filozofski fakultet u Zagrebu' @@ -717,37 +620,22 @@ type: isis path: '/backup/isis_backup/A002-3/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 - modify_records: - 200: - '^a': - ' : ': '^e' - ' = ': '^d' - ' ; ': '^k' - '^k': - '^e': ' : ' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '^k': ' ; ' - '*': - '^g': ' ; ' + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffta: name: 'Talijanistika, Filozofski fakultet u Zagrebu' input: name: libri type: isis - path: '/backup/isis_backup/A224-1/isisdata/latest/LIBRI/LIBRI' + path: '/backup/isis_backup/A225-2/isisdata/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffsr: name: 'Sredi¹nja èitaonica, Filozofski fakultet u Zagrebu' @@ -756,10 +644,10 @@ type: isis path: '/backup/isis_backup/A112-1/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' ffmic: name: 'Meðunarodni istra¾ivaèki centar za kasnu antiku i srednji vijek' @@ -768,116 +656,108 @@ type: isis path: '/backup/isis_backup/C107-9/ISISDATA/latest/LIBRI/LIBRI' encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - efzg: - name: 'Ekonomski fakutet u Zagrebu' - input: - name: knjige - type: marc - path: '/data/drustvene/efzg/unimarc.iso' - encoding: 'cp852' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' - #limit: 1000 - normalize: - path: 'conf/normalize/common.pl' - - eizg: - name: 'Ekonomski institut u Zagrebu' - input: - name: bib - type: isis - path: '/data/drustvene/eizg/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 100 - normalize: - path: 'conf/normalize/common.pl' - - efos: - name: 'Ekonomski fakutet u Osijeku' - input: - name: knjige - type: marc - path: '/data/drustvene/efos/EFOSBAZA.ISO' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - #recode: '^ È ~ è ] Æ } æ | ð \[ © { ¹ @ ® ` ¾' - lookup: 'conf/lookup/efos.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - irmo: - name: 'Institut za meðunarodne odnose u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/irmo/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - hika: - name: 'Fakultet za turistièki i hotelski menad¾ment u Opatiji' - input: - name: knjige - type: marc - path: '/data/drustvene/hika/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - iztzg: - name: 'Institut za turizam u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/iztzg/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - jzav: - name: 'Jadranski zavod' - input: - name: bib - type: isis - path: '/data/drustvene/jzav/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/jzav.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ijf: - name: 'Institut za javne financije' - input: - name: knjige - type: marc - path: '/data/drustvene/ijf/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/ff-libri.pl' +# +# efzg: +# name: 'Ekonomski fakutet u Zagrebu' +# input: +# name: knjige +# type: marc +# path: '/data/drustvene/efzg/unimarc.iso' +# encoding: 'cp852' +# # CroList recoding pairs to fix encoding problems +# recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' +# #limit: 1000 +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# eizg: +# name: 'Ekonomski institut u Zagrebu' +# input: +# name: bib +# type: isis +# path: '/data/drustvene/eizg/BIB' +# encoding: 'cp852' +# #limit: 100 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# efos: +# name: 'Ekonomski fakutet u Osijeku' +# input: +# name: knjige +# type: marc +# path: '/data/drustvene/efos/EFOSBAZA.ISO' +# encoding: 'ISO-8859-2' +# # CroList recoding pairs to fix encoding problems +# #recode: '^ È ~ è ] Æ } æ | ð \[ © { ¹ @ ® ` ¾' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# irmo: +# name: 'Institut za meðunarodne odnose u Zagrebu' +# input: +# name: knjige +# type: isis +# path: '/data/drustvene/irmo/LIBRI' +# encoding: 'cp852' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# hika: +# name: 'Fakultet za turistièki i hotelski menad¾ment u Opatiji' +# input: +# name: knjige +# type: marc +# path: '/data/drustvene/hika/szi.iso' +# encoding: 'ISO-8859-2' +# # CroList recoding pairs to fix encoding problems +# recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# iztzg: +# name: 'Institut za turizam u Zagrebu' +# input: +# name: knjige +# type: isis +# path: '/data/drustvene/iztzg/BIB' +# encoding: 'cp852' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# jzav: +# name: 'Jadranski zavod' +# input: +# name: bib +# type: isis +# path: '/data/drustvene/jzav/BIB' +# encoding: 'cp852' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' +# +# ijf: +# name: 'Institut za javne financije' +# input: +# name: knjige +# type: marc +# path: '/data/drustvene/ijf/szi.iso' +# encoding: 'ISO-8859-2' +# # CroList recoding pairs to fix encoding problems +# recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' +# #limit: 10 +# normalize: +# path: 'conf/normalize/ff-libri.pl' -# Elektronièki èasopisi +## Elektronièki èasopisi emerald: name: 'EmeraldFulltext' input: @@ -892,3 +772,44 @@ path: 'conf/normalize/excel_emerald.pl' +## Wiley zbirka + wiley: + name: 'Wiley Intescience Full' + input: + - name: full + type: marc + path: '/data/FF/wiley/wiley2.mrc' + encoding: 'UTF-8' + normalize: + path: 'conf/normalize/marc-cufts.pl' + - name: licenced + type: excel + path: '/data/FF/wiley/wiley_casopisi2006.xls' + worksheet: 'licenced' + from: 1 + encoding: 'windows-1250' + normalize: + path: 'conf/normalize/excel-wiley.pl' + - name: nourl + type: marc + path: '/data/webpac2/out/marc/wiley-licenced.marc' + encoding: 'UTF-8' + normalize: + path: 'conf/normalize/marc-wiley-nourl.pl' +# - name: licenced +# type: marc +# path: '/data/FF/wiley/wiley-licenced.marc' +# encoding: 'UTF-8' +# normalize: +# path: 'conf/normalize/common.pl' + + nsk: + name: 'Nacionalna i sveucilisna knjiznica' + input: + name: baza + type: marc + path: '/backup/data/NSK/BBaza.ISO' + encoding: 'ISO-8859-2' + normalize: + path: 'conf/normalize/marc-nsk.pl' +