--- trunk/conf/mjesec.yml 2006/08/23 10:08:17 612 +++ trunk/conf/mjesec.yml 2008/02/12 18:32:13 1090 @@ -9,7 +9,8 @@ sites_root: 'sites' # which indexing engine to use? (hyperestraier is default) -use_indexer: 'hyperestraier' +#use_indexer: 'hyperestraier' +use_indexer: 'hyperestraier-native' #use_indexer: 'kinosearch' # configuration for Hyper Estraier full text search engine @@ -24,6 +25,8 @@ # don't turn this on! it will spit huge amounts of output #debug: 1 # + # + path: 'casket/' # number of results on each page hits_on_page: 10 # number of results to fetch for suggestion (it will fold multiple sameones) @@ -43,107 +46,6 @@ # configuration for KinoSearch search engine library kinosearch: index_path: './kinosearch/' - fields: - - 'uri' - - 'AccompanyingMaterial' - - 'APA' - - 'CallNo' - - 'ContentsNote' - - 'CorporateName' - - 'CorporateName2' - - 'DatePublication' - - 'EditionNote' - - 'EditionStatement' - - 'ExpandedTitle' - - 'fond' - - 'Form' - - 'Frequency' - - 'GeneralNote' - - 'ID' - - 'IdentificationNumbers' - - 'IntellectResponsNote' - - 'InternalBibliographies' - - 'InvNo' - - 'ISBN' - - 'ISSN' - - 'ISN' - - 'IssuedWith' - - 'Language' - - 'level' - - 'MaterialDesignation' - - 'MFN' - - 'NamePublisher' - - 'Names' - - 'OriginatingSource' - - 'ParallelTitle' - - 'Parts' - - 'PartsEF' - - 'PartsID' - - 'PersonalName' - - 'PersonalName2' - - 'PersonalNameOther' - - 'PhysicalDescription' - - 'PhysicalDescriptionNote' - - 'PhysicalDetails' - - 'Piece' - - 'PieceAnalitic' - - 'PieceNum' - - 'PieceSubtitle' - - 'PlacePublication' - - 'Responsibility' - - 'ResponsibilityFirst' - - 'ResponsibilitySecond' - - 'SerialNo' - - 'Series' - - 'SeriesTitle' - - 'Set' - - 'Set2' - - 'Subtitle' - - 'Summary' - - 'SystemRequirements' - - 'titleNo' - - 'TitleProper' - - 'TitleProper2' - - 'UDC' - - 'UDC_All' - - 'UDCb' - - 'UncontrolledTerms' - - 'UniformHeading' - - 'URL' - - 'VolumeDesignation' - - 'AllThes' - - 'BroaderTerm' - - 'ClassCode' - - 'DescriptorEN' - - 'DescriptorFR' - - 'DescriptorGE' - - 'DescriptorHR' - - 'filename' - - 'format' - - 'headline' - - 'IDths' - - 'line' - - 'line2' - - 'line3' - - 'line4' - - 'MicrothesaurusEN' - - 'MicrothesaurusFR' - - 'MicrothesaurusGE' - - 'MicrothesaurusHR' - - 'NarrowerTerm' - - 'NonDescriptorEN' - - 'NonDescriptorFR' - - 'NonDescriptorGE' - - 'NonDescriptorHR' - - 'RelatedTerm' - - 'ScopeNoteEN' - - 'ScopeNoteHR' - - 'SeeBefore' - - 'SeeNext' - - 'Source' - - 'SubjectAreaHR' - - 'SubjectIndex' - - 'URL' database: 'unconfigured database name' label: 'unconfigured database label' encoding: 'iso-8859-2' @@ -173,7 +75,12 @@ isis: 'WebPAC::Input::ISIS' marc: 'WebPAC::Input::MARC' excel: 'WebPAC::Input::Excel' - + # define delimiters for validation + delimiters: + - ' ; ' + - ' : ' + - ' / ' + - ' = ' editor: # open this record when opening editor # (it will also be used to deduce default database and input) @@ -223,9 +130,7 @@ credit: 10000 - to: ffsk credit: 10000 - - to: ffsfb - credit: 10000 - - to: ffsfm + - to: ffsf credit: 10000 - to: ffso credit: 10000 @@ -235,35 +140,23 @@ credit: 10000 - to: ffmic credit: 10000 - - to: efzg - credit: 10000 - - to: eizg - credit: 10000 - - to: efos - credit: 10000 - - to: irmo + - to: vusp credit: 10000 - - to: hika + - to: kem credit: 10000 - - to: iztzg - credit: 10000 - - to: jzav - credit: 10000 - - to: ijf - credit: 10000 - - to: emerald + - to: efzg credit: 10000 - # site with alternative databases - 'hr': - name: 'Primjer za hrvatsko sučelje' - links: - - to: ffps - credit: 10000 - - to: ffkk - credit: 5000 - - to: emerald - credit: 5000 +# # site with alternative databases +# 'hr': +# name: 'Primjer za hrvatsko sučelje' +# links: +# - to: ffps +# credit: 10000 +# - to: ffkk +# credit: 5000 +# - to: emerald +# credit: 5000 # 'ffps': @@ -272,549 +165,114 @@ # - to: ffps # credit: 10000 - 'drustvene': - name: 'Katalog knjižnica društvenih znanosti' - links: - - to: efzg - credit: 10000 - - to: eizg - credit: 10000 - - to: efos - credit: 10000 - - to: irmo - credit: 10000 - - to: hika - credit: 10000 - - to: iztzg - credit: 10000 - - to: jzav - credit: 10000 - - to: ijf - credit: 10000 +# 'drustvene': +# name: 'Katalog knjižnica društvenih znanosti' +# links: +# - to: efzg +# credit: 10000 +# - to: eizg +# credit: 10000 +# - to: efos +# credit: 10000 +# - to: irmo +# credit: 10000 +# - to: hika +# credit: 10000 +# - to: iztzg +# credit: 10000 +# - to: jzav +# credit: 10000 +# - to: ijf +# credit: 10000 - 'ecasopisi': - name: 'Katalog elektroničkih časopisa' - links: - - to: emerald - credit: 10000 - - ffan: - name: 'Anglistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A105-1/ISIS/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis.pm' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffar: - name: 'Arheologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A018-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffet: - name: 'Etnologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A203-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - fffi: - name: 'Filozofija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A102-1B/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' +# 'ecasopisi': +# name: 'Katalog elektroničkih časopisa' +# links: +# - to: emerald +# credit: 10000 - fffo: - name: 'Fonetika, Filozofski fakultet u Zagrebu' + hazu: + name: 'HAZU' input: - - name: libri - type: isis - path: '/backup/isis_backup/novi-40162/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - name: arti + - name: bib type: isis - path: '/backup/isis_backup/novi-40162/ISISDATA/latest/ARTI/ARTI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + path: '/data/unizg/hazu/BIB' + encoding: 'cp852' + modify_file: 'conf/modify/common.pl' normalize: - path: 'conf/normalize/common.pl' - - - ffge: - name: 'Germanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A106-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' - ffhu: - name: 'Hungarologija, Filozofski fakultet u Zagrebu' + sand: + name: 'SAND' input: - name: libri - type: isis - path: '/backup/isis_backup/B001-2/winisis/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + name: casopisi + type: dbf + path: '/data/unizg/casopisi/sys/cas2000.dbf' normalize: path: 'conf/normalize/common.pl' - - ffiz: - name: 'Informacijske znanosti, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A129-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffkf: - name: 'Klasična filologija, Filozofski fakultet u Zagrebu' +# mapping_path: 'conf/input/dbf/cas2000.yml' + + hidra: + name: 'HIDRA' input: - name: libri - type: isis - path: '/backup/isis_backup/A209-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffkk: - name: 'Komparativna književnost, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A207-3/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - fflo: - name: 'Lingvistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A108-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - '^c': '. ' - 210: - '*': - '^c': '^b' - '^d': '^c' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - fftu: - name: 'Turkologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/B025-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffpe: - name: 'Pedagogija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A226-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' + - name: bib + type: isis + path: '/data/hidra/test/BIB' + encoding: 'cp852' + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' - ffpo: - name: 'Povijest, Filozofski fakultet u Zagrebu' + efzg: + name: 'EFZG' input: - name: libri - type: isis - path: '/backup/isis_backup/A201-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffpu: - name: 'Povijest umjetnosti, Filozofski fakultet u Zagrebu' + - name: crolist + type: marc + path: '/data/unizg/drustvene/efzg/unimarc.iso' + encoding: 'ISO-8859-2' + normalize: + path: 'conf/normalize/minimal.pl' + + ipu: + name: 'Institut za povijest umjetnosti' input: - name: libri - type: isis - path: '/backup/isis_backup/C124-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffps: - # all variables here will be available as config variables in template - name: 'Psihologija, Filozofski fakultet u Zagrebu' - code: 'ps' - url: 'http://www.knjiznice.ffzg.hr/psihologija' + - name: bibl + type: isis + path: '/data/unizg/humanistika/ipu/20071115/bibl/BIBL' + encoding: 'cp852' + # modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/minimal.pl' - # define input source + zvonar: + name: 'HAZU Odsjek za povijesne znanosti' input: - # this will create unique name with name of database and mfn - name: libri - # isis type: isis - - # full path to database - path: '/backup/isis_backup/sunce2/isisdata/latest/LIBRI/' - # path: '/data/isis_data/PS/LIBRI/' - - # encoding of character set in isis data - encoding: '852' - - # lookup - lookup: 'conf/lookup/isis_ffzg.yml' - - # limit number of records to read from database - #limit: 10 - - # define normalisation for that source + path: '/data/unizg/humanistika/hazu-p/LIBRI' normalize: - # which tag to use in normalize xml for data? - # tag: 'isis' - # path to normalization xml - path: 'conf/normalize/common.pl' - #path: 'conf/normalize/isis_ffzg.yml' - - # another input database + path: 'conf/normalize/minimal.pl' - name: peri type: isis - path: '/backup/isis_backup/sunce2/isisdata/latest/PERI/PERI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + path: '/data/unizg/humanistika/hazu-p/PERI' normalize: - path: 'conf/normalize/common.pl' - - ffro: - name: 'Romanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A224-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsk: - name: 'Skandinavistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/B009-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsfb: - name: 'Slavenska filologija (B), Filozofski fakulteti u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - ffsfm: - name: 'Slavenska filologija (M), Filozofski fakulteti u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - ffso: - name: 'Sociologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A002-3/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffta: - name: 'Talijanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A224-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsr: - name: 'Središnja čitaonica, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A112-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' + path: 'conf/normalize/minimal.pl' - ffmic: - name: 'Međunarodni istraživački centar za kasnu antiku i srednji vijek' + stross: + name: 'Strossmayerova galerija' input: - name: libri - type: isis - path: '/backup/isis_backup/C107-9/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - efzg: - name: 'Ekonomski fakutet u Zagrebu' - input: - name: knjige - type: marc - path: '/data/drustvene/efzg/unimarc.iso' - encoding: '852' - # CroList recoding pairs to fix encoding problems - recode: 'ĎC Č Ďc č ÂC Ć Âc ć ň đ ĎS Š Ďs š ĎZ Ž Ďz ž' - lookup: 'conf/lookup/efzg.yml' - #limit: 1000 - normalize: - path: 'conf/normalize/common.pl' - - eizg: - name: 'Ekonomski institut u Zagrebu' - input: - name: bib - type: isis - path: '/data/drustvene/eizg/BIB' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' - #limit: 100 - normalize: - path: 'conf/normalize/common.pl' - - efos: - name: 'Ekonomski fakutet u Osijeku' - input: - name: knjige - type: marc - path: '/data/drustvene/efos/EFOSBAZA.ISO' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - #recode: '^ Č ~ č ] Ć } ć | đ \[ Š { š @ Ž ` ž' - lookup: 'conf/lookup/efos.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - irmo: - name: 'Institut za međunarodne odnose u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/irmo/LIBRI' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - hika: - name: 'Fakultet za turistički i hotelski menadžment u Opatiji' - input: - name: knjige - type: marc - path: '/data/drustvene/hika/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ĎC Č Ďc č ÂC Ć Âc ć ň đ ĎS Š Ďs š ĎZ Ž Ďz ž' - lookup: 'conf/lookup/efzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - iztzg: - name: 'Institut za turizam u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/iztzg/BIB' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - jzav: - name: 'Jadranski zavod' - input: - name: bib - type: isis - path: '/data/drustvene/jzav/BIB' - encoding: '852' - lookup: 'conf/lookup/jzav.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ijf: - name: 'Institut za javne financije' - input: - name: knjige - type: marc - path: '/data/drustvene/ijf/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ĎC Č Ďc č ÂC Ć Âc ć ň đ ĎS Š Ďs š ĎZ Ž Ďz ž' - lookup: 'conf/lookup/efzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - -# Elektronički časopisi - emerald: - name: 'EmeraldFulltext' + - name: bib + type: isis + path: '/data/unizg/stross/BIB' + normalize: + path: 'conf/normalize/minimal.pl' + + koncar: + name: 'Končar' input: - name: ecas - type: excel - path: '/data/FF/emerald/persistenturls.xls' - worksheet: 'All Titles' - from: 20 - encoding: 'windows-1250' - #limit: 10 - normalize: - path: 'conf/normalize/excel_emerald.pl' - - + - name: unimar + type: isis + path: '/data/tehnika/koncar/UNIMAR' + normalize: + path: 'conf/normalize/minimal.pl' +