--- trunk/conf/mjesec.yml 2006/08/23 10:08:17 612 +++ trunk/conf/mjesec.yml 2006/10/08 18:44:42 754 @@ -9,7 +9,8 @@ sites_root: 'sites' # which indexing engine to use? (hyperestraier is default) -use_indexer: 'hyperestraier' +#use_indexer: 'hyperestraier' +use_indexer: 'hyperestraier-native' #use_indexer: 'kinosearch' # configuration for Hyper Estraier full text search engine @@ -24,6 +25,8 @@ # don't turn this on! it will spit huge amounts of output #debug: 1 # + # + path: 'casket/' # number of results on each page hits_on_page: 10 # number of results to fetch for suggestion (it will fold multiple sameones) @@ -304,9 +307,9 @@ name: libri type: isis path: '/backup/isis_backup/A105-1/ISIS/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis.pm' + encoding: 'cp852' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -316,8 +319,7 @@ name: libri type: isis path: '/backup/isis_backup/A018-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -328,8 +330,7 @@ name: libri type: isis path: '/backup/isis_backup/A203-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -340,8 +341,7 @@ name: libri type: isis path: '/backup/isis_backup/A102-1B/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -352,16 +352,14 @@ - name: libri type: isis path: '/backup/isis_backup/novi-40162/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' - name: arti type: isis path: '/backup/isis_backup/novi-40162/ISISDATA/latest/ARTI/ARTI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -373,8 +371,7 @@ name: libri type: isis path: '/backup/isis_backup/A106-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -385,8 +382,7 @@ name: libri type: isis path: '/backup/isis_backup/B001-2/winisis/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -397,9 +393,9 @@ name: libri type: isis path: '/backup/isis_backup/A129-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -409,8 +405,7 @@ name: libri type: isis path: '/backup/isis_backup/A209-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -418,14 +413,32 @@ ffkk: name: 'Komparativna knji¾evnost, Filozofski fakultet u Zagrebu' input: - name: libri - type: isis - path: '/backup/isis_backup/A207-3/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' + - name: libri + type: isis +# path: '/home/mglavica/mnt/LIBRI/LIBRI' + path: '/backup/isis_backup/A207-3/isisdata/latest/LIBRI/LIBRI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/ff-libri.pl' + - name: peri + type: isis + path: '/backup/isis_backup/A207-3/isisdata/latest/PERI/PERI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/ff-libri.pl' + - name: arti + type: isis +# path: '/home/mglavica/mnt/ARTI/ARTI' + path: '/backup/isis_backup/A207-3/isisdata/latest/ARTI/ARTI' + encoding: 'cp852' + #limit: 10 + modify_file: 'conf/modify/common.pl' + normalize: + path: 'conf/normalize/ff-arti.pl' fflo: name: 'Lingvistika, Filozofski fakultet u Zagrebu' @@ -433,31 +446,9 @@ name: libri type: isis path: '/backup/isis_backup/A108-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 - modify_records: - 200: - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - '^c': '. ' - 210: - '*': - '^c': '^b' - '^d': '^c' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -467,8 +458,7 @@ name: libri type: isis path: '/backup/isis_backup/B025-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -479,8 +469,7 @@ name: libri type: isis path: '/backup/isis_backup/A226-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -490,10 +479,9 @@ input: name: libri type: isis - path: '/backup/isis_backup/A201-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + path: '/backup/isis_backup/A-201-1/isisdata/latest/LIBRI/LIBRI' + encoding: 'cp852' + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -503,8 +491,7 @@ name: libri type: isis path: '/backup/isis_backup/C124-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -527,14 +514,16 @@ # path: '/data/isis_data/PS/LIBRI/' # encoding of character set in isis data - encoding: '852' + encoding: 'cp852' # lookup - lookup: 'conf/lookup/isis_ffzg.yml' + # lookup: 'conf/lookup/isis_ffzg.yml' # limit number of records to read from database #limit: 10 + modify_file: 'conf/modify/common.pl' + # define normalisation for that source normalize: # which tag to use in normalize xml for data? @@ -547,8 +536,7 @@ - name: peri type: isis path: '/backup/isis_backup/sunce2/isisdata/latest/PERI/PERI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -558,9 +546,8 @@ input: name: libri type: isis - path: '/backup/isis_backup/A224-2/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + path: '/backup/isis_backup/A224-6/isisdata/latest/LIBRI/LIBRI' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -571,8 +558,7 @@ name: libri type: isis path: '/backup/isis_backup/B009-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -582,35 +568,11 @@ input: name: libri type: isis - path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + path: '/data/isis_data/sfb/LIBRI/LIBRI' +# path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' + encoding: 'cp852' #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -619,35 +581,11 @@ input: name: libri type: isis - path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + path: '/data/isis_data/sfm/LIBRI/LIBRI' +# path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' + encoding: 'cp852' #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -657,9 +595,23 @@ name: libri type: isis path: '/backup/isis_backup/A002-3/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 + modify_records: + 200: + '^a': + ' : ': '^e' + ' = ': '^d' + ' ; ': '^k' + '^k': + '^e': ' : ' + '^d': + '^e': ' : ' + '^e': + '^d': ' = ' + '^k': ' ; ' + '*': + '^g': ' ; ' normalize: path: 'conf/normalize/common.pl' @@ -668,10 +620,10 @@ input: name: libri type: isis - path: '/backup/isis_backup/A224-1/isisdata/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + path: '/backup/isis_backup/A225-2/isisdata/latest/LIBRI/LIBRI' + encoding: 'cp852' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -681,9 +633,9 @@ name: libri type: isis path: '/backup/isis_backup/A112-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 + modify_file: 'conf/modify/common.pl' normalize: path: 'conf/normalize/common.pl' @@ -693,8 +645,7 @@ name: libri type: isis path: '/backup/isis_backup/C107-9/ISISDATA/latest/LIBRI/LIBRI' - encoding: '852' - lookup: 'conf/lookup/isis_ffzg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -705,10 +656,9 @@ name: knjige type: marc path: '/data/drustvene/efzg/unimarc.iso' - encoding: '852' + encoding: 'cp852' # CroList recoding pairs to fix encoding problems recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' #limit: 1000 normalize: path: 'conf/normalize/common.pl' @@ -719,8 +669,7 @@ name: bib type: isis path: '/data/drustvene/eizg/BIB' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' + encoding: 'cp852' #limit: 100 normalize: path: 'conf/normalize/common.pl' @@ -734,7 +683,6 @@ encoding: 'ISO-8859-2' # CroList recoding pairs to fix encoding problems #recode: '^ È ~ è ] Æ } æ | ð \[ © { ¹ @ ® ` ¾' - lookup: 'conf/lookup/efos.yml' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -745,8 +693,7 @@ name: knjige type: isis path: '/data/drustvene/irmo/LIBRI' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -760,7 +707,6 @@ encoding: 'ISO-8859-2' # CroList recoding pairs to fix encoding problems recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -771,8 +717,7 @@ name: knjige type: isis path: '/data/drustvene/iztzg/BIB' - encoding: '852' - lookup: 'conf/lookup/eizg.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -783,8 +728,7 @@ name: bib type: isis path: '/data/drustvene/jzav/BIB' - encoding: '852' - lookup: 'conf/lookup/jzav.yml' + encoding: 'cp852' #limit: 10 normalize: path: 'conf/normalize/common.pl' @@ -798,7 +742,6 @@ encoding: 'ISO-8859-2' # CroList recoding pairs to fix encoding problems recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' #limit: 10 normalize: path: 'conf/normalize/common.pl'