/[webpac2]/Webpacus/config.yml
This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Diff of /Webpacus/config.yml

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 142 by dpavlin, Fri Nov 25 00:23:33 2005 UTC revision 435 by dpavlin, Mon Apr 17 20:23:12 2006 UTC
# Line 1  Line 1 
1  --- #YAML:1.0  --- #YAML:1.0
2  # DO NOT USE TABS FOR INDENTATION OR label/value SEPARATION!!!  # DO NOT USE TABS FOR INDENTATION OR label/value SEPARATION!!!
3    
4  # configuration for hyper estraier full text search engine  # encoding of this configuration file
5    config_encoding: 'ISO-8859-2'
6    # encoding in Catalyst.
7    catalyst_encoding: 'UTF-8'
8    # relative path to sites templates under Catalyst root
9    sites_root: 'sites'
10    
11    # which indexing engine to use? (hyperestraier is default)
12    #use_indexer: 'hyperestraier'
13    use_indexer: 'kinosearch'
14    
15    # configuration for Hyper Estraier full text search engine
16  hyperestraier:  hyperestraier:
17    url: 'http://localhost:1978/node/webpac2'    #url: 'http://localhost:1978/node/webpac2'
18      masterurl: 'http://localhost:1978'
19      defaultnode: 'webpac2'
20    #  defaultnode: 'ps'
21      defaultdepth: 1
22    user: 'admin'    user: 'admin'
23    passwd: 'admin'    passwd: 'admin'
24      # don't turn this on! it will spit huge amounts of output
25      #debug: 1
26      #
27      # number of results on each page
28      hits_on_page: 30
29      # number of results to fetch for suggestion (it will fold multiple identical ones)
30      hits_for_suggest: 20
31    #    #
32    # options used while indexing    # options used while indexing
33    #    #
   # name of database (not used yet, but required)  
   database: 'test'  
34    # which tag type to use for search engine (used while indexing)    # which tag type to use for search engine (used while indexing)
35    type: 'search'    type: 'search'
36    #    #
37    # options used for Catalyst only  
38    #  # configuration for KinoSearch search engine library
39    # FIXME encoding coming from Catalyst.  kinosearch:
40    catalyst_encoding: 'UTF-8'    index_path: './kinosearch/'
41      fields:
42        - 'uri'
43        - 'AccompanyingMaterial'
44        - 'APA'
45        - 'CallNo'
46        - 'ContentsNote'
47        - 'CorporateName'
48        - 'CorporateName2'
49        - 'DatePublication'
50        - 'EditionNote'
51        - 'EditionStatement'
52        - 'ExpandedTitle'
53        - 'fond'
54        - 'Form'
55        - 'Frequency'
56        - 'GeneralNote'
57        - 'ID'
58        - 'IdentificationNumbers'
59        - 'IntellectResponsNote'
60        - 'InternalBibliographies'
61        - 'InvNo'
62        - 'ISBN'
63        - 'ISSN'
64        - 'ISN'
65        - 'IssuedWith'
66        - 'Language'
67        - 'level'
68        - 'MaterialDesignation'
69        - 'MFN'
70        - 'NamePublisher'
71        - 'Names'
72        - 'OriginatingSource'
73        - 'ParallelTitle'
74        - 'Parts'
75        - 'PartsEF'
76        - 'PartsID'
77        - 'PersonalName'
78        - 'PersonalName2'
79        - 'PersonalNameOther'
80        - 'PhysicalDescription'
81        - 'PhysicalDescriptionNote'
82        - 'PhysicalDetails'
83        - 'Piece'
84        - 'PieceAnalitic'
85        - 'PieceNum'
86        - 'PieceSubtitle'
87        - 'PlacePublication'
88        - 'Responsibility'
89        - 'ResponsibilityFirst'
90        - 'ResponsibilitySecond'
91        - 'SerialNo'
92        - 'Series'
93        - 'SeriesTitle'
94        - 'Set'
95        - 'Set2'
96        - 'Subtitle'
97        - 'Summary'
98        - 'SystemRequirements'
99        - 'titleNo'
100        - 'TitleProper'
101        - 'TitleProper2'
102        - 'UDC'
103        - 'UDC_All'
104        - 'UDCb'
105        - 'UncontrolledTerms'
106        - 'UniformHeading'
107        - 'URL'
108        - 'VolumeDesignation'
109        - 'AllThes'
110        - 'BroaderTerm'
111        - 'ClassCode'
112        - 'DescriptorEN'
113        - 'DescriptorFR'
114        - 'DescriptorGE'
115        - 'DescriptorHR'
116        - 'filename'
117        - 'format'
118        - 'headline'
119        - 'IDths'
120        - 'line'
121        - 'line2'
122        - 'line3'
123        - 'line4'
124        - 'MicrothesaurusEN'
125        - 'MicrothesaurusFR'
126        - 'MicrothesaurusGE'
127        - 'MicrothesaurusHR'
128        - 'NarrowerTerm'
129        - 'NonDescriptorEN'
130        - 'NonDescriptorFR'
131        - 'NonDescriptorGE'
132        - 'NonDescriptorHR'
133        - 'RelatedTerm'
134        - 'ScopeNoteEN'
135        - 'ScopeNoteHR'
136        - 'SeeBefore'
137        - 'SeeNext'
138        - 'Source'
139        - 'SubjectAreaHR'
140        - 'SubjectIndex'
141        - 'URL'
142      database: 'unconfigured database name'
143      label: 'unconfigured database label'
144      encoding: 'iso-8859-2'
145      # clean database before opening? (WARNING: this erases existing database)
146      clean: 1
147      # which field type to index?
148      type: 'search'
149    
150  webpac:  webpac:
151    # default template to use    # default template to use
# Line 35  webpac: Line 163  webpac:
163    webpac_encoding: 'iso-8859-2'    webpac_encoding: 'iso-8859-2'
164    # encoding expected by Catalyst    # encoding expected by Catalyst
165    out_encoding: 'utf-8'    out_encoding: 'utf-8'
166      # define different input formats (types) and perl modules to handle them
167      inputs:
168        isis: 'WebPAC::Input::ISIS'
169        marc: 'WebPAC::Input::MARC'
170    
171    editor:
172      # open this record when opening editor
173      # (it will also be used to deduce default database and input)
174      default_record_uri: 'ps/libri/1'
175    
176  # directives after this are used when indexing using core WebPAC modules  # directives after this are used when indexing using core WebPAC modules
177    
178  input:  databases:
179    # isis    # This is an empty database created only in Hyper Estraier to merge
180    type: isis    # all three databases
181    # full path to database    'webpac2':
182    path: '/data/isis_data/ps/LIBRI/LIBRI'      name: 'Search all'
183    # encoding of character set in isis data      links:
184    encoding: '852'        - to: ps
185    # lookup          credit: 10000
186    lookup: 'conf/lookup/isis.pm'        - to: kk
187    # limit number of records to read from database          credit: 10000
188  #  limit: 100        - to: jzav
189            credit: 10000
190  normalize:  
191    # which tag to use in normalize xml for data?    # site with alternative databases
192    tag: 'isis'    'hr':
193    # path to normalization xml      name: 'Primjer za hrvatsko sučelje'
194    path: 'conf/normalize/isis_ffzg.xml'      links:
195          - to: ps
196            credit: 10000
197          - to: kk
198            credit: 5000
199    
200      # Psihologija
201      'ps':
202        # all variables here will be available as config variables in template
203        name: 'Knjižnica psihologije'
204        code: 'ps'
205      
206        # define input source
207        input:
208          # this will create unique name with name of database and mfn
209          - name: libri
210            # isis
211            type: isis
212        
213            # full path to database
214            path: '/data/isis_data/ffps-libri/LIBRI'
215        
216            # encoding of character set in isis data
217            encoding: '852'
218        
219            # lookup
220            lookup: 'conf/lookup/isis.pm'
221        
222            # limit number of records to read from database
223            #limit: 100
224        
225            # define normalisation for that source
226            normalize:
227              # which tag to use in normalize xml for data?
228              tag: 'isis'
229              # path to normalization xml
230              path: 'conf/normalize/isis_ffzg.xml'
231              #path: 'conf/normalize/isis_ffzg.yml'
232      
233          # another input database
234          - name: peri
235            type: isis
236            path: '/data/isis_data/ffps-peri/PERI'
237            encoding: '852'
238            lookup: 'conf/lookup/isis.pm'
239            #limit: 100
240            normalize:
241              tag: 'isis'
242              path: 'conf/normalize/isis_ffzg.xml'
243    
244      # Komparativna
245      kk:
246        name: 'Komparativna'
247      
248        input:
249          name: libri
250          type: isis
251          path: '/data/isis_data/ffkk/LIBRI'
252          encoding: '852'
253          lookup: 'conf/lookup/isis.pm'
254          #limit: 100
255          normalize:
256            tag: 'isis'
257            path: 'conf/normalize/isis_ffzg.xml'
258      
259      jzav:
260        name: 'Jadranski zavod'
261        input:
262          name: knjige
263          type: isis
264          path: '/data/isis_data/jzav/BIB'
265          encoding: '852'
266          lookup: 'conf/lookup/jzav.yml'
267          #limit: 100
268          normalize:
269            tag: 'isis'
270            path: 'conf/normalize/isis_ffzg.xml'
271      
272      efzg:
273        name: 'Ekonomski fakultet u Zagrebu'
274        input:
275          name: knjige
276          type: marc
277          path: '/data/isis_data/efzg/unimarc.iso'
278          encoding: '852'
279          # CroList recoding pairs to fix encoding problems
280          recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾'
281          lookup: 'conf/lookup/isis.pm'
282          #limit: 100
283          normalize:
284            tag: 'isis'
285            path: 'conf/normalize/isis_ffzg.xml'
286      

Legend:
Removed from v.142  
changed lines
  Added in v.435

  ViewVC Help
Powered by ViewVC 1.1.26