ecas configuration changes
[webpac2] / vhost / ecas / config.yml
index b245451..da56e32 100644 (file)
@@ -15,153 +15,185 @@ vhost:
 #    - STREQ: 'Cijeli naslov'
 #
 
-use_indexer: 'hyperestraier'
-
-hyperestraier:
-  masterurl: 'http://localhost:1978'
-  user: 'admin'
-  passwd: 'admin'
-  
-  # number of results on each page
-  hits_on_page: 10
-  # number of results to fetch for suggestion (it will fold multiple sameones)
-  hits_for_suggest: 20
-  # which tag type to use for search engine (used while indexing)
-  type: 'search'
-  #
-
-kinosearch:
-  index_path: 'var/kinosearch/ecas'
-  # clean database before opening? (WARNING: this erases existing database)
-  clean: 1
-  # which field type to index?
-  type: 'search'
-
 databases:
   ecas:
     name: 'Katalog elektroničkih časopisa'
-    description: 'dostupnih u zbirkama nabavljenim za potrebe visokoškolskih i znanstvenih ustanova Republike Hrvatske'
+#    description: 'dostupnih u zbirkama nabavljenim za potrebe visokoškolskih i znanstvenih ustanova Republike Hrvatske'
     input:
       - name: 'cairn'
-        description: 'Carin'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/cairn/Revues_Cairn090420.xls'
-        encoding: 'utf-8'
-        normalize:
-          path: 'vhost/ecas/cairn.pl'
+        description: 'Cairn'
+        module: 'WebPAC::Input::CSV'
+        path: 'vhost/ecas/data/cairn/latest/cairn.csv'
+        from: 1
+        to: 1000
+        normalize:
+          - path: 'vhost/ecas/cairn.pl'
+      - name: 'cambridge'
+        description: 'Cambridge Journals, HSS Collection'
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/cambridge/latest/cambridge-hss.txt'
+        normalize:
+          - path: 'vhost/ecas/kbar.pl'
+        skip: 0
       - name: 'doaj'
-        description: 'DOAJ'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/doaj/doaj-20090416.xls'
-        encoding: 'utf-8'
+        description: 'DOAJ - Directory of Open Access Journals'
+        module: 'WebPAC::Input::CSV'
+        path: 'vhost/ecas/data/doaj/latest/doaj.csv'
         normalize:
-          path: 'vhost/ecas/doaj.pl'
-      - name: 'ebsco-asc'
+          path: 'vhost/ecas/doaj.pl'
+      - name: 'ebsco-a9h'
         description: 'EBSCO Academic Search Complete'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/ebsco/a9h-ft.marc'
+        path: 'vhost/ecas/data/ebsco/latest/a9h-ft.marc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
-      - name: 'ebsco-bsc'
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-bth'
         description: 'EBSCO Business Source Complete'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/ebsco/bth-ft.marc'
+        path: 'vhost/ecas/data/ebsco/latest/bth-ft.marc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
-      - name: 'ebsco-mfp'
-        description: 'EBSCO MasterFILE Premier'
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-c8h'
+        description: 'EBSCO CINAHL with Full Text'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/ebsco/f5h-ft.marc'
+        path: 'vhost/ecas/data/ebsco/latest/c8h-ft.marc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
-      - name: 'ebsco-gf'
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-f3h'
+        description: 'EBSCO Film & Television Literature Index with Full Text'
+        module: 'WebPAC::Input::MARC'
+        path: 'vhost/ecas/data/ebsco/latest/f3h-ft.marc'
+        normalize:
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-8gh'
         description: 'EBSCO GreenFILE'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/ebsco/8gh-ft.marc'
+        path: 'vhost/ecas/data/ebsco/latest/8gh-ft.marc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
-      - name: 'ebsco-si'
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-hxh'
+        description: 'EBSCO Health Source - Consumer Edition'
+        module: 'WebPAC::Input::MARC'
+        path: 'vhost/ecas/data/ebsco/latest/hxh-ft.marc'
+        normalize:
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-hch'
+        description: 'EBSCO Health Source: Nursing/Academic Edition'
+        module: 'WebPAC::Input::MARC'
+        path: 'vhost/ecas/data/ebsco/latest/hch-ft.marc'
+        normalize:
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-f5h'
+        description: 'EBSCO MasterFILE Premier'
+        module: 'WebPAC::Input::MARC'
+        path: 'vhost/ecas/data/ebsco/latest/f5h-ft.marc'
+        normalize:
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-sih'
         description: 'EBSCO SocINDEX with Full Text'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/ebsco/sih-ft.marc'
+        path: 'vhost/ecas/data/ebsco/latest/sih-ft.marc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'ebsco-pbh'
+        description: 'EBSCO Psychology and Behavioral Sciences Collection'
+        module: 'WebPAC::Input::MARC'
+        path: 'vhost/ecas/data/ebsco/latest/pbh-ft.marc'
+        normalize:
+          - path: 'vhost/ecas/marc-ebsco.pl'
+      - name: 'psycarticles'
+        description: 'PsycARTICLES'
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/psycarticles/latest/psycarticles.txt'
+        normalize:
+          path: 'vhost/ecas/kbart-psycarticles-ebsco.pl'
+        from: 1
+        to: 250
+        skip: 0
       - name: 'emerald'
-        description: 'Emerald EMX95'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/emerald/emx95.xls'
-        encoding: 'utf-8'
+        description: 'Emerald Journals'
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/emerald/latest/emerald.txt'
         normalize:
-          path: 'vhost/ecas/emerald.pl'
+          path: 'vhost/ecas/kbar.pl'
+        skip: 0
       - name: 'hrcak'
-        description: 'Hrcak'
+        description: 'Hrčak'
         module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/hrcak/hrcak-naslovi.xls'
-        encoding: 'windows-1250'
+        from: 1
+        to: 360
+        worksheet: 'Sheet1'
+        path: 'vhost/ecas/data/hrcak/latest/hrcak.xls'
         normalize:
           path: 'vhost/ecas/hrcak.pl'
+        skip: 0
       - name: 'jstor'
         description: 'JSTOR'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/jstor/as.titleList.xls'
-        encoding: 'windows-1250'
-        normalize:
-          path: 'vhost/ecas/jstor.pl'
-      - name: 'jstor'
-        description: 'JSTOR'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/jstor/asii.titleList.xls'
-        encoding: 'windows-1250'
-        normalize:
-          path: 'vhost/ecas/jstor.pl'
-      - name: 'jstor'
-        description: 'JSTOR'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/jstor/asiii.titleList.xls'
-        encoding: 'windows-1250'
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/jstor/latest/jstor.txt'
         normalize:
-          path: 'vhost/ecas/jstor.pl'
-      - name: 'jstor'
-        description: 'JSTOR'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/jstor/asiv.titleList.xls'
-        encoding: 'windows-1250'
-        normalize:
-          path: 'vhost/ecas/jstor.pl'
-      - name: 'jstor'
-        description: 'JSTOR'
-        module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/jstor/asv.titleList.xls'
-        encoding: 'windows-1250'
-        normalize:
-          path: 'vhost/ecas/jstor.pl'
+          - path: 'vhost/ecas/kbar.pl'
       - name: 'ovid'
-        description: 'Ovid Full Text Journals, PsycARTICLES'
-        module: 'WebPAC::Input::Ovid'
-        path: '/data/FF/ecasopisi/ovid/cites-all.txt'
-        encoding: 'iso-8859-1'
+        description: 'Ovid Full Text'
+        module: 'WebPAC::Input::OvidOld'
+        path: 'vhost/ecas/data/ovid/latest/ovid-citation-all.txt'
         normalize:
-          path: 'vhost/ecas/ovid.pl'
+          - path: 'vhost/ecas/ovid.pl'
+        skip: 0
       - name: 'oxford'
         description: 'Oxford Journals'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/oxford/sites.dtl'
+        path: 'vhost/ecas/data/oxford/sites.dtl'
         normalize:
           path: 'vhost/ecas/marc.pl'
+        skip: 1
       - name: 'muse'
         description: 'Project MUSE'
         module: 'WebPAC::Input::MARC'
-        path: '/data/FF/ecasopisi/muse/premium.mrc'
+        path: 'vhost/ecas/data/muse/latest/premium.mrc'
         normalize:
-          path: 'vhost/ecas/marc.pl'
+          - path: 'vhost/ecas/marc-muse.pl'
       - name: 'pubmed'
         description: 'PubMed Central' 
+        module: 'WebPAC::Input::CSV'
+        path: 'vhost/ecas/data/pubmed/latest/pubmed.csv'
+        from: 1
+        to: 2000
+        normalize:
+          - path: 'vhost/ecas/pubmed.pl'
+      - name: 'sd'
+        description: 'ScienceDirect' 
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/sd/latest/sd.txt'
+        from: 1
+        to: 1550
+        normalize:
+          - path: 'vhost/ecas/kbart.pl'
+      - name: 'springeravailable'
+        description: 'SpringerLink - Humanities, Social Sciences and Law' 
         module: 'WebPAC::Input::Excel'
-        path: '/data/FF/ecasopisi/pubmed/jlist.xls'
-        encoding: 'windows-1250'
+        path: 'vhost/ecas/data/springer/Hum-SocSci-Low.xls'
+        from: 1
+        to: 199
         normalize:
-          path: 'vhost/ecas/pubmed.pl'
+          - path: 'vhost/ecas/springer.pl'
+      - name: 'springerall'
+        description: 'SpringerLink - Humanities, Social Sciences and Law' 
+        module: 'WebPAC::Input::Excel'
+        path: 'vhost/ecas/data/springer/Hum-SocSci-Low.xls'
+        from: 1
+        to: 200
+        skip: 1
+        normalize:
+          - path: 'vhost/ecas/springer.pl'
+      - name: 'titles'
+        description: 'Pojedinačni naslovi' 
+        module: 'WebPAC::Input::TSV'
+        path: 'vhost/ecas/data/pojedinacni/pojedinacni.tsv'
+        skip: 0
+        normalize:
+          - path: 'vhost/ecas/pojedinacni.pl'
     output:
-      module: 'WebPAC::Output::SWISH'
-      database: 'ecas'
+      module: 'WebPAC::Output::SWISH'
+      database: 'ecas'