X-Git-Url: http://git.rot13.org/?a=blobdiff_plain;f=conf%2Fmjesec.yml;h=703f455e398d9e11ea700ebb248de67a0d26dea0;hb=05866fca50ed45db47a4552769f1a6e080b91397;hp=f2999d4659744a5961ea02234287a72134e5bcb2;hpb=b51c76b845c6360166dca64584b11e5b765482e8;p=webpac2 diff --git a/conf/mjesec.yml b/conf/mjesec.yml index f2999d4..703f455 100644 --- a/conf/mjesec.yml +++ b/conf/mjesec.yml @@ -9,7 +9,8 @@ catalyst_encoding: 'UTF-8' sites_root: 'sites' # which indexing engine to use? (hyperestraier is default) -use_indexer: 'hyperestraier' +#use_indexer: 'hyperestraier' +use_indexer: 'hyperestraier-native' #use_indexer: 'kinosearch' # configuration for Hyper Estraier full text search engine @@ -24,6 +25,8 @@ hyperestraier: # don't turn this on! it will spit huge amounts of output #debug: 1 # + # + path: 'casket/' # number of results on each page hits_on_page: 10 # number of results to fetch for suggestion (it will fold multiple sameones) @@ -43,107 +46,6 @@ pager: # configuration for KinoSearch search engine library kinosearch: index_path: './kinosearch/' - fields: - - 'uri' - - 'AccompanyingMaterial' - - 'APA' - - 'CallNo' - - 'ContentsNote' - - 'CorporateName' - - 'CorporateName2' - - 'DatePublication' - - 'EditionNote' - - 'EditionStatement' - - 'ExpandedTitle' - - 'fond' - - 'Form' - - 'Frequency' - - 'GeneralNote' - - 'ID' - - 'IdentificationNumbers' - - 'IntellectResponsNote' - - 'InternalBibliographies' - - 'InvNo' - - 'ISBN' - - 'ISSN' - - 'ISN' - - 'IssuedWith' - - 'Language' - - 'level' - - 'MaterialDesignation' - - 'MFN' - - 'NamePublisher' - - 'Names' - - 'OriginatingSource' - - 'ParallelTitle' - - 'Parts' - - 'PartsEF' - - 'PartsID' - - 'PersonalName' - - 'PersonalName2' - - 'PersonalNameOther' - - 'PhysicalDescription' - - 'PhysicalDescriptionNote' - - 'PhysicalDetails' - - 'Piece' - - 'PieceAnalitic' - - 'PieceNum' - - 'PieceSubtitle' - - 'PlacePublication' - - 'Responsibility' - - 'ResponsibilityFirst' - - 'ResponsibilitySecond' - - 'SerialNo' - - 'Series' - - 'SeriesTitle' - - 'Set' - - 'Set2' - - 'Subtitle' - - 'Summary' - - 'SystemRequirements' - - 'titleNo' - - 'TitleProper' - - 'TitleProper2' - - 'UDC' - - 'UDC_All' - - 'UDCb' - - 'UncontrolledTerms' - - 'UniformHeading' - - 'URL' - - 'VolumeDesignation' - - 'AllThes' - - 'BroaderTerm' - - 'ClassCode' - - 'DescriptorEN' - - 'DescriptorFR' - - 'DescriptorGE' - - 'DescriptorHR' - - 'filename' - - 'format' - - 'headline' - - 'IDths' - - 'line' - - 'line2' - - 'line3' - - 'line4' - - 'MicrothesaurusEN' - - 'MicrothesaurusFR' - - 'MicrothesaurusGE' - - 'MicrothesaurusHR' - - 'NarrowerTerm' - - 'NonDescriptorEN' - - 'NonDescriptorFR' - - 'NonDescriptorGE' - - 'NonDescriptorHR' - - 'RelatedTerm' - - 'ScopeNoteEN' - - 'ScopeNoteHR' - - 'SeeBefore' - - 'SeeNext' - - 'Source' - - 'SubjectAreaHR' - - 'SubjectIndex' - - 'URL' database: 'unconfigured database name' label: 'unconfigured database label' encoding: 'iso-8859-2' @@ -173,7 +75,12 @@ webpac: isis: 'WebPAC::Input::ISIS' marc: 'WebPAC::Input::MARC' excel: 'WebPAC::Input::Excel' - + # define delimiters for validation + delimiters: + - ' ; ' + - ' : ' + - ' / ' + - ' = ' editor: # open this record when opening editor # (it will also be used to deduce default database and input) @@ -223,9 +130,7 @@ databases: credit: 10000 - to: ffsk credit: 10000 - - to: ffsfb - credit: 10000 - - to: ffsfm + - to: ffsf credit: 10000 - to: ffso credit: 10000 @@ -235,627 +140,171 @@ databases: credit: 10000 - to: ffmic credit: 10000 - - to: efzg - credit: 10000 - - to: eizg - credit: 10000 - - to: efos - credit: 10000 - - to: irmo - credit: 10000 - - to: hika - credit: 10000 - - to: iztzg - credit: 10000 - - to: jzav - credit: 10000 - - to: ijf - credit: 10000 - - to: emerald - credit: 10000 - - # site with alternative databases - 'hr': - name: 'Primjer za hrvatsko suèelje' - links: - - to: ffps - credit: 10000 - - to: ffkk - credit: 5000 - - to: emerald - credit: 5000 - - -# 'ffps': -# name: 'Knji¾nica Odsjeka za psihologiju' -# links: -# - to: ffps -# credit: 10000 - - 'drustvene': - name: 'Katalog knji¾nica dru¹tvenih znanosti' - links: - - to: efzg - credit: 10000 - - to: eizg - credit: 10000 - - to: efos - credit: 10000 - - to: irmo - credit: 10000 - - to: hika - credit: 10000 - - to: iztzg - credit: 10000 - - to: jzav - credit: 10000 - - to: ijf - credit: 10000 - - 'ecasopisi': - name: 'Katalog elektronièkih èasopisa' - links: - - to: emerald - credit: 10000 - - ffan: - name: 'Anglistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A105-1/ISIS/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis.pm' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffar: - name: 'Arheologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A018-2/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffet: - name: 'Etnologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A203-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - fffi: - name: 'Filozofija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A102-1B/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - fffo: - name: 'Fonetika, Filozofski fakultet u Zagrebu' - input: - - name: libri - type: isis - path: '/backup/isis_backup/novi-40162/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + - to: vusp + credit: 10000 + - to: kem + credit: 10000 + - to: efzg + credit: 10000 + + +# hazu: +# name: 'HAZU' +# input: +# - name: bib +# type: isis +# path: '/data/unizg/hazu/BIB' +# encoding: 'cp852' +# modify_file: 'conf/modify/common.pl' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# sand: +# name: 'SAND' +# input: +# name: casopisi +# type: dbf +# path: '/data/unizg/casopisi/sys/cas2000.dbf' +# normalize: +# path: 'conf/normalize/common.pl' +## mapping_path: 'conf/input/dbf/cas2000.yml' +# +# hidra: +# name: 'HIDRA' +# input: +# - name: bib +# type: isis +# path: '/data/hidra/test/BIB' +# encoding: 'cp852' +# modify_file: 'conf/modify/common.pl' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# efzg: +# name: 'EFZG' +# input: +# - name: crolist +# type: marc +# path: '/data/unizg/drustvene/efzg/unimarc.iso' +# encoding: 'ISO-8859-2' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# ipu: +# name: 'Institut za povijest umjetnosti' +# input: +# - name: bibl +# type: isis +# path: '/data/unizg/humanistika/ipu/20071115/bibl/BIBL' +# encoding: 'cp852' +# # modify_file: 'conf/modify/common.pl' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# zvonar: +# name: 'HAZU Odsjek za povijesne znanosti' +# input: +# - name: libri +# type: isis +# path: '/data/unizg/humanistika/hazu-p/LIBRI' +# normalize: +# path: 'conf/normalize/minimal.pl' +# - name: peri +# type: isis +# path: '/data/unizg/humanistika/hazu-p/PERI' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# stross: +# name: 'Strossmayerova galerija' +# input: +# - name: bib +# type: isis +# path: '/data/unizg/stross/BIB' +# normalize: +# path: 'conf/normalize/minimal.pl' +# +# koncar: +# name: 'Konèar' +# input: +# - name: unimar +# type: isis +# path: '/data/tehnika/koncar/UNIMAR' +# normalize: +# path: 'conf/normalize/minimal.pl' +# + datumi: + name: 'Nevaljali datumi' + input: + - name: tablica + type: excel + path: '/data/isis_data/greske/datum_unosa.xls' + encoding: 'windows-1250' normalize: - path: 'conf/normalize/common.pl' - - name: arti + - path: 'conf/normalize/common.pl' + +# ffps: +# name: 'Psihologija, Filozofski fakultet u Zagrebu' +# code: 'ps' +# url: 'http://www.knjiznice.ffzg.hr/psihologija' +# input: +# - name: libri +# type: isis +# path: '/backup/isis_backup/sunce2/isisdata/latest/LIBRI/' +# encoding: 'cp852' +# modify_file: 'conf/modify/common.pl' +# normalize: +# - path: 'conf/normalize/report-sorted-txt.pl' +# output: +## - module: 'Excel' +## path: '/data/isis_data/ps/reports/libri-nema-jezik.xls' +# - module: 'Sorted' +# path: 'out/report/mfn/ps/' +## - module: 'Excel' +## path: '/data/isis_data/ps/reports/autori-udk.xls' + + + stross: + name: 'Strossmayerova galerija' + input: + - name: bib type: isis - path: '/backup/isis_backup/novi-40162/ISISDATA/latest/ARTI/ARTI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + path: '/data/unizg/stross/BIB' normalize: - path: 'conf/normalize/common.pl' - - - ffge: - name: 'Germanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A106-1/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffhu: - name: 'Hungarologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/B001-2/winisis/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffiz: - name: 'Informacijske znanosti, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A129-2/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffkf: - name: 'Klasièna filologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A209-2/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffkk: - name: 'Komparativna knji¾evnost, Filozofski fakultet u Zagrebu' - input: - - name: libri - type: isis - path: '/data/isis_data/kk/LIBRI/LIBRI' -# path: '/backup/isis_backup/A207-3/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 + - path: 'conf/normalize/report-sorted-txt.pl' + output: +# - module: 'Excel' +# path: '/data/isis_data/iz/reports/libri-nema-jezik.xls' + - module: 'Sorted' + path: 'out/report/mfn/iz/' +# - module: 'Excel' +# path: '/data/isis_data/iz/reports/autori-udk.xls' + + + casopisi: + name: 'Èasopisi u Knji¾nicama FF-a' + input: + - name: ff + type: excel + path: '/data/isis_data/CASOPISI/svi-casopisi-FF.xls' + ncoding: 'utf-8' normalize: - path: 'conf/normalize/common.pl' - - name: arti - type: isis - path: '/data/isis_data/kk/ARTI/ARTI' -# path: '/backup/isis_backup/A207-3/isisdata/latest/ARTI/ARTI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^f': - '; ': '^x' + - path: 'conf/normalize/ff-casopisi-xls.pl' +# - path: 'conf/normalize/ff-casopisi-marc.pl' + output: + - module: 'Excel' + path: 'out/excel/casopisi-FF-dupli-knjiznice.xls' + + fflibri: + name: 'Filozofski fakultet u Zagrebu' + input: + - name: marc + type: marc + path: 'out/marc/fflibri.marc' + encoding: 'ISO-8859-2' normalize: - path: 'conf/normalize/common.pl' - - fflo: - name: 'Lingvistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A108-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - fftu: - name: 'Turkologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/B025-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffpe: - name: 'Pedagogija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A226-1/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffpo: - name: 'Povijest, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A201-1/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffpu: - name: 'Povijest umjetnosti, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/C124-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffps: - # all variables here will be available as config variables in template - name: 'Psihologija, Filozofski fakultet u Zagrebu' - code: 'ps' - url: 'http://www.knjiznice.ffzg.hr/psihologija' - - # define input source - input: - # this will create unique name with name of database and mfn - - name: libri - # isis - type: isis - - # full path to database - path: '/backup/isis_backup/sunce2/isisdata/latest/LIBRI/' - # path: '/data/isis_data/PS/LIBRI/' - - # encoding of character set in isis data - encoding: 'cp852' - - # lookup - lookup: 'conf/lookup/isis_ffzg.yml' - - # limit number of records to read from database - #limit: 10 - - modify_records: - 200: - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - '^c': '. ' - 210: - '^a': - '^c': '^b' - '^b': - ' : ': '^b' - '^d': '^c' - '*': - '. (': '. (^e' - '^e': - ' : ': ' ^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - # define normalisation for that source - normalize: - # which tag to use in normalize xml for data? - # tag: 'isis' - # path to normalization xml - path: 'conf/normalize/common.pl' - #path: 'conf/normalize/isis_ffzg.yml' - - # another input database - - name: peri - type: isis - path: '/backup/isis_backup/sunce2/isisdata/latest/PERI/PERI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffro: - name: 'Romanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A224-2/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsk: - name: 'Skandinavistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/B009-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsfb: - name: 'Slavenska filologija (B), Filozofski fakulteti u Zagrebu' - input: - name: libri - type: isis - path: '/data/isis_data/sfb/LIBRI/LIBRI' -# path: '/backup/isis_backup/A125-3/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' : ': '^e' - ' = ': '^d' - '^k': - '^e': ' : ' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '^k': ' ; ' - '*': - '^g': ' ; ' - 210: - '^a': - '^c': '^b' - '^b': - ' ; ': '^a' - ' : ': '^b' - '^d': '^c' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - ffsfm: - name: 'Slavenska filologija (M), Filozofski fakulteti u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A121-2/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' ; ': '^k' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '*': - '^g': ' ; ' - 210: - '*': - '^c': '^b' - '^d': '^c' - '. (': '. (^e' - ' : ': ' :^f' - 700: - '^a': - '^b': ', ' - 701: - '^a': - '^b': ', ' - 702: - '^a': - '^b': ', ' - normalize: - path: 'conf/normalize/common.pl' - - ffso: - name: 'Sociologija, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A002-3/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - modify_records: - 200: - '^a': - ' : ': '^e' - ' = ': '^d' - ' ; ': '^k' - '^k': - '^e': ' : ' - '^d': - '^e': ' : ' - '^e': - '^d': ' = ' - '^k': ' ; ' - '*': - '^g': ' ; ' - normalize: - path: 'conf/normalize/common.pl' - - ffta: - name: 'Talijanistika, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A224-1/isisdata/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffsr: - name: 'Sredi¹nja èitaonica, Filozofski fakultet u Zagrebu' - input: - name: libri - type: isis - path: '/backup/isis_backup/A112-1/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ffmic: - name: 'Meðunarodni istra¾ivaèki centar za kasnu antiku i srednji vijek' - input: - name: libri - type: isis - path: '/backup/isis_backup/C107-9/ISISDATA/latest/LIBRI/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/isis_ffzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - efzg: - name: 'Ekonomski fakutet u Zagrebu' - input: - name: knjige - type: marc - path: '/data/drustvene/efzg/unimarc.iso' - encoding: 'cp852' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' - #limit: 1000 - normalize: - path: 'conf/normalize/common.pl' - - eizg: - name: 'Ekonomski institut u Zagrebu' - input: - name: bib - type: isis - path: '/data/drustvene/eizg/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 100 - normalize: - path: 'conf/normalize/common.pl' - - efos: - name: 'Ekonomski fakutet u Osijeku' - input: - name: knjige - type: marc - path: '/data/drustvene/efos/EFOSBAZA.ISO' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - #recode: '^ È ~ è ] Æ } æ | ð \[ © { ¹ @ ® ` ¾' - lookup: 'conf/lookup/efos.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - irmo: - name: 'Institut za meðunarodne odnose u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/irmo/LIBRI' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - hika: - name: 'Fakultet za turistièki i hotelski menad¾ment u Opatiji' - input: - name: knjige - type: marc - path: '/data/drustvene/hika/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - iztzg: - name: 'Institut za turizam u Zagrebu' - input: - name: knjige - type: isis - path: '/data/drustvene/iztzg/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/eizg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - jzav: - name: 'Jadranski zavod' - input: - name: bib - type: isis - path: '/data/drustvene/jzav/BIB' - encoding: 'cp852' - lookup: 'conf/lookup/jzav.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - - ijf: - name: 'Institut za javne financije' - input: - name: knjige - type: marc - path: '/data/drustvene/ijf/szi.iso' - encoding: 'ISO-8859-2' - # CroList recoding pairs to fix encoding problems - recode: 'ÏC È Ïc è ÂC Æ Âc æ ò ð ÏS © Ïs ¹ ÏZ ® Ïz ¾' - lookup: 'conf/lookup/efzg.yml' - #limit: 10 - normalize: - path: 'conf/normalize/common.pl' - -# Elektronièki èasopisi - emerald: - name: 'EmeraldFulltext' - input: - name: ecas - type: excel - path: '/data/FF/emerald/persistenturls.xls' - worksheet: 'All Titles' - from: 20 - encoding: 'windows-1250' - #limit: 10 - normalize: - path: 'conf/normalize/excel_emerald.pl' - + - path: 'conf/normalize/ff-libri-dupli.pl' + output: + - module: 'Excel' + path: 'out/excel/knjige-duplo.xls'