# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
-# - name: buskov
-# type: isi
-# path: '/data/FF/citati/citing/buskov.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
-# - name: butkovica.txt
-# type: isi
-# path: '/data/FF/citati/citing/butkovica.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
-# - name: corkalobiruskid.txt
-# type: isi
-# path: '/data/FF/citati/citing/corkalobiruskid.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
+ - name: buskov
+ type: isi
+ path: '/data/FF/citati/citing/buskov.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
+ - name: butkovica.txt
+ type: isi
+ path: '/data/FF/citati/citing/butkovica.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
+ - name: corkalobiruskid.txt
+ type: isi
+ path: '/data/FF/citati/citing/corkalobiruskid.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
- name: hrend
type: isi
path: '/data/FF/citati/citing/hrend.txt'
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
-# - name: hromatkoi
-# type: isi
-# path: '/data/FF/citati/citing/hromatkoi.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
+ - name: hromatkoi
+ type: isi
+ path: '/data/FF/citati/citing/hromatkoi.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
- name: hudekknezevicj
type: isi
path: '/data/FF/citati/citing/hudekknezevicj.txt'
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
-# - name: kerestesg
-# type: isi
-# path: '/data/FF/citati/citing/kerestesg.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
-# - name: knezovicz
-# type: isi
-# path: '/data/FF/citati/citing/knezovicz.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
-# - name: kolesaricv
-# type: isi
-# path: '/data/FF/citati/citing/kolesaricv.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
+ - name: kerestesg
+ type: isi
+ path: '/data/FF/citati/citing/kerestesg.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
+ - name: knezovicz
+ type: isi
+ path: '/data/FF/citati/citing/knezovicz.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
+ - name: kolesaricv
+ type: isi
+ path: '/data/FF/citati/citing/kolesaricv.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
- name: kuterovacjagodicg
type: isi
path: '/data/FF/citati/citing/kuterovacjagodicg.txt'
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
-# - name: maslicsersicd
-# type: isi
-# path: '/data/FF/citati/citing/maslicsersicd.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
+ - name: maslicsersicd
+ type: isi
+ path: '/data/FF/citati/citing/maslicsersicd.txt'
+ encoding: 'ISO-8859-1'
+ normalize:
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
+ skip: 1
- name: radosevicvidacekb
type: isi
path: '/data/FF/citati/citing/radosevicvidacekb.txt'
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
-# - name: galicz
-# type: isi
-# path: '/data/FF/citati/citing/galicz.txt'
-# encoding: 'ISO-8859-1'
-# normalize:
-# # - path: 'conf/normalize/isi/isi2xls.pl'
-# # - path: 'conf/isi/isi2sorted.pl'
-# - path: 'conf/isi/tables.pl'
- - name: tadinacm
+ - name: galicz
type: isi
- path: '/data/FF/citati/citing/tadinacm.txt'
+ path: '/data/FF/citati/citing/galicz.txt'
encoding: 'ISO-8859-1'
normalize:
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- path: 'conf/isi/tables.pl'
- - name: cropsy
+ skip: 1
+ - name: tadinacm
type: isi
- path: '/data/FF/citati/croatia-psychol.txt'
- # encoding: 'ISO-8859-1'
+ path: '/data/FF/citati/citing/tadinacm.txt'
+ encoding: 'ISO-8859-1'
normalize:
- - path: 'conf/isi/croatia-psychol.pl'
+ # - path: 'conf/normalize/isi/isi2xls.pl'
+ # - path: 'conf/isi/isi2sorted.pl'
+ - path: 'conf/isi/tables.pl'
- name: radovi
type: excel
path: '/data/FF/citati/citirani_radovi.xls'
normalize:
# - path: 'conf/normalize/isi/isi2xls.pl'
# - path: 'conf/isi/isi2sorted.pl'
- - path: 'conf/isi/citirani_radovi.pl'
+ - path: 'conf/isi/citirani-radovi.pl'
+ - name: cropsy
+ type: isi
+ path: '/data/FF/citati/croatia-psychol.txt'
+ normalize:
+ - path: 'conf/isi/tables-cropsy.pl'
+ skip: 0
output:
# - module: 'Excel'
# path: '/data/FF/citati/data.xls'
dsn: 'dbi:Pg:dbname=dipl'
schema: 'conf/isi/schema.sql'
# table: 'citirani'
-
--- /dev/null
+-- Remove every view up front: the views read from the tables that are dropped
+-- and recreated further down. parovi is dropped first because it is itself
+-- built on top of another view (citingu).
+drop view if exists parovi;
+drop view if exists citingu;
+drop view if exists rpcou;
+drop view if exists citiraniu;
+
+-- utca: two text columns (ut, ca) plus a serial row id.
+-- NOTE(review): column names look like ISI field tags -- confirm their meaning
+-- against the loader script before relying on them.
+drop table if exists utca;
+create table utca (
+    id  serial,
+    ut  text,
+    ca  text
+);
+
+-- cited: all payload columns are free text, including cr_year.
+-- The parovi view joins this table on cr_full (against citirani.cr) and on ut
+-- (against citingu.ut).
+drop table if exists cited;
+create table cited (
+    id       serial,
+    ca       text,
+    cr_auth  text,
+    au       text,
+    ut       text,
+    cr_full  text,
+    cr_year  text,
+    cr_ref   text,
+    cr_doi   text
+);
+
+-- authors: serial row id plus four text columns (ut, au, af, ca).
+-- NOTE(review): presumably one row per author of a record -- verify against
+-- the loader, nothing in this schema enforces it.
+drop table if exists authors;
+create table authors (
+    id  serial,
+    ut  text,
+    au  text,
+    af  text,
+    ca  text
+);
+
+
+-- citing: base table behind the citingu view.
+-- nr, tc and py are the only integer columns; everything else is text.
+-- NOTE(review): the two-letter column names look like ISI field tags --
+-- confirm against the loader script.
+drop table if exists citing;
+create table citing (
+    id  serial,
+    ut  text,
+    pt  text,
+    au  text,
+    af  text,
+    ti  text,
+    so  text,
+    la  text,
+    dt  text,
+    c1  text,
+    rp  text,
+    nr  integer,
+    tc  integer,
+    pi  text,
+    py  integer,
+    di  text,
+    sc  text
+);
+
+-- rpco: three text columns and, unlike the other tables here, no serial id.
+-- The rpcou view exposes the distinct rows of this table.
+drop table if exists rpco;
+create table rpco (
+    ut    text,
+    rp    text,
+    rpco  text
+);
+
+
+-- citirani: base table behind the citiraniu view and the driving (left-most)
+-- table of the parovi view, which matches citirani.cr to cited.cr_full.
+-- ttc is the only integer column; cr_year, cr_vol and cr_page are kept as text.
+drop table if exists citirani;
+create table citirani (
+    id       serial,
+    ca       text,
+    cr_auth  text,
+    cr_ref   text,
+    cr_year  text,
+    cr_vol   text,
+    cr_page  text,
+    ttc      integer,
+    cr       text,
+    can      text
+);
+
+-- citingu: distinct rows of citing, projected without id, af, ti and c1.
+create view citingu as
+select distinct
+    ut,
+    pt,
+    au,
+    so,
+    la,
+    dt,
+    nr,
+    tc,
+    pi,
+    py,
+    di,
+    sc,
+    rp
+from citing;
+
+-- rpcou: distinct rows of rpco.
+-- Columns are listed explicitly (they are exactly the three columns of rpco)
+-- so the view's output shape is visible here and does not silently follow
+-- future changes to the table definition.
+create view rpcou as
+select distinct
+    ut,
+    rp,
+    rpco
+from rpco;
+
+-- parovi: every citirani row, paired (when a match exists) with the cited rows
+-- whose cr_full equals citirani.cr, and through cited.ut with the matching
+-- citingu record. Left joins keep citirani rows that have no match; their
+-- cited/citingu columns are then NULL.
+--
+-- An earlier "left join rpcou on cited.ut = rpcou.ut" was dropped from this
+-- view: no rpcou column is selected, and with "select distinct" the extra join
+-- could only multiply rows that were collapsed again, so the result set is
+-- unchanged. If rpcou.rpco is wanted here, re-add that join AND select the
+-- column.
+create view parovi as
+select distinct
+    citirani.ca,
+    citirani.cr,
+    cited.cr_full,
+    cited.ut,
+    citingu.pt,
+    citingu.au,
+    citingu.so,
+    citingu.la,
+    citingu.dt,
+    citingu.nr,
+    citingu.tc,
+    citingu.pi,
+    citingu.py,
+    citingu.sc,
+    citingu.rp
+from citirani
+left join cited
+    on citirani.cr = cited.cr_full
+left join citingu
+    on cited.ut = citingu.ut
+;
+
+-- citiraniu: distinct rows of citirani, projected without id, ca and can.
+create view citiraniu as
+select distinct
+    cr_auth,
+    cr_ref,
+    cr_year,
+    cr_vol,
+    cr_page,
+    ttc,
+    cr
+from citirani;
+
+
+-- cropsy: serial row id, four text columns and two integer columns (tc, py).
+-- NOTE(review): presumably filled from the "cropsy" input declared in the
+-- loader configuration -- verify, this file does not show the loader.
+drop table if exists cropsy;
+create table cropsy (
+    id  serial,
+    ut  text,
+    au  text,
+    c1  text,
+    rp  text,
+    tc  integer,
+    py  integer
+);
+
+
+-- CREATE AGGREGATE array_accum (anyelement)
+-- (
+-- sfunc = array_append,
+-- stype = anyarray,
+-- initcond = '{}'
+-- );
+
+-- select d, count(*),
+-- array_to_string(array_accum('+'::text),'') as graph
+-- from hits group by 1 order by 1 asc;
+
+
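+-- create index cited_au on cited(au);
+-- NOTE(review): table cited has no column named "cited"; choose the intended
+-- column (the parovi view joins on cited.cr_full and cited.ut) before enabling.
+-- create index cited_cited on cited(cited);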
+