X-Git-Url: http://git.rot13.org/?a=blobdiff_plain;f=html.pl;h=3d9cfce0e96fcec5c2542e6ee1011e4f403af5c6;hb=626163e24773f07bb9131a80a3a111f052b64f24;hp=1d5ef4cb0328c7880a87a4cb92abe439a7b76089;hpb=e56b98419add535e5ec976ad0c7b82fe3743e4ba;p=koha-bibliografija diff --git a/html.pl b/html.pl index 1d5ef4c..3d9cfce 100755 --- a/html.pl +++ b/html.pl @@ -12,12 +12,29 @@ use locale; use Text::Unaccent; use Carp qw(confess); use utf8; +use JSON; +use POSIX qw(strftime); +use Storable; use lib '/srv/koha_ffzg'; use C4::Context; use XML::LibXML; use XML::LibXSLT; +my $pid_file = '/dev/shm/bibliografija.pid'; +{ + if ( -e $pid_file ) { + open(my $fh, '<', $pid_file); + my $pid = <$fh>; + no autodie; # it will die on kill + kill 0, $pid || die "$0 allready running as pid $pid"; + } + open(my $fh, '>', $pid_file); + print $fh $$; + close($fh); +} + + my $dbh = C4::Context->dbh; sub debug { @@ -97,10 +114,11 @@ while( my $row = $sth_auth->fetchrow_hashref ) { debug 'department_in_group' => $department_in_group; foreach my $department ( keys %$department_in_sum ) { - $department_in_sum->{$department} = 0 unless $department =~ m/(centar|croaticum|katedra|odsjek)/i; +# $department_in_sum->{$department} = 0 unless $department =~ m/(centar|croaticum|katedra|odsjek)/i; } debug 'auth_department' => $auth_department; +store $auth_department, '/dev/shm/auth_department.storable'; debug 'auth_group' => $auth_group; debug 'department_in_sum' => $department_in_sum; @@ -128,6 +146,7 @@ where =cut my $biblio_year; +my $biblio_full_name; my $type_stats; my $parser = XML::LibXML->new(); @@ -198,6 +217,7 @@ while( my $row = $sth_select_authors->fetchrow_hashref ) { my $extract = { '008' => undef, '100' => '(9|a)', + '245' => 'a', '680' => 'i', '700' => '(9|4|a)', '942' => '(t|r|v)' @@ -239,12 +259,14 @@ while( my $row = $sth_select_authors->fetchrow_hashref ) { if ( ! defined $data->{year} ) { warn "MISSING year in ", $row->{biblionumber}; +=for remove-year-limit } elsif ( $data->{year} < 2008 ) { push @{ $skip->{year_lt_2008} }, $row->{biblionumber}; next; } elsif ( $data->{year} > 2013 ) { push @{ $skip->{year_gt_2013} }, $row->{biblionumber}; next; +=cut } # warn "# ", $row->{biblionumber}, " data ",dump($data); @@ -275,10 +297,13 @@ while( my $row = $sth_select_authors->fetchrow_hashref ) { foreach my $authid ( @first_author ) { push @{ $authors->{$authid}->{aut}->{ $category } }, $row->{biblionumber}; } + $biblio_full_name->{ $row->{biblionumber} } = $data->{100}->[0]->{a}; } else { $have_100 = 0; } + $biblio_full_name->{ $row->{biblionumber} } ||= $data->{245}->[0]->{a}; + my $have_edt; if ( exists $data->{700} ) { @@ -300,23 +325,33 @@ while( my $row = $sth_select_authors->fetchrow_hashref ) { $type_stats->{$type}++; - if ( $type =~ m/(edt|trl|com|ctb)/ ) { - push @{ $authors->{$authid}->{sec}->{ $category } }, $row->{biblionumber}; - push @{ $authors->{$authid}->{$1}->{ $category } }, $row->{biblionumber}; - } elsif ( $type =~ m/aut/ ) { - if ( ! $have_100 ) { - $have_edt = grep { exists $_->{4} && $_->{4} =~ m/edt/ } @{ $data->{700} } if ! defined $have_edt; - if ( $have_edt ) { - $skip->{ have_700_edt }->{ $row->{biblionumber} }++; + my @types = split(/[\s\/]+/, $type); + + foreach my $type ( @types ) { + my $type = substr($type,0,3); + $type_stats->{_count_each_type}->{$type}++; + + if ( $type =~ m/(edt|trl|com|ctb)/ ) { + push @{ $authors->{$authid}->{__sec}->{ $category } }, $row->{biblionumber}; + push @{ $authors->{$authid}->{$type}->{ $category } }, $row->{biblionumber}; + $type =~ s/(com|ctb)/_ostalo/; + push @{ $authors->{$authid}->{$type}->{ $category } }, $row->{biblionumber}; + + } elsif ( $type =~ m/aut/ ) { + if ( ! $have_100 ) { + $have_edt = grep { exists $_->{4} && $_->{4} =~ m/edt/ } @{ $data->{700} } if ! defined $have_edt; + if ( $have_edt ) { + $skip->{ have_700_edt }->{ $row->{biblionumber} }++; + } else { + push @{ $authors->{$authid}->{aut}->{ $category } }, $row->{biblionumber}; + } } else { push @{ $authors->{$authid}->{aut}->{ $category } }, $row->{biblionumber}; } } else { - push @{ $authors->{$authid}->{aut}->{ $category } }, $row->{biblionumber}; +# warn "# SKIP ", $row->{biblionumber}, ' no 700$4 in ', dump($data); + $skip->{ 'no_700$4' }->{ $row->{biblionumber} }++; } - } else { -# warn "# SKIP ", $row->{biblionumber}, ' no 700$4 in ', dump($data); - $skip->{ 'no_700$4' }->{ $row->{biblionumber} }++; } } delete $data->{700}; @@ -327,9 +362,11 @@ while( my $row = $sth_select_authors->fetchrow_hashref ) { } debug 'authors' => $authors; +store $authors, '/dev/shm/authors.storable'; debug 'type_stats' => $type_stats; debug 'skip' => $skip; debug 'biblio_year' => $biblio_year; +debug 'biblio_full_name' => $biblio_full_name; debug 'biblio_data' => $biblio_data; debug 'biblio_author_external' => $biblio_author_external; @@ -350,13 +387,18 @@ sub html_title { |, join(" ", @_), qq| + + |; } sub html_end { - return qq|\n\n|; + return + qq|Zadnji puta osvježeno: |, + strftime("%Y-%m-%d %H:%M:%S\n", localtime()), + qq|\n\n|; } mkdir 'html' unless -d 'html'; @@ -370,30 +412,137 @@ debug 'authors' => \@authors; sub li_biblio { my ($biblionumber) = @_; - return qq|
  • |, + return qq|
  • |, qq|$biblionumber|, biblioitem_html($biblionumber), qq|edit|, qq|
  • \n|; } +sub unique { + my $unique; + $unique->{$_}++ foreach @_; + return keys %$unique; +} + +sub unique_biblionumber { + my @v = unique @_; + return sort { + $biblio_year->{$b} <=> $biblio_year->{$a} || + $biblio_full_name->{$a} cmp $biblio_full_name->{$b} || + $a <=> $b + } @v; +} + sub author_html { my ( $fh, $authid, $type, $label ) = @_; return unless exists $authors->{$authid}->{$type}; - print $fh qq|

    $label

    \n|; + print $fh qq|

    $label

    \n|; foreach my $category ( sort keys %{ $authors->{$authid}->{$type} } ) { my $label = $category_label->{$category} || 'Bez kategorije'; - print $fh qq|

    $label

    \n\n|; + print $fh qq|\n|; + } +} + +my @toc_type_label = ( +'aut' => 'Primarno autorstvo', +'edt' => 'UredniÅ¡tva', +'trl' => 'Prijevodi', +'_ostalo' => 'Ostalo', +); + + +sub count_author_years { + my $years = shift; + my ($authid) = @_; + foreach my $type ( keys %{ $authors->{$authid} } ) { +# next if $type =~ m/^_/; # FIXME + foreach my $category ( keys %{ $authors->{$authid}->{$type} } ) { + foreach my $biblionumber ( unique_biblionumber @{ $authors->{$authid}->{$type}->{$category} } ) { + $years->{ $biblio_year->{ $biblionumber } }->{ $type . '-' . $category }->{ $biblionumber }++; + } + } + } + return $years; +} + +sub html_year_selection { + my $fh = shift; + my @authids = unique @_; + + debug 'html_year_selection authids=', [ @authids ]; + + print $fh qq|Godine:\n|; + my $type_cat_count = {}; + my $years; + + foreach my $authid ( @authids ) { + $years = count_author_years( $years, $authid ); + } + + debug 'years' => $years; + + foreach my $year ( sort { $b <=> $a } keys %$years ) { + print $fh qq| \n|; + foreach my $type_cat ( keys %{ $years->{$year} } ) { + my $count = scalar keys %{ $years->{$year}->{$type_cat} }; + $years->{$year}->{$type_cat} = $count; # remove biblionumbers and use count + $type_cat_count->{ $type_cat } += $count; + my ($type,$cat) = split(/-/, $type_cat); + $type_cat_count->{_toc}->{$type}->{$cat}++; + $type_cat_count->{_toc_count}->{$type} += $count; + } } + + print $fh qq| + + + |; + + print $fh qq||; + + print $fh q| + + + |; + + debug 'type_cat_count' => $type_cat_count; + + # TOC + print $fh qq|\n|; + } + foreach my $row ( sort { $a->{full_name} cmp $b->{full_name} } @authors ) { my $first = substr( $row->{full_name}, 0, 1 ); @@ -407,10 +556,16 @@ foreach my $row ( sort { $a->{full_name} cmp $b->{full_name} } @authors ) { my $path = "html/$row->{authid}"; open(my $fh, '>:encoding(utf-8)', "$path.new"); print $fh html_title($row->{full_name}, "bibliografija"); - print $fh qq|

    $row->{full_name} - bibliografija za razdoblje 2008-2013

    |; + print $fh qq|

    $row->{full_name} - bibliografija

    \n|; + + html_year_selection $fh => $row->{authid}; - author_html( $fh, $row->{authid}, 'aut' => 'Primarno autorstvo' ); - author_html( $fh, $row->{authid}, 'sec' => 'Uredništva, prijevodi, krička izdanja' ); + my $i = 0; + while ( $i < $#toc_type_label ) { + my $type = $toc_type_label[$i++] || die "type"; + my $label = $toc_type_label[$i++] || die "label"; + author_html( $fh, $row->{authid}, $type => $label ); + } print $fh html_end; close($fh); @@ -429,7 +584,7 @@ my $department_category_author; foreach my $department ( sort keys %$auth_department ) { foreach my $authid ( sort @{ $auth_department->{$department} } ) { my @categories = keys %{ $authors->{$authid}->{aut} }; - push @categories, keys %{ $authors->{$authid}->{sec} }; + push @categories, keys %{ $authors->{$authid}->{__sec} }; foreach my $category ( sort @categories ) { push @{ $department_category_author->{$department}->{$category} }, $authid; push @{ $department_category_author->{'AAA_ukupno'}->{$category} }, $authid if $department_in_sum->{$department}; @@ -444,71 +599,92 @@ foreach my $department ( sort keys %$auth_department ) { debug 'department_category_author' => $department_category_author; -mkdir 'html/departments' unless -d 'html/departments'; -sub unique_biblionumber { - my @v = @_; - my $u; - $u->{$_}++ foreach @v; - return sort { $biblio_year->{$b} <=> $biblio_year->{$a} || $a <=> $b } keys %$u; -} +sub department_html { + my ( $fh, $department, $type, $label, $csv_fh ) = @_; -open(my $dep_fh, '>:encoding(utf-8)', 'html/departments/index.new'); -print $dep_fh html_title('Odsijeci Filozofskog fakulteta u Zagrebu'), qq|