X-Git-Url: http://git.rot13.org/?a=blobdiff_plain;f=vhost%2Fwebpac2.cgi;h=fd76b657b4f95a9c989e24be91b19ed7cc75a209;hb=270b0142ec5a98e84ecb5beaf1a020130ab9e013;hp=c8e6d3e009c0cfc624156b63a4a2cb4e07047ab8;hpb=c0a634d5a1e0be3570ace125195cbfc350cf0c5b;p=webpac2 diff --git a/vhost/webpac2.cgi b/vhost/webpac2.cgi index c8e6d3e..fd76b65 100755 --- a/vhost/webpac2.cgi +++ b/vhost/webpac2.cgi @@ -7,19 +7,85 @@ use CGI qw/:standard/; use CGI::Carp qw/fatalsToBrowser/; use File::Slurp; use YAML; -use Search::Estraier; +use Data::Page; +use Data::Dump qw/dump/; +use SWISH::API; +use JSON; +use Text::Unaccent::PurePerl qw/unac_string/; +use HTML::FillInForm::Lite; +use Encode; -print header; +my $range_around = 5; +my @entries_per_page = ( 30, 50, 100, 500 ); +my $debug = param('debug'); + +print header( + -charset => 'utf-8', +); sub dump_yaml { my $name = shift; - print qq|
# $name\n|, YAML::Dump( @_ ), qq|
|; + print qq|
$name
|, YAML::Dump( @_ ), qq|
| if $debug; +} + +sub show_pager { + my ($pager) = @_; + + my @show_pages; + my $after_current = 0; + + if ( $pager->current_page <= $range_around + 2 ) { + @show_pages = ( $pager->first_page .. $pager->current_page ); + $after_current = $range_around - $pager->current_page; + } else { + @show_pages = ( $pager->first_page, '', $pager->current_page - $range_around .. $pager->current_page ); + } + + if ( $pager->current_page + $after_current + $range_around + 1 >= $pager->last_page ) { + push @show_pages, ( $pager->current_page + 1 .. $pager->last_page ); + } else { + push @show_pages, ( $pager->current_page + 1 .. $pager->current_page + $after_current + $range_around, '', $pager->last_page ); + } + +# dump_yaml( 'show_pages', \@show_pages ); + + return '' unless $#show_pages; + + my ( $prev, $next ) = ( '<<', '>>' ); + + sub li_a_href { + my ( $page, $label, $attr ) = @_; + param( 'current_page', $page ); + my $url = self_url( -query => 1 ); + $attr ||= ''; + $label ||= $page; + qq|$label|; + } + + return + $pager->previous_page ? li_a_href( $pager->previous_page, $prev ) : qq|| + , ( map { + if ( $_ eq $pager->current_page ) { + qq|
  • $_
  • |; + } elsif ( $_ eq '' ) { + qq||; + } else { + li_a_href( $_ ); + } + } @show_pages ) + , $pager->next_page ? li_a_href( $pager->next_page, $next ) : qq|| + ; + } my $path = $ENV{PATH_INFO} || 'ecas'; +$path =~ s{^/+}{}; +$path =~ s{/+$}{}; my $dir = $0; $dir =~ s{/[^/]+.cgi}{}; +dump_yaml( 'dir', $dir ); + my $config = YAML::LoadFile( "$dir/$path/config.yml" ); my $database = (keys %{ $config->{databases} })[0]; @@ -34,77 +100,253 @@ if ( -e $html_markup ) { undef $html_markup; } -my $estraier = YAML::LoadFile( "$dir/../var/estraier/$database.yaml" ); +my $stats; +{ + my $path = "$dir/../var/swish/$database.yaml"; + $stats = YAML::LoadFile( $path ); + dump_yaml( "stats $path", $stats ); +} my $db = $config->{databases}->{$database}; -my @attr = keys %{ $estraier->{attr} }; # FIXME replace with real gnerated lookup +sub read_config_txt { + my ( $file ) = @_; + my $input; + my $path ="$dir/$path/$path-$file.txt"; + if ( ! -e $path ) { + warn "missing $path"; + return; + } + foreach ( split(/[\n\r]+/, read_file( $path ) ) ) { + my ( $val,$label ) = split(/\s*\t\s*/,$_,2); + push @{ $input->{ '-values' } }, $val; + $input->{ '-labels' }->{$val} = $label; + } + return $input; +} + +my $attr_labels = read_config_txt 'labels'; +my $attr_operators = read_config_txt 'operators'; + +my @attr = @{ $attr_labels->{'-values'} } if $attr_labels; +@attr = keys %{ $stats->{attr} } unless @attr; + + +warn dump( $attr_labels, $attr_operators ); + +my $only_input; +my $inputs_available = 0; + +foreach ( @{ $db->{input} } ) { + my $input = $_->{name} || die "no name in ",dump( $_ ); + next unless defined $stats->{input}->{$input}; # skip inputs without data + if ( ! $only_input->{'-labels'}->{$input} ) { + push @{ $only_input->{'-values'} }, $input; + $only_input->{'-labels'}->{$input} = $_->{description} || $input; + $inputs_available++; + } +} + +warn "## only_input = ", dump( $only_input ); + +my @style = ( '../../style.css' ); +push @style, "../../$path/$path.css" if -e "$dir/$path/$path.css"; +dump_yaml( 'style', \@style ); + +sub search_form { + + my $form_html = "$dir/$path/$path-search.html"; + if ( -e $form_html ) { + my $html = read_file( $form_html ); + my $q = CGI->new(); + my $h = HTML::FillInForm::Lite->new(); + return $h->fill(\$html, $q); + } + + qq||, + start_form( -action => self_url( query => 0 ) ), + checkbox_group( + -name => 'attr', + %$attr_labels, +# -linebreak => 0, + ), + textfield( -name => 'search' ), + $attr_operators ? popup_menu( -name => 'attr_operator', %$attr_operators ) : '', + submit( -value => 'Search' ), +# hidden( -name => 'entries_per_page', -default => $entries_per_page ), + popup_menu( -name => 'entries_per_page', -values => [ @entries_per_page ], -title => 'entries per page' ), + # we need current_page fixed at 1 so that every submit through form will reset it + qq||, + checkbox( -name => 'debug', -default => 0 ), # FIXME hidden? + qq|
    |, + $inputs_available > 1 ? + h2( 'Select input' ) . + checkbox_group( + -name => 'only_input', + %$only_input, + -linebreak=> 'true', + ) : '', + qq|
    |, + end_form, + ; +} + print start_html( -title => $db->{name}, - -style => '../../style.css', + -style => [ @style ], ), h1( $db->{name} ), qq|
    |, $db->{description}, qq|
    |, - start_form, - radio_group( - -name => 'attr', - -values => [ @attr ], -# -linebreak => 0, - ), - textfield( -name => 'search' ), - submit ; -print end_form; - if ( my $search = param('search') ) { - print qq|
    |; + $search = unac_string( Encode::decode('utf-8',$search) ); + + print qq| + +
    + |; + + my $swish = SWISH::API->new( "$dir/../var/swish/$database" ); + $swish->abort_last_error if $swish->Error; + + my @search = (); + my @attrs = param('attr'); + my $op = param('attr_operator'); - my $node = Search::Estraier::Node->new( - url => $config->{hyperestraier}->{masterurl} . '/node/' . $database, - croak_on_error => 1, - ); + if ( $search =~ m{(=|"|\bAND\b|\bOR\b)} ) { + push @search, $search; + } elsif ( @attrs ) { - my $cond = Search::Estraier::Condition->new; - $cond->set_phrase( $search ); - my $nres = $node->search( $cond, 0 ); + $op ||= 'Q*'; + my @or; + foreach my $attr ( @attrs ) { + my $v = $search; + $v =~ s/^\s+//; + warn "-- v: $v\n"; + sub rewrite { + my ( $attr, $whitespace, $v ) = @_; + warn "## filter $op $whitespace $v\n"; + my $template = $op; + $template =~ s{Q}{$v}; + $whitespace = " AND " if $whitespace; + + # don't return -* &* and other non-word characters + return '' if $template =~ m/^\W\*$/ || $template =~ m/\band\b/i; + + return + $whitespace . + $attr . '="' . $template . '"'; + ; + }; + if ( $op =~ m{\s} ) { + my $template = $op; + $template =~ s{Q}{$v}; + $v = $attr . '="' . $template . '"'; + } else { + $v =~ s{(\s*)(\S+)}{rewrite($attr,$1,$2)}ge; + } + + push @or, $v; + + } + push @search, '(' . join(') OR (', @or) . ')'; - if ( ! $nres ) { - my $no_results = "No results for search '%s'"; - printf qq|
    $no_results
    |, $search; } else { - my $results = "Got %d results for search '%s'"; - printf qq|
    $results
    |, $nres->hits, $search; + push @search, "all=\"$search\""; + } + + my $q = '(' . join(') AND (', @search) . ')'; + + my @only_input = param('only_input'); + $q .= ' AND ((' . join(') OR (', map { "input=\"$_\"" } @only_input) . '))' if @only_input; + + warn "# query: $q\n"; + my $search_obj = $swish->new_search_object; + if ( my $sort = param('sort') ) { + $search_obj->set_sort( $sort ); + } + my $swish_results = $search_obj->execute( $q ); - print qq|
      |; + dump_yaml( 'swish_results', $swish_results ); - foreach my $i ( 1 .. $nres->doc_num ) { - my $rdoc = $nres->get_doc( $i - 1 ); - print qq|
    1. |; + my $pager = Data::Page->new; + $pager->$_( param($_) ) foreach ( qw/entries_per_page current_page/ ); + $pager->total_entries( $swish_results->hits ); + + dump_yaml( 'pager', $pager ); + + $swish_results->seek_result( $pager->first - 1 ); + + if ( ! $pager->total_entries ) { + my $no_results = 'No results for search %s'; + $no_results = $swish->error_string . '
      %s' if $swish->error; + printf qq|
      $no_results
      \n\n|, $q; + } else { + + my $results = "%d results for search %s showing results %d - %d"; + printf qq|
      $results
      \n\n|, $pager->total_entries, $q, $pager->first, $pager->last; + + my $pager_html = join("\n", show_pager( $pager )); + + print qq|
        $pager_html
      \n\n| if $pager_html; + + my $nr = $pager->first; + print qq|
        \n|; + + my $limit = $pager->entries_on_this_page; + + my $nr = 1; + + while ( my $result = $swish_results->next_result ) { + + my $data = $result->property('data'); + dump_yaml( 'data', $data ); + # FIXME if we produce valid json we shouldn't need eval here! + eval { $data = from_json( $data, {utf8 => 1} ); }; + if ( $@ ) { + warn "ERROR: $@ from ",dump( $data ); + next; + } + + my $li_class = ''; + $li_class = qq| class="z"| if $nr % 2 == 0; + print qq||; foreach my $attr ( @attr ) { - my $v = $rdoc->attr( $attr ); - if ( defined $v && $html_markup && ! $html_markup_skip->{$attr} ) { - eval "\$v = $html_markup->$attr( \$v );"; + next unless defined $data->{$attr}; + my $v = $data->{$attr}; + if ( $html_markup && ! $html_markup_skip->{$attr} ) { + eval "\$v = $html_markup->$attr( \$v, \$data );"; if ( $@ ) { warn "disable html markup for $attr: $@"; $html_markup_skip->{$attr} = $@; } + } else { + $v =~ s{(http://\S+)}{$1}; } - next unless defined $v; - print qq|
        $v
        \n|; + my $label = $attr_labels->{'-labels'}->{$attr} || $attr; + print qq|
        $v
        \n|; } print qq|\n|; + + last if $nr++ == $pager->last; } - print qq|
      |; + print qq|
    \n\n|; + + print qq|
      $pager_html
    \n\n| if $pager_html; } print qq|
    |; + + dump_yaml( 'pager', $pager ); + } -dump_yaml( 'estraier', $estraier ); -dump_yaml( 'db', $db ); +print search_form; + +dump_yaml( "config databases $database", $db ); dump_yaml( 'html_markup_skip', $html_markup_skip ); print end_html;