4e1a8a66ab28d12a9f6e891ce20bf901c2087727
[webpac] / WebPac.pm
1 package WebPac;
2
3 use base 'CGI::Application';
4 use strict;
5
6 use HTML::Pager;
7 use HTML::FillInForm;
8 use SWISH;
9 use Text::Iconv;
10 use DBI;
11 use Config::IniFiles;
12 use Text::Unaccent;
13
14 use lib '..';
15 use index_DBI;
16 use back2html;
17
# configuration options
# FIXME they really should go in configuration file!
my $TEMPLATE_PATH = '/data/webpac/template_html';  # directory given to tmpl_path()
my $CHARSET = 'ISO-8859-2';     # charset of the generated pages and of the search input
my $SWISH = '/usr/bin/swish-e'; # swish-e binary used by SWISH 'Fork' connections
my $INDEX = '/data/webpac/index/isis.index';       # swish-e index which is searched
my $MAX_HITS = 0;               # handed to SWISH as maxhits (presumably 0 = no limit; TODO confirm)
my $ON_PAGE = 10;               # page_size for HTML::Pager

# Conversion errors must NOT raise exceptions (0 turns them off);
# convert() reports a failed conversion through its return value instead.
Text::Iconv->raise_error(0);

# converts text from UTF-8 into the charset used on the pages
my $from_utf8 = Text::Iconv->new('UTF8', $CHARSET);

# read global.conf configuration
# Config::IniFiles->new returns undef on failure and leaves the reasons
# in @Config::IniFiles::errors, so include them in the message.
my $cfg_global = Config::IniFiles->new( -file => '../global.conf' )
        or die "can't open '../global.conf': @Config::IniFiles::errors";
33
34
# Called by CGI::Application while the application object is created.
# Sets the template directory, maps every run mode to the method which
# handles it and makes 'search' the default mode. The mode is selected
# with the 'rm' request parameter and pages are sent with $CHARSET.
sub setup {
        my ($app) = @_;

        # run mode => name of the method handling it
        my @modes = (
                'search'  => 'show_search_form',
                'results' => 'show_results_list',
#               'user'    => 'show_user_detail',
                'index'   => 'show_index',
        );

        $app->tmpl_path($TEMPLATE_PATH);
        $app->run_modes(@modes);
        $app->mode_param('rm');
        $app->start_mode('search');

        $app->header_props(-charset => $CHARSET);
}
49
# Run mode 'search': render the search form.
#
# Renders the search.html template and passes the result through
# HTML::FillInForm, which fills the form named 'search' with the values
# found in the current CGI query.
# Returns the resulting HTML.
sub show_search_form {
        my $self = shift;

        # Get the CGI.pm query object
        my $q = $self->query();

        my $html = $self->load_tmpl('search.html')->output;

        # Class->new rather than the indirect "new Class" form, which
        # perl may parse differently when a sub named new() is in scope
        my $fif = HTML::FillInForm->new;

        return $fif->fill(
                scalarref => \$html,
                fobject   => $q,
                target    => 'search',
        );
}
64  
# Rewrite one value of a search field into swish-e query syntax.
#
# Accents are removed first. Quoted phrases are moved unchanged to the
# front, "+word" becomes "and word*" and "-word" becomes "and not word*"
# (without the "and" when nothing precedes it). The bare operators
# and/or/not are kept as they are and every other word gets a trailing "*".
# Returns the query fragment; it is empty if the value held no words.
sub _swish_terms {
        my $search = shift;

        # remove accents
        $search = unac_string($CHARSET, $search);

        my $s = '';
        while ($search =~ s/\s*("[^"]+")\s*/ /) {
                $s .= "$1 ";
        }
        $search =~ s/^\s+//;
        $search =~ s/\s+$//;

        # re-write query from +/- to and/and not
        foreach my $word (split(/\s+/, $search)) {
                if ($word =~ m/^([+-])(\S+)/) {
                        $s .= "and " if ($s);
                        $s .= "not " if ($1 eq "-");
                        $s .= "$2* ";
                } elsif ($word =~ m/^(?:and|or|not)$/i) {
                        # anchored: a word which merely contains an operator
                        # (e.g. "android") has to get the wildcard below
                        $s .= "$word ";
                } else {
                        $s .= "$word* ";
                }
        }
        # a word may have carried its own "*"
        $s =~ s/\*+/*/g;

        return $s;
}

# Run mode 'results': run the search and show one page of hits.
#
# Form parameters examined for N = 1..30:
#   fN        name of the field; searched as the swish-e metaname "<fN>_swish"
#   vN        value(s) to look for; several values of one field are or-ed
#   fN_index  if true, the index of field N is shown instead (see show_index)
# Clauses of different fields are and-ed. Every 'path' parameter further
# restricts the hits to that swishdocpath and switches the template to
# full record display.
#
# Returns the HTML produced by HTML::Pager from the results.html template.
# Dies with $SWISH::errstr if the connection to swish-e cannot be set up.
sub show_results_list {
        my $self = shift;

        my $q = $self->query();

        my @s_arr;              # one "field_swish=(...)" clause per used field
        my @used_fields;        # numbers of the fields found in @s_arr

        for my $i (1 .. 30) {

                return show_index($self, $i) if ($q->param("f".$i."_index"));

                my $field = $q->param("f$i");
                next if (! $field);

                # Look at every value; empty ones are skipped instead of
                # ending the loop, so that "0" or a value following an
                # empty one is searched for as well.
                my @swish_q;
                foreach my $value ($q->param("v$i")) {
                        next if (! defined($value) || $value !~ /\S/);
                        my $terms = _swish_terms($value);
                        push @swish_q, $terms if ($terms =~ /\S/);
                }
                next if (! @swish_q);

                # FIXME default operator for multi-value fields is or. There is
                # no way to change it, except here for now. Is there need?
                push @s_arr, $field."_swish=(".join(" or ",@swish_q).")";
                push @used_fields, $i;
        }

        # A double quote inside a path would end the quoted phrase it is
        # put into below, so it is dropped.
        my @path_arr;
        foreach my $path ($q->param('path')) {
                next if (! defined($path));
                my $clean = $path;
                $clean =~ tr/"//d;
                push @path_arr, $clean if (length($clean));
        }

        # load template for this page
        my $tmpl = $self->load_tmpl('results.html');

        my @swish_results;      # results from swish

        # call swish
        my $sh = SWISH->connect('Fork',
                prog     => $SWISH,
                indexes  => $INDEX,
                properties  => [qw/swishdocpath swishrank swishtitle headline html/],
                results  => sub {
                        my (undef, $hit) = @_;

                        push @swish_results, {
                                nr => scalar(@swish_results) + 1,       # 1-based hit number
                                path => $hit->swishdocpath,
                                headline => $from_utf8->convert($hit->headline),
                                html => back2html($from_utf8->convert($hit->html)),
                                rank => $hit->swishrank };

                },
                #startnum => 0,
                maxhits => $MAX_HITS
        );

        die $SWISH::errstr unless $sh;

        # construct swish query; the path restriction is joined like any
        # other clause, so there is neither a leading "and" nor a missing
        # space in front of it
        my @clauses = @s_arr;
        if (@path_arr) {
                push @clauses,
                        "(".join(" or ", map { "swishdocpath=\"$_\"" } @path_arr).")";
                $tmpl->param('full',1); # show full records
        }
        my $sw_q = join(" and ", @clauses);

        # nothing to search for means no hits; swish-e is not asked at all
        my $hits = 0;
        if (length($sw_q)) {
                $hits = $sh->query($sw_q) || 0;
        }

        $tmpl->param('hits',$hits);
        $tmpl->param('search',$sw_q);

        $tmpl->param('PAGER_offset',$q->param("PAGER_offset") || 1);
        $tmpl->param('last_PAGER_offset',$q->param("last_PAGER_offset") || 1);

        # create a Pager object
        my $pager = HTML::Pager->new(
                # required parameters
                query => $q,
                get_data_callback => sub {
                        my ($offset, $rows) = @_;

                        # hand out the hits collected above, stopping
                        # silently at the end of the list
                        my @result;
                        for my $nr ($offset .. $offset + $rows - 1) {
                                push @result, $swish_results[$nr] if $swish_results[$nr];
                        }
                        return \@result;
                },
                rows => $hits,
                page_size => $ON_PAGE,
                # some optional parameters
                # keep the run mode and every field which took part in the
                # search (any of 1..30, not just the first nine)
                persist_vars => [
                        'rm',
                        map { ("f$_", "v$_") } @used_fields
                        ],
                #cell_space_color => '#000000',
                #cell_background_color => '#ffffff',
                #nav_background_color => '#dddddd',
                #javascript_presubmit => 'last_minute_javascript()',
                # NOTE(review): debugging is still switched on - confirm
                # that this is wanted in production
                debug => 1,
                template => $tmpl,
        );

        my $html = $pager->output;

        return $html;
}
197  
# Run mode 'index': show one page of the index of a search field.
#
# Arguments:
#   $i - field number; optional. show_results_list passes it in. When the
#        sub is entered directly as a run mode there is no such argument,
#        and the first N in 1..30 with a true fN_index parameter is used.
#
# Form parameters: fN is the name of the field and vN the text handed to
# the index as limit.
#
# Returns the HTML of the index_res.html template filled by HTML::Pager,
# or of no_index.html if the index has nothing for the field.
sub show_index {
        my $self = shift;
        my $i = shift;          # field number

        my $q = $self->query();

        if (! defined($i)) {
                ($i) = grep { $q->param("f".$_."_index") } (1 .. 30);
                # nothing requested: go on with the plain "f" and "v" names
                $i = '' if (! defined($i));
        }

        my $field = $q->param("f$i");
        my $limit = $q->param("v$i");

        # scalar() keeps every setting in its own argument position even
        # if val() would return no value or several in list context
        my $index = index_DBI->new(
                scalar($cfg_global->val('global', 'dbi_dbd')),
                scalar($cfg_global->val('global', 'dbi_dsn')),
                scalar($cfg_global->val('global', 'dbi_user')),
                $cfg_global->val('global', 'dbi_passwd') || ''
        );

        my $total = $index->check($field);
        if (! $total) {
                my $tmpl = $self->load_tmpl('no_index.html');
                $tmpl->param('field',$field);
                return $tmpl->output;
        }

        my $tmpl = $self->load_tmpl('index_res.html');
        $tmpl->param('field',$field);
        $tmpl->param('limit',$limit);
        $tmpl->param('total',$total);

# FIXME I should set offset and leave out limit from fetch!!
#       if (! $q->param("PAGER_offset") {
#               $q->param("PAGER_offset")
#       }

        my $pager = HTML::Pager->new(
                query => $q,
                get_data_callback => sub {
                        my ($offset, $rows) = @_;

                        my @result = $index->fetch($field,'item',$limit, $offset, $rows);
                        return \@result;
                },
                rows => $total,
                page_size => $ON_PAGE,
                # carried over to the next page so that the same index
                # is shown again
                persist_vars => [
                        'rm',
                        "f$i", "v$i", "f".$i."_index",
                        'offset',
                        ],
                # NOTE(review): debugging is still switched on - confirm
                # that this is wanted in production
                debug => 1,
                template => $tmpl,
        );

        return $pager->output;
}
255
256 1;