2 # this file implements index functions using DBI
3 # and huge amounts of memory for cache speedup
5 # this version doesn't support ident (which should be the location in
6 # the library). But that functionality is not used anyway...
# File-level state shared by the index methods below.
18 my %Table; # index tables which were visited in this run
19 my %sth_cache; # cache prepared statements
26 my $bench_time = time();
32 print STDERR "last operation took ",time()-$bench_time," seconds...\n";
34 print STDERR "$msg\n";
42 my $dbd = shift || die "need dbi_dbd= in [global] section of configuration file";
43 my $dsn = shift || die "need dbi_dsn= in [global] section of configuration file";
44 my $user = shift || die "need dbi_user= in [global] section of configuration file";
45 my $passwd = shift || die "need dbi_passwd= in [global] section of configuration file";
49 $self->{dbh} = DBI->connect("DBI:$dbd:$dsn",$user,$passwd) || die $DBI::errstr;
52 $self->bench("connected to $dbd as $user");
54 # force SQLite to support binary 0 in data (which shouldn't
55 # happen, but it did to me)
58 $self->{dbh}->{sqlite_handle_binary_nulls} = 1;
# delete_and_create: (re)create the index table named by $field.
# The table is probed with "select count(*)"; when that probe prepares,
# executes and returns a row, the table is dropped. A "create table"
# statement is then issued. Failures of the drop or create only warn.
# NOTE(review): $self and $field are unpacked on lines not visible here --
# presumably from @_; confirm.
# NOTE(review): $field is interpolated directly into the SQL text, so it has
# to be a trusted identifier.
64 sub delete_and_create {
69 #print "#### delete_and_create($field)\n";
71 my $sql = "select count(*) from $field";
72 my $sth = $self->{dbh}->prepare($sql);
73 # FIX: this is not a good way to check if table exists!
74 if ($sth && $sth->execute() && $sth->fetchrow_hashref) {
75 my $sql = "drop table $field";
# NOTE(review): a variable declared with my is not visible until the
# declaring statement has ended, so the $sth used inside this warn is the
# outer statement handle from the prepare above, not the result of do().
# The error of a failed drop is reported by $self->{dbh}->errstr().
76 my $sth = $self->{dbh}->do($sql) || warn "SQL: $sql - ".$sth->errstr();
78 $sql = "create table $field (
86 $sth = $self->{dbh}->do($sql) || warn "SQL: $sql ".$self->{dbh}->errstr();
# NOTE(review): the enclosing sub header and the unpacking of $self/$field
# are on lines not visible here; the messages below suggest this is the body
# of insert() -- confirm.
# NOTE(review): when the shifted argument is false, the right-hand side of ||
# runs, so $index_data ends up holding print's return value (a true value on
# success) rather than an empty value.
93 my $index_data = shift || print STDERR "\$index->insert($field,NULL,...)";
# The display form falls back to the index form when it is missing or false.
94 my $display = shift || $index_data;
97 print STDERR "\$index->insert() -- no value to insert\n";
103 #$sth_cache{$field."select"}->execute($index_data) || die "cache: $field select; ".$self->{dbh}->errstr();
# Reduce HTML accent entities to the single letter captured after the
# ampersand (for example "&eacute;" becomes "e"), matching case-insensitively.
105 $index_data =~ s#&(\w)(acute|cedil|circ|grave|ring|slash|tilde|uml);#$1#gi;
# Entries are keyed by the upper-cased value, so spellings that differ only
# in case share one entry and one counter.
107 my $uc = uc($index_data);
108 if (! $c_table->{$field}->{$uc}) {
109 #print stderr "in index: $index_data\n";
110 $c_table->{$field}->{$uc} = $index_data;
# NOTE(review): the statement above stored a plain string in this slot, so
# the next statement dereferences that string as a hash. With strict refs
# enabled this is a runtime error; without it, it is a symbolic reference to
# a package hash named after the string. Whether strict is in effect is not
# visible here -- confirm.
111 $c_table->{$field}->{$uc}->{display} = $display;
112 $c_count->{$field}->{$uc} = 1;
# NOTE(review): presumably the else branch (its opening line is not visible):
# count a repeated occurrence of an existing key.
114 $c_count->{$field}->{$uc}++;
# Count the rows of table $field whose item starts with the bound search
# term; both sides are passed through upper() so the match ignores case.
# NOTE(review): the enclosing sub header and the origin of $field/$where are
# on lines not visible here.
124 my $sql = "select count(*) from $field where upper(item) like upper(?)||'%'";
126 my $sth = $self->{dbh}->prepare($sql) || die $self->{dbh}->errstr();
127 $sth->execute($where) || die "sql: $sql; ".$self->{dbh}->errstr();
129 my ($total) = $sth->fetchrow_array();
131 # no results, count all
# NOTE(review): the condition guarding this fallback is not visible here.
133 my $sql = "select count(*) from $field";
135 my $sth = $self->{dbh}->prepare($sql) || die $self->{dbh}->errstr();
136 $sth->execute() || die "sql: $sql; ".$self->{dbh}->errstr();
# fetchrow_array is called in scalar context here (list context above); the
# statement selects a single column, so that column's value is returned.
137 $total = $sth->fetchrow_array();
# Paged read of an index table: optionally locate the first entry matching
# $where, then select $rows rows starting at that offset.
# NOTE(review): the enclosing sub header and the origin of $field/$where are
# on lines not visible here.
# Defaults: offset 0 and 10 rows. Because || is used, an explicit 0 for the
# row count is also replaced by 10.
151 my $from_ord = shift || 0;
152 my $rows = shift || 10;
156 my $sql = "select item,display,ord from $field";
# Prefix lookup: fetch the ord of one row whose item starts with the term.
# NOTE(review): this query has no "order by", so when several rows match,
# which one is fetched first is up to the database -- confirm the lowest ord
# is what comes back.
159 my $sql2 = "select ord from $field where upper(item) like upper(?)||'%'";
160 my $sth = $self->{dbh}->prepare($sql2) || die "sql2: $sql2; ".$self->{dbh}->errstr();
162 $sth->execute($where) || die "sql2: $sql2; ".$self->{dbh}->errstr();
163 if (my $row = $sth->fetchrow_hashref) {
# Shift the requested offset so that it is relative to the matched row.
164 $from_ord += $row->{ord} - 1;
166 # if no match is found when searching from beginning
167 # of word in index, try substring match anywhere
# NOTE(review): the pattern below is '% ' + term + '%', so the term has to be
# preceded by a space; it matches the start of a later word rather than an
# arbitrary substring.
168 $sql2 = "select ord from $field where upper(item) like '% '||upper(?)||'%'";
169 $sth = $self->{dbh}->prepare($sql2) || die "sql2: $sql2; ".$self->{dbh}->errstr();
170 $sth->execute($where) || die "sql2: $sql2; ".$self->{dbh}->errstr();
171 if (my $row = $sth->fetchrow_hashref) {
172 $from_ord += $row->{ord} - 1;
# NOTE(review): $rows and $from_ord are interpolated into the SQL text rather
# than bound; if they can come from a request they should be checked to be
# integers first.
176 $sql .= " order by ord limit $rows offset $from_ord";
178 my $sth = $self->{dbh}->prepare($sql) || die "prepare: $sql; ".$self->{dbh}->errstr();
179 $sth->execute() || die "execute: $sql; ".$self->{dbh}->errstr();
181 while (my $row = $sth->fetchrow_hashref) {
# item is encoded with the set ' <>&"' (space included); display with '<>&"'.
182 $row->{item} = HTML::Entities::encode($row->{item},' <>&"');
183 $row->{display} = HTML::Entities::encode($row->{display},'<>&"');
# NOTE(review): assuming HTML::Entities::encode behaves like encode_entities,
# every & was just turned into &amp; above, so it looks like this pattern can
# no longer match an accent entity here -- confirm.
184 $row->{item} =~ s#&(\w)(acute|cedil|circ|grave|ring|slash|tilde|uml);#$1#gi;
# NOTE(review): the replacement &$1$2; rebuilds exactly the text that was
# matched, so this substitution leaves display unchanged.
185 $row->{display} =~ s#&(\w)(acute|cedil|circ|grave|ring|slash|tilde|uml);#&$1$2;#gi;
# Write the in-memory index ($c_table / $c_count) to the database, one table
# per key of %Table, then vacuum (Pg/SQLite only) and disconnect.
# NOTE(review): the enclosing sub header is not visible here; the message
# printed further down in this file suggests this is close() -- confirm.
# Nothing to do without a database handle.
194 return if (! $self->{dbh});
196 foreach my $table (keys %Table) {
# NOTE(review): "Crating" in the message below looks like a typo for
# "Creating"; it is a runtime string and is left unchanged here.
197 $self->bench("Crating table $table");
198 $self->delete_and_create($table);
# The inserts below run between begin_work and commit.
200 $self->{dbh}->begin_work || die $self->{dbh}->errstr();
202 $self->bench("Sorting ".$Table{$table}." (with duplicates) items in $table");
# Keys are ordered with Perl's default string sort.
203 my @keys = sort keys %{$c_table->{$table}};
205 $self->bench("Dumping ".($#keys+1)." items into $table");
206 my $sql = "insert into $table (ord,item,display,count) values (?,?,?,?)";
207 my $sth = $self->{dbh}->prepare($sql) || die "sql: $sql; ".$self->{dbh}->errstr();
# ord is assigned sequentially in sorted key order via ++$ord.
# NOTE(review): the declaration and starting value of $ord are not visible.
# NOTE(review): $c_table->{$table}->{$key} is bound as a plain value (item)
# and also dereferenced as a hash (->{display}) in the same call; a plain
# string cannot be both under strict refs -- confirm what is stored there.
210 foreach my $key (@keys) {
211 $sth->execute(++$ord,
212 $c_table->{$table}->{$key},
213 $c_table->{$table}->{$key}->{display},
214 $c_count->{$table}->{$key}
218 $self->{dbh}->commit || die $self->{dbh}->errstr();
# NOTE(review): no assignment to $self->{dbd} is visible in this excerpt;
# if it is never set, this match is against an undefined value and the
# vacuum is skipped -- confirm.
221 if ($self->{dbd} =~ m/(Pg|SQLite)/) {
# A failed vacuum only warns. ("vacumming" is a typo in the runtime message,
# left unchanged here.)
222 $self->{dbh}->do(qq{vacuum}) || warn "vacumming failed. It shouldn't if you are using PostgreSQL or SQLite: ".$self->{dbh}->errstr();
225 $self->bench("disconnecting from database");
227 $self->{dbh}->disconnect;
233 print STDERR "index_DBI fatal error: \$index->close() not called... $Count references left!\n" if ($Count > 0);
235 # print STDERR "usage\ttable\n";
236 # foreach (keys %Table) {
237 # print STDERR $Table{$_},"\t$_\n";