--- trunk/index_DBI_cache.pm 2003/07/13 21:54:22 95 +++ trunk2/lib/WebPac/Index.pm 2004/06/13 20:20:29 348 @@ -6,10 +6,13 @@ # library). But, that functionality is not used anyway... # -package index_DBI; +package WebPac::Index; use strict qw(vars); use vars qw($Count); use HTML::Entities; +use URI::Escape; +use locale; +use Carp; use DBI; @@ -34,18 +37,25 @@ sub new { my $class = shift; - my $self = {}; + my $self = {@_}; bless($self, $class); - my $dbd = shift || die "need dbi_dbd= in [global] section of configuration file"; - my $dsn = shift || die "need dbi_dsn= in [global] section of configuration file"; - my $user = shift || die "need dbi_user= in [global] section of configuration file"; - my $passwd = shift || die "need dbi_passwd= in [global] section of configuration file"; + croak "need dbd" if (! $self->{dbd}); + croak "need dsn" if (! $self->{dsn}); + croak "need user" if (! $self->{user}); + croak "need passwd" if (! $self->{passwd}); - $self->{dbh} = DBI->connect("DBI:$dbd:$dsn",$user,$passwd) || die $DBI::errstr; + $self->{dbh} = DBI->connect("DBI:$self->{dbd}:$self->{dsn}",$self->{user},$self->{passwd}) || die $DBI::errstr; $Count++; - $self->bench("connected to $dbd as $user"); + $self->bench("connected to $self->{dbd} as $self->{user}"); + + # force SQLite to support binary 0 in data (which shouldn't + # happend, but it did to me) + eval { + no warnings 'all'; + $self->{dbh}->{sqlite_handle_binary_nulls} = 1; + }; return $self; } @@ -62,10 +72,11 @@ # FIX: this is not a good way to check if table exists! if ($sth->execute() && $sth->fetchrow_hashref) { my $sql = "drop table $field"; - my $sth = $self->{dbh}->do($sql) || die "SQL: $sql ".$self->{dbh}->errstr(); + my $sth = $self->{dbh}->do($sql) || warn "SQL: $sql - ".$sth->errstr(); } $sql = "create table $field ( item varchar(255), + display text, count int, ord int, primary key (item) @@ -79,7 +90,7 @@ my $field = shift; my $index_data = shift || print STDERR "\$index->insert($field,NULL,...)"; - my $ident = shift || ''; # e.g. library id + my $display = shift || $index_data; if (! $index_data) { print STDERR "\$index->insert() -- no value to insert\n"; @@ -101,25 +112,37 @@ if (! $c_table->{$field}->{$uc}) { #print stderr "in index: $index_data\n"; $c_table->{$field}->{$uc} = $index_data; + $c_table->{$field}->{$uc}->{display} = $display; $c_count->{$field}->{$uc} = 1; } else { $c_count->{$field}->{$uc}++; } } -sub check { +sub count { my $self = shift; my $field = shift; + my $where = shift; - my $sql = "select count(*) from $field"; + my $sql = "select count(*) from $field where upper(item) like upper(?)||'%'"; my $sth = $self->{dbh}->prepare($sql) || die $self->{dbh}->errstr(); - $sth->execute() || die "sql: $sql; ".$self->{dbh}->errstr(); + $sth->execute($where) || die "sql: $sql; ".$self->{dbh}->errstr(); my ($total) = $sth->fetchrow_array(); - return $total; + # no results, count all + if (! $total) { + my $sql = "select count(*) from $field"; + + my $sth = $self->{dbh}->prepare($sql) || die $self->{dbh}->errstr(); + $sth->execute() || die "sql: $sql; ".$self->{dbh}->errstr(); + $total = $sth->fetchrow_array(); + + } + + return $total || 1; } @@ -127,7 +150,6 @@ my $self = shift; my $field = shift; - my $what = shift || 'item'; # 'item,ident' my $where = shift; my $from_ord = shift || 0; @@ -135,15 +157,24 @@ my @sql_args; - my $sql = "select $what,ord from $field"; + my $sql = "select item,display,ord from $field"; if ($where) { - my $sql2 = " select ord from $field where upper($what) like upper(?)||'%'"; + my $sql2 = "select ord from $field where upper(item) like upper(?)||'%'"; my $sth = $self->{dbh}->prepare($sql2) || die "sql2: $sql2; ".$self->{dbh}->errstr(); $sth->execute($where) || die "sql2: $sql2; ".$self->{dbh}->errstr(); if (my $row = $sth->fetchrow_hashref) { $from_ord += $row->{ord} - 1; + } else { + # if no match is found when searching from beginning + # of word in index, try substring match anywhere + $sql2 = "select ord from $field where upper(item) like '% '||upper(?)||'%'"; + $sth = $self->{dbh}->prepare($sql2) || die "sql2: $sql2; ".$self->{dbh}->errstr(); + $sth->execute($where) || die "sql2: $sql2; ".$self->{dbh}->errstr(); + if (my $row = $sth->fetchrow_hashref) { + $from_ord += $row->{ord} - 1; + } } } $sql .= " order by ord limit $rows offset $from_ord"; @@ -152,7 +183,8 @@ $sth->execute() || die "execute: $sql; ".$self->{dbh}->errstr(); my @arr; while (my $row = $sth->fetchrow_hashref) { - $row->{item} = HTML::Entities::encode($row->{item},'<>&"'); + $row->{item} = HTML::Entities::encode($row->{item},' <>&"'); + $row->{display} = HTML::Entities::encode($row->{display},'<>&"'); push @arr,$row; } return @arr; @@ -169,23 +201,29 @@ $self->{dbh}->begin_work || die $self->{dbh}->errstr(); - $self->bench("Sorting ".$Table{$table}." items in $table"); + $self->bench("Sorting ".$Table{$table}." (with duplicates) items in $table"); my @keys = sort keys %{$c_table->{$table}}; - $self->bench("Dumping data into $table"); - my $sql = "insert into $table (ord,item,count) values (?,?,?)"; + $self->bench("Dumping ".($#keys+1)." items into $table"); + my $sql = "insert into $table (ord,item,display,count) values (?,?,?,?)"; my $sth = $self->{dbh}->prepare($sql) || die "sql: $sql; ".$self->{dbh}->errstr(); my $ord = 0; foreach my $key (@keys) { $sth->execute(++$ord, $c_table->{$table}->{$key}, + $c_table->{$table}->{$key}->{display}, $c_count->{$table}->{$key} ); } $self->{dbh}->commit || die $self->{dbh}->errstr(); } + + if ($self->{dbd} =~ m/(Pg|SQLite)/) { + $self->{dbh}->do(qq{vacuum}) || warn "vacumming failed. It shouldn't if you are using PostgreSQL or SQLite: ".$self->{dbh}->errstr(); + } + $self->bench("disconnecting from database"); $self->{dbh}->disconnect;