# my $tokenizer = KinoSearch::Analysis::Tokenizer->new( pattern => '\\w' );
+# numeric_padding values are used in range search, and must be sortable
+
+# Constructor: blesses a hash holding the index path, a first_time_indexing
+# flag (true when $index_path is not an existing directory) and the list of
+# columns that get zero-padded.
sub new {
my $class = shift @_;
my %Conf = @_;
my $self = bless {
index => $index_path,
first_time_indexing => ! -d $index_path,
+ # columns which add_doc and _field_lower_upper_term pass through _numeric_padding
+ numeric_padding => [ qw(
+ backup_date
+ date
+ ) ],
+
}, $class;
- warn "# ",dump($self);
+ #warn "# ",dump($self);
return $self;
}
# numeric
$schema->spec_field( name => $_, type => $string_type ) foreach ( qw/
- backup_date
fid
shareid
type
# sortable numeric
$schema->spec_field( name => $_, type => $sort_type ) foreach (qw/
backupnum
+ backup_date
date
size
/);
create => 1,
);
- warn "# created indexer";
+ #warn "# created indexer";
return $self->{_indexer} = $indexer;
return $hits->total_hits;
}
+# Format a number as a zero-padded, 10 digit wide string; 10 digits is
+# enough for a 32bit number (timestamp).
+sub _numeric_padding {
+	my ($number) = @_;
+	return sprintf( '%010d', $number );
+}
+
+# Index one row: stores $path with a space after every character in
+# _file_path_split, counts the call in $self->{stats}, zero-pads the
+# numeric_padding columns and hands the row to the indexer.
sub add_doc {
my ($self,$row) = @_;
$path =~ s/(.)/$1 /g; # XXX our tokenize
$row->{_file_path_split} = $path;
- warn "XXX ",dump($row) if $ENV{DEBUG};
-
$self->{stats}->{add_doc}++;
+ # fixed-width, zero-padded values for every column listed in numeric_padding
+ foreach my $col ( @{ $self->{numeric_padding} } ) {
+ $row->{$col} = _numeric_padding $row->{$col};
+ }
+
+ warn "XXX ",dump($row) if $ENV{DEBUG};
+
$self->indexer->add_doc( $row );
}
+# Commit the indexer and print a "[commit]" marker on STDERR.
sub commit {
my $self = shift;
$self->indexer->commit;
- warn "# commit index ", dump($self->{stats});
+ # short marker, no trailing newline
+ print STDERR "[commit]";
+}
+
+# Build the named arguments for a KinoSearch::Search::RangeQuery on $field.
+#
+# Arguments:
+#   $field - name of the field to constrain
+#   $lower - lower bound; ignored when false (undef, '' or 0)
+#   $upper - upper bound; ignored when false (undef, '' or 0)
+#
+# Bounds for fields listed in $self->{numeric_padding} are passed through
+# _numeric_padding, the same formatting add_doc applies to those columns.
+# Every bound that is set is inclusive.
+#
+# Returns a hash reference with field, lower_term/include_lower and
+# upper_term/include_upper (only for the bounds given), or undef when
+# neither bound was given.
+sub _field_lower_upper_term {
+	my ( $self, $field, $lower, $upper ) = @_;
+
+	# exact string comparison: the field name must never be used as a regex
+	my $is_padded = grep { $_ eq $field } @{ $self->{numeric_padding} };
+
+	my $range;
+	if ( $lower ) {
+		$range->{lower_term}    = $is_padded ? _numeric_padding( $lower ) : $lower;
+		$range->{include_lower} = 1;
+	}
+	if ( $upper ) {
+		$range->{upper_term}    = $is_padded ? _numeric_padding( $upper ) : $upper;
+		$range->{include_upper} = 1;
+	}
+	if ( $range ) {
+		$range->{field} = $field;
+
+		#warn "# $field $lower - $upper numeric_padding:$is_padded ",dump($range);
+	}
+	return $range;
}
sub search {
my $split = $q;
$split =~ s/(.)/$1 /g; # _file_path_split
- $split = qq{"$split"}; # exact ordering
+ my $split_query = KinoSearch::Search::TermQuery->new( field => '_file_path_split', term => $split );
+#warn "XXX ",dump($split_query);
+
+
+ my $query_parser = KinoSearch::Search::QueryParser->new(
+ schema => $self->searcher->get_schema,
+ fields => ['_file_path_split'],
+ );
+ my $query = $query_parser->parse( '"' . $split . '"' );
+
+ my @and_query;
+
+ if ( $shareid ) {
+ push @and_query, KinoSearch::Search::TermQuery->new( field => 'shareid', term => $shareid );
+ }
+
+ if ( my $range = $self->_field_lower_upper_term( 'backup_date', $backup_from, $backup_to ) ) {
+ push @and_query, KinoSearch::Search::RangeQuery->new( %$range );
+ }
+ if ( my $range = $self->_field_lower_upper_term( 'date', $files_from, $files_to ) ) {
+ push @and_query, KinoSearch::Search::RangeQuery->new( %$range );
+ }
+
+ if ( @and_query ) {
+ push @and_query, $query;
+ $query = KinoSearch::Search::ANDQuery->new( children => [ @and_query ] );
+ }
+
my $hits = $self->searcher->hits(
- query => $split,
+ query => m/:/ ? $q : $query,
offset => $offset,
num_wanted => $on_page,
sort_spec => $sort_spec,
my $results;
while ( my $hit = $hits->next ) {
-warn "XXX ",dump($hit);
+ warn "## hit = ",dump($hit) if $ENV{DEBUG};
push @$results, $hit;
}