blob: e59de867394958eb767cb4ffdb64f0d99331a6b3 [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
use strict;
use warnings;
use lib 'buildlib';
use Lucy::Test;
package ControlSchema;
use base qw( Lucy::Plan::Schema );
sub new {
my $self = shift->SUPER::new(@_);
my $type = Lucy::Plan::FullTextType->new(
analyzer => Lucy::Analysis::RegexTokenizer->new );
$self->spec_field( name => 'content', type => $type );
$self->spec_field( name => 'category', type => $type );
return $self;
}
package BoostedFieldSchema;
use base qw( Lucy::Plan::Schema );
sub new {
my $self = shift->SUPER::new(@_);
my $tokenizer = Lucy::Analysis::RegexTokenizer->new;
my $plain_type = Lucy::Plan::FullTextType->new( analyzer => $tokenizer );
my $boosted_type = Lucy::Plan::FullTextType->new(
analyzer => $tokenizer,
boost => 100,
);
$self->spec_field( name => 'content', type => $plain_type );
$self->spec_field( name => 'category', type => $boosted_type );
return $self;
}
package main;
use Test::More tests => 3;
my $control_folder = Lucy::Store::RAMFolder->new;
my $boosted_doc_folder = Lucy::Store::RAMFolder->new;
my $boosted_field_folder = Lucy::Store::RAMFolder->new;
my $control_indexer = Lucy::Index::Indexer->new(
schema => ControlSchema->new,
index => $control_folder,
);
my $boosted_field_indexer = Lucy::Index::Indexer->new(
schema => BoostedFieldSchema->new,
index => $boosted_field_folder,
);
my $boosted_doc_indexer = Lucy::Index::Indexer->new(
schema => ControlSchema->new,
index => $boosted_doc_folder,
);
my %source_docs = (
'x' => '',
'x a a a a' => 'x a',
'a b' => 'x a a',
);
while ( my ( $content, $cat ) = each %source_docs ) {
my %fields = (
content => $content,
category => $cat,
);
$control_indexer->add_doc( \%fields );
$boosted_field_indexer->add_doc( \%fields );
my $boost = $content =~ /b/ ? 2 : 1;
$boosted_doc_indexer->add_doc( doc => \%fields, boost => $boost );
}
$control_indexer->commit;
$boosted_field_indexer->commit;
$boosted_doc_indexer->commit;
my $searcher = Lucy::Search::IndexSearcher->new( index => $control_folder, );
my $hits = $searcher->hits( query => 'a' );
my $hit = $hits->next;
is( $hit->{content}, "x a a a a", "best doc ranks highest with no boosting" );
$searcher
= Lucy::Search::IndexSearcher->new( index => $boosted_field_folder, );
$hits = $searcher->hits( query => 'a' );
$hit = $hits->next;
is( $hit->{content}, 'a b', "boost in FieldType works" );
$searcher = Lucy::Search::IndexSearcher->new( index => $boosted_doc_folder, );
$hits = $searcher->hits( query => 'a' );
$hit = $hits->next;
is( $hit->{content}, 'a b', "boost from \$doc->set_boost works" );