// blob: 09631f8040392d975faa8e1276ada3bce07433d5 [file] [log] [blame]
using Lucene.Net.Analysis;
using Lucene.Net.Documents;
using Lucene.Net.Index;
using Lucene.Net.Search;
using Lucene.Net.Util;
using NUnit.Framework;
using System;
using System.IO;
using Assert = Lucene.Net.TestFramework.Assert;
using Console = Lucene.Net.Util.SystemConsole;
namespace Lucene.Net
{
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/// <summary>
/// Builds the same index twice, once without and once with compound files,
/// runs identical queries against each, and asserts that the textual search
/// output of both runs is equal.
/// </summary>
public class TestSearchForDuplicates : LuceneTestCase
{
    internal const string PRIORITY_FIELD = "priority";
    internal const string ID_FIELD = "id";
    internal const string HIGH_PRIORITY = "high";
    internal const string MED_PRIORITY = "medium";
    internal const string LOW_PRIORITY = "low";

    /// <summary>
    /// This test compares search results when using and not using compound
    /// files.
    ///
    /// TODO: There is rudimentary search result validation as well, but it is
    /// simply based on asserting the output observed in the old test case,
    /// without really knowing if the output is correct. Someone needs to
    /// validate this output and make any changes to the CheckHits method.
    /// </summary>
    [Test]
    public void TestRun()
    {
        string multiFileOutput;
        string singleFileOutput;
        int MAX_DOCS = AtLeast(225);

        // First pass: index written without compound files.
        using (StringWriter multiFileWriter = new StringWriter())
        {
            DoTest(Random, multiFileWriter, false, MAX_DOCS);
            multiFileOutput = multiFileWriter.ToString();
        }
        //System.out.println(multiFileOutput);

        // Second pass: index written with compound files.
        using (StringWriter singleFileWriter = new StringWriter())
        {
            DoTest(Random, singleFileWriter, true, MAX_DOCS);
            singleFileOutput = singleFileWriter.ToString();
        }

        Assert.AreEqual(multiFileOutput, singleFileOutput);
    }

    /// <summary>
    /// Indexes <paramref name="MAX_DOCS"/> documents (each with a "high"
    /// priority and its ordinal as the id), then runs a single-term query
    /// and a two-clause OR query, writing the sampled hits to
    /// <paramref name="out"/> and verifying them with CheckHits.
    /// </summary>
    /// <param name="random">Random source handed to the mock analyzer.</param>
    /// <param name="out">Receives the query strings and the sampled hits.</param>
    /// <param name="useCompoundFiles">
    /// When true the merge policy's NoCFSRatio is set to 1.0, otherwise 0.0.
    /// </param>
    /// <param name="MAX_DOCS">
    /// Number of documents to index; also the number of hits requested and expected.
    /// </param>
    private void DoTest(Random random, TextWriter @out, bool useCompoundFiles, int MAX_DOCS)
    {
        // The directory, writer and reader are held in using blocks so that they
        // are disposed (in reverse order of acquisition) even when an assertion
        // or a search call throws part-way through the test.
        using (Store.Directory directory = NewDirectory())
        {
            Analyzer analyzer = new MockAnalyzer(random);
            IndexWriterConfig conf = NewIndexWriterConfig(TEST_VERSION_CURRENT, analyzer);
            MergePolicy mp = conf.MergePolicy;
            mp.NoCFSRatio = useCompoundFiles ? 1.0 : 0.0;

            using (IndexWriter writer = new IndexWriter(directory, conf))
            {
                if (Verbose)
                {
                    Console.WriteLine("TEST: now build index MAX_DOCS=" + MAX_DOCS);
                }

                for (int j = 0; j < MAX_DOCS; j++)
                {
                    Documents.Document d = new Documents.Document();
                    d.Add(NewTextField(PRIORITY_FIELD, HIGH_PRIORITY, Field.Store.YES));
                    d.Add(NewTextField(ID_FIELD, Convert.ToString(j), Field.Store.YES));
                    writer.AddDocument(d);
                }
            } // the writer is disposed here, before the reader is opened

            using (IndexReader reader = DirectoryReader.Open(directory))
            {
                // Score first, then numeric id as the tie-breaker.
                Sort sort = new Sort(SortField.FIELD_SCORE, new SortField(ID_FIELD, SortFieldType.INT32));

                // try a search without OR
                IndexSearcher searcher = NewSearcher(reader);
                Query query = new TermQuery(new Term(PRIORITY_FIELD, HIGH_PRIORITY));
                @out.WriteLine("Query: " + query.ToString(PRIORITY_FIELD));
                if (Verbose)
                {
                    Console.WriteLine("TEST: search query=" + query);
                }

                ScoreDoc[] hits = searcher.Search(query, null, MAX_DOCS, sort).ScoreDocs;
                PrintHits(@out, hits, searcher);
                CheckHits(hits, MAX_DOCS, searcher);

                // try a new search with OR
                searcher = NewSearcher(reader);
                BooleanQuery booleanQuery = new BooleanQuery();
                booleanQuery.Add(new TermQuery(new Term(PRIORITY_FIELD, HIGH_PRIORITY)), Occur.SHOULD);
                booleanQuery.Add(new TermQuery(new Term(PRIORITY_FIELD, MED_PRIORITY)), Occur.SHOULD);
                @out.WriteLine("Query: " + booleanQuery.ToString(PRIORITY_FIELD));

                hits = searcher.Search(booleanQuery, null, MAX_DOCS, sort).ScoreDocs;
                PrintHits(@out, hits, searcher);
                CheckHits(hits, MAX_DOCS, searcher);
            }
        }
    }

    /// <summary>
    /// Tells whether the hit at the given zero-based rank belongs to the
    /// sampled window (ranks 0-9 and 95-104) that is printed and verified.
    /// </summary>
    private static bool IsSampledRank(int rank)
    {
        return rank < 10 || (rank > 94 && rank < 105);
    }

    /// <summary>
    /// Writes the total hit count followed by "rank id" lines for every hit
    /// whose rank falls in the sampled window.
    /// </summary>
    private void PrintHits(TextWriter @out, ScoreDoc[] hits, IndexSearcher searcher)
    {
        @out.WriteLine(hits.Length + " total results\n");
        for (int i = 0; i < hits.Length; i++)
        {
            if (IsSampledRank(i))
            {
                Documents.Document d = searcher.Doc(hits[i].Doc);
                @out.WriteLine(i + " " + d.Get(ID_FIELD));
            }
        }
    }

    /// <summary>
    /// Asserts that exactly <paramref name="expectedCount"/> hits were
    /// returned and that, for every rank in the sampled window, the stored
    /// id of the hit equals its rank.
    /// </summary>
    private void CheckHits(ScoreDoc[] hits, int expectedCount, IndexSearcher searcher)
    {
        Assert.AreEqual(expectedCount, hits.Length, "total results");
        for (int i = 0; i < hits.Length; i++)
        {
            if (IsSampledRank(i))
            {
                Documents.Document d = searcher.Doc(hits[i].Doc);
                Assert.AreEqual(Convert.ToString(i), d.Get(ID_FIELD), "check " + i);
            }
        }
    }
}
}