blob: c4a34f955c1a9bffff63553228522d4d25819977 [file] [log] [blame]
using Lucene.Net.Documents;
using Lucene.Net.Index.Extensions;
using NUnit.Framework;
using System;
using Assert = Lucene.Net.TestFramework.Assert;
namespace Lucene.Net.Index
{
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
using BytesRef = Lucene.Net.Util.BytesRef;
using Directory = Lucene.Net.Store.Directory;
using Document = Documents.Document;
using Field = Field;
using Lucene41PostingsFormat = Lucene.Net.Codecs.Lucene41.Lucene41PostingsFormat;
using LuceneTestCase = Lucene.Net.Util.LuceneTestCase;
using MockAnalyzer = Lucene.Net.Analysis.MockAnalyzer;
using TestUtil = Lucene.Net.Util.TestUtil;
[TestFixture]
public class TestSegmentTermEnum : LuceneTestCase
{
internal Directory dir;
[SetUp]
public override void SetUp()
{
base.SetUp();
dir = NewDirectory();
}
[TearDown]
public override void TearDown()
{
dir.Dispose();
base.TearDown();
}
[Test]
public virtual void TestTermEnum()
{
IndexWriter writer = null;
writer = new IndexWriter(dir, NewIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(Random)));
// ADD 100 documents with term : aaa
// add 100 documents with terms: aaa bbb
// Therefore, term 'aaa' has document frequency of 200 and term 'bbb' 100
for (int i = 0; i < 100; i++)
{
AddDoc(writer, "aaa");
AddDoc(writer, "aaa bbb");
}
writer.Dispose();
// verify document frequency of terms in an multi segment index
VerifyDocFreq();
// merge segments
writer = new IndexWriter(dir, NewIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(Random)).SetOpenMode(OpenMode.APPEND));
writer.ForceMerge(1);
writer.Dispose();
// verify document frequency of terms in a single segment index
VerifyDocFreq();
}
[Test]
public virtual void TestPrevTermAtEnd()
{
IndexWriter writer = new IndexWriter(dir, NewIndexWriterConfig(TEST_VERSION_CURRENT, new MockAnalyzer(Random)).SetCodec(TestUtil.AlwaysPostingsFormat(new Lucene41PostingsFormat())));
AddDoc(writer, "aaa bbb");
writer.Dispose();
SegmentReader reader = GetOnlySegmentReader(DirectoryReader.Open(dir));
TermsEnum terms = reader.Fields.GetTerms("content").GetEnumerator();
Assert.IsTrue(terms.MoveNext());
Assert.AreEqual("aaa", terms.Term.Utf8ToString());
Assert.IsTrue(terms.MoveNext());
long ordB;
try
{
ordB = terms.Ord;
}
#pragma warning disable 168
catch (NotSupportedException uoe)
#pragma warning restore 168
{
// ok -- codec is not required to support ord
reader.Dispose();
return;
}
Assert.AreEqual("bbb", terms.Term.Utf8ToString());
Assert.IsFalse(terms.MoveNext());
terms.SeekExact(ordB);
Assert.AreEqual("bbb", terms.Term.Utf8ToString());
reader.Dispose();
}
private void VerifyDocFreq()
{
IndexReader reader = DirectoryReader.Open(dir);
TermsEnum termEnum = MultiFields.GetTerms(reader, "content").GetEnumerator();
// create enumeration of all terms
// go to the first term (aaa)
termEnum.MoveNext();
// assert that term is 'aaa'
Assert.AreEqual("aaa", termEnum.Term.Utf8ToString());
Assert.AreEqual(200, termEnum.DocFreq);
// go to the second term (bbb)
termEnum.MoveNext();
// assert that term is 'bbb'
Assert.AreEqual("bbb", termEnum.Term.Utf8ToString());
Assert.AreEqual(100, termEnum.DocFreq);
// create enumeration of terms after term 'aaa',
// including 'aaa'
termEnum.SeekCeil(new BytesRef("aaa"));
// assert that term is 'aaa'
Assert.AreEqual("aaa", termEnum.Term.Utf8ToString());
Assert.AreEqual(200, termEnum.DocFreq);
// go to term 'bbb'
termEnum.MoveNext();
// assert that term is 'bbb'
Assert.AreEqual("bbb", termEnum.Term.Utf8ToString());
Assert.AreEqual(100, termEnum.DocFreq);
reader.Dispose();
}
private void AddDoc(IndexWriter writer, string value)
{
Document doc = new Document();
doc.Add(NewTextField("content", value, Field.Store.NO));
writer.AddDocument(doc);
}
}
}