blob: 32884fe263d7cd956332ebf9ce9174007d730615 [file] [log] [blame]
using Lucene.Net.Diagnostics;
using System;
using System.Diagnostics;
using System.Runtime.CompilerServices;
using FieldInfos = Lucene.Net.Index.FieldInfos;
using IndexFormatTooNewException = Lucene.Net.Index.IndexFormatTooNewException;
using IndexFormatTooOldException = Lucene.Net.Index.IndexFormatTooOldException;
namespace Lucene.Net.Codecs.Lucene3x
{
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
using IndexInput = Lucene.Net.Store.IndexInput;
using Term = Lucene.Net.Index.Term;
/// <summary>
/// @lucene.experimental
/// </summary>
[Obsolete("(4.0) No longer used with flex indexing, except for reading old segments")]
internal sealed class SegmentTermEnum : IDisposable
#if FEATURE_CLONEABLE
, System.ICloneable
#endif
{
private IndexInput input;
internal FieldInfos fieldInfos;
internal long size;
internal long position = -1;
// Changed strings to true utf8 with length-in-bytes not
// length-in-chars
public const int FORMAT_VERSION_UTF8_LENGTH_IN_BYTES = -4;
// NOTE: always change this if you switch to a new format!
// whenever you add a new format, make it 1 smaller (negative version logic)!
public const int FORMAT_CURRENT = FORMAT_VERSION_UTF8_LENGTH_IN_BYTES;
// when removing support for old versions, leave the last supported version here
public const int FORMAT_MINIMUM = FORMAT_VERSION_UTF8_LENGTH_IN_BYTES;
private TermBuffer termBuffer = new TermBuffer();
private TermBuffer prevBuffer = new TermBuffer();
private TermBuffer scanBuffer = new TermBuffer(); // used for scanning
internal TermInfo termInfo = new TermInfo();
private readonly int format; // LUCENENET: marked readonly
private readonly bool isIndex = false; // LUCENENET: marked readonly
internal long indexPointer = 0;
internal int indexInterval; // LUCENENET NOTE: Changed from public field to internal (class is internal anyway)
internal int skipInterval;
internal int newSuffixStart;
internal int maxSkipLevels;
private bool first = true;
public SegmentTermEnum(IndexInput i, FieldInfos fis, bool isi)
{
input = i;
fieldInfos = fis;
isIndex = isi;
maxSkipLevels = 1; // use single-level skip lists for formats > -3
int firstInt = input.ReadInt32();
if (firstInt >= 0)
{
// original-format file, without explicit format version number
format = 0;
size = firstInt;
// back-compatible settings
indexInterval = 128;
skipInterval = int.MaxValue; // switch off skipTo optimization
}
else
{
// we have a format version number
format = firstInt;
// check that it is a format we can understand
if (format > FORMAT_MINIMUM)
{
throw new IndexFormatTooOldException(input, format, FORMAT_MINIMUM, FORMAT_CURRENT);
}
if (format < FORMAT_CURRENT)
{
throw new IndexFormatTooNewException(input, format, FORMAT_MINIMUM, FORMAT_CURRENT);
}
size = input.ReadInt64(); // read the size
indexInterval = input.ReadInt32();
skipInterval = input.ReadInt32();
maxSkipLevels = input.ReadInt32();
if (Debugging.AssertsEnabled)
{
Debugging.Assert(indexInterval > 0, "indexInterval={0} is negative; must be > 0", indexInterval);
Debugging.Assert(skipInterval > 0, "skipInterval={0} is negative; must be > 0", skipInterval);
}
}
}
public object Clone()
{
// LUCENENET: MemberwiseClone() doesn't throw in .NET
SegmentTermEnum clone = (SegmentTermEnum)base.MemberwiseClone();
clone.input = (IndexInput)input.Clone();
clone.termInfo = new TermInfo(termInfo);
clone.termBuffer = (TermBuffer)termBuffer.Clone();
clone.prevBuffer = (TermBuffer)prevBuffer.Clone();
clone.scanBuffer = new TermBuffer();
return clone;
}
internal void Seek(long pointer, long p, Term t, TermInfo ti)
{
input.Seek(pointer);
position = p;
termBuffer.Set(t);
prevBuffer.Reset();
//System.out.println(" ste doSeek prev=" + prevBuffer.toTerm() + " this=" + this);
termInfo.Set(ti);
first = p == -1;
}
/// <summary>
/// Increments the enumeration to the next element. True if one exists. </summary>
public bool Next()
{
prevBuffer.Set(termBuffer);
//System.out.println(" ste setPrev=" + prev() + " this=" + this);
if (position++ >= size - 1)
{
termBuffer.Reset();
//System.out.println(" EOF");
return false;
}
termBuffer.Read(input, fieldInfos);
newSuffixStart = termBuffer.newSuffixStart;
termInfo.DocFreq = input.ReadVInt32(); // read doc freq
termInfo.FreqPointer += input.ReadVInt64(); // read freq pointer
termInfo.ProxPointer += input.ReadVInt64(); // read prox pointer
if (termInfo.DocFreq >= skipInterval)
{
termInfo.SkipOffset = input.ReadVInt32();
}
if (isIndex)
{
indexPointer += input.ReadVInt64(); // read index pointer
}
//System.out.println(" ste ret term=" + term());
return true;
}
/* Optimized scan, without allocating new terms.
* Return number of invocations to next().
*
* NOTE: LUCENE-3183: if you pass Term("", "") here then this
* will incorrectly return before positioning the enum,
* and position will be -1; caller must detect this. */
internal int ScanTo(Term term)
{
scanBuffer.Set(term);
int count = 0;
if (first)
{
// Always force initial next() in case term is
// Term("", "")
Next();
first = false;
count++;
}
while (scanBuffer.CompareTo(termBuffer) > 0 && Next())
{
count++;
}
return count;
}
/// <summary>
/// Returns the current Term in the enumeration.
/// Initially invalid, valid after <see cref="Next()"/> called for the first time.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
public Term Term()
{
return termBuffer.ToTerm();
}
/// <summary>
/// Returns the previous Term enumerated. Initially <c>null</c>. </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
internal Term Prev()
{
return prevBuffer.ToTerm();
}
/// <summary>
/// Returns the current <see cref="Lucene3x.TermInfo"/> in the enumeration.
/// Initially invalid, valid after <see cref="Next()"/> called for the first time.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
internal TermInfo TermInfo()
{
return new TermInfo(termInfo);
}
/// <summary>
/// Sets the argument to the current <see cref="Lucene3x.TermInfo"/> in the enumeration.
/// Initially invalid, valid after <see cref="Next()"/> called for the first time.
/// </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
internal void TermInfo(TermInfo ti)
{
ti.Set(termInfo);
}
/// <summary>
/// Returns the docFreq from the current <see cref="Lucene3x.TermInfo"/> in the enumeration.
/// Initially invalid, valid after <see cref="Next()"/> called for the first time.
/// </summary>
public int DocFreq => termInfo.DocFreq;
/// <summary>
/// Returns the freqPointer from the current <see cref="Lucene3x.TermInfo"/> in the enumeration.
/// Initially invalid, valid after<see cref="Next()"/> called for the first time.
/// </summary>
internal long FreqPointer => termInfo.FreqPointer;
/// <summary>
/// Returns the proxPointer from the current <see cref="Lucene3x.TermInfo"/> in the enumeration.
/// Initially invalid, valid after<see cref="Next()"/> called for the first time.
/// </summary>
internal long ProxPointer => termInfo.ProxPointer;
/// <summary>
/// Closes the enumeration to further activity, freeing resources. </summary>
[MethodImpl(MethodImplOptions.AggressiveInlining)]
public void Dispose()
{
input.Dispose();
}
}
}