// blob: e16e53a79ce342f37f68e8168da6f645d56f1dfe [file] [log] [blame]
using System.Collections.Generic;
namespace Lucene.Net.Facet.Taxonomy
{
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
using MatchingDocs = FacetsCollector.MatchingDocs;
using BinaryDocValues = Lucene.Net.Index.BinaryDocValues;
using BytesRef = Lucene.Net.Util.BytesRef;
using DocIdSetIterator = Lucene.Net.Search.DocIdSetIterator;
/// <summary>
/// Facet counter that decodes category ordinals directly from each matching
/// document's <see cref="BinaryDocValues"/> payload. It assumes the default
/// encoding into DocValues was used when the ordinals were written.
///
/// @lucene.experimental
/// </summary>
public class FastTaxonomyFacetCounts : Int32TaxonomyFacets
{
    /// <summary>
    /// Create <see cref="FastTaxonomyFacetCounts"/> reading ordinals from
    /// <see cref="FacetsConfig.DEFAULT_INDEX_FIELD_NAME"/>. All counting is
    /// performed by the constructor this one delegates to.
    /// </summary>
    /// <param name="taxoReader">Taxonomy reader handed to the base class.</param>
    /// <param name="config">Facets configuration handed to the base class.</param>
    /// <param name="fc">Collector whose matching documents are counted.</param>
    public FastTaxonomyFacetCounts(TaxonomyReader taxoReader, FacetsConfig config, FacetsCollector fc)
        : this(FacetsConfig.DEFAULT_INDEX_FIELD_NAME, taxoReader, config, fc)
    {
    }

    /// <summary>
    /// Create <see cref="FastTaxonomyFacetCounts"/> reading ordinals from the
    /// given <paramref name="indexFieldName"/>. Choose this overload when
    /// <see cref="FacetsConfig.SetIndexFieldName"/> was used to store some
    /// dimensions under a non-default index field name.
    /// Counting runs immediately, over <c>fc.GetMatchingDocs()</c>.
    /// </summary>
    /// <param name="indexFieldName">Name of the index field that holds the ordinals.</param>
    /// <param name="taxoReader">Taxonomy reader handed to the base class.</param>
    /// <param name="config">Facets configuration handed to the base class.</param>
    /// <param name="fc">Collector whose matching documents are counted.</param>
    public FastTaxonomyFacetCounts(string indexFieldName, TaxonomyReader taxoReader, FacetsConfig config, FacetsCollector fc)
        : base(indexFieldName, taxoReader, config)
    {
        Count(fc.GetMatchingDocs());
    }

    /// <summary>
    /// Walks every matching document of every entry in <paramref name="matchingDocs"/>,
    /// decodes the ordinals stored for it and increments the matching slot of
    /// <c>m_values</c>; finishes by calling <c>Rollup()</c>.
    /// </summary>
    /// <remarks>
    /// The payload is read as a sequence of variable-length integers: a byte with
    /// its high bit set contributes its low 7 bits and announces that more bytes
    /// follow; a byte with the high bit clear supplies the last 7 bits of the value.
    /// Each decoded value is added to the previous ordinal of the same document
    /// (starting from 0) to obtain the next ordinal.
    /// </remarks>
    private void Count(IList<FacetsCollector.MatchingDocs> matchingDocs)
    {
        // LUCENENET specific - a single scratch buffer is shared by all segments
        // and documents; allocating it outside the outer loop performs
        // significantly better.
        BytesRef scratch = new BytesRef();

        foreach (FacetsCollector.MatchingDocs segmentHits in matchingDocs)
        {
            BinaryDocValues ordinalValues = segmentHits.Context.AtomicReader.GetBinaryDocValues(m_indexFieldName);

            // A null result means this reader has no DocValues for the requested
            // category list, so there is nothing to count for this entry.
            if (ordinalValues != null)
            {
                DocIdSetIterator iterator = segmentHits.Bits.GetIterator();

                for (int docId = iterator.NextDoc();
                     docId != DocIdSetIterator.NO_MORE_DOCS;
                     docId = iterator.NextDoc())
                {
                    ordinalValues.Get(docId, scratch);

                    var buffer = scratch.Bytes;
                    int position = scratch.Offset;
                    int limit = position + scratch.Length;

                    int pending = 0;      // 7-bit groups gathered so far for the current value
                    int lastOrdinal = 0;  // previous ordinal of this document (delta base)

                    while (position < limit)
                    {
                        byte current = buffer[position];
                        position++;

                        if ((sbyte)current < 0)
                        {
                            // High bit set: continuation byte, keep accumulating.
                            pending = (pending << 7) | (current & 0x7F);
                        }
                        else
                        {
                            // High bit clear: value complete; apply it as a delta.
                            lastOrdinal += (pending << 7) | current;
                            m_values[lastOrdinal]++;
                            pending = 0;
                        }
                    }
                }
            }
        }

        Rollup();
    }
}
}