| package org.apache.lucene.facet.taxonomy; |
| |
| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| import java.io.IOException; |
| import java.util.List; |
| |
| import org.apache.lucene.facet.FacetsCollector; |
| import org.apache.lucene.facet.FacetsConfig; |
| import org.apache.lucene.facet.FacetsCollector.MatchingDocs; |
| import org.apache.lucene.index.BinaryDocValues; |
| import org.apache.lucene.util.BytesRef; |
| import org.apache.lucene.util.FixedBitSet; |
| |
| /** Computes facets counts, assuming the default encoding |
| * into DocValues was used. |
| * |
| * @lucene.experimental */ |
| public class FastTaxonomyFacetCounts extends IntTaxonomyFacets { |
| |
| /** Create {@code FastTaxonomyFacetCounts}, which also |
| * counts all facet labels. */ |
| public FastTaxonomyFacetCounts(TaxonomyReader taxoReader, FacetsConfig config, FacetsCollector fc) throws IOException { |
| this(FacetsConfig.DEFAULT_INDEX_FIELD_NAME, taxoReader, config, fc); |
| } |
| |
| /** Create {@code FastTaxonomyFacetCounts}, using the |
| * specified {@code indexFieldName} for ordinals. Use |
| * this if you had set {@link |
| * FacetsConfig#setIndexFieldName} to change the index |
| * field name for certain dimensions. */ |
| public FastTaxonomyFacetCounts(String indexFieldName, TaxonomyReader taxoReader, FacetsConfig config, FacetsCollector fc) throws IOException { |
| super(indexFieldName, taxoReader, config); |
| count(fc.getMatchingDocs()); |
| } |
| |
| private final void count(List<MatchingDocs> matchingDocs) throws IOException { |
| for(MatchingDocs hits : matchingDocs) { |
| BinaryDocValues dv = hits.context.reader().getBinaryDocValues(indexFieldName); |
| if (dv == null) { // this reader does not have DocValues for the requested category list |
| continue; |
| } |
| FixedBitSet bits = hits.bits; |
| |
| final int length = hits.bits.length(); |
| int doc = 0; |
| BytesRef scratch = new BytesRef(); |
| while (doc < length && (doc = bits.nextSetBit(doc)) != -1) { |
| dv.get(doc, scratch); |
| byte[] bytes = scratch.bytes; |
| int end = scratch.offset + scratch.length; |
| int ord = 0; |
| int offset = scratch.offset; |
| int prev = 0; |
| while (offset < end) { |
| byte b = bytes[offset++]; |
| if (b >= 0) { |
| prev = ord = ((ord << 7) | b) + prev; |
| ++values[ord]; |
| ord = 0; |
| } else { |
| ord = (ord << 7) | (b & 0x7F); |
| } |
| } |
| ++doc; |
| } |
| } |
| |
| rollup(); |
| } |
| } |