blob: 0ea365fc04833fd913a40c1afedff2e82e67e78e [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.index;
import org.apache.lucene.analysis.MockAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.SortedDocValuesField;
import org.apache.lucene.document.SortedSetDocValuesField;
import org.apache.lucene.store.Directory;
import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.LongValues;
import org.apache.lucene.util.LuceneTestCase;
import org.apache.lucene.util.RamUsageTester;
import org.apache.lucene.util.TestUtil;
import java.io.IOException;
import java.lang.reflect.Field;
import java.util.HashMap;
public class TestOrdinalMap extends LuceneTestCase {
private static final Field ORDINAL_MAP_OWNER_FIELD;
static {
try {
ORDINAL_MAP_OWNER_FIELD = OrdinalMap.class.getDeclaredField("owner");
} catch (Exception e) {
throw new Error();
}
}
private static final RamUsageTester.Accumulator ORDINAL_MAP_ACCUMULATOR = new RamUsageTester.Accumulator() {
public long accumulateObject(Object o, long shallowSize, java.util.Map<Field,Object> fieldValues, java.util.Collection<Object> queue) {
if (o == LongValues.ZEROES || o == LongValues.IDENTITY) {
return 0L;
}
if (o instanceof OrdinalMap) {
fieldValues = new HashMap<>(fieldValues);
fieldValues.remove(ORDINAL_MAP_OWNER_FIELD);
}
return super.accumulateObject(o, shallowSize, fieldValues, queue);
}
};
public void testRamBytesUsed() throws IOException {
Directory dir = newDirectory();
IndexWriterConfig cfg = new IndexWriterConfig(new MockAnalyzer(random())).setCodec(TestUtil.alwaysDocValuesFormat(TestUtil.getDefaultDocValuesFormat()));
RandomIndexWriter iw = new RandomIndexWriter(random(), dir, cfg);
final int maxDoc = TestUtil.nextInt(random(), 10, 1000);
final int maxTermLength = TestUtil.nextInt(random(), 1, 4);
for (int i = 0; i < maxDoc; ++i) {
Document d = new Document();
if (random().nextBoolean()) {
d.add(new SortedDocValuesField("sdv", new BytesRef(TestUtil.randomSimpleString(random(), maxTermLength))));
}
final int numSortedSet = random().nextInt(3);
for (int j = 0; j < numSortedSet; ++j) {
d.add(new SortedSetDocValuesField("ssdv", new BytesRef(TestUtil.randomSimpleString(random(), maxTermLength))));
}
iw.addDocument(d);
if (rarely()) {
iw.getReader().close();
}
}
iw.commit();
DirectoryReader r = iw.getReader();
SortedDocValues sdv = MultiDocValues.getSortedValues(r, "sdv");
if (sdv instanceof MultiDocValues.MultiSortedDocValues) {
OrdinalMap map = ((MultiDocValues.MultiSortedDocValues) sdv).mapping;
assertEquals(RamUsageTester.sizeOf(map, ORDINAL_MAP_ACCUMULATOR), map.ramBytesUsed());
}
SortedSetDocValues ssdv = MultiDocValues.getSortedSetValues(r, "ssdv");
if (ssdv instanceof MultiDocValues.MultiSortedSetDocValues) {
OrdinalMap map = ((MultiDocValues.MultiSortedSetDocValues) ssdv).mapping;
assertEquals(RamUsageTester.sizeOf(map, ORDINAL_MAP_ACCUMULATOR), map.ramBytesUsed());
}
iw.close();
r.close();
dir.close();
}
/**
* Tests the case where one segment contains all of the global ords. In this case, we apply a
* small optimization and hardcode the first segment indices and global ord deltas as all zeroes.
*/
public void testOneSegmentWithAllValues() throws IOException {
Directory dir = newDirectory();
IndexWriterConfig cfg = new IndexWriterConfig(new MockAnalyzer(random()))
.setCodec(TestUtil.alwaysDocValuesFormat(TestUtil.getDefaultDocValuesFormat()))
.setMergePolicy(NoMergePolicy.INSTANCE);
IndexWriter iw = new IndexWriter(dir, cfg);
int numTerms = 1000;
for (int i = 0; i < numTerms; ++i) {
Document d = new Document();
String term = String.valueOf(i);
d.add(new SortedDocValuesField("sdv", new BytesRef(term)));
iw.addDocument(d);
}
iw.forceMerge(1);
for (int i = 0; i < 10; ++i) {
Document d = new Document();
String term = String.valueOf(random().nextInt(numTerms));
d.add(new SortedDocValuesField("sdv", new BytesRef(term)));
iw.addDocument(d);
}
iw.commit();
DirectoryReader r = iw.getReader();
SortedDocValues sdv = MultiDocValues.getSortedValues(r, "sdv");
assertNotNull(sdv);
assertTrue(sdv instanceof MultiDocValues.MultiSortedDocValues);
// Check that the optimization kicks in.
OrdinalMap map = ((MultiDocValues.MultiSortedDocValues) sdv).mapping;
assertEquals(LongValues.ZEROES, map.firstSegments);
assertEquals(LongValues.ZEROES, map.globalOrdDeltas);
// Check the map's basic behavior.
assertEquals(numTerms, (int) map.getValueCount());
for (int i = 0; i < numTerms; i++) {
assertEquals(0, map.getFirstSegmentNumber(i));
assertEquals(i, map.getFirstSegmentOrd(i));
}
iw.close();
r.close();
dir.close();
}
}