| /* |
| * Copyright 2009-2013 by The Regents of the University of California |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * you may obtain a copy of the License from |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package edu.uci.ics.hyracks.storage.am.lsm.invertedindex.common; |
| |
| import java.io.IOException; |
| import java.util.ArrayList; |
| import java.util.List; |
| import java.util.logging.Level; |
| import java.util.logging.Logger; |
| |
| import org.junit.Test; |
| |
| import edu.uci.ics.hyracks.storage.am.common.api.IIndex; |
| import edu.uci.ics.hyracks.storage.am.common.api.IndexException; |
| import edu.uci.ics.hyracks.storage.am.common.datagen.TupleGenerator; |
| import edu.uci.ics.hyracks.storage.am.config.AccessMethodTestsConfig; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.api.IInvertedIndexSearchModifier; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.search.ConjunctiveSearchModifier; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.search.EditDistanceSearchModifier; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.search.JaccardSearchModifier; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.util.LSMInvertedIndexTestContext; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.util.LSMInvertedIndexTestContext.InvertedIndexType; |
| import edu.uci.ics.hyracks.storage.am.lsm.invertedindex.util.LSMInvertedIndexTestUtils; |
| |
| public abstract class AbstractInvertedIndexSearchTest extends AbstractInvertedIndexTest { |
| |
| protected final Logger LOGGER = Logger.getLogger(AbstractInvertedIndexSearchTest.class.getName()); |
| |
| protected int NUM_DOC_QUERIES = AccessMethodTestsConfig.LSM_INVINDEX_NUM_DOC_QUERIES; |
| protected int NUM_RANDOM_QUERIES = AccessMethodTestsConfig.LSM_INVINDEX_NUM_RANDOM_QUERIES; |
| protected final boolean bulkLoad; |
| |
| public AbstractInvertedIndexSearchTest(InvertedIndexType invIndexType, boolean bulkLoad) { |
| super(invIndexType); |
| this.bulkLoad = bulkLoad; |
| } |
| |
| protected void runTest(LSMInvertedIndexTestContext testCtx, TupleGenerator tupleGen, |
| List<IInvertedIndexSearchModifier> searchModifiers) throws IOException, IndexException { |
| IIndex invIndex = testCtx.getIndex(); |
| invIndex.create(); |
| invIndex.activate(); |
| |
| if (bulkLoad) { |
| LSMInvertedIndexTestUtils.bulkLoadInvIndex(testCtx, tupleGen, NUM_DOCS_TO_INSERT); |
| } else { |
| LSMInvertedIndexTestUtils.insertIntoInvIndex(testCtx, tupleGen, NUM_DOCS_TO_INSERT); |
| } |
| invIndex.validate(); |
| |
| for (IInvertedIndexSearchModifier searchModifier : searchModifiers) { |
| if (LOGGER.isLoggable(Level.INFO)) { |
| LOGGER.info("Running searches with: " + searchModifier.toString()); |
| } |
| LSMInvertedIndexTestUtils.testIndexSearch(testCtx, tupleGen, harness.getRandom(), NUM_DOC_QUERIES, |
| NUM_RANDOM_QUERIES, searchModifier, SCAN_COUNT_ARRAY); |
| } |
| |
| invIndex.deactivate(); |
| invIndex.destroy(); |
| } |
| |
| private void testWordInvIndexIndex(LSMInvertedIndexTestContext testCtx) throws IOException, IndexException { |
| TupleGenerator tupleGen = LSMInvertedIndexTestUtils.createStringDocumentTupleGen(harness.getRandom()); |
| List<IInvertedIndexSearchModifier> searchModifiers = new ArrayList<IInvertedIndexSearchModifier>(); |
| searchModifiers.add(new ConjunctiveSearchModifier()); |
| searchModifiers.add(new JaccardSearchModifier(1.0f)); |
| searchModifiers.add(new JaccardSearchModifier(0.9f)); |
| searchModifiers.add(new JaccardSearchModifier(0.7f)); |
| searchModifiers.add(new JaccardSearchModifier(0.5f)); |
| runTest(testCtx, tupleGen, searchModifiers); |
| } |
| |
| private void testNGramInvIndexIndex(LSMInvertedIndexTestContext testCtx) throws IOException, IndexException { |
| TupleGenerator tupleGen = LSMInvertedIndexTestUtils.createPersonNamesTupleGen(harness.getRandom()); |
| List<IInvertedIndexSearchModifier> searchModifiers = new ArrayList<IInvertedIndexSearchModifier>(); |
| searchModifiers.add(new ConjunctiveSearchModifier()); |
| searchModifiers.add(new JaccardSearchModifier(1.0f)); |
| searchModifiers.add(new JaccardSearchModifier(0.9f)); |
| searchModifiers.add(new JaccardSearchModifier(0.7f)); |
| searchModifiers.add(new JaccardSearchModifier(0.5f)); |
| searchModifiers.add(new EditDistanceSearchModifier(LSMInvertedIndexTestUtils.TEST_GRAM_LENGTH, 0)); |
| searchModifiers.add(new EditDistanceSearchModifier(LSMInvertedIndexTestUtils.TEST_GRAM_LENGTH, 1)); |
| searchModifiers.add(new EditDistanceSearchModifier(LSMInvertedIndexTestUtils.TEST_GRAM_LENGTH, 2)); |
| searchModifiers.add(new EditDistanceSearchModifier(LSMInvertedIndexTestUtils.TEST_GRAM_LENGTH, 3)); |
| runTest(testCtx, tupleGen, searchModifiers); |
| } |
| |
| @Test |
| public void wordTokensInvIndexTest() throws IOException, IndexException { |
| LSMInvertedIndexTestContext testCtx = LSMInvertedIndexTestUtils.createWordInvIndexTestContext(harness, invIndexType); |
| testWordInvIndexIndex(testCtx); |
| } |
| |
| @Test |
| public void hashedWordTokensInvIndexTest() throws IOException, IndexException { |
| LSMInvertedIndexTestContext testCtx = LSMInvertedIndexTestUtils.createHashedWordInvIndexTestContext(harness, |
| invIndexType); |
| testWordInvIndexIndex(testCtx); |
| } |
| |
| @Test |
| public void ngramTokensInvIndexTest() throws IOException, IndexException { |
| LSMInvertedIndexTestContext testCtx = LSMInvertedIndexTestUtils.createNGramInvIndexTestContext(harness, invIndexType); |
| testNGramInvIndexIndex(testCtx); |
| } |
| |
| @Test |
| public void hashedNGramTokensInvIndexTest() throws IOException, IndexException { |
| LSMInvertedIndexTestContext testCtx = LSMInvertedIndexTestUtils.createHashedNGramInvIndexTestContext(harness, |
| invIndexType); |
| testNGramInvIndexIndex(testCtx); |
| } |
| |
| } |