| package org.apache.lucene; |
| |
| /** |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| import java.io.IOException; |
| import java.io.PrintWriter; |
| import java.io.StringWriter; |
| |
| import org.apache.lucene.store.*; |
| import org.apache.lucene.document.*; |
| import org.apache.lucene.analysis.*; |
| import org.apache.lucene.index.*; |
| import org.apache.lucene.search.*; |
| import org.apache.lucene.queryParser.*; |
| import org.apache.lucene.util.LuceneTestCase; |
| import junit.framework.TestSuite; |
| import junit.textui.TestRunner; |
| |
| public class TestSearchForDuplicates extends LuceneTestCase { |
| |
| /** Main for running test case by itself. */ |
| public static void main(String args[]) { |
| TestRunner.run (new TestSuite(TestSearchForDuplicates.class)); |
| } |
| |
| |
| |
| static final String PRIORITY_FIELD ="priority"; |
| static final String ID_FIELD ="id"; |
| static final String HIGH_PRIORITY ="high"; |
| static final String MED_PRIORITY ="medium"; |
| static final String LOW_PRIORITY ="low"; |
| |
| |
| /** This test compares search results when using and not using compound |
| * files. |
| * |
| * TODO: There is rudimentary search result validation as well, but it is |
| * simply based on asserting the output observed in the old test case, |
| * without really knowing if the output is correct. Someone needs to |
| * validate this output and make any changes to the checkHits method. |
| */ |
| public void testRun() throws Exception { |
| StringWriter sw = new StringWriter(); |
| PrintWriter pw = new PrintWriter(sw, true); |
| doTest(pw, false); |
| pw.close(); |
| sw.close(); |
| String multiFileOutput = sw.getBuffer().toString(); |
| //System.out.println(multiFileOutput); |
| |
| sw = new StringWriter(); |
| pw = new PrintWriter(sw, true); |
| doTest(pw, true); |
| pw.close(); |
| sw.close(); |
| String singleFileOutput = sw.getBuffer().toString(); |
| |
| assertEquals(multiFileOutput, singleFileOutput); |
| } |
| |
| |
| private void doTest(PrintWriter out, boolean useCompoundFiles) throws Exception { |
| Directory directory = new RAMDirectory(); |
| Analyzer analyzer = new SimpleAnalyzer(TEST_VERSION_CURRENT); |
| IndexWriterConfig conf = new IndexWriterConfig(TEST_VERSION_CURRENT, analyzer); |
| LogMergePolicy lmp = (LogMergePolicy) conf.getMergePolicy(); |
| lmp.setUseCompoundFile(useCompoundFiles); |
| lmp.setUseCompoundDocStore(useCompoundFiles); |
| IndexWriter writer = new IndexWriter(directory, conf); |
| |
| final int MAX_DOCS = 225; |
| |
| for (int j = 0; j < MAX_DOCS; j++) { |
| Document d = new Document(); |
| d.add(new Field(PRIORITY_FIELD, HIGH_PRIORITY, Field.Store.YES, Field.Index.ANALYZED)); |
| d.add(new Field(ID_FIELD, Integer.toString(j), Field.Store.YES, Field.Index.ANALYZED)); |
| writer.addDocument(d); |
| } |
| writer.close(); |
| |
| // try a search without OR |
| Searcher searcher = new IndexSearcher(directory, true); |
| |
| QueryParser parser = new QueryParser(TEST_VERSION_CURRENT, PRIORITY_FIELD, analyzer); |
| |
| Query query = parser.parse(HIGH_PRIORITY); |
| out.println("Query: " + query.toString(PRIORITY_FIELD)); |
| |
| ScoreDoc[] hits = searcher.search(query, null, MAX_DOCS).scoreDocs; |
| printHits(out, hits, searcher); |
| checkHits(hits, MAX_DOCS, searcher); |
| |
| searcher.close(); |
| |
| // try a new search with OR |
| searcher = new IndexSearcher(directory, true); |
| hits = null; |
| |
| parser = new QueryParser(TEST_VERSION_CURRENT, PRIORITY_FIELD, analyzer); |
| |
| query = parser.parse(HIGH_PRIORITY + " OR " + MED_PRIORITY); |
| out.println("Query: " + query.toString(PRIORITY_FIELD)); |
| |
| hits = searcher.search(query, null, MAX_DOCS).scoreDocs; |
| printHits(out, hits, searcher); |
| checkHits(hits, MAX_DOCS, searcher); |
| |
| searcher.close(); |
| } |
| |
| |
| private void printHits(PrintWriter out, ScoreDoc[] hits, Searcher searcher ) throws IOException { |
| out.println(hits.length + " total results\n"); |
| for (int i = 0 ; i < hits.length; i++) { |
| if ( i < 10 || (i > 94 && i < 105) ) { |
| Document d = searcher.doc(hits[i].doc); |
| out.println(i + " " + d.get(ID_FIELD)); |
| } |
| } |
| } |
| |
| private void checkHits(ScoreDoc[] hits, int expectedCount, Searcher searcher) throws IOException { |
| assertEquals("total results", expectedCount, hits.length); |
| for (int i = 0 ; i < hits.length; i++) { |
| if ( i < 10 || (i > 94 && i < 105) ) { |
| Document d = searcher.doc(hits[i].doc); |
| assertEquals("check " + i, String.valueOf(i), d.get(ID_FIELD)); |
| } |
| } |
| } |
| |
| } |