solr/core/src/test/org/apache/solr/analysis/CommonGramsFilterFactoryTest.java - manifoldcf-integration-solr-3.x - Git at Google

 package org.apache.solr.analysis;

 /**
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 import org.apache.lucene.analysis.MockTokenizer;
 import org.apache.lucene.analysis.TokenStream;
 import org.apache.lucene.analysis.Tokenizer;
 import org.apache.solr.common.ResourceLoader;
 import org.apache.solr.core.SolrResourceLoader;

 import java.io.StringReader;
 import java.util.Set;
 import java.util.Map;
 import java.util.HashMap;

 /**
  * Tests for {@link CommonGramsFilterFactory}, largely copied from
  * StopFilterFactoryTest. The word lists ({@code stop-1.txt}, {@code stop-2.txt})
  * are the test files used by StopFilterFactoryTest.
  *
  * TODO: consider creating separate test files so this won't break if the stop
  * filter test files change.
  */
 public class CommonGramsFilterFactoryTest extends BaseTokenTestCase {

   /**
    * Checks that the factory loads its common words from one word file and
    * from a comma-separated list of word files, and that the
    * {@code ignoreCase} argument is honored in both cases.
    */
   public void testInform() throws Exception {
     ResourceLoader loader = new SolrResourceLoader(null, null);
     Map<String, String> args = new HashMap<String, String>(DEFAULT_VERSION_PARAM);
     args.put("ignoreCase", "true");

     // Single word file.
     args.put("words", "stop-1.txt");
     assertCommonWordsLoaded(loader, args, 2);

     // Comma-separated list of word files; the same argument map is reused
     // with only the "words" entry replaced.
     args.put("words", "stop-1.txt, stop-2.txt");
     assertCommonWordsLoaded(loader, args, 4);
   }

   /**
    * If no words are provided, then a set of english default stopwords is used.
    */
   public void testDefaults() throws Exception {
     ResourceLoader loader = new SolrResourceLoader(null, null);
     CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
     Map<String, String> args = new HashMap<String, String>(DEFAULT_VERSION_PARAM);
     factory.init(args);
     factory.inform(loader);

     Set<?> words = factory.getCommonWords();
     assertNotNull("words is null and it shouldn't be", words);
     assertTrue("default common words should contain \"the\"", words.contains("the"));

     Tokenizer tokenizer = new MockTokenizer(
         new StringReader("testing the factory"), MockTokenizer.WHITESPACE, false);
     TokenStream stream = factory.create(tokenizer);
     // "the" is a common word, so the expected stream interleaves the original
     // tokens with the "_"-joined pairs that involve it.
     assertTokenStreamContents(stream,
         new String[] { "testing", "testing_the", "the", "the_factory", "factory" });
   }

   /**
    * Initializes a fresh factory with {@code args}, informs it with
    * {@code loader}, and verifies the size of the resulting common-word set
    * and that ignoreCase is enabled.
    *
    * @param loader        resource loader handed to {@code inform}
    * @param args          factory arguments; expected to set ignoreCase to true
    * @param expectedWords number of common words the factory should report
    */
   private void assertCommonWordsLoaded(ResourceLoader loader,
       Map<String, String> args, int expectedWords) throws Exception {
     CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
     factory.init(args);
     factory.inform(loader);

     Set<?> words = factory.getCommonWords();
     assertNotNull("words is null and it shouldn't be", words);
     assertEquals("unexpected number of common words", expectedWords, words.size());
     assertTrue("ignoreCase should be true", factory.isIgnoreCase());
   }
 }
	package org.apache.solr.analysis;

	/**
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	import org.apache.lucene.analysis.MockTokenizer;
	import org.apache.lucene.analysis.TokenStream;
	import org.apache.lucene.analysis.Tokenizer;
	import org.apache.solr.common.ResourceLoader;
	import org.apache.solr.core.SolrResourceLoader;

	import java.io.StringReader;
	import java.util.Set;
	import java.util.Map;
	import java.util.HashMap;

	/**
	 * Tests for {@link CommonGramsFilterFactory}, largely copied from
	 * StopFilterFactoryTest. The word lists ({@code stop-1.txt}, {@code stop-2.txt})
	 * are the test files used by StopFilterFactoryTest.
	 *
	 * TODO: consider creating separate test files so this won't break if the stop
	 * filter test files change.
	 */
	public class CommonGramsFilterFactoryTest extends BaseTokenTestCase {

	  /**
	   * Checks that the factory loads its common words from one word file and
	   * from a comma-separated list of word files, and that the
	   * {@code ignoreCase} argument is honored in both cases.
	   */
	  public void testInform() throws Exception {
	    ResourceLoader loader = new SolrResourceLoader(null, null);
	    Map<String, String> args = new HashMap<String, String>(DEFAULT_VERSION_PARAM);
	    args.put("ignoreCase", "true");

	    // Single word file.
	    args.put("words", "stop-1.txt");
	    assertCommonWordsLoaded(loader, args, 2);

	    // Comma-separated list of word files; the same argument map is reused
	    // with only the "words" entry replaced.
	    args.put("words", "stop-1.txt, stop-2.txt");
	    assertCommonWordsLoaded(loader, args, 4);
	  }

	  /**
	   * If no words are provided, then a set of english default stopwords is used.
	   */
	  public void testDefaults() throws Exception {
	    ResourceLoader loader = new SolrResourceLoader(null, null);
	    CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
	    Map<String, String> args = new HashMap<String, String>(DEFAULT_VERSION_PARAM);
	    factory.init(args);
	    factory.inform(loader);

	    Set<?> words = factory.getCommonWords();
	    assertNotNull("words is null and it shouldn't be", words);
	    assertTrue("default common words should contain \"the\"", words.contains("the"));

	    Tokenizer tokenizer = new MockTokenizer(
	        new StringReader("testing the factory"), MockTokenizer.WHITESPACE, false);
	    TokenStream stream = factory.create(tokenizer);
	    // "the" is a common word, so the expected stream interleaves the original
	    // tokens with the "_"-joined pairs that involve it.
	    assertTokenStreamContents(stream,
	        new String[] { "testing", "testing_the", "the", "the_factory", "factory" });
	  }

	  /**
	   * Initializes a fresh factory with {@code args}, informs it with
	   * {@code loader}, and verifies the size of the resulting common-word set
	   * and that ignoreCase is enabled.
	   *
	   * @param loader        resource loader handed to {@code inform}
	   * @param args          factory arguments; expected to set ignoreCase to true
	   * @param expectedWords number of common words the factory should report
	   */
	  private void assertCommonWordsLoaded(ResourceLoader loader,
	      Map<String, String> args, int expectedWords) throws Exception {
	    CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
	    factory.init(args);
	    factory.inform(loader);

	    Set<?> words = factory.getCommonWords();
	    assertNotNull("words is null and it shouldn't be", words);
	    assertEquals("unexpected number of common words", expectedWords, words.size());
	    assertTrue("ignoreCase should be true", factory.isIgnoreCase());
	  }
	}