| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.lucene.benchmark.byTask.tasks; |
| |
| import java.io.IOException; |
| import java.io.StreamTokenizer; |
| import java.io.StringReader; |
| import java.lang.reflect.Constructor; |
| import java.util.*; |
| import org.apache.lucene.analysis.Analyzer; |
| import org.apache.lucene.benchmark.byTask.PerfRunData; |
| import org.apache.lucene.benchmark.byTask.utils.AnalyzerFactory; |
| import org.apache.lucene.util.Version; |
| |
| /** |
| * Create a new {@link org.apache.lucene.analysis.Analyzer} and set it in the getRunData() for use |
| * by all future tasks. |
| */ |
| public class NewAnalyzerTask extends PerfTask { |
| private List<String> analyzerNames; |
| private int current; |
| |
| public NewAnalyzerTask(PerfRunData runData) { |
| super(runData); |
| analyzerNames = new ArrayList<>(); |
| } |
| |
| public static final Analyzer createAnalyzer(String className) throws Exception { |
| final Class<? extends Analyzer> clazz = Class.forName(className).asSubclass(Analyzer.class); |
| try { |
| // first try to use a ctor with version parameter (needed for many new Analyzers that have no |
| // default one anymore |
| Constructor<? extends Analyzer> cnstr = clazz.getConstructor(Version.class); |
| return cnstr.newInstance(Version.LATEST); |
| } catch (NoSuchMethodException nsme) { |
| // otherwise use default ctor |
| return clazz.getConstructor().newInstance(); |
| } |
| } |
| |
| @Override |
| public int doLogic() throws IOException { |
| String analyzerName = null; |
| try { |
| if (current >= analyzerNames.size()) { |
| current = 0; |
| } |
| analyzerName = analyzerNames.get(current++); |
| Analyzer analyzer = null; |
| if (null == analyzerName || 0 == analyzerName.length()) { |
| analyzerName = "org.apache.lucene.analysis.standard.StandardAnalyzer"; |
| } |
| // First, lookup analyzerName as a named analyzer factory |
| AnalyzerFactory factory = getRunData().getAnalyzerFactories().get(analyzerName); |
| if (null != factory) { |
| analyzer = factory.create(); |
| } else { |
| if (analyzerName.contains(".")) { |
| if (analyzerName.startsWith("standard.")) { |
| analyzerName = "org.apache.lucene.analysis." + analyzerName; |
| } |
| analyzer = createAnalyzer(analyzerName); |
| } else { // No package |
| try { |
| // Attempt to instantiate a core analyzer |
| String coreClassName = "org.apache.lucene.analysis.core." + analyzerName; |
| analyzer = createAnalyzer(coreClassName); |
| analyzerName = coreClassName; |
| } catch (ClassNotFoundException e) { |
| // If not a core analyzer, try the base analysis package |
| analyzerName = "org.apache.lucene.analysis." + analyzerName; |
| analyzer = createAnalyzer(analyzerName); |
| } |
| } |
| } |
| getRunData().setAnalyzer(analyzer); |
| } catch (Exception e) { |
| throw new RuntimeException("Error creating Analyzer: " + analyzerName, e); |
| } |
| return 1; |
| } |
| |
| /** |
| * Set the params (analyzerName only), Comma-separate list of Analyzer class names. If the |
| * Analyzer lives in org.apache.lucene.analysis, the name can be shortened by dropping the o.a.l.a |
| * part of the Fully Qualified Class Name. |
| * |
| * <p>Analyzer names may also refer to previously defined AnalyzerFactory's. |
| * |
| * <p>Example Declaration: {"NewAnalyzer" NewAnalyzer(WhitespaceAnalyzer, SimpleAnalyzer, |
| * StopAnalyzer, standard.StandardAnalyzer) > |
| * |
| * <p>Example AnalyzerFactory usage: |
| * |
| * <pre> |
| * -AnalyzerFactory(name:'whitespace tokenized',WhitespaceTokenizer) |
| * -NewAnalyzer('whitespace tokenized') |
| * </pre> |
| * |
| * @param params analyzerClassName, or empty for the StandardAnalyzer |
| */ |
| @Override |
| public void setParams(String params) { |
| super.setParams(params); |
| final StreamTokenizer stok = new StreamTokenizer(new StringReader(params)); |
| stok.quoteChar('"'); |
| stok.quoteChar('\''); |
| stok.eolIsSignificant(false); |
| stok.ordinaryChar(','); |
| try { |
| while (stok.nextToken() != StreamTokenizer.TT_EOF) { |
| switch (stok.ttype) { |
| case ',': |
| { |
| // Do nothing |
| break; |
| } |
| case '\'': |
| case '\"': |
| case StreamTokenizer.TT_WORD: |
| { |
| analyzerNames.add(stok.sval); |
| break; |
| } |
| default: |
| { |
| throw new RuntimeException("Unexpected token: " + stok.toString()); |
| } |
| } |
| } |
| } catch (RuntimeException e) { |
| if (e.getMessage().startsWith("Line #")) { |
| throw e; |
| } else { |
| throw new RuntimeException("Line #" + (stok.lineno() + getAlgLineNum()) + ": ", e); |
| } |
| } catch (Throwable t) { |
| throw new RuntimeException("Line #" + (stok.lineno() + getAlgLineNum()) + ": ", t); |
| } |
| } |
| |
| /* (non-Javadoc) |
| * @see org.apache.lucene.benchmark.byTask.tasks.PerfTask#supportsParams() |
| */ |
| @Override |
| public boolean supportsParams() { |
| return true; |
| } |
| } |