blob: 4f692ae68f652fb30dd5669f7b962b7c57aa92d2 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.search.spans;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermStates;
import org.apache.lucene.search.BooleanClause.Occur;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.MultiTermQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.QueryVisitor;
import org.apache.lucene.search.ScoreMode;
import org.apache.lucene.search.ScoringRewrite;
import org.apache.lucene.search.TopTermsRewrite;
/**
* Wraps any {@link MultiTermQuery} as a {@link SpanQuery},
* so it can be nested within other SpanQuery classes.
* <p>
* The query is rewritten by default to a {@link SpanOrQuery} containing
* the expanded terms, but this can be customized.
* <p>
* Example:
* <blockquote><pre class="prettyprint">
* {@code
* WildcardQuery wildcard = new WildcardQuery(new Term("field", "bro?n"));
* SpanQuery spanWildcard = new SpanMultiTermQueryWrapper<WildcardQuery>(wildcard);
* // do something with spanWildcard, such as use it in a SpanFirstQuery
* }
* </pre></blockquote>
*/
public class SpanMultiTermQueryWrapper<Q extends MultiTermQuery> extends SpanQuery {
protected final Q query;
private SpanRewriteMethod rewriteMethod;
/**
* Create a new SpanMultiTermQueryWrapper.
*
* @param query Query to wrap.
*/
@SuppressWarnings({"rawtypes","unchecked"})
public SpanMultiTermQueryWrapper(Q query) {
this.query = Objects.requireNonNull(query);
this.rewriteMethod = selectRewriteMethod(query);
}
private static SpanRewriteMethod selectRewriteMethod(MultiTermQuery query) {
MultiTermQuery.RewriteMethod method = query.getRewriteMethod();
if (method instanceof TopTermsRewrite) {
final int pqsize = ((TopTermsRewrite) method).getSize();
return new TopTermsSpanBooleanQueryRewrite(pqsize);
} else {
return SCORING_SPAN_QUERY_REWRITE;
}
}
/**
* Expert: returns the rewriteMethod
*/
public final SpanRewriteMethod getRewriteMethod() {
return rewriteMethod;
}
/**
* Expert: sets the rewrite method. This only makes sense
* to be a span rewrite method.
*/
public final void setRewriteMethod(SpanRewriteMethod rewriteMethod) {
this.rewriteMethod = rewriteMethod;
}
@Override
public String getField() {
return query.getField();
}
@Override
public SpanWeight createWeight(IndexSearcher searcher, ScoreMode scoreMode, float boost) throws IOException {
throw new IllegalArgumentException("Rewrite first!");
}
/** Returns the wrapped query */
public Query getWrappedQuery() {
return query;
}
@Override
public String toString(String field) {
StringBuilder builder = new StringBuilder();
builder.append("SpanMultiTermQueryWrapper(");
// NOTE: query.toString must be placed in a temp local to avoid compile errors on Java 8u20
// see https://bugs.openjdk.java.net/browse/JDK-8056984?page=com.atlassian.streams.streams-jira-plugin:activity-stream-issue-tab
String queryStr = query.toString(field);
builder.append(queryStr);
builder.append(")");
return builder.toString();
}
@Override
public Query rewrite(IndexReader reader) throws IOException {
return rewriteMethod.rewrite(reader, query);
}
@Override
public void visit(QueryVisitor visitor) {
if (visitor.acceptField(query.getField())) {
query.visit(visitor.getSubVisitor(Occur.MUST, this));
}
}
@Override
public int hashCode() {
return classHash() * 31 + query.hashCode();
}
@Override
public boolean equals(Object other) {
return sameClassAs(other) &&
query.equals(((SpanMultiTermQueryWrapper<?>) other).query);
}
/** Abstract class that defines how the query is rewritten. */
public static abstract class SpanRewriteMethod extends MultiTermQuery.RewriteMethod {
@Override
public abstract SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException;
}
/**
* A rewrite method that first translates each term into a SpanTermQuery in a
* {@link Occur#SHOULD} clause in a BooleanQuery, and keeps the
* scores as computed by the query.
*
* @see #setRewriteMethod
*/
public final static SpanRewriteMethod SCORING_SPAN_QUERY_REWRITE = new SpanRewriteMethod() {
private final ScoringRewrite<List<SpanQuery>> delegate = new ScoringRewrite<List<SpanQuery>>() {
@Override
protected List<SpanQuery> getTopLevelBuilder() {
return new ArrayList<SpanQuery>();
}
protected Query build(List<SpanQuery> builder) {
return new SpanOrQuery(builder.toArray(new SpanQuery[builder.size()]));
}
@Override
protected void checkMaxClauseCount(int count) {
// we accept all terms as SpanOrQuery has no limits
}
@Override
protected void addClause(List<SpanQuery> topLevel, Term term, int docCount, float boost, TermStates states) {
final SpanTermQuery q = new SpanTermQuery(term, states);
topLevel.add(q);
}
};
@Override
public SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException {
return (SpanQuery) delegate.rewrite(reader, query);
}
};
/**
* A rewrite method that first translates each term into a SpanTermQuery in a
* {@link Occur#SHOULD} clause in a BooleanQuery, and keeps the
* scores as computed by the query.
*
* <p>
* This rewrite method only uses the top scoring terms so it will not overflow
* the boolean max clause count.
*
* @see #setRewriteMethod
*/
public static final class TopTermsSpanBooleanQueryRewrite extends SpanRewriteMethod {
private final TopTermsRewrite<List<SpanQuery>> delegate;
/**
* Create a TopTermsSpanBooleanQueryRewrite for
* at most <code>size</code> terms.
*/
public TopTermsSpanBooleanQueryRewrite(int size) {
delegate = new TopTermsRewrite<List<SpanQuery>>(size) {
@Override
protected int getMaxSize() {
return Integer.MAX_VALUE;
}
@Override
protected List<SpanQuery> getTopLevelBuilder() {
return new ArrayList<SpanQuery>();
}
@Override
protected Query build(List<SpanQuery> builder) {
return new SpanOrQuery(builder.toArray(new SpanQuery[builder.size()]));
}
@Override
protected void addClause(List<SpanQuery> topLevel, Term term, int docFreq, float boost, TermStates states) {
final SpanTermQuery q = new SpanTermQuery(term, states);
topLevel.add(q);
}
};
}
/** return the maximum priority queue size */
public int getSize() {
return delegate.getSize();
}
@Override
public SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException {
return (SpanQuery) delegate.rewrite(reader, query);
}
@Override
public int hashCode() {
return 31 * delegate.hashCode();
}
@Override
public boolean equals(Object obj) {
if (this == obj) return true;
if (obj == null) return false;
if (getClass() != obj.getClass()) return false;
final TopTermsSpanBooleanQueryRewrite other = (TopTermsSpanBooleanQueryRewrite) obj;
return delegate.equals(other.delegate);
}
}
}