// org.apache.lucene.queries.spans.SpanMultiTermQueryWrapper (Maven / Gradle / Ivy)
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.queries.spans;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermStates;
import org.apache.lucene.search.BooleanClause.Occur;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.MultiTermQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.QueryVisitor;
import org.apache.lucene.search.ScoreMode;
import org.apache.lucene.search.ScoringRewrite;
import org.apache.lucene.search.TopTermsRewrite;
/**
* Wraps any {@link MultiTermQuery} as a {@link SpanQuery}, so it can be nested within other
* SpanQuery classes.
*
* The query is rewritten by default to a {@link SpanOrQuery} containing the expanded terms, but
* this can be customized.
*
*
Example:
*
*
*
* {@code
* WildcardQuery wildcard = new WildcardQuery(new Term("field", "bro?n"));
* SpanQuery spanWildcard = new SpanMultiTermQueryWrapper(wildcard);
* // do something with spanWildcard, such as use it in a SpanFirstQuery
* }
*
*
*/
public class SpanMultiTermQueryWrapper extends SpanQuery {
protected final Q query;
private SpanRewriteMethod rewriteMethod;
/**
* Create a new SpanMultiTermQueryWrapper.
*
* @param query Query to wrap.
*/
@SuppressWarnings({"rawtypes", "unchecked"})
public SpanMultiTermQueryWrapper(Q query) {
this.query = Objects.requireNonNull(query);
this.rewriteMethod = selectRewriteMethod(query);
}
private static SpanRewriteMethod selectRewriteMethod(MultiTermQuery query) {
MultiTermQuery.RewriteMethod method = query.getRewriteMethod();
if (method instanceof TopTermsRewrite) {
final int pqsize = ((TopTermsRewrite>) method).getSize();
return new TopTermsSpanBooleanQueryRewrite(pqsize);
} else {
return SCORING_SPAN_QUERY_REWRITE;
}
}
/** Expert: returns the rewriteMethod */
public final SpanRewriteMethod getRewriteMethod() {
return rewriteMethod;
}
/** Expert: sets the rewrite method. This only makes sense to be a span rewrite method. */
public final void setRewriteMethod(SpanRewriteMethod rewriteMethod) {
this.rewriteMethod = rewriteMethod;
}
@Override
public String getField() {
return query.getField();
}
@Override
public SpanWeight createWeight(IndexSearcher searcher, ScoreMode scoreMode, float boost)
throws IOException {
throw new IllegalArgumentException("Rewrite first!");
}
/** Returns the wrapped query */
public Query getWrappedQuery() {
return query;
}
@Override
public String toString(String field) {
StringBuilder builder = new StringBuilder();
builder.append("SpanMultiTermQueryWrapper(");
// NOTE: query.toString must be placed in a temp local to avoid compile errors on Java 8u20
// see
// https://bugs.openjdk.java.net/browse/JDK-8056984?page=com.atlassian.streams.streams-jira-plugin:activity-stream-issue-tab
String queryStr = query.toString(field);
builder.append(queryStr);
builder.append(")");
return builder.toString();
}
@Override
public Query rewrite(IndexSearcher indexSearcher) throws IOException {
return rewriteMethod.rewrite(indexSearcher.getIndexReader(), query);
}
@Override
public void visit(QueryVisitor visitor) {
if (visitor.acceptField(query.getField())) {
query.visit(visitor.getSubVisitor(Occur.MUST, this));
}
}
@Override
public int hashCode() {
return classHash() * 31 + query.hashCode();
}
@Override
public boolean equals(Object other) {
return sameClassAs(other) && query.equals(((SpanMultiTermQueryWrapper>) other).query);
}
/** Abstract class that defines how the query is rewritten. */
public abstract static class SpanRewriteMethod extends MultiTermQuery.RewriteMethod {
@Override
public abstract SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException;
}
/**
* A rewrite method that first translates each term into a SpanTermQuery in a {@link Occur#SHOULD}
* clause in a BooleanQuery, and keeps the scores as computed by the query.
*
* @see #setRewriteMethod
*/
public static final SpanRewriteMethod SCORING_SPAN_QUERY_REWRITE =
new SpanRewriteMethod() {
private final ScoringRewrite> delegate =
new ScoringRewrite>() {
@Override
protected List getTopLevelBuilder() {
return new ArrayList();
}
@Override
protected Query build(List builder) {
return new SpanOrQuery(builder.toArray(new SpanQuery[builder.size()]));
}
@Override
protected void checkMaxClauseCount(int count) {
// we accept all terms as SpanOrQuery has no limits
}
@Override
protected void addClause(
List topLevel,
Term term,
int docCount,
float boost,
TermStates states) {
final SpanTermQuery q = new SpanTermQuery(term, states);
topLevel.add(q);
}
};
@Override
public SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException {
return (SpanQuery) delegate.rewrite(reader, query);
}
};
/**
* A rewrite method that first translates each term into a SpanTermQuery in a {@link Occur#SHOULD}
* clause in a BooleanQuery, and keeps the scores as computed by the query.
*
* This rewrite method only uses the top scoring terms so it will not overflow the boolean max
* clause count.
*
* @see #setRewriteMethod
*/
public static final class TopTermsSpanBooleanQueryRewrite extends SpanRewriteMethod {
private final TopTermsRewrite> delegate;
/** Create a TopTermsSpanBooleanQueryRewrite for at most size
terms. */
public TopTermsSpanBooleanQueryRewrite(int size) {
delegate =
new TopTermsRewrite>(size) {
@Override
protected int getMaxSize() {
return Integer.MAX_VALUE;
}
@Override
protected List getTopLevelBuilder() {
return new ArrayList();
}
@Override
protected Query build(List builder) {
return new SpanOrQuery(builder.toArray(new SpanQuery[builder.size()]));
}
@Override
protected void addClause(
List topLevel, Term term, int docFreq, float boost, TermStates states) {
final SpanTermQuery q = new SpanTermQuery(term, states);
topLevel.add(q);
}
};
}
/** return the maximum priority queue size */
public int getSize() {
return delegate.getSize();
}
@Override
public SpanQuery rewrite(IndexReader reader, MultiTermQuery query) throws IOException {
return (SpanQuery) delegate.rewrite(reader, query);
}
@Override
public int hashCode() {
return 31 * delegate.hashCode();
}
@Override
public boolean equals(Object obj) {
if (this == obj) return true;
if (obj == null) return false;
if (getClass() != obj.getClass()) return false;
final TopTermsSpanBooleanQueryRewrite other = (TopTermsSpanBooleanQueryRewrite) obj;
return delegate.equals(other.delegate);
}
}
}