All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.lucene.search.MultiCollector Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.search;


import java.io.IOException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;

import org.apache.lucene.index.LeafReaderContext;

/**
 * A {@link Collector} which allows running a search with several {@link Collector}s. It offers a
 * static {@link #wrap} method which accepts a list of collectors and wraps them with {@link
 * MultiCollector}, while filtering out the null null ones.
 *
 * 

NOTE:When mixing collectors that want to skip low-scoring hits ({@link * ScoreMode#TOP_SCORES}) with ones that require to see all hits, such as mixing {@link * TopScoreDocCollector} and {@link TotalHitCountCollector}, it should be faster to run the query * twice, once for each collector, rather than using this wrapper on a single search. */ public class MultiCollector implements Collector { /** See {@link #wrap(Iterable)}. */ public static Collector wrap(Collector... collectors) { return wrap(Arrays.asList(collectors)); } /** * Wraps a list of {@link Collector}s with a {@link MultiCollector}. This * method works as follows: *

    *
  • Filters out the null collectors, so they are not used * during search time. *
  • If the input contains 1 real collector (i.e. non-null ), * it is returned. *
  • Otherwise the method returns a {@link MultiCollector} which wraps the * non-null ones. *
* * @throws IllegalArgumentException * if either 0 collectors were input, or all collectors are * null. */ public static Collector wrap(Iterable collectors) { // For the user's convenience, we allow null collectors to be passed. // However, to improve performance, these null collectors are found // and dropped from the array we save for actual collection time. int n = 0; for (Collector c : collectors) { if (c != null) { n++; } } if (n == 0) { throw new IllegalArgumentException("At least 1 collector must not be null"); } else if (n == 1) { // only 1 Collector - return it. Collector col = null; for (Collector c : collectors) { if (c != null) { col = c; break; } } return col; } else { Collector[] colls = new Collector[n]; n = 0; for (Collector c : collectors) { if (c != null) { colls[n++] = c; } } return new MultiCollector(colls); } } private final boolean cacheScores; private final Collector[] collectors; private MultiCollector(Collector... collectors) { this.collectors = collectors; int numNeedsScores = 0; for (Collector collector : collectors) { if (collector.scoreMode().needsScores()) { numNeedsScores += 1; } } this.cacheScores = numNeedsScores >= 2; } @Override public ScoreMode scoreMode() { ScoreMode scoreMode = null; for (Collector collector : collectors) { if (scoreMode == null) { scoreMode = collector.scoreMode(); } else if (scoreMode != collector.scoreMode()) { return ScoreMode.COMPLETE; } } return scoreMode; } @Override public LeafCollector getLeafCollector(LeafReaderContext context) throws IOException { final List leafCollectors = new ArrayList<>(collectors.length); ScoreMode leafScoreMode = null; for (Collector collector : collectors) { final LeafCollector leafCollector; try { leafCollector = collector.getLeafCollector(context); } catch (CollectionTerminatedException e) { // this leaf collector does not need this segment continue; } if (leafScoreMode == null) { leafScoreMode = collector.scoreMode(); } else if (leafScoreMode != collector.scoreMode()) { leafScoreMode = ScoreMode.COMPLETE; } leafCollectors.add(leafCollector); } if (leafCollectors.isEmpty()) { throw new CollectionTerminatedException(); } else { // Wraps single leaf collector that wants to skip low-scoring hits (ScoreMode.TOP_SCORES) // but the global score mode doesn't allow it. if (leafCollectors.size() == 1 && (scoreMode() == ScoreMode.TOP_SCORES || leafScoreMode != ScoreMode.TOP_SCORES)) { return leafCollectors.get(0); } return new MultiLeafCollector( leafCollectors, cacheScores, scoreMode() == ScoreMode.TOP_SCORES); } } private static class MultiLeafCollector implements LeafCollector { private final boolean cacheScores; private final LeafCollector[] collectors; private final float[] minScores; private final boolean skipNonCompetitiveScores; private MultiLeafCollector(List collectors, boolean cacheScores, boolean skipNonCompetitive) { this.collectors = collectors.toArray(new LeafCollector[collectors.size()]); this.cacheScores = cacheScores; this.skipNonCompetitiveScores = skipNonCompetitive; this.minScores = this.skipNonCompetitiveScores ? new float[this.collectors.length] : null; } @Override public void setScorer(Scorable scorer) throws IOException { if (cacheScores) { scorer = ScoreCachingWrappingScorer.wrap(scorer); } if (skipNonCompetitiveScores) { for (int i = 0; i < collectors.length; ++i) { final LeafCollector c = collectors[i]; if (c != null) { c.setScorer(new MinCompetitiveScoreAwareScorable(scorer, i, minScores)); } } } else { scorer = new FilterScorable(scorer) { @Override public void setMinCompetitiveScore(float minScore) throws IOException { // Ignore calls to setMinCompetitiveScore so that if we wrap two // collectors and one of them wants to skip low-scoring hits, then // the other collector still sees all hits. } }; for (int i = 0; i < collectors.length; ++i) { final LeafCollector c = collectors[i]; if (c != null) { c.setScorer(scorer); } } } } @Override public void collect(int doc) throws IOException { for (int i = 0; i < collectors.length; i++) { final LeafCollector collector = collectors[i]; if (collector != null) { try { collector.collect(doc); } catch (CollectionTerminatedException e) { collectors[i] = null; if (allCollectorsTerminated()) { throw new CollectionTerminatedException(); } } } } } private boolean allCollectorsTerminated() { for (int i = 0; i < collectors.length; i++) { if (collectors[i] != null) { return false; } } return true; } } final static class MinCompetitiveScoreAwareScorable extends FilterScorable { private final int idx; private final float[] minScores; MinCompetitiveScoreAwareScorable(Scorable in, int idx, float[] minScores) { super(in); this.idx = idx; this.minScores = minScores; } @Override public void setMinCompetitiveScore(float minScore) throws IOException { if (minScore > minScores[idx]) { minScores[idx] = minScore; in.setMinCompetitiveScore(minScore()); } } private float minScore() { float min = Float.MAX_VALUE; for (int i = 0; i < minScores.length; i++) { if (minScores[i] < min) { min = minScores[i]; } } return min; } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy