
org.apache.lucene.search.TopDocs Maven / Gradle / Ivy
/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.lucene.search; import org.apache.lucene.util.PriorityQueue; /** Represents hits returned by {@link * IndexSearcher#search(Query,int)}. */ public class TopDocs { /** The total number of hits for the query. */ public TotalHits totalHits; /** The top hits for the query. */ public ScoreDoc[] scoreDocs; /** Constructs a TopDocs. */ public TopDocs(TotalHits totalHits, ScoreDoc[] scoreDocs) { this.totalHits = totalHits; this.scoreDocs = scoreDocs; } // Refers to one hit: private final static class ShardRef { // Which shard (index into shardHits[]): final int shardIndex; // True if we should use the incoming ScoreDoc.shardIndex for sort order final boolean useScoreDocIndex; // Which hit within the shard: int hitIndex; ShardRef(int shardIndex, boolean useScoreDocIndex) { this.shardIndex = shardIndex; this.useScoreDocIndex = useScoreDocIndex; } @Override public String toString() { return "ShardRef(shardIndex=" + shardIndex + " hitIndex=" + hitIndex + ")"; } int getShardIndex(ScoreDoc scoreDoc) { if (useScoreDocIndex) { if (scoreDoc.shardIndex == -1) { throw new IllegalArgumentException("setShardIndex is false but TopDocs[" + shardIndex + "].scoreDocs[" + hitIndex + "] is not set"); } return scoreDoc.shardIndex; } else { // NOTE: we don't assert that shardIndex is -1 here, because caller could in fact have set it but asked us to ignore it now return shardIndex; } } } /** * if we need to tie-break since score / sort value are the same we first compare shard index (lower shard wins) * and then iff shard index is the same we use the hit index. */ static boolean tieBreakLessThan(ShardRef first, ScoreDoc firstDoc, ShardRef second, ScoreDoc secondDoc) { final int firstShardIndex = first.getShardIndex(firstDoc); final int secondShardIndex = second.getShardIndex(secondDoc); // Tie break: earlier shard wins if (firstShardIndex< secondShardIndex) { return true; } else if (firstShardIndex > secondShardIndex) { return false; } else { // Tie break in same shard: resolve however the // shard had resolved it: assert first.hitIndex != second.hitIndex; return first.hitIndex < second.hitIndex; } } // Specialized MergeSortQueue that just merges by // relevance score, descending: private static class ScoreMergeSortQueue extends PriorityQueue
must be * passed to {@link TopFieldCollector#create}). * @see #merge(Sort, int, int, TopFieldDocs[], boolean) * @lucene.experimental */ public static TopFieldDocs merge(Sort sort, int topN, TopFieldDocs[] shardHits) { return merge(sort, 0, topN, shardHits, true); } /** * Same as {@link #merge(Sort, int, TopFieldDocs[])} but also ignores the top * {@code start} top docs. This is typically useful for pagination. * * Note: If {@code setShardIndex} is true, this method will assume the incoming order of {@code shardHits} reflects * each shard's index and will fill the {@link ScoreDoc#shardIndex}, otherwise * it must already be set for all incoming {@code ScoreDoc}s, which can be useful when doing multiple reductions * (merges) of TopDocs. * * @lucene.experimental */ public static TopFieldDocs merge(Sort sort, int start, int topN, TopFieldDocs[] shardHits, boolean setShardIndex) { if (sort == null) { throw new IllegalArgumentException("sort must be non-null when merging field-docs"); } return (TopFieldDocs) mergeAux(sort, start, topN, shardHits, setShardIndex); } /** Auxiliary method used by the {@link #merge} impls. A sort value of null * is used to indicate that docs should be sorted by score. */ private static TopDocs mergeAux(Sort sort, int start, int size, TopDocs[] shardHits, boolean setShardIndex) { final PriorityQueue{ final ScoreDoc[][] shardHits; public ScoreMergeSortQueue(TopDocs[] shardHits) { super(shardHits.length); this.shardHits = new ScoreDoc[shardHits.length][]; for(int shardIDX=0;shardIDX secondScoreDoc.score) { return true; } else { return tieBreakLessThan(first, firstScoreDoc, second, secondScoreDoc); } } } @SuppressWarnings({"rawtypes","unchecked"}) private static class MergeSortQueue extends PriorityQueue { // These are really FieldDoc instances: final ScoreDoc[][] shardHits; final FieldComparator>[] comparators; final int[] reverseMul; public MergeSortQueue(Sort sort, TopDocs[] shardHits) { super(shardHits.length); this.shardHits = new ScoreDoc[shardHits.length][]; for(int shardIDX=0;shardIDX fillFields=true queue; if (sort == null) { queue = new ScoreMergeSortQueue(shardHits); } else { queue = new MergeSortQueue(sort, shardHits); } long totalHitCount = 0; TotalHits.Relation totalHitsRelation = TotalHits.Relation.EQUAL_TO; int availHitCount = 0; for(int shardIDX=0;shardIDX 0) { availHitCount += shard.scoreDocs.length; queue.add(new ShardRef(shardIDX, setShardIndex == false)); } } final ScoreDoc[] hits; if (availHitCount <= start) { hits = new ScoreDoc[0]; } else { hits = new ScoreDoc[Math.min(size, availHitCount - start)]; int requestedResultWindow = start + size; int numIterOnHits = Math.min(availHitCount, requestedResultWindow); int hitUpto = 0; while (hitUpto < numIterOnHits) { assert queue.size() > 0; ShardRef ref = queue.top(); final ScoreDoc hit = shardHits[ref.shardIndex].scoreDocs[ref.hitIndex++]; if (setShardIndex) { // caller asked us to record shardIndex (index of the TopDocs array) this hit is coming from: hit.shardIndex = ref.shardIndex; } else if (hit.shardIndex == -1) { throw new IllegalArgumentException("setShardIndex is false but TopDocs[" + ref.shardIndex + "].scoreDocs[" + (ref.hitIndex-1) + "] is not set"); } if (hitUpto >= start) { hits[hitUpto - start] = hit; } hitUpto++; if (ref.hitIndex < shardHits[ref.shardIndex].scoreDocs.length) { // Not done with this these TopDocs yet: queue.updateTop(); } else { queue.pop(); } } } TotalHits totalHits = new TotalHits(totalHitCount, totalHitsRelation); if (sort == null) { return new TopDocs(totalHits, hits); } else { return new TopFieldDocs(totalHits, hits, sort.getSort()); } } }
© 2015 - 2025 Weber Informatics LLC | Privacy Policy