All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.lucene.util.MergedIterator Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.lucene.util;


import java.util.Iterator;
import java.util.NoSuchElementException;

import org.apache.lucene.util.PriorityQueue;

/**
 * Provides a merged sorted view from several sorted iterators.
 * 

* If built with removeDuplicates set to true and an element * appears in multiple iterators then it is deduplicated, that is this iterator * returns the sorted union of elements. *

* If built with removeDuplicates set to false then all elements * in all iterators are returned. *

* Caveats: *

    *
  • The behavior is undefined if the iterators are not actually sorted. *
  • Null elements are unsupported. *
  • If removeDuplicates is set to true and if a single iterator contains * duplicates then they will not be deduplicated. *
  • When elements are deduplicated it is not defined which one is returned. *
  • If removeDuplicates is set to false then the order in which duplicates * are returned isn't defined. *
* @lucene.internal */ public final class MergedIterator> implements Iterator { private T current; private final TermMergeQueue queue; private final SubIterator[] top; private final boolean removeDuplicates; private int numTop; @SuppressWarnings({"unchecked","rawtypes"}) public MergedIterator(Iterator... iterators) { this(true, iterators); } @SuppressWarnings({"unchecked","rawtypes"}) public MergedIterator(boolean removeDuplicates, Iterator... iterators) { this.removeDuplicates = removeDuplicates; queue = new TermMergeQueue<>(iterators.length); top = new SubIterator[iterators.length]; int index = 0; for (Iterator iterator : iterators) { if (iterator.hasNext()) { SubIterator sub = new SubIterator<>(); sub.current = iterator.next(); sub.iterator = iterator; sub.index = index++; queue.add(sub); } } } @Override public boolean hasNext() { if (queue.size() > 0) { return true; } for (int i = 0; i < numTop; i++) { if (top[i].iterator.hasNext()) { return true; } } return false; } @Override public T next() { // restore queue pushTop(); // gather equal top elements if (queue.size() > 0) { pullTop(); } else { current = null; } if (current == null) { throw new NoSuchElementException(); } return current; } @Override public void remove() { throw new UnsupportedOperationException(); } private void pullTop() { assert numTop == 0; top[numTop++] = queue.pop(); if (removeDuplicates) { // extract all subs from the queue that have the same top element while (queue.size() != 0 && queue.top().current.equals(top[0].current)) { top[numTop++] = queue.pop(); } } current = top[0].current; } private void pushTop() { // call next() on each top, and put back into queue for (int i = 0; i < numTop; i++) { if (top[i].iterator.hasNext()) { top[i].current = top[i].iterator.next(); queue.add(top[i]); } else { // no more elements top[i].current = null; } } numTop = 0; } private static class SubIterator> { Iterator iterator; I current; int index; } private static class TermMergeQueue> extends PriorityQueue> { TermMergeQueue(int size) { super(size); } @Override protected boolean lessThan(SubIterator a, SubIterator b) { final int cmp = a.current.compareTo(b.current); if (cmp != 0) { return cmp < 0; } else { return a.index < b.index; } } } }