org.apache.lucene.util.MergedIterator Maven / Gradle / Ivy
The newest version!
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.util;
import java.util.Iterator;
import java.util.NoSuchElementException;
import org.apache.lucene.util.PriorityQueue;
/**
* Provides a merged sorted view from several sorted iterators.
*
* If built with removeDuplicates
set to true and an element
* appears in multiple iterators then it is deduplicated, that is this iterator
* returns the sorted union of elements.
*
* If built with removeDuplicates
set to false then all elements
* in all iterators are returned.
*
* Caveats:
*
* - The behavior is undefined if the iterators are not actually sorted.
*
- Null elements are unsupported.
*
- If removeDuplicates is set to true and if a single iterator contains
* duplicates then they will not be deduplicated.
*
- When elements are deduplicated it is not defined which one is returned.
*
- If removeDuplicates is set to false then the order in which duplicates
* are returned isn't defined.
*
* @lucene.internal
*/
public final class MergedIterator> implements Iterator {
private T current;
private final TermMergeQueue queue;
private final SubIterator[] top;
private final boolean removeDuplicates;
private int numTop;
@SuppressWarnings({"unchecked","rawtypes"})
public MergedIterator(Iterator... iterators) {
this(true, iterators);
}
@SuppressWarnings({"unchecked","rawtypes"})
public MergedIterator(boolean removeDuplicates, Iterator... iterators) {
this.removeDuplicates = removeDuplicates;
queue = new TermMergeQueue<>(iterators.length);
top = new SubIterator[iterators.length];
int index = 0;
for (Iterator iterator : iterators) {
if (iterator.hasNext()) {
SubIterator sub = new SubIterator<>();
sub.current = iterator.next();
sub.iterator = iterator;
sub.index = index++;
queue.add(sub);
}
}
}
@Override
public boolean hasNext() {
if (queue.size() > 0) {
return true;
}
for (int i = 0; i < numTop; i++) {
if (top[i].iterator.hasNext()) {
return true;
}
}
return false;
}
@Override
public T next() {
// restore queue
pushTop();
// gather equal top elements
if (queue.size() > 0) {
pullTop();
} else {
current = null;
}
if (current == null) {
throw new NoSuchElementException();
}
return current;
}
@Override
public void remove() {
throw new UnsupportedOperationException();
}
private void pullTop() {
assert numTop == 0;
top[numTop++] = queue.pop();
if (removeDuplicates) {
// extract all subs from the queue that have the same top element
while (queue.size() != 0
&& queue.top().current.equals(top[0].current)) {
top[numTop++] = queue.pop();
}
}
current = top[0].current;
}
private void pushTop() {
// call next() on each top, and put back into queue
for (int i = 0; i < numTop; i++) {
if (top[i].iterator.hasNext()) {
top[i].current = top[i].iterator.next();
queue.add(top[i]);
} else {
// no more elements
top[i].current = null;
}
}
numTop = 0;
}
private static class SubIterator> {
Iterator iterator;
I current;
int index;
}
private static class TermMergeQueue> extends PriorityQueue> {
TermMergeQueue(int size) {
super(size);
}
@Override
protected boolean lessThan(SubIterator a, SubIterator b) {
final int cmp = a.current.compareTo(b.current);
if (cmp != 0) {
return cmp < 0;
} else {
return a.index < b.index;
}
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy