![JAR search and dependency download from the Maven repository](/logo.png)
com.pivovarit.collectors.ParallelStreamCollector Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of parallel-collectors Show documentation
Show all versions of parallel-collectors Show documentation
Parallel collection processing with customizable thread pools
package com.pivovarit.collectors;
import java.util.ArrayList;
import java.util.Collection;
import java.util.EnumSet;
import java.util.List;
import java.util.Set;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.Executor;
import java.util.function.BiConsumer;
import java.util.function.BinaryOperator;
import java.util.function.Function;
import java.util.function.Supplier;
import java.util.stream.Collector;
import java.util.stream.Stream;
import java.util.stream.StreamSupport;
import static com.pivovarit.collectors.AsyncParallelCollector.batch;
import static com.pivovarit.collectors.AsyncParallelCollector.requireValidParallelism;
import static com.pivovarit.collectors.BatchingStream.defaultBatchAmount;
import static com.pivovarit.collectors.BatchingStream.partitioned;
import static com.pivovarit.collectors.Dispatcher.limiting;
import static com.pivovarit.collectors.Dispatcher.unbounded;
import static java.util.Collections.emptySet;
import static java.util.Objects.requireNonNull;
import static java.util.stream.Collectors.collectingAndThen;
import static java.util.stream.Collectors.toList;
/**
* @author Grzegorz Piwowarek
*/
class ParallelStreamCollector implements Collector>, Stream> {
private static final EnumSet UNORDERED = EnumSet.of(Characteristics.UNORDERED);
private final Dispatcher dispatcher;
private final Function function;
private final Function>, Stream> processor;
private final Set characteristics;
private ParallelStreamCollector(
Function function,
Function>, Stream> processor,
Set characteristics,
Dispatcher dispatcher) {
this.processor = processor;
this.characteristics = characteristics;
this.dispatcher = dispatcher;
this.function = function;
}
private void startConsuming() {
if (!dispatcher.isRunning()) {
dispatcher.start();
}
}
@Override
public Supplier>> supplier() {
return ArrayList::new;
}
@Override
public BiConsumer>, T> accumulator() {
return (acc, e) -> {
startConsuming();
acc.add(dispatcher.enqueue(() -> function.apply(e)));
};
}
@Override
public BinaryOperator>> combiner() {
return (left, right) -> {
throw new UnsupportedOperationException();
};
}
@Override
public Function>, Stream> finisher() {
return acc -> {
dispatcher.stop();
return processor.apply(acc);
};
}
@Override
public Set characteristics() {
return characteristics;
}
static Collector> streaming(Function mapper, Executor executor) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
return new ParallelStreamCollector<>(mapper, streamInCompletionOrderStrategy(), UNORDERED, limiting(executor));
}
static Collector> streaming(Function mapper, Executor executor, int parallelism) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
requireValidParallelism(parallelism);
return new ParallelStreamCollector<>(mapper, streamInCompletionOrderStrategy(), UNORDERED, limiting(executor, parallelism));
}
static Collector> streamingInBatches(Function mapper, Executor executor) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
return collectingAndThen(collectingAndThen(toList(), list -> partitioned(list, defaultBatchAmount())
.collect(new ParallelStreamCollector<>(batch(mapper), streamInCompletionOrderStrategy(), UNORDERED, unbounded(executor)))), s -> s
.flatMap(Collection::stream));
}
static Collector> streamingInBatches(Function mapper, Executor executor, int parallelism) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
requireValidParallelism(parallelism);
return batched(new ParallelStreamCollector<>(batch(mapper), streamInCompletionOrderStrategy(), UNORDERED, unbounded(executor)), parallelism);
}
static Collector> streamingOrdered(Function mapper, Executor executor) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
return new ParallelStreamCollector<>(mapper, streamOrderedStrategy(), emptySet(), limiting(executor));
}
static Collector> streamingOrdered(Function mapper, Executor executor, int parallelism) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
requireValidParallelism(parallelism);
return new ParallelStreamCollector<>(mapper, streamOrderedStrategy(), emptySet(), limiting(executor, parallelism));
}
static Collector> streamingOrderedInBatches(Function mapper, Executor executor) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
return batched(new ParallelStreamCollector<>(batch(mapper), streamOrderedStrategy(), emptySet(), unbounded(executor)), defaultBatchAmount());
}
static Collector> streamingOrderedInBatches(Function mapper, Executor executor, int parallelism) {
requireNonNull(executor, "executor can't be null");
requireNonNull(mapper, "mapper can't be null");
requireValidParallelism(parallelism);
return batched(new ParallelStreamCollector<>(batch(mapper), streamOrderedStrategy(), emptySet(), unbounded(executor)), parallelism);
}
private static Function>, Stream> streamInCompletionOrderStrategy() {
return futures -> StreamSupport.stream(new CompletionOrderSpliterator<>(futures), false);
}
private static Function>, Stream> streamOrderedStrategy() {
return futures -> futures.stream().map(CompletableFuture::join);
}
private static Collector> batched(ParallelStreamCollector, List> collector, int parallelism) {
return collectingAndThen(collectingAndThen(toList(), list -> partitioned(list, parallelism)
.collect(collector)), s -> s.flatMap(Collection::stream));
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy