All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.datakernel.aggregation.AggregationGroupReducer Maven / Gradle / Ivy

/*
 * Copyright (C) 2015-2018 SoftIndex LLC.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package io.datakernel.aggregation;

import io.datakernel.aggregation.ot.AggregationStructure;
import io.datakernel.aggregation.util.PartitionPredicate;
import io.datakernel.async.AsyncCollector;
import io.datakernel.async.Promise;
import io.datakernel.codegen.DefiningClassLoader;
import io.datakernel.stream.AbstractStreamConsumer;
import io.datakernel.stream.StreamDataAcceptor;
import io.datakernel.stream.StreamSupplier;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.function.Function;

import static io.datakernel.util.Preconditions.checkNotNull;

public final class AggregationGroupReducer extends AbstractStreamConsumer implements StreamDataAcceptor {
	private static final Logger logger = LoggerFactory.getLogger(AggregationGroupReducer.class);

	private final AggregationChunkStorage storage;
	private final AggregationStructure aggregation;
	private final List measures;
	private final PartitionPredicate partitionPredicate;
	private final Class recordClass;
	private final Function keyFunction;
	private final Aggregate aggregate;
	private final AsyncCollector> chunksCollector;
	private final DefiningClassLoader classLoader;
	private final int chunkSize;

	private final HashMap map = new HashMap<>();

	public AggregationGroupReducer(AggregationChunkStorage storage,
			AggregationStructure aggregation, List measures,
			Class recordClass, PartitionPredicate partitionPredicate,
			Function keyFunction, Aggregate aggregate,
			int chunkSize, DefiningClassLoader classLoader) {
		this.storage = checkNotNull(storage, "Cannot create AggregationGroupReducer with AggregationChunkStorage that is null");
		this.measures = checkNotNull(measures, "Cannot create AggregationGroupReducer with measures that is null");
		this.partitionPredicate = checkNotNull(partitionPredicate, "Cannot create AggregationGroupReducer with PartitionPredicate that is null");
		this.recordClass = checkNotNull(recordClass, "Cannot create AggregationGroupReducer with recordClass that is null");
		this.keyFunction = checkNotNull(keyFunction, "Cannot create AggregationGroupReducer with keyFunction that is null");
		this.aggregate = checkNotNull(aggregate, "Cannot create AggregationGroupReducer with Aggregate that is null");
		this.chunkSize = chunkSize;
		this.aggregation = checkNotNull(aggregation, "Cannot create AggregationGroupReducer with AggregationStructure that is null");
		this.chunksCollector = AsyncCollector.create(new ArrayList<>());
		this.classLoader = checkNotNull(classLoader, "Cannot create AggregationGroupReducer with ClassLoader that is null");
	}

	public Promise> getResult() {
		return chunksCollector.get();
	}

	@Override
	public void accept(T item) {
		K key = keyFunction.apply(item);
		Object accumulator = map.get(key);
		if (accumulator != null) {
			aggregate.accumulate(accumulator, item);
		} else {
			accumulator = aggregate.createAccumulator(item);
			map.put(key, accumulator);

			if (map.size() == chunkSize) {
				doFlush();
			}
		}
	}

	@Override
	protected void onStarted() {
		getSupplier().resume(this);
	}

	@SuppressWarnings("unchecked")
	private void doFlush() {
		if (map.isEmpty())
			return;

		suspendOrResume();

		List> entryList = new ArrayList<>(map.entrySet());
		map.clear();

		entryList.sort((o1, o2) -> {
			K key1 = o1.getKey();
			K key2 = o2.getKey();
			return key1.compareTo(key2);
		});

		List list = new ArrayList<>(entryList.size());
		for (Map.Entry entry : entryList) {
			list.add((T) entry.getValue());
		}

		StreamSupplier supplier = StreamSupplier.ofIterable(list);
		AggregationChunker chunker = AggregationChunker.create(aggregation, measures, recordClass,
				partitionPredicate, storage, classLoader, chunkSize);

		chunksCollector.addPromise(
				supplier.streamTo(chunker)
						.then($ -> chunker.getResult()),
				List::addAll)
				.whenResult($ -> suspendOrResume());
	}

	private void suspendOrResume() {
		if (chunksCollector.getActivePromises() > 2) {
			logger.trace("Suspend group reduce: {}", this);
			getSupplier().suspend();
		} else {
			logger.trace("Resume group reduce: {}", this);
			getSupplier().resume(this);
		}
	}

	@Override
	protected Promise onEndOfStream() {
		doFlush();
		return chunksCollector.run().get().toVoid();
	}

	@Override
	protected void onError(Throwable e) {
		chunksCollector.close(e);
	}

	// jmx
	public void flush() {
		doFlush();
	}

	public int getBufferSize() {
		return map.size();
	}

	@Override
	public String toString() {
		return "AggregationGroupReducer{" +
				"keys=" + aggregation.getKeys() +
				"measures=" + measures +
				", chunkSize=" + chunkSize +
				", map.size=" + map.size() +
				'}';
	}
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy