org.elasticsearch.compute.aggregation.blockhash.TimeSeriesBlockHash Maven / Gradle / Ivy
/*
* Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
* or more contributor license agreements. Licensed under the Elastic License
* 2.0; you may not use this file except in compliance with the Elastic License
* 2.0.
*/
package org.elasticsearch.compute.aggregation.blockhash;
import org.apache.lucene.util.BytesRef;
import org.elasticsearch.common.unit.ByteSizeValue;
import org.elasticsearch.common.util.BigArrays;
import org.elasticsearch.common.util.BitArray;
import org.elasticsearch.common.util.BytesRefHash;
import org.elasticsearch.common.util.LongLongHash;
import org.elasticsearch.compute.aggregation.GroupingAggregatorFunction;
import org.elasticsearch.compute.aggregation.SeenGroupIds;
import org.elasticsearch.compute.data.Block;
import org.elasticsearch.compute.data.BytesRefBlock;
import org.elasticsearch.compute.data.BytesRefVector;
import org.elasticsearch.compute.data.IntBlock;
import org.elasticsearch.compute.data.IntVector;
import org.elasticsearch.compute.data.LongBlock;
import org.elasticsearch.compute.data.LongVector;
import org.elasticsearch.compute.data.Page;
import org.elasticsearch.compute.operator.DriverContext;
import org.elasticsearch.core.ReleasableIterator;
import org.elasticsearch.core.Releasables;
import java.util.Objects;
public final class TimeSeriesBlockHash extends BlockHash {
private final int tsHashChannel;
private final int timestampIntervalChannel;
private final BytesRefHash tsidHashes;
private final LongLongHash intervalHash;
long groupOrdinal = -1;
BytesRef previousTsidHash;
long previousTimestampInterval;
public TimeSeriesBlockHash(int tsHashChannel, int timestampIntervalChannel, DriverContext driverContext) {
super(driverContext.blockFactory());
this.tsHashChannel = tsHashChannel;
this.timestampIntervalChannel = timestampIntervalChannel;
this.tsidHashes = new BytesRefHash(1, blockFactory.bigArrays());
this.intervalHash = new LongLongHash(1, blockFactory.bigArrays());
}
@Override
public void close() {
Releasables.close(tsidHashes, intervalHash);
}
@Override
public void add(Page page, GroupingAggregatorFunction.AddInput addInput) {
BytesRefBlock tsHashBlock = page.getBlock(tsHashChannel);
BytesRefVector tsHashVector = Objects.requireNonNull(tsHashBlock.asVector());
try (var ordsBuilder = blockFactory.newIntVectorBuilder(tsHashVector.getPositionCount())) {
LongBlock timestampIntervalBlock = page.getBlock(timestampIntervalChannel);
BytesRef spare = new BytesRef();
for (int i = 0; i < tsHashVector.getPositionCount(); i++) {
BytesRef tsHash = tsHashVector.getBytesRef(i, spare);
long timestampInterval = timestampIntervalBlock.getLong(i);
// Optimization that relies on the fact that blocks are sorted by tsid hash and timestamp
if (tsHash.equals(previousTsidHash) == false || timestampInterval != previousTimestampInterval) {
long tsidOrdinal = tsidHashes.add(tsHash);
if (tsidOrdinal < 0) {
tsidOrdinal = -1 - tsidOrdinal;
}
groupOrdinal = intervalHash.add(tsidOrdinal, timestampInterval);
if (groupOrdinal < 0) {
groupOrdinal = -1 - groupOrdinal;
}
previousTsidHash = BytesRef.deepCopyOf(tsHash);
previousTimestampInterval = timestampInterval;
}
ordsBuilder.appendInt(Math.toIntExact(groupOrdinal));
}
try (var ords = ordsBuilder.build()) {
addInput.add(0, ords);
}
}
}
@Override
public ReleasableIterator lookup(Page page, ByteSizeValue targetBlockSize) {
throw new UnsupportedOperationException("TODO");
}
@Override
public Block[] getKeys() {
int positions = (int) intervalHash.size();
BytesRefVector tsidHashes = null;
LongVector timestampIntervals = null;
try (
BytesRefVector.Builder tsidHashesBuilder = blockFactory.newBytesRefVectorBuilder(positions);
LongVector.FixedBuilder timestampIntervalsBuilder = blockFactory.newLongVectorFixedBuilder(positions)
) {
BytesRef scratch = new BytesRef();
for (long i = 0; i < positions; i++) {
BytesRef key1 = this.tsidHashes.get(intervalHash.getKey1(i), scratch);
tsidHashesBuilder.appendBytesRef(key1);
timestampIntervalsBuilder.appendLong((int) i, intervalHash.getKey2(i));
}
tsidHashes = tsidHashesBuilder.build();
timestampIntervals = timestampIntervalsBuilder.build();
} finally {
if (timestampIntervals == null) {
Releasables.closeExpectNoException(tsidHashes);
}
}
return new Block[] { tsidHashes.asBlock(), timestampIntervals.asBlock() };
}
@Override
public IntVector nonEmpty() {
long endExclusive = intervalHash.size();
return IntVector.range(0, Math.toIntExact(endExclusive), blockFactory);
}
@Override
public BitArray seenGroupIds(BigArrays bigArrays) {
long size = intervalHash.size();
return new SeenGroupIds.Range(0, Math.toIntExact(size)).seenGroupIds(bigArrays);
}
public String toString() {
return "TimeSeriesBlockHash{keys=[BytesRefKey[channel="
+ tsHashChannel
+ "], LongKey[channel="
+ timestampIntervalChannel
+ "]], entries="
+ groupOrdinal
+ "b}";
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy