// io.trino.plugin.deltalake.DeltaLakeSplit - from the trino-delta-lake artifact (Trino - Delta Lake connector).
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.plugin.deltalake;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonIgnore;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import io.airlift.slice.SizeOf;
import io.trino.plugin.deltalake.transactionlog.DeletionVectorEntry;
import io.trino.spi.HostAddress;
import io.trino.spi.SplitWeight;
import io.trino.spi.connector.ConnectorSplit;
import io.trino.spi.predicate.TupleDomain;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import static com.google.common.base.MoreObjects.toStringHelper;
import static io.airlift.slice.SizeOf.LONG_INSTANCE_SIZE;
import static io.airlift.slice.SizeOf.estimatedSizeOf;
import static io.airlift.slice.SizeOf.instanceSize;
import static io.airlift.slice.SizeOf.sizeOf;
import static java.util.Objects.requireNonNull;
public class DeltaLakeSplit
implements ConnectorSplit
{
private static final int INSTANCE_SIZE = instanceSize(DeltaLakeSplit.class);
private final String path;
private final long start;
private final long length;
private final long fileSize;
private final Optional fileRowCount;
private final long fileModifiedTime;
private final Optional deletionVector;
private final SplitWeight splitWeight;
private final TupleDomain statisticsPredicate;
private final Map> partitionKeys;
@JsonCreator
public DeltaLakeSplit(
@JsonProperty("path") String path,
@JsonProperty("start") long start,
@JsonProperty("length") long length,
@JsonProperty("fileSize") long fileSize,
@JsonProperty("rowCount") Optional fileRowCount,
@JsonProperty("fileModifiedTime") long fileModifiedTime,
@JsonProperty("deletionVector") Optional deletionVector,
@JsonProperty("splitWeight") SplitWeight splitWeight,
@JsonProperty("statisticsPredicate") TupleDomain statisticsPredicate,
@JsonProperty("partitionKeys") Map> partitionKeys)
{
this.path = requireNonNull(path, "path is null");
this.start = start;
this.length = length;
this.fileSize = fileSize;
this.fileRowCount = requireNonNull(fileRowCount, "rowCount is null");
this.fileModifiedTime = fileModifiedTime;
this.deletionVector = requireNonNull(deletionVector, "deletionVector is null");
this.splitWeight = requireNonNull(splitWeight, "splitWeight is null");
this.statisticsPredicate = requireNonNull(statisticsPredicate, "statisticsPredicate is null");
this.partitionKeys = requireNonNull(partitionKeys, "partitionKeys is null");
}
@Override
public boolean isRemotelyAccessible()
{
return true;
}
@JsonIgnore
@Override
public List getAddresses()
{
return ImmutableList.of();
}
@JsonProperty
@Override
public SplitWeight getSplitWeight()
{
return splitWeight;
}
@JsonProperty
public String getPath()
{
return path;
}
@JsonProperty
public long getStart()
{
return start;
}
@JsonProperty
public long getLength()
{
return length;
}
@JsonProperty
public long getFileSize()
{
return fileSize;
}
@JsonProperty
public Optional getFileRowCount()
{
return fileRowCount;
}
@JsonProperty
public long getFileModifiedTime()
{
return fileModifiedTime;
}
@JsonProperty
public Optional getDeletionVector()
{
return deletionVector;
}
/**
* A TupleDomain representing the min/max statistics from the file this split was generated from. This does not contain any partitioning information.
*/
@JsonProperty
public TupleDomain getStatisticsPredicate()
{
return statisticsPredicate;
}
@JsonProperty
public Map> getPartitionKeys()
{
return partitionKeys;
}
@Override
public long getRetainedSizeInBytes()
{
return INSTANCE_SIZE
+ estimatedSizeOf(path)
+ sizeOf(fileRowCount, value -> LONG_INSTANCE_SIZE)
+ sizeOf(deletionVector, DeletionVectorEntry::sizeInBytes)
+ splitWeight.getRetainedSizeInBytes()
+ statisticsPredicate.getRetainedSizeInBytes(DeltaLakeColumnHandle::getRetainedSizeInBytes)
+ estimatedSizeOf(partitionKeys, SizeOf::estimatedSizeOf, value -> sizeOf(value, SizeOf::estimatedSizeOf));
}
@Override
public Object getInfo()
{
return ImmutableMap.builder()
.put("path", path)
.put("start", start)
.put("length", length)
.buildOrThrow();
}
@Override
public String toString()
{
return toStringHelper(this)
.add("path", path)
.add("start", start)
.add("length", length)
.add("fileSize", fileSize)
.add("rowCount", fileRowCount)
.add("deletionVector", deletionVector)
.add("statisticsPredicate", statisticsPredicate)
.add("partitionKeys", partitionKeys)
.toString();
}
@Override
public boolean equals(Object o)
{
if (this == o) {
return true;
}
if (o == null || getClass() != o.getClass()) {
return false;
}
DeltaLakeSplit that = (DeltaLakeSplit) o;
return start == that.start &&
length == that.length &&
fileSize == that.fileSize &&
path.equals(that.path) &&
fileRowCount.equals(that.fileRowCount) &&
deletionVector.equals(that.deletionVector) &&
Objects.equals(statisticsPredicate, that.statisticsPredicate) &&
Objects.equals(partitionKeys, that.partitionKeys);
}
@Override
public int hashCode()
{
return Objects.hash(path, start, length, fileSize, fileRowCount, deletionVector, statisticsPredicate, partitionKeys);
}
}