io.trino.plugin.hive.AcidInfo Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of trino-hive Show documentation
Show all versions of trino-hive Show documentation
This is a Databricks build of Trino's Hive plugin which includes support for HTTP-based transport
for its Hive metastore Thrift interface.
The newest version!
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.plugin.hive;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.collect.ArrayListMultimap;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ListMultimap;
import io.airlift.slice.SizeOf;
import org.apache.hadoop.fs.Path;
import java.util.ArrayList;
import java.util.List;
import java.util.Objects;
import java.util.Optional;
import static com.google.common.base.MoreObjects.toStringHelper;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Preconditions.checkState;
import static io.airlift.slice.SizeOf.estimatedSizeOf;
import static io.airlift.slice.SizeOf.instanceSize;
import static java.util.Objects.requireNonNull;
/**
 * Stores information about Acid properties of a partition.
 * <p>
 * An instance carries the partition location, the names of the delete delta
 * directories under that location, the original files selected for one bucket,
 * the bucket id, and a flag telling whether the ORC ACID version was validated.
 * Instances are immutable and are (de)serialized with Jackson through the
 * annotated constructor and getters.
 */
public class AcidInfo
{
    private static final int INSTANCE_SIZE = instanceSize(AcidInfo.class);

    private final String partitionLocation;
    private final List<String> deleteDeltas;
    private final List<OriginalFileInfo> originalFiles;
    private final int bucketId;
    private final boolean orcAcidVersionValidated;

    /**
     * Creates a new instance; both lists are defensively copied into immutable lists.
     *
     * @param partitionLocation location of the partition, must not be null
     * @param deleteDeltaDirectories names of delete delta directories, must not be null
     * @param originalFiles original files, must not be null
     * @param bucketId bucket id ({@link Builder#build()} passes {@code -1})
     * @param orcAcidVersionValidated whether the ORC ACID version was validated
     * @throws NullPointerException if any reference argument is null
     */
    @JsonCreator
    public AcidInfo(
            @JsonProperty("partitionLocation") String partitionLocation,
            @JsonProperty("deleteDeltaDirectories") List<String> deleteDeltaDirectories,
            @JsonProperty("originalFiles") List<OriginalFileInfo> originalFiles,
            @JsonProperty("bucketId") int bucketId,
            @JsonProperty("orcAcidVersionValidated") boolean orcAcidVersionValidated)
    {
        this.partitionLocation = requireNonNull(partitionLocation, "partitionLocation is null");
        this.deleteDeltas = ImmutableList.copyOf(requireNonNull(deleteDeltaDirectories, "deleteDeltaDirectories is null"));
        this.originalFiles = ImmutableList.copyOf(requireNonNull(originalFiles, "originalFiles is null"));
        this.bucketId = bucketId;
        this.orcAcidVersionValidated = orcAcidVersionValidated;
    }

    /**
     * @return immutable list of original files held by this instance
     */
    @JsonProperty
    public List<OriginalFileInfo> getOriginalFiles()
    {
        return originalFiles;
    }

    /**
     * @return the bucket id given at construction time
     */
    @JsonProperty
    public int getBucketId()
    {
        return bucketId;
    }

    /**
     * @return the partition location as a string
     */
    @JsonProperty
    public String getPartitionLocation()
    {
        return partitionLocation;
    }

    /**
     * @return immutable list of delete delta directory names
     */
    @JsonProperty
    public List<String> getDeleteDeltaDirectories()
    {
        return deleteDeltas;
    }

    /**
     * @return whether the ORC ACID version was validated
     */
    @JsonProperty
    public boolean isOrcAcidVersionValidated()
    {
        return orcAcidVersionValidated;
    }

    @Override
    public boolean equals(Object o)
    {
        if (this == o) {
            return true;
        }
        if (o == null || getClass() != o.getClass()) {
            return false;
        }

        AcidInfo that = (AcidInfo) o;
        return bucketId == that.bucketId &&
                orcAcidVersionValidated == that.orcAcidVersionValidated &&
                Objects.equals(partitionLocation, that.partitionLocation) &&
                Objects.equals(deleteDeltas, that.deleteDeltas) &&
                Objects.equals(originalFiles, that.originalFiles);
    }

    @Override
    public int hashCode()
    {
        return Objects.hash(partitionLocation, deleteDeltas, originalFiles, bucketId, orcAcidVersionValidated);
    }

    @Override
    public String toString()
    {
        return toStringHelper(this)
                .add("partitionLocation", partitionLocation)
                .add("deleteDeltas", deleteDeltas)
                .add("originalFiles", originalFiles)
                .add("bucketId", bucketId)
                .add("orcAcidVersionValidated", orcAcidVersionValidated)
                .toString();
    }

    /**
     * Estimates the memory retained by this instance: the instance itself, the
     * partition location string, the delete delta names and the original file entries.
     *
     * @return estimated retained size in bytes
     */
    public long getRetainedSizeInBytes()
    {
        return INSTANCE_SIZE
                + estimatedSizeOf(partitionLocation)
                + estimatedSizeOf(deleteDeltas, SizeOf::estimatedSizeOf)
                + estimatedSizeOf(originalFiles, OriginalFileInfo::getRetainedSizeInBytes);
    }

    /**
     * Name and size of a single original file.
     */
    public static class OriginalFileInfo
    {
        private static final int INSTANCE_SIZE = instanceSize(OriginalFileInfo.class);

        private final String name;
        private final long fileSize;

        /**
         * @param name file name, must not be null
         * @param fileSize file size as reported by the caller
         * @throws NullPointerException if {@code name} is null
         */
        @JsonCreator
        public OriginalFileInfo(
                @JsonProperty("name") String name,
                @JsonProperty("fileSize") long fileSize)
        {
            this.name = requireNonNull(name, "name is null");
            this.fileSize = fileSize;
        }

        /**
         * @return the file name
         */
        @JsonProperty
        public String getName()
        {
            return name;
        }

        /**
         * @return the file size
         */
        @JsonProperty
        public long getFileSize()
        {
            return fileSize;
        }

        @Override
        public boolean equals(Object o)
        {
            if (this == o) {
                return true;
            }
            if (o == null || getClass() != o.getClass()) {
                return false;
            }

            OriginalFileInfo that = (OriginalFileInfo) o;
            return fileSize == that.fileSize &&
                    name.equals(that.name);
        }

        @Override
        public int hashCode()
        {
            return Objects.hash(name, fileSize);
        }

        @Override
        public String toString()
        {
            return toStringHelper(this)
                    .add("name", name)
                    .add("fileSize", fileSize)
                    .toString();
        }

        /**
         * @return estimated retained size in bytes (instance plus the name string)
         */
        public long getRetainedSizeInBytes()
        {
            return INSTANCE_SIZE + estimatedSizeOf(name);
        }
    }

    /**
     * Creates a builder for the partition at the given path.
     *
     * @param partitionPath partition location, must not be null
     * @return a new builder
     */
    public static Builder builder(Path partitionPath)
    {
        return new Builder(partitionPath);
    }

    /**
     * Accumulates delete delta directories and original files for one partition
     * and produces {@link AcidInfo} instances from them.
     */
    public static class Builder
    {
        private final Path partitionLocation;
        private final List<String> deleteDeltaDirectories = new ArrayList<>();
        private final ListMultimap<Integer, OriginalFileInfo> bucketIdToOriginalFileInfoMap = ArrayListMultimap.create();
        private boolean orcAcidVersionValidated;

        private Builder(Path partitionPath)
        {
            partitionLocation = requireNonNull(partitionPath, "partitionPath is null");
        }

        /**
         * Registers a delete delta directory. Only the last path component is stored.
         *
         * @param deleteDeltaPath path of the delete delta directory; its parent must equal the partition location
         * @return this builder
         * @throws NullPointerException if {@code deleteDeltaPath} is null
         * @throws IllegalArgumentException if the parent of {@code deleteDeltaPath} differs from the partition location
         */
        public Builder addDeleteDelta(Path deleteDeltaPath)
        {
            requireNonNull(deleteDeltaPath, "deleteDeltaPath is null");
            Path partitionPathFromDeleteDelta = deleteDeltaPath.getParent();
            // The Path objects are passed as template arguments so they are only
            // stringified when the check fails, and a missing parent is reported
            // through the descriptive message instead of a bare NullPointerException.
            checkArgument(
                    partitionLocation.equals(partitionPathFromDeleteDelta),
                    "Partition location in DeleteDelta '%s' does not match stored location '%s'",
                    partitionPathFromDeleteDelta,
                    partitionLocation);

            deleteDeltaDirectories.add(deleteDeltaPath.getName());
            return this;
        }

        /**
         * Registers an original file for a bucket. Only the file name and length are stored.
         *
         * @param originalFilePath path of the original file; the path component of its parent must match that of the partition location
         * @param originalFileLength length of the file
         * @param bucketId bucket the file belongs to
         * @return this builder
         * @throws NullPointerException if {@code originalFilePath} is null
         * @throws IllegalArgumentException if the parent of {@code originalFilePath} does not match the partition location
         */
        public Builder addOriginalFile(Path originalFilePath, long originalFileLength, int bucketId)
        {
            requireNonNull(originalFilePath, "originalFilePath is null");
            Path partitionPathFromOriginalPath = originalFilePath.getParent();
            // originalFilePath has scheme in the prefix (i.e. scheme://), extract path from uri and compare.
            // A path without a parent can never match, so it fails the check rather than dereferencing null.
            checkArgument(
                    partitionPathFromOriginalPath != null
                            && partitionLocation.toUri().getPath().equals(partitionPathFromOriginalPath.toUri().getPath()),
                    "Partition location in OriginalFile '%s' does not match stored location '%s'",
                    partitionPathFromOriginalPath,
                    partitionLocation);

            bucketIdToOriginalFileInfoMap.put(bucketId, new OriginalFileInfo(originalFilePath.getName(), originalFileLength));
            return this;
        }

        /**
         * @param orcAcidVersionValidated whether the ORC ACID version was validated
         * @return this builder
         */
        public Builder setOrcAcidVersionValidated(boolean orcAcidVersionValidated)
        {
            this.orcAcidVersionValidated = orcAcidVersionValidated;
            return this;
        }

        /**
         * Builds an {@link AcidInfo} carrying the original files registered for the given bucket.
         *
         * @param bucketId non-negative bucket id for which at least one original file was added
         * @return a new {@link AcidInfo}
         * @throws IllegalStateException if {@code bucketId} is negative or has no registered original files
         */
        public AcidInfo buildWithRequiredOriginalFiles(int bucketId)
        {
            checkState(
                    bucketId > -1 && bucketIdToOriginalFileInfoMap.containsKey(bucketId),
                    "Bucket Id to OriginalFileInfo map should have entry for requested bucket id: %s",
                    bucketId);
            List<OriginalFileInfo> originalFileInfos = bucketIdToOriginalFileInfoMap.get(bucketId);
            return new AcidInfo(partitionLocation.toString(), deleteDeltaDirectories, originalFileInfos, bucketId, orcAcidVersionValidated);
        }

        /**
         * Builds an {@link AcidInfo} without original files and with bucket id {@code -1}.
         *
         * @return empty when there are no delete deltas and the ORC ACID version was validated,
         *         otherwise the built {@link AcidInfo}
         */
        public Optional<AcidInfo> build()
        {
            if (deleteDeltaDirectories.isEmpty() && orcAcidVersionValidated) {
                // We do not want to bail out with `Optional.empty()` if ORC ACID version was not validated based on _orc_acid_version file.
                // If we did so extra validation in OrcPageSourceFactory (based on file metadata) would not be performed.
                return Optional.empty();
            }
            return Optional.of(new AcidInfo(partitionLocation.toString(), deleteDeltaDirectories, ImmutableList.of(), -1, orcAcidVersionValidated));
        }
    }
}