Please wait. This can take some minutes ...
Downloading a project requires significant server resources. Please understand that we have to cover our server costs. Thank you in advance.
Project price: only $1
You can buy this project and download or modify it as often as you want.
io.trino.plugin.hive.HiveTableHandle Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.plugin.hive;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonIgnore;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import io.trino.plugin.hive.acid.AcidTransaction;
import io.trino.plugin.hive.util.HiveBucketing.HiveBucketFilter;
import io.trino.plugin.hive.util.HiveUtil;
import io.trino.spi.connector.ColumnHandle;
import io.trino.spi.connector.ConnectorTableHandle;
import io.trino.spi.connector.SchemaTableName;
import io.trino.spi.predicate.TupleDomain;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.Set;
import static com.google.common.base.Preconditions.checkState;
import static io.trino.plugin.hive.acid.AcidTransaction.NO_ACID_TRANSACTION;
import static java.util.Objects.requireNonNull;
import static java.util.stream.Collectors.joining;
/**
 * Table handle for a Hive table, identified by schema name and table name.
 * <p>
 * Besides the table identity the handle carries the partition and data column
 * lists, the predicates attached to the table, optional bucketing information,
 * the optional ANALYZE settings, and the {@link AcidTransaction} the handle
 * belongs to.
 * <p>
 * All fields are final and collection arguments are copied into Guava immutable
 * collections by the canonical constructor. The {@code with*} methods never
 * modify this instance; each one returns a new handle.
 * <p>
 * Only the getters annotated with {@code @JsonProperty} are marked for JSON
 * serialization. {@code tableParameters}, {@code partitions},
 * {@code constraintColumns}, {@code projectedColumns}, {@code recordScannedFiles}
 * and {@code maxScannedFileSize} are marked {@code @JsonIgnore}; the
 * {@code @JsonCreator} constructor resets them to empty / {@code false}.
 * <p>
 * NOTE(review): the generic type arguments appear to have been stripped from this
 * copy of the file (for example {@code Optional> tableParameters} and raw
 * {@code List} / {@code Set} / {@code TupleDomain} declarations), presumably by
 * HTML extraction. The declarations need their type parameters restored from the
 * upstream source before this class compiles.
 */
public class HiveTableHandle
implements ConnectorTableHandle
{
// Table identity.
private final String schemaName;
private final String tableName;
// Not serialized: empty when the handle was built by the @JsonCreator constructor.
private final Optional> tableParameters;
private final List partitionColumns;
private final List dataColumns;
// Not serialized: empty when the handle was built by the @JsonCreator constructor.
private final Optional> partitions;
private final TupleDomain compactEffectivePredicate;
private final TupleDomain enforcedConstraint;
private final Optional bucketHandle;
private final Optional bucketFilter;
// ANALYZE settings; both are empty unless set through the corresponding with* method
// or passed explicitly to a constructor.
private final Optional>> analyzePartitionValues;
private final Optional> analyzeColumnNames;
// Not serialized: empty sets when the handle was built by the @JsonCreator constructor.
private final Set constraintColumns;
private final Set projectedColumns;
private final AcidTransaction transaction;
// Not serialized: false / empty when the handle was built by the @JsonCreator constructor.
private final boolean recordScannedFiles;
private final Optional maxScannedFileSize;
/**
 * Deserialization constructor.
 * <p>
 * Accepts only the properties that are serialized and delegates to the canonical
 * constructor, defaulting the non-serialized state: {@code tableParameters} and
 * {@code partitions} to {@code Optional.empty()}, {@code constraintColumns} and
 * {@code projectedColumns} to empty sets, {@code recordScannedFiles} to
 * {@code false}, and {@code maxScannedFileSize} to {@code Optional.empty()}.
 *
 * @throws NullPointerException if any reference argument is null
 */
@JsonCreator
public HiveTableHandle(
@JsonProperty("schemaName") String schemaName,
@JsonProperty("tableName") String tableName,
@JsonProperty("partitionColumns") List partitionColumns,
@JsonProperty("dataColumns") List dataColumns,
@JsonProperty("compactEffectivePredicate") TupleDomain compactEffectivePredicate,
@JsonProperty("enforcedConstraint") TupleDomain enforcedConstraint,
@JsonProperty("bucketHandle") Optional bucketHandle,
@JsonProperty("bucketFilter") Optional bucketFilter,
@JsonProperty("analyzePartitionValues") Optional>> analyzePartitionValues,
@JsonProperty("analyzeColumnNames") Optional> analyzeColumnNames,
@JsonProperty("transaction") AcidTransaction transaction)
{
this(
schemaName,
tableName,
Optional.empty(),
partitionColumns,
dataColumns,
Optional.empty(),
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
ImmutableSet.of(),
ImmutableSet.of(),
transaction,
false,
Optional.empty());
}
/**
 * Creates a handle that carries table parameters but no other derived state.
 * <p>
 * Both predicates are {@code TupleDomain.all()}; partitions, bucket filter and
 * ANALYZE settings are empty; constraint and projected column sets are empty;
 * the transaction is {@code NO_ACID_TRANSACTION}; scanned-file recording is off
 * and no maximum scanned file size is set.
 *
 * @param tableParameters table parameters; must not be null because it is wrapped
 *        with {@code Optional.of}
 * @throws NullPointerException if any reference argument is null
 */
public HiveTableHandle(
String schemaName,
String tableName,
Map tableParameters,
List partitionColumns,
List dataColumns,
Optional bucketHandle)
{
this(
schemaName,
tableName,
Optional.of(tableParameters),
partitionColumns,
dataColumns,
Optional.empty(),
TupleDomain.all(),
TupleDomain.all(),
bucketHandle,
Optional.empty(),
Optional.empty(),
Optional.empty(),
ImmutableSet.of(),
ImmutableSet.of(),
NO_ACID_TRANSACTION,
false,
Optional.empty());
}
/**
 * Canonical constructor; every other constructor and every {@code with*} method
 * ends up here.
 * <p>
 * Each reference argument is null-checked. Lists, sets and the table parameter
 * map (including those wrapped in an {@code Optional}) are copied into Guava
 * immutable collections; the remaining arguments are stored as given.
 *
 * @param maxSplitFileSize stored in the {@code maxScannedFileSize} field and
 *        returned by {@link #getMaxScannedFileSize()}
 * @throws NullPointerException if any reference argument is null
 */
public HiveTableHandle(
String schemaName,
String tableName,
Optional> tableParameters,
List partitionColumns,
List dataColumns,
Optional> partitions,
TupleDomain compactEffectivePredicate,
TupleDomain enforcedConstraint,
Optional bucketHandle,
Optional bucketFilter,
Optional>> analyzePartitionValues,
Optional> analyzeColumnNames,
Set constraintColumns,
Set projectedColumns,
AcidTransaction transaction,
boolean recordScannedFiles,
Optional maxSplitFileSize)
{
this.schemaName = requireNonNull(schemaName, "schemaName is null");
this.tableName = requireNonNull(tableName, "tableName is null");
this.tableParameters = requireNonNull(tableParameters, "tableParameters is null").map(ImmutableMap::copyOf);
this.partitionColumns = ImmutableList.copyOf(requireNonNull(partitionColumns, "partitionColumns is null"));
this.dataColumns = ImmutableList.copyOf(requireNonNull(dataColumns, "dataColumns is null"));
this.partitions = requireNonNull(partitions, "partitions is null").map(ImmutableList::copyOf);
this.compactEffectivePredicate = requireNonNull(compactEffectivePredicate, "compactEffectivePredicate is null");
this.enforcedConstraint = requireNonNull(enforcedConstraint, "enforcedConstraint is null");
this.bucketHandle = requireNonNull(bucketHandle, "bucketHandle is null");
this.bucketFilter = requireNonNull(bucketFilter, "bucketFilter is null");
// Only the outer list is copied here; the inner lists are kept as passed in.
this.analyzePartitionValues = requireNonNull(analyzePartitionValues, "analyzePartitionValues is null").map(ImmutableList::copyOf);
this.analyzeColumnNames = requireNonNull(analyzeColumnNames, "analyzeColumnNames is null").map(ImmutableSet::copyOf);
this.constraintColumns = ImmutableSet.copyOf(requireNonNull(constraintColumns, "constraintColumns is null"));
this.projectedColumns = ImmutableSet.copyOf(requireNonNull(projectedColumns, "projectedColumns is null"));
this.transaction = requireNonNull(transaction, "transaction is null");
this.recordScannedFiles = recordScannedFiles;
// NOTE(review): parameter and message say "maxSplitFileSize" while the field, getter and
// with-method say "maxScannedFileSize" - consider aligning the names.
this.maxScannedFileSize = requireNonNull(maxSplitFileSize, "maxSplitFileSize is null");
}
/**
 * Returns a copy of this handle whose {@code analyzePartitionValues} is set to the
 * given value; all other state is carried over unchanged.
 *
 * @throws NullPointerException if {@code analyzePartitionValues} is null
 */
public HiveTableHandle withAnalyzePartitionValues(List> analyzePartitionValues)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
Optional.of(analyzePartitionValues),
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle whose {@code analyzeColumnNames} is set to the
 * given value; all other state is carried over unchanged.
 *
 * @throws NullPointerException if {@code analyzeColumnNames} is null
 */
public HiveTableHandle withAnalyzeColumnNames(Set analyzeColumnNames)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
Optional.of(analyzeColumnNames),
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle with its transaction replaced by the given one;
 * all other state is carried over unchanged.
 *
 * @throws NullPointerException if {@code transaction} is null
 */
public HiveTableHandle withTransaction(AcidTransaction transaction)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle with its transaction replaced by the given one.
 * <p>
 * {@code updateProcessor} is only null-checked; it is not stored on the handle.
 * NOTE(review): presumably the supplied transaction already carries the update
 * processor, since {@link #getUpdateProcessor()} reads it from the transaction -
 * confirm against callers.
 *
 * @throws NullPointerException if {@code updateProcessor} or {@code transaction} is null
 */
public HiveTableHandle withUpdateProcessor(AcidTransaction transaction, HiveUpdateProcessor updateProcessor)
{
requireNonNull(updateProcessor, "updateProcessor is null");
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle with its projected columns replaced by the given
 * set; all other state is carried over unchanged.
 *
 * @throws NullPointerException if {@code projectedColumns} is null
 */
public HiveTableHandle withProjectedColumns(Set projectedColumns)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle with the {@code recordScannedFiles} flag set to
 * the given value; all other state is carried over unchanged.
 */
public HiveTableHandle withRecordScannedFiles(boolean recordScannedFiles)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/**
 * Returns a copy of this handle with {@code maxScannedFileSize} replaced by the
 * given value; all other state is carried over unchanged.
 *
 * @throws NullPointerException if {@code maxScannedFileSize} is null
 */
public HiveTableHandle withMaxScannedFileSize(Optional maxScannedFileSize)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
analyzeColumnNames,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
/** Returns the schema name of the table. */
@JsonProperty
public String getSchemaName()
{
return schemaName;
}
/** Returns the table name (without schema). */
@JsonProperty
public String getTableName()
{
return tableName;
}
// do not serialize tableParameters as they are not needed on workers
@JsonIgnore
public Optional> getTableParameters()
{
return tableParameters;
}
/** Returns the immutable copy of the partition column list taken at construction. */
@JsonProperty
public List getPartitionColumns()
{
return partitionColumns;
}
/** Returns the immutable copy of the data column list taken at construction. */
@JsonProperty
public List getDataColumns()
{
return dataColumns;
}
// do not serialize partitions as they are not needed on workers
@JsonIgnore
public Optional> getPartitions()
{
return partitions;
}
/** Returns the compact effective predicate stored on this handle. */
@JsonProperty
public TupleDomain getCompactEffectivePredicate()
{
return compactEffectivePredicate;
}
/** Returns the enforced constraint stored on this handle. */
@JsonProperty
public TupleDomain getEnforcedConstraint()
{
return enforcedConstraint;
}
/** Returns the bucket handle, or empty if none was supplied. */
@JsonProperty
public Optional getBucketHandle()
{
return bucketHandle;
}
/** Returns the bucket filter, or empty if none was supplied. */
@JsonProperty
public Optional getBucketFilter()
{
return bucketFilter;
}
/** Returns the partition values selected for ANALYZE, or empty if none were set. */
@JsonProperty
public Optional>> getAnalyzePartitionValues()
{
return analyzePartitionValues;
}
/** Returns the column names selected for ANALYZE, or empty if none were set. */
@JsonProperty
public Optional> getAnalyzeColumnNames()
{
return analyzeColumnNames;
}
/** Returns the ACID transaction attached to this handle. */
@JsonProperty
public AcidTransaction getTransaction()
{
return transaction;
}
// do not serialize constraint columns as they are not needed on workers
@JsonIgnore
public Set getConstraintColumns()
{
return constraintColumns;
}
// do not serialize projected columns as they are not needed on workers
@JsonIgnore
public Set getProjectedColumns()
{
return projectedColumns;
}
/**
 * Returns the table identity as a {@link SchemaTableName}; a new instance is
 * created on every call.
 */
public SchemaTableName getSchemaTableName()
{
return new SchemaTableName(schemaName, tableName);
}
/** Delegates to {@code transaction.isDelete()}. */
@JsonIgnore
public boolean isAcidDelete()
{
return transaction.isDelete();
}
/** Delegates to {@code transaction.isUpdate()}. */
@JsonIgnore
public boolean isAcidUpdate()
{
return transaction.isUpdate();
}
/** Delegates to {@code transaction.getUpdateProcessor()}. */
@JsonIgnore
public Optional getUpdateProcessor()
{
return transaction.getUpdateProcessor();
}
/** Delegates to {@code transaction.isAcidTransactionRunning()}. */
@JsonIgnore
public boolean isInAcidTransaction()
{
return transaction.isAcidTransactionRunning();
}
/**
 * Returns the ACID transaction id of the attached transaction.
 *
 * @throws IllegalStateException if the transaction reports that it is not running
 */
@JsonIgnore
public long getAcidTransactionId()
{
checkState(transaction.isAcidTransactionRunning(), "The AcidTransaction is not running");
return transaction.getAcidTransactionId();
}
/**
 * Returns the write id of the attached transaction.
 *
 * @throws IllegalStateException if the transaction reports that it is not running
 */
@JsonIgnore
public long getWriteId()
{
checkState(transaction.isAcidTransactionRunning(), "The AcidTransaction is not running");
return transaction.getWriteId();
}
/** Returns the {@code recordScannedFiles} flag; not serialized. */
@JsonIgnore
public boolean isRecordScannedFiles()
{
return recordScannedFiles;
}
/** Returns the maximum scanned file size, or empty if none was set; not serialized. */
@JsonIgnore
public Optional getMaxScannedFileSize()
{
return maxScannedFileSize;
}
/**
 * Compares handles of exactly the same class on: schemaName, tableName,
 * tableParameters, partitionColumns, partitions, compactEffectivePredicate,
 * enforcedConstraint, bucketHandle, bucketFilter, analyzePartitionValues,
 * transaction and projectedColumns.
 * <p>
 * NOTE(review): dataColumns, analyzeColumnNames, constraintColumns,
 * recordScannedFiles and maxScannedFileSize do not take part in the comparison.
 * It is not visible from this file whether that omission is intentional - confirm
 * before relying on equality to distinguish handles that differ only in those fields.
 */
@Override
public boolean equals(Object o)
{
if (this == o) {
return true;
}
if (o == null || getClass() != o.getClass()) {
return false;
}
HiveTableHandle that = (HiveTableHandle) o;
return Objects.equals(schemaName, that.schemaName) &&
Objects.equals(tableName, that.tableName) &&
Objects.equals(tableParameters, that.tableParameters) &&
Objects.equals(partitionColumns, that.partitionColumns) &&
Objects.equals(partitions, that.partitions) &&
Objects.equals(compactEffectivePredicate, that.compactEffectivePredicate) &&
Objects.equals(enforcedConstraint, that.enforcedConstraint) &&
Objects.equals(bucketHandle, that.bucketHandle) &&
Objects.equals(bucketFilter, that.bucketFilter) &&
Objects.equals(analyzePartitionValues, that.analyzePartitionValues) &&
Objects.equals(transaction, that.transaction) &&
Objects.equals(projectedColumns, that.projectedColumns);
}
/**
 * Hashes exactly the fields that {@link #equals(Object)} compares, so equal
 * handles produce equal hash codes.
 */
@Override
public int hashCode()
{
return Objects.hash(
schemaName,
tableName,
tableParameters,
partitionColumns,
partitions,
compactEffectivePredicate,
enforcedConstraint,
bucketHandle,
bucketFilter,
analyzePartitionValues,
transaction,
projectedColumns);
}
/**
 * Renders the handle as {@code schemaName:tableName}. When a bucket handle is
 * present, {@code " buckets=<readBucketCount>"} is appended, followed by
 * {@code " sorted_by=[...]"} if the bucket handle reports a non-empty sort order.
 * Predicates, columns and transaction state are not included.
 */
@Override
public String toString()
{
StringBuilder builder = new StringBuilder();
builder.append(schemaName).append(":").append(tableName);
bucketHandle.ifPresent(bucket -> {
builder.append(" buckets=").append(bucket.getReadBucketCount());
if (!bucket.getSortedBy().isEmpty()) {
// Each sorting column is rendered by HiveUtil.sortingColumnToString and the
// results are joined as "[a, b, ...]".
builder.append(" sorted_by=")
.append(bucket.getSortedBy().stream()
.map(HiveUtil::sortingColumnToString)
.collect(joining(", ", "[", "]")));
}
});
return builder.toString();
}
}