Please wait. This may take a few minutes ...
Downloading a project requires significant server resources. Please understand that we have to cover our server costs. Thank you in advance.
Project price: only $1
You can buy this project and then download and modify it as often as you want.
io.trino.plugin.hive.HiveTableHandle Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.plugin.hive;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonIgnore;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import io.trino.metastore.HivePartition;
import io.trino.plugin.hive.acid.AcidTransaction;
import io.trino.plugin.hive.util.HiveBucketing.HiveBucketFilter;
import io.trino.plugin.hive.util.HiveUtil;
import io.trino.spi.connector.ColumnHandle;
import io.trino.spi.connector.ConnectorTableHandle;
import io.trino.spi.connector.SchemaTableName;
import io.trino.spi.predicate.TupleDomain;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.Set;
import static com.google.common.base.Preconditions.checkState;
import static io.trino.plugin.hive.acid.AcidTransaction.NO_ACID_TRANSACTION;
import static java.util.Objects.requireNonNull;
import static java.util.stream.Collectors.joining;
public class HiveTableHandle
implements ConnectorTableHandle
{
private final String schemaName;
private final String tableName;
private final Optional> tableParameters;
private final List partitionColumns;
private final List dataColumns;
private final Optional> partitionNames;
private final Optional> partitions;
private final TupleDomain compactEffectivePredicate;
private final TupleDomain enforcedConstraint;
private final Optional tablePartitioning;
private final Optional bucketFilter;
private final Optional>> analyzePartitionValues;
private final Set constraintColumns;
private final Set projectedColumns;
private final AcidTransaction transaction;
private final boolean recordScannedFiles;
private final Optional maxScannedFileSize;
@JsonCreator
public HiveTableHandle(
@JsonProperty("schemaName") String schemaName,
@JsonProperty("tableName") String tableName,
@JsonProperty("partitionColumns") List partitionColumns,
@JsonProperty("dataColumns") List dataColumns,
@JsonProperty("compactEffectivePredicate") TupleDomain compactEffectivePredicate,
@JsonProperty("enforcedConstraint") TupleDomain enforcedConstraint,
@JsonProperty("tablePartitioning") Optional tablePartitioning,
@JsonProperty("bucketFilter") Optional bucketFilter,
@JsonProperty("analyzePartitionValues") Optional>> analyzePartitionValues,
@JsonProperty("transaction") AcidTransaction transaction)
{
this(
schemaName,
tableName,
Optional.empty(),
partitionColumns,
dataColumns,
Optional.empty(),
Optional.empty(),
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
ImmutableSet.of(),
transaction,
false,
Optional.empty());
}
public HiveTableHandle(
String schemaName,
String tableName,
Map tableParameters,
List partitionColumns,
List dataColumns,
Optional tablePartitioning)
{
this(
schemaName,
tableName,
Optional.of(tableParameters),
partitionColumns,
dataColumns,
Optional.empty(),
Optional.empty(),
TupleDomain.all(),
TupleDomain.all(),
tablePartitioning,
Optional.empty(),
Optional.empty(),
ImmutableSet.of(),
NO_ACID_TRANSACTION,
false,
Optional.empty());
}
private HiveTableHandle(
String schemaName,
String tableName,
Optional> tableParameters,
List partitionColumns,
List dataColumns,
Optional> partitionNames,
Optional> partitions,
TupleDomain compactEffectivePredicate,
TupleDomain enforcedConstraint,
Optional tablePartitioning,
Optional bucketFilter,
Optional>> analyzePartitionValues,
Set constraintColumns,
AcidTransaction transaction,
boolean recordScannedFiles,
Optional maxSplitFileSize)
{
this(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
ImmutableSet.builder().addAll(partitionColumns).addAll(dataColumns).build(),
transaction,
recordScannedFiles,
maxSplitFileSize);
}
public HiveTableHandle(
String schemaName,
String tableName,
Optional> tableParameters,
List partitionColumns,
List dataColumns,
Optional> partitionNames,
Optional> partitions,
TupleDomain compactEffectivePredicate,
TupleDomain enforcedConstraint,
Optional tablePartitioning,
Optional bucketFilter,
Optional>> analyzePartitionValues,
Set constraintColumns,
Set projectedColumns,
AcidTransaction transaction,
boolean recordScannedFiles,
Optional maxSplitFileSize)
{
checkState(partitionNames.isEmpty() || partitions.isEmpty(), "partition names and partitions list cannot be present at same time");
this.schemaName = requireNonNull(schemaName, "schemaName is null");
this.tableName = requireNonNull(tableName, "tableName is null");
this.tableParameters = tableParameters.map(ImmutableMap::copyOf);
this.partitionColumns = ImmutableList.copyOf(requireNonNull(partitionColumns, "partitionColumns is null"));
this.dataColumns = ImmutableList.copyOf(requireNonNull(dataColumns, "dataColumns is null"));
this.partitionNames = partitionNames.map(ImmutableList::copyOf);
this.partitions = partitions.map(ImmutableList::copyOf);
this.compactEffectivePredicate = requireNonNull(compactEffectivePredicate, "compactEffectivePredicate is null");
this.enforcedConstraint = requireNonNull(enforcedConstraint, "enforcedConstraint is null");
this.tablePartitioning = requireNonNull(tablePartitioning, "tablePartitioning is null");
this.bucketFilter = requireNonNull(bucketFilter, "bucketFilter is null");
this.analyzePartitionValues = analyzePartitionValues.map(ImmutableList::copyOf);
this.constraintColumns = ImmutableSet.copyOf(requireNonNull(constraintColumns, "constraintColumns is null"));
this.projectedColumns = ImmutableSet.copyOf(requireNonNull(projectedColumns, "projectedColumns is null"));
this.transaction = requireNonNull(transaction, "transaction is null");
this.recordScannedFiles = recordScannedFiles;
this.maxScannedFileSize = requireNonNull(maxSplitFileSize, "maxSplitFileSize is null");
}
public HiveTableHandle withAnalyzePartitionValues(List> analyzePartitionValues)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
Optional.of(analyzePartitionValues),
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
public HiveTableHandle withTransaction(AcidTransaction transaction)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
public HiveTableHandle withProjectedColumns(Set projectedColumns)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
public HiveTableHandle withRecordScannedFiles(boolean recordScannedFiles)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
public HiveTableHandle withMaxScannedFileSize(Optional maxScannedFileSize)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
public HiveTableHandle withTablePartitioning(Optional hiveTablePartitioning)
{
return new HiveTableHandle(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
hiveTablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
projectedColumns,
transaction,
recordScannedFiles,
maxScannedFileSize);
}
@JsonProperty
public String getSchemaName()
{
return schemaName;
}
@JsonProperty
public String getTableName()
{
return tableName;
}
// do not serialize tableParameters as they are not needed on workers
@JsonIgnore
public Optional> getTableParameters()
{
return tableParameters;
}
@JsonProperty
public List getPartitionColumns()
{
return partitionColumns;
}
@JsonProperty
public List getDataColumns()
{
return dataColumns;
}
/**
* Represents raw partition information as String.
* These are partially satisfied by the table filter criteria.
* This will be set to `Optional#empty` if parsed partition information are loaded.
* Skip serialization as they are not needed on workers
*/
@JsonIgnore
public Optional> getPartitionNames()
{
return partitionNames;
}
/**
* Represents parsed partition information (which is derived from raw partition string).
* These are fully satisfied by the table filter criteria.
* Skip serialization as they are not needed on workers
*/
@JsonIgnore
public Optional> getPartitions()
{
return partitions;
}
@JsonProperty
public TupleDomain getCompactEffectivePredicate()
{
return compactEffectivePredicate;
}
@JsonProperty
public TupleDomain getEnforcedConstraint()
{
return enforcedConstraint;
}
@JsonProperty
public Optional getTablePartitioning()
{
return tablePartitioning;
}
@JsonProperty
public Optional getBucketFilter()
{
return bucketFilter;
}
@JsonProperty
public Optional>> getAnalyzePartitionValues()
{
return analyzePartitionValues;
}
@JsonProperty
public AcidTransaction getTransaction()
{
return transaction;
}
// do not serialize constraint columns as they are not needed on workers
@JsonIgnore
public Set getConstraintColumns()
{
return constraintColumns;
}
// do not serialize projected columns as they are not needed on workers
@JsonIgnore
public Set getProjectedColumns()
{
return projectedColumns;
}
public SchemaTableName getSchemaTableName()
{
return new SchemaTableName(schemaName, tableName);
}
@JsonIgnore
public boolean isAcidMerge()
{
return transaction.isMerge();
}
@JsonIgnore
public boolean isRecordScannedFiles()
{
return recordScannedFiles;
}
@JsonIgnore
public Optional getMaxScannedFileSize()
{
return maxScannedFileSize;
}
@Override
public boolean equals(Object o)
{
if (this == o) {
return true;
}
if (o == null || getClass() != o.getClass()) {
return false;
}
HiveTableHandle that = (HiveTableHandle) o;
return Objects.equals(schemaName, that.schemaName) &&
Objects.equals(tableName, that.tableName) &&
Objects.equals(tableParameters, that.tableParameters) &&
Objects.equals(partitionColumns, that.partitionColumns) &&
Objects.equals(dataColumns, that.dataColumns) &&
Objects.equals(partitionNames, that.partitionNames) &&
Objects.equals(partitions, that.partitions) &&
Objects.equals(compactEffectivePredicate, that.compactEffectivePredicate) &&
Objects.equals(enforcedConstraint, that.enforcedConstraint) &&
Objects.equals(tablePartitioning, that.tablePartitioning) &&
Objects.equals(bucketFilter, that.bucketFilter) &&
Objects.equals(analyzePartitionValues, that.analyzePartitionValues) &&
Objects.equals(constraintColumns, that.constraintColumns) &&
Objects.equals(transaction, that.transaction) &&
Objects.equals(projectedColumns, that.projectedColumns) &&
recordScannedFiles == that.recordScannedFiles &&
Objects.equals(maxScannedFileSize, that.maxScannedFileSize);
}
@Override
public int hashCode()
{
return Objects.hash(
schemaName,
tableName,
tableParameters,
partitionColumns,
dataColumns,
partitionNames,
partitions,
compactEffectivePredicate,
enforcedConstraint,
tablePartitioning,
bucketFilter,
analyzePartitionValues,
constraintColumns,
transaction,
projectedColumns,
recordScannedFiles,
maxScannedFileSize);
}
@Override
public String toString()
{
StringBuilder builder = new StringBuilder();
builder.append(schemaName).append(":").append(tableName);
if (!constraintColumns.isEmpty()) {
builder.append(" constraint on ");
builder.append(constraintColumns.stream()
.map(HiveColumnHandle::getName)
.collect(joining(", ", "[", "]")));
}
tablePartitioning.ifPresent(bucket -> {
if (bucket.active()) {
builder.append(" buckets=").append(bucket.partitioningHandle().getBucketCount());
if (!bucket.sortedBy().isEmpty()) {
builder.append(" sorted_by=")
.append(bucket.sortedBy().stream()
.map(HiveUtil::sortingColumnToString)
.collect(joining(", ", "[", "]")));
}
}
});
return builder.toString();
}
}