io.prestosql.plugin.hive.HiveConfig Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.prestosql.plugin.hive;
import com.google.common.base.Splitter;
import com.google.common.collect.ImmutableList;
import io.airlift.configuration.Config;
import io.airlift.configuration.ConfigDescription;
import io.airlift.configuration.DefunctConfig;
import io.airlift.configuration.LegacyConfig;
import io.airlift.units.DataSize;
import io.airlift.units.Duration;
import io.airlift.units.MaxDataSize;
import io.airlift.units.MinDataSize;
import io.prestosql.plugin.hive.HiveSessionProperties.InsertExistingPartitionsBehavior;
import org.joda.time.DateTimeZone;
import javax.annotation.Nullable;
import javax.validation.constraints.AssertTrue;
import javax.validation.constraints.Max;
import javax.validation.constraints.Min;
import javax.validation.constraints.NotNull;
import java.util.List;
import java.util.Optional;
import java.util.TimeZone;
import static io.airlift.units.DataSize.Unit.MEGABYTE;
import static io.prestosql.plugin.hive.HiveSessionProperties.InsertExistingPartitionsBehavior.APPEND;
import static io.prestosql.plugin.hive.HiveSessionProperties.InsertExistingPartitionsBehavior.ERROR;
import static java.util.concurrent.TimeUnit.MINUTES;
@DefunctConfig({
"dfs.domain-socket-path",
"hive.file-system-cache-ttl",
"hive.max-global-split-iterator-threads",
"hive.max-sort-files-per-bucket",
"hive.bucket-writing",
"hive.optimized-reader.enabled",
"hive.rcfile-optimized-writer.enabled",
"hive.time-zone",
"hive.assume-canonical-partition-keys",
})
public class HiveConfig
{
private static final Splitter SPLITTER = Splitter.on(',').trimResults().omitEmptyStrings();
private DataSize maxSplitSize = DataSize.of(64, MEGABYTE);
private int maxPartitionsPerScan = 100_000;
private int maxOutstandingSplits = 1_000;
private DataSize maxOutstandingSplitsSize = DataSize.of(256, MEGABYTE);
private int maxSplitIteratorThreads = 1_000;
private int minPartitionBatchSize = 10;
private int maxPartitionBatchSize = 100;
private int maxInitialSplits = 200;
private int splitLoaderConcurrency = 4;
private Integer maxSplitsPerSecond;
private DataSize maxInitialSplitSize;
private int domainCompactionThreshold = 100;
private DataSize writerSortBufferSize = DataSize.of(64, MEGABYTE);
private boolean forceLocalScheduling;
private boolean recursiveDirWalkerEnabled;
private boolean ignoreAbsentPartitions;
private int maxConcurrentFileRenames = 20;
private int maxConcurrentMetastoreDrops = 20;
private boolean allowCorruptWritesForTesting;
private long perTransactionMetastoreCacheMaximumSize = 1000;
private HiveStorageFormat hiveStorageFormat = HiveStorageFormat.ORC;
private HiveCompressionCodec hiveCompressionCodec = HiveCompressionCodec.GZIP;
private boolean respectTableFormat = true;
private boolean immutablePartitions;
private Optional insertExistingPartitionsBehavior = Optional.empty();
private boolean createEmptyBucketFiles;
private int maxPartitionsPerWriter = 100;
private int maxOpenSortFiles = 50;
private int writeValidationThreads = 16;
private DataSize textMaxLineLength = DataSize.of(100, MEGABYTE);
private String orcLegacyTimeZone = TimeZone.getDefault().getID();
private String parquetTimeZone = TimeZone.getDefault().getID();
private boolean useParquetColumnNames;
private String rcfileTimeZone = TimeZone.getDefault().getID();
private boolean rcfileWriterValidate;
private boolean skipDeletionForAlter;
private boolean skipTargetCleanupOnRollback;
private boolean bucketExecutionEnabled = true;
private boolean sortedWritingEnabled = true;
private boolean optimizeMismatchedBucketCount;
private boolean writesToNonManagedTablesEnabled;
private boolean createsOfNonManagedTablesEnabled = true;
private boolean tableStatisticsEnabled = true;
private int partitionStatisticsSampleSize = 100;
private boolean ignoreCorruptedStatistics;
private boolean collectColumnStatisticsOnWrite = true;
private String recordingPath;
private boolean replay;
private Duration recordingDuration = new Duration(10, MINUTES);
private boolean s3SelectPushdownEnabled;
private int s3SelectPushdownMaxConnections = 500;
private boolean isTemporaryStagingDirectoryEnabled = true;
private String temporaryStagingDirectoryPath = "/tmp/presto-${USER}";
private Duration fileStatusCacheExpireAfterWrite = new Duration(1, MINUTES);
private long fileStatusCacheMaxSize = 1000 * 1000;
private List fileStatusCacheTables = ImmutableList.of();
private boolean translateHiveViews;
private Optional hiveTransactionHeartbeatInterval = Optional.empty();
private int hiveTransactionHeartbeatThreads = 5;
private boolean allowRegisterPartition;
private boolean queryPartitionFilterRequired;
private boolean partitionUseColumnNames;
private boolean projectionPushdownEnabled = true;
private Duration dynamicFilteringProbeBlockingTimeout = new Duration(0, MINUTES);
private HiveTimestampPrecision timestampPrecision = HiveTimestampPrecision.MILLISECONDS;
public int getMaxInitialSplits()
{
return maxInitialSplits;
}
@Config("hive.max-initial-splits")
public HiveConfig setMaxInitialSplits(int maxInitialSplits)
{
this.maxInitialSplits = maxInitialSplits;
return this;
}
public DataSize getMaxInitialSplitSize()
{
if (maxInitialSplitSize == null) {
return DataSize.ofBytes(maxSplitSize.toBytes() / 2).to(maxSplitSize.getUnit());
}
return maxInitialSplitSize;
}
@Config("hive.max-initial-split-size")
public HiveConfig setMaxInitialSplitSize(DataSize maxInitialSplitSize)
{
this.maxInitialSplitSize = maxInitialSplitSize;
return this;
}
@Min(1)
public int getSplitLoaderConcurrency()
{
return splitLoaderConcurrency;
}
@Config("hive.split-loader-concurrency")
public HiveConfig setSplitLoaderConcurrency(int splitLoaderConcurrency)
{
this.splitLoaderConcurrency = splitLoaderConcurrency;
return this;
}
@Min(1)
@Nullable
public Integer getMaxSplitsPerSecond()
{
return maxSplitsPerSecond;
}
@Config("hive.max-splits-per-second")
@ConfigDescription("Throttles the maximum number of splits that can be assigned to tasks per second")
public HiveConfig setMaxSplitsPerSecond(Integer maxSplitsPerSecond)
{
this.maxSplitsPerSecond = maxSplitsPerSecond;
return this;
}
@Min(1)
public int getDomainCompactionThreshold()
{
return domainCompactionThreshold;
}
@Config("hive.domain-compaction-threshold")
@ConfigDescription("Maximum ranges to allow in a tuple domain without compacting it")
public HiveConfig setDomainCompactionThreshold(int domainCompactionThreshold)
{
this.domainCompactionThreshold = domainCompactionThreshold;
return this;
}
@MinDataSize("1MB")
@MaxDataSize("1GB")
public DataSize getWriterSortBufferSize()
{
return writerSortBufferSize;
}
@Config("hive.writer-sort-buffer-size")
public HiveConfig setWriterSortBufferSize(DataSize writerSortBufferSize)
{
this.writerSortBufferSize = writerSortBufferSize;
return this;
}
public boolean isForceLocalScheduling()
{
return forceLocalScheduling;
}
@Config("hive.force-local-scheduling")
public HiveConfig setForceLocalScheduling(boolean forceLocalScheduling)
{
this.forceLocalScheduling = forceLocalScheduling;
return this;
}
@Min(1)
public int getMaxConcurrentFileRenames()
{
return maxConcurrentFileRenames;
}
@Config("hive.max-concurrent-file-renames")
public HiveConfig setMaxConcurrentFileRenames(int maxConcurrentFileRenames)
{
this.maxConcurrentFileRenames = maxConcurrentFileRenames;
return this;
}
@Min(1)
public int getMaxConcurrentMetastoreDrops()
{
return maxConcurrentMetastoreDrops;
}
@Config("hive.max-concurrent-metastore-drops")
public HiveConfig setMaxConcurrentMetastoreDrops(int maxConcurrentMetastoreDeletes)
{
this.maxConcurrentMetastoreDrops = maxConcurrentMetastoreDeletes;
return this;
}
@Config("hive.recursive-directories")
public HiveConfig setRecursiveDirWalkerEnabled(boolean recursiveDirWalkerEnabled)
{
this.recursiveDirWalkerEnabled = recursiveDirWalkerEnabled;
return this;
}
public boolean getRecursiveDirWalkerEnabled()
{
return recursiveDirWalkerEnabled;
}
public boolean isIgnoreAbsentPartitions()
{
return ignoreAbsentPartitions;
}
@Config("hive.ignore-absent-partitions")
public HiveConfig setIgnoreAbsentPartitions(boolean ignoreAbsentPartitions)
{
this.ignoreAbsentPartitions = ignoreAbsentPartitions;
return this;
}
@NotNull
public DataSize getMaxSplitSize()
{
return maxSplitSize;
}
@Config("hive.max-split-size")
public HiveConfig setMaxSplitSize(DataSize maxSplitSize)
{
this.maxSplitSize = maxSplitSize;
return this;
}
@Min(1)
public int getMaxPartitionsPerScan()
{
return maxPartitionsPerScan;
}
@Config("hive.max-partitions-per-scan")
@ConfigDescription("Maximum allowed partitions for a single table scan")
public HiveConfig setMaxPartitionsPerScan(int maxPartitionsPerScan)
{
this.maxPartitionsPerScan = maxPartitionsPerScan;
return this;
}
@Min(1)
public int getMaxOutstandingSplits()
{
return maxOutstandingSplits;
}
@Config("hive.max-outstanding-splits")
@ConfigDescription("Target number of buffered splits for each table scan in a query, before the scheduler tries to pause itself")
public HiveConfig setMaxOutstandingSplits(int maxOutstandingSplits)
{
this.maxOutstandingSplits = maxOutstandingSplits;
return this;
}
@MinDataSize("1MB")
public DataSize getMaxOutstandingSplitsSize()
{
return maxOutstandingSplitsSize;
}
@Config("hive.max-outstanding-splits-size")
@ConfigDescription("Maximum amount of memory allowed for split buffering for each table scan in a query, before the query is failed")
public HiveConfig setMaxOutstandingSplitsSize(DataSize maxOutstandingSplits)
{
this.maxOutstandingSplitsSize = maxOutstandingSplits;
return this;
}
@Min(1)
public int getMaxSplitIteratorThreads()
{
return maxSplitIteratorThreads;
}
@Config("hive.max-split-iterator-threads")
public HiveConfig setMaxSplitIteratorThreads(int maxSplitIteratorThreads)
{
this.maxSplitIteratorThreads = maxSplitIteratorThreads;
return this;
}
@Deprecated
public boolean getAllowCorruptWritesForTesting()
{
return allowCorruptWritesForTesting;
}
@Deprecated
@Config("hive.allow-corrupt-writes-for-testing")
@ConfigDescription("Allow Hive connector to write data even when data will likely be corrupt")
public HiveConfig setAllowCorruptWritesForTesting(boolean allowCorruptWritesForTesting)
{
this.allowCorruptWritesForTesting = allowCorruptWritesForTesting;
return this;
}
@Min(1)
public long getPerTransactionMetastoreCacheMaximumSize()
{
return perTransactionMetastoreCacheMaximumSize;
}
@Config("hive.per-transaction-metastore-cache-maximum-size")
public HiveConfig setPerTransactionMetastoreCacheMaximumSize(long perTransactionMetastoreCacheMaximumSize)
{
this.perTransactionMetastoreCacheMaximumSize = perTransactionMetastoreCacheMaximumSize;
return this;
}
@Min(1)
public int getMinPartitionBatchSize()
{
return minPartitionBatchSize;
}
@Config("hive.metastore.partition-batch-size.min")
public HiveConfig setMinPartitionBatchSize(int minPartitionBatchSize)
{
this.minPartitionBatchSize = minPartitionBatchSize;
return this;
}
@Min(1)
public int getMaxPartitionBatchSize()
{
return maxPartitionBatchSize;
}
@Config("hive.metastore.partition-batch-size.max")
public HiveConfig setMaxPartitionBatchSize(int maxPartitionBatchSize)
{
this.maxPartitionBatchSize = maxPartitionBatchSize;
return this;
}
public HiveStorageFormat getHiveStorageFormat()
{
return hiveStorageFormat;
}
@Config("hive.storage-format")
public HiveConfig setHiveStorageFormat(HiveStorageFormat hiveStorageFormat)
{
this.hiveStorageFormat = hiveStorageFormat;
return this;
}
public HiveCompressionCodec getHiveCompressionCodec()
{
return hiveCompressionCodec;
}
@Config("hive.compression-codec")
public HiveConfig setHiveCompressionCodec(HiveCompressionCodec hiveCompressionCodec)
{
this.hiveCompressionCodec = hiveCompressionCodec;
return this;
}
public boolean isRespectTableFormat()
{
return respectTableFormat;
}
@Config("hive.respect-table-format")
@ConfigDescription("Should new partitions be written using the existing table format or the default Presto format")
public HiveConfig setRespectTableFormat(boolean respectTableFormat)
{
this.respectTableFormat = respectTableFormat;
return this;
}
public boolean isImmutablePartitions()
{
return immutablePartitions;
}
@Config("hive.immutable-partitions")
@ConfigDescription("Can new data be inserted into existing partitions or existing unpartitioned tables")
public HiveConfig setImmutablePartitions(boolean immutablePartitions)
{
this.immutablePartitions = immutablePartitions;
return this;
}
public InsertExistingPartitionsBehavior getInsertExistingPartitionsBehavior()
{
return insertExistingPartitionsBehavior.orElse(immutablePartitions ? ERROR : APPEND);
}
@Config("hive.insert-existing-partitions-behavior")
@ConfigDescription("Default value for insert existing partitions behavior")
public HiveConfig setInsertExistingPartitionsBehavior(InsertExistingPartitionsBehavior insertExistingPartitionsBehavior)
{
this.insertExistingPartitionsBehavior = Optional.ofNullable(insertExistingPartitionsBehavior);
return this;
}
@AssertTrue(message = "insert-existing-partitions-behavior cannot be APPEND when immutable-partitions is true")
public boolean isInsertExistingPartitionsBehaviorValid()
{
return insertExistingPartitionsBehavior
.map(v -> InsertExistingPartitionsBehavior.isValid(v, immutablePartitions))
.orElse(true);
}
public boolean isCreateEmptyBucketFiles()
{
return createEmptyBucketFiles;
}
@Config("hive.create-empty-bucket-files")
@ConfigDescription("Create empty files for buckets that have no data")
public HiveConfig setCreateEmptyBucketFiles(boolean createEmptyBucketFiles)
{
this.createEmptyBucketFiles = createEmptyBucketFiles;
return this;
}
@Min(1)
public int getMaxPartitionsPerWriter()
{
return maxPartitionsPerWriter;
}
@Config("hive.max-partitions-per-writers")
@ConfigDescription("Maximum number of partitions per writer")
public HiveConfig setMaxPartitionsPerWriter(int maxPartitionsPerWriter)
{
this.maxPartitionsPerWriter = maxPartitionsPerWriter;
return this;
}
@Min(2)
@Max(1000)
public int getMaxOpenSortFiles()
{
return maxOpenSortFiles;
}
@Config("hive.max-open-sort-files")
@ConfigDescription("Maximum number of writer temporary files to read in one pass")
public HiveConfig setMaxOpenSortFiles(int maxOpenSortFiles)
{
this.maxOpenSortFiles = maxOpenSortFiles;
return this;
}
public int getWriteValidationThreads()
{
return writeValidationThreads;
}
@Config("hive.write-validation-threads")
@ConfigDescription("Number of threads used for verifying data after a write")
public HiveConfig setWriteValidationThreads(int writeValidationThreads)
{
this.writeValidationThreads = writeValidationThreads;
return this;
}
public DateTimeZone getRcfileDateTimeZone()
{
return DateTimeZone.forTimeZone(TimeZone.getTimeZone(rcfileTimeZone));
}
@NotNull
public String getRcfileTimeZone()
{
return rcfileTimeZone;
}
@Config("hive.rcfile.time-zone")
@ConfigDescription("Time zone for RCFile binary read and write")
public HiveConfig setRcfileTimeZone(String rcfileTimeZone)
{
this.rcfileTimeZone = rcfileTimeZone;
return this;
}
public boolean isRcfileWriterValidate()
{
return rcfileWriterValidate;
}
@Config("hive.rcfile.writer.validate")
@ConfigDescription("Validate RCFile after write by re-reading the whole file")
public HiveConfig setRcfileWriterValidate(boolean rcfileWriterValidate)
{
this.rcfileWriterValidate = rcfileWriterValidate;
return this;
}
@MinDataSize("1B")
@MaxDataSize("1GB")
@NotNull
public DataSize getTextMaxLineLength()
{
return textMaxLineLength;
}
@Config("hive.text.max-line-length")
@ConfigDescription("Maximum line length for text files")
public HiveConfig setTextMaxLineLength(DataSize textMaxLineLength)
{
this.textMaxLineLength = textMaxLineLength;
return this;
}
public DateTimeZone getOrcLegacyDateTimeZone()
{
return DateTimeZone.forTimeZone(TimeZone.getTimeZone(orcLegacyTimeZone));
}
@NotNull
public String getOrcLegacyTimeZone()
{
return orcLegacyTimeZone;
}
@Config("hive.orc.time-zone")
@ConfigDescription("Time zone for legacy ORC files that do not contain a time zone")
public HiveConfig setOrcLegacyTimeZone(String orcLegacyTimeZone)
{
this.orcLegacyTimeZone = orcLegacyTimeZone;
return this;
}
public DateTimeZone getParquetDateTimeZone()
{
return DateTimeZone.forTimeZone(TimeZone.getTimeZone(parquetTimeZone));
}
@NotNull
public String getParquetTimeZone()
{
return parquetTimeZone;
}
@Config("hive.parquet.time-zone")
@ConfigDescription("Time zone for Parquet read and write")
public HiveConfig setParquetTimeZone(String parquetTimeZone)
{
this.parquetTimeZone = parquetTimeZone;
return this;
}
public boolean isUseParquetColumnNames()
{
return useParquetColumnNames;
}
@Config("hive.parquet.use-column-names")
@ConfigDescription("Access Parquet columns using names from the file")
public HiveConfig setUseParquetColumnNames(boolean useParquetColumnNames)
{
this.useParquetColumnNames = useParquetColumnNames;
return this;
}
public boolean isOptimizeMismatchedBucketCount()
{
return optimizeMismatchedBucketCount;
}
@Config("hive.optimize-mismatched-bucket-count")
public HiveConfig setOptimizeMismatchedBucketCount(boolean optimizeMismatchedBucketCount)
{
this.optimizeMismatchedBucketCount = optimizeMismatchedBucketCount;
return this;
}
public List getFileStatusCacheTables()
{
return fileStatusCacheTables;
}
@Config("hive.file-status-cache-tables")
public HiveConfig setFileStatusCacheTables(String fileStatusCacheTables)
{
this.fileStatusCacheTables = SPLITTER.splitToList(fileStatusCacheTables);
return this;
}
public boolean isTranslateHiveViews()
{
return translateHiveViews;
}
@LegacyConfig("hive.views-execution.enabled")
@Config("hive.translate-hive-views")
@ConfigDescription("Experimental: Allow translation of Hive views into Presto views")
public HiveConfig setTranslateHiveViews(boolean translateHiveViews)
{
this.translateHiveViews = translateHiveViews;
return this;
}
public long getFileStatusCacheMaxSize()
{
return fileStatusCacheMaxSize;
}
@Config("hive.file-status-cache-size")
public HiveConfig setFileStatusCacheMaxSize(long fileStatusCacheMaxSize)
{
this.fileStatusCacheMaxSize = fileStatusCacheMaxSize;
return this;
}
public Duration getFileStatusCacheExpireAfterWrite()
{
return fileStatusCacheExpireAfterWrite;
}
@Config("hive.file-status-cache-expire-time")
public HiveConfig setFileStatusCacheExpireAfterWrite(Duration fileStatusCacheExpireAfterWrite)
{
this.fileStatusCacheExpireAfterWrite = fileStatusCacheExpireAfterWrite;
return this;
}
public boolean isSkipDeletionForAlter()
{
return skipDeletionForAlter;
}
@Config("hive.skip-deletion-for-alter")
@ConfigDescription("Skip deletion of old partition data when a partition is deleted and then inserted in the same transaction")
public HiveConfig setSkipDeletionForAlter(boolean skipDeletionForAlter)
{
this.skipDeletionForAlter = skipDeletionForAlter;
return this;
}
public boolean isSkipTargetCleanupOnRollback()
{
return skipTargetCleanupOnRollback;
}
@Config("hive.skip-target-cleanup-on-rollback")
@ConfigDescription("Skip deletion of target directories when a metastore operation fails")
public HiveConfig setSkipTargetCleanupOnRollback(boolean skipTargetCleanupOnRollback)
{
this.skipTargetCleanupOnRollback = skipTargetCleanupOnRollback;
return this;
}
public boolean isBucketExecutionEnabled()
{
return bucketExecutionEnabled;
}
@Config("hive.bucket-execution")
@ConfigDescription("Enable bucket-aware execution: only use a single worker per bucket")
public HiveConfig setBucketExecutionEnabled(boolean bucketExecutionEnabled)
{
this.bucketExecutionEnabled = bucketExecutionEnabled;
return this;
}
public boolean isSortedWritingEnabled()
{
return sortedWritingEnabled;
}
@Config("hive.sorted-writing")
@ConfigDescription("Enable writing to bucketed sorted tables")
public HiveConfig setSortedWritingEnabled(boolean sortedWritingEnabled)
{
this.sortedWritingEnabled = sortedWritingEnabled;
return this;
}
@Config("hive.non-managed-table-writes-enabled")
@ConfigDescription("Enable writes to non-managed (external) tables")
public HiveConfig setWritesToNonManagedTablesEnabled(boolean writesToNonManagedTablesEnabled)
{
this.writesToNonManagedTablesEnabled = writesToNonManagedTablesEnabled;
return this;
}
public boolean getWritesToNonManagedTablesEnabled()
{
return writesToNonManagedTablesEnabled;
}
@Config("hive.non-managed-table-creates-enabled")
@ConfigDescription("Enable non-managed (external) table creates")
public HiveConfig setCreatesOfNonManagedTablesEnabled(boolean createsOfNonManagedTablesEnabled)
{
this.createsOfNonManagedTablesEnabled = createsOfNonManagedTablesEnabled;
return this;
}
public boolean getCreatesOfNonManagedTablesEnabled()
{
return createsOfNonManagedTablesEnabled;
}
@Config("hive.table-statistics-enabled")
@ConfigDescription("Enable use of table statistics")
public HiveConfig setTableStatisticsEnabled(boolean tableStatisticsEnabled)
{
this.tableStatisticsEnabled = tableStatisticsEnabled;
return this;
}
public boolean isTableStatisticsEnabled()
{
return tableStatisticsEnabled;
}
@Min(1)
public int getPartitionStatisticsSampleSize()
{
return partitionStatisticsSampleSize;
}
@Config("hive.partition-statistics-sample-size")
@ConfigDescription("Maximum sample size of the partitions column statistics")
public HiveConfig setPartitionStatisticsSampleSize(int partitionStatisticsSampleSize)
{
this.partitionStatisticsSampleSize = partitionStatisticsSampleSize;
return this;
}
public boolean isIgnoreCorruptedStatistics()
{
return ignoreCorruptedStatistics;
}
@Config("hive.ignore-corrupted-statistics")
@ConfigDescription("Ignore corrupted statistics rather than failing")
public HiveConfig setIgnoreCorruptedStatistics(boolean ignoreCorruptedStatistics)
{
this.ignoreCorruptedStatistics = ignoreCorruptedStatistics;
return this;
}
public boolean isCollectColumnStatisticsOnWrite()
{
return collectColumnStatisticsOnWrite;
}
@Config("hive.collect-column-statistics-on-write")
@ConfigDescription("Enables automatic column level statistics collection on write")
public HiveConfig setCollectColumnStatisticsOnWrite(boolean collectColumnStatisticsOnWrite)
{
this.collectColumnStatisticsOnWrite = collectColumnStatisticsOnWrite;
return this;
}
@Config("hive.metastore-recording-path")
public HiveConfig setRecordingPath(String recordingPath)
{
this.recordingPath = recordingPath;
return this;
}
public String getRecordingPath()
{
return recordingPath;
}
@Config("hive.replay-metastore-recording")
public HiveConfig setReplay(boolean replay)
{
this.replay = replay;
return this;
}
public boolean isReplay()
{
return replay;
}
@Config("hive.metastore-recording-duration")
public HiveConfig setRecordingDuration(Duration recordingDuration)
{
this.recordingDuration = recordingDuration;
return this;
}
@NotNull
public Duration getRecordingDuration()
{
return recordingDuration;
}
public boolean isS3SelectPushdownEnabled()
{
return s3SelectPushdownEnabled;
}
@Config("hive.s3select-pushdown.enabled")
@ConfigDescription("Enable query pushdown to AWS S3 Select service")
public HiveConfig setS3SelectPushdownEnabled(boolean s3SelectPushdownEnabled)
{
this.s3SelectPushdownEnabled = s3SelectPushdownEnabled;
return this;
}
@Min(1)
public int getS3SelectPushdownMaxConnections()
{
return s3SelectPushdownMaxConnections;
}
@Config("hive.s3select-pushdown.max-connections")
public HiveConfig setS3SelectPushdownMaxConnections(int s3SelectPushdownMaxConnections)
{
this.s3SelectPushdownMaxConnections = s3SelectPushdownMaxConnections;
return this;
}
@Config("hive.temporary-staging-directory-enabled")
@ConfigDescription("Should use (if possible) temporary staging directory for write operations")
public HiveConfig setTemporaryStagingDirectoryEnabled(boolean temporaryStagingDirectoryEnabled)
{
this.isTemporaryStagingDirectoryEnabled = temporaryStagingDirectoryEnabled;
return this;
}
public boolean isTemporaryStagingDirectoryEnabled()
{
return isTemporaryStagingDirectoryEnabled;
}
@Config("hive.temporary-staging-directory-path")
@ConfigDescription("Location of temporary staging directory for write operations. Use ${USER} placeholder to use different location for each user.")
public HiveConfig setTemporaryStagingDirectoryPath(String temporaryStagingDirectoryPath)
{
this.temporaryStagingDirectoryPath = temporaryStagingDirectoryPath;
return this;
}
@NotNull
public String getTemporaryStagingDirectoryPath()
{
return temporaryStagingDirectoryPath;
}
@Config("hive.transaction-heartbeat-interval")
@ConfigDescription("Interval after which heartbeat is sent for open Hive transaction")
public HiveConfig setHiveTransactionHeartbeatInterval(Duration interval)
{
this.hiveTransactionHeartbeatInterval = Optional.ofNullable(interval);
return this;
}
@NotNull
public Optional getHiveTransactionHeartbeatInterval()
{
return hiveTransactionHeartbeatInterval;
}
public int getHiveTransactionHeartbeatThreads()
{
return hiveTransactionHeartbeatThreads;
}
@Config("hive.transaction-heartbeat-threads")
@ConfigDescription("Number of threads to run in the Hive transaction heartbeat service")
public HiveConfig setHiveTransactionHeartbeatThreads(int hiveTransactionHeartbeatThreads)
{
this.hiveTransactionHeartbeatThreads = hiveTransactionHeartbeatThreads;
return this;
}
public boolean isAllowRegisterPartition()
{
return allowRegisterPartition;
}
@Config("hive.allow-register-partition-procedure")
public HiveConfig setAllowRegisterPartition(boolean allowRegisterPartition)
{
this.allowRegisterPartition = allowRegisterPartition;
return this;
}
public boolean isQueryPartitionFilterRequired()
{
return queryPartitionFilterRequired;
}
@Config("hive.query-partition-filter-required")
@ConfigDescription("Require filter on at least one partition column")
public HiveConfig setQueryPartitionFilterRequired(boolean queryPartitionFilterRequired)
{
this.queryPartitionFilterRequired = queryPartitionFilterRequired;
return this;
}
public boolean getPartitionUseColumnNames()
{
return partitionUseColumnNames;
}
@Config("hive.partition-use-column-names")
@ConfigDescription("Access partition columns by names")
public HiveConfig setPartitionUseColumnNames(boolean partitionUseColumnNames)
{
this.partitionUseColumnNames = partitionUseColumnNames;
return this;
}
public boolean isProjectionPushdownEnabled()
{
return projectionPushdownEnabled;
}
@Config("hive.projection-pushdown-enabled")
@ConfigDescription("Projection pushdown into hive is enabled through applyProjection")
public HiveConfig setProjectionPushdownEnabled(boolean projectionPushdownEnabled)
{
this.projectionPushdownEnabled = projectionPushdownEnabled;
return this;
}
@NotNull
public Duration getDynamicFilteringProbeBlockingTimeout()
{
return dynamicFilteringProbeBlockingTimeout;
}
@Config("hive.dynamic-filtering-probe-blocking-timeout")
@ConfigDescription("Duration to wait for completion of dynamic filters during split generation for probe side table")
public HiveConfig setDynamicFilteringProbeBlockingTimeout(Duration dynamicFilteringProbeBlockingTimeout)
{
this.dynamicFilteringProbeBlockingTimeout = dynamicFilteringProbeBlockingTimeout;
return this;
}
public HiveTimestampPrecision getTimestampPrecision()
{
return timestampPrecision;
}
@Config("hive.timestamp-precision")
@ConfigDescription("Precision used to represent timestamps")
public HiveConfig setTimestampPrecision(HiveTimestampPrecision timestampPrecision)
{
this.timestampPrecision = timestampPrecision;
return this;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy