Please wait. This can take some minutes ...
Many resources are needed to download a project. Please understand that we have to compensate our server costs. Thank you in advance.
Project price only 1 $
You can buy this project and download/modify it how often you want.
io.prestosql.plugin.hive.metastore.thrift.ThriftHiveMetastore Maven / Gradle / Ivy
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.prestosql.plugin.hive.metastore.thrift;
import com.google.common.cache.CacheBuilder;
import com.google.common.cache.CacheLoader;
import com.google.common.cache.LoadingCache;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.collect.Iterables;
import com.google.common.util.concurrent.UncheckedExecutionException;
import io.airlift.log.Logger;
import io.airlift.units.Duration;
import io.prestosql.plugin.hive.HdfsEnvironment;
import io.prestosql.plugin.hive.HdfsEnvironment.HdfsContext;
import io.prestosql.plugin.hive.HiveBasicStatistics;
import io.prestosql.plugin.hive.HiveConfig;
import io.prestosql.plugin.hive.HivePartition;
import io.prestosql.plugin.hive.HiveType;
import io.prestosql.plugin.hive.HiveViewNotSupportedException;
import io.prestosql.plugin.hive.PartitionNotFoundException;
import io.prestosql.plugin.hive.PartitionStatistics;
import io.prestosql.plugin.hive.SchemaAlreadyExistsException;
import io.prestosql.plugin.hive.TableAlreadyExistsException;
import io.prestosql.plugin.hive.authentication.HiveIdentity;
import io.prestosql.plugin.hive.metastore.Column;
import io.prestosql.plugin.hive.metastore.HiveColumnStatistics;
import io.prestosql.plugin.hive.metastore.HivePrincipal;
import io.prestosql.plugin.hive.metastore.HivePrivilegeInfo;
import io.prestosql.plugin.hive.metastore.PartitionWithStatistics;
import io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreAuthenticationConfig.ThriftMetastoreAuthenticationType;
import io.prestosql.plugin.hive.util.RetryDriver;
import io.prestosql.spi.PrestoException;
import io.prestosql.spi.connector.SchemaNotFoundException;
import io.prestosql.spi.connector.SchemaTableName;
import io.prestosql.spi.connector.TableNotFoundException;
import io.prestosql.spi.predicate.TupleDomain;
import io.prestosql.spi.security.ConnectorIdentity;
import io.prestosql.spi.security.RoleGrant;
import io.prestosql.spi.statistics.ColumnStatisticType;
import io.prestosql.spi.type.Type;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hive.metastore.LockComponentBuilder;
import org.apache.hadoop.hive.metastore.LockRequestBuilder;
import org.apache.hadoop.hive.metastore.TableType;
import org.apache.hadoop.hive.metastore.api.AlreadyExistsException;
import org.apache.hadoop.hive.metastore.api.ColumnStatisticsObj;
import org.apache.hadoop.hive.metastore.api.ConfigValSecurityException;
import org.apache.hadoop.hive.metastore.api.DataOperationType;
import org.apache.hadoop.hive.metastore.api.Database;
import org.apache.hadoop.hive.metastore.api.EnvironmentContext;
import org.apache.hadoop.hive.metastore.api.FieldSchema;
import org.apache.hadoop.hive.metastore.api.HiveObjectPrivilege;
import org.apache.hadoop.hive.metastore.api.HiveObjectRef;
import org.apache.hadoop.hive.metastore.api.InvalidInputException;
import org.apache.hadoop.hive.metastore.api.InvalidObjectException;
import org.apache.hadoop.hive.metastore.api.InvalidOperationException;
import org.apache.hadoop.hive.metastore.api.LockComponent;
import org.apache.hadoop.hive.metastore.api.LockRequest;
import org.apache.hadoop.hive.metastore.api.LockResponse;
import org.apache.hadoop.hive.metastore.api.LockState;
import org.apache.hadoop.hive.metastore.api.MetaException;
import org.apache.hadoop.hive.metastore.api.NoSuchLockException;
import org.apache.hadoop.hive.metastore.api.NoSuchObjectException;
import org.apache.hadoop.hive.metastore.api.NoSuchTxnException;
import org.apache.hadoop.hive.metastore.api.Partition;
import org.apache.hadoop.hive.metastore.api.PrincipalType;
import org.apache.hadoop.hive.metastore.api.PrivilegeBag;
import org.apache.hadoop.hive.metastore.api.PrivilegeGrantInfo;
import org.apache.hadoop.hive.metastore.api.Table;
import org.apache.hadoop.hive.metastore.api.TxnAbortedException;
import org.apache.hadoop.hive.metastore.api.UnknownDBException;
import org.apache.hadoop.hive.metastore.api.UnknownTableException;
import org.apache.thrift.TApplicationException;
import org.apache.thrift.TException;
import org.weakref.jmx.Flatten;
import org.weakref.jmx.Managed;
import javax.annotation.concurrent.ThreadSafe;
import javax.inject.Inject;
import java.io.Closeable;
import java.io.IOException;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.OptionalLong;
import java.util.Set;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicReference;
import java.util.function.Function;
import java.util.function.Predicate;
import java.util.regex.Pattern;
import java.util.stream.Stream;
import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Strings.isNullOrEmpty;
import static com.google.common.base.Throwables.propagateIfPossible;
import static com.google.common.base.Throwables.throwIfInstanceOf;
import static com.google.common.base.Throwables.throwIfUnchecked;
import static com.google.common.base.Verify.verify;
import static com.google.common.base.Verify.verifyNotNull;
import static com.google.common.collect.ImmutableList.toImmutableList;
import static com.google.common.collect.ImmutableMap.toImmutableMap;
import static com.google.common.collect.ImmutableSet.toImmutableSet;
import static com.google.common.collect.Iterables.getOnlyElement;
import static com.google.common.collect.Sets.difference;
import static io.prestosql.plugin.hive.HiveErrorCode.HIVE_METASTORE_ERROR;
import static io.prestosql.plugin.hive.HiveErrorCode.HIVE_TABLE_LOCK_NOT_ACQUIRED;
import static io.prestosql.plugin.hive.metastore.HivePrivilegeInfo.HivePrivilege;
import static io.prestosql.plugin.hive.metastore.HivePrivilegeInfo.HivePrivilege.OWNERSHIP;
import static io.prestosql.plugin.hive.metastore.MetastoreUtil.partitionKeyFilterToStringList;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.createMetastoreColumnStatistics;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.fromMetastoreApiPrincipalType;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.fromMetastoreApiTable;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.fromPrestoPrincipalType;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.fromRolePrincipalGrants;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.getHiveBasicStatistics;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.isAvroTableWithSchemaSet;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.parsePrivilege;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.toMetastoreApiPartition;
import static io.prestosql.plugin.hive.metastore.thrift.ThriftMetastoreUtil.updateStatisticsParameters;
import static io.prestosql.plugin.hive.util.HiveUtil.PRESTO_VIEW_FLAG;
import static io.prestosql.spi.StandardErrorCode.ALREADY_EXISTS;
import static io.prestosql.spi.StandardErrorCode.NOT_SUPPORTED;
import static io.prestosql.spi.security.PrincipalType.USER;
import static java.lang.Boolean.FALSE;
import static java.lang.Boolean.TRUE;
import static java.lang.String.format;
import static java.lang.System.nanoTime;
import static java.util.Objects.requireNonNull;
import static java.util.concurrent.TimeUnit.MILLISECONDS;
import static java.util.concurrent.TimeUnit.SECONDS;
import static org.apache.hadoop.hive.common.FileUtils.makePartName;
import static org.apache.hadoop.hive.metastore.TableType.MANAGED_TABLE;
import static org.apache.hadoop.hive.metastore.api.HiveObjectType.TABLE;
import static org.apache.hadoop.hive.metastore.api.hive_metastoreConstants.HIVE_FILTER_FIELD_PARAMS;
import static org.apache.thrift.TApplicationException.UNKNOWN_METHOD;
@ThreadSafe
public class ThriftHiveMetastore
implements ThriftMetastore
{
private static final Logger log = Logger.get(ThriftHiveMetastore.class);
private static final int MAX_SET_DATE_STATISTICS_ATTEMPTS = 100;
private static final String DEFAULT_METASTORE_USER = "presto";
private final ThriftMetastoreStats stats = new ThriftMetastoreStats();
private final HdfsEnvironment hdfsEnvironment;
private final HdfsContext hdfsContext;
private final MetastoreLocator clientProvider;
private final double backoffScaleFactor;
private final Duration minBackoffDelay;
private final Duration maxBackoffDelay;
private final Duration maxRetryTime;
private final Duration maxWaitForLock;
private final int maxRetries;
private final boolean impersonationEnabled;
private final boolean authenticationEnabled;
private final LoadingCache delegationTokenCache;
private final boolean deleteFilesOnDrop;
private final boolean translateHiveViews;
private final AtomicInteger chosenGetTableAlternative = new AtomicInteger(Integer.MAX_VALUE);
private final AtomicInteger chosenTableParamAlternative = new AtomicInteger(Integer.MAX_VALUE);
private final AtomicInteger chosesGetAllViewsAlternative = new AtomicInteger(Integer.MAX_VALUE);
private final AtomicReference> metastoreSupportsDateStatistics = new AtomicReference<>(Optional.empty());
private final CoalescingCounter metastoreSetDateStatisticsFailures = new CoalescingCounter(new Duration(1, SECONDS));
private static final Pattern TABLE_PARAMETER_SAFE_KEY_PATTERN = Pattern.compile("^[a-zA-Z_]+$");
private static final Pattern TABLE_PARAMETER_SAFE_VALUE_PATTERN = Pattern.compile("^[a-zA-Z0-9]*$");
private final boolean assumeCanonicalPartitionKeys;
@Inject
public ThriftHiveMetastore(MetastoreLocator metastoreLocator, HiveConfig hiveConfig, ThriftMetastoreConfig thriftConfig, ThriftMetastoreAuthenticationConfig authenticationConfig, HdfsEnvironment hdfsEnvironment)
{
this(
metastoreLocator,
hiveConfig,
thriftConfig,
hdfsEnvironment,
authenticationConfig.getAuthenticationType() != ThriftMetastoreAuthenticationType.NONE);
}
public ThriftHiveMetastore(MetastoreLocator metastoreLocator, HiveConfig hiveConfig, ThriftMetastoreConfig thriftConfig, HdfsEnvironment hdfsEnvironment, boolean authenticationEnabled)
{
this.hdfsContext = new HdfsContext(ConnectorIdentity.ofUser(DEFAULT_METASTORE_USER));
this.clientProvider = requireNonNull(metastoreLocator, "metastoreLocator is null");
this.hdfsEnvironment = requireNonNull(hdfsEnvironment, "hdfsEnvironment is null");
this.backoffScaleFactor = thriftConfig.getBackoffScaleFactor();
this.minBackoffDelay = thriftConfig.getMinBackoffDelay();
this.maxBackoffDelay = thriftConfig.getMaxBackoffDelay();
this.maxRetryTime = thriftConfig.getMaxRetryTime();
this.maxRetries = thriftConfig.getMaxRetries();
this.impersonationEnabled = thriftConfig.isImpersonationEnabled();
this.deleteFilesOnDrop = thriftConfig.isDeleteFilesOnDrop();
this.translateHiveViews = hiveConfig.isTranslateHiveViews();
this.maxWaitForLock = thriftConfig.getMaxWaitForTransactionLock();
this.authenticationEnabled = authenticationEnabled;
this.delegationTokenCache = CacheBuilder.newBuilder()
.expireAfterWrite(thriftConfig.getDelegationTokenCacheTtl().toMillis(), MILLISECONDS)
.maximumSize(thriftConfig.getDelegationTokenCacheMaximumSize())
.build(CacheLoader.from(this::loadDelegationToken));
this.assumeCanonicalPartitionKeys = thriftConfig.isAssumeCanonicalPartitionKeys();
}
@Managed
@Flatten
public ThriftMetastoreStats getStats()
{
return stats;
}
@Override
public List getAllDatabases()
{
try {
return retry()
.stopOnIllegalExceptions()
.run("getAllDatabases", stats.getGetAllDatabases().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return client.getAllDatabases();
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Optional getDatabase(String databaseName)
{
try {
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getDatabase", stats.getGetDatabase().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return Optional.of(client.getDatabase(databaseName));
}
}));
}
catch (NoSuchObjectException e) {
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public List getAllTables(String databaseName)
{
try {
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getAllTables", () -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return client.getAllTables(databaseName);
}
});
}
catch (NoSuchObjectException e) {
return ImmutableList.of();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public List getTablesWithParameter(String databaseName, String parameterKey, String parameterValue)
{
try {
return retry()
.stopOn(UnknownDBException.class)
.stopOnIllegalExceptions()
.run("getTablesWithParameter", stats.getGetTablesWithParameter().wrap(
() -> doGetTablesWithParameter(databaseName, parameterKey, parameterValue)));
}
catch (UnknownDBException e) {
return ImmutableList.of();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Optional getTable(HiveIdentity identity, String databaseName, String tableName)
{
try {
return retry()
.stopOn(NoSuchObjectException.class, HiveViewNotSupportedException.class)
.stopOnIllegalExceptions()
.run("getTable", stats.getGetTable().wrap(() -> {
Table table = getTableFromMetastore(identity, databaseName, tableName);
if (!translateHiveViews && table.getTableType().equals(TableType.VIRTUAL_VIEW.name()) && !isPrestoView(table)) {
throw new HiveViewNotSupportedException(new SchemaTableName(databaseName, tableName));
}
return Optional.of(table);
}));
}
catch (NoSuchObjectException e) {
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private Table getTableFromMetastore(HiveIdentity identity, String databaseName, String tableName)
throws TException
{
return alternativeCall(
() -> createMetastoreClient(identity),
ThriftHiveMetastore::defaultIsValidExceptionalResponse,
chosenGetTableAlternative,
client -> client.getTableWithCapabilities(databaseName, tableName),
client -> client.getTable(databaseName, tableName));
}
@Override
public Set getSupportedColumnStatistics(Type type)
{
return ThriftMetastoreUtil.getSupportedColumnStatistics(type);
}
private static boolean isPrestoView(Table table)
{
return "true".equals(table.getParameters().get(PRESTO_VIEW_FLAG));
}
@Override
public PartitionStatistics getTableStatistics(HiveIdentity identity, Table table)
{
List dataColumns = table.getSd().getCols().stream()
.map(FieldSchema::getName)
.collect(toImmutableList());
HiveBasicStatistics basicStatistics = getHiveBasicStatistics(table.getParameters());
Map columnStatistics = getTableColumnStatistics(identity, table.getDbName(), table.getTableName(), dataColumns, basicStatistics.getRowCount());
return new PartitionStatistics(basicStatistics, columnStatistics);
}
private Map getTableColumnStatistics(HiveIdentity identity, String databaseName, String tableName, List columns, OptionalLong rowCount)
{
try {
return retry()
.stopOn(NoSuchObjectException.class, HiveViewNotSupportedException.class)
.stopOnIllegalExceptions()
.run("getTableColumnStatistics", stats.getGetTableColumnStatistics().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return groupStatisticsByColumn(client.getTableColumnStatistics(databaseName, tableName, columns), rowCount);
}
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Map getPartitionStatistics(HiveIdentity identity, Table table, List partitions)
{
List dataColumns = table.getSd().getCols().stream()
.map(FieldSchema::getName)
.collect(toImmutableList());
List partitionColumns = table.getPartitionKeys().stream()
.map(FieldSchema::getName)
.collect(toImmutableList());
Map partitionBasicStatistics = partitions.stream()
.collect(toImmutableMap(
partition -> makePartName(partitionColumns, partition.getValues()),
partition -> getHiveBasicStatistics(partition.getParameters())));
Map partitionRowCounts = partitionBasicStatistics.entrySet().stream()
.collect(toImmutableMap(Map.Entry::getKey, entry -> entry.getValue().getRowCount()));
Map> partitionColumnStatistics = getPartitionColumnStatistics(
identity,
table.getDbName(),
table.getTableName(),
partitionBasicStatistics.keySet(),
dataColumns,
partitionRowCounts);
ImmutableMap.Builder result = ImmutableMap.builder();
for (String partitionName : partitionBasicStatistics.keySet()) {
HiveBasicStatistics basicStatistics = partitionBasicStatistics.get(partitionName);
Map columnStatistics = partitionColumnStatistics.getOrDefault(partitionName, ImmutableMap.of());
result.put(partitionName, new PartitionStatistics(basicStatistics, columnStatistics));
}
return result.build();
}
@Override
public Optional> getFields(HiveIdentity identity, String databaseName, String tableName)
{
try {
return retry()
.stopOn(MetaException.class, UnknownTableException.class, UnknownDBException.class)
.stopOnIllegalExceptions()
.run("getFields", stats.getGetFields().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return Optional.of(ImmutableList.copyOf(client.getFields(databaseName, tableName)));
}
}));
}
catch (NoSuchObjectException e) {
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private Map> getPartitionColumnStatistics(
HiveIdentity identity,
String databaseName,
String tableName,
Set partitionNames,
List columnNames,
Map partitionRowCounts)
{
return getMetastorePartitionColumnStatistics(identity, databaseName, tableName, partitionNames, columnNames).entrySet().stream()
.filter(entry -> !entry.getValue().isEmpty())
.collect(toImmutableMap(
Map.Entry::getKey,
entry -> groupStatisticsByColumn(entry.getValue(), partitionRowCounts.getOrDefault(entry.getKey(), OptionalLong.empty()))));
}
private Map> getMetastorePartitionColumnStatistics(HiveIdentity identity, String databaseName, String tableName, Set partitionNames, List columnNames)
{
try {
return retry()
.stopOn(NoSuchObjectException.class, HiveViewNotSupportedException.class)
.stopOnIllegalExceptions()
.run("getPartitionColumnStatistics", stats.getGetPartitionColumnStatistics().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return client.getPartitionColumnStatistics(databaseName, tableName, ImmutableList.copyOf(partitionNames), columnNames);
}
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private Map groupStatisticsByColumn(List statistics, OptionalLong rowCount)
{
return statistics.stream()
.collect(toImmutableMap(ColumnStatisticsObj::getColName, statisticsObj -> ThriftMetastoreUtil.fromMetastoreApiColumnStatistics(statisticsObj, rowCount)));
}
@Override
public void updateTableStatistics(HiveIdentity identity, String databaseName, String tableName, Function update)
{
Table originalTable = getTable(identity, databaseName, tableName)
.orElseThrow(() -> new TableNotFoundException(new SchemaTableName(databaseName, tableName)));
PartitionStatistics currentStatistics = getTableStatistics(identity, originalTable);
PartitionStatistics updatedStatistics = update.apply(currentStatistics);
Table modifiedTable = originalTable.deepCopy();
HiveBasicStatistics basicStatistics = updatedStatistics.getBasicStatistics();
modifiedTable.setParameters(updateStatisticsParameters(modifiedTable.getParameters(), basicStatistics));
alterTable(identity, databaseName, tableName, modifiedTable);
io.prestosql.plugin.hive.metastore.Table table = fromMetastoreApiTable(modifiedTable);
OptionalLong rowCount = basicStatistics.getRowCount();
List metastoreColumnStatistics = updatedStatistics.getColumnStatistics().entrySet().stream()
.flatMap(entry -> {
Optional column = table.getColumn(entry.getKey());
if (column.isEmpty() && isAvroTableWithSchemaSet(modifiedTable)) {
// Avro table can have different effective schema than declared in metastore. Still, metastore does not allow
// to store statistics for a column it does not know about.
return Stream.of();
}
HiveType type = column.orElseThrow(() -> new IllegalStateException("Column not found: " + entry.getKey())).getType();
return Stream.of(createMetastoreColumnStatistics(entry.getKey(), type, entry.getValue(), rowCount));
})
.collect(toImmutableList());
if (!metastoreColumnStatistics.isEmpty()) {
setTableColumnStatistics(identity, databaseName, tableName, metastoreColumnStatistics);
}
Set removedColumnStatistics = difference(currentStatistics.getColumnStatistics().keySet(), updatedStatistics.getColumnStatistics().keySet());
removedColumnStatistics.forEach(column -> deleteTableColumnStatistics(identity, databaseName, tableName, column));
}
private void setTableColumnStatistics(HiveIdentity identity, String databaseName, String tableName, List statistics)
{
try {
retry()
.stopOn(NoSuchObjectException.class, InvalidObjectException.class, MetaException.class, InvalidInputException.class)
.stopOnIllegalExceptions()
.run("setTableColumnStatistics", stats.getSetTableColumnStatistics().wrap(() -> {
setColumnStatistics(
identity,
format("table %s.%s", databaseName, tableName),
statistics,
(client, stats) -> client.setTableColumnStatistics(databaseName, tableName, stats));
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private void deleteTableColumnStatistics(HiveIdentity identity, String databaseName, String tableName, String columnName)
{
try {
retry()
.stopOn(NoSuchObjectException.class, InvalidObjectException.class, MetaException.class, InvalidInputException.class)
.stopOnIllegalExceptions()
.run("deleteTableColumnStatistics", stats.getDeleteTableColumnStatistics().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.deleteTableColumnStatistics(databaseName, tableName, columnName);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void updatePartitionStatistics(HiveIdentity identity, Table table, String partitionName, Function update)
{
List partitions = getPartitionsByNames(identity, table.getDbName(), table.getTableName(), ImmutableList.of(partitionName));
if (partitions.size() != 1) {
throw new PrestoException(HIVE_METASTORE_ERROR, "Metastore returned multiple partitions for name: " + partitionName);
}
Partition originalPartition = getOnlyElement(partitions);
PartitionStatistics currentStatistics = requireNonNull(
getPartitionStatistics(identity, table, partitions).get(partitionName), "getPartitionStatistics() did not return statistics for partition");
PartitionStatistics updatedStatistics = update.apply(currentStatistics);
Partition modifiedPartition = originalPartition.deepCopy();
HiveBasicStatistics basicStatistics = updatedStatistics.getBasicStatistics();
modifiedPartition.setParameters(updateStatisticsParameters(modifiedPartition.getParameters(), basicStatistics));
alterPartitionWithoutStatistics(identity, table.getDbName(), table.getTableName(), modifiedPartition);
Map columns = modifiedPartition.getSd().getCols().stream()
.collect(toImmutableMap(FieldSchema::getName, schema -> HiveType.valueOf(schema.getType())));
setPartitionColumnStatistics(identity, table.getDbName(), table.getTableName(), partitionName, columns, updatedStatistics.getColumnStatistics(), basicStatistics.getRowCount());
Set removedStatistics = difference(currentStatistics.getColumnStatistics().keySet(), updatedStatistics.getColumnStatistics().keySet());
removedStatistics.forEach(column -> deletePartitionColumnStatistics(identity, table.getDbName(), table.getTableName(), partitionName, column));
}
private void setPartitionColumnStatistics(
HiveIdentity identity,
String databaseName,
String tableName,
String partitionName,
Map columns,
Map columnStatistics,
OptionalLong rowCount)
{
List metastoreColumnStatistics = columnStatistics.entrySet().stream()
.filter(entry -> columns.containsKey(entry.getKey()))
.map(entry -> createMetastoreColumnStatistics(entry.getKey(), columns.get(entry.getKey()), entry.getValue(), rowCount))
.collect(toImmutableList());
if (!metastoreColumnStatistics.isEmpty()) {
setPartitionColumnStatistics(identity, databaseName, tableName, partitionName, metastoreColumnStatistics);
}
}
private void setPartitionColumnStatistics(HiveIdentity identity, String databaseName, String tableName, String partitionName, List statistics)
{
try {
retry()
.stopOn(NoSuchObjectException.class, InvalidObjectException.class, MetaException.class, InvalidInputException.class)
.stopOnIllegalExceptions()
.run("setPartitionColumnStatistics", stats.getSetPartitionColumnStatistics().wrap(() -> {
setColumnStatistics(
identity,
format("partition of table %s.%s", databaseName, tableName),
statistics,
(client, stats) -> client.setPartitionColumnStatistics(databaseName, tableName, partitionName, stats));
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private void deletePartitionColumnStatistics(HiveIdentity identity, String databaseName, String tableName, String partitionName, String columnName)
{
try {
retry()
.stopOn(NoSuchObjectException.class, InvalidObjectException.class, MetaException.class, InvalidInputException.class)
.stopOnIllegalExceptions()
.run("deletePartitionColumnStatistics", stats.getDeletePartitionColumnStatistics().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.deletePartitionColumnStatistics(databaseName, tableName, partitionName, columnName);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private void setColumnStatistics(HiveIdentity identity, String objectName, List statistics, Call1> saveColumnStatistics)
throws TException
{
boolean containsDateStatistics = statistics.stream().anyMatch(stats -> stats.getStatsData().isSetDateStats());
Optional metastoreSupportsDateStatistics = this.metastoreSupportsDateStatistics.get();
if (containsDateStatistics && metastoreSupportsDateStatistics.equals(Optional.of(FALSE))) {
log.debug("Skipping date statistics for %s because metastore does not support them", objectName);
statistics = statistics.stream()
.filter(stats -> !stats.getStatsData().isSetDateStats())
.collect(toImmutableList());
containsDateStatistics = false;
}
if (!containsDateStatistics || metastoreSupportsDateStatistics.equals(Optional.of(TRUE))) {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
saveColumnStatistics.call(client, statistics);
}
return;
}
List statisticsExceptDate = statistics.stream()
.filter(stats -> !stats.getStatsData().isSetDateStats())
.collect(toImmutableList());
List dateStatistics = statistics.stream()
.filter(stats -> stats.getStatsData().isSetDateStats())
.collect(toImmutableList());
verify(!dateStatistics.isEmpty() && metastoreSupportsDateStatistics.equals(Optional.empty()));
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
saveColumnStatistics.call(client, statisticsExceptDate);
try {
saveColumnStatistics.call(client, dateStatistics);
}
catch (TException e) {
// When `dateStatistics.size() > 1` we expect something like "TApplicationException: Required field 'colName' is unset! Struct:ColumnStatisticsObj(colName:null, colType:null, statsData:null)"
// When `dateStatistics.size() == 1` we expect something like "TTransportException: java.net.SocketTimeoutException: Read timed out"
log.warn(e, "Failed to save date statistics for %s. Metastore might not support date statistics", objectName);
if (!statisticsExceptDate.isEmpty() && metastoreSetDateStatisticsFailures.incrementAndGet() >= MAX_SET_DATE_STATISTICS_ATTEMPTS) {
this.metastoreSupportsDateStatistics.set(Optional.of(FALSE));
}
return;
}
}
this.metastoreSupportsDateStatistics.set(Optional.of(TRUE));
}
@Override
public void createRole(String role, String grantor)
{
try {
retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("createRole", stats.getCreateRole().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
client.createRole(role, grantor);
return null;
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void dropRole(String role)
{
try {
retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("dropRole", stats.getDropRole().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
client.dropRole(role);
return null;
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Set listRoles()
{
try {
return retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("listRoles", stats.getListRoles().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return ImmutableSet.copyOf(client.getRoleNames());
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void grantRoles(Set roles, Set grantees, boolean adminOption, HivePrincipal grantor)
{
for (HivePrincipal grantee : grantees) {
for (String role : roles) {
grantRole(
role,
grantee.getName(), fromPrestoPrincipalType(grantee.getType()),
grantor.getName(), fromPrestoPrincipalType(grantor.getType()),
adminOption);
}
}
}
private void grantRole(String role, String granteeName, PrincipalType granteeType, String grantorName, PrincipalType grantorType, boolean grantOption)
{
try {
retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("grantRole", stats.getGrantRole().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
client.grantRole(role, granteeName, granteeType, grantorName, grantorType, grantOption);
return null;
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void revokeRoles(Set roles, Set grantees, boolean adminOption, HivePrincipal grantor)
{
for (HivePrincipal grantee : grantees) {
for (String role : roles) {
revokeRole(
role,
grantee.getName(), fromPrestoPrincipalType(grantee.getType()),
adminOption);
}
}
}
private void revokeRole(String role, String granteeName, PrincipalType granteeType, boolean grantOption)
{
try {
retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("revokeRole", stats.getRevokeRole().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
client.revokeRole(role, granteeName, granteeType, grantOption);
return null;
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Set listGrantedPrincipals(String role)
{
try {
return retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("listPrincipals", stats.getListGrantedPrincipals().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return fromRolePrincipalGrants(client.listGrantedPrincipals(role));
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Set listRoleGrants(HivePrincipal principal)
{
try {
return retry()
.stopOn(MetaException.class)
.stopOnIllegalExceptions()
.run("listRoleGrants", stats.getListRoleGrants().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
return fromRolePrincipalGrants(client.listRoleGrants(principal.getName(), fromPrestoPrincipalType(principal.getType())));
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public List getAllViews(String databaseName)
{
try {
return retry()
.stopOn(UnknownDBException.class)
.stopOnIllegalExceptions()
.run("getAllViews", stats.getGetAllViews().wrap(() -> {
if (translateHiveViews) {
return alternativeCall(
this::createMetastoreClient,
exception -> !isUnknownMethodExceptionalResponse(exception),
chosesGetAllViewsAlternative,
client -> client.getTableNamesByType(databaseName, TableType.VIRTUAL_VIEW.name()),
// fallback to enumerating Presto views only (Hive views will still be executed, but will be listed as tables)
client -> doGetTablesWithParameter(databaseName, PRESTO_VIEW_FLAG, "true"));
}
return doGetTablesWithParameter(databaseName, PRESTO_VIEW_FLAG, "true");
}));
}
catch (UnknownDBException e) {
return ImmutableList.of();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private List doGetTablesWithParameter(String databaseName, String parameterKey, String parameterValue)
throws TException
{
checkArgument(TABLE_PARAMETER_SAFE_KEY_PATTERN.matcher(parameterKey).matches(), "Parameter key contains invalid characters: '%s'", parameterKey);
/*
* The parameter value is restricted to have only alphanumeric characters so that it's safe
* to be used against HMS. When using with a LIKE operator, the HMS may want the parameter
* value to follow a Java regex pattern or a SQL pattern. And it's hard to predict the
* HMS's behavior from outside. Also, by restricting parameter values, we avoid the problem
* of how to quote them when passing within the filter string.
*/
checkArgument(TABLE_PARAMETER_SAFE_VALUE_PATTERN.matcher(parameterValue).matches(), "Parameter value contains invalid characters: '%s'", parameterValue);
/*
* Thrift call `get_table_names_by_filter` may be translated by Metastore to a SQL query against Metastore database.
* Hive 2.3 on some databases uses CLOB for table parameter value column and some databases disallow `=` predicate over
* CLOB values. At the same time, they allow `LIKE` predicates over them.
*/
String filterWithEquals = HIVE_FILTER_FIELD_PARAMS + parameterKey + " = \"" + parameterValue + "\"";
String filterWithLike = HIVE_FILTER_FIELD_PARAMS + parameterKey + " LIKE \"" + parameterValue + "\"";
return alternativeCall(
this::createMetastoreClient,
ThriftHiveMetastore::defaultIsValidExceptionalResponse,
chosenTableParamAlternative,
client -> client.getTableNamesByFilter(databaseName, filterWithEquals),
client -> client.getTableNamesByFilter(databaseName, filterWithLike));
}
@Override
public void createDatabase(HiveIdentity identity, Database database)
{
try {
retry()
.stopOn(AlreadyExistsException.class, InvalidObjectException.class, MetaException.class)
.stopOnIllegalExceptions()
.run("createDatabase", stats.getCreateDatabase().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.createDatabase(database);
}
return null;
}));
}
catch (AlreadyExistsException e) {
throw new SchemaAlreadyExistsException(database.getName());
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void dropDatabase(HiveIdentity identity, String databaseName)
{
try {
retry()
.stopOn(NoSuchObjectException.class, InvalidOperationException.class)
.stopOnIllegalExceptions()
.run("dropDatabase", stats.getDropDatabase().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.dropDatabase(databaseName, true, false);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new SchemaNotFoundException(databaseName);
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void alterDatabase(HiveIdentity identity, String databaseName, Database database)
{
try {
retry()
.stopOn(NoSuchObjectException.class, MetaException.class)
.stopOnIllegalExceptions()
.run("alterDatabase", stats.getAlterDatabase().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.alterDatabase(databaseName, database);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new SchemaNotFoundException(databaseName);
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void createTable(HiveIdentity identity, Table table)
{
try {
retry()
.stopOn(AlreadyExistsException.class, InvalidObjectException.class, MetaException.class, NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("createTable", stats.getCreateTable().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.createTable(table);
}
return null;
}));
}
catch (AlreadyExistsException e) {
throw new TableAlreadyExistsException(new SchemaTableName(table.getDbName(), table.getTableName()));
}
catch (NoSuchObjectException e) {
throw new SchemaNotFoundException(table.getDbName());
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void dropTable(HiveIdentity identity, String databaseName, String tableName, boolean deleteData)
{
try {
retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("dropTable", stats.getDropTable().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
Table table = client.getTable(databaseName, tableName);
client.dropTable(databaseName, tableName, deleteData);
String tableLocation = table.getSd().getLocation();
if (deleteFilesOnDrop && deleteData && isManagedTable(table) && !isNullOrEmpty(tableLocation)) {
deleteDirRecursive(hdfsContext, hdfsEnvironment, new Path(tableLocation));
}
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private static void deleteDirRecursive(HdfsContext context, HdfsEnvironment hdfsEnvironment, Path path)
{
try {
hdfsEnvironment.getFileSystem(context, path).delete(path, true);
}
catch (IOException | RuntimeException e) {
// don't fail if unable to delete path
log.warn(e, "Failed to delete path: " + path.toString());
}
}
private static boolean isManagedTable(Table table)
{
return table.getTableType().equals(MANAGED_TABLE.name());
}
@Override
public void alterTable(HiveIdentity identity, String databaseName, String tableName, Table table)
{
try {
retry()
.stopOn(InvalidOperationException.class, MetaException.class)
.stopOnIllegalExceptions()
.run("alterTable", stats.getAlterTable().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
EnvironmentContext context = new EnvironmentContext();
// This prevents Hive 3.x from collecting basic table stats at table creation time.
// These stats are not useful by themselves and can take very long time to collect when creating an
// external table over large data set.
context.setProperties(ImmutableMap.of("DO_NOT_UPDATE_STATS", "true"));
client.alterTableWithEnvironmentContext(databaseName, tableName, table, context);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Optional> getPartitionNamesByFilter(HiveIdentity identity, String databaseName, String tableName, List columnNames, TupleDomain partitionKeysFilter)
{
Optional> parts = partitionKeyFilterToStringList(columnNames, partitionKeysFilter, assumeCanonicalPartitionKeys);
checkArgument(!columnNames.isEmpty() || partitionKeysFilter.isAll(), "must pass in all columnNames or the filter must be all");
if (parts.isEmpty()) {
return Optional.of(ImmutableList.of());
}
try {
if (partitionKeysFilter.isAll()) {
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getPartitionNames", stats.getGetPartitionNames().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return Optional.of(client.getPartitionNames(databaseName, tableName));
}
}));
}
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getPartitionNamesByParts", stats.getGetPartitionNamesByParts().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return Optional.of(client.getPartitionNamesFiltered(databaseName, tableName, parts.get()));
}
}));
}
catch (NoSuchObjectException e) {
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void addPartitions(HiveIdentity identity, String databaseName, String tableName, List partitionsWithStatistics)
{
List partitions = partitionsWithStatistics.stream()
.map(ThriftMetastoreUtil::toMetastoreApiPartition)
.collect(toImmutableList());
addPartitionsWithoutStatistics(identity, databaseName, tableName, partitions);
for (PartitionWithStatistics partitionWithStatistics : partitionsWithStatistics) {
storePartitionColumnStatistics(identity, databaseName, tableName, partitionWithStatistics.getPartitionName(), partitionWithStatistics);
}
}
private void addPartitionsWithoutStatistics(HiveIdentity identity, String databaseName, String tableName, List partitions)
{
if (partitions.isEmpty()) {
return;
}
try {
retry()
.stopOn(AlreadyExistsException.class, InvalidObjectException.class, MetaException.class, NoSuchObjectException.class, PrestoException.class)
.stopOnIllegalExceptions()
.run("addPartitions", stats.getAddPartitions().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
int partitionsAdded = client.addPartitions(partitions);
if (partitionsAdded != partitions.size()) {
throw new PrestoException(HIVE_METASTORE_ERROR,
format("Hive metastore only added %s of %s partitions", partitionsAdded, partitions.size()));
}
return null;
}
}));
}
catch (AlreadyExistsException e) {
throw new PrestoException(ALREADY_EXISTS, format("One or more partitions already exist for table '%s.%s'", databaseName, tableName), e);
}
catch (NoSuchObjectException e) {
throw new TableNotFoundException(new SchemaTableName(databaseName, tableName));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void dropPartition(HiveIdentity identity, String databaseName, String tableName, List parts, boolean deleteData)
{
try {
retry()
.stopOn(NoSuchObjectException.class, MetaException.class)
.stopOnIllegalExceptions()
.run("dropPartition", stats.getDropPartition().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.dropPartition(databaseName, tableName, parts, deleteData);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new PartitionNotFoundException(new SchemaTableName(databaseName, tableName), parts);
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void alterPartition(HiveIdentity identity, String databaseName, String tableName, PartitionWithStatistics partitionWithStatistics)
{
alterPartitionWithoutStatistics(identity, databaseName, tableName, toMetastoreApiPartition(partitionWithStatistics));
storePartitionColumnStatistics(identity, databaseName, tableName, partitionWithStatistics.getPartitionName(), partitionWithStatistics);
dropExtraColumnStatisticsAfterAlterPartition(identity, databaseName, tableName, partitionWithStatistics);
}
private void alterPartitionWithoutStatistics(HiveIdentity identity, String databaseName, String tableName, Partition partition)
{
try {
retry()
.stopOn(NoSuchObjectException.class, MetaException.class)
.stopOnIllegalExceptions()
.run("alterPartition", stats.getAlterPartition().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
client.alterPartition(databaseName, tableName, partition);
}
return null;
}));
}
catch (NoSuchObjectException e) {
throw new PartitionNotFoundException(new SchemaTableName(databaseName, tableName), partition.getValues());
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private void storePartitionColumnStatistics(HiveIdentity identity, String databaseName, String tableName, String partitionName, PartitionWithStatistics partitionWithStatistics)
{
PartitionStatistics statistics = partitionWithStatistics.getStatistics();
Map columnStatistics = statistics.getColumnStatistics();
if (columnStatistics.isEmpty()) {
return;
}
Map columnTypes = partitionWithStatistics.getPartition().getColumns().stream()
.collect(toImmutableMap(Column::getName, Column::getType));
setPartitionColumnStatistics(identity, databaseName, tableName, partitionName, columnTypes, columnStatistics, statistics.getBasicStatistics().getRowCount());
}
/*
* After altering a partition metastore preserves all column statistics for that partition.
*
* The old statistics are supposed to be replaced by storing the new partition statistics.
*
* In case when the new statistics are not present for some columns, or if the table schema has changed
* if is needed to explicitly remove the statistics from the metastore for that columns.
*/
private void dropExtraColumnStatisticsAfterAlterPartition(
HiveIdentity identity,
String databaseName,
String tableName,
PartitionWithStatistics partitionWithStatistics)
{
List dataColumns = partitionWithStatistics.getPartition().getColumns().stream()
.map(Column::getName)
.collect(toImmutableList());
Set columnsWithMissingStatistics = new HashSet<>(dataColumns);
columnsWithMissingStatistics.removeAll(partitionWithStatistics.getStatistics().getColumnStatistics().keySet());
// In case new partition had the statistics computed for all the columns, the storePartitionColumnStatistics
// call in the alterPartition will just overwrite the old statistics. There is no need to explicitly remove anything.
if (columnsWithMissingStatistics.isEmpty()) {
return;
}
// check if statistics for the columnsWithMissingStatistics are actually stored in the metastore
// when trying to remove any missing statistics the metastore throws NoSuchObjectException
String partitionName = partitionWithStatistics.getPartitionName();
List statisticsToBeRemoved = getMetastorePartitionColumnStatistics(
identity,
databaseName,
tableName,
ImmutableSet.of(partitionName),
ImmutableList.copyOf(columnsWithMissingStatistics))
.getOrDefault(partitionName, ImmutableList.of());
for (ColumnStatisticsObj statistics : statisticsToBeRemoved) {
deletePartitionColumnStatistics(identity, databaseName, tableName, partitionName, statistics.getColName());
}
}
@Override
public Optional getPartition(HiveIdentity identity, String databaseName, String tableName, List partitionValues)
{
requireNonNull(partitionValues, "partitionValues is null");
try {
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getPartition", stats.getGetPartition().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return Optional.of(client.getPartition(databaseName, tableName, partitionValues));
}
}));
}
catch (NoSuchObjectException e) {
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public List getPartitionsByNames(HiveIdentity identity, String databaseName, String tableName, List partitionNames)
{
requireNonNull(partitionNames, "partitionNames is null");
checkArgument(!Iterables.isEmpty(partitionNames), "partitionNames is empty");
try {
return retry()
.stopOn(NoSuchObjectException.class)
.stopOnIllegalExceptions()
.run("getPartitionsByNames", stats.getGetPartitionsByNames().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient(identity)) {
return client.getPartitionsByNames(databaseName, tableName, partitionNames);
}
}));
}
catch (NoSuchObjectException e) {
// assume none of the partitions in the batch are available
return ImmutableList.of();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void grantTablePrivileges(String databaseName, String tableName, String tableOwner, HivePrincipal grantee, Set privileges)
{
Set requestedPrivileges = privileges.stream()
.map(ThriftMetastoreUtil::toMetastoreApiPrivilegeGrantInfo)
.collect(toImmutableSet());
checkArgument(!containsAllPrivilege(requestedPrivileges), "\"ALL\" not supported in PrivilegeGrantInfo.privilege");
try {
retry()
.stopOnIllegalExceptions()
.run("grantTablePrivileges", stats.getGrantTablePrivileges().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient()) {
Set existingPrivileges = listTablePrivileges(databaseName, tableName, tableOwner, Optional.of(grantee));
Set privilegesToGrant = new HashSet<>(requestedPrivileges);
Iterator iterator = privilegesToGrant.iterator();
while (iterator.hasNext()) {
HivePrivilegeInfo requestedPrivilege = getOnlyElement(parsePrivilege(iterator.next(), Optional.empty()));
for (HivePrivilegeInfo existingPrivilege : existingPrivileges) {
if ((requestedPrivilege.isContainedIn(existingPrivilege))) {
iterator.remove();
}
else if (existingPrivilege.isContainedIn(requestedPrivilege)) {
throw new PrestoException(NOT_SUPPORTED, format(
"Granting %s WITH GRANT OPTION is not supported while %s possesses %s",
requestedPrivilege.getHivePrivilege().name(),
grantee,
requestedPrivilege.getHivePrivilege().name()));
}
}
}
if (privilegesToGrant.isEmpty()) {
return null;
}
metastoreClient.grantPrivileges(buildPrivilegeBag(databaseName, tableName, grantee, privilegesToGrant));
}
return null;
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void revokeTablePrivileges(String databaseName, String tableName, String tableOwner, HivePrincipal grantee, Set privileges)
{
Set requestedPrivileges = privileges.stream()
.map(ThriftMetastoreUtil::toMetastoreApiPrivilegeGrantInfo)
.collect(toImmutableSet());
checkArgument(!containsAllPrivilege(requestedPrivileges), "\"ALL\" not supported in PrivilegeGrantInfo.privilege");
try {
retry()
.stopOnIllegalExceptions()
.run("revokeTablePrivileges", stats.getRevokeTablePrivileges().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient()) {
Set existingHivePrivileges = listTablePrivileges(databaseName, tableName, tableOwner, Optional.of(grantee)).stream()
.map(HivePrivilegeInfo::getHivePrivilege)
.collect(toImmutableSet());
Set privilegesToRevoke = requestedPrivileges.stream()
.filter(privilegeGrantInfo -> existingHivePrivileges.contains(getOnlyElement(parsePrivilege(privilegeGrantInfo, Optional.empty())).getHivePrivilege()))
.collect(toImmutableSet());
if (privilegesToRevoke.isEmpty()) {
return null;
}
metastoreClient.revokePrivileges(buildPrivilegeBag(databaseName, tableName, grantee, privilegesToRevoke));
}
return null;
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Set listTablePrivileges(String databaseName, String tableName, String tableOwner, Optional principal)
{
try {
return retry()
.stopOnIllegalExceptions()
.run("listTablePrivileges", stats.getListTablePrivileges().wrap(() -> {
try (ThriftMetastoreClient client = createMetastoreClient()) {
ImmutableSet.Builder privileges = ImmutableSet.builder();
List hiveObjectPrivilegeList;
if (principal.isEmpty()) {
HivePrincipal ownerPrincipal = new HivePrincipal(USER, tableOwner);
privileges.add(new HivePrivilegeInfo(OWNERSHIP, true, ownerPrincipal, ownerPrincipal));
hiveObjectPrivilegeList = client.listPrivileges(
null,
null,
new HiveObjectRef(TABLE, databaseName, tableName, null, null));
}
else {
if (principal.get().getType() == USER && tableOwner.equals(principal.get().getName())) {
privileges.add(new HivePrivilegeInfo(OWNERSHIP, true, principal.get(), principal.get()));
}
hiveObjectPrivilegeList = client.listPrivileges(
principal.get().getName(),
fromPrestoPrincipalType(principal.get().getType()),
new HiveObjectRef(TABLE, databaseName, tableName, null, null));
}
for (HiveObjectPrivilege hiveObjectPrivilege : hiveObjectPrivilegeList) {
HivePrincipal grantee = new HivePrincipal(fromMetastoreApiPrincipalType(hiveObjectPrivilege.getPrincipalType()), hiveObjectPrivilege.getPrincipalName());
privileges.addAll(parsePrivilege(hiveObjectPrivilege.getGrantInfo(), Optional.of(grantee)));
}
return privileges.build();
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public long openTransaction(HiveIdentity identity)
{
checkArgument(!identity.getUsername().map(String::isEmpty).orElse(true), "User should be provided to open transaction");
try {
return retry()
.stopOnIllegalExceptions()
.run("openTransaction", stats.getOpenTransaction().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
return metastoreClient.openTransaction(identity.getUsername().get());
}
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void commitTransaction(HiveIdentity identity, long transactionId)
{
try {
retry()
.stopOnIllegalExceptions()
.run("commitTransaction", stats.getCommitTransaction().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
metastoreClient.commitTransaction(transactionId);
}
return null;
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void sendTransactionHeartbeat(HiveIdentity identity, long transactionId)
{
try {
retry()
.stopOnIllegalExceptions()
.run("sendTransactionHeartbeat", (() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
metastoreClient.sendTransactionHeartbeat(transactionId);
}
return null;
}));
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public void acquireSharedReadLock(HiveIdentity identity, String queryId, long transactionId, List fullTables, List partitions)
{
checkArgument(!identity.getUsername().map(String::isEmpty).orElse(true), "User should be provided to acquire locks");
requireNonNull(queryId, "queryId is null");
if (fullTables.isEmpty() && partitions.isEmpty()) {
return;
}
LockRequestBuilder request = new LockRequestBuilder(queryId)
.setTransactionId(transactionId)
.setUser(identity.getUsername().get());
for (SchemaTableName table : fullTables) {
request.addLockComponent(createLockComponentForRead(table, Optional.empty()));
}
for (HivePartition partition : partitions) {
request.addLockComponent(createLockComponentForRead(partition.getTableName(), Optional.of(partition.getPartitionId())));
}
LockRequest lockRequest = request.build();
try {
LockResponse response = retry()
.stopOn(NoSuchTxnException.class, TxnAbortedException.class, MetaException.class)
.run("acquireLock", stats.getAcquireLock().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
return metastoreClient.acquireLock(lockRequest);
}
}));
long waitStart = nanoTime();
while (response.getState() == LockState.WAITING) {
long lockId = response.getLockid();
if (Duration.nanosSince(waitStart).compareTo(maxWaitForLock) > 0) {
// timed out
throw new PrestoException(HIVE_TABLE_LOCK_NOT_ACQUIRED, format("Timed out waiting for lock %d in hive transaction %s for query %s", lockId, transactionId, queryId));
}
log.debug("Waiting for lock %d in hive transaction %s for query %s", lockId, transactionId, queryId);
response = retry()
.stopOn(NoSuchTxnException.class, NoSuchLockException.class, TxnAbortedException.class, MetaException.class)
.run("checkLock", stats.getCheckLock().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
return metastoreClient.checkLock(lockId);
}
}));
}
if (response.getState() != LockState.ACQUIRED) {
throw new PrestoException(HIVE_TABLE_LOCK_NOT_ACQUIRED, "Could not acquire lock. Lock in state " + response.getState());
}
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
private static LockComponent createLockComponentForRead(SchemaTableName table, Optional partitionName)
{
requireNonNull(table, "table is null");
requireNonNull(partitionName, "partitionName is null");
LockComponentBuilder builder = new LockComponentBuilder();
builder.setShared();
builder.setOperationType(DataOperationType.SELECT);
builder.setDbName(table.getSchemaName());
builder.setTableName(table.getTableName());
requireNonNull(partitionName, "partitionName is null").ifPresent(builder::setPartitionName);
// acquire locks is called only for TransactionalTable
builder.setIsTransactional(true);
return builder.build();
}
@Override
public String getValidWriteIds(HiveIdentity identity, List tables, long currentTransactionId)
{
try {
return retry()
.stopOnIllegalExceptions()
.run("getValidWriteIds", stats.getValidWriteIds().wrap(() -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient(identity)) {
return metastoreClient.getValidWriteIds(
tables.stream()
.map(table -> format("%s.%s", table.getSchemaName(), table.getTableName()))
.collect(toImmutableList()),
currentTransactionId);
}
}));
}
catch (TException e) {
// When calling Hive metastore < 3, the call fails with
// Required field 'open_txns' is unset! Struct:GetOpenTxnsResponse(txn_high_water_mark:4, open_txns:null, min_open_txn:4, abortedBits:null)
throw new PrestoException(HIVE_METASTORE_ERROR, "Failed to open transaction. Transactional tables support requires Hive metastore version at least 3.0", e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public Optional getConfigValue(String name)
{
try {
return retry()
.stopOnIllegalExceptions()
.run("getConfigValueFromServer", () -> {
try (ThriftMetastoreClient metastoreClient = createMetastoreClient()) {
return Optional.ofNullable(metastoreClient.get_config_value(name, null));
}
});
}
catch (ConfigValSecurityException e) {
log.debug(e, "Could not fetch value for config '%s' from Hive", name);
return Optional.empty();
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
catch (Exception e) {
throw propagate(e);
}
}
@Override
public boolean isImpersonationEnabled()
{
return impersonationEnabled;
}
private PrivilegeBag buildPrivilegeBag(
String databaseName,
String tableName,
HivePrincipal grantee,
Set privilegeGrantInfos)
{
ImmutableList.Builder privilegeBagBuilder = ImmutableList.builder();
for (PrivilegeGrantInfo privilegeGrantInfo : privilegeGrantInfos) {
privilegeBagBuilder.add(
new HiveObjectPrivilege(
new HiveObjectRef(TABLE, databaseName, tableName, null, null),
grantee.getName(),
fromPrestoPrincipalType(grantee.getType()),
privilegeGrantInfo,
"SQL"));
}
return new PrivilegeBag(privilegeBagBuilder.build());
}
private boolean containsAllPrivilege(Set requestedPrivileges)
{
return requestedPrivileges.stream()
.anyMatch(privilege -> privilege.getPrivilege().equalsIgnoreCase("all"));
}
@SafeVarargs
private final T alternativeCall(
ClientSupplier clientSupplier,
Predicate isValidExceptionalResponse,
AtomicInteger chosenAlternative,
Call... alternatives)
throws TException
{
checkArgument(alternatives.length > 0, "No alternatives");
int chosen = chosenAlternative.get();
checkArgument(chosen == Integer.MAX_VALUE || (0 <= chosen && chosen < alternatives.length), "Bad chosen alternative value: %s", chosen);
if (chosen != Integer.MAX_VALUE) {
try (ThriftMetastoreClient client = clientSupplier.createMetastoreClient()) {
return alternatives[chosen].callOn(client);
}
}
Exception firstException = null;
for (int i = 0; i < alternatives.length; i++) {
int position = i;
try (ThriftMetastoreClient client = clientSupplier.createMetastoreClient()) {
T result = alternatives[i].callOn(client);
chosenAlternative.updateAndGet(currentChosen -> Math.min(currentChosen, position));
return result;
}
catch (TException | RuntimeException exception) {
if (isValidExceptionalResponse.test(exception)) {
// This is likely a valid response. We are not settling on an alternative yet.
// We will do it later when we get a more obviously valid response.
throw exception;
}
if (firstException == null) {
firstException = exception;
}
else if (firstException != exception) {
firstException.addSuppressed(exception);
}
}
}
verifyNotNull(firstException);
propagateIfPossible(firstException, TException.class);
throw propagate(firstException);
}
// TODO we should recognize exceptions which we suppress and try different alternative call
// this requires product tests with HDP 3
private static boolean defaultIsValidExceptionalResponse(Exception exception)
{
if (exception instanceof NoSuchObjectException) {
return true;
}
if (exception.toString().contains("AccessControlException")) {
// e.g. org.apache.hadoop.hive.metastore.api.MetaException: org.apache.hadoop.security.AccessControlException: Permission denied: ...
return true;
}
return false;
}
private static boolean isUnknownMethodExceptionalResponse(Exception exception)
{
if (!(exception instanceof TApplicationException)) {
return false;
}
TApplicationException applicationException = (TApplicationException) exception;
return applicationException.getType() == UNKNOWN_METHOD;
}
private ThriftMetastoreClient createMetastoreClient()
throws TException
{
return clientProvider.createMetastoreClient(Optional.empty());
}
private ThriftMetastoreClient createMetastoreClient(HiveIdentity identity)
throws TException
{
if (!impersonationEnabled) {
return createMetastoreClient();
}
String username = identity.getUsername().orElseThrow(() -> new IllegalStateException("End-user name should exist when metastore impersonation is enabled"));
if (authenticationEnabled) {
String delegationToken;
try {
delegationToken = delegationTokenCache.getUnchecked(username);
}
catch (UncheckedExecutionException e) {
throwIfInstanceOf(e.getCause(), PrestoException.class);
throw e;
}
return clientProvider.createMetastoreClient(Optional.of(delegationToken));
}
ThriftMetastoreClient client = createMetastoreClient();
setMetastoreUserOrClose(client, username);
return client;
}
private String loadDelegationToken(String username)
{
try (ThriftMetastoreClient client = createMetastoreClient()) {
return client.getDelegationToken(username);
}
catch (TException e) {
throw new PrestoException(HIVE_METASTORE_ERROR, e);
}
}
private static void setMetastoreUserOrClose(ThriftMetastoreClient client, String username)
throws TException
{
try {
client.setUGI(username);
}
catch (Throwable t) {
// close client and suppress any error from close
try (Closeable ignored = client) {
throw t;
}
catch (IOException e) {
// impossible; will be suppressed
}
}
}
private RetryDriver retry()
{
return RetryDriver.retry()
.exponentialBackoff(minBackoffDelay, maxBackoffDelay, maxRetryTime, backoffScaleFactor)
.maxAttempts(maxRetries + 1)
.stopOn(PrestoException.class);
}
private static RuntimeException propagate(Throwable throwable)
{
if (throwable instanceof InterruptedException) {
Thread.currentThread().interrupt();
}
throwIfUnchecked(throwable);
throw new RuntimeException(throwable);
}
@FunctionalInterface
private interface ClientSupplier
{
ThriftMetastoreClient createMetastoreClient()
throws TException;
}
@FunctionalInterface
private interface Call
{
T callOn(ThriftMetastoreClient client)
throws TException;
}
@FunctionalInterface
private interface Call1
{
void call(ThriftMetastoreClient client, A arg)
throws TException;
}
}