All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.trino.plugin.hive.metastore.glue.GlueHiveMetastore Maven / Gradle / Ivy

/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package io.trino.plugin.hive.metastore.glue;

import com.google.common.base.Strings;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import com.google.common.collect.Lists;
import com.google.inject.Inject;
import io.airlift.log.Logger;
import io.trino.filesystem.Location;
import io.trino.filesystem.TrinoFileSystem;
import io.trino.filesystem.TrinoFileSystemFactory;
import io.trino.metastore.Column;
import io.trino.metastore.Database;
import io.trino.metastore.HiveBasicStatistics;
import io.trino.metastore.HiveColumnStatistics;
import io.trino.metastore.HiveMetastore;
import io.trino.metastore.HivePrincipal;
import io.trino.metastore.HivePrivilegeInfo;
import io.trino.metastore.HiveType;
import io.trino.metastore.Partition;
import io.trino.metastore.PartitionStatistics;
import io.trino.metastore.PartitionWithStatistics;
import io.trino.metastore.PrincipalPrivileges;
import io.trino.metastore.StatisticsUpdateMode;
import io.trino.metastore.Table;
import io.trino.metastore.TableInfo;
import io.trino.plugin.hive.HivePartitionManager;
import io.trino.plugin.hive.PartitionNotFoundException;
import io.trino.plugin.hive.SchemaAlreadyExistsException;
import io.trino.plugin.hive.TableAlreadyExistsException;
import io.trino.spi.ErrorCode;
import io.trino.spi.TrinoException;
import io.trino.spi.connector.SchemaNotFoundException;
import io.trino.spi.connector.SchemaTableName;
import io.trino.spi.connector.TableNotFoundException;
import io.trino.spi.function.LanguageFunction;
import io.trino.spi.predicate.TupleDomain;
import io.trino.spi.security.ConnectorIdentity;
import io.trino.spi.security.RoleGrant;
import jakarta.annotation.Nullable;
import jakarta.annotation.PreDestroy;
import org.weakref.jmx.Flatten;
import org.weakref.jmx.Managed;
import software.amazon.awssdk.core.exception.SdkException;
import software.amazon.awssdk.services.glue.GlueClient;
import software.amazon.awssdk.services.glue.model.AccessDeniedException;
import software.amazon.awssdk.services.glue.model.AlreadyExistsException;
import software.amazon.awssdk.services.glue.model.BatchGetPartitionResponse;
import software.amazon.awssdk.services.glue.model.BatchUpdatePartitionRequestEntry;
import software.amazon.awssdk.services.glue.model.ColumnStatistics;
import software.amazon.awssdk.services.glue.model.CreateTableRequest;
import software.amazon.awssdk.services.glue.model.DatabaseInput;
import software.amazon.awssdk.services.glue.model.DeleteTableRequest;
import software.amazon.awssdk.services.glue.model.EntityNotFoundException;
import software.amazon.awssdk.services.glue.model.GetDatabaseResponse;
import software.amazon.awssdk.services.glue.model.GetDatabasesResponse;
import software.amazon.awssdk.services.glue.model.GetPartitionResponse;
import software.amazon.awssdk.services.glue.model.GetPartitionsResponse;
import software.amazon.awssdk.services.glue.model.GetTableResponse;
import software.amazon.awssdk.services.glue.model.GetTablesResponse;
import software.amazon.awssdk.services.glue.model.GetUserDefinedFunctionsResponse;
import software.amazon.awssdk.services.glue.model.PartitionInput;
import software.amazon.awssdk.services.glue.model.PartitionValueList;
import software.amazon.awssdk.services.glue.model.Segment;
import software.amazon.awssdk.services.glue.model.TableInput;
import software.amazon.awssdk.services.glue.model.UserDefinedFunctionInput;

import java.io.IOException;
import java.util.ArrayList;
import java.util.Collection;
import java.util.EnumSet;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Objects;
import java.util.Optional;
import java.util.OptionalLong;
import java.util.Set;
import java.util.concurrent.Callable;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.function.Consumer;
import java.util.function.Predicate;
import java.util.function.UnaryOperator;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
import java.util.stream.IntStream;
import java.util.stream.Stream;

import static com.google.common.base.Preconditions.checkArgument;
import static com.google.common.base.Throwables.throwIfUnchecked;
import static com.google.common.base.Verify.verify;
import static com.google.common.collect.ImmutableList.toImmutableList;
import static com.google.common.collect.ImmutableMap.toImmutableMap;
import static com.google.common.collect.ImmutableSet.toImmutableSet;
import static io.airlift.concurrent.Threads.daemonThreadsNamed;
import static io.opentelemetry.context.Context.taskWrapping;
import static io.trino.metastore.Table.TABLE_COMMENT;
import static io.trino.plugin.base.util.ExecutorUtil.processWithAdditionalThreads;
import static io.trino.plugin.hive.HiveErrorCode.HIVE_FILESYSTEM_ERROR;
import static io.trino.plugin.hive.HiveErrorCode.HIVE_METASTORE_ERROR;
import static io.trino.plugin.hive.HiveMetadata.TRINO_QUERY_ID_NAME;
import static io.trino.plugin.hive.TableType.MANAGED_TABLE;
import static io.trino.plugin.hive.metastore.MetastoreUtil.getHiveBasicStatistics;
import static io.trino.plugin.hive.metastore.MetastoreUtil.makePartitionName;
import static io.trino.plugin.hive.metastore.MetastoreUtil.metastoreFunctionName;
import static io.trino.plugin.hive.metastore.MetastoreUtil.toPartitionName;
import static io.trino.plugin.hive.metastore.MetastoreUtil.updateStatisticsParameters;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.fromGlueStatistics;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.toGlueColumnStatistics;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.toGlueDatabaseInput;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.toGlueFunctionInput;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.toGluePartitionInput;
import static io.trino.plugin.hive.metastore.glue.GlueConverter.toGlueTableInput;
import static io.trino.plugin.hive.util.HiveUtil.escapeSchemaName;
import static io.trino.plugin.hive.util.HiveUtil.isDeltaLakeTable;
import static io.trino.plugin.hive.util.HiveUtil.isHudiTable;
import static io.trino.plugin.hive.util.HiveUtil.isIcebergTable;
import static io.trino.spi.ErrorType.EXTERNAL;
import static io.trino.spi.StandardErrorCode.ALREADY_EXISTS;
import static io.trino.spi.StandardErrorCode.FUNCTION_NOT_FOUND;
import static io.trino.spi.StandardErrorCode.NOT_FOUND;
import static io.trino.spi.StandardErrorCode.NOT_SUPPORTED;
import static io.trino.spi.StandardErrorCode.TABLE_NOT_FOUND;
import static io.trino.spi.StandardErrorCode.UNSUPPORTED_TABLE_TYPE;
import static io.trino.spi.connector.SchemaTableName.schemaTableName;
import static io.trino.spi.security.PrincipalType.USER;
import static java.util.Map.entry;
import static java.util.Objects.requireNonNull;
import static java.util.concurrent.Executors.newFixedThreadPool;
import static java.util.function.Predicate.not;
import static java.util.function.UnaryOperator.identity;
import static java.util.stream.Collectors.toCollection;
import static java.util.stream.Collectors.toMap;

public class GlueHiveMetastore
        implements HiveMetastore
{
    private static final Logger log = Logger.get(GlueHiveMetastore.class);

    private static final String PUBLIC_ROLE_NAME = "public";
    private static final String DEFAULT_METASTORE_USER = "trino";

    // Read limit for AWS Glue API GetColumnStatisticsForPartition
    // https://docs.aws.amazon.com/glue/latest/dg/aws-glue-api-catalog-partitions.html#aws-glue-api-catalog-partitions-GetColumnStatisticsForPartition
    private static final int GLUE_COLUMN_READ_STAT_PAGE_SIZE = 100;

    // Write limit for AWS Glue API UpdateColumnStatisticsForPartition
    // https://docs.aws.amazon.com/glue/latest/dg/aws-glue-api-catalog-partitions.html#aws-glue-api-catalog-partitions-UpdateColumnStatisticsForPartition
    private static final int GLUE_COLUMN_WRITE_STAT_PAGE_SIZE = 25;

    private static final int BATCH_GET_PARTITION_MAX_PAGE_SIZE = 1000;
    private static final int AWS_GLUE_GET_PARTITIONS_MAX_RESULTS = 1000;
    private static final int BATCH_UPDATE_PARTITION_MAX_PAGE_SIZE = 100;
    private static final int AWS_GLUE_GET_FUNCTIONS_MAX_RESULTS = 100;

    private static final AtomicInteger poolCounter = new AtomicInteger();

    private final GlueClient glueClient;
    private final GlueContext glueContext;
    private final GlueCache glueCache;
    private final TrinoFileSystem fileSystem;
    private final Optional defaultDir;
    private final int partitionSegments;
    private final boolean assumeCanonicalPartitionKeys;
    private final GlueMetastoreStats stats = new GlueMetastoreStats();
    private final Predicate tableVisibilityFilter;
    private final ExecutorService executor;

    @Inject
    public GlueHiveMetastore(
            GlueClient glueClient,
            GlueContext glueContext,
            GlueCache glueCache,
            TrinoFileSystemFactory fileSystemFactory,
            GlueHiveMetastoreConfig config,
            Set visibleTableKinds)
    {
        this(
                glueClient,
                glueContext,
                glueCache,
                fileSystemFactory.create(ConnectorIdentity.ofUser(DEFAULT_METASTORE_USER)),
                config.getDefaultWarehouseDir(),
                config.getPartitionSegments(),
                config.isAssumeCanonicalPartitionKeys(),
                visibleTableKinds,
                newFixedThreadPool(config.getThreads(), daemonThreadsNamed("glue-%s-%%s".formatted(poolCounter.getAndIncrement()))));
    }

    private GlueHiveMetastore(
            GlueClient glueClient,
            GlueContext glueContext,
            GlueCache glueCache, TrinoFileSystem fileSystem,
            Optional defaultDir,
            int partitionSegments,
            boolean assumeCanonicalPartitionKeys,
            Set visibleTableKinds,
            ExecutorService executor)
    {
        this.glueClient = requireNonNull(glueClient, "glueClient is null");
        this.glueContext = requireNonNull(glueContext, "glueContext is null");
        this.glueCache = glueCache;
        this.fileSystem = requireNonNull(fileSystem, "fileSystem is null");
        this.defaultDir = requireNonNull(defaultDir, "defaultDir is null");
        this.partitionSegments = partitionSegments;
        this.assumeCanonicalPartitionKeys = assumeCanonicalPartitionKeys;
        this.tableVisibilityFilter = createTablePredicate(visibleTableKinds);
        this.executor = taskWrapping(requireNonNull(executor, "executor is null"));
    }

    @PreDestroy
    public void shutdown()
    {
        executor.shutdownNow();
    }

    @Managed
    @Flatten
    public GlueMetastoreStats getStats()
    {
        return stats;
    }

    @Managed
    @Flatten
    public GlueCache getGlueCache()
    {
        return glueCache;
    }

    @Override
    public List getAllDatabases()
    {
        return glueCache.getDatabaseNames(this::getDatabasesInternal);
    }

    private List getDatabasesInternal(Consumer cacheDatabase)
    {
        try {
            return stats.getGetDatabases().call(() -> glueClient.getDatabasesPaginator(glueContext::configureClient).stream()
                    .map(GetDatabasesResponse::databaseList)
                    .flatMap(List::stream)
                    .map(GlueConverter::fromGlueDatabase)
                    .peek(cacheDatabase)
                    .map(Database::getDatabaseName)
                    .toList());
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
    }

    @Override
    public Optional getDatabase(String databaseName)
    {
        return glueCache.getDatabase(databaseName, () -> getDatabaseInternal(databaseName));
    }

    private Optional getDatabaseInternal(String databaseName)
    {
        try {
            GetDatabaseResponse response = stats.getGetDatabase().call(() -> glueClient.getDatabase(builder -> builder
                    .applyMutation(glueContext::configureClient)
                    .name(databaseName)));
            return Optional.of(GlueConverter.fromGlueDatabase(response.database()));
        }
        catch (EntityNotFoundException e) {
            return Optional.empty();
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
    }

    @Override
    public void createDatabase(Database database)
    {
        if (database.getLocation().isEmpty() && defaultDir.isPresent()) {
            Location location = Location.of(defaultDir.get())
                    .appendPath(escapeSchemaName(database.getDatabaseName()));
            database = Database.builder(database)
                    .setLocation(Optional.of(location.toString()))
                    .build();
        }

        try {
            DatabaseInput databaseInput = toGlueDatabaseInput(database);
            stats.getCreateDatabase().call(() -> glueClient.createDatabase(builder -> builder
                    .applyMutation(glueContext::configureClient)
                    .databaseInput(databaseInput)));
        }
        catch (AlreadyExistsException e) {
            // Do not throw SchemaAlreadyExistsException if this query has already created the database.
            // This may happen when an actually successful metastore create call is retried
            // because of a timeout on our side.
            String expectedQueryId = database.getParameters().get(TRINO_QUERY_ID_NAME);
            if (expectedQueryId != null) {
                String existingQueryId = getDatabase(database.getDatabaseName())
                        .map(Database::getParameters)
                        .map(parameters -> parameters.get(TRINO_QUERY_ID_NAME))
                        .orElse(null);
                if (expectedQueryId.equals(existingQueryId)) {
                    return;
                }
            }
            throw new SchemaAlreadyExistsException(database.getDatabaseName(), e);
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
        finally {
            glueCache.invalidateDatabase(database.getDatabaseName());
            glueCache.invalidateDatabaseNames();
        }

        if (database.getLocation().isPresent()) {
            Location location = Location.of(database.getLocation().get());
            try {
                fileSystem.createDirectory(location);
            }
            catch (IOException e) {
                throw new TrinoException(HIVE_FILESYSTEM_ERROR, "Failed to create directory: " + location, e);
            }
        }
    }

    @Override
    public void dropDatabase(String databaseName, boolean deleteData)
    {
        Optional location = Optional.empty();
        if (deleteData) {
            location = getDatabase(databaseName)
                    .orElseThrow(() -> new SchemaNotFoundException(databaseName))
                    .getLocation()
                    .map(Location::of);
        }

        try {
            stats.getDeleteDatabase().call(() -> glueClient.deleteDatabase(builder -> builder
                    .applyMutation(glueContext::configureClient)
                    .name(databaseName)));
        }
        catch (EntityNotFoundException e) {
            throw new SchemaNotFoundException(databaseName, e);
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
        finally {
            glueCache.invalidateDatabase(databaseName);
            glueCache.invalidateDatabaseNames();
        }

        location.ifPresent(this::deleteDir);
    }

    @Override
    public void renameDatabase(String databaseName, String newDatabaseName)
    {
        try {
            var database = stats.getGetDatabase().call(() -> glueClient.getDatabase(builder -> builder
                    .applyMutation(glueContext::configureClient)
                    .name(databaseName)).database());
            DatabaseInput renamedDatabase = DatabaseInput.builder()
                    .name(newDatabaseName)
                    .parameters(database.parameters())
                    .description(database.description())
                    .locationUri(database.locationUri())
                    .build();
            stats.getUpdateDatabase().call(() -> glueClient.updateDatabase(builder -> builder
                    .applyMutation(glueContext::configureClient)
                    .name(databaseName).databaseInput(renamedDatabase)));
        }
        catch (EntityNotFoundException e) {
            throw new SchemaNotFoundException(databaseName, e);
        }
        catch (AlreadyExistsException e) {
            throw new SchemaAlreadyExistsException(newDatabaseName, e);
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
        finally {
            glueCache.invalidateDatabase(databaseName);
            glueCache.invalidateDatabase(newDatabaseName);
            glueCache.invalidateDatabaseNames();
        }
    }

    @Override
    public void setDatabaseOwner(String databaseName, HivePrincipal principal)
    {
        throw new TrinoException(NOT_SUPPORTED, "setting the database owner is not supported by Glue");
    }

    @Override
    public List getTables(String databaseName)
    {
        return glueCache.getTables(databaseName, cacheTable -> getTablesInternal(cacheTable, databaseName));
    }

    private List getTablesInternal(Consumer cacheTable, String databaseName)
    {
        try {
            ImmutableList glueTables = stats.getGetTables()
                    .call(() -> glueClient.getTablesPaginator(builder -> builder
                                    .applyMutation(glueContext::configureClient)
                                    .databaseName(databaseName)).stream()
                            .map(GetTablesResponse::tableList)
                            .flatMap(List::stream))
                    .filter(tableVisibilityFilter)
                    .collect(toImmutableList());

            // Store only valid tables in cache
            for (software.amazon.awssdk.services.glue.model.Table table : glueTables) {
                convertFromGlueIgnoringErrors(table, databaseName)
                        .ifPresent(cacheTable);
            }

            return glueTables.stream()
                    .map(table -> new TableInfo(
                            new SchemaTableName(databaseName, table.name()),
                            TableInfo.ExtendedRelationType.fromTableTypeAndComment(table.tableType(), table.parameters().get(TABLE_COMMENT))))
                    .toList();
        }
        catch (EntityNotFoundException _) {
            // Database might have been deleted concurrently.
            return ImmutableList.of();
        }
        catch (SdkException e) {
            throw new TrinoException(HIVE_METASTORE_ERROR, e);
        }
    }

    private static Optional
convertFromGlueIgnoringErrors(software.amazon.awssdk.services.glue.model.Table glueTable, String databaseName) { try { return Optional.of(GlueConverter.fromGlueTable(glueTable, databaseName)); } catch (RuntimeException e) { handleListingError(e, schemaTableName(glueTable.databaseName(), glueTable.name())); return Optional.empty(); } } private static void handleListingError(RuntimeException e, SchemaTableName tableName) { boolean silent = false; if (e instanceof TrinoException trinoException) { ErrorCode errorCode = trinoException.getErrorCode(); silent = errorCode.equals(UNSUPPORTED_TABLE_TYPE.toErrorCode()) || // e.g. table deleted concurrently errorCode.equals(TABLE_NOT_FOUND.toErrorCode()) || errorCode.equals(NOT_FOUND.toErrorCode()) || // e.g. Iceberg/Delta table being deleted concurrently resulting in failure to load metadata from filesystem errorCode.getType() == EXTERNAL; } if (silent) { log.debug(e, "Failed to get metadata for table: %s", tableName); } else { log.warn(e, "Failed to get metadata for table: %s", tableName); } } @Override public Optional
getTable(String databaseName, String tableName) { return glueCache.getTable(databaseName, tableName, () -> getTableInternal(databaseName, tableName)); } private Optional
getTableInternal(String databaseName, String tableName) { try { GetTableResponse result = stats.getGetTable().call(() -> glueClient.getTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .name(tableName))); return Optional.of(GlueConverter.fromGlueTable(result.table(), databaseName)); } catch (EntityNotFoundException e) { return Optional.empty(); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } } @Override public void createTable(Table table, PrincipalPrivileges principalPrivileges) { try { TableInput input = toGlueTableInput(table); stats.getCreateTable().call(() -> glueClient.createTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(table.getDatabaseName()) .tableInput(input))); } catch (AlreadyExistsException e) { // Do not throw TableAlreadyExistsException if this query has already created the table. // This may happen when an actually successful metastore create call is retried // because of a timeout on our side. String expectedQueryId = table.getParameters().get(TRINO_QUERY_ID_NAME); if (expectedQueryId != null) { String existingQueryId = getTable(table.getDatabaseName(), table.getTableName()) .map(Table::getParameters) .map(parameters -> parameters.get(TRINO_QUERY_ID_NAME)) .orElse(null); if (expectedQueryId.equals(existingQueryId)) { return; } } throw new TableAlreadyExistsException(new SchemaTableName(table.getDatabaseName(), table.getTableName()), e); } catch (EntityNotFoundException e) { throw new SchemaNotFoundException(table.getDatabaseName(), e); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateTable(table.getDatabaseName(), table.getTableName(), true); glueCache.invalidateTables(table.getDatabaseName()); } } @Override public void dropTable(String databaseName, String tableName, boolean deleteData) { Optional deleteLocation = Optional.empty(); if (deleteData) { Table table = getTable(databaseName, tableName) .orElseThrow(() -> new TableNotFoundException(new SchemaTableName(databaseName, tableName))); if (table.getTableType().equals(MANAGED_TABLE.name())) { deleteLocation = table.getStorage() .getOptionalLocation() .filter(not(String::isEmpty)) .map(Location::of); } } DeleteTableRequest deleteTableRequest = DeleteTableRequest.builder() .applyMutation(glueContext::configureClient) .databaseName(databaseName) .name(tableName) .build(); try { stats.getDeleteTable().call(() -> glueClient.deleteTable(deleteTableRequest)); } catch (EntityNotFoundException e) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateTable(databaseName, tableName, true); glueCache.invalidateTables(databaseName); } deleteLocation.ifPresent(this::deleteDir); } private void deleteDir(Location path) { try { fileSystem.deleteDirectory(path); } catch (Exception e) { // don't fail if unable to delete path log.warn(e, "Failed to delete path: %s", path); } } @Override public void replaceTable(String databaseName, String tableName, Table newTable, PrincipalPrivileges principalPrivileges) { if (!tableName.equals(newTable.getTableName()) || !databaseName.equals(newTable.getDatabaseName())) { throw new TrinoException(NOT_SUPPORTED, "Table rename is not yet supported by Glue service"); } updateTable(databaseName, tableName, _ -> newTable); } private void updateTable(String databaseName, String tableName, UnaryOperator
modifier) { Table existingTable = getTable(databaseName, tableName) .orElseThrow(() -> new TableNotFoundException(new SchemaTableName(databaseName, tableName))); Table newTable = modifier.apply(existingTable); if (!existingTable.getDatabaseName().equals(newTable.getDatabaseName()) || !existingTable.getTableName().equals(newTable.getTableName())) { throw new TrinoException(NOT_SUPPORTED, "Update cannot be used to change rename a table"); } if (existingTable.getParameters().getOrDefault("table_type", "").equalsIgnoreCase("iceberg") && !Objects.equals( existingTable.getParameters().get("metadata_location"), newTable.getParameters().get("previous_metadata_location"))) { throw new TrinoException(NOT_SUPPORTED, "Cannot update Iceberg table: supplied previous location does not match current location"); } try { stats.getUpdateTable().call(() -> glueClient.updateTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableInput(toGlueTableInput(newTable)))); } catch (EntityNotFoundException e) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateTable(databaseName, tableName, false); } } @Override public void renameTable(String databaseName, String tableName, String newDatabaseName, String newTableName) { // read the existing table software.amazon.awssdk.services.glue.model.Table table; try { table = stats.getGetTable().call(() -> glueClient.getTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .name(tableName)) .table()); } catch (EntityNotFoundException e) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } // create a new table with the same data as the old table try { CreateTableRequest createTableRequest = CreateTableRequest.builder() .applyMutation(glueContext::configureClient) .databaseName(newDatabaseName) .tableInput(asTableInputBuilder(table) .name(newTableName) .build()) .build(); stats.getCreateTable().call(() -> glueClient.createTable(createTableRequest)); } catch (AlreadyExistsException e) { throw new TableAlreadyExistsException(new SchemaTableName(databaseName, tableName)); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } // drop the old table try { dropTable(databaseName, tableName, false); } catch (RuntimeException e) { // if the drop failed, try to clean up the new table try { dropTable(databaseName, tableName, false); } catch (RuntimeException cleanupException) { if (!cleanupException.equals(e)) { e.addSuppressed(cleanupException); } } throw e; } finally { glueCache.invalidateTable(databaseName, tableName, true); glueCache.invalidateTable(newDatabaseName, newTableName, true); glueCache.invalidateTables(databaseName); if (!databaseName.equals(newDatabaseName)) { glueCache.invalidateTables(newDatabaseName); } } } public static TableInput.Builder asTableInputBuilder(software.amazon.awssdk.services.glue.model.Table table) { return TableInput.builder() .name(table.name()) .description(table.description()) .owner(table.owner()) .lastAccessTime(table.lastAccessTime()) .lastAnalyzedTime(table.lastAnalyzedTime()) .retention(table.retention()) .storageDescriptor(table.storageDescriptor()) .partitionKeys(table.partitionKeys()) .viewOriginalText(table.viewOriginalText()) .viewExpandedText(table.viewExpandedText()) .tableType(table.tableType()) .targetTable(table.targetTable()) .parameters(table.parameters()); } @Override public void commentTable(String databaseName, String tableName, Optional comment) { updateTable(databaseName, tableName, table -> table.withComment(comment)); } @Override public void setTableOwner(String databaseName, String tableName, HivePrincipal principal) { updateTable(databaseName, tableName, table -> table.withOwner(principal)); } @Override public Map getTableColumnStatistics(String databaseName, String tableName, Set columnNames) { return glueCache.getTableColumnStatistics( databaseName, tableName, columnNames, missingColumnNames -> getTableColumnStatisticsInternal(databaseName, tableName, missingColumnNames)); } private Map getTableColumnStatisticsInternal(String databaseName, String tableName, Set columnNames) { var columnStatsTasks = Lists.partition(ImmutableList.copyOf(columnNames), GLUE_COLUMN_READ_STAT_PAGE_SIZE).stream() .map(partialColumns -> (Callable>) () -> stats.getGetColumnStatisticsForTable().call(() -> glueClient.getColumnStatisticsForTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .columnNames(partialColumns)) .columnStatisticsList())) .collect(toImmutableList()); try { return fromGlueStatistics(runParallel(columnStatsTasks)); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed fetching column statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } } @Override public void updateTableStatistics(String databaseName, String tableName, OptionalLong acidWriteId, StatisticsUpdateMode mode, PartitionStatistics statisticsUpdate) { verify(acidWriteId.isEmpty(), "Glue metastore does not support Hive Acid tables"); // adding zero rows does not change stats if (mode == StatisticsUpdateMode.MERGE_INCREMENTAL && statisticsUpdate.basicStatistics().getRowCount().equals(OptionalLong.of(0))) { return; } // existing column statistics are required, for the columns being updated when in merge incremental mode // this is fetched before the basic statistics are updated, to avoid reloading in the case of retries updating basic statistics Map existingColumnStatistics; if (mode == StatisticsUpdateMode.MERGE_INCREMENTAL) { existingColumnStatistics = getTableColumnStatistics(databaseName, tableName, statisticsUpdate.columnStatistics().keySet()); } else { existingColumnStatistics = ImmutableMap.of(); } // first update the basic statistics on the table, which requires a read-modify-write cycle BasicTableStatisticsResult result; try { result = updateBasicTableStatistics(databaseName, tableName, mode, statisticsUpdate, existingColumnStatistics); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateTable(databaseName, tableName, true); } List> tasks = new ArrayList<>(); Lists.partition(toGlueColumnStatistics(result.updateColumnStatistics()), GLUE_COLUMN_WRITE_STAT_PAGE_SIZE).stream() .map(chunk -> (Callable) () -> { stats.getUpdateColumnStatisticsForTable().call(() -> glueClient.updateColumnStatisticsForTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .columnStatisticsList(chunk))); return null; }) .forEach(tasks::add); result.removeColumnStatistics().stream() .map(columnName -> (Callable) () -> { stats.getDeleteColumnStatisticsForTable().call(() -> glueClient.deleteColumnStatisticsForTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .columnName(columnName))); return null; }) .forEach(tasks::add); try { runParallel(tasks); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed updating column statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } finally { glueCache.invalidateTableColumnStatistics(databaseName, tableName); } } private BasicTableStatisticsResult updateBasicTableStatistics( String databaseName, String tableName, StatisticsUpdateMode mode, PartitionStatistics statisticsUpdate, Map existingColumnStatistics) { Table table = getTable(databaseName, tableName) .orElseThrow(() -> new TableNotFoundException(new SchemaTableName(databaseName, tableName))); PartitionStatistics existingTableStats = new PartitionStatistics(getHiveBasicStatistics(table.getParameters()), existingColumnStatistics); PartitionStatistics updatedStatistics = mode.updatePartitionStatistics(existingTableStats, statisticsUpdate); stats.getUpdateTable().call(() -> glueClient.updateTable(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableInput(toGlueTableInput(table.withParameters(updateStatisticsParameters(table.getParameters(), updatedStatistics.basicStatistics())))))); Map columns = Stream.concat(table.getDataColumns().stream(), table.getPartitionColumns().stream()) .collect(toImmutableMap(Column::getName, identity())); Map updateColumnStatistics = columns.values().stream() .filter(column -> updatedStatistics.columnStatistics().containsKey(column.getName())) .collect(toImmutableMap(identity(), column -> updatedStatistics.columnStatistics().get(column.getName()))); Set removeColumnStatistics = switch (mode) { case OVERWRITE_SOME_COLUMNS -> ImmutableSet.of(); case OVERWRITE_ALL, MERGE_INCREMENTAL -> columns.entrySet().stream() // all columns not being updated are removed .filter(entry -> !updateColumnStatistics.containsKey(entry.getValue())) .map(Entry::getKey) .collect(Collectors.toSet()); case UNDO_MERGE_INCREMENTAL, CLEAR_ALL -> columns.keySet(); }; return new BasicTableStatisticsResult(updateColumnStatistics, removeColumnStatistics); } private record BasicTableStatisticsResult(Map updateColumnStatistics, Set removeColumnStatistics) {} @Override public void addColumn(String databaseName, String tableName, String columnName, HiveType columnType, String columnComment) { Column newColumn = new Column(columnName, columnType, Optional.ofNullable(columnComment), ImmutableMap.of()); updateTable(databaseName, tableName, table -> table.withAddColumn(newColumn)); } @Override public void renameColumn(String databaseName, String tableName, String oldColumnName, String newColumnName) { updateTable(databaseName, tableName, table -> table.withRenameColumn(oldColumnName, newColumnName)); } @Override public void dropColumn(String databaseName, String tableName, String columnName) throws EntityNotFoundException { updateTable(databaseName, tableName, table -> table.withDropColumn(columnName)); } @Override public void commentColumn(String databaseName, String tableName, String columnName, Optional comment) throws EntityNotFoundException { updateTable(databaseName, tableName, table -> table.withColumnComment(columnName, comment)); } @Override public Optional> getPartitionNamesByFilter(String databaseName, String tableName, List columnNames, TupleDomain partitionKeysFilter) { if (partitionKeysFilter.isNone()) { return Optional.of(ImmutableList.of()); } String glueFilterExpression = GlueExpressionUtil.buildGlueExpression(columnNames, partitionKeysFilter, assumeCanonicalPartitionKeys); Set partitionNames = glueCache.getPartitionNames( databaseName, tableName, glueFilterExpression, cachePartition -> getPartitionNames(cachePartition, databaseName, tableName, glueFilterExpression)); return Optional.of(partitionNames.stream() .map(PartitionName::partitionValues) .map(partitionValues -> toPartitionName(columnNames, partitionValues)) .collect(toImmutableList())); } private Set getPartitionNames(Consumer cachePartition, String databaseName, String tableName, String glueExpression) throws EntityNotFoundException { if (partitionSegments == 1) { return getPartitionNames(cachePartition, databaseName, tableName, glueExpression, null); } try { return runParallel(IntStream.range(0, partitionSegments) .mapToObj(segmentNumber -> (Callable>) () -> getPartitionNames( cachePartition, databaseName, tableName, glueExpression, Segment.builder() .segmentNumber(segmentNumber) .totalSegments(partitionSegments) .build())) .toList()) .stream() .flatMap(Collection::stream) .collect(toImmutableSet()); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } throw new TrinoException(HIVE_METASTORE_ERROR, e.getCause()); } } private Set getPartitionNames(Consumer cachePartition, String databaseName, String tableName, String expression, @Nullable Segment segment) throws EntityNotFoundException { try { return stats.getGetPartitionNames().call(() -> glueClient.getPartitionsPaginator(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .expression(expression) .segment(segment) .maxResults(AWS_GLUE_GET_PARTITIONS_MAX_RESULTS)).stream() .map(GetPartitionsResponse::partitions) .flatMap(List::stream) .map(partition -> GlueConverter.fromGluePartition(databaseName, tableName, partition)) .peek(cachePartition) .map(Partition::getValues) .map(PartitionName::new) .collect(toImmutableSet())); } catch (EntityNotFoundException e) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } } @Override public Optional getPartition(Table table, List partitionValues) { String databaseName = table.getDatabaseName(); String tableName = table.getTableName(); PartitionName partitionName = new PartitionName(partitionValues); return glueCache.getPartition(databaseName, tableName, partitionName, () -> getPartition(databaseName, tableName, partitionName)); } private Optional getPartition(String databaseName, String tableName, PartitionName partitionName) { try { GetPartitionResponse result = stats.getGetPartition().call(() -> glueClient.getPartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .partitionValues(partitionName.partitionValues()))); return Optional.of(GlueConverter.fromGluePartition(databaseName, tableName, result.partition())); } catch (EntityNotFoundException e) { return Optional.empty(); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } } @Override public Map> getPartitionsByNames(Table table, List partitionNames) { List names = partitionNames.stream() .map(HivePartitionManager::extractPartitionValues) .map(PartitionName::new) .collect(toImmutableList()); return getPartitionsByNames(table.getDatabaseName(), table.getTableName(), names).entrySet().stream() .collect(toImmutableMap(entry -> makePartitionName(table.getPartitionColumns(), entry.getKey().partitionValues()), Entry::getValue)); } private Map> getPartitionsByNames(String databaseName, String tableName, Collection partitionNames) { Collection partitions = glueCache.batchGetPartitions( databaseName, tableName, partitionNames, (cachePartition, missingPartitions) -> batchGetPartition(databaseName, tableName, missingPartitions, cachePartition)); Map partitionValuesToPartitionMap = partitions.stream() .collect(toMap(partition -> new PartitionName(partition.getValues()), identity())); ImmutableMap.Builder> resultBuilder = ImmutableMap.builder(); for (PartitionName partitionName : partitionNames) { Partition partition = partitionValuesToPartitionMap.get(partitionName); resultBuilder.put(partitionName, Optional.ofNullable(partition)); } return resultBuilder.buildOrThrow(); } private Collection batchGetPartition(String databaseName, String tableName, Collection partitionNames, Consumer cachePartition) throws EntityNotFoundException { try { List pendingPartitions = partitionNames.stream() .map(partitionName -> PartitionValueList.builder().values(partitionName.partitionValues()).build()) .collect(toCollection(ArrayList::new)); ImmutableList.Builder resultsBuilder = ImmutableList.builderWithExpectedSize(partitionNames.size()); while (!pendingPartitions.isEmpty()) { List responses = runParallel(Lists.partition(pendingPartitions, BATCH_GET_PARTITION_MAX_PAGE_SIZE).stream() .map(partitions -> (Callable) () -> stats.getGetPartitions().call(() -> glueClient.batchGetPartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .partitionsToGet(partitions)))) .toList()); pendingPartitions.clear(); for (var response : responses) { // In the unlikely scenario where batchGetPartition call cannot make progress on retrieving partitions, avoid infinite loop. // We fail only in case there are still unprocessedKeys. Case with empty partitions and empty unprocessedKeys is correct in case partitions from request are not found. if (response.partitions().isEmpty() && !response.unprocessedKeys().isEmpty()) { throw new TrinoException(HIVE_METASTORE_ERROR, "Cannot make progress retrieving partitions. Unable to retrieve partitions: " + response.unprocessedKeys()); } response.partitions().stream() .map(partition -> GlueConverter.fromGluePartition(databaseName, tableName, partition)) .peek(cachePartition) .forEach(resultsBuilder::add); pendingPartitions.addAll(response.unprocessedKeys()); } } return resultsBuilder.build(); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed fetching partitions for %s.%s".formatted(databaseName, tableName), e.getCause()); } } @Override public void addPartitions(String databaseName, String tableName, List partitionsWithStatistics) { if (partitionsWithStatistics.isEmpty()) { return; } partitionsWithStatistics.stream() .map(PartitionWithStatistics::getPartition) .collect(toImmutableList()) .forEach(partition -> { if (!partition.getDatabaseName().equals(databaseName) || !partition.getTableName().equals(tableName)) { throw new TrinoException(NOT_SUPPORTED, "All partitions must belong to the same table"); } }); List updatedPartitions = partitionsWithStatistics.stream() .map(partitionWithStatistics -> { Partition partition = partitionWithStatistics.getPartition(); HiveBasicStatistics basicStatistics = partitionWithStatistics.getStatistics().basicStatistics(); return partition.withParameters(updateStatisticsParameters(partition.getParameters(), basicStatistics)); }) .toList(); var createPartitionTasks = Lists.partition(updatedPartitions, BATCH_UPDATE_PARTITION_MAX_PAGE_SIZE).stream() .map(partitionBatch -> (Callable) () -> { stats.getCreatePartitions().call(() -> glueClient.batchCreatePartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .partitionInputList(partitionBatch.stream() .map(GlueConverter::toGluePartitionInput) .collect(toImmutableList())))); return null; }) .toList(); try { runParallel(createPartitionTasks); } catch (ExecutionException e) { if (e.getCause() instanceof AlreadyExistsException) { throw new TrinoException(ALREADY_EXISTS, "Partition already exists in table %s.%s: %s".formatted(databaseName, tableName, e.getCause().getMessage())); } if (e.getCause() instanceof EntityNotFoundException) { throw new TableNotFoundException(new SchemaTableName(databaseName, tableName)); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed creating partitions for %s.%s: %s".formatted(databaseName, tableName, e.getCause().getMessage())); } // statistics are created after partitions because it is not clear if ordering matters in Glue var createStatisticsTasks = partitionsWithStatistics.stream() .map(partitionWithStatistics -> createUpdatePartitionStatisticsTasks( StatisticsUpdateMode.OVERWRITE_ALL, partitionWithStatistics.getPartition(), partitionWithStatistics.getStatistics().columnStatistics())) .flatMap(Collection::stream) .collect(toImmutableList()); try { runParallel(createStatisticsTasks); } catch (ExecutionException e) { throw new TrinoException(HIVE_METASTORE_ERROR, "Failed creating partition column statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } } @Override public void dropPartition(String databaseName, String tableName, List partitionValues, boolean deleteData) { PartitionName partitionName = new PartitionName(partitionValues); Optional location = Optional.empty(); if (deleteData) { Partition partition = getPartition(databaseName, tableName, partitionName) .orElseThrow(() -> new PartitionNotFoundException(new SchemaTableName(databaseName, tableName), partitionValues)); location = Optional.of(Strings.nullToEmpty(partition.getStorage().getLocation())) .map(Location::of); } try { stats.getDeletePartition().call(() -> glueClient.deletePartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .partitionValues(partitionValues))); } catch (EntityNotFoundException e) { throw new PartitionNotFoundException(new SchemaTableName(databaseName, tableName), partitionValues); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidatePartition(databaseName, tableName, partitionName); } location.ifPresent(this::deleteDir); } @Override public void alterPartition(String databaseName, String tableName, PartitionWithStatistics partitionWithStatistics) { if (!partitionWithStatistics.getPartition().getDatabaseName().equals(databaseName) || !partitionWithStatistics.getPartition().getTableName().equals(tableName)) { throw new TrinoException(HIVE_METASTORE_ERROR, "Partition names must match table name"); } alterPartition(partitionWithStatistics); } private void alterPartition(PartitionWithStatistics partitionWithStatistics) { Partition partition = partitionWithStatistics.getPartition(); try { HiveBasicStatistics basicStatistics = partitionWithStatistics.getStatistics().basicStatistics(); PartitionInput newPartition = toGluePartitionInput(partition.withParameters(updateStatisticsParameters(partition.getParameters(), basicStatistics))); stats.getUpdatePartition().call(() -> glueClient.updatePartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(partition.getDatabaseName()) .tableName(partition.getTableName()) .partitionInput(newPartition) .partitionValueList(partition.getValues()))); } catch (EntityNotFoundException e) { throw new PartitionNotFoundException(partition.getSchemaTableName(), partition.getValues()); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidatePartition(partition.getDatabaseName(), partition.getTableName(), new PartitionName(partition.getValues())); } try { runParallel(createUpdatePartitionStatisticsTasks(StatisticsUpdateMode.OVERWRITE_ALL, partition, partitionWithStatistics.getStatistics().columnStatistics())); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { throw new PartitionNotFoundException(new SchemaTableName(partition.getDatabaseName(), partition.getTableName()), partition.getValues()); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed updating partition column statistics for %s %s".formatted(partition.getSchemaTableName(), partition.getValues()), e.getCause()); } finally { // this redundant, but be safe in case stats were cached before the update glueCache.invalidatePartition(partition.getDatabaseName(), partition.getTableName(), new PartitionName(partition.getValues())); } } @Override public Map> getPartitionColumnStatistics( String databaseName, String tableName, Set partitionNames, Set columnNames) { checkArgument(!columnNames.isEmpty(), "columnNames is empty"); Map partitionsNameMap = partitionNames.stream() .collect(toImmutableMap(partitionName -> new PartitionName(HivePartitionManager.extractPartitionValues(partitionName)), identity())); return getPartitionColumnStatistics(databaseName, tableName, partitionsNameMap.keySet(), columnNames).entrySet().stream() .collect(toImmutableMap(entry -> partitionsNameMap.get(entry.getKey()), Entry::getValue)); } private Map> getPartitionColumnStatistics(String databaseName, String tableName, Collection partitionNames, Set columnNames) throws EntityNotFoundException { Map> columnStats; try { columnStats = runParallel(partitionNames.stream() .map(partitionName -> (Callable>>) () -> entry( partitionName, glueCache.getPartitionColumnStatistics( databaseName, tableName, partitionName, columnNames, missingColumnNames -> getPartitionColumnStatisticsInternal(databaseName, tableName, partitionName, missingColumnNames)))) .collect(toImmutableList())) .stream() .collect(toImmutableMap(Entry::getKey, Entry::getValue)); } catch (ExecutionException e) { throwIfUnchecked(e.getCause()); throw new TrinoException(HIVE_METASTORE_ERROR, "Failed fetching partition statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } // use empty statistics for missing partitions return partitionNames.stream() .collect(toImmutableMap(identity(), name -> columnStats.getOrDefault(name, ImmutableMap.of()))); } private Map getPartitionColumnStatisticsInternal(String databaseName, String tableName, PartitionName partitionName, Set columnNames) throws EntityNotFoundException { var columnStatsTasks = Lists.partition(ImmutableList.copyOf(columnNames), GLUE_COLUMN_READ_STAT_PAGE_SIZE).stream() .map(partialColumns -> (Callable>) () -> stats.getGetColumnStatisticsForPartition().call(() -> glueClient.getColumnStatisticsForPartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .partitionValues(partitionName.partitionValues()) .columnNames(partialColumns)) .columnStatisticsList())) .collect(toImmutableList()); try { var glueColumnStatistics = runParallel(columnStatsTasks); return fromGlueStatistics(glueColumnStatistics); } catch (ExecutionException e) { if (e.getCause() instanceof EntityNotFoundException) { return ImmutableMap.of(); } throw new TrinoException(HIVE_METASTORE_ERROR, "Failed fetching column statistics for %s.%s %s".formatted(databaseName, tableName, partitionName), e.getCause()); } } @Override public void updatePartitionStatistics(Table table, StatisticsUpdateMode mode, Map partitionUpdates) { batchUpdatePartitionStatistics(table.getDatabaseName(), table.getTableName(), mode, partitionUpdates.entrySet().stream() // filter out empty statistics for merge incremental mode .filter(entry -> mode != StatisticsUpdateMode.MERGE_INCREMENTAL || !entry.getValue().basicStatistics().getRowCount().equals(OptionalLong.of(0))) .collect(toImmutableMap(entry -> new PartitionName(HivePartitionManager.extractPartitionValues(entry.getKey())), Entry::getValue))); } private void batchUpdatePartitionStatistics(String databaseName, String tableName, StatisticsUpdateMode mode, Map newStatistics) throws EntityNotFoundException { // partitions are required for update // the glue cache is not used here because we need up-to-date partitions for the read-update-write operation // loaded partitions are not cached here since the partition values are invalidated after the update Collection partitions = batchGetPartition(databaseName, tableName, ImmutableList.copyOf(newStatistics.keySet()), _ -> {}); // existing column statistics are required for the columns being updated when in merge incremental mode // this is fetched before the basic statistics are updated, to avoid reloading in the case of retries updating basic statistics Map> existingColumnStatistics; if (mode == StatisticsUpdateMode.MERGE_INCREMENTAL) { try { existingColumnStatistics = runParallel(newStatistics.entrySet().stream() .map(entry -> (Callable>>) () -> { PartitionName partitionName = entry.getKey(); Map columnStatistics = getPartitionColumnStatisticsInternal(databaseName, tableName, partitionName, entry.getValue().columnStatistics().keySet()); return entry(partitionName, columnStatistics); }) .collect(toImmutableList())) .stream() .collect(toImmutableMap(Entry::getKey, Entry::getValue)); } catch (ExecutionException e) { throwIfUnchecked(e.getCause()); throw new TrinoException(HIVE_METASTORE_ERROR, "Failed fetching current partition statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } } else { existingColumnStatistics = ImmutableMap.of(); } List partitionStatisticsUpdates = new ArrayList<>(); for (Partition partition : partitions) { PartitionName partitionName = new PartitionName(partition.getValues()); PartitionStatistics existingStats = new PartitionStatistics( getHiveBasicStatistics(partition.getParameters()), existingColumnStatistics.getOrDefault(partitionName, ImmutableMap.of())); PartitionStatistics newStats = newStatistics.get(partitionName); PartitionStatistics updatedStatistics = mode.updatePartitionStatistics(existingStats, newStats); Partition updatedPartition = partition.withParameters(updateStatisticsParameters(partition.getParameters(), updatedStatistics.basicStatistics())); boolean basicStatsUpdated = !updatedStatistics.basicStatistics().equals(existingStats.basicStatistics()); partitionStatisticsUpdates.add(new PartitionStatisticsUpdate(updatedPartition, basicStatsUpdated, updatedStatistics.columnStatistics())); } // partitions and statistics are updated in concurrently List> tasks = new ArrayList<>(); partitionStatisticsUpdates.stream() .map(update -> createUpdatePartitionStatisticsTasks(mode, update.updatedPartition(), update.updatedStatistics())) .flatMap(Collection::stream) .forEach(tasks::add); List updatedPartitions = partitionStatisticsUpdates.stream() .filter(PartitionStatisticsUpdate::basicStatsUpdated) .map(PartitionStatisticsUpdate::updatedPartition) .collect(toImmutableList()); Lists.partition(updatedPartitions, BATCH_UPDATE_PARTITION_MAX_PAGE_SIZE).stream() .map(partitionBatch -> (Callable) () -> { stats.getBatchUpdatePartition().call(() -> glueClient.batchUpdatePartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .tableName(tableName) .entries(partitionBatch.stream() .map(partition -> BatchUpdatePartitionRequestEntry.builder() .partitionValueList(partition.getValues()) .partitionInput(toGluePartitionInput(partition)) .build()) .collect(toImmutableList())))); return null; }) .forEach(tasks::add); try { runParallel(tasks); } catch (ExecutionException e) { throw new TrinoException(HIVE_METASTORE_ERROR, "Failed updating partition column statistics for %s.%s".formatted(databaseName, tableName), e.getCause()); } } private List> createUpdatePartitionStatisticsTasks(StatisticsUpdateMode mode, Partition partition, Map updatedStatistics) { Map columns = partition.getColumns().stream() .collect(toImmutableMap(Column::getName, identity())); Map statisticsByColumn = columns.values().stream() .filter(column -> updatedStatistics.containsKey(column.getName())) .collect(toImmutableMap(identity(), column -> updatedStatistics.get(column.getName()))); Set removeColumnStatistics = switch (mode) { case OVERWRITE_SOME_COLUMNS -> ImmutableSet.of(); case OVERWRITE_ALL, MERGE_INCREMENTAL -> columns.entrySet().stream() // all columns not being updated are removed .filter(entry -> !statisticsByColumn.containsKey(entry.getValue())) .map(Entry::getKey) .collect(Collectors.toSet()); case UNDO_MERGE_INCREMENTAL, CLEAR_ALL -> columns.keySet(); }; ImmutableList.Builder> tasks = ImmutableList.builder(); Lists.partition(toGlueColumnStatistics(statisticsByColumn), GLUE_COLUMN_WRITE_STAT_PAGE_SIZE).stream() .map(chunk -> (Callable) () -> { stats.getUpdateColumnStatisticsForPartition().call(() -> glueClient.updateColumnStatisticsForPartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(partition.getDatabaseName()) .tableName(partition.getTableName()) .partitionValues(partition.getValues()) .columnStatisticsList(chunk))); return null; }) .forEach(tasks::add); removeColumnStatistics.stream() .map(columnName -> (Callable) () -> { stats.getDeleteColumnStatisticsForPartition().call(() -> glueClient.deleteColumnStatisticsForPartition(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(partition.getDatabaseName()) .tableName(partition.getTableName()) .partitionValues(partition.getValues()) .columnName(columnName))); return null; }) .forEach(tasks::add); return tasks.build(); } private record PartitionStatisticsUpdate(Partition updatedPartition, boolean basicStatsUpdated, Map updatedStatistics) {} // // Function management // @Override public boolean functionExists(String databaseName, String functionName, String signatureToken) { try { // this call is only used for create/drop function so is not worth caching stats.getUpdateUserDefinedFunction().call(() -> glueClient.getUserDefinedFunction(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .functionName(metastoreFunctionName(functionName, signatureToken)))); return true; } catch (software.amazon.awssdk.services.glue.model.EntityNotFoundException e) { return false; } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } } @Override public Collection getAllFunctions(String databaseName) { return glueCache.getAllFunctions(databaseName, () -> getFunctionsByPatternInternal(databaseName, "trino__.*")); } @Override public Collection getFunctions(String databaseName, String functionName) { return glueCache.getFunction(databaseName, functionName, () -> getFunctionsByPatternInternal(databaseName, "trino__" + Pattern.quote(functionName) + "__.*")); } private Collection getFunctionsByPatternInternal(String databaseName, String functionNamePattern) { try { return stats.getGetUserDefinedFunctions().call(() -> glueClient.getUserDefinedFunctionsPaginator(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .pattern(functionNamePattern) .maxResults(AWS_GLUE_GET_FUNCTIONS_MAX_RESULTS)).stream() .map(GetUserDefinedFunctionsResponse::userDefinedFunctions) .flatMap(List::stream) .map(GlueConverter::fromGlueFunction) .collect(toImmutableList())); } catch (software.amazon.awssdk.services.glue.model.EntityNotFoundException | AccessDeniedException e) { log.warn(e, "Failed to get SQL routines for pattern: %s in schema: %s", functionNamePattern, databaseName); return ImmutableList.of(); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } } @Override public void createFunction(String databaseName, String functionName, LanguageFunction function) { if (functionName.contains("__")) { throw new TrinoException(NOT_SUPPORTED, "Function names with double underscore are not supported"); } try { software.amazon.awssdk.services.glue.model.UserDefinedFunctionInput functionInput = toGlueFunctionInput(functionName, function); stats.getCreateUserDefinedFunction().call(() -> glueClient.createUserDefinedFunction(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .functionInput(functionInput))); } catch (software.amazon.awssdk.services.glue.model.AlreadyExistsException e) { throw new TrinoException(ALREADY_EXISTS, "Function already exists: %s.%s".formatted(databaseName, functionName), e); } catch (software.amazon.awssdk.services.glue.model.EntityNotFoundException e) { throw new SchemaNotFoundException(databaseName, e); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateFunction(databaseName, functionName); } } @Override public void replaceFunction(String databaseName, String functionName, LanguageFunction function) { try { UserDefinedFunctionInput functionInput = toGlueFunctionInput(functionName, function); stats.getUpdateUserDefinedFunction().call(() -> glueClient.updateUserDefinedFunction(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .functionName(metastoreFunctionName(functionName, function.signatureToken())) .functionInput(functionInput))); } catch (software.amazon.awssdk.services.glue.model.EntityNotFoundException e) { throw new TrinoException(FUNCTION_NOT_FOUND, "Function not found: %s.%s".formatted(databaseName, functionName), e); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateFunction(databaseName, functionName); } } @Override public void dropFunction(String databaseName, String functionName, String signatureToken) { try { stats.getDeleteUserDefinedFunction().call(() -> glueClient.deleteUserDefinedFunction(builder -> builder .applyMutation(glueContext::configureClient) .databaseName(databaseName) .functionName(metastoreFunctionName(functionName, signatureToken)))); } catch (software.amazon.awssdk.services.glue.model.EntityNotFoundException e) { throw new TrinoException(FUNCTION_NOT_FOUND, "Function not found: %s.%s".formatted(databaseName, functionName), e); } catch (SdkException e) { throw new TrinoException(HIVE_METASTORE_ERROR, e); } finally { glueCache.invalidateFunction(databaseName, functionName); } } // // Glue does not support permissions management or ACID transactions // @Override public void createRole(String role, String grantor) { throw new TrinoException(NOT_SUPPORTED, "createRole is not supported by Glue"); } @Override public void dropRole(String role) { throw new TrinoException(NOT_SUPPORTED, "dropRole is not supported by Glue"); } @Override public Set listRoles() { return ImmutableSet.of(PUBLIC_ROLE_NAME); } @Override public void grantRoles(Set roles, Set grantees, boolean adminOption, HivePrincipal grantor) { throw new TrinoException(NOT_SUPPORTED, "grantRoles is not supported by Glue"); } @Override public void revokeRoles(Set roles, Set grantees, boolean adminOption, HivePrincipal grantor) { throw new TrinoException(NOT_SUPPORTED, "revokeRoles is not supported by Glue"); } @Override public Set listRoleGrants(HivePrincipal principal) { if (principal.getType() == USER) { return ImmutableSet.of(new RoleGrant(principal.toTrinoPrincipal(), PUBLIC_ROLE_NAME, false)); } return ImmutableSet.of(); } @Override public void grantTablePrivileges(String databaseName, String tableName, String tableOwner, HivePrincipal grantee, HivePrincipal grantor, Set privileges, boolean grantOption) { throw new TrinoException(NOT_SUPPORTED, "grantTablePrivileges is not supported by Glue"); } @Override public void revokeTablePrivileges(String databaseName, String tableName, String tableOwner, HivePrincipal grantee, HivePrincipal grantor, Set privileges, boolean grantOption) { throw new TrinoException(NOT_SUPPORTED, "revokeTablePrivileges is not supported by Glue"); } @Override public Set listTablePrivileges(String databaseName, String tableName, Optional tableOwner, Optional principal) { return ImmutableSet.of(); } @Override public void checkSupportsTransactions() { throw new TrinoException(NOT_SUPPORTED, "Glue does not support ACID tables"); } /** * Run all tasks on executor returning as soon as all complete or any task fails. * Upon task execution failure, other tasks are canceled and interrupted, but not waited * for. * * @return results of all tasks in any order * @throws ExecutionException if any task fails; exception cause is the first task failure */ private List runParallel(Collection> tasks) throws ExecutionException { return processWithAdditionalThreads(tasks, executor); } public enum TableKind { OTHER, DELTA, ICEBERG, HUDI } private static Predicate createTablePredicate(Set visibleTableKinds) { // nothing is visible if (visibleTableKinds.isEmpty()) { return _ -> false; } // everything is visible if (visibleTableKinds.equals(ImmutableSet.copyOf(TableKind.values()))) { return _ -> true; } // exclusion if (visibleTableKinds.contains(TableKind.OTHER)) { EnumSet deniedKinds = EnumSet.complementOf(EnumSet.copyOf(visibleTableKinds)); Predicate tableVisibilityFilter = _ -> true; for (TableKind value : deniedKinds) { tableVisibilityFilter = tableVisibilityFilter.and(not(tableKindPredicate(value))); } return tableVisibilityFilter; } // inclusion Predicate tableVisibilityFilter = _ -> false; for (TableKind tableKind : visibleTableKinds) { tableVisibilityFilter = tableVisibilityFilter.or(tableKindPredicate(tableKind)); } return tableVisibilityFilter; } private static Predicate tableKindPredicate(TableKind tableKind) { return switch (tableKind) { case DELTA -> table -> isDeltaLakeTable(table.parameters()); case ICEBERG -> table -> isIcebergTable(table.parameters()); case HUDI -> table -> table.storageDescriptor() != null && isHudiTable(table.storageDescriptor().inputFormat()); case OTHER -> throw new IllegalArgumentException("Predicate can not be created for OTHER"); }; } }