All downloads are free. The search and download features use the official Maven repository.

org.apache.paimon.spark.procedure.MigrateTableProcedure Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.paimon.spark.procedure;

import org.apache.paimon.catalog.Catalog;
import org.apache.paimon.catalog.Identifier;
import org.apache.paimon.migrate.Migrator;
import org.apache.paimon.spark.catalog.WithPaimonCatalog;
import org.apache.paimon.spark.utils.TableMigrationUtils;
import org.apache.paimon.utils.ParameterUtils;
import org.apache.paimon.utils.StringUtils;

import org.apache.spark.sql.catalyst.InternalRow;
import org.apache.spark.sql.catalyst.util.MapData;
import org.apache.spark.sql.connector.catalog.TableCatalog;
import org.apache.spark.sql.types.DataTypes;
import org.apache.spark.sql.types.Metadata;
import org.apache.spark.sql.types.StructField;
import org.apache.spark.sql.types.StructType;

import java.util.HashMap;
import java.util.Map;

import static org.apache.spark.sql.types.DataTypes.BooleanType;
import static org.apache.spark.sql.types.DataTypes.IntegerType;
import static org.apache.spark.sql.types.DataTypes.StringType;

/**
 * Migrate table procedure. Usage:
 *
 * 

 *  CALL sys.migrate_table(source_type => 'hive', table => 'db.tbl', options => 'x1=y1,x2=y2')
 * 
*/ public class MigrateTableProcedure extends BaseProcedure { private static final String TMP_TBL_SUFFIX = "_paimon_"; private static final ProcedureParameter[] PARAMETERS = new ProcedureParameter[] { ProcedureParameter.required("source_type", StringType), ProcedureParameter.required("table", StringType), ProcedureParameter.optional("options", StringType), ProcedureParameter.optional("delete_origin", BooleanType), ProcedureParameter.optional("target_table", StringType), ProcedureParameter.optional( "options_map", DataTypes.createMapType(StringType, StringType)), ProcedureParameter.optional("parallelism", IntegerType), }; private static final StructType OUTPUT_TYPE = new StructType( new StructField[] { new StructField("result", DataTypes.BooleanType, true, Metadata.empty()) }); protected MigrateTableProcedure(TableCatalog tableCatalog) { super(tableCatalog); } @Override public ProcedureParameter[] parameters() { return PARAMETERS; } @Override public StructType outputType() { return OUTPUT_TYPE; } @Override public InternalRow[] call(InternalRow args) { String format = args.getString(0); String sourceTable = args.getString(1); String properties = args.isNullAt(2) ? null : args.getString(2); boolean deleteNeed = args.isNullAt(3) || args.getBoolean(3); String targetTable = args.isNullAt(4) ? null : args.getString(4); MapData mapData = args.isNullAt(5) ? null : args.getMap(5); Map optionMap = mapDataToHashMap(mapData); int parallelism = args.isNullAt(6) ? Runtime.getRuntime().availableProcessors() : args.getInt(6); Identifier sourceTableId = Identifier.fromString(sourceTable); Identifier tmpTableId = StringUtils.isEmpty(targetTable) ? 
Identifier.fromString(sourceTable + TMP_TBL_SUFFIX) : Identifier.fromString(targetTable); Catalog paimonCatalog = ((WithPaimonCatalog) tableCatalog()).paimonCatalog(); Map options = ParameterUtils.parseCommaSeparatedKeyValues(properties); options.putAll(optionMap); try { Migrator migrator = TableMigrationUtils.getImporter( format, paimonCatalog, sourceTableId.getDatabaseName(), sourceTableId.getObjectName(), tmpTableId.getDatabaseName(), tmpTableId.getObjectName(), parallelism, options); migrator.deleteOriginTable(deleteNeed); migrator.executeMigrate(); if (StringUtils.isEmpty(targetTable)) { paimonCatalog.renameTable(tmpTableId, sourceTableId, false); } } catch (Exception e) { throw new RuntimeException("Call migrate_table error: " + e.getMessage(), e); } return new InternalRow[] {newInternalRow(true)}; } public static Map mapDataToHashMap(MapData mapData) { HashMap map = new HashMap<>(); if (mapData != null) { for (int index = 0; index < mapData.numElements(); index++) { map.put( mapData.keyArray().getUTF8String(index).toString(), mapData.valueArray().getUTF8String(index).toString()); } } return map; } public static ProcedureBuilder builder() { return new BaseProcedure.Builder() { @Override public MigrateTableProcedure doBuild() { return new MigrateTableProcedure(tableCatalog()); } }; } @Override public String description() { return "MigrateTableProcedure"; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy