org.apache.paimon.spark.procedure.MigrateTableProcedure Maven / Gradle / Ivy
The newest version!
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.paimon.spark.procedure;
import org.apache.paimon.catalog.Catalog;
import org.apache.paimon.catalog.Identifier;
import org.apache.paimon.migrate.Migrator;
import org.apache.paimon.spark.catalog.WithPaimonCatalog;
import org.apache.paimon.spark.utils.TableMigrationUtils;
import org.apache.paimon.utils.ParameterUtils;
import org.apache.paimon.utils.StringUtils;
import org.apache.spark.sql.catalyst.InternalRow;
import org.apache.spark.sql.catalyst.util.MapData;
import org.apache.spark.sql.connector.catalog.TableCatalog;
import org.apache.spark.sql.types.DataTypes;
import org.apache.spark.sql.types.Metadata;
import org.apache.spark.sql.types.StructField;
import org.apache.spark.sql.types.StructType;
import java.util.HashMap;
import java.util.Map;
import static org.apache.spark.sql.types.DataTypes.BooleanType;
import static org.apache.spark.sql.types.DataTypes.IntegerType;
import static org.apache.spark.sql.types.DataTypes.StringType;
/**
 * Migrate table procedure. Usage:
 *
 * <pre>{@code
 * CALL sys.migrate_table(source_type => 'hive', table => 'db.tbl', options => 'x1=y1,x2=y2')
 * }</pre>
 *
 * <p>Parameters, in positional order:
 *
 * <ol>
 *   <li>{@code source_type} (required): format of the source table, handed to the importer.
 *   <li>{@code table} (required): identifier of the source table.
 *   <li>{@code options} (optional): comma separated {@code key=value} pairs.
 *   <li>{@code delete_origin} (optional): flag handed to the migrator; {@code true} when omitted.
 *   <li>{@code target_table} (optional): identifier of the table to migrate into. When empty,
 *       the data is migrated into a temporary table named after the source table plus
 *       {@code _paimon_}, which is then renamed to the source table identifier.
 *   <li>{@code options_map} (optional): options given as a map; on duplicate keys these entries
 *       replace the ones parsed from {@code options}.
 *   <li>{@code parallelism} (optional): defaults to the number of available processors.
 * </ol>
 */
public class MigrateTableProcedure extends BaseProcedure {

    /** Suffix appended to the source table name to build the temporary target table name. */
    private static final String TMP_TBL_SUFFIX = "_paimon_";

    private static final ProcedureParameter[] PARAMETERS =
            new ProcedureParameter[] {
                ProcedureParameter.required("source_type", StringType),
                ProcedureParameter.required("table", StringType),
                ProcedureParameter.optional("options", StringType),
                ProcedureParameter.optional("delete_origin", BooleanType),
                ProcedureParameter.optional("target_table", StringType),
                ProcedureParameter.optional(
                        "options_map", DataTypes.createMapType(StringType, StringType)),
                ProcedureParameter.optional("parallelism", IntegerType),
            };

    private static final StructType OUTPUT_TYPE =
            new StructType(
                    new StructField[] {
                        new StructField("result", DataTypes.BooleanType, true, Metadata.empty())
                    });

    protected MigrateTableProcedure(TableCatalog tableCatalog) {
        super(tableCatalog);
    }

    @Override
    public ProcedureParameter[] parameters() {
        return PARAMETERS;
    }

    @Override
    public StructType outputType() {
        return OUTPUT_TYPE;
    }

    /**
     * Runs the migration described by {@code args}.
     *
     * @param args procedure arguments, laid out in the order of {@link #parameters()}
     * @return a single row holding {@code true} once the migration has completed
     * @throws IllegalArgumentException if {@code options_map} contains a null value
     * @throws RuntimeException wrapping any exception raised while creating the migrator,
     *     migrating, or renaming the temporary table
     */
    @Override
    public InternalRow[] call(InternalRow args) {
        String format = args.getString(0);
        String sourceTable = args.getString(1);
        String properties = args.isNullAt(2) ? null : args.getString(2);
        // An omitted delete_origin is treated as true.
        boolean deleteNeed = args.isNullAt(3) || args.getBoolean(3);
        String targetTable = args.isNullAt(4) ? null : args.getString(4);
        MapData mapData = args.isNullAt(5) ? null : args.getMap(5);
        Map<String, String> optionMap = mapDataToHashMap(mapData);
        int parallelism =
                args.isNullAt(6) ? Runtime.getRuntime().availableProcessors() : args.getInt(6);

        // Without an explicit target the data goes to a temporary table that is renamed to the
        // source identifier after a successful migration.
        boolean useTmpTable = StringUtils.isEmpty(targetTable);

        Identifier sourceTableId = Identifier.fromString(sourceTable);
        Identifier tmpTableId =
                useTmpTable
                        ? Identifier.fromString(sourceTable + TMP_TBL_SUFFIX)
                        : Identifier.fromString(targetTable);

        Catalog paimonCatalog = ((WithPaimonCatalog) tableCatalog()).paimonCatalog();

        // Entries from options_map replace same-key entries parsed from the options string.
        Map<String, String> options = ParameterUtils.parseCommaSeparatedKeyValues(properties);
        options.putAll(optionMap);

        try {
            Migrator migrator =
                    TableMigrationUtils.getImporter(
                            format,
                            paimonCatalog,
                            sourceTableId.getDatabaseName(),
                            sourceTableId.getObjectName(),
                            tmpTableId.getDatabaseName(),
                            tmpTableId.getObjectName(),
                            parallelism,
                            options);

            migrator.deleteOriginTable(deleteNeed);
            migrator.executeMigrate();
            if (useTmpTable) {
                paimonCatalog.renameTable(tmpTableId, sourceTableId, false);
            }
        } catch (Exception e) {
            throw new RuntimeException("Call migrate_table error: " + e.getMessage(), e);
        }

        return new InternalRow[] {newInternalRow(true)};
    }

    /**
     * Copies a Spark string-to-string {@link MapData} into a new mutable {@link HashMap}.
     *
     * @param mapData the map to convert, may be {@code null}
     * @return a new map with the converted entries; empty when {@code mapData} is {@code null}
     * @throws IllegalArgumentException if an entry has a null value
     */
    public static Map<String, String> mapDataToHashMap(MapData mapData) {
        Map<String, String> map = new HashMap<>();
        if (mapData == null) {
            return map;
        }
        for (int index = 0; index < mapData.numElements(); index++) {
            String key = mapData.keyArray().getUTF8String(index).toString();
            // Fail with the offending key instead of a bare NullPointerException on toString().
            if (mapData.valueArray().isNullAt(index)) {
                throw new IllegalArgumentException(
                        "Map value for key '" + key + "' must not be null.");
            }
            map.put(key, mapData.valueArray().getUTF8String(index).toString());
        }
        return map;
    }

    /** Returns a builder that creates {@link MigrateTableProcedure} instances. */
    public static ProcedureBuilder builder() {
        // NOTE(review): Builder's declaration is not visible here; if it is generic, add the
        // MigrateTableProcedure type argument.
        return new BaseProcedure.Builder() {
            @Override
            public MigrateTableProcedure doBuild() {
                return new MigrateTableProcedure(tableCatalog());
            }
        };
    }

    @Override
    public String description() {
        return "MigrateTableProcedure";
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy