All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.paimon.flink.procedure.RemoveOrphanFilesProcedure Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.paimon.flink.procedure;

import org.apache.paimon.catalog.Identifier;
import org.apache.paimon.flink.orphan.FlinkOrphanFilesClean;
import org.apache.paimon.operation.CleanOrphanFilesResult;
import org.apache.paimon.operation.LocalOrphanFilesClean;

import org.apache.flink.table.procedure.ProcedureContext;

import java.util.Locale;

import static org.apache.paimon.operation.OrphanFilesClean.createFileCleaner;
import static org.apache.paimon.operation.OrphanFilesClean.olderThanMillis;

/**
 * Remove orphan files procedure. Usage:
 *
 * 

 *  -- use the default file delete interval
 *  CALL sys.remove_orphan_files('tableId')
 *
 *  -- use custom file delete interval
 *  CALL sys.remove_orphan_files('tableId', '2023-12-31 23:59:59')
 *
 *  -- remove all tables' orphan files in db
 *  CALL sys.remove_orphan_files('databaseName.*', '2023-12-31 23:59:59')
 * 
*/ public class RemoveOrphanFilesProcedure extends ProcedureBase { public static final String IDENTIFIER = "remove_orphan_files"; public String[] call(ProcedureContext procedureContext, String tableId) throws Exception { return call(procedureContext, tableId, ""); } public String[] call(ProcedureContext procedureContext, String tableId, String olderThan) throws Exception { return call(procedureContext, tableId, olderThan, false); } public String[] call( ProcedureContext procedureContext, String tableId, String olderThan, boolean dryRun) throws Exception { return call(procedureContext, tableId, olderThan, dryRun, null); } public String[] call( ProcedureContext procedureContext, String tableId, String olderThan, boolean dryRun, Integer parallelism) throws Exception { return call(procedureContext, tableId, olderThan, dryRun, parallelism, null); } public String[] call( ProcedureContext procedureContext, String tableId, String olderThan, boolean dryRun, Integer parallelism, String mode) throws Exception { Identifier identifier = Identifier.fromString(tableId); String databaseName = identifier.getDatabaseName(); String tableName = identifier.getObjectName(); if (mode == null) { mode = "DISTRIBUTED"; } CleanOrphanFilesResult cleanOrphanFilesResult; try { switch (mode.toUpperCase(Locale.ROOT)) { case "DISTRIBUTED": cleanOrphanFilesResult = FlinkOrphanFilesClean.executeDatabaseOrphanFiles( procedureContext.getExecutionEnvironment(), catalog, olderThanMillis(olderThan), createFileCleaner(catalog, dryRun), parallelism, databaseName, tableName); break; case "LOCAL": cleanOrphanFilesResult = LocalOrphanFilesClean.executeDatabaseOrphanFiles( catalog, databaseName, tableName, olderThanMillis(olderThan), createFileCleaner(catalog, dryRun), parallelism); break; default: throw new IllegalArgumentException( "Unknown mode: " + mode + ". 
Only 'DISTRIBUTED' and 'LOCAL' are supported."); } return new String[] { String.valueOf(cleanOrphanFilesResult.getDeletedFileCount()), String.valueOf(cleanOrphanFilesResult.getDeletedFileTotalLenInBytes()) }; } catch (Exception e) { throw new RuntimeException(e); } } @Override public String identifier() { return IDENTIFIER; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy