All downloads are free. The search and download functionality uses the official Maven repository.

org.apache.kylin.tool.garbage.DataflowCleanerCLI Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.kylin.tool.garbage;

import java.util.List;
import java.util.stream.Collectors;

import org.apache.kylin.common.KylinConfig;
import org.apache.kylin.common.util.Unsafe;
import org.apache.kylin.guava30.shaded.common.collect.Lists;
import org.apache.kylin.guava30.shaded.common.collect.Sets;
import org.apache.kylin.metadata.cube.model.LayoutEntity;
import org.apache.kylin.metadata.cube.model.NDataLayout;
import org.apache.kylin.metadata.cube.model.NDataSegment;
import org.apache.kylin.metadata.cube.model.NDataflow;
import org.apache.kylin.metadata.cube.model.NDataflowManager;
import org.apache.kylin.metadata.model.NDataModel;
import org.apache.kylin.metadata.project.EnhancedUnitOfWork;
import org.apache.kylin.metadata.project.NProjectManager;
import org.apache.kylin.metadata.project.ProjectInstance;

import lombok.val;
import lombok.extern.slf4j.Slf4j;

/**
 * Command-line entry point that, for every project, removes layouts that are still
 * recorded in a dataflow's segments but are no longer part of the dataflow's index plan.
 */
@Slf4j
public class DataflowCleanerCLI {

    /**
     * Runs the cleanup for all projects, prints a completion message to standard output
     * and then exits with status code 0.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        execute();
        System.out.println("Cleanup dataflow finished.");
        Unsafe.systemExit(0);
    }

    /**
     * Iterates over every project returned by the project manager and cleans up its dataflows.
     * A failure in one project is logged as a warning and does not stop the remaining
     * projects from being processed.
     */
    public static void execute() {
        KylinConfig config = KylinConfig.getInstanceFromEnv();
        val projectManager = NProjectManager.getInstance(config);
        for (ProjectInstance project : projectManager.listAllProjects()) {
            log.info("Start dataflow cleanup for project<{}>", project.getName());
            try {
                cleanupRedundantIndex(project);
            } catch (Exception e) {
                // Best effort: keep going with the next project.
                log.warn("Clean dataflow for project<{}> failed", project.getName(), e);
            }
            log.info("Dataflow cleanup for project<{}> finished", project.getName());
        }
    }

    /**
     * Removes redundant layouts from every data model of the given project. The work is
     * submitted through {@code EnhancedUnitOfWork.doInTransactionWithCheckAndRetry} under
     * the project's name.
     *
     * @param project the project whose dataflows are cleaned
     */
    private static void cleanupRedundantIndex(ProjectInstance project) {
        EnhancedUnitOfWork.doInTransactionWithCheckAndRetry(() -> {
            val models = NDataflowManager.getInstance(KylinConfig.getInstanceFromEnv(), project.getName())
                    .listUnderliningDataModels();
            for (NDataModel model : models) {
                removeLayouts(model);
            }
            return 0;
        }, project.getName());
    }

    /**
     * Collects, across all segments of the model's dataflow, the ids of layouts that do not
     * appear in the dataflow's index plan, and asks the dataflow manager to remove them.
     *
     * @param model the model whose dataflow (looked up by the model's UUID) is cleaned
     */
    private static void removeLayouts(NDataModel model) {
        val dataflowManager = NDataflowManager.getInstance(KylinConfig.getInstanceFromEnv(), model.getProject());
        val dataflow = dataflowManager.getDataflow(model.getUuid());
        // Copy into a hash set once so the per-layout membership test below is not a list scan.
        val layoutIds = Sets.newHashSet(getLayouts(dataflow));
        val toBeRemoved = Sets.<Long> newHashSet();
        for (NDataSegment segment : dataflow.getSegments()) {
            toBeRemoved.addAll(segment.getSegDetails().getAllLayouts().stream().map(NDataLayout::getLayoutId)
                    .filter(id -> !layoutIds.contains(id)).collect(Collectors.toSet()));
        }
        dataflowManager.removeLayouts(dataflow, Lists.newArrayList(toBeRemoved));
    }

    /**
     * Returns the ids of all layouts defined in the index plan of the given dataflow.
     *
     * @param dataflow the dataflow whose index plan is inspected
     * @return the layout ids, in the order produced by the index plan's layout list
     */
    private static List<Long> getLayouts(NDataflow dataflow) {
        val cube = dataflow.getIndexPlan();
        val layouts = cube.getAllLayouts();
        return layouts.stream().map(LayoutEntity::getId).collect(Collectors.toList());
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy