All downloads are free. The search and download functionality uses the official Maven repository.

org.dinky.shaded.paimon.crosspartition.ExistingProcessor Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.dinky.shaded.paimon.crosspartition;

import org.dinky.shaded.paimon.CoreOptions.MergeEngine;
import org.dinky.shaded.paimon.data.BinaryRow;
import org.dinky.shaded.paimon.data.InternalRow;
import org.dinky.shaded.paimon.utils.ProjectToRowFunction;
import org.dinky.shaded.paimon.utils.RowIterator;

import java.util.function.BiConsumer;
import java.util.function.Function;

/**
 * Processor to process existing key.
 *
 * <p>Implementations are obtained through {@link #create}, which selects one according to the
 * table's {@link MergeEngine}.
 */
public interface ExistingProcessor {

    /**
     * Handles a new record whose key already exists.
     *
     * @param newRow the incoming record
     * @param previousPart the partition associated with the existing key
     * @param previousBucket the bucket associated with the existing key
     * @return {@code true} if the new record should be processed, {@code false} otherwise
     */
    boolean processExists(InternalRow newRow, BinaryRow previousPart, int previousBucket);

    /**
     * Bulk loads new records.
     *
     * @param iteratorFunction produces a {@link RowIterator} for a requested {@link SortOrder}
     * @param extractPrimary extracts the primary key from a row
     * @param extractPartition extracts the partition from a row
     * @param assignBucket assigns a bucket to a partition
     */
    void bulkLoadNewRecords(
            Function<SortOrder, RowIterator> iteratorFunction,
            Function<InternalRow, BinaryRow> extractPrimary,
            Function<InternalRow, BinaryRow> extractPartition,
            Function<BinaryRow, Integer> assignBucket);

    /**
     * Drains {@code iterator} and hands a row to {@code collector} whenever its primary key
     * differs from the key of the most recently collected row; every other row is dropped.
     *
     * <p>Only adjacent rows are compared, so full de-duplication presumably relies on the
     * iterator yielding rows grouped by primary key (TODO confirm with callers).
     *
     * @param collector receives each retained row together with its assigned bucket
     * @param iterator source of rows; iteration stops at the first {@code null}
     * @param extractPrimary extracts the primary key from a row
     * @param extractPartition extracts the partition from a row
     * @param assignBucket assigns a bucket to a partition
     */
    static void bulkLoadCollectFirst(
            BiConsumer<InternalRow, Integer> collector,
            RowIterator iterator,
            Function<InternalRow, BinaryRow> extractPrimary,
            Function<InternalRow, BinaryRow> extractPartition,
            Function<BinaryRow, Integer> assignBucket) {
        InternalRow row;
        BinaryRow currentKey = null;
        while ((row = iterator.next()) != null) {
            BinaryRow primaryKey = extractPrimary.apply(row);
            if (currentKey == null || !currentKey.equals(primaryKey)) {
                collector.accept(row, assignBucket.apply(extractPartition.apply(row)));
                // Keep a private copy of the key; presumably the extractor may reuse the
                // returned instance for subsequent rows (TODO confirm).
                currentKey = primaryKey.copy();
            }
        }
    }

    /**
     * Creates the processor matching the given merge engine.
     *
     * <ul>
     *   <li>{@code DEDUPLICATE}: {@code DeleteExistingProcessor}
     *   <li>{@code PARTIAL_UPDATE} and {@code AGGREGATE}: {@code UseOldExistingProcessor}
     *   <li>{@code FIRST_ROW}: {@code SkipNewExistingProcessor}
     * </ul>
     *
     * @param mergeEngine the merge engine to select a processor for
     * @param setPartition passed to the processors for {@code DEDUPLICATE}, {@code
     *     PARTIAL_UPDATE} and {@code AGGREGATE}
     * @param bucketAssigner passed to the {@code DEDUPLICATE} processor only
     * @param collector receives rows together with their bucket
     * @return the processor for {@code mergeEngine}
     * @throws UnsupportedOperationException if {@code mergeEngine} is not one of the above
     */
    static ExistingProcessor create(
            MergeEngine mergeEngine,
            ProjectToRowFunction setPartition,
            BucketAssigner bucketAssigner,
            BiConsumer<InternalRow, Integer> collector) {
        switch (mergeEngine) {
            case DEDUPLICATE:
                return new DeleteExistingProcessor(setPartition, bucketAssigner, collector);
            case PARTIAL_UPDATE:
            case AGGREGATE:
                return new UseOldExistingProcessor(setPartition, collector);
            case FIRST_ROW:
                return new SkipNewExistingProcessor(collector);
            default:
                throw new UnsupportedOperationException("Unsupported engine: " + mergeEngine);
        }
    }

    /** Input Order for sorting. */
    enum SortOrder {
        ASCENDING,
        DESCENDING,
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy