All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.paimon.spark.SparkReaderFactory Maven / Gradle / Ivy

There is a newer version: 0.9.0
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.paimon.spark;

import org.apache.paimon.data.InternalRow;
import org.apache.paimon.disk.IOManager;
import org.apache.paimon.reader.RecordReader;
import org.apache.paimon.reader.RecordReaderIterator;
import org.apache.paimon.table.source.ReadBuilder;

import org.apache.spark.sql.connector.read.InputPartition;
import org.apache.spark.sql.connector.read.PartitionReader;
import org.apache.spark.sql.connector.read.PartitionReaderFactory;

import java.io.IOException;
import java.io.UncheckedIOException;

import static org.apache.paimon.spark.SparkUtils.createIOManager;

/**
 * A Spark {@link PartitionReaderFactory} for paimon.
 *
 * <p>Every call to {@link #createReader(InputPartition)} builds a new read from the configured
 * {@link ReadBuilder} and pairs it with its own {@link IOManager}. Two factories are equal when
 * their read builders are equal.
 */
public class SparkReaderFactory implements PartitionReaderFactory {

    private static final long serialVersionUID = 1L;

    /** Builds the per-partition reads and supplies the row type for {@link SparkInternalRow}. */
    private final ReadBuilder readBuilder;

    /**
     * Creates a factory that reads through the given builder.
     *
     * @param readBuilder builder used to create a read for each input partition
     */
    public SparkReaderFactory(ReadBuilder readBuilder) {
        this.readBuilder = readBuilder;
    }

    /**
     * Creates a reader over the split carried by {@code partition}.
     *
     * <p>NOTE(review): the reader types below are raw; the type arguments look like they were
     * lost at some point. Confirm against the upstream signature before parameterizing.
     *
     * @param partition the partition to read; it is cast to {@link SparkInputPartition}
     * @return a {@link SparkInputPartitionReader} wrapping the record reader and its IOManager
     * @throws UncheckedIOException if the underlying record reader cannot be created
     */
    @Override
    public PartitionReader createReader(InputPartition partition) {
        RecordReader reader;
        IOManager ioManager = createIOManager();
        try {
            reader =
                    readBuilder
                            .newRead()
                            .withIOManager(ioManager)
                            .createReader(((SparkInputPartition) partition).split());
        } catch (IOException e) {
            // The IOManager is only handed to the returned reader on success, so on this path
            // nobody else would ever release it.
            closeAfterFailure(ioManager, e);
            throw new UncheckedIOException(e);
        } catch (RuntimeException e) {
            closeAfterFailure(ioManager, e);
            throw e;
        }
        RecordReaderIterator iterator = new RecordReaderIterator<>(reader);
        SparkInternalRow row = new SparkInternalRow(readBuilder.readType());
        return new SparkInputPartitionReader(ioManager, iterator, row);
    }

    /** Closes {@code ioManager} after {@code failure}, recording any close error as suppressed. */
    private static void closeAfterFailure(IOManager ioManager, Exception failure) {
        try {
            ioManager.close();
        } catch (Exception closeFailure) {
            // Keep the original failure as the primary error; do not mask it.
            failure.addSuppressed(closeFailure);
        }
    }

    @Override
    public boolean equals(Object o) {
        if (this == o) {
            return true;
        }

        if (o == null || getClass() != o.getClass()) {
            return false;
        }

        SparkReaderFactory that = (SparkReaderFactory) o;
        return this.readBuilder.equals(that.readBuilder);
    }

    /** Hashes on the read builder only, so that equal factories always share a hash code. */
    @Override
    public int hashCode() {
        return readBuilder.hashCode();
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy