All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.flink.streaming.connectors.pulsar.table.DynamicPulsarDeserializationSchema Maven / Gradle / Ivy

There is a newer version: 1.12.0
Show newest version
/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.flink.streaming.connectors.pulsar.table;

import org.apache.flink.api.common.serialization.DeserializationSchema;
import org.apache.flink.api.common.typeinfo.TypeInformation;
import org.apache.flink.streaming.util.serialization.FlinkSchema;
import org.apache.flink.streaming.util.serialization.PulsarDeserializationSchema;
import org.apache.flink.streaming.util.serialization.ThreadSafeDeserializationSchema;
import org.apache.flink.table.data.GenericRowData;
import org.apache.flink.table.data.RowData;
import org.apache.flink.types.DeserializationException;
import org.apache.flink.types.RowKind;
import org.apache.flink.util.Collector;
import org.apache.flink.util.Preconditions;

import org.apache.pulsar.client.api.Message;
import org.apache.pulsar.client.api.Schema;

import javax.annotation.Nullable;

import java.io.IOException;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.List;

/**
 * A specific {@link PulsarDeserializationSchema} for {@link PulsarDynamicTableSource}.
 */
class DynamicPulsarDeserializationSchema implements PulsarDeserializationSchema {

    private static final long serialVersionUID = 1L;

    @Nullable
    private final DeserializationSchema keyDeserialization;

    private final DeserializationSchema valueDeserialization;

    private final boolean hasMetadata;

    private final OutputProjectionCollector outputCollector;

    private final TypeInformation producedTypeInfo;

    private final boolean upsertMode;

    private static final ThreadLocal> tlsCollector =
            new ThreadLocal>() {
                @Override
                public SimpleCollector initialValue() {
                    return new SimpleCollector();
                }
            };

    DynamicPulsarDeserializationSchema(
            int physicalArity,
            @Nullable DeserializationSchema keyDeserialization,
            int[] keyProjection,
            DeserializationSchema valueDeserialization,
            int[] valueProjection,
            boolean hasMetadata,
            MetadataConverter[] metadataConverters,
            TypeInformation producedTypeInfo,
            boolean upsertMode) {
        if (upsertMode) {
            Preconditions.checkArgument(
                    keyDeserialization != null && keyProjection.length > 0,
                    "Key must be set in upsert mode for deserialization schema.");
        }
        this.keyDeserialization = ThreadSafeDeserializationSchema.of(keyDeserialization);
        this.valueDeserialization = ThreadSafeDeserializationSchema.of(valueDeserialization);
        this.hasMetadata = hasMetadata;
        this.outputCollector = new OutputProjectionCollector(
                physicalArity,
                keyProjection,
                valueProjection,
                metadataConverters,
                upsertMode);
        this.producedTypeInfo = producedTypeInfo;
        this.upsertMode = upsertMode;
    }

    @Override
    public void open(DeserializationSchema.InitializationContext context) throws Exception {
        if (keyDeserialization != null) {
            keyDeserialization.open(context);
        }
        valueDeserialization.open(context);
    }

    @Override
    public boolean isEndOfStream(RowData nextElement) {
        return false;
    }

    @Override
    public RowData deserialize(Message message) throws IOException {
        final SimpleCollector collector = tlsCollector.get();
        deserialize(message, collector);
        return collector.takeRecord();
    }

    @Override
    public void deserialize(Message message, Collector collector) throws IOException {
        // shortcut in case no output projection is required,
        // also not for a cartesian product with the keys
        if (keyDeserialization == null && !hasMetadata) {
            valueDeserialization.deserialize(message.getData(), collector);
            return;
        }
        BufferingCollector keyCollector = new BufferingCollector();

        // buffer key(s)
        if (keyDeserialization != null) {
            keyDeserialization.deserialize(message.getKeyBytes(), keyCollector);
        }

        // project output while emitting values
        outputCollector.inputMessage = message;
        outputCollector.physicalKeyRows = keyCollector.buffer;
        outputCollector.outputCollector = collector;
        if ((message.getData() == null || message.getData().length == 0) && upsertMode) {
            // collect tombstone messages in upsert mode by hand
            outputCollector.collect(null);
        } else {
            valueDeserialization.deserialize(message.getData(), outputCollector);
        }
        keyCollector.buffer.clear();
    }

    @Override
    public TypeInformation getProducedType() {
        return producedTypeInfo;
    }

    @Override
    public Schema getSchema() {
        return new FlinkSchema<>(Schema.BYTES.getSchemaInfo(), null, valueDeserialization);
    }

    // --------------------------------------------------------------------------------------------

    interface MetadataConverter extends Serializable {
        Object read(Message message);
    }

    // --------------------------------------------------------------------------------------------

    private static final class BufferingCollector implements Collector, Serializable {

        private static final long serialVersionUID = 1L;

        private final List buffer = new ArrayList<>();

        @Override
        public void collect(RowData record) {
            buffer.add(record);
        }

        @Override
        public void close() {
            // nothing to do
        }
    }

    private static class SimpleCollector implements Collector {
        private T record;

        @Override
        public void collect(T record) {
            this.record = record;
        }

        @Override
        public void close() {

        }

        private T getRecord() {
            return record;
        }

        private T takeRecord() {
            T result = record;
            reset();
            return result;
        }

        private void reset() {
            record = null;
        }
    }

    // --------------------------------------------------------------------------------------------

    /**
     * Emits a row with key, value, and metadata fields.
     *
     * 

The collector is able to handle the following kinds of keys: *

    *
  • No key is used. *
  • A key is used. *
  • The deserialization schema emits multiple keys. *
  • Keys and values have overlapping fields. *
  • Keys are used and value is null. *
*/ private static final class OutputProjectionCollector implements Collector, Serializable { private static final long serialVersionUID = 1L; private final int physicalArity; private final int[] keyProjection; private final int[] valueProjection; private final MetadataConverter[] metadataConverters; private final boolean upsertMode; private transient Message inputMessage; private transient List physicalKeyRows; private transient Collector outputCollector; OutputProjectionCollector( int physicalArity, int[] keyProjection, int[] valueProjection, MetadataConverter[] metadataConverters, boolean upsertMode) { this.physicalArity = physicalArity; this.keyProjection = keyProjection; this.valueProjection = valueProjection; this.metadataConverters = metadataConverters; this.upsertMode = upsertMode; } @Override public void collect(RowData physicalValueRow) { // no key defined if (keyProjection.length == 0) { emitRow(null, (GenericRowData) physicalValueRow); return; } // otherwise emit a value for each key for (RowData physicalKeyRow : physicalKeyRows) { emitRow((GenericRowData) physicalKeyRow, (GenericRowData) physicalValueRow); } } @Override public void close() { // nothing to do } private void emitRow(@Nullable GenericRowData physicalKeyRow, @Nullable GenericRowData physicalValueRow) { final RowKind rowKind; if (physicalValueRow == null) { if (upsertMode) { rowKind = RowKind.DELETE; } else { throw new DeserializationException( "Invalid null value received in non-upsert mode. Could not to set row kind for output record."); } } else { rowKind = physicalValueRow.getRowKind(); } final int metadataArity = metadataConverters.length; final GenericRowData producedRow = new GenericRowData( rowKind, physicalArity + metadataArity); if (physicalValueRow != null) { for (int valuePos = 0; valuePos < valueProjection.length; valuePos++) { producedRow.setField(valueProjection[valuePos], physicalValueRow.getField(valuePos)); } } for (int keyPos = 0; keyPos < keyProjection.length; keyPos++) { assert physicalKeyRow != null; producedRow.setField(keyProjection[keyPos], physicalKeyRow.getField(keyPos)); } for (int metadataPos = 0; metadataPos < metadataArity; metadataPos++) { producedRow.setField(physicalArity + metadataPos, metadataConverters[metadataPos].read(inputMessage)); } outputCollector.collect(producedRow); } } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy