All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.finos.tracdap.common.data.pipeline.GrpcUploadSource Maven / Gradle / Ivy

Go to download

TRAC D.A.P. data library, interfaces and core functionality for working with primary data

The newest version!
/*
 * Licensed to the Fintech Open Source Foundation (FINOS) under one or
 * more contributor license agreements. See the NOTICE file distributed
 * with this work for additional information regarding copyright ownership.
 * FINOS licenses this file to you under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with the
 * License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.finos.tracdap.common.data.pipeline;

import org.finos.tracdap.common.data.util.Bytes;
import org.finos.tracdap.common.exception.ETracInternal;
import org.finos.tracdap.common.exception.EUnexpected;

import com.google.protobuf.ByteString;
import io.grpc.stub.ServerCallStreamObserver;
import io.grpc.stub.StreamObserver;
import org.apache.arrow.memory.ArrowBuf;
import org.apache.arrow.memory.BufferAllocator;

import java.util.concurrent.CompletableFuture;
import java.util.concurrent.CompletionStage;
import java.util.concurrent.Flow;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.function.Function;


public class GrpcUploadSource {

    // Source stream class for handling file / data uploads
    // The pattern is one message with metadata followed by a stream of content
    // The first message may also contain content

    // This class is intended as a very simple pass-through,
    // from a gRPC event stream to the data pipeline event stream

    private final ServerCallStreamObserver response;
    private final StreamObserver request;
    private final CompletableFuture firstMessage;
    private Flow.Subscriber subscriber;
    private Flow.Subscription subscription;
    private Runnable cleanup;

    private boolean requestedFirst;
    private boolean sentFirst;
    private boolean grpcComplete;

    @SuppressWarnings("unused") // Request class is needed to infer types for the upload source
    public GrpcUploadSource(Class requestClass, StreamObserver response) {

        if (!(response instanceof ServerCallStreamObserver))
            throw new EUnexpected();

        this.response = (ServerCallStreamObserver) response;
        this.response.disableAutoInboundFlowControl();
        this.response.setOnCancelHandler(this::apiOnCancel);

        this.request = new UploadRequestObserver();
        this.firstMessage = new CompletableFuture<>();
    }


    // Setup

    public void whenComplete(Runnable cleanup) {
        this.cleanup = cleanup;
    }

    public StreamObserver start() {
        response.request(1);
        return request;
    }

    public void succeeded(TResponse result) {

        try {
            response.onNext(result);
            response.onCompleted();
        }
        finally {
            if (cleanup != null)
                cleanup.run();
        }
    }

    public Void failed(Throwable error) {

        try {
            response.onError(error);
            return null;
        }
        finally {
            if (cleanup != null)
                cleanup.run();
        }
    }

    public CompletionStage firstMessage() {
        return firstMessage;
    }

    public Flow.Publisher dataStream(Function accessor, BufferAllocator allocator) {
        return new UploadPublisher(accessor, allocator);
    }


    // Stream event handlers

    private void apiOnNext(TRequest value) {

        if (!firstMessage.isDone()) {

            firstMessage.complete(value);

            if (requestedFirst) {

                sentFirst = true;
                subscriber.onNext(value);

                if (grpcComplete)
                    subscriber.onComplete();
            }
        }
        else {

            subscriber.onNext(value);
        }
    }

    private void apiOnComplete() {

        if (!firstMessage.isDone()) {

            // Should never happen, gRPC will always send onNext before onComplete
            firstMessage.completeExceptionally(new EUnexpected());
        }
        else {

            // Sometimes the incoming stream has just one message
            // Then onComplete might fire before the data stream is set up
            // If this happens, record the complete signal to send with the first message

            if (subscriber != null)
                subscriber.onComplete();
            else
                grpcComplete = true;
        }
    }

    private void apiOnError(Throwable error) {

        if (!firstMessage.isDone()) {

            firstMessage.completeExceptionally(error);

            if (requestedFirst) {
                sentFirst = true;
                subscriber.onError(error);
            }
        }
        else {

            subscriber.onError(error);
        }
    }

    private void apiOnCancel() {
        // TODO: Cancel not implemented yet
    }

    private void pipelineSubscribe(Flow.Subscriber subscriber) {

        if (subscription != null)
            throw new ETracInternal("Upload source is already subscribed");

        this.subscription = new UploadSubscription();
        this.subscriber = subscriber;
        this.subscriber.onSubscribe(subscription);
    }

    private void pipelineRequest(long n) {

        // The first message has already been received when the pipe starts and may contain data content
        // It is also possible the stream completed already (if there was just a single message),
        // or that an error occurred before the first message was received

        if (!sentFirst && firstMessage.isDone()) {

            sentFirst = true;

            try {

                subscriber.onNext(firstMessage.getNow(null));

                if (grpcComplete)
                    subscriber.onComplete();
            }
            catch (Throwable e) {

                subscriber.onError(e);
            }
        }

        // One message was already requested by start(), don't pump more messages than requested

        if (!requestedFirst) {
            requestedFirst = true;
            if (n > 1)
                response.request((int) n - 1);
        }
        else
            response.request((int) n);
    }

    private void pipelineCancel() {
        // TODO: Cancel not implemented yet
    }


    // Wrapper classes for the gRPC and data pipeline interfaces

    private class UploadRequestObserver implements StreamObserver {

        @Override
        public void onNext(TRequest value) {
            apiOnNext(value);
        }

        @Override
        public void onError(Throwable t) {
            apiOnError(t);
        }

        @Override
        public void onCompleted() {
            apiOnComplete();
        }
    }

    private class UploadPublisher implements Flow.Processor {

        private static final int DEFAULT_CHUNK_SIZE = 2 * 1024 * 1024;

        private final Function accessor;
        private final BufferAllocator allocator;

        private Flow.Subscriber subscriber;
        private ArrowBuf buffer;

        public UploadPublisher(Function accessor, BufferAllocator allocator) {
            this.accessor = accessor;
            this.allocator = allocator;
        }

        @Override
        public void subscribe(Flow.Subscriber subscriber) {
            this.subscriber = subscriber;
            pipelineSubscribe(this);
        }

        @Override
        public void onSubscribe(Flow.Subscription subscription) {
            subscriber.onSubscribe(subscription);
        }

        @Override
        public void onNext(TRequest item) {

            try {
                var bytes = accessor.apply(item).asReadOnlyByteBuffer();

                // TODO: Simplify this

                var sent = new AtomicBoolean(false);

                buffer = Bytes.writeToStream(
                        bytes, buffer, allocator,
                        DEFAULT_CHUNK_SIZE,
                        x -> { sent.set(true); subscriber.onNext(x); });

                if (! sent.get())
                    subscription.request(1);
            }
            catch (Exception e) {
                buffer = Bytes.closeStream(buffer);
                throw e;
            }
        }

        @Override
        public void onError(Throwable throwable) {

            try {
                subscriber.onError(throwable);
            }
            finally {
                buffer = Bytes.closeStream(buffer);
            }
        }

        @Override
        public void onComplete() {

            try {
                buffer = Bytes.flushStream(buffer, subscriber::onNext);
                subscriber.onComplete();
            }
            finally {
                buffer = Bytes.closeStream(buffer);
            }
        }
    }

    private class UploadSubscription implements Flow.Subscription {

        @Override
        public void request(long n) {
            pipelineRequest(n);
        }

        @Override
        public void cancel() {
            pipelineCancel();
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy