All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.reacted.drivers.channels.grpc.GrpcDriver Maven / Gradle / Ivy

/*
 * Copyright (c) 2020 ,  [ [email protected] ]
 * All rights reserved.
 *
 * This source code is licensed under the BSD-style license found in the
 * LICENSE file in the root directory of this source tree.
 */

package io.reacted.drivers.channels.grpc;

import com.google.common.util.concurrent.ThreadFactoryBuilder;
import com.google.protobuf.ByteString;
import com.google.protobuf.Empty;
import io.grpc.CallOptions;
import io.grpc.Channel;
import io.grpc.ClientCall;
import io.grpc.ClientInterceptor;
import io.grpc.ForwardingClientCall;
import io.grpc.ForwardingClientCallListener;
import io.grpc.ManagedChannel;
import io.grpc.ManagedChannelBuilder;
import io.grpc.Metadata;
import io.grpc.MethodDescriptor;
import io.grpc.Server;
import io.grpc.Status;
import io.grpc.netty.NettyServerBuilder;
import io.grpc.services.HealthStatusManager;
import io.grpc.stub.StreamObserver;
import io.netty.channel.EventLoopGroup;
import io.netty.channel.nio.NioEventLoopGroup;
import io.netty.channel.socket.nio.NioServerSocketChannel;
import io.reacted.core.config.ChannelId;
import io.reacted.core.config.drivers.ChannelDriverConfig;
import io.reacted.core.drivers.DriverCtx;
import io.reacted.core.drivers.system.RemotingDriver;
import io.reacted.core.messages.Message;
import io.reacted.core.messages.reactors.DeliveryStatus;
import io.reacted.core.reactorsystem.ReActorContext;
import io.reacted.core.reactorsystem.ReActorSystem;
import io.reacted.patterns.NonNullByDefault;
import io.reacted.patterns.ObjectUtils;
import io.reacted.patterns.Try;
import io.reacted.patterns.UnChecked;
import java.io.ByteArrayInputStream;
import java.io.ByteArrayOutputStream;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
import java.net.InetSocketAddress;
import java.util.Map;
import java.util.Objects;
import java.util.Properties;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.Executor;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.function.Function;
import javax.annotation.Nullable;

@NonNullByDefault
public class GrpcDriver extends RemotingDriver {
    private final Map> gatesStubs;
    private final ChannelId channelId;
    @Nullable
    private Server grpcServer;
    @Nullable
    private ExecutorService grpcServerExecutor;
    @Nullable
    private ExecutorService grpcClientExecutor;
    @Nullable
    private EventLoopGroup workerEventLoopGroup;
    @Nullable
    private EventLoopGroup bossEventLoopGroup;


    public GrpcDriver(GrpcDriverConfig grpcDriverConfig) {
        super(grpcDriverConfig);
        this.gatesStubs = new ConcurrentHashMap<>(1000, 0.5f);
        this.channelId = ChannelId.ChannelType.GRPC.forChannelName(grpcDriverConfig.getChannelName());
    }

    @Override
    public void initDriverLoop(ReActorSystem localReActorSystem) {
        DriverCtx grpcDriverCtx = REACTOR_SYSTEM_CTX.get();
        this.grpcServerExecutor = Executors.newFixedThreadPool(3, new ThreadFactoryBuilder()
                .setUncaughtExceptionHandler((thread, throwable) -> localReActorSystem.logError("Uncaught exception in {}",
                                                                                                thread.getName(), throwable))
                .setNameFormat("Grpc-Server-Executor-" + grpcDriverCtx.getLocalReActorSystem().getLocalReActorSystemId()
                                                                      .getReActorSystemName() + "-%d")
                .build());
        this.grpcClientExecutor = Executors.newFixedThreadPool(1, new ThreadFactoryBuilder()
                .setUncaughtExceptionHandler((thread, throwable) -> localReActorSystem.logError("Uncaught exception in {}",
                                                                                                thread.getName(), throwable))
                .setNameFormat("Grpc-Client-Executor-" + grpcDriverCtx.getLocalReActorSystem().getLocalReActorSystemId()
                                                                      .getReActorSystemName() + "-%d")
                .build());
        this.grpcClientExecutor.submit(() -> REACTOR_SYSTEM_CTX.set(grpcDriverCtx));
        this.workerEventLoopGroup = new NioEventLoopGroup(2);
        this.bossEventLoopGroup = new NioEventLoopGroup(1);
        this.grpcServer = NettyServerBuilder.forAddress(new InetSocketAddress(getDriverConfig().getHostName(),
                                                                              getDriverConfig().getPort()))
                                            .channelType(NioServerSocketChannel.class)
                                            .executor(grpcServerExecutor)
                                            .bossEventLoopGroup(bossEventLoopGroup)
                                            .workerEventLoopGroup(workerEventLoopGroup)
                                            .permitKeepAliveWithoutCalls(true)
                                            .permitKeepAliveTime(6, TimeUnit.MINUTES)
                                            .addService(new HealthStatusManager().getHealthService())
                                            .addService(new GrpcServer(this))
                                            .build();
    }

    @Override
    public CompletableFuture> cleanDriverLoop() {
        Objects.requireNonNull(grpcServer).shutdown();
        Try.of(() -> grpcServer.awaitTermination(5, TimeUnit.SECONDS))
           .ifError(error -> Thread.currentThread().interrupt());
        gatesStubs.values()
                  .forEach(linkContainer -> Try.of(() -> linkContainer.channel.shutdown()
                                                                              .awaitTermination(5, TimeUnit.SECONDS))
                                               .ifError(error -> Thread.currentThread().interrupt()));
        if (bossEventLoopGroup != null) {
            bossEventLoopGroup.shutdownGracefully();
        }
        if (workerEventLoopGroup != null) {
            workerEventLoopGroup.shutdownGracefully();
        }
        if (grpcServerExecutor != null) {
            grpcServerExecutor.shutdown();
        }
        if (grpcClientExecutor != null) {
            grpcClientExecutor.shutdown();
        }
        gatesStubs.clear();
        return CompletableFuture.completedFuture(Try.ofSuccess(null));
    }

    @Override
    public UnChecked.CheckedRunnable getDriverLoop() {
        return () -> Objects.requireNonNull(grpcServer).start();
    }

    @Override
    public ChannelId getChannelId() { return channelId; }

    @Override
    public DeliveryStatus sendMessage(ReActorContext destination, Message message) {
        Properties dstChannelIdProperties = message.getDestination().getReActorSystemRef().getGateProperties();
        String dstChannelIdName = dstChannelIdProperties.getProperty(ChannelDriverConfig.CHANNEL_ID_PROPERTY_NAME);
        /*
            Fact 1: GRPC links are not bidirectional.
            Fact 2: Every couple Channel Type - Channel Name (Aka channel id) has a dedicated driver instance.
                    To communicate with another reacted node, you need to know the channel id and the channel properties.
                    If some nodes communicate on a channel using the same setup that can be safely stored within
                    the driver instance (i.e. think about a kafka channel:  all the nodes will use the same kafka
                    coordinates) this is not true for GRPC where every node might be on a different ip address / port
            Fact 3: Give the above 2 facts, it means that in order to send a message to a GRPC node, you not only
                    need a driver instance, but also the specific properties of the remote peer.
            Fact 4: On network failures, one route might be canceled. Canceling a route means canceling from the
                    reactor system the information about how to reach a given peer. This information include the
                    channel properties for the remote peer

            Scenario: a message that requires an ACK arrives at this GRPC driver, but a network failure triggered
            the route cancellation before we can send back the ACK.

            ACKs has to be sent using the same driver that processed the incoming message and have to be sent to the
            GENERATING reactor system from datalink layer, not from the nominal sender. If a nominal sender can be
            overridden, a generating reactor system id cannot. This means that an ACK has to be sent to the
            generating reactor system, using the same driver from where the message came from and using the channel id
            managed by the receiving driver.

            For GRPC this is not enough, because we need the properties containing the specific info of the remote
            peer. These info are not sent within the datalink message, so the peer that wants to reply to a message
            (such as sending an ACK) has to retrieve them from the reactor system.

            If a network outage triggers a route unregister, we might still have some reactor references pointing
            to the supposedly dead reactor system or some messages coming from there might still need to be ACKed.

            A route unregister deletes the info regarding how to reach a given reactor system via a specific channel.
            If the route that gets unregistered is grpc, it means that a reactor system does not hold anymore any
            information about how to reach the remote peer using grpc.

            ReActed when a reply has to be sent, sets properly the ReActorSystemRef with the gate and the channel id
            that should be used (that are the same of this driver instance because of what described above), but
            if it cannot find the properties for the remote host (because the channel went offline and got unregistered)
            it simply cannot fill them.

            That said, if an ACK has to be sent back with grpc, the details about Channel Type (the driver type) and
            the channel name are still valid, but the properties are missing. Without the properties there is not much
            that can be done except returning an error
         */
        if (dstChannelIdName == null) {
            getLocalReActorSystem().logDebug("Not sending message. Destination channel is no longer available for message {}",
                                             message.toString());
            return DeliveryStatus.NOT_SENT;
        }

        SystemLinkContainer grpcLink;
        var peerChannelKey = getChannelPeerKey(dstChannelIdProperties.getProperty(GrpcDriverConfig.GRPC_HOST),
                                               dstChannelIdProperties.getProperty(GrpcDriverConfig.GRPC_PORT));
        grpcLink = gatesStubs.computeIfAbsent(peerChannelKey,
                                              newPeerChannelKey -> SystemLinkContainer.ofChannel(getNewChannel(dstChannelIdProperties,
                                                                                                               Objects.requireNonNull(grpcClientExecutor),
                                                                                                               () -> removeStaleChannel(newPeerChannelKey)),
                                                                                                 ReActedLinkGrpc::newStub,
                                                                                                 stub -> stub.link(getEmptyMessageHandler(getLocalReActorSystem()))));

        var byteArray = new ByteArrayOutputStream();

        try(ObjectOutputStream oos = new ObjectOutputStream(byteArray)) {
            oos.writeObject(message);
            var payload = ReActedLinkProtocol.ReActedDatagram.newBuilder()
                                                             .setBinaryPayload(ByteString.copyFrom(byteArray.toByteArray()))
                                                             .build();
            //noinspection SynchronizationOnLocalVariableOrMethodParameter
            synchronized (grpcLink) {
                grpcLink.link.onNext(payload);
            }
            return DeliveryStatus.SENT;

        } catch (Exception error) {
            removeStaleChannel(peerChannelKey);
            getLocalReActorSystem().logError("Error sending message {}", message.toString(), error);
            return DeliveryStatus.NOT_SENT;
        }
    }

    @Override
    public Properties getChannelProperties() { return getDriverConfig().getChannelProperties(); }

    private void removeStaleChannel(String peerChannelKey) {
        ObjectUtils.ifNotNull(this.gatesStubs.remove(peerChannelKey),
                              linkContainer -> linkContainer.channel.shutdownNow());
    }
    private static ManagedChannel getNewChannel(Properties channelIdProperties, Executor grpcExecutor,
                                                Runnable onCloseCleanup) {
        int port = Integer.parseInt(channelIdProperties.getProperty(GrpcDriverConfig.GRPC_PORT));
        String host = channelIdProperties.getProperty(GrpcDriverConfig.GRPC_HOST);
        return ManagedChannelBuilder.forAddress(host, port)
                                    .keepAliveTime(6, TimeUnit.MINUTES)
                                    .keepAliveWithoutCalls(true)
                                    .enableRetry()
                                    .usePlaintext()
                                    .executor(grpcExecutor)
                                    .intercept(newStreamClosureDetector(onCloseCleanup))
                                    .build();
    }
    private static String getChannelPeerKey(String peerHostname, String peerPort) {
        return peerHostname + "|" + peerPort;
    }
    private static class GrpcServer extends ReActedLinkGrpc.ReActedLinkImplBase {
        private final GrpcDriver thisDriver;

        public GrpcServer(GrpcDriver thisDriver) {
            this.thisDriver = thisDriver;
        }
        @Override
        public StreamObserver link(StreamObserver responseObserver) {
            return new StreamObserver<>() {
                @Override
                public void onNext(ReActedLinkProtocol.ReActedDatagram reActedDatagram) {
                    try (ObjectInputStream msgSource = new ObjectInputStream(new ByteArrayInputStream(reActedDatagram.getBinaryPayload()
                                                                                                                     .toByteArray()))) {
                        thisDriver.offerMessage((Message)msgSource.readObject());
                    } catch (Exception deserializationError) {
                        thisDriver.getLocalReActorSystem()
                                  .logError("Error decoding message", deserializationError);
                    }
                }

                @Override
                public void onError(Throwable throwable) {
                    thisDriver.getLocalReActorSystem()
                              .logError(GrpcDriver.class.getSimpleName() + " grpc error:", throwable);
                }

                @Override
                public void onCompleted() { }
            };
        }
    }
    private static ClientInterceptor newStreamClosureDetector(Runnable onStreamClosed) {
        return new ClientInterceptor() {
            @Override
            public  ClientCall
            interceptCall(MethodDescriptor methodDescriptor, CallOptions callOptions, Channel channel) {
                return new ForwardingClientCall.SimpleForwardingClientCall<>(channel.newCall(methodDescriptor,
                                                                                             callOptions)) {
                    @Override
                    public void start(Listener responseListener, Metadata headers) {
                        delegate().start(new ForwardingClientCallListener.SimpleForwardingClientCallListener<>(responseListener) {
                            @Override
                            public void onClose(Status status, Metadata trailers) {
                                super.onClose(status, trailers);
                                onStreamClosed.run();
                            }
                        }, headers);
                    }
                };
            }
        };
    }
    private static StreamObserver getEmptyMessageHandler(ReActorSystem localReActorSystem) {
        return new StreamObserver<>() {
            @Override
            public void onNext(Empty empty) { }

            @Override
            public void onError(Throwable throwable) {
                localReActorSystem.logError("Unable to communicate with the remote host", throwable);
            }

            @Override
            public void onCompleted() { }
        };
    }

    private record SystemLinkContainer(ManagedChannel channel, StreamObserver link) {
        private static 
            SystemLinkContainer ofChannel(ManagedChannel channel, Function toStub,
                                                      Function> toLink) {
                return new SystemLinkContainer<>(channel, toLink.apply(toStub.apply(channel)));
            }
        }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy