All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.dasasian.chok.node.Node Maven / Gradle / Ivy

There is a newer version: 1.7
Show newest version
/**
 * Copyright (C) 2014 Dasasian ([email protected])
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *         http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.dasasian.chok.node;

import com.dasasian.chok.node.monitor.IMonitor;
import com.dasasian.chok.operation.node.NodeOperation;
import com.dasasian.chok.operation.node.OperationResult;
import com.dasasian.chok.operation.node.ShardRedeployOperation;
import com.dasasian.chok.protocol.ConnectedComponent;
import com.dasasian.chok.protocol.InteractionProtocol;
import com.dasasian.chok.protocol.NodeQueue;
import com.dasasian.chok.protocol.metadata.NodeMetaData;
import com.dasasian.chok.util.NodeConfiguration;
import com.dasasian.chok.util.ThrottledInputStream.ThrottleSemaphore;
import org.I0Itec.zkclient.ExceptionUtil;
import org.I0Itec.zkclient.NetworkUtil;
import org.I0Itec.zkclient.exception.ZkInterruptedException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.ipc.RPC;
import org.apache.hadoop.ipc.RPC.Server;
import org.apache.log4j.Logger;

import java.io.File;
import java.io.IOException;
import java.net.BindException;
import java.util.Collection;

public class Node implements ConnectedComponent {

    protected final static Logger LOG = Logger.getLogger(Node.class);
    private final NodeConfiguration nodeConfiguration;
    private final IContentServer contentServer;
    protected InteractionProtocol protocol;
    protected NodeContext context;
    protected String nodeName;
    private Server rpcServer;
    private IMonitor monitor;
    private Thread nodeOperatorThread;
    private boolean stopped;

    public Node(InteractionProtocol protocol, final NodeConfiguration configuration, IContentServer contentServer) {
        this.protocol = protocol;
        this.contentServer = contentServer;
        if (contentServer == null) {
            throw new IllegalArgumentException("Null server passed to Node()");
        }
        nodeConfiguration = configuration;
    }

    /*
     * Starting the hadoop RPC server that response to query requests. We iterate
     * over a port range of node.server.port.start + 10000
     */
    private static Server startRPCServer(String hostName, final int startPort, IContentServer nodeManaged, int handlerCount) {
        int serverPort = startPort;
        int tryCount = 10000;
        Server rpcServer = null;
        while (rpcServer == null) {
            try {
                rpcServer = RPC.getServer(nodeManaged, "0.0.0.0", serverPort, handlerCount, false, new Configuration());
                LOG.info(nodeManaged.getClass().getSimpleName() + " server started on : " + hostName + ":" + serverPort);
            } catch (final BindException e) {
                if (serverPort - startPort < tryCount) {
                    serverPort++;
                    // try again
                } else {
                    throw new RuntimeException("tried " + tryCount + " ports and no one is free...");
                }
            } catch (final IOException e) {
                throw new RuntimeException("unable to create rpc server", e);
            }
        }
        rpcServer.start();
        return rpcServer;
    }

    /**
     * Boots the node
     */
    public void start() {
        if (stopped) {
            throw new IllegalStateException("Node cannot be started again after it was shutdown.");
        }
        LOG.info("starting rpc server with  server class = " + contentServer.getClass().getCanonicalName());
        String hostName = NetworkUtil.getLocalhostName();
        rpcServer = startRPCServer(hostName, nodeConfiguration.getStartPort(), contentServer, nodeConfiguration.getRpcHandlerCount());
        nodeName = hostName + ":" + rpcServer.getListenerAddress().getPort();
        contentServer.init(nodeName, nodeConfiguration);

        // we add hostName and port to the shardFolder to allow multiple nodes per
        // server with the same configuration
        File shardsFolder = new File(nodeConfiguration.getShardFolder(), nodeName.replaceAll(":", "_"));
        LOG.info("local shard folder: " + shardsFolder.getAbsolutePath());
        int throttleInKbPerSec = nodeConfiguration.getShardDeployThrottle();
        final ShardManager shardManager;
        if (throttleInKbPerSec > 0) {
            LOG.info("throttling of shard deployment to " + throttleInKbPerSec + " kilo-bytes per second");
            shardManager = new ShardManager(shardsFolder, new ThrottleSemaphore(throttleInKbPerSec * 1024));
        } else {
            shardManager = new ShardManager(shardsFolder);
        }
        context = new NodeContext(protocol, this, shardManager, contentServer);
        protocol.registerComponent(this);

        startMonitor(nodeName, nodeConfiguration);
        init();
        LOG.info("started node '" + nodeName + "'");
    }

    private void init() {
        redeployInstalledShards();
        NodeMetaData nodeMetaData = new NodeMetaData(nodeName);
        NodeQueue nodeOperationQueue = protocol.publishNode(this, nodeMetaData);
        startOperatorThread(nodeOperationQueue);
    }

    private void startOperatorThread(NodeQueue nodeOperationQueue) {
        nodeOperatorThread = new Thread(new NodeOperationProcessor(nodeOperationQueue, context));
        nodeOperatorThread.setName(NodeOperationProcessor.class.getSimpleName() + ": " + getName());
        nodeOperatorThread.setDaemon(true);
        nodeOperatorThread.start();
    }

    @Override
    public synchronized void reconnect() {
        LOG.info(nodeName + " reconnected");
        init();
    }

    @Override
    public synchronized void disconnect() {
        LOG.info(nodeName + " disconnected");
        try {
            do {
                LOG.info("trying to stop node-processor...");
                nodeOperatorThread.interrupt();
                nodeOperatorThread.join(2500);
            } while (nodeOperatorThread.isAlive());
        } catch (InterruptedException e) {
            Thread.interrupted();
        }
        // we keep serving the shards
    }

    private void redeployInstalledShards() {
        Collection installedShards = context.getShardManager().getInstalledShards();
        ShardRedeployOperation redeployOperation = new ShardRedeployOperation(installedShards);
        try {
            redeployOperation.execute(context);
        } catch (InterruptedException e) {
            ExceptionUtil.convertToRuntimeException(e);
        }
    }

    private void startMonitor(String nodeName, NodeConfiguration conf) {
        if (LOG.isTraceEnabled()) {
            LOG.trace("starting node monitor");
        }
        try {
            Class monitorClass = conf.getMonitorClass();
            monitor = monitorClass.newInstance();
            monitor.startMonitoring(nodeName, protocol);
        } catch (Exception e) {
            LOG.error("Unable to start node monitor:", e);
        }
    }

    public void shutdown() {
        if (stopped) {
            throw new IllegalStateException("already stopped");
        }
        LOG.info("shutdown " + nodeName + " ...");
        stopped = true;

        if (monitor != null) {
            monitor.stopMonitoring();
        }
        nodeOperatorThread.interrupt();
        try {
            nodeOperatorThread.join();
        } catch (InterruptedException e) {
            Thread.interrupted();// proceed
        }

        protocol.unregisterComponent(this);
        rpcServer.stop();
        try {
            context.getContentServer().shutdown();
        } catch (Throwable t) {
            LOG.error("Error shutting down server", t);
        }
        LOG.info("shutdown " + nodeName + " finished");
    }

    public String getName() {
        return nodeName;
    }

    public NodeContext getContext() {
        return context;
    }

    public int getRPCServerPort() {
        return rpcServer.getListenerAddress().getPort();
    }

    public boolean isRunning() {
        // TODO jz: improve this whole start/stop/isRunning thing
        return context != null && !stopped;
    }

    public void join() throws InterruptedException {
        rpcServer.join();
    }

    public Server getRpcServer() {
        return rpcServer;
    }

    @Override
    protected void finalize() throws Throwable {
        super.finalize();
        shutdown();
    }

    @Override
    public String toString() {
        return nodeName;
    }

    public InteractionProtocol getProtocol() {
        return protocol;
    }

    public NodeConfiguration getNodeConfiguration() {
        return nodeConfiguration;
    }

    protected static class NodeOperationProcessor implements Runnable {

        private final NodeQueue _queue;
        private final NodeContext _nodeContext;

        public NodeOperationProcessor(NodeQueue queue, NodeContext nodeContext) {
            _queue = queue;
            _nodeContext = nodeContext;
        }

        @Override
        public void run() {
            try {
                while (_nodeContext.getNode().isRunning()) {
                    try {
                        NodeOperation operation = _queue.peek();
                        OperationResult operationResult = null;
                        try {
                            LOG.info("executing " + operation);
                            operationResult = operation.execute(_nodeContext);
                        } catch (Exception e) {
                            LOG.error(_nodeContext.getNode().getName() + ": failed to execute " + operation, e);
                            operationResult = new OperationResult(_nodeContext.getNode().getName(), e);
                            ExceptionUtil.rethrowInterruptedException(e);
                        } finally {
                            _queue.complete(operationResult);// only remove after finish
                        }
                    } catch (Throwable e) {
                        ExceptionUtil.rethrowInterruptedException(e);
                        LOG.fatal(_nodeContext.getNode().getName() + ": operation failure ", e);
                    }
                }
            } catch (InterruptedException | ZkInterruptedException e) {
                Thread.interrupted();
            }
            LOG.info("node operation processor for " + _nodeContext.getNode().getName() + " stopped");
        }
    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy