package com.pinterest.doctorkafka.util;


import com.google.common.net.HostAndPort;
import com.pinterest.doctorkafka.BrokerStats;

import org.apache.commons.lang3.tuple.MutablePair;

import kafka.api.FetchRequest;
import kafka.api.FetchRequestBuilder;
import kafka.api.FetchResponse;
import kafka.api.Request;
import kafka.cluster.Broker;
import kafka.common.TopicAndPartition;
import kafka.consumer.ConsumerConfig;
import kafka.consumer.SimpleConsumer;
import kafka.message.MessageSet;
import kafka.utils.ZkUtils;
import org.I0Itec.zkclient.ZkClient;
import org.I0Itec.zkclient.ZkConnection;
import org.apache.avro.Schema;
import org.apache.avro.io.BinaryDecoder;
import org.apache.avro.io.DecoderFactory;
import org.apache.avro.specific.SpecificDatumReader;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.apache.kafka.clients.consumer.KafkaConsumer;
import org.apache.kafka.clients.producer.ProducerConfig;
import org.apache.kafka.common.network.ListenerName;
import org.apache.kafka.common.security.auth.SecurityProtocol;
import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;
import scala.Tuple2;
import scala.collection.Seq;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.InetAddress;
import java.net.InetSocketAddress;
import java.net.Socket;
import java.net.UnknownHostException;
import java.util.Arrays;
import java.util.Collections;
import java.util.HashMap;
import java.util.LinkedHashMap;
import java.util.Map;
import java.util.Properties;
import java.util.stream.Collectors;
import javax.management.MBeanServerConnection;
import javax.management.remote.JMXConnector;
import javax.management.remote.JMXConnectorFactory;
import javax.management.remote.JMXServiceURL;

public class OperatorUtil {

  private static final Logger LOG = LogManager.getLogger(OperatorUtil.class);
  public static final int WINDOW_SIZE = 6000;
  public static final String HostName = getHostname();
  private static final DecoderFactory avroDecoderFactory = DecoderFactory.get();
  private static final String FETCH_CLIENT_NAME = "DoctorKafka";
  private static final int FETCH_SOCKET_TIMEOUT = 10 * 1000;
  private static final int FETCH_BUFFER_SIZE = 4 * 1024 * 1024;
  private static final int FETCH_RETRIES = 3;
  private static final int FETCH_MAX_WAIT_MS = 1; // same wait as SimpleConsumerShell
  // Reuse the reader to improve performance
  private static final SpecificDatumReader<BrokerStats> brokerStatsReader =
      new SpecificDatumReader<>(BrokerStats.getClassSchema());

  public static String getHostname() {
    String hostName;
    try {
      hostName = InetAddress.getLocalHost().getHostName();
      int firstDotPos = hostName.indexOf('.');
      if (firstDotPos > 0) {
        hostName = hostName.substring(0, firstDotPos);
      }
    } catch (Exception e) {
      // fall back to env var.
      hostName = System.getenv("HOSTNAME");
    }
    return hostName;
  }

  /**
   * Get an MBeanServerConnection object. Return null if there is any failure.
   */
  public static MBeanServerConnection getMBeanServerConnection(String host, String jmxPort) {
    MBeanServerConnection mbs = null;
    try {
      Map<String, Object> env = new HashMap<>();
      JMXServiceURL address = new JMXServiceURL(
          "service:jmx:rmi://" + host + "/jndi/rmi://" + host + ":" + jmxPort + "/jmxrmi");
      JMXConnector connector = JMXConnectorFactory.connect(address, env);
      mbs = connector.getMBeanServerConnection();
    } catch (Exception e) {
      LOG.error("Failed to connect to MBeanServer {}:{}", HostName, jmxPort, e);
    }
    return mbs;
  }
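
  // Illustrative usage sketch (host and JMX port below are hypothetical, not from the original source):
  //   MBeanServerConnection conn = OperatorUtil.getMBeanServerConnection("broker-1.example.com", "9999");
  //   if (conn != null) {
  //     // query broker MBeans, e.g. kafka.server:type=BrokerTopicMetrics,name=BytesInPerSec
  //   }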


  public static boolean pingKafkaBroker(String host, int port, int timeout) {
    try (Socket socket = new Socket()) {
      socket.connect(new InetSocketAddress(host, port), timeout);
      return true;
    } catch (UnknownHostException e) {
      LOG.warn("Ping failure, host: " + host, e);
      return false;
    } catch (IOException e) {
      LOG.warn("Ping failure IO, host: " + host, e);
      return false; // Either timeout or unreachable or failed DNS lookup.
    }
  }
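
  // Illustrative usage sketch (hypothetical host and port, 5-second connect timeout):
  //   boolean reachable = OperatorUtil.pingKafkaBroker("broker-1.example.com", 9092, 5000);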

  public static boolean canFetchData(String host, int port, String topic, int partition) {
    LOG.info("Fetching data from host {}, topic {}, partition {}", host, topic, partition);
    SimpleConsumer consumer = new SimpleConsumer(host, port,
        FETCH_SOCKET_TIMEOUT, ConsumerConfig.SocketBufferSize(), FETCH_CLIENT_NAME);
    try {
      long earlyOffset = getOffset(consumer, topic, partition,
          kafka.api.OffsetRequest.EarliestTime());
      long latestOffset = getOffset(consumer, topic, partition,
          kafka.api.OffsetRequest.LatestTime());
      long readOffset = (earlyOffset + latestOffset) / 2;
      LOG.info("earlyOffset: " + earlyOffset + " latestOffset: " + latestOffset +
          " readOffset: " + readOffset);
      for (int i = 0; i < FETCH_RETRIES; i++) {
        FetchRequest req = new FetchRequestBuilder()
            .clientId(FETCH_CLIENT_NAME)
            .replicaId(Request.DebuggingConsumerId()) // this consumer id enables reads from followers
            .maxWait(FETCH_MAX_WAIT_MS)
            .minBytes(ConsumerConfig.MinFetchBytes())
            .addFetch(topic, partition, readOffset, FETCH_BUFFER_SIZE)
            .build();
        try {
          FetchResponse response = consumer.fetch(req);

          if (response.hasError()) {
            String errMsg = "Error fetching Data. ErrorCode: " + response.error(topic, partition);
            LOG.warn(errMsg);
          } else {
            MessageSet msgSet = response.messageSet(topic, partition);
            if (msgSet.sizeInBytes() <= 0) {
              if (earlyOffset == latestOffset) {
                LOG.warn("Passed. No data in partition.  Fetching data from host {}, topic {}, partition {}",
                    host, topic, partition);
                return true;
              } else {
                LOG.warn("host: " + host + " topic: " + topic + " par: " + partition +
                    " Not enough bytes: {}", msgSet.sizeInBytes());
              }
            } else {
              LOG.info("Passed. Fetching data from host {}, topic {}, partition {}",
                  host, topic, partition);
              return true;
            }
          }
        } catch (Exception ex) {
          LOG.warn("For host: " + host + " Unexpected exception", ex);
        }
        try {
          Thread.sleep((long) (Math.random() * 3000));
        } catch (InterruptedException ex) {
          LOG.warn("Unexpected interruption", ex);
        }
      }
    } catch (IOException e) {
      LOG.warn("For host: " + host + " Unexpected exception", e);
    } finally {
      try {
        consumer.close();
      } catch (Exception e) {
        LOG.error("Unexpected exception in closing consumer", e);
      }
    }
    LOG.warn("Failed Fetching data from host {}, topic {}, parttion {}", host, topic, partition);
    return false;
  }
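
  // Illustrative usage sketch (broker, topic, and partition below are hypothetical):
  //   boolean healthy = OperatorUtil.canFetchData("broker-1.example.com", 9092, "brokerstats", 0);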

  public static long getOffset(SimpleConsumer consumer, String topic, int partition,
                               long whichTime) throws IOException {
    String errMsg = null;
    Exception lastEx = null;
    for (int i = 0; i < FETCH_RETRIES; i++) {
      TopicAndPartition topicAndPartition = new TopicAndPartition(topic, partition);
      try {
        long offset = consumer.earliestOrLatestOffset(topicAndPartition, whichTime,
            Request.DebuggingConsumerId());
        return offset;
      } catch (RuntimeException e) {
        lastEx = e;
        errMsg = "Failed to getting offset for topic: " + topic + " partition: " + partition
            + " host: " + consumer.host();
        LOG.warn(errMsg, e);
        try {
          Thread.sleep((long) (Math.random() * 3000));
        } catch (InterruptedException ex) {
          LOG.warn("Unexpected interruption", ex);
        }
      }
    }
    throw new IOException(errMsg, lastEx);
  }
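
  // Illustrative usage sketch: read the earliest available offset for a partition.
  // Host, topic, and partition are hypothetical; literal timeout/client-id values mirror
  // the constants defined above:
  //   SimpleConsumer consumer = new SimpleConsumer("broker-1.example.com", 9092,
  //       10 * 1000, ConsumerConfig.SocketBufferSize(), "DoctorKafka");
  //   long earliest = OperatorUtil.getOffset(consumer, "brokerstats", 0,
  //       kafka.api.OffsetRequest.EarliestTime());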

  private static Map<String, KafkaConsumer<byte[], byte[]>> kafkaConsumers = new HashMap<>();
  private static Map<String, ZkUtils> zkUtilsMap = new HashMap<>();

  public static ZkUtils getZkUtils(String zkUrl) {
    if (!zkUtilsMap.containsKey(zkUrl)) {
      Tuple2<ZkClient, ZkConnection> zkClientAndConnection =
          ZkUtils.createZkClientAndConnection(zkUrl, 30000, 3000000);

      ZkUtils zkUtils = new ZkUtils(zkClientAndConnection._1(), zkClientAndConnection._2(), true);
      zkUtilsMap.put(zkUrl, zkUtils);
    }
    return zkUtilsMap.get(zkUrl);
  }

  public static String getBrokers(String zkUrl, SecurityProtocol securityProtocol) {
    ZkUtils zkUtils = getZkUtils(zkUrl);
    Seq<Broker> brokersSeq = zkUtils.getAllBrokersInCluster();
    Broker[] brokers = new Broker[brokersSeq.size()];
    brokersSeq.copyToArray(brokers);

    String brokersStr = Arrays.stream(brokers)
        .map(b -> b.brokerEndPoint(
            ListenerName.forSecurityProtocol(securityProtocol)).connectionString())
        .reduce(null, (a, b) -> (a == null) ? b : a + "," + b);
    return brokersStr;
  }
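
  // Illustrative usage sketch (hypothetical ZooKeeper connect string); returns a
  // comma-separated bootstrap list such as "broker-1.example.com:9092,broker-2.example.com:9092":
  //   String bootstrapServers =
  //       OperatorUtil.getBrokers("zookeeper-1.example.com:2181/kafka", SecurityProtocol.PLAINTEXT);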

  public static Properties createKafkaProducerProperties(String zkUrl, SecurityProtocol securityProtocol) {
    String bootstrapBrokers = OperatorUtil.getBrokers(zkUrl, securityProtocol);
    Properties props = new Properties();
    props.put(KafkaUtils.BOOTSTRAP_SERVERS, bootstrapBrokers);
    props.put(ProducerConfig.ACKS_CONFIG, "1");
    props.put(ProducerConfig.RETRIES_CONFIG, 0);
    props.put(ProducerConfig.BATCH_SIZE_CONFIG, 1638400);
    props.put(ProducerConfig.BUFFER_MEMORY_CONFIG, 3554432);
    props.put(ProducerConfig.COMPRESSION_TYPE_CONFIG, "gzip");
    props.put(ProducerConfig.KEY_SERIALIZER_CLASS_CONFIG, "org.apache.kafka.common.serialization.ByteArraySerializer");
    props.put(ProducerConfig.VALUE_SERIALIZER_CLASS_CONFIG, "org.apache.kafka.common.serialization.ByteArraySerializer");
    return props;
  }
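
  // Illustrative usage sketch (hypothetical ZooKeeper connect string); the returned
  // properties are configured for a byte[]/byte[] producer, so they can back e.g.
  // a KafkaProducer<byte[], byte[]> (producer class not imported here):
  //   Properties producerProps = OperatorUtil.createKafkaProducerProperties(
  //       "zookeeper-1.example.com:2181/kafka", SecurityProtocol.PLAINTEXT);
  //   KafkaProducer<byte[], byte[]> producer = new KafkaProducer<>(producerProps);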


  public static Properties createKafkaConsumerProperties(String zkUrl, String consumerGroupName,
      SecurityProtocol securityProtocol, Map<String, String> consumerConfigs) {
    String bootstrapBrokers = OperatorUtil.getBrokers(zkUrl, securityProtocol);
    Properties props = new Properties();
    props.put(KafkaUtils.BOOTSTRAP_SERVERS, bootstrapBrokers);
    props.put("group.id", consumerGroupName);
    props.put("enable.auto.commit", "true");
    props.put("auto.commit.interval.ms", "1000");
    props.put("key.deserializer", "org.apache.kafka.common.serialization.ByteArrayDeserializer");
    props.put("value.deserializer", "org.apache.kafka.common.serialization.ByteArrayDeserializer");

    if (consumerConfigs != null) {
      for (Map.Entry<String, String> entry : consumerConfigs.entrySet()) {
        props.put(entry.getKey(), entry.getValue());
      }
    }
    return props;
  }
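
  // Illustrative usage sketch (hypothetical ZooKeeper URL and group name; the extra
  // config map is optional and may be null):
  //   Properties consumerProps = OperatorUtil.createKafkaConsumerProperties(
  //       "zookeeper-1.example.com:2181/kafka", "doctorkafka-example-group",
  //       SecurityProtocol.PLAINTEXT, null);
  //   KafkaConsumer<byte[], byte[]> consumer = new KafkaConsumer<>(consumerProps);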


  public static BrokerStats deserializeBrokerStats(ConsumerRecord<byte[], byte[]> record) {
    try {
      BinaryDecoder binaryDecoder = avroDecoderFactory.binaryDecoder(record.value(), null);
      BrokerStats stats = new BrokerStats();
      brokerStatsReader.read(stats, binaryDecoder);
      return stats;
    } catch (Exception e) {
      LOG.debug("Fail to decode an message", e);
      return null;
    }
  }
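
  // Illustrative usage sketch: decode Avro-encoded BrokerStats from byte[]-valued records.
  // The consumer, topic name, and poll loop below are hypothetical:
  //   for (ConsumerRecord<byte[], byte[]> rec : consumer.poll(1000).records("brokerstats")) {
  //     BrokerStats stats = OperatorUtil.deserializeBrokerStats(rec);
  //     if (stats != null) {
  //       // process stats
  //     }
  //   }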


  public static void startOstrichService(String serviceName, String tsdbHostPort, int ostrichPort) {
    final int TSDB_METRICS_PUSH_INTERVAL_IN_MILLISECONDS = 10 * 1000;
    OstrichAdminService ostrichService = new OstrichAdminService(ostrichPort);
    ostrichService.startAdminHttpService();
    if (tsdbHostPort != null) {
      LOG.info("Starting the OpenTsdb metrics pusher");
      try {
        HostAndPort pushHostPort = HostAndPort.fromString(tsdbHostPort);
        MetricsPusher metricsPusher = new MetricsPusher(
            pushHostPort.getHost(),
            pushHostPort.getPort(),
            new OpenTsdbMetricConverter(serviceName, HostName),
            TSDB_METRICS_PUSH_INTERVAL_IN_MILLISECONDS);
        metricsPusher.start();
        LOG.info("OpenTsdb metrics pusher started!");
      } catch (Throwable t) {
        // A metrics-pusher failure is non-fatal; continue without pushing metrics.
        LOG.error("Exception when starting stats pusher: ", t);
      }
    }
  }
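
  // Illustrative usage sketch (hypothetical service name, OpenTSDB host:port, and Ostrich port):
  //   OperatorUtil.startOstrichService("doctorkafka", "opentsdb.example.com:4242", 2051);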

  public static MutablePair<Long, Long> getProcNetDevStats() throws Exception {
    ProcessBuilder ps = new ProcessBuilder("cat", "/proc/net/dev");
    Process pr = ps.start();
    pr.waitFor();

    BufferedReader in = new BufferedReader(new InputStreamReader(pr.getInputStream()));
    String line;
    int counter = 0;
    long receivedBytes = 0;
    long outBytes = 0;

    while ((line = in.readLine()) != null) {
      System.out.println(counter + ": " + line);
      if (line.contains("eth0")) {
        String[] strs = line.split(" ");
        receivedBytes = Long.parseLong(strs[3]);
        outBytes = Long.parseLong(strs[41]);
        System.out.println(" inBytes = " + receivedBytes + "  outBytes = " + outBytes);
      }
      counter++;
    }
    in.close();

    MutablePair<Long, Long> result = new MutablePair<>(receivedBytes, outBytes);
    return result;
  }

  public static MutablePair<Double, Double> getSysNetworkTraffic(long samplingWindowInMs)
      throws Exception {
    MutablePair<Long, Long> startNumbers = getProcNetDevStats();
    Thread.sleep(samplingWindowInMs);
    MutablePair<Long, Long> endNumbers = getProcNetDevStats();

    double inRate = (endNumbers.getKey() - startNumbers.getKey()) * 1000.0 / samplingWindowInMs;
    double outRate =
        (endNumbers.getValue() - startNumbers.getValue()) * 1000.0 / samplingWindowInMs;
    MutablePair<Double, Double> result = new MutablePair<>(inRate, outRate);
    return result;
  }
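
  // Illustrative usage sketch: sample eth0 throughput over a 10-second window (bytes per second):
  //   MutablePair<Double, Double> rates = OperatorUtil.getSysNetworkTraffic(10 * 1000L);
  //   double inBytesPerSec = rates.getKey();
  //   double outBytesPerSec = rates.getValue();
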
  /**
   * Sort the map entries based on entry values in descending order
   */
  public static <K, V extends Comparable<? super V>> Map<K, V> sortByValue(Map<K, V> map) {
    return map.entrySet()
        .stream()
        .sorted(Map.Entry.comparingByValue(Collections.reverseOrder()))
        .collect(Collectors.toMap(
            Map.Entry::getKey,
            Map.Entry::getValue,
            (e1, e2) -> e1,
            LinkedHashMap::new
        ));
  }
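
  // Illustrative usage sketch: order brokers by an arbitrary numeric score, highest first
  // (map contents below are hypothetical):
  //   Map<String, Long> bytesInPerBroker = new HashMap<>();
  //   bytesInPerBroker.put("broker-1", 1024L);
  //   bytesInPerBroker.put("broker-2", 4096L);
  //   Map<String, Long> sorted = OperatorUtil.sortByValue(bytesInPerBroker);
  //   // iteration order: broker-2 (4096), broker-1 (1024)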
}



