com.epam.eco.commons.kafka.KafkaUtils
A library of utilities, helpers and higher-level APIs for the Kafka client library.

/*
* Copyright 2020 EPAM Systems
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not
* use this file except in compliance with the License. You may obtain a copy
* of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
* License for the specific language governing permissions and limitations under
* the License.
*/
package com.epam.eco.commons.kafka;

import java.io.Closeable;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Objects;
import java.util.Set;
import java.util.TreeMap;
import java.util.TreeSet;
import java.util.function.Function;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.stream.Collectors;
import org.apache.commons.collections4.CollectionUtils;
import org.apache.commons.lang3.Validate;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.apache.kafka.clients.consumer.ConsumerRecords;
import org.apache.kafka.clients.consumer.KafkaConsumer;
import org.apache.kafka.clients.producer.KafkaProducer;
import org.apache.kafka.common.PartitionInfo;
import org.apache.kafka.common.TopicPartition;

/**
* @author Andrei_Tytsik
*/
public abstract class KafkaUtils {

    public static final Pattern TOPIC_PARTITION_PATTERN = Pattern.compile("^(.+)-(0|[1-9]\\d*)$");

    private KafkaUtils() {
    }

    public static TopicPartition[] getAssignmentAsArray(KafkaConsumer<?, ?> consumer) {
return getAssignmentAsList(consumer).stream().
toArray(TopicPartition[]::new);
}

    public static List<TopicPartition> getAssignmentAsList(KafkaConsumer<?, ?> consumer) {
Validate.notNull(consumer, "Consumer is null");
return new ArrayList<>(consumer.assignment());
}

    public static TopicPartition[] getTopicPartitionsAsArray(
            KafkaConsumer<?, ?> consumer,
            String ... topicNames) {
return getTopicPartitionsAsList(consumer, Arrays.asList(topicNames)).stream().
toArray(TopicPartition[]::new);
}

    public static List<TopicPartition> getTopicPartitionsAsList(
            KafkaConsumer<?, ?> consumer,
            String ... topicNames) {
return getTopicPartitionsAsList(consumer, Arrays.asList(topicNames));
}

    public static TopicPartition[] getTopicPartitionsAsArray(
            KafkaConsumer<?, ?> consumer,
            Collection<String> topicNames) {
return getTopicPartitionsAsList(consumer, topicNames).stream().
toArray(TopicPartition[]::new);
}
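
    /**
     * Resolves the partitions of the given topics via the consumer's metadata.
     *
     * @throws RuntimeException if no partition metadata is found for a topic
     */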
    public static List<TopicPartition> getTopicPartitionsAsList(
            KafkaConsumer<?, ?> consumer,
            Collection<String> topicNames) {
Validate.notNull(consumer, "Consumer is null");
Validate.notNull(topicNames, "Collection of topic names is null");
if (CollectionUtils.isEmpty(topicNames)) {
return Collections.emptyList();
}
        List<TopicPartition> topicPartitions = new ArrayList<>();
for (String topicName : topicNames) {
            List<PartitionInfo> partitionInfos = consumer.partitionsFor(topicName);
if (CollectionUtils.isEmpty(partitionInfos)) {
throw new RuntimeException("Partitions metadata not found for topic " + topicName);
}
topicPartitions.addAll(toTopicPartitions(partitionInfos));
}
return topicPartitions;
}

    public static TopicPartition[] getTopicPartitionsAsArray(
            KafkaProducer<?, ?> producer,
            String ... topicNames) {
return getTopicPartitionsAsList(producer, Arrays.asList(topicNames)).stream().
toArray(TopicPartition[]::new);
}

    public static List<TopicPartition> getTopicPartitionsAsList(
            KafkaProducer<?, ?> producer,
            String ... topicNames) {
return getTopicPartitionsAsList(producer, Arrays.asList(topicNames));
}

    public static TopicPartition[] getTopicPartitionsAsArray(
            KafkaProducer<?, ?> producer,
            Collection<String> topicNames) {
return getTopicPartitionsAsList(producer, topicNames).stream().
toArray(TopicPartition[]::new);
}

    public static List<TopicPartition> getTopicPartitionsAsList(
            KafkaProducer<?, ?> producer,
            Collection<String> topicNames) {
Validate.notNull(producer, "Producer is null");
Validate.notNull(topicNames, "Collection of topic names is null");
if (CollectionUtils.isEmpty(topicNames)) {
return Collections.emptyList();
}
        List<TopicPartition> topicPartitions = new ArrayList<>();
for (String topicName : topicNames) {
            List<PartitionInfo> partitionInfos = producer.partitionsFor(topicName);
if (CollectionUtils.isEmpty(partitionInfos)) {
throw new RuntimeException("Partitions metadata not found for topic " + topicName);
}
topicPartitions.addAll(toTopicPartitions(partitionInfos));
}
return topicPartitions;
}
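
    /**
     * Parses a "topic-partition" string (for example "orders-3") into a {@link TopicPartition}.
     * The partition is taken from the last hyphen-separated numeric suffix, so topic names that
     * themselves contain hyphens are handled correctly.
     *
     * @throws IllegalArgumentException if the string does not match the expected format
     */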
public static TopicPartition parseTopicPartition(String string) {
Validate.notBlank(string, "TopicPartition string is blank");
Matcher matcher = TOPIC_PARTITION_PATTERN.matcher(string);
if (!matcher.find()) {
throw new IllegalArgumentException(
String.format("Invalid TopicPartition string '%s'", string));
}
String topic = matcher.group(1);
int partition = Integer.parseInt(matcher.group(2));
return new TopicPartition(
topic,
partition);
}
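
    /**
     * Closes the given {@link Closeable}, ignoring {@code null} arguments and swallowing any
     * exception thrown by {@code close()}.
     */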
public static void closeQuietly(Closeable closeable) {
if (closeable == null) {
return;
}
try {
closeable.close();
} catch (Exception ex) {
// ignore
}
}
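
    /**
     * Returns, for every partition present in the given batch of records, the offset of the
     * first (smallest-offset) record in that partition.
     */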
@SuppressWarnings({ "unchecked", "rawtypes" })
    public static Map<TopicPartition, Long> extractSmallestOffsets(ConsumerRecords<?, ?> records) {
Validate.notNull(records, "ConsumerRecords object is null");
        Set<TopicPartition> partitions = records.partitions();
        Map<TopicPartition, Long> smallestOffsets = new HashMap<>((int) (partitions.size() / 0.75));
        for (TopicPartition partition : partitions) {
            List<ConsumerRecord<?, ?>> recordsPerPartition =
                    ((ConsumerRecords) records).records(partition);
if (recordsPerPartition.isEmpty()) {
continue;
}
            ConsumerRecord<?, ?> firstRecordInPartition = recordsPerPartition.get(0);
smallestOffsets.put(partition, firstRecordInPartition.offset());
}
return smallestOffsets;
}
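
    /**
     * Returns, for every partition present in the given batch of records, the offset of the
     * last (largest-offset) record in that partition.
     */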
@SuppressWarnings({ "unchecked", "rawtypes" })
    public static Map<TopicPartition, Long> extractLargestOffsets(ConsumerRecords<?, ?> records) {
Validate.notNull(records, "ConsumerRecords object is null");
        Set<TopicPartition> partitions = records.partitions();
        Map<TopicPartition, Long> largestOffsets = new HashMap<>((int) (partitions.size() / 0.75));
        for (TopicPartition partition : partitions) {
            List<ConsumerRecord<?, ?>> recordsPerPartition =
                    ((ConsumerRecords) records).records(partition);
if (recordsPerPartition.isEmpty()) {
continue;
}
            ConsumerRecord<?, ?> lastRecordInPartition =
                    recordsPerPartition.get(recordsPerPartition.size() - 1);
largestOffsets.put(partition, lastRecordInPartition.offset());
}
return largestOffsets;
}
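
    /**
     * Returns the current position (the offset of the next record to be fetched) for every
     * partition currently assigned to the consumer.
     */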
    public static Map<TopicPartition, Long> getConsumerPositions(KafkaConsumer<?, ?> consumer) {
Validate.notNull(consumer, "Consumer is null");
        Set<TopicPartition> partitions = consumer.assignment();
if (partitions == null || partitions.isEmpty()) {
return Collections.emptyMap();
}
return partitions.stream().
collect(Collectors.toMap(
Function.identity(),
partition -> consumer.position(partition)));
}

    public static List<String> extractTopicNamesAsList(Collection<TopicPartition> partitions) {
Validate.notNull(partitions, "Collection of partitions is null");
return partitions.stream().
filter(Objects::nonNull).
map(TopicPartition::topic).
distinct().
collect(Collectors.toList());
}

    public static List<String> extractTopicNamesAsSortedList(Collection<TopicPartition> partitions) {
Validate.notNull(partitions, "Collection of partitions is null");
return partitions.stream().
filter(Objects::nonNull).
map(TopicPartition::topic).
distinct().
sorted().
collect(Collectors.toList());
}

    public static Set<String> extractTopicNamesAsSet(Collection<TopicPartition> partitions) {
Validate.notNull(partitions, "Collection of partitions is null");
return partitions.stream().
filter(Objects::nonNull).
map(TopicPartition::topic).
collect(Collectors.toSet());
}

    public static Set<String> extractTopicNamesAsSortedSet(Collection<TopicPartition> partitions) {
        Validate.notNull(partitions, "Collection of partitions is null");
        return partitions.stream().
                filter(Objects::nonNull).
                map(TopicPartition::topic).
                // collect into a TreeSet so the returned set is actually sorted, as the method name promises
                collect(Collectors.toCollection(TreeSet::new));
}
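
    /**
     * Returns a copy of the given map as a {@link TreeMap} whose keys are ordered by
     * {@code TopicPartitionComparator.INSTANCE}.
     */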
    public static <V> Map<TopicPartition, V> sortedByTopicPartitionKeyMap(Map<TopicPartition, V> map) {
Validate.notNull(map, "Map is null");
return map.entrySet().stream().
collect(
Collectors.toMap(
Entry::getKey,
Entry::getValue,
(a, b) -> b,
() -> new TreeMap<>(TopicPartitionComparator.INSTANCE)));
}
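
    /**
     * Calculates consumer lag for a partition given the topic's offset range and the consumer's
     * current offset: the full range size if the consumer is behind the smallest available
     * offset, -1 if the consumer offset is ahead of the largest consumable offset, and the
     * remaining number of records otherwise.
     */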
public static long calculateConsumerLag(OffsetRange topicOffsetRange, long consumerOffset) {
Validate.notNull(topicOffsetRange, "Offset range is null");
Validate.isTrue(consumerOffset >= 0, "Consumer offset is invalid");
if (consumerOffset < topicOffsetRange.getSmallest()) {
return topicOffsetRange.getSize();
}
long largestConsumableOffset =
topicOffsetRange.isLargestInclusive() ?
topicOffsetRange.getLargest() + 1 :
topicOffsetRange.getLargest();
if (consumerOffset > largestConsumableOffset) {
return -1;
}
return largestConsumableOffset - consumerOffset;
}

    public static List<TopicPartition> toTopicPartitions(List<PartitionInfo> partitionInfos) {
Validate.notNull(partitionInfos, "Collection of partition infos is null");
if (partitionInfos.isEmpty()) {
return Collections.emptyList();
} else if (partitionInfos.size() == 1) {
return Collections.singletonList(toTopicPartition(partitionInfos.get(0)));
} else {
return partitionInfos.stream().
map(KafkaUtils::toTopicPartition).
collect(Collectors.toList());
}
}
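
    /**
     * Converts Kafka's {@link PartitionInfo} metadata into a {@link TopicPartition} coordinate.
     */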
public static TopicPartition toTopicPartition(PartitionInfo partitionInfo) {
Validate.notNull(partitionInfo, "Partition info is null");
return new TopicPartition(partitionInfo.topic(), partitionInfo.partition());
}
}
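
For orientation, the short program below sketches how several of these helpers compose around a plain KafkaConsumer. It is an illustrative sketch only: the bootstrap server address, the group id, and the topic name "orders" are assumptions made for the example and are not part of the library.

import java.time.Duration;
import java.util.Map;
import java.util.Properties;

import org.apache.kafka.clients.consumer.ConsumerConfig;
import org.apache.kafka.clients.consumer.ConsumerRecords;
import org.apache.kafka.clients.consumer.KafkaConsumer;
import org.apache.kafka.common.TopicPartition;
import org.apache.kafka.common.serialization.StringDeserializer;

import com.epam.eco.commons.kafka.KafkaUtils;

public class KafkaUtilsExample {

    public static void main(String[] args) {
        Properties props = new Properties();
        props.put(ConsumerConfig.BOOTSTRAP_SERVERS_CONFIG, "localhost:9092"); // assumed broker address
        props.put(ConsumerConfig.GROUP_ID_CONFIG, "kafka-utils-example");     // assumed group id
        props.put(ConsumerConfig.KEY_DESERIALIZER_CLASS_CONFIG, StringDeserializer.class);
        props.put(ConsumerConfig.VALUE_DESERIALIZER_CLASS_CONFIG, StringDeserializer.class);

        KafkaConsumer<String, String> consumer = new KafkaConsumer<>(props);
        try {
            // Resolve all partitions of a (hypothetical) topic and assign them explicitly.
            consumer.assign(KafkaUtils.getTopicPartitionsAsList(consumer, "orders"));

            // Poll once and report the largest offset seen per partition in this batch.
            ConsumerRecords<String, String> records = consumer.poll(Duration.ofSeconds(5));
            Map<TopicPartition, Long> largest = KafkaUtils.extractLargestOffsets(records);
            largest.forEach((partition, offset) -> System.out.println(partition + " -> " + offset));

            // Current fetch positions for the assigned partitions.
            System.out.println(KafkaUtils.getConsumerPositions(consumer));

            // Parse a "topic-partition" string back into a TopicPartition.
            TopicPartition tp = KafkaUtils.parseTopicPartition("orders-0");
            System.out.println(tp.topic() + " / " + tp.partition());
        } finally {
            KafkaUtils.closeQuietly(consumer);
        }
    }
}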