All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.kafka.streams.processor.internals.assignment.ClientState Maven / Gradle / Ivy

There is a newer version: 3.7.1
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.kafka.streams.processor.internals.assignment;

import org.apache.kafka.common.TopicPartition;
import org.apache.kafka.streams.processor.TaskId;
import org.apache.kafka.streams.processor.internals.Task;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.util.Collection;
import java.util.Comparator;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;
import java.util.stream.Collectors;
import java.util.TreeMap;
import java.util.TreeSet;
import java.util.UUID;

import static java.util.Collections.emptyMap;
import static java.util.Collections.unmodifiableMap;
import static java.util.Collections.unmodifiableSet;
import static java.util.Comparator.comparing;
import static org.apache.kafka.common.utils.Utils.union;
import static org.apache.kafka.streams.processor.internals.assignment.SubscriptionInfo.UNKNOWN_OFFSET_SUM;

public class ClientState {
    private static final Logger LOG = LoggerFactory.getLogger(ClientState.class);
    public static final Comparator TOPIC_PARTITION_COMPARATOR = comparing(TopicPartition::topic).thenComparing(TopicPartition::partition);

    private final Set activeTasks = new TreeSet<>();
    private final Set standbyTasks = new TreeSet<>();
    private final Set prevActiveTasks;
    private final Set prevStandbyTasks;

    private final Map taskOffsetSums; // contains only stateful tasks we previously owned
    private final Map taskLagTotals;  // contains lag for all stateful tasks in the app topology
    private final Map ownedPartitions = new TreeMap<>(TOPIC_PARTITION_COMPARATOR);
    private final Map> consumerToPreviousStatefulTaskIds = new TreeMap<>();

    // the following four maps are used only for logging purposes;
    // TODO KAFKA-10283: we could consider merging them with other book-keeping maps at client-levels
    //                   so that they would not be inconsistent
    private final Map> consumerToPreviousActiveTaskIds = new TreeMap<>();
    private final Map> consumerToAssignedActiveTaskIds = new TreeMap<>();
    private final Map> consumerToAssignedStandbyTaskIds = new TreeMap<>();
    private final Map> consumerToRevokingActiveTaskIds = new TreeMap<>();

    private int capacity;

    public ClientState() {
        this(0);
    }

    ClientState(final int capacity) {
        prevActiveTasks = new TreeSet<>();
        prevStandbyTasks = new TreeSet<>();
        taskOffsetSums = new TreeMap<>();
        taskLagTotals = new TreeMap<>();
        this.capacity = capacity;
    }

    // For testing only
    public ClientState(final Set previousActiveTasks,
                       final Set previousStandbyTasks,
                       final Map taskLagTotals,
                       final int capacity) {
        prevActiveTasks = unmodifiableSet(new TreeSet<>(previousActiveTasks));
        prevStandbyTasks = unmodifiableSet(new TreeSet<>(previousStandbyTasks));
        taskOffsetSums = emptyMap();
        this.taskLagTotals = unmodifiableMap(taskLagTotals);
        this.capacity = capacity;
    }

    int capacity() {
        return capacity;
    }

    public void incrementCapacity() {
        capacity++;
    }

    boolean reachedCapacity() {
        return assignedTaskCount() >= capacity;
    }

    public Set activeTasks() {
        return unmodifiableSet(activeTasks);
    }

    public int activeTaskCount() {
        return activeTasks.size();
    }

    double activeTaskLoad() {
        return ((double) activeTaskCount()) / capacity;
    }

    public void assignActiveTasks(final Collection tasks) {
        activeTasks.addAll(tasks);
    }

    public void assignActiveToConsumer(final TaskId task, final String consumer) {
        consumerToAssignedActiveTaskIds.computeIfAbsent(consumer, k -> new HashSet<>()).add(task);
    }

    public void assignStandbyToConsumer(final TaskId task, final String consumer) {
        consumerToAssignedStandbyTaskIds.computeIfAbsent(consumer, k -> new HashSet<>()).add(task);
    }

    public void revokeActiveFromConsumer(final TaskId task, final String consumer) {
        consumerToRevokingActiveTaskIds.computeIfAbsent(consumer, k -> new HashSet<>()).add(task);
    }

    public Map> prevOwnedActiveTasksByConsumer() {
        return consumerToPreviousActiveTaskIds;
    }

    public Map> prevOwnedStandbyByConsumer() {
        // standbys are just those stateful tasks minus active tasks
        final Map> consumerToPreviousStandbyTaskIds = new TreeMap<>();

        for (final Map.Entry> entry: consumerToPreviousStatefulTaskIds.entrySet()) {
            final Set standbyTaskIds = new HashSet<>(entry.getValue());
            if (consumerToPreviousActiveTaskIds.containsKey(entry.getKey()))
                standbyTaskIds.removeAll(consumerToPreviousActiveTaskIds.get(entry.getKey()));
            consumerToPreviousStandbyTaskIds.put(entry.getKey(), standbyTaskIds);
        }

        return consumerToPreviousStandbyTaskIds;
    }

    // including both active and standby tasks
    public Set prevOwnedStatefulTasksByConsumer(final String memberId) {
        return consumerToPreviousStatefulTaskIds.get(memberId);
    }

    public Map> assignedActiveTasksByConsumer() {
        return consumerToAssignedActiveTaskIds;
    }

    public Map> revokingActiveTasksByConsumer() {
        return consumerToRevokingActiveTaskIds;
    }

    public Map> assignedStandbyTasksByConsumer() {
        return consumerToAssignedStandbyTaskIds;
    }

    public void assignActive(final TaskId task) {
        assertNotAssigned(task);
        activeTasks.add(task);
    }

    public void unassignActive(final TaskId task) {
        if (!activeTasks.contains(task)) {
            throw new IllegalArgumentException("Tried to unassign active task " + task + ", but it is not currently assigned: " + this);
        }
        activeTasks.remove(task);
    }

    public Set standbyTasks() {
        return unmodifiableSet(standbyTasks);
    }

    boolean hasStandbyTask(final TaskId taskId) {
        return standbyTasks.contains(taskId);
    }

    int standbyTaskCount() {
        return standbyTasks.size();
    }

    public void assignStandby(final TaskId task) {
        assertNotAssigned(task);
        standbyTasks.add(task);
    }

    void unassignStandby(final TaskId task) {
        if (!standbyTasks.contains(task)) {
            throw new IllegalArgumentException("Tried to unassign standby task " + task + ", but it is not currently assigned: " + this);
        }
        standbyTasks.remove(task);
    }

    Set assignedTasks() {
        // Since we're copying it, it's not strictly necessary to make it unmodifiable also.
        // I'm just trying to prevent subtle bugs if we write code that thinks it can update
        // the assignment by updating the returned set.
        return unmodifiableSet(
            union(
                () -> new HashSet<>(activeTasks.size() + standbyTasks.size()),
                activeTasks,
                standbyTasks
            )
        );
    }

    public int assignedTaskCount() {
        return activeTaskCount() + standbyTaskCount();
    }

    double assignedTaskLoad() {
        return ((double) assignedTaskCount()) / capacity;
    }

    boolean hasAssignedTask(final TaskId taskId) {
        return activeTasks.contains(taskId) || standbyTasks.contains(taskId);
    }

    Set prevActiveTasks() {
        return unmodifiableSet(prevActiveTasks);
    }

    private void addPreviousActiveTask(final TaskId task) {
        prevActiveTasks.add(task);
    }

    void addPreviousActiveTasks(final Set prevTasks) {
        prevActiveTasks.addAll(prevTasks);
    }

    Set prevStandbyTasks() {
        return unmodifiableSet(prevStandbyTasks);
    }

    private void addPreviousStandbyTask(final TaskId task) {
        prevStandbyTasks.add(task);
    }

    void addPreviousStandbyTasks(final Set standbyTasks) {
        prevStandbyTasks.addAll(standbyTasks);
    }

    Set previousAssignedTasks() {
        return union(() -> new HashSet<>(prevActiveTasks.size() + prevStandbyTasks.size()), prevActiveTasks, prevStandbyTasks);
    }

    // May return null
    public String previousOwnerForPartition(final TopicPartition partition) {
        return ownedPartitions.get(partition);
    }

    public void addOwnedPartitions(final Collection ownedPartitions, final String consumer) {
        for (final TopicPartition tp : ownedPartitions) {
            this.ownedPartitions.put(tp, consumer);
        }
    }

    public void addPreviousTasksAndOffsetSums(final String consumerId, final Map taskOffsetSums) {
        this.taskOffsetSums.putAll(taskOffsetSums);
        consumerToPreviousStatefulTaskIds.put(consumerId, taskOffsetSums.keySet());
    }

    public void initializePrevTasks(final Map taskForPartitionMap) {
        if (!prevActiveTasks.isEmpty() || !prevStandbyTasks.isEmpty()) {
            throw new IllegalStateException("Already added previous tasks to this client state.");
        }
        initializePrevActiveTasksFromOwnedPartitions(taskForPartitionMap);
        initializeRemainingPrevTasksFromTaskOffsetSums();
    }

    /**
     * Compute the lag for each stateful task, including tasks this client did not previously have.
     */
    public void computeTaskLags(final UUID uuid, final Map allTaskEndOffsetSums) {
        if (!taskLagTotals.isEmpty()) {
            throw new IllegalStateException("Already computed task lags for this client.");
        }

        for (final Map.Entry taskEntry : allTaskEndOffsetSums.entrySet()) {
            final TaskId task = taskEntry.getKey();
            final Long endOffsetSum = taskEntry.getValue();
            final Long offsetSum = taskOffsetSums.getOrDefault(task, 0L);

            if (offsetSum == Task.LATEST_OFFSET) {
                taskLagTotals.put(task, Task.LATEST_OFFSET);
            } else if (offsetSum == UNKNOWN_OFFSET_SUM) {
                taskLagTotals.put(task, UNKNOWN_OFFSET_SUM);
            } else if (endOffsetSum < offsetSum) {
                LOG.warn("Task " + task + " had endOffsetSum=" + endOffsetSum + " smaller than offsetSum=" +
                             offsetSum + " on member " + uuid + ". This probably means the task is corrupted," +
                             " which in turn indicates that it will need to restore from scratch if it gets assigned." +
                             " The assignor will de-prioritize returning this task to this member in the hopes that" +
                             " some other member may be able to re-use its state.");
                taskLagTotals.put(task, endOffsetSum);
            } else {
                taskLagTotals.put(task, endOffsetSum - offsetSum);
            }
        }
    }

    /**
     * Returns the total lag across all logged stores in the task. Equal to the end offset sum if this client
     * did not have any state for this task on disk.
     *
     * @return end offset sum - offset sum
     *          Task.LATEST_OFFSET if this was previously an active running task on this client
     */
    public long lagFor(final TaskId task) {
        final Long totalLag = taskLagTotals.get(task);
        if (totalLag == null) {
            throw new IllegalStateException("Tried to lookup lag for unknown task " + task);
        }
        return totalLag;
    }

    public Set statefulActiveTasks() {
        return activeTasks.stream().filter(this::isStateful).collect(Collectors.toSet());
    }

    public Set statelessActiveTasks() {
        return activeTasks.stream().filter(task -> !isStateful(task)).collect(Collectors.toSet());
    }

    boolean hasUnfulfilledQuota(final int tasksPerThread) {
        return activeTasks.size() < capacity * tasksPerThread;
    }

    boolean hasMoreAvailableCapacityThan(final ClientState other) {
        if (capacity <= 0) {
            throw new IllegalStateException("Capacity of this ClientState must be greater than 0.");
        }

        if (other.capacity <= 0) {
            throw new IllegalStateException("Capacity of other ClientState must be greater than 0");
        }

        final double otherLoad = (double) other.assignedTaskCount() / other.capacity;
        final double thisLoad = (double) assignedTaskCount() / capacity;

        if (thisLoad < otherLoad) {
            return true;
        } else if (thisLoad > otherLoad) {
            return false;
        } else {
            return capacity > other.capacity;
        }
    }

    public String currentAssignment() {
        return "[activeTasks: (" + activeTasks +
                ") standbyTasks: (" + standbyTasks + ")]";
    }

    @Override
    public String toString() {
        return "[activeTasks: (" + activeTasks +
            ") standbyTasks: (" + standbyTasks +
            ") prevActiveTasks: (" + prevActiveTasks +
            ") prevStandbyTasks: (" + prevStandbyTasks +
            ") changelogOffsetTotalsByTask: (" + taskOffsetSums.entrySet() +
            ") taskLagTotals: (" + taskLagTotals.entrySet() +
            ") capacity: " + capacity +
            " assigned: " + assignedTaskCount() +
            "]";
    }

    private boolean isStateful(final TaskId task) {
        return taskLagTotals.containsKey(task);
    }

    private void initializePrevActiveTasksFromOwnedPartitions(final Map taskForPartitionMap) {
        // there are three cases where we need to construct some or all of the prevTasks from the ownedPartitions:
        // 1) COOPERATIVE clients on version 2.4-2.5 do not encode active tasks at all and rely on ownedPartitions
        // 2) future client during version probing, when we can't decode the future subscription info's prev tasks
        // 3) stateless tasks are not encoded in the task lags, and must be figured out from the ownedPartitions
        for (final Map.Entry partitionEntry : ownedPartitions.entrySet()) {
            final TopicPartition tp = partitionEntry.getKey();
            final TaskId task = taskForPartitionMap.get(tp);
            if (task != null) {
                addPreviousActiveTask(task);
                consumerToPreviousActiveTaskIds.computeIfAbsent(partitionEntry.getValue(), k -> new HashSet<>()).add(task);
            } else {
                LOG.error("No task found for topic partition {}", tp);
            }
        }
    }

    private void initializeRemainingPrevTasksFromTaskOffsetSums() {
        if (prevActiveTasks.isEmpty() && !ownedPartitions.isEmpty()) {
            LOG.error("Tried to process tasks in offset sum map before processing tasks from ownedPartitions = {}", ownedPartitions);
            throw new IllegalStateException("Must initialize prevActiveTasks from ownedPartitions before initializing remaining tasks.");
        }
        for (final Map.Entry taskEntry : taskOffsetSums.entrySet()) {
            final TaskId task = taskEntry.getKey();
            if (!prevActiveTasks.contains(task)) {
                final long offsetSum = taskEntry.getValue();
                if (offsetSum == Task.LATEST_OFFSET) {
                    addPreviousActiveTask(task);
                } else {
                    addPreviousStandbyTask(task);
                }
            }
        }
    }

    private void assertNotAssigned(final TaskId task) {
        if (standbyTasks.contains(task) || activeTasks.contains(task)) {
            throw new IllegalArgumentException("Tried to assign task " + task + ", but it is already assigned: " + this);
        }
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy