apache · guozhangwang · Jun 9, 2022 · Jun 8, 2022 · Jun 8, 2022 · Jun 8, 2022
diff --git a/streams/src/main/java/org/apache/kafka/streams/processor/internals/DefaultStateUpdater.java b/streams/src/main/java/org/apache/kafka/streams/processor/internals/DefaultStateUpdater.java
@@ -23,20 +23,21 @@
 import org.apache.kafka.streams.errors.TaskCorruptedException;
 import org.apache.kafka.streams.processor.TaskId;
 import org.apache.kafka.streams.processor.internals.Task.State;
+import org.apache.kafka.streams.processor.internals.TaskAndAction.Action;
 import org.slf4j.Logger;
 
 import java.time.Duration;
 import java.util.ArrayList;
 import java.util.Collection;
 import java.util.Collections;
-import java.util.HashMap;
 import java.util.HashSet;
 import java.util.LinkedList;
 import java.util.List;
 import java.util.Map;
 import java.util.Queue;
 import java.util.Set;
 import java.util.concurrent.BlockingQueue;
+import java.util.concurrent.ConcurrentHashMap;
 import java.util.concurrent.CountDownLatch;
 import java.util.concurrent.LinkedBlockingQueue;
 import java.util.concurrent.TimeUnit;
@@ -57,7 +58,7 @@ private class StateUpdaterThread extends Thread {
         private final ChangelogReader changelogReader;
         private final AtomicBoolean isRunning = new AtomicBoolean(true);
         private final Consumer<Set<TopicPartition>> offsetResetter;
-        private final Map<TaskId, Task> updatingTasks = new HashMap<>();
+        private final Map<TaskId, Task> updatingTasks = new ConcurrentHashMap<>();
         private final Logger log;
 
         public StateUpdaterThread(final String name,
@@ -72,7 +73,7 @@ public StateUpdaterThread(final String name,
             log = logContext.logger(DefaultStateUpdater.class);
         }
 
-        public Collection<Task> getAllUpdatingTasks() {
+        public Collection<Task> getUpdatingTasks() {
             return updatingTasks.values();
         }
 
@@ -117,11 +118,13 @@ private void performActionsOnTasks() {
             tasksAndActionsLock.lock();
             try {
                 for (final TaskAndAction taskAndAction : getTasksAndActions()) {
-                    final Task task = taskAndAction.task;
-                    final Action action = taskAndAction.action;
+                    final Action action = taskAndAction.getAction();
                     switch (action) {
                         case ADD:
-                            addTask(task);
+                            addTask(taskAndAction.getTask());
+                            break;
+                        case REMOVE:
+                            removeTask(taskAndAction.getTaskId());
                             break;
                     }
                 }
@@ -149,7 +152,7 @@ private void handleRuntimeException(final RuntimeException runtimeException) {
             log.error("An unexpected error occurred within the state updater thread: " + runtimeException);
             final ExceptionAndTasks exceptionAndTasks = new ExceptionAndTasks(new HashSet<>(updatingTasks.values()), runtimeException);
             updatingTasks.clear();
-            failedTasks.add(exceptionAndTasks);
+            exceptionsAndFailedTasks.add(exceptionAndTasks);
             isRunning.set(false);
         }
 
@@ -164,7 +167,7 @@ private void handleTaskCorruptedException(final TaskCorruptedException taskCorru
                 }
                 corruptedTasks.add(corruptedTask);
             }
-            failedTasks.add(new ExceptionAndTasks(corruptedTasks, taskCorruptedException));
+            exceptionsAndFailedTasks.add(new ExceptionAndTasks(corruptedTasks, taskCorruptedException));
         }
 
         private void handleStreamsException(final StreamsException streamsException) {
@@ -175,7 +178,7 @@ private void handleStreamsException(final StreamsException streamsException) {
             } else {
                 exceptionAndTasks = handleStreamsExceptionWithoutTask(streamsException);
             }
-            failedTasks.add(exceptionAndTasks);
+            exceptionsAndFailedTasks.add(exceptionAndTasks);
         }
 
         private ExceptionAndTasks handleStreamsExceptionWithTask(final StreamsException streamsException) {
@@ -230,23 +233,35 @@ private List<TaskAndAction> getTasksAndActions() {
 
         private void addTask(final Task task) {
             if (isStateless(task)) {
-                log.debug("Stateless active task " + task.id() + " was added to the state updater");
                 addTaskToRestoredTasks((StreamTask) task);
+                log.debug("Stateless active task " + task.id() + " was added to the restored tasks of the state updater");
             } else {
+                updatingTasks.put(task.id(), task);
                 if (task.isActive()) {
-                    updatingTasks.put(task.id(), task);
-                    log.debug("Stateful active task " + task.id() + " was added to the state updater");
+                    log.debug("Stateful active task " + task.id() + " was added to the updating tasks of the state updater");
                     changelogReader.enforceRestoreActive();
                 } else {
-                    updatingTasks.put(task.id(), task);
-                    log.debug("Standby task " + task.id() + " was added to the state updater");
+                    log.debug("Standby task " + task.id() + " was added to the updating tasks of the state updater");
                     if (updatingTasks.size() == 1) {
                         changelogReader.transitToUpdateStandby();
                     }
                 }
             }
         }
 
+        private void removeTask(final TaskId taskId) {
+            final Task removed = updatingTasks.remove(taskId);
+            if (removed == null) {
+                log.debug("Task " + taskId + " was not removed since it is not updating.");
+                return;
+            }
+            // Unregister the task's changelog partitions before publishing it in the removed tasks.
+            changelogReader.unregister(removed.changelogPartitions());
+            removedTasks.add(removed);
+            final String taskType = removed.isActive() ? "Active" : "Standby";
+            log.debug(taskType + " task " + removed.id() + " was removed from the updating tasks and added to the removed tasks.");
+        }
+
         private boolean isStateless(final Task task) {
             return task.changelogPartitions().isEmpty() && task.isActive();
         }
@@ -277,20 +292,6 @@ private void addTaskToRestoredTasks(final StreamTask task) {
         }
     }
 
-    enum Action {
-        ADD
-    }
-
-    private static class TaskAndAction {
-        public final Task task;
-        public final Action action;
-
-        public TaskAndAction(final Task task, final Action action) {
-            this.task = task;
-            this.action = action;
-        }
-    }
-
     private final Time time;
     private final ChangelogReader changelogReader;
     private final Consumer<Set<TopicPartition>> offsetResetter;
@@ -300,7 +301,8 @@ public TaskAndAction(final Task task, final Action action) {
     private final Queue<StreamTask> restoredActiveTasks = new LinkedList<>();
     private final Lock restoredActiveTasksLock = new ReentrantLock();
     private final Condition restoredActiveTasksCondition = restoredActiveTasksLock.newCondition();
-    private final BlockingQueue<ExceptionAndTasks> failedTasks = new LinkedBlockingQueue<>();
+    private final BlockingQueue<ExceptionAndTasks> exceptionsAndFailedTasks = new LinkedBlockingQueue<>();
+    private final BlockingQueue<Task> removedTasks = new LinkedBlockingQueue<>();
     private CountDownLatch shutdownGate;
 
     private StateUpdaterThread stateUpdaterThread = null;
@@ -325,7 +327,7 @@ public void add(final Task task) {
 
         tasksAndActionsLock.lock();
         try {
-            tasksAndActions.add(new TaskAndAction(task, Action.ADD));
+            tasksAndActions.add(TaskAndAction.createAddTask(task));
             tasksAndActionsCondition.signalAll();
         } finally {
             tasksAndActionsLock.unlock();
@@ -342,11 +344,18 @@ private void verifyStateFor(final Task task) {
     }
 
     @Override
-    public void remove(final Task task) {
+    public void remove(final TaskId taskId) {
+        tasksAndActionsLock.lock();
+        try {
+            tasksAndActions.add(TaskAndAction.createRemoveTask(taskId));
+            tasksAndActionsCondition.signalAll();
+        } finally {
+            tasksAndActionsLock.unlock();
+        }
     }
 
     @Override
-    public Set<StreamTask> getRestoredActiveTasks(final Duration timeout) {
+    public Set<StreamTask> drainRestoredActiveTasks(final Duration timeout) {
         final long timeoutMs = timeout.toMillis();
         final long startTime = time.milliseconds();
         final long deadline = startTime + timeoutMs;
@@ -375,52 +384,42 @@ public Set<StreamTask> getRestoredActiveTasks(final Duration timeout) {
     }
 
     @Override
-    public List<ExceptionAndTasks> getFailedTasksAndExceptions() {
+    public Set<Task> drainRemovedTasks() {
+        final Set<Task> drained = new HashSet<>(); // filled directly from the queue of removed tasks
+        removedTasks.drainTo(drained);
+        return drained;
+    }
+
+    @Override
+    public List<ExceptionAndTasks> drainExceptionsAndFailedTasks() {
         final List<ExceptionAndTasks> result = new ArrayList<>();
-        failedTasks.drainTo(result);
+        exceptionsAndFailedTasks.drainTo(result);
         return result;
     }
 
-    @Override
-    public Set<Task> getAllTasks() {
-        tasksAndActionsLock.lock();
+    public Set<StandbyTask> getUpdatingStandbyTasks() { // unmodifiable snapshot; empty while stateUpdaterThread is null
+        return stateUpdaterThread == null ? Collections.emptySet() : Collections.unmodifiableSet(new HashSet<>(stateUpdaterThread.getUpdatingStandbyTasks()));
+    }
+
+    public Set<Task> getUpdatingTasks() { // unmodifiable snapshot; empty while stateUpdaterThread is null
+        return stateUpdaterThread == null ? Collections.emptySet() : Collections.unmodifiableSet(new HashSet<>(stateUpdaterThread.getUpdatingTasks()));
+    }
+
+    public Set<StreamTask> getRestoredActiveTasks() {
         restoredActiveTasksLock.lock();
         try {
-            final Set<Task> allTasks = new HashSet<>();
-            allTasks.addAll(tasksAndActions.stream()
-                .filter(t -> t.action == Action.ADD)
-                .map(t -> t.task)
-                .collect(Collectors.toList())
-            );
-            allTasks.addAll(stateUpdaterThread.getAllUpdatingTasks());
-            allTasks.addAll(restoredActiveTasks);
-            return Collections.unmodifiableSet(allTasks);
+            return Collections.unmodifiableSet(new HashSet<>(restoredActiveTasks));
         } finally {
             restoredActiveTasksLock.unlock();
-            tasksAndActionsLock.unlock();
         }
     }
 
-    @Override
-    public Set<StandbyTask> getStandbyTasks() {
-        tasksAndActionsLock.lock();
-        try {
-            final Set<StandbyTask> standbyTasks = new HashSet<>();
-            standbyTasks.addAll(tasksAndActions.stream()
-                .filter(t -> t.action == Action.ADD)
-                .filter(t -> !t.task.isActive())
-                .map(t -> (StandbyTask) t.task)
-                .collect(Collectors.toList())
-            );
-            standbyTasks.addAll(getUpdatingStandbyTasks());
-            return Collections.unmodifiableSet(standbyTasks);
-        } finally {
-            tasksAndActionsLock.unlock();
-        }
+    public List<ExceptionAndTasks> getExceptionsAndFailedTasks() {
+        return Collections.unmodifiableList(new ArrayList<>(exceptionsAndFailedTasks));
     }
 
-    public Set<StandbyTask> getUpdatingStandbyTasks() {
-        return Collections.unmodifiableSet(new HashSet<>(stateUpdaterThread.getUpdatingStandbyTasks()));
+    public Set<Task> getRemovedTasks() {
+        return Collections.unmodifiableSet(new HashSet<>(removedTasks));
     }
 
     @Override

diff --git a/streams/src/main/java/org/apache/kafka/streams/processor/internals/StateUpdater.java b/streams/src/main/java/org/apache/kafka/streams/processor/internals/StateUpdater.java
@@ -16,65 +16,101 @@
  */
 package org.apache.kafka.streams.processor.internals;
 
+import org.apache.kafka.streams.processor.TaskId;
+
 import java.time.Duration;
+import java.util.Collections;
 import java.util.List;
+import java.util.Objects;
 import java.util.Set;
 
 public interface StateUpdater {
 
     class ExceptionAndTasks {
-        public final Set<Task> tasks;
-        public final RuntimeException exception;
+        private final Set<Task> tasks;
+        private final RuntimeException exception;
 
         public ExceptionAndTasks(final Set<Task> tasks, final RuntimeException exception) {
-            this.tasks = tasks;
-            this.exception = exception;
+            this.tasks = Objects.requireNonNull(tasks);
+            this.exception = Objects.requireNonNull(exception);
+        }
+
+        public Set<Task> tasks() {
+            return Collections.unmodifiableSet(tasks);
+        }
+
+        public RuntimeException exception() {
+            return exception;
+        }
+
+        @Override
+        public boolean equals(final Object o) {
+            if (this == o) return true;
+            if (!(o instanceof ExceptionAndTasks)) return false;
+            final ExceptionAndTasks that = (ExceptionAndTasks) o;
+            return tasks.equals(that.tasks) && exception.equals(that.exception);
+        }
+
+        @Override
+        public int hashCode() {
+            return Objects.hash(tasks, exception);
         }
     }
 
     /**
      * Adds a task (active or standby) to the state updater.
      *
+     * This method does not block until the task is added to the state updater.
+     *
      * @param task task to add
      */
     void add(final Task task);
 
     /**
-     * Removes a task (active or standby) from the state updater.
+     * Removes a task (active or standby) from the state updater and adds the removed task to the removed tasks.
+     *
+     * This method does not block until the removed task is removed from the state updater.
      *
-     * @param task task ro remove
+     * The task is removed neither from the restored active tasks nor from the failed tasks.
+     * Stateless tasks will never be added to the removed tasks since they are immediately added to the
+     * restored active tasks.
+     *
+     * @param taskId ID of the task to remove
      */
-    void remove(final Task task);
+    void remove(final TaskId taskId);
 
     /**
-     * Gets restored active tasks from state restoration/update
+     * Drains the restored active tasks from the state updater.
+     *
+     * The returned active tasks are removed from the state updater.
      *
      * @param timeout duration how long the calling thread should wait for restored active tasks
      *
      * @return set of active tasks with up-to-date states
      */
-    Set<StreamTask> getRestoredActiveTasks(final Duration timeout);
+    Set<StreamTask> drainRestoredActiveTasks(final Duration timeout);
 
-    /**
-     * Gets failed tasks and the corresponding exceptions
-     *
-     * @return list of failed tasks and the corresponding exceptions
-     */
-    List<ExceptionAndTasks> getFailedTasksAndExceptions();
 
     /**
-     * Get all tasks (active and standby) that are managed by the state updater.
+     * Drains the removed tasks (active and standbys) from the state updater.
+     *
+     * Removed tasks returned by this method are tasks extraordinarily removed from the state updater. These do not
+     * include restored or failed tasks.
+     *
+     * The returned removed tasks are removed from the state updater.
      *
-     * @return set of tasks managed by the state updater
+     * @return set of tasks removed from the state updater
      */
-    Set<Task> getAllTasks();
+    Set<Task> drainRemovedTasks();
 
     /**
-     * Get standby tasks that are managed by the state updater.
+     * Drains the failed tasks and the corresponding exceptions.
      *
-     * @return set of standby tasks managed by the state updater
+     * The returned failed tasks are removed from the state updater.
+     *
+     * @return list of failed tasks and the corresponding exceptions
      */
-    Set<StandbyTask> getStandbyTasks();
+    List<ExceptionAndTasks> drainExceptionsAndFailedTasks();
 
     /**
      * Shuts down the state updater.