Narrow down the scope of waiting for pending tasks to per partition #191

Merged · 8 commits · Mar 27, 2023
Changes from 2 commits
PartitionContext.java

@@ -56,6 +56,9 @@ public class PartitionContext implements AutoCloseable {
     @Setter
     private boolean revoking;

+    @Getter
+    private boolean reloading;
+
     public PartitionContext(PartitionScope scope, Processors<?> processors, int maxPendingRecords) {
         this.scope = scope;
         this.processors = processors;

@@ -157,6 +160,13 @@ public void resume() {
         metrics.partitionPausedTime.record(pausedNanos, TimeUnit.NANOSECONDS);
     }

+    public void reloading(boolean reloading) {
+        this.reloading = reloading;
+        if (reloading) {
+            pause();

Contributor:
Pausing here from PartitionContext itself doesn't actually work to pause fetching.

Decaton's fetch-pause works like this: (1) collect the partitions that need to be paused (partitionsNeedsPause), considering only partitions that are not already marked as paused, then (2) pause fetching for those partitions on the consumer.

So if we pause here from PartitionContext itself, the partition will not be included in (1), because it is already "paused".

A correct approach here may be to hold a per-partition reloading flag in PartitionContexts and include those partitions in partitionsNeedsPause.
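
For reference, a minimal sketch of the shape proposed above (the paused() and topicPartition() accessors and the exact pause conditions are assumptions for illustration, not the PR's final code):

    import java.util.Collection;
    import java.util.List;
    import java.util.stream.Collectors;

    import org.apache.kafka.common.TopicPartition;

    final class FetchPauseSketch {
        // Step (1) of fetch-pause: pick the partitions the subscription thread
        // should newly pause. Already-paused partitions are skipped, which is why
        // a partition that paused itself would be missed here; a per-partition
        // reloading flag keeps such partitions visible to this check.
        static List<TopicPartition> partitionsNeedsPause(Collection<PartitionContext> contexts,
                                                         boolean pausingAllProcessing,
                                                         int maxPendingRecords) {
            return contexts.stream()
                           .filter(context -> !context.paused())
                           .filter(context -> pausingAllProcessing
                                              || context.reloading()
                                              || context.pendingTasksCount() >= maxPendingRecords)
                           .map(PartitionContext::topicPartition)
                           .collect(Collectors.toList());
        }
    }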

+        }
+    }
+

     @Override
     public void close() throws Exception {
         resume();
PartitionContexts.java

@@ -28,7 +28,10 @@
 import java.util.Map.Entry;
 import java.util.Set;
 import java.util.concurrent.atomic.AtomicBoolean;
+import java.util.concurrent.atomic.AtomicInteger;
+import java.util.concurrent.locks.ReentrantLock;
 import java.util.function.Function;
+import java.util.stream.Collectors;

 import org.apache.kafka.clients.consumer.OffsetAndMetadata;
 import org.apache.kafka.common.TopicPartition;

@@ -53,6 +56,7 @@ public class PartitionContexts implements OffsetsStore, AssignmentStore, Partiti
     private final Map<TopicPartition, PartitionContext> contexts;

     private final AtomicBoolean reloadRequested;

Contributor:
Do we still need this reloadRequested flag, since we manage the reloading states in the reloadStates hash map?

Member (author):
reloadRequested is useful for quickly determining whether contexts should be reloaded, without having to iterate over them.

Contributor:
Hm, IMO having duplicated information (alongside the per-partition reloading flags) could be error prone as we maintain this code in the future, while iterating over the partitions is unlikely to become a bottleneck (we already iterate over them to update high watermarks and to check which partitions need pause/resume), so the benefit of having reloadRequested separately is small.
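
A sketch of the flag-free alternative described above (illustrative only, not part of the PR; it assumes the same contexts map of PartitionContext values):

    import java.util.Collection;

    final class ReloadStateSketch {
        // Derive "a reload is in progress" by scanning the per-partition flags
        // instead of keeping a separate reloadRequested boolean that duplicates
        // the same information and could drift out of sync.
        static boolean reloadInProgress(Collection<PartitionContext> contexts) {
            return contexts.stream().anyMatch(PartitionContext::reloading);
        }
    }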

+    private final ReentrantLock lock;

Contributor:
Let's rename this to something like propertyReloadLock for understandability.


     public PartitionContexts(SubscriptionScope scope, Processors<?> processors) {
         this.scope = scope;

@@ -63,6 +67,7 @@ public PartitionContexts(SubscriptionScope scope, Processors<?> processors) {
         maxPendingRecords = scope.props().get(ProcessorProperties.CONFIG_MAX_PENDING_RECORDS).value();
         contexts = new HashMap<>();
         reloadRequested = new AtomicBoolean(false);
+        lock = new ReentrantLock();

         scope.props().get(ProcessorProperties.CONFIG_PARTITION_CONCURRENCY).listen((oldVal, newVal) -> {
             // This listener will be called at listener registration.

@@ -71,8 +76,16 @@ public PartitionContexts(SubscriptionScope scope, Processors<?> processors) {
                 return;
             }

-            if (!reloadRequested.getAndSet(true)) {
-                logger.info("Requested reload partition.concurrency oldValue={}, newValue={}", oldVal, newVal);
+            lock.lock();
+            try {
+                if (!reloadRequested.getAndSet(true)) {
+                    for (PartitionContext context : contexts.values()) {
+                        context.reloading(true);
+                    }
+                    logger.info("Requested reload partition.concurrency oldValue={}, newValue={}", oldVal, newVal);
+                }
+            } finally {
+                lock.unlock();
             }
         });
     }

@@ -200,7 +213,7 @@ PartitionContext instantiateContext(TopicPartition tp) {

     // visible for testing
     boolean pausingAllProcessing() {
-        return processingRateProp.value() == RateLimiter.PAUSED || reloadRequested.get();
+        return processingRateProp.value() == RateLimiter.PAUSED;
     }

     @Override

@@ -250,23 +263,30 @@ public void partitionsResumed(List<TopicPartition> partitions) {
      */
     public void maybeHandlePropertyReload() {
         if (reloadRequested.get()) {
-            if (totalPendingTasks() > 0) {
-                logger.debug("Waiting pending tasks for property reload.");
-                return;
+            lock.lock();
+            try {
+                List<TopicPartition> reloadableTopicPartitions = contexts.entrySet()
+                        .stream()
+                        .filter(entry -> entry.getValue().reloading() && entry.getValue().pendingTasksCount() == 0)
+                        .map(entry -> entry.getKey())
+                        .collect(Collectors.toList());
+                reloadContexts(reloadableTopicPartitions);
+                long reloadingPartitions = contexts.values()
+                        .stream()
+                        .filter(PartitionContext::reloading)
+                        .count();
+                if (reloadingPartitions == 0) {
+                    reloadRequested.set(false);
+                    logger.info("Completed reloading all partition contexts");
+                }
+            } finally {
+                lock.unlock();
             }
-            // it's ok to check-and-set reloadRequested without synchronization
-            // because this field is set to false only in this method, and this method is called from only subscription thread.
-            reloadRequested.set(false);
-            logger.info("Completed waiting pending tasks. Start reloading partition contexts");
-            reloadContexts();
         }
     }

-    private void reloadContexts() {
-        // Save current topicPartitions into copy to update contexts map while iterating over this copy.
-        Set<TopicPartition> topicPartitions = new HashSet<>(contexts.keySet());
-
-        logger.info("Start dropping partition contexts");
+    private void reloadContexts(Collection<TopicPartition> topicPartitions) {
+        logger.info("Start dropping partition context({})", topicPartitions);
         removePartition(topicPartitions);
         logger.info("Finished dropping partition contexts. Start recreating partition contexts");

Contributor:
[nits] This log, and this line, should also include topicPartitions.
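
The two referenced lines aren't visible in this view, but as an illustration, the "Finished dropping" log could carry the partitions the same way the "Start dropping" log above does:

    logger.info("Finished dropping partition contexts({}). Start recreating partition contexts", topicPartitions);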

         Map<TopicPartition, AssignmentConfig> configs = topicPartitions.stream().collect(

PartitionContextsTest.java

@@ -35,6 +35,7 @@

 import java.util.ArrayList;
 import java.util.Collection;
+import java.util.Collections;
 import java.util.HashMap;
 import java.util.HashSet;
 import java.util.List;

@@ -256,38 +257,59 @@ public void testPausingAllProcessing() {
     }

     @Test
-    public void testPausingAllProcessingByPropertyReload() {
+    public void testShouldNotBePausingAllProcessingByPropertyReload() {
         assertFalse(contexts.pausingAllProcessing());
         partitionConcurrencyProperty.set(42);
-        assertTrue(contexts.pausingAllProcessing());
+        assertFalse(contexts.pausingAllProcessing());
     }

     @Test
     public void testMaybeHandlePropertyReload() {
-        putContexts(12);
-
+        int count = 12;
+        List<PartitionContext> allContexts = putContexts(count);
+        List<PartitionContext> pendingContexts = new ArrayList<>();
+        List<PartitionContext> reloadableContexts = new ArrayList<>();
+        for (int i = 0; i < count; i++) {
+            PartitionContext context = allContexts.get(i);
+            if (i % 3 == 0) {
+                doReturn(100).when(context).pendingTasksCount();
+                doReturn(true).when(context).reloading();
+                pendingContexts.add(context);
+            } else {
+                doReturn(0).when(context).pendingTasksCount();
+                doReturn(true).when(context).reloading();
+                reloadableContexts.add(context);
+            }
+        }
+        clearInvocations(contexts);
+
         PartitionContext context = mock(PartitionContext.class);
         doReturn(context).when(contexts).instantiateContext(any());

-        // there are some pending tasks
-        doReturn(100).when(contexts).totalPendingTasks();
-
         contexts.maybeHandlePropertyReload();
         // property reload is not requested yet
         verify(contexts, never()).instantiateContext(any());
+        for (PartitionContext ctx : allContexts) {
+            verify(ctx, never()).reloading(true);
+        }

         partitionConcurrencyProperty.set(42);
         contexts.maybeHandlePropertyReload();

+        for (PartitionContext ctx : allContexts) {
+            verify(ctx).reloading(true);
+        }
+
         // property reload is requested, but there are pending tasks
-        verify(contexts, never()).instantiateContext(any());
+        verify(contexts, times(reloadableContexts.size())).instantiateContext(any());
+        for (PartitionContext ctx : reloadableContexts) {
+            doReturn(false).when(ctx).reloading();
+        }

-        // pending tasks done
-        doReturn(0).when(contexts).totalPendingTasks();
+        for (PartitionContext ctx : pendingContexts) {
+            doReturn(0).when(ctx).pendingTasksCount();
+            doReturn(true).when(ctx).reloading();
+        }
         contexts.maybeHandlePropertyReload();

-        verify(contexts, times(12)).instantiateContext(any());
+        // completed reloading request
+        verify(contexts, times(count)).instantiateContext(any());
     }

     @Test