[ KAFKA-17049 ] fix Incremental rebalances assign too many tasks for the same connector together #16486

Status: Open · wants to merge 8 commits into base: trunk
@@ -657,13 +657,15 @@ private Map<String, ConnectorsAndTasks> performLoadBalancingRevocations(
"connector",
configured.connectors().size(),
workers,
-                WorkerLoad::connectors
+                WorkerLoad::connectors,
+                Function.identity()
);
Map<String, Set<ConnectorTaskId>> taskRevocations = loadBalancingRevocations(
"task",
configured.tasks().size(),
workers,
-                WorkerLoad::tasks
+                WorkerLoad::tasks,
+                ConnectorTaskId::connector
);

connectorRevocations.forEach((worker, revoked) ->
@@ -680,7 +682,8 @@ private <E> Map<String, Set<E>> loadBalancingRevocations(
String allocatedResourceName,
int totalToAllocate,
Collection<WorkerLoad> workers,
-            Function<WorkerLoad, Collection<E>> workerAllocation
+            Function<WorkerLoad, Collection<E>> workerAllocation,
+            Function<E, String> allocationGrouper
) {
int totalWorkers = workers.size();
// The minimum instances of this resource that should be assigned to each worker
@@ -736,7 +739,7 @@ private <E> Map<String, Set<E>> loadBalancingRevocations(
Set<E> revokedFromWorker = new LinkedHashSet<>();
result.put(worker.worker(), revokedFromWorker);

-            Iterator<E> currentWorkerAllocation = workerAllocation.apply(worker).iterator();
+            Iterator<E> currentWorkerAllocation = new BalancedIterator<E>(workerAllocation.apply(worker), allocationGrouper);
// Revoke resources from the worker until it isn't allocated any more than it should be
for (int numRevoked = 0; currentAllocationSizeForWorker - numRevoked > maxAllocationForWorker; numRevoked++) {
if (!currentWorkerAllocation.hasNext()) {
@@ -793,6 +796,43 @@ protected void assignConnectors(List<WorkerLoad> workerAssignment, Collection<St
}
}

static class BalancedIterator<E> implements Iterator<E> {

private final Map<String, Iterator<E>> grouped;
private final List<String> keys;

private int k;

public BalancedIterator(Collection<E> collection, Function<E, String> allocationGrouper) {
this.k = 0;
this.grouped = collection.stream().collect(Collectors.groupingBy(
allocationGrouper,
Collectors.collectingAndThen(
Collectors.toList(),
List::iterator
)
));
this.keys = new ArrayList<>(grouped.keySet());
@gharris1727 (Contributor), Jul 1, 2024:

Is it possible for this key set to coincide across different workers? For example, if connector "a" always showed up first in the listing.

If so, then connector "a" would be the first thing revoked from all of the existing workers, and "a" could be concentrated on the new worker.
}

@Override
public boolean hasNext() {
return grouped.values().stream().anyMatch(Iterator::hasNext);
}

@Override
public E next() {
            // Scan at most one full cycle over the groups; if every group
            // iterator is exhausted, fall through and return null.
            int start = k;
            while (!this.keys.isEmpty() && k < start + this.keys.size()) {
Iterator<E> iterator = grouped.get(this.keys.get(k % this.keys.size()));
k++;
if (iterator.hasNext()) {
return iterator.next();
}
}
return null;
}
}
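To make the revocation ordering concrete, here is a standalone sketch (hypothetical class and method names, not code from this PR) of the group-aware round-robin behaviour that BalancedIterator implements: items are bucketed by a group key, then drained one element per bucket in turn, so revocations interleave across connectors instead of draining one connector's tasks first.

```java
import java.util.*;
import java.util.function.Function;
import java.util.stream.Collectors;

// Hypothetical demo of group-aware round-robin iteration.
public class BalancedIterDemo {

    static <E> List<E> interleaveByGroup(Collection<E> items, Function<E, String> grouper) {
        // LinkedHashMap keeps the bucket order deterministic for the demo
        Map<String, Iterator<E>> grouped = items.stream().collect(Collectors.groupingBy(
                grouper,
                LinkedHashMap::new,
                Collectors.collectingAndThen(Collectors.toList(), List::iterator)));
        List<String> keys = new ArrayList<>(grouped.keySet());
        List<E> out = new ArrayList<>();
        int k = 0;
        while (out.size() < items.size()) {
            // Visit buckets cyclically, skipping exhausted ones
            Iterator<E> it = grouped.get(keys.get(k % keys.size()));
            k++;
            if (it.hasNext()) {
                out.add(it.next());
            }
        }
        return out;
    }

    public static void main(String[] args) {
        List<String> tasks = Arrays.asList("c1-0", "c1-1", "c1-2", "c2-0", "c2-1");
        // group by connector name (the prefix before the dash)
        System.out.println(interleaveByGroup(tasks, t -> t.split("-")[0]));
        // prints [c1-0, c2-0, c1-1, c2-1, c1-2]
    }
}
```

With a plain iterator the order would be [c1-0, c1-1, c1-2, c2-0, c2-1], so a revocation of three tasks would take all of c1's tasks; the interleaved order spreads the revocation across both connectors.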

/**
* Perform a round-robin assignment of tasks to workers with existing worker load. This
* assignment tries to balance the load between workers, by assigning tasks to workers that
@@ -802,10 +842,9 @@ protected void assignConnectors(List<WorkerLoad> workerAssignment, Collection<St
* @param tasks the tasks to be assigned
*/
protected void assignTasks(List<WorkerLoad> workerAssignment, Collection<ConnectorTaskId> tasks) {
workerAssignment.sort(WorkerLoad.taskComparator());
WorkerLoad first = workerAssignment.get(0);

-        Iterator<ConnectorTaskId> load = tasks.iterator();
+        Iterator<ConnectorTaskId> load = new BalancedIterator<>(tasks, ConnectorTaskId::connector);
while (load.hasNext()) {
int firstLoad = first.tasksSize();
int upTo = IntStream.range(0, workerAssignment.size())
@@ -131,6 +131,46 @@ public void testTaskAssignmentWhenWorkerJoins() {
assertEmptyAssignment();
}

@Test
public void testConnectorWellBalancedOnScaleOut() {
// Customize assignor for this test case
time = new MockTime();
initAssignor();
connectors.clear();

// Add first connector
addNewConnector("connector1", 12);
performStandardRebalance();
assertDelay(0);

// add second connector
addNewConnector("connector2", 12);
performStandardRebalance();
assertDelay(0);

// add second worker
addNewEmptyWorkers("worker2");
performStandardRebalance();
performStandardRebalance();
assertDelay(0);

// add third worker
addNewEmptyWorkers("worker3");
performStandardRebalance();
performStandardRebalance();
assertDelay(0);

// assert the connectors are well balanced
// over the workers
assertEquals(3, memberAssignments.size());
memberAssignments.forEach((k, v) -> {
Contributor:
I added an assertion like this (but generic) to assertBalancedAllocation and saw that there are other unit tests which leave the tasks for individual connectors unbalanced.

For example, testTaskAssignmentWhenLeaderBounces has this allocation at one point:

"worker2" -> "{ connectorIds=[connector2], taskIds=[connector1-1, connector2-0, connector2-3, connector2-2]}"
"worker3" -> "{ connectorIds=[connector1], taskIds=[connector1-2, connector2-1, connector1-0, connector1-3]}"

I think this means that we also need to adjust the allocation strategy with a similar strategy to the one you've implemented for revocation.

Otherwise the scale-up scenario is the only one fixed, and there could be other situations that cause unbalance.

Author:
thanks, I will have a look at it

Author:
I refactored everything in BalancedIterator and added it to assignTasks

Contributor:
I think there are still some scenarios that would lead to unbalanced per-connector task allocations across the cluster. We may need to perform an additional revocation to get to the state we want.

Demonstration

This is one possible scenario that could force us to perform an additional revocation in order to preserve balance in the allocation of total tasks per worker, and tasks per connector per worker.

Initial state

We start with three workers (W1, W2, and W3) and four connectors. Connector C1 is configured with 1 task, connector C2 with 6 tasks, connector C3 with 2 tasks, and connector C4 with 1 task.

The exact distribution of tasks across workers is:

W1: C1 C2 C2 C4
W2: C2 C2 C3
W3: C2 C2 C3

RIP W3

Then, worker W3 dies.

Unallocated: C2 C2 C3
W1: C1 C2 C2 C4
W2: C2 C2 C3

We now have to choose how to re-allocate the tasks from W3 across our two remaining workers.

Option 1: Allocate one C3 task to W1, and two C2 tasks to W2

W1: C1 C2 C2 C4 | C3
W2: C2 C2 C3    | C2 C2

This is unbalanced for C2's tasks (2 on W1, 4 on W2)

Option 2: Allocate one C2 task to each worker, and one C3 task to W2

W1: C1 C2 C2 C4 | C2
W2: C2 C2 C3    | C2 C3

This is unbalanced for C3's tasks (0 on W1, 2 on W2)

Option 3: Allocate one C2 task to each worker, and one C3 task to W1

W1: C1 C2 C2 C4 | C2 C3
W2: C2 C2 C3    | C2

This is unbalanced for total task counts (6 on W1, 4 on W2)

Option 4: Revocation + re-allocation

First, we revoke a C1 task from W1:

W1:    C2 C2 C4
W2: C2 C2 C3

Then we allocate one C2 task to each worker, one C3 task to W1, and one C1 task to W2:

W1:    C2 C2 C4 | C2 C3
W2: C2 C2 C3    | C2 C1

This leads to a balanced allocation in total tasks and tasks per connector across workers.
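As a quick sanity check of that claim, the Option 4 end state can be verified programmatically (hypothetical helper code, not part of the PR): both workers should hold the same total number of tasks within one, and each connector's count should differ by at most one between the workers.

```java
import java.util.*;
import java.util.function.Function;
import java.util.stream.Collectors;

// Hypothetical check of the Option 4 allocation described above.
public class Option4Check {

    static boolean balanced(List<String> w1, List<String> w2) {
        // global balance: total task counts differ by at most 1
        if (Math.abs(w1.size() - w2.size()) > 1) {
            return false;
        }
        Map<String, Long> c1 = countByConnector(w1);
        Map<String, Long> c2 = countByConnector(w2);
        Set<String> connectors = new HashSet<>(c1.keySet());
        connectors.addAll(c2.keySet());
        // local balance: per-connector counts differ by at most 1
        return connectors.stream().allMatch(conn ->
                Math.abs(c1.getOrDefault(conn, 0L) - c2.getOrDefault(conn, 0L)) <= 1);
    }

    static Map<String, Long> countByConnector(List<String> tasks) {
        return tasks.stream().collect(Collectors.groupingBy(Function.identity(), Collectors.counting()));
    }

    public static void main(String[] args) {
        // Option 4 end state: W1 keeps C2 C2 C4 and gains C2 C3;
        // W2 keeps C2 C2 C3 and gains C2 C1.
        List<String> w1 = Arrays.asList("C2", "C2", "C4", "C2", "C3");
        List<String> w2 = Arrays.asList("C2", "C2", "C3", "C2", "C1");
        System.out.println(balanced(w1, w2)); // prints "true"
    }
}
```

Running the same check against Option 1 (W1 gains only C3, W2 gains two C2 tasks) returns false, since C2 ends up with 2 tasks on W1 and 4 on W2.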

Test case

The following test case can be copy+pasted into the IncrementalCooperativeAssignorTest suite and should demonstrate the above scenario:

@Test
public void testForceUnbalancedPerConnectorTaskAllocation() {
    // Customize assignor for this test case
    time = new MockTime();
    initAssignor();

    final String c1 = "connector1";
    final String c2 = "connector2";
    final String c3 = "connector3";
    final String c4 = "connector4";

    final String w1 = "worker1";
    final String w2 = "worker2";
    final String w3 = "worker3";

    connectors.clear();
    addNewConnector(c1, 1);
    addNewConnector(c2, 6);
    addNewConnector(c3, 2);
    addNewConnector(c4, 1);

    removeWorkers(w1);
    int c1Tasks = -1;
    int c2Tasks = -1;
    int c3Tasks = -1;
    int c4Tasks = -1;
    addNewWorker(
            w1,
            Arrays.asList(c1, c4),
            Arrays.asList(
                    new ConnectorTaskId(c1, ++c1Tasks),
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c4, ++c4Tasks)
            )
    );
    addNewWorker(
            w2,
            Arrays.asList(c2),
            Arrays.asList(
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c3, ++c3Tasks)
            )
    );
    addNewWorker(
            w3,
            Arrays.asList(c3),
            Arrays.asList(
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c2, ++c2Tasks),
                    new ConnectorTaskId(c3, ++c3Tasks)
            )
    );

    // Initial rebalance: should result in no change in allocation
    performStandardRebalance();
    assertDelay(0);
    assertBalancedAndCompleteAllocation();

    // RIP W3
    // This round should result in no assignments since we need to wait for the delay to expire
    removeWorkers(w3);
    performStandardRebalance();
    assertDelay(rebalanceDelay);

    // After the delay has expired, W3's connectors and total tasks should be reallocated
    // evenly across the cluster
    time.sleep(rebalanceDelay);
    performStandardRebalance();
    assertDelay(0);
    assertBalancedAndCompleteAllocation();

    // However, the allocation of tasks per connector is not even;
    // at least one of the following assertions should fail
    for (String connector : Arrays.asList(c1, c2, c3, c4)) {
        long w1Tasks = memberAssignments.get(w1).tasks().stream()
                .filter(taskId -> connector.equals(taskId.connector()))
                .count();
        long w2Tasks = memberAssignments.get(w2).tasks().stream()
                .filter(taskId -> connector.equals(taskId.connector()))
                .count();
        long allocationDiff = Math.abs(w1Tasks - w2Tasks);
        assertTrue(
                allocationDiff <= 1,
                "Tasks are not allocated evenly across remaining workers for connector " + connector
                        + "; worker 1 was assigned " + w1Tasks + " tasks and worker 2 was assigned " + w2Tasks + " tasks"
        );
    }
}

Conclusion

Even if we do implement the logic to perform the additional revocation for the scenario above, I don't know if it's a good idea. More task revocations will lead to more task downtime and more rebalances (which can cause temporary unavailability for portions of the cluster's REST API). Those are not dealbreakers, but when coupled with the fact that connector loads may still vary greatly within a cluster, it's unclear that this improvement would buy us much, especially in cases where there are more workers than the number of tasks per connector.

@yazgoo @gharris1727 what are your thoughts?

Contributor:
Wow, thanks for finding that test case and rebalance situation! I suspected this wouldn't be so easy :)

This is a tradeoff between:

  • Job continuity (not being interrupted while running)
  • Job availability (running instead of being unassigned)
  • Global balance (workers each run approximately the same number of jobs)
  • Local balance (connectors have approximately the same number of jobs on each worker)

The existing algorithm prioritizes job continuity before the rebalance timeout expires, and global balance afterwards. I would probably prefer to follow this pattern for the local balance, and rely on the rebalance timeout to limit the impact on job continuity. I think local balance is a good property to have, especially because we don't have resource-aware-scheduling.

If we were to prioritize job continuity over local balance and not perform these additional revocations, what happens on an upgrade to a cluster with a very poor existing balance? I think if the rolling upgrade was performed within the rebalance timeout, the existing balance could remain after the upgrade.

Perhaps the workers could end up in a state like this:

W1: C1 C3 C4
W2: C2 C2 C2
W3: C2 C2 C2

After W3 dies, but we prioritize global balance + continuity over local balance:

W1: C1 C3 C4 C2 C2
W2: C2 C2 C2 C2

After W3 rejoins, it could end up in the original state, or like this, depending on the connector-name-ordering:

W1: C1 C3 C2
W2: C2 C2 C2
W3: C2 C2 C4

I think W2 will maintain that homogeneous allocation until it is offline for more than the rebalance timeout.

Collaborator:
@gharris1727, just wanted to ask why you think local balance is a good property to have. It is somewhat hard to predict how tasks will behave, but with global balancing (as described above) we already try to ensure that all workers run more or less the same number of tasks. We would still guarantee that with this new algorithm, but considering the heterogeneity of Connect tasks and how load patterns can change over time for tasks of the same or different connectors, what advantage do we get from achieving local balance?

I am just asking because, from what I have seen, the best assignment in terms of running tasks right now might not hold true a few hours later if load patterns change, considering we don't have resource-aware scheduling. Just wanted to know your thoughts on this.

Contributor:
@vamossagar12 Local balance is a good property to have in situations where tasks of the same connector have similar resource requirements. For example, if connector A is memory-heavy, it makes sense to try to distribute it around the cluster evenly to avoid exhausting the memory capacity of any one worker.

A locally-balanced cluster should "average" the resource requirements of these heterogeneous connectors.

If the tasks of a connector are very heterogeneous (such as task 0 being high-load and all others being low-load) the local-balance strategy will be ineffective. I don't expect that it will be harmful, but I don't have any evidence for this.

Do you have an alternative property that you think we should use instead?

Collaborator:
@gharris1727, thanks for the explanation. Yes, I agree that when the tasks have similar resource requirements, local balancing might yield better results. Having said that, it might not hold true for all the connectors deployed on a given Connect cluster, so we might end up optimising for something which may or may not be true for all of them. I also don't think it would be harmful to always opt for local balancing, but what might still happen is that resource-heavy tasks from two different heterogeneous connectors (say, task 0 of connectors c1 and c2) get scheduled on the same worker, which puts load on that worker. This may or may not happen with the global balancing strategy.

The main point I am trying to make here is that the benefits of local balancing versus global balancing are hard to quantify and really depend on the connectors. So if we go ahead and make the changes suggested in this PR, we might solve the local balancing problem but could, in theory, introduce imbalances for clusters that are better served by global balancing alone (connectors running heterogeneous tasks). Maybe we keep both strategies and let users choose based on the kind of connectors they run (this might need a KIP), since they are best placed to make that decision. Do you think that would be overkill?

BTW, I am not at all against the changes in this PR. I just feel that in the absence of any quantifiable way of assigning tasks (like metrics or load usage), we could pivot either way, and the overall benefits might even out depending on the nature of the tasks and how their behaviour changes over time.

Contributor:
Even I don't think it would be harmful to always opt for Local balancing but what might still end up happening is that resource-heavy tasks from 2 different heterogenous connectors (let's say task-0 of 2 connectors c1 and c2)
get scheduled on the same worker which puts load on the worker.

I agree that this is problematic, but it isn't a problem that we can currently solve in resource-unaware scheduling. Before we have resource-aware-scheduling, we should take steps to improve the algorithm that we do have.

The main point I am trying to make here is that the benefits of Local balancing v/s Global balancing is hard to quantify and really depends upon the connectors.

It isn't global vs local balancing, it's global + local balancing. Nobody is proposing that we move away from global balancing, that will still be in place. Additionally, the "local balancing" is not a totally new property. If you look at the assignTasks algorithm when run against an empty cluster, such as in testAssignTasksWhenBalanced(), it produces a locally-balanced assignment. The thing addressed here is that after successive generations, the assignment is no longer locally-balanced like it would be if there was just one round of assignments.

Maybe, we keep both strategies and let users choose based on the kind of connectors they run (might need a KIP) since they are best placed to make that decision based on the connectors they run. Do you think that would be an overkill?

Certainly. If we're introducing a KIP to change the rebalance protocol, I would want it to solve the problem holistically instead of just adding a configuration to use a different revocation algorithm. This is a change within the bounds of backwards-compatibility, because the revocation and balance algorithm was never officially specified.

Map<String, List<ConnectorTaskId>> countsByConnector = v.tasks().stream().collect(Collectors.groupingBy(ConnectorTaskId::connector));
assertEquals(2, countsByConnector.size());
countsByConnector.forEach((k2, v2) -> assertEquals(4, v2.size()));
});
assertBalancedAndCompleteAllocation();
}

@Test
public void testAssignmentsWhenWorkersJoinAfterRevocations() {
// Customize assignor for this test case