This is an automated email from the ASF dual-hosted git repository.
lianetm pushed a commit to branch 4.1
in repository https://gitbox.apache.org/repos/asf/kafka.git
The following commit(s) were added to refs/heads/4.1 by this push:
new 38652f763dc KAFKA-19356: Prevent new consumer fetch assigned
partitions not in explicit subscription (#19983)
38652f763dc is described below
commit 38652f763dc29ca83756bde32b97afe111c9fef9
Author: Lianet Magrans <[email protected]>
AuthorDate: Wed Jun 18 18:31:46 2025 -0400
KAFKA-19356: Prevent new consumer fetch assigned partitions not in explicit
subscription (#19983)
Fix to ensure assigned partitions whose topics are not in the consumer's
explicit subscription are considered not fetchable (so that no records
are returned on poll for them).
This scenario could happen in the new async consumer (using the Consumer
rebalance protocol) when the subscription changes, because the consumer
will keep its assignment until the coordinator sends a new one (broker
drives assignments).
This does not happen in the classic consumer because the assignment
logic lives on the client-side, so the consumer proactively updates
the assignment as needed.
This PR validates assignment vs. subscription on fetch for explicit
subscriptions only. Regular-expression and shared subscriptions remain
unchanged (the regex case is still under discussion and will be handled
separately if needed).
Reviewers: Andrew Schofield <[email protected]>, TengYao Chi
<[email protected]>, Kirk True <[email protected]>, Jhen-Yung Hsu
<[email protected]>
---
.../clients/consumer/internals/FetchCollector.java | 5 +-
.../consumer/internals/SubscriptionState.java | 19 ++++-
.../consumer/internals/SubscriptionStateTest.java | 80 ++++++++++++++++++++++
3 files changed, 100 insertions(+), 4 deletions(-)
diff --git
a/clients/src/main/java/org/apache/kafka/clients/consumer/internals/FetchCollector.java
b/clients/src/main/java/org/apache/kafka/clients/consumer/internals/FetchCollector.java
index 2aa8aeaaffb..bbe216c2fc8 100644
---
a/clients/src/main/java/org/apache/kafka/clients/consumer/internals/FetchCollector.java
+++
b/clients/src/main/java/org/apache/kafka/clients/consumer/internals/FetchCollector.java
@@ -155,7 +155,10 @@ public class FetchCollector<K, V> {
log.debug("Not returning fetched records for partition {} since it
is no longer assigned", tp);
} else if (!subscriptions.isFetchable(tp)) {
// this can happen when a partition is paused before fetched
records are returned to the consumer's
- // poll call or if the offset is being reset
+ // poll call or if the offset is being reset.
+ // It can also happen under the Consumer rebalance protocol, when
the consumer changes its subscription.
+ // Until the consumer receives an updated assignment from the
coordinator, it can hold assigned partitions
+ // that are not in the subscription anymore, so we make them not
fetchable.
log.debug("Not returning fetched records for assigned partition {}
since it is no longer fetchable", tp);
} else {
SubscriptionState.FetchPosition position =
subscriptions.position(tp);
diff --git
a/clients/src/main/java/org/apache/kafka/clients/consumer/internals/SubscriptionState.java
b/clients/src/main/java/org/apache/kafka/clients/consumer/internals/SubscriptionState.java
index e048ab90b1c..4659f4cf0cd 100644
---
a/clients/src/main/java/org/apache/kafka/clients/consumer/internals/SubscriptionState.java
+++
b/clients/src/main/java/org/apache/kafka/clients/consumer/internals/SubscriptionState.java
@@ -487,7 +487,7 @@ public class SubscriptionState {
List<TopicPartition> result = new ArrayList<>();
assignment.forEach((topicPartition, topicPartitionState) -> {
// Cheap check is first to avoid evaluating the predicate if
possible
- if ((subscriptionType.equals(SubscriptionType.AUTO_TOPICS_SHARE)
|| topicPartitionState.isFetchable())
+ if ((subscriptionType.equals(SubscriptionType.AUTO_TOPICS_SHARE)
|| isFetchableAndSubscribed(topicPartition, topicPartitionState))
&& isAvailable.test(topicPartition)) {
result.add(topicPartition);
}
@@ -495,6 +495,19 @@ public class SubscriptionState {
return result;
}
+ /**
+ * Check if the partition is fetchable.
+ * If the consumer has explicitly subscribed to a list of topic names,
+ * this will also check that the partition is contained in the
subscription.
+ */
+ private synchronized boolean isFetchableAndSubscribed(TopicPartition
topicPartition, TopicPartitionState topicPartitionState) {
+ if (subscriptionType.equals(SubscriptionType.AUTO_TOPICS) &&
!subscription.contains(topicPartition.topic())) {
+ log.trace("Assigned partition {} is not in the subscription {} so
will be considered not fetchable.", topicPartition, subscription);
+ return false;
+ }
+ return topicPartitionState.isFetchable();
+ }
+
public synchronized boolean hasAutoAssignedPartitions() {
return this.subscriptionType == SubscriptionType.AUTO_TOPICS ||
this.subscriptionType == SubscriptionType.AUTO_PATTERN
|| this.subscriptionType == SubscriptionType.AUTO_TOPICS_SHARE
|| this.subscriptionType == SubscriptionType.AUTO_PATTERN_RE2J;
@@ -879,8 +892,8 @@ public class SubscriptionState {
}
synchronized boolean isFetchable(TopicPartition tp) {
- TopicPartitionState assignedOrNull = assignedStateOrNull(tp);
- return assignedOrNull != null && assignedOrNull.isFetchable();
+ TopicPartitionState tps = assignedStateOrNull(tp);
+ return tps != null && isFetchableAndSubscribed(tp, tps);
}
public synchronized boolean hasValidPosition(TopicPartition tp) {
diff --git
a/clients/src/test/java/org/apache/kafka/clients/consumer/internals/SubscriptionStateTest.java
b/clients/src/test/java/org/apache/kafka/clients/consumer/internals/SubscriptionStateTest.java
index 064664d2f4d..eae791dc830 100644
---
a/clients/src/test/java/org/apache/kafka/clients/consumer/internals/SubscriptionStateTest.java
+++
b/clients/src/test/java/org/apache/kafka/clients/consumer/internals/SubscriptionStateTest.java
@@ -38,9 +38,12 @@ import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;
import java.util.HashSet;
+import java.util.List;
import java.util.Optional;
import java.util.Set;
+import java.util.concurrent.atomic.AtomicBoolean;
import java.util.function.LongSupplier;
+import java.util.function.Predicate;
import java.util.regex.Pattern;
import static java.util.Collections.singleton;
@@ -115,6 +118,54 @@ public class SubscriptionStateTest {
assertEquals(0, state.numAssignedPartitions());
}
+ @Test
+ public void testIsFetchableOnManualAssignment() {
+ state.assignFromUser(Set.of(tp0, tp1));
+ assertAssignedPartitionIsFetchable();
+ }
+
+ @Test
+ public void testIsFetchableOnAutoAssignment() {
+ state.subscribe(Set.of(topic), Optional.of(rebalanceListener));
+ state.assignFromSubscribed(Set.of(tp0, tp1));
+ assertAssignedPartitionIsFetchable();
+ }
+
+ private void assertAssignedPartitionIsFetchable() {
+ assertEquals(2, state.assignedPartitions().size());
+ assertTrue(state.assignedPartitions().contains(tp0));
+ assertTrue(state.assignedPartitions().contains(tp1));
+
+ assertFalse(state.isFetchable(tp0), "Should not be fetchable without a
valid position");
+ assertFalse(state.isFetchable(tp1), "Should not be fetchable without a
valid position");
+
+ state.seek(tp0, 1);
+ state.seek(tp1, 1);
+
+ assertTrue(state.isFetchable(tp0));
+ assertTrue(state.isFetchable(tp1));
+ }
+
+ @Test
+ public void testIsFetchableConsidersExplicitTopicSubscription() {
+ state.subscribe(Set.of(topic1), Optional.of(rebalanceListener));
+ state.assignFromSubscribed(Set.of(t1p0));
+ state.seek(t1p0, 1);
+
+ assertEquals(Set.of(t1p0), state.assignedPartitions());
+ assertTrue(state.isFetchable(t1p0));
+
+ // Change subscription. Assigned partitions should remain unchanged
but not fetchable.
+ state.subscribe(Set.of(topic), Optional.of(rebalanceListener));
+ assertEquals(Set.of(t1p0), state.assignedPartitions());
+ assertFalse(state.isFetchable(t1p0), "Assigned partitions not in the
subscription should not be fetchable");
+
+ // Unsubscribe. Assigned partitions should be cleared and not
fetchable.
+ state.unsubscribe();
+ assertTrue(state.assignedPartitions().isEmpty());
+ assertFalse(state.isFetchable(t1p0));
+ }
+
@Test
public void testGroupSubscribe() {
state.subscribe(singleton(topic1), Optional.of(rebalanceListener));
@@ -1073,4 +1124,33 @@ public class SubscriptionStateTest {
assertThrows(IllegalStateException.class, () ->
state.isOffsetResetNeeded(unassignedPartition));
}
+
+ // This test ensures the "fetchablePartitions" does not run the custom
predicate if the partition is not fetchable
+ // This func is used in the hot path for fetching, to find fetchable
partitions that are not in the buffer,
+ // so it should avoid evaluating the predicate if not needed.
+ @Test
+ public void testFetchablePartitionsPerformsCheapChecksFirst() {
+ // Setup fetchable partition and pause it
+ state.assignFromUser(Set.of(tp0));
+ state.seek(tp0, 100);
+ assertTrue(state.isFetchable(tp0));
+ state.pause(tp0);
+
+ // Retrieve fetchable partitions with custom predicate.
+ AtomicBoolean predicateEvaluated = new AtomicBoolean(false);
+ Predicate<TopicPartition> isBuffered = tp -> {
+ predicateEvaluated.set(true);
+ return true;
+ };
+ List<TopicPartition> fetchablePartitions =
state.fetchablePartitions(isBuffered);
+ assertTrue(fetchablePartitions.isEmpty());
+ assertFalse(predicateEvaluated.get(), "Custom predicate should not be
evaluated when partitions are not fetchable");
+
+ // Resume partition and retrieve fetchable again
+ state.resume(tp0);
+ predicateEvaluated.set(false);
+ fetchablePartitions = state.fetchablePartitions(isBuffered);
+ assertTrue(predicateEvaluated.get());
+ assertEquals(tp0, fetchablePartitions.get(0));
+ }
}