feat(consumer): Support incremental cooperative rebalancing #53

Merged
10 commits merged on Apr 1, 2022
150 changes: 97 additions & 53 deletions arroyo/backends/kafka/consumer.py
@@ -143,9 +143,10 @@ class KafkaConsumer(Consumer[KafkaPayload]):

def __init__(
self,
configuration: Mapping[str, Any],
configuration: MutableMapping[str, Any],
*,
commit_retry_policy: Optional[RetryPolicy] = None,
incremental_cooperative: bool = False,
) -> None:
if commit_retry_policy is None:
commit_retry_policy = NoRetryPolicy()
@@ -182,6 +183,11 @@ def __init__(
"invalid value for 'enable.auto.offset.store' configuration"
)

self.__incremental_cooperative = incremental_cooperative

if self.__incremental_cooperative is True:
configuration["partition.assignment.strategy"] = "cooperative-sticky"
Contributor:

Why provide incremental_cooperative as a dedicated flag instead of passing it through the configuration mapping like all the other config parameters?

Member Author (@lynnagara), Mar 31, 2022:

I had it the other way originally, but figured it was easier to pass a boolean than to remember these strings and then check for them to decide whether to apply incremental_assign. Thinking about it again, I might switch back to avoid changing the interface of this class though.

Contributor:

> I might switch back to avoid changing the interface of this class though.

Also, we would not reintroduce two separate ways to provide Kafka config, which took us a long time to clean up.

Member Author (@lynnagara):

There was only one way. Passing the flag was the only way that would have worked.

Contributor:

I am talking about all those fields we were passing via CLI that we are slowly moving to settings.

Member Author (@lynnagara), Apr 1, 2022:

Unfortunately, passing via CLI is still the easiest option currently, as we don't yet have a mechanism to provide different settings for the consumers and producers of a topic via settings, and this is a consumer-only configuration.
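
For illustration, a minimal sketch of the two approaches being discussed, assuming the KafkaConsumer constructor from this diff (the import path, broker address, and group id are placeholders):

from arroyo.backends.kafka import KafkaConsumer  # import path assumed from this repository's layout

# Approach taken in this revision: a dedicated constructor flag. The consumer then sets
# "partition.assignment.strategy" to "cooperative-sticky" internally, as shown above.
consumer = KafkaConsumer(
    {
        "bootstrap.servers": "localhost:9092",  # placeholder broker
        "group.id": "my-group",                 # placeholder group id
        "auto.offset.reset": "earliest",
        "enable.auto.commit": False,
        "enable.auto.offset.store": False,
    },
    incremental_cooperative=True,
)

# Alternative raised in this thread: put the strategy in the configuration mapping itself
# and have the consumer detect it before deciding whether to use incremental assignment.
configuration = {
    "bootstrap.servers": "localhost:9092",
    "group.id": "my-group",
    "partition.assignment.strategy": "cooperative-sticky",
}
use_incremental = configuration.get("partition.assignment.strategy") == "cooperative-sticky"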


# NOTE: Offsets are explicitly managed as part of the assignment
# callback, so preemptively resetting offsets is not enabled.
self.__consumer = ConfluentConsumer(
@@ -246,40 +252,74 @@ def assignment_callback(
) -> None:
self.__state = KafkaConsumerState.ASSIGNING

try:
assignment: MutableSequence[ConfluentTopicPartition] = []

for partition in self.__consumer.committed(partitions):
if partition.offset >= 0:
assignment.append(partition)
elif partition.offset == OFFSET_INVALID:
assignment.append(
self.__resolve_partition_starting_offset(partition)
)
else:
raise ValueError("received unexpected offset")

offsets: MutableMapping[Partition, int] = {
Partition(Topic(i.topic), i.partition): i.offset for i in assignment
}
self.__seek(offsets)

# Ensure that all partitions are resumed on assignment to avoid
# carrying over state from a previous assignment.
self.__consumer.resume(
[
ConfluentTopicPartition(
partition.topic.name, partition.index, offset
)
for partition, offset in offsets.items()
]
)
if self.__incremental_cooperative is True:
Member Author (@lynnagara):

This diff got pretty weird because of indentation. The block from here to line 273 is new, though, and could use a close review. It's quite different from what happens with eager rebalancing (lines 276-305), which is essentially unchanged.

try:
incremental_assignment: MutableSequence[
ConfluentTopicPartition
] = []

for partition in partitions:
Contributor:

If I am getting this right, you are no longer asking the broker for the last committed offset.
That means you are invoking incremental_assign with the offsets you received in the assignment_callback call.
Is this intentional? In the stop-the-world rebalancing, fetching the last committed offset and seeking to it was meant to ensure that all partitions behaved the same way (whether or not they were previously assigned to the same consumer): all partitions would be reset to the last committed offset.
I would expect it to be impossible, in the incremental case, to receive a partition you already owned (unless the consumer restarted). Is this guaranteed, or can you still be assigned a partition you already owned before rebalancing?
If it is guaranteed and all partitions you receive are "new" to this consumer, are you not resetting the offset because the offsets you receive are supposed to already be the last committed ones?

Member Author (@lynnagara):

I don't think you can receive a partition you already owned, but in any case I don't quite get why we would need to check the offset, since the offset you are receiving should already be the correct one. The other issue I noticed with committed() is that it hangs forever (or times out if you pass it a timeout) with the cooperative-sticky strategy in the scenario where it's a new consumer group and no offset has been committed yet.
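
For reference, a sketch of bounding that committed() lookup with a timeout so it fails fast instead of hanging, using the confluent_kafka API directly (the five-second timeout is an arbitrary choice, and falling back to the callback-provided offsets is an assumption of this sketch, not what the PR does):

from confluent_kafka import Consumer, KafkaException

def committed_or_fallback(consumer: Consumer, partitions: list) -> list:
    # committed() blocks while it queries the broker; with cooperative-sticky and a
    # brand-new consumer group it was observed above to hang, so bound the call.
    try:
        return consumer.committed(partitions, timeout=5.0)
    except KafkaException:
        # On timeout or broker error, fall back to the offsets delivered
        # with the assignment callback.
        return partitions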

Contributor:

This will be important to verify.
The reason for getting the committed() offsets is so that all partitions start in a consistent way from the last committed offset after a rebalance (without doing so, the partitions that are reassigned to you would start from the last consumed offset).
This behavior is visible to the application, but if we commit during revoke we should not have any issue, as the two behaviors would be identical.
If we never receive a partition we already owned and we consistently commit on revoke, we are good. But if we fail to commit during revoke and we get the same partition we owned in the past, I don't know what would happen if we do not reset the offsets.
If committed() takes much longer, then it is probably a non-starter. Could you please verify that, even if we did receive the same partition again on subscriptions (where we are testing this), we will not risk missing messages?

Member Author (@lynnagara), Mar 31, 2022:

> The reason for getting the committed() offsets is so that all partitions start in a consistent way from the last committed offset after a rebalance (without doing so the partitions that are reassigned to you would start from the last consumed offset).

I don't think this is true. The offsets passed to the assignment callback are already the committed ones, not just the ones that have been consumed.

Kafka guarantees that:

  • only new partitions are passed in this callback, not previously owned ones;
  • the revoke callback is always triggered before the assignment one.

The reason for committing offsets during revoke is to avoid double-processing, so the new consumer doesn't get the same offset again. But we wouldn't be skipping it either way - only processing it once or twice.
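
As a rough illustration of the commit-on-revoke idea, against the raw confluent_kafka API rather than this class (broker, group, and topic names are placeholders; error handling and offset bookkeeping are omitted):

from confluent_kafka import Consumer

consumer = Consumer(
    {
        "bootstrap.servers": "localhost:9092",
        "group.id": "my-group",
        "partition.assignment.strategy": "cooperative-sticky",
        "enable.auto.commit": False,
    }
)

def on_revoke(consumer: Consumer, partitions: list) -> None:
    # Commit the current positions of the partitions being taken away so that their
    # next owner resumes from where this consumer stopped, avoiding double processing.
    consumer.commit(offsets=consumer.position(partitions), asynchronous=False)
    consumer.incremental_unassign(partitions)

consumer.subscribe(["events"], on_revoke=on_revoke)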

Contributor:

> The offsets passed to the assignment callback are already the committed ones not just the ones that are consumed.

Are you sure? I thought that was the reason for making this consumer behave differently from the standard Kafka consumer: https://github.com/getsentry/arroyo/blob/main/arroyo/backends/kafka/consumer.py#L109-L118.

Anyway, if Kafka guarantees that only new partitions are passed and not previously owned ones, we should be good.

Member Author (@lynnagara), Apr 1, 2022:

Yes, but this only applies to the partitions that are being newly assigned to the consumer. Previously, all of the partitions (including those already assigned to the consumer) would be provided in the callback; now only the incremental ones are. So we are no longer rewinding the partitions the consumer keeps across a rebalance like we used to; those just continue from the same place.
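
A small companion sketch of the guarantee described here: with cooperative-sticky, the rebalance callback receives only the partitions being added, and incremental_assign merges them into the existing assignment rather than replacing it (raw confluent_kafka API, placeholder names again):

from confluent_kafka import Consumer

consumer = Consumer(
    {
        "bootstrap.servers": "localhost:9092",
        "group.id": "my-group",
        "partition.assignment.strategy": "cooperative-sticky",
    }
)

def on_assign(consumer: Consumer, partitions: list) -> None:
    # `partitions` contains only the newly added partitions, never ones already owned.
    consumer.incremental_assign(partitions)
    print("added:", [(p.topic, p.partition) for p in partitions])
    print("now owned:", len(consumer.assignment()))

consumer.subscribe(["events"], on_assign=on_assign)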

if partition.offset >= 0:
incremental_assignment.append(partition)
elif partition.offset == OFFSET_INVALID:
incremental_assignment.append(
self.__resolve_partition_starting_offset(partition)
)
else:
raise ValueError("received unexpected offset")

offsets = {
Partition(Topic(i.topic), i.partition): i.offset
for i in incremental_assignment
}

self.__incremental_assign(offsets)

# Ensure that all partitions are resumed on assignment to avoid
# carrying over state from a previous assignment.
self.resume([p for p in offsets])

except Exception:
self.__state = KafkaConsumerState.ERROR
raise

for partition in offsets:
self.__paused.discard(partition)
except Exception:
self.__state = KafkaConsumerState.ERROR
raise
else:
try:
assignment: MutableSequence[ConfluentTopicPartition] = []

for partition in self.__consumer.committed(partitions):
if partition.offset >= 0:
assignment.append(partition)
elif partition.offset == OFFSET_INVALID:
assignment.append(
self.__resolve_partition_starting_offset(partition)
)
else:
raise ValueError("received unexpected offset")

offsets = {
Partition(Topic(i.topic), i.partition): i.offset
for i in assignment
}

self.__assign(offsets)

# Ensure that all partitions are resumed on assignment to avoid
# carrying over state from a previous assignment.
self.__consumer.resume(
[
ConfluentTopicPartition(
partition.topic.name, partition.index, offset
)
for partition, offset in offsets.items()
]
)

for partition in offsets:
self.__paused.discard(partition)
Contributor:

Any reason for relying on the resume method in the incremental path while reimplementing its logic here for the stop-the-world rebalancing?

Member Author (@lynnagara):

No reason, I just mostly avoided touching this implementation (it's just indented differently, so it shows up here). But yes, it's cleaner to reuse resume everywhere; I'll switch it over.

except Exception:
self.__state = KafkaConsumerState.ERROR
raise

try:
if on_assign is not None:
@@ -431,29 +471,33 @@ def __validate_offsets(self, offsets: Mapping[Partition, int]) -> None:
if invalid_offsets:
raise ConsumerError(f"invalid offsets: {invalid_offsets!r}")

def __assign(self, offsets: Mapping[Partition, int]) -> None:
self.__validate_offsets(offsets)
self.__consumer.assign(
[
ConfluentTopicPartition(partition.topic.name, partition.index, offset)
for partition, offset in offsets.items()
]
)
self.__offsets.update(offsets)

def __incremental_assign(self, offsets: Mapping[Partition, int]) -> None:
self.__validate_offsets(offsets)
self.__consumer.incremental_assign(
[
ConfluentTopicPartition(partition.topic.name, partition.index, offset)
for partition, offset in offsets.items()
]
)
self.__offsets.update(offsets)

def __seek(self, offsets: Mapping[Partition, int]) -> None:
self.__validate_offsets(offsets)

if self.__state is KafkaConsumerState.ASSIGNING:
# Calling ``seek`` on the Confluent consumer from an assignment
# callback will throw an "Erroneous state" error. Instead,
# partition offsets have to be initialized by calling ``assign``.
self.__consumer.assign(
[
ConfluentTopicPartition(
partition.topic.name, partition.index, offset
)
for partition, offset in offsets.items()
]
for partition, offset in offsets.items():
self.__consumer.seek(
ConfluentTopicPartition(partition.topic.name, partition.index, offset)
Contributor (@fpacifici), Mar 31, 2022:

Why this change? Are we never going to get to this method during assignment?

Member Author (@lynnagara):

I found it pretty unintuitive that the same __seek implementation was called from both seek() and the assignment callback, and then checked the KafkaConsumerState to effectively determine which one was making the call. Now the assign logic is separate and never calls this __seek function anymore.

Contributor:

Also, this method is now only called by the public seek method. Why not inline it there?

Member Author (@lynnagara):

I was avoiding touching a lot of code earlier, but yes, it is better inlined since nothing else calls it now. Updated.
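
For reference, the inlined public seek might look roughly like this (a sketch derived from the __seek body shown above, not necessarily the code as merged):

def seek(self, offsets: Mapping[Partition, int]) -> None:
    """Seek the given partitions to the given offsets."""
    self.__validate_offsets(offsets)

    for partition, offset in offsets.items():
        self.__consumer.seek(
            ConfluentTopicPartition(partition.topic.name, partition.index, offset)
        )

    self.__offsets.update(offsets)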

)
else:
for partition, offset in offsets.items():
self.__consumer.seek(
ConfluentTopicPartition(
partition.topic.name, partition.index, offset
)
)

self.__offsets.update(offsets)

def seek(self, offsets: Mapping[Partition, int]) -> None:
103 changes: 89 additions & 14 deletions tests/backends/test_kafka.py
@@ -6,7 +6,7 @@
from contextlib import closing
from datetime import datetime
from pickle import PickleBuffer
from typing import Iterator, MutableSequence, Optional
from typing import Any, Iterator, Mapping, MutableSequence, Optional
from unittest import TestCase

import pytest
@@ -46,6 +46,25 @@ def test_payload_pickle_out_of_band() -> None:
assert pickle.loads(data, buffers=[b.raw() for b in buffers]) == payload


@contextlib.contextmanager
def get_topic(
configuration: Mapping[str, Any], partitions_count: int
) -> Iterator[Topic]:
name = f"test-{uuid.uuid1().hex}"
client = AdminClient(configuration)
[[key, future]] = client.create_topics(
[NewTopic(name, num_partitions=partitions_count, replication_factor=1)]
).items()
assert key == name
assert future.result() is None
try:
yield Topic(name)
finally:
[[key, future]] = client.delete_topics([name]).items()
assert key == name
assert future.result() is None
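
Example usage of this new module-level helper outside the test class (the broker address is a placeholder):

configuration = {"bootstrap.servers": "localhost:9092"}

with get_topic(configuration, partitions_count=2) as topic:
    # The topic exists for the duration of the block and is deleted on exit.
    print(topic.name)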


class KafkaStreamsTestCase(StreamsTestMixin[KafkaPayload], TestCase):

configuration = build_kafka_configuration(
@@ -54,19 +73,11 @@ class KafkaStreamsTestCase(StreamsTestMixin[KafkaPayload], TestCase):

@contextlib.contextmanager
def get_topic(self, partitions: int = 1) -> Iterator[Topic]:
name = f"test-{uuid.uuid1().hex}"
client = AdminClient(self.configuration)
[[key, future]] = client.create_topics(
[NewTopic(name, num_partitions=partitions, replication_factor=1)]
).items()
assert key == name
assert future.result() is None
try:
yield Topic(name)
finally:
[[key, future]] = client.delete_topics([name]).items()
assert key == name
assert future.result() is None
with get_topic(self.configuration, partitions) as topic:
try:
yield topic
finally:
pass

def get_consumer(
self,
@@ -133,6 +144,70 @@ def test_auto_offset_reset_error(self) -> None:
consumer.poll(10.0) # XXX: getting the subscription is slow


def test_cooperative_rebalancing() -> None:
configuration = build_kafka_configuration(
{"bootstrap.servers": os.environ.get("DEFAULT_BROKERS", "localhost:9092")}
)

partitions_count = 2

group_id = uuid.uuid1().hex
producer = KafkaProducer(configuration)

consumer_a = KafkaConsumer(
{
**configuration,
"auto.offset.reset": "earliest",
"enable.auto.commit": False,
"enable.auto.offset.store": False,
"group.id": group_id,
"session.timeout.ms": 10000,
},
incremental_cooperative=True,
)
consumer_b = KafkaConsumer(
{
**configuration,
"auto.offset.reset": "earliest",
"enable.auto.commit": False,
"enable.auto.offset.store": False,
"group.id": group_id,
"session.timeout.ms": 10000,
},
incremental_cooperative=True,
)
Contributor:

Thanks.
By the way, what happens if some of the consumers are incremental and others are not? In other words, what will happen at the first deployment?

Member Author (@lynnagara):

We can't combine cooperative and non-cooperative consumers in the same group. I'm not sure of any other solution apart from stopping them all and restarting them all with the new configuration.

Contributor:

Ok, let's do it some day when I am on PTO.
Out of curiosity, what happens if you add a consumer that uses the incremental rebalancing system to a group that is using the standard system?


with get_topic(configuration, partitions_count) as topic, closing(
producer
), closing(consumer_a), closing(consumer_b):
for i in range(10):
for j in range(partitions_count):
producer.produce(
Partition(topic, j),
KafkaPayload(None, f"{j}-{i}".encode("utf8"), []),
)

consumer_a.subscribe([topic])
Contributor:

Why not provide callbacks so that you can assert that only one partition is transferred?

Member Author (@lynnagara), Mar 31, 2022:

I guess that could've worked too. Still, this method of checking the assigned partitions via consumer.tell() works well enough for checking the same thing, and it's copied from the eager consumer's test.

Contributor:

Right, but there is no way to tell whether all partitions were revoked and then reassigned, or whether the incremental assignment actually works.

Member Author (@lynnagara), Mar 31, 2022:

Yeah, this was not about testing the Kafka consumer internals, just that we end up with one partition assigned to each consumer and that consuming on both works OK.
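
A sketch of the callback-based assertion suggested above, slotted into the test after consumer_b.subscribe (the on_assign signature, a mapping of Partition to offset, is assumed from this file's assignment_callback; this is illustrative, not part of the merged test):

assignments_b = []

def record_assignment(offsets) -> None:
    # Record each assignment handed to consumer B during rebalancing.
    assignments_b.append(dict(offsets))

consumer_b.subscribe([topic], on_assign=record_assignment)

# ... after the poll loop ...
# With cooperative rebalancing, each callback invocation for consumer B should carry
# exactly one new partition rather than the full set.
assert all(len(offsets) == 1 for offsets in assignments_b)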


assert consumer_a.poll(10.0) is not None

# Consumer A has 2 partitions assigned, B has none
assert len(consumer_a.tell()) == 2
assert len(consumer_b.tell()) == 0

consumer_b.subscribe([topic])
consumer_a.pause([Partition(topic, 0), Partition(topic, 1)])

# At some point, 1 partition will move to consumer B
for i in range(10):
assert consumer_a.poll(0) is None # attempt to force session timeout
if consumer_b.poll(1.0) is not None:
break

assert len(consumer_a.tell()) == 1
assert len(consumer_b.tell()) == 1


def test_commit_codec() -> None:
commit = Commit("group", Partition(Topic("topic"), 0), 0, datetime.now())
assert commit_codec.decode(commit_codec.encode(commit)) == commit