diff --git a/docs/src/main/mdoc/consumers.md b/docs/src/main/mdoc/consumers.md index 2e04dcb9b..ff3859282 100644 --- a/docs/src/main/mdoc/consumers.md +++ b/docs/src/main/mdoc/consumers.md @@ -547,6 +547,49 @@ You may notice, that actual graceful shutdown implementation requires a decent a Also note, that even if you implement a graceful shutdown your application may fall with an error. And in this case, a graceful shutdown will not be invoked. It means that your application should be ready to an _at least once_ semantic even when a graceful shutdown is implemented. Or, if you need an _exactly once_ semantic, consider using [transactions](transactions.md). +### Graceful partition revoke + +In addition to graceful shutdown of hole consumer there is an option to configure your consumer to wait for the streams +to finish processing partition before "releasing" it. Behavior can be enabled via the following settings: +```scala mdoc:silent +object WithGracefulPartitionRevoke extends IOApp.Simple { + + val run: IO[Unit] = { + def processRecord(record: CommittableConsumerRecord[IO, String, String]): IO[Unit] = + IO(println(s"Processing record: $record")) + + def run(consumer: KafkaConsumer[IO, String, String]): IO[Unit] = { + consumer.subscribeTo("topic") >> consumer + .stream + .evalMap { msg => + processRecord(msg).as(msg.offset) + } + .through(commitBatchWithin(100, 15.seconds)) + .compile + .drain + } + + val consumerSettings = ConsumerSettings[IO, String, String] = + ConsumerSettings[IO, String, String] + .withRebalanceRevokeMode(RebalanceRevokeMode.Graceful) + .withSessionTimeout(2.seconds) + + KafkaConsumer + .resource(consumerSettings) + .use { consumer => + run(consumer) + } + } + +} +``` + +Please note that this setting does not guarantee that all the commits will be performed before partition is revoked and +that `session.timeout.ms` setting is set to lower value. Be aware that awaiting too long for partition processor +to finish will cause processing of the whole topic to be suspended. + +Awaiting for commits to complete might be implemented in the future. + [commitrecovery-default]: @API_BASE_URL@/CommitRecovery$.html#Default:fs2.kafka.CommitRecovery [committableconsumerrecord]: @API_BASE_URL@/CommittableConsumerRecord.html [committableoffset]: @API_BASE_URL@/CommittableOffset.html diff --git a/modules/core/src/main/scala/fs2/kafka/ConsumerSettings.scala b/modules/core/src/main/scala/fs2/kafka/ConsumerSettings.scala index 5d3290797..92f847d18 100644 --- a/modules/core/src/main/scala/fs2/kafka/ConsumerSettings.scala +++ b/modules/core/src/main/scala/fs2/kafka/ConsumerSettings.scala @@ -8,14 +8,14 @@ package fs2.kafka import scala.concurrent.duration.* import scala.concurrent.ExecutionContext - import cats.effect.Resource import cats.Show import fs2.kafka.security.KafkaCredentialStore - import org.apache.kafka.clients.consumer.ConsumerConfig import org.apache.kafka.common.requests.OffsetFetchResponse +import scala.util.Try + /** * [[ConsumerSettings]] contain settings necessary to create a [[KafkaConsumer]]. At the very * least, this includes key and value deserializers.

@@ -151,6 +151,18 @@ sealed abstract class ConsumerSettings[F[_], K, V] { */ def withMaxPollInterval(maxPollInterval: FiniteDuration): ConsumerSettings[F, K, V] + + /** + * Returns value for property: + * + * {{{ + * ConsumerConfig.SESSION_TIMEOUT_MS_CONFIG + * }}} + * + * Returns a value as a [[FiniteDuration]] for convenience + */ + def sessionTimeout: FiniteDuration + /** * Returns a new [[ConsumerSettings]] instance with the specified session timeout. This is * equivalent to setting the following property using the [[withProperty]] function, except you @@ -373,6 +385,17 @@ sealed abstract class ConsumerSettings[F[_], K, V] { */ def withCredentials(credentialsStore: KafkaCredentialStore): ConsumerSettings[F, K, V] + /** + * One of two possible modes of operation for [[KafkaConsumer.partitionsMapStream]]. See [[RebalanceRevokeMode]] + * for detailed explanation of differences between them. + */ + def rebalanceRevokeMode: RebalanceRevokeMode + + /** + * Creates a new [[ConsumerSettings]] with the specified [[rebalanceRevokeMode]]. + */ + def withRebalanceRevokeMode(rebalanceRevokeMode: RebalanceRevokeMode): ConsumerSettings[F, K, V] + } object ConsumerSettings { @@ -388,7 +411,8 @@ object ConsumerSettings { override val pollTimeout: FiniteDuration, override val commitRecovery: CommitRecovery, override val recordMetadata: ConsumerRecord[K, V] => String, - override val maxPrefetchBatches: Int + override val maxPrefetchBatches: Int, + override val rebalanceRevokeMode: RebalanceRevokeMode ) extends ConsumerSettings[F, K, V] { override def withCustomBlockingContext(ec: ExecutionContext): ConsumerSettings[F, K, V] = @@ -422,6 +446,13 @@ object ConsumerSettings { override def withMaxPollInterval(maxPollInterval: FiniteDuration): ConsumerSettings[F, K, V] = withProperty(ConsumerConfig.MAX_POLL_INTERVAL_MS_CONFIG, maxPollInterval.toMillis.toString) + //need to use Try, to avoid separate implementation for scala 2.12 + override def sessionTimeout: FiniteDuration = + properties.get(ConsumerConfig.SESSION_TIMEOUT_MS_CONFIG) + .flatMap(str => Try(str.toLong).toOption) + .map(_.millis) + .getOrElse(45000.millis) + override def withSessionTimeout(sessionTimeout: FiniteDuration): ConsumerSettings[F, K, V] = withProperty(ConsumerConfig.SESSION_TIMEOUT_MS_CONFIG, sessionTimeout.toMillis.toString) @@ -509,6 +540,11 @@ object ConsumerSettings { ): ConsumerSettings[F, K, V] = withProperties(credentialsStore.properties) + override def withRebalanceRevokeMode( + rebalanceRevokeMode: RebalanceRevokeMode + ): ConsumerSettings[F, K, V] = + copy(rebalanceRevokeMode = rebalanceRevokeMode) + override def toString: String = s"ConsumerSettings(closeTimeout = $closeTimeout, commitTimeout = $commitTimeout, pollInterval = $pollInterval, pollTimeout = $pollTimeout, commitRecovery = $commitRecovery)" @@ -542,7 +578,8 @@ object ConsumerSettings { pollTimeout = 50.millis, commitRecovery = CommitRecovery.Default, recordMetadata = _ => OffsetFetchResponse.NO_METADATA, - maxPrefetchBatches = 2 + maxPrefetchBatches = 2, + rebalanceRevokeMode = RebalanceRevokeMode.Eager ) def apply[F[_], K, V]( diff --git a/modules/core/src/main/scala/fs2/kafka/KafkaConsumer.scala b/modules/core/src/main/scala/fs2/kafka/KafkaConsumer.scala index 57eb13ca9..c52fe843b 100644 --- a/modules/core/src/main/scala/fs2/kafka/KafkaConsumer.scala +++ b/modules/core/src/main/scala/fs2/kafka/KafkaConsumer.scala @@ -7,13 +7,11 @@ package fs2.kafka import java.util - import scala.annotation.nowarn import scala.collection.immutable.SortedSet import scala.concurrent.duration.FiniteDuration import scala.util.matching.Regex - -import cats.{Foldable, Functor, Reducible} +import cats.{Applicative, Foldable, Functor, Reducible} import cats.data.{NonEmptySet, OptionT} import cats.effect.* import cats.effect.implicits.* @@ -28,7 +26,6 @@ import fs2.kafka.internal.converters.collection.* import fs2.kafka.internal.syntax.* import fs2.kafka.internal.KafkaConsumerActor.* import fs2.kafka.internal.LogEntry.{RevokedPreviousFetch, StoredFetch} - import org.apache.kafka.clients.consumer.{OffsetAndMetadata, OffsetAndTimestamp} import org.apache.kafka.common.{Metric, MetricName, PartitionInfo, TopicPartition} @@ -151,7 +148,8 @@ object KafkaConsumer { def partitionStream( streamId: StreamId, partition: TopicPartition, - assignmentRevoked: F[Unit] + assignmentRevoked: F[Unit], + signalCompletion: F[Unit] ): Stream[F, CommittableConsumerRecord[F, K, V]] = Stream.force { for { chunks <- chunkQueue @@ -238,7 +236,9 @@ object KafkaConsumer { .fromQueueNoneTerminated(chunks) .flatMap(Stream.chunk) .covary[F] - .onFinalize(dequeueDone.complete(()).void) + //Previously all the revoke logic was done on the polling stream, not handling stream + //with new `signalCompletion` there is possibility for more graceful consumer revoke logic + .onFinalize(dequeueDone.complete(()) *> signalCompletion) } } .flatten @@ -246,15 +246,15 @@ object KafkaConsumer { def enqueueAssignment( streamId: StreamId, - assigned: Map[TopicPartition, Deferred[F, Unit]], + assigned: Map[TopicPartition, AssignmentSignals[F]], partitionsMapQueue: PartitionsMapQueue ): F[Unit] = stopConsumingDeferred .tryGet .flatMap { case None => - val assignment: PartitionsMap = assigned.map { case (partition, finisher) => - partition -> partitionStream(streamId, partition, finisher.get) + val assignment = assigned.map { case (partition, assignmentSignals) => + partition -> partitionStream(streamId, partition, assignmentSignals.awaitStreamTerminationSignal, assignmentSignals.signalStreamFinished.void) } partitionsMapQueue.offer(Some(assignment)) case Some(()) => @@ -263,24 +263,26 @@ object KafkaConsumer { def onRebalance( streamId: StreamId, - assignmentRef: Ref[F, Map[TopicPartition, Deferred[F, Unit]]], + assignmentRef: Ref[F, Map[TopicPartition, AssignmentSignals[F]]], partitionsMapQueue: PartitionsMapQueue ): OnRebalance[F] = OnRebalance( onRevoked = revoked => { - for { + val finishSignals = for { finishers <- assignmentRef.modify(_.partition(entry => !revoked.contains(entry._1))) - _ <- finishers.toVector.traverse { case (_, finisher) => finisher.complete(()) } - } yield () + revokeFinishers <- finishers + .toVector + .traverse { + case (_, assignmentSignals) => + assignmentSignals.signalStreamToTerminate.as(assignmentSignals.awaitStreamFinishedSignal) + } + } yield revokeFinishers + + finishSignals.flatMap(revokes => revokes.sequence_) }, onAssigned = assignedPartitions => { for { - assignment <- assignedPartitions - .toVector - .traverse { partition => - Deferred[F, Unit].map(partition -> _) - } - .map(_.toMap) + assignment <- buildAssignment(assignedPartitions) _ <- assignmentRef.update(_ ++ assignment) _ <- enqueueAssignment( streamId = streamId, @@ -291,11 +293,29 @@ object KafkaConsumer { } ) + def buildAssignment( + assignedPartitions: SortedSet[TopicPartition] + ): F[Map[TopicPartition, AssignmentSignals[F]]] = { + assignedPartitions + .toVector + .traverse { partition => + settings.rebalanceRevokeMode match { + case RebalanceRevokeMode.EagerMode => + Deferred[F, Unit].map(streamFinisher => partition -> AssignmentSignals.eager(streamFinisher)) + case RebalanceRevokeMode.GracefulMode => + (Deferred[F, Unit], Deferred[F, Unit]).mapN { (streamFinisher, revokeFinisher) => + partition -> AssignmentSignals.graceful(streamFinisher, revokeFinisher) + } + } + } + .map(_.toMap) + } + def requestAssignment( streamId: StreamId, - assignmentRef: Ref[F, Map[TopicPartition, Deferred[F, Unit]]], + assignmentRef: Ref[F, Map[TopicPartition, AssignmentSignals[F]]], partitionsMapQueue: PartitionsMapQueue - ): F[Map[TopicPartition, Deferred[F, Unit]]] = { + ): F[Map[TopicPartition, AssignmentSignals[F]]] = { val assignment = this.assignment( Some( onRebalance( @@ -312,18 +332,13 @@ object KafkaConsumer { F.pure(Map.empty) case Right(assigned) => - assigned - .toVector - .traverse { partition => - Deferred[F, Unit].map(partition -> _) - } - .map(_.toMap) + buildAssignment(assigned) } } def initialEnqueue( streamId: StreamId, - assignmentRef: Ref[F, Map[TopicPartition, Deferred[F, Unit]]], + assignmentRef: Ref[F, Map[TopicPartition, AssignmentSignals[F]]], partitionsMapQueue: PartitionsMapQueue ): F[Unit] = for { @@ -343,7 +358,7 @@ object KafkaConsumer { partitionsMapQueue <- Stream.eval(Queue.unbounded[F, Option[PartitionsMap]]) streamId <- Stream.eval(streamIdRef.modify(n => (n + 1, n))) assignmentRef <- Stream - .eval(Ref[F].of(Map.empty[TopicPartition, Deferred[F, Unit]])) + .eval(Ref[F].of(Map.empty[TopicPartition, AssignmentSignals[F]])) _ <- Stream.eval( initialEnqueue( streamId, @@ -825,6 +840,40 @@ object KafkaConsumer { } + /** + * Utility class to provide clarity for internals. + * Goal is to make [[RebalanceRevokeMode]] transparent to the rest of implementation internals. + * @tparam F effect used + */ + private sealed abstract class AssignmentSignals[F[_]] { + def signalStreamToTerminate: F[Boolean] + def awaitStreamTerminationSignal: F[Unit] + def signalStreamFinished: F[Boolean] + def awaitStreamFinishedSignal: F[Unit] + } + + private object AssignmentSignals { + + def eager[F[_]: Applicative](streamFinisher: Deferred[F, Unit]): AssignmentSignals[F] = EagerSignals(streamFinisher) + def graceful[F[_]](streamFinisher: Deferred[F, Unit], revokeFinisher: Deferred[F, Unit]): AssignmentSignals[F] = + GracefulSignals[F](streamFinisher, revokeFinisher) + + final case class EagerSignals[F[_]: Applicative](streamFinisher: Deferred[F, Unit]) extends AssignmentSignals[F] { + override def signalStreamToTerminate: F[Boolean] = streamFinisher.complete(()) + override def awaitStreamTerminationSignal: F[Unit] = streamFinisher.get + override def signalStreamFinished: F[Boolean] = true.pure[F] + override def awaitStreamFinishedSignal: F[Unit] = ().pure[F] + } + + final case class GracefulSignals[F[_]](streamFinisher: Deferred[F, Unit], revokeFinisher: Deferred[F, Unit]) extends AssignmentSignals[F] { + override def signalStreamToTerminate: F[Boolean] = streamFinisher.complete(()) + override def awaitStreamTerminationSignal: F[Unit] = streamFinisher.get + override def signalStreamFinished: F[Boolean] = revokeFinisher.complete(()) + override def awaitStreamFinishedSignal: F[Unit] = revokeFinisher.get + } + + } + /* * Prevents the default `MkConsumer` instance from being implicitly available * to code defined in this object, ensuring factory methods require an instance diff --git a/modules/core/src/main/scala/fs2/kafka/RebalanceRevokeMode.scala b/modules/core/src/main/scala/fs2/kafka/RebalanceRevokeMode.scala new file mode 100644 index 000000000..e8e62a6d2 --- /dev/null +++ b/modules/core/src/main/scala/fs2/kafka/RebalanceRevokeMode.scala @@ -0,0 +1,42 @@ +package fs2.kafka + +/** + * The available options for [[ConsumerSettings#rebalanceRevokeMode]].

+ * + * Available options include:
+ * - [[RebalanceRevokeMode.Eager]] old behaviour, to release assigned partition as soon as possible,
+ * - [[RebalanceRevokeMode.Graceful]] modified behavior, waiting for configured amount of time: + * {{{org.apache.kafka.clients.consumer.ConsumerConfig.SESSION_TIMEOUT_MS_CONFIG}}} It is guaranteed by kafka protocol + * that after that timeout old consumer will be marked as dead. + * + * Default mode is [[RebalanceRevokeMode.Eager]] which is exactly the same as old behavior and can be preferred + * if rebalance need to happen as quickly as possible and having multiple consumers working on a partition for a moment + * is not a problem. + * + * On the other hand if you want stricter guarantees about processing and attempt to wait for existing streams to finish + * processing messages before releasing partition choose [[RebalanceRevokeMode.Graceful]]. + * Because stream is signalled to be shutdown in-flight commits might be lost and some messages might be processed again + * after new assignment. + * + */ +sealed abstract class RebalanceRevokeMode + +object RebalanceRevokeMode { + + private[kafka] case object EagerMode extends RebalanceRevokeMode + + private[kafka] case object GracefulMode extends RebalanceRevokeMode + + /** + * Old behavior releasing partition as soon as all streams have messages dispatched and signalled termination + */ + val Eager: RebalanceRevokeMode = EagerMode + + /** + * Waiting for configured amount of time:
+ * [[ConsumerSettings#withMaxPollInterval]] * 5 or until all the partition streams finish processing (but not waiting + * for commits to conclude for that partition) + */ + val Graceful: RebalanceRevokeMode = GracefulMode + +} diff --git a/modules/core/src/main/scala/fs2/kafka/internal/KafkaConsumerActor.scala b/modules/core/src/main/scala/fs2/kafka/internal/KafkaConsumerActor.scala index 6a1f4fe02..e2c049625 100644 --- a/modules/core/src/main/scala/fs2/kafka/internal/KafkaConsumerActor.scala +++ b/modules/core/src/main/scala/fs2/kafka/internal/KafkaConsumerActor.scala @@ -230,7 +230,7 @@ final private[kafka] class KafkaConsumerActor[F[_], K, V]( res.completeWithRecords >> res.completeWithoutRecords >> res.removeRevokedRecords >> - onRevoked + onRevoked.timeout(settings.sessionTimeout) //just to be extra-safe timeout this revoke } } @@ -630,7 +630,7 @@ private[kafka] object KafkaConsumerActor { final case class OnRebalance[F[_]]( onAssigned: SortedSet[TopicPartition] => F[Unit], - onRevoked: SortedSet[TopicPartition] => F[Unit] + onRevoked: SortedSet[TopicPartition] => F[Unit], ) { override def toString: String =