-
Notifications
You must be signed in to change notification settings - Fork 14.8k
MINOR: Initialize fetchPartitionStatus as a Map type to reduce collection conversions #20768
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -30,6 +30,7 @@ import org.apache.kafka.server.purgatory.DelayedOperation | |
| import org.apache.kafka.server.storage.log.{FetchIsolation, FetchParams, FetchPartitionData} | ||
| import org.apache.kafka.storage.internals.log.{FetchPartitionStatus, LogOffsetMetadata} | ||
|
|
||
| import java.util | ||
| import scala.collection._ | ||
| import scala.jdk.CollectionConverters._ | ||
|
|
||
|
|
@@ -39,7 +40,7 @@ import scala.jdk.CollectionConverters._ | |
| */ | ||
| class DelayedFetch( | ||
| params: FetchParams, | ||
| fetchPartitionStatus: Seq[(TopicIdPartition, FetchPartitionStatus)], | ||
| fetchPartitionStatus: util.LinkedHashMap[TopicIdPartition, FetchPartitionStatus], | ||
| replicaManager: ReplicaManager, | ||
| quota: ReplicaQuota, | ||
| responseCallback: Seq[(TopicIdPartition, FetchPartitionData)] => Unit | ||
|
|
@@ -66,79 +67,78 @@ class DelayedFetch( | |
| */ | ||
| override def tryComplete(): Boolean = { | ||
| var accumulatedSize = 0 | ||
| fetchPartitionStatus.foreach { | ||
| case (topicIdPartition, fetchStatus) => | ||
| val fetchOffset = fetchStatus.startOffsetMetadata | ||
| val fetchLeaderEpoch = fetchStatus.fetchInfo.currentLeaderEpoch | ||
| try { | ||
| if (fetchOffset != LogOffsetMetadata.UNKNOWN_OFFSET_METADATA) { | ||
| val partition = replicaManager.getPartitionOrException(topicIdPartition.topicPartition) | ||
| val offsetSnapshot = partition.fetchOffsetSnapshot(fetchLeaderEpoch, params.fetchOnlyLeader) | ||
|
|
||
| val endOffset = params.isolation match { | ||
| case FetchIsolation.LOG_END => offsetSnapshot.logEndOffset | ||
| case FetchIsolation.HIGH_WATERMARK => offsetSnapshot.highWatermark | ||
| case FetchIsolation.TXN_COMMITTED => offsetSnapshot.lastStableOffset | ||
| } | ||
| fetchPartitionStatus.forEach { (topicIdPartition, fetchStatus) => | ||
| val fetchOffset = fetchStatus.startOffsetMetadata | ||
| val fetchLeaderEpoch = fetchStatus.fetchInfo.currentLeaderEpoch | ||
| try { | ||
| if (fetchOffset != LogOffsetMetadata.UNKNOWN_OFFSET_METADATA) { | ||
| val partition = replicaManager.getPartitionOrException(topicIdPartition.topicPartition) | ||
| val offsetSnapshot = partition.fetchOffsetSnapshot(fetchLeaderEpoch, params.fetchOnlyLeader) | ||
|
|
||
| val endOffset = params.isolation match { | ||
| case FetchIsolation.LOG_END => offsetSnapshot.logEndOffset | ||
| case FetchIsolation.HIGH_WATERMARK => offsetSnapshot.highWatermark | ||
| case FetchIsolation.TXN_COMMITTED => offsetSnapshot.lastStableOffset | ||
| } | ||
|
|
||
| // Go directly to the check for Case G if the message offsets are the same. If the log segment | ||
| // has just rolled, then the high watermark offset will remain the same but be on the old segment, | ||
| // which would incorrectly be seen as an instance of Case F. | ||
| if (fetchOffset.messageOffset > endOffset.messageOffset) { | ||
| // Case F, this can happen when the new fetch operation is on a truncated leader | ||
| debug(s"Satisfying fetch $this since it is fetching later segments of partition $topicIdPartition.") | ||
| return forceComplete() | ||
| } else if (fetchOffset.messageOffset < endOffset.messageOffset) { | ||
| if (fetchOffset.onOlderSegment(endOffset)) { | ||
| // Case F, this can happen when the fetch operation is falling behind the current segment | ||
| // or the partition has just rolled a new segment | ||
| debug(s"Satisfying fetch $this immediately since it is fetching older segments.") | ||
| // We will not force complete the fetch request if a replica should be throttled. | ||
| if (!params.isFromFollower || !replicaManager.shouldLeaderThrottle(quota, partition, params.replicaId)) | ||
| return forceComplete() | ||
| } else if (fetchOffset.onSameSegment(endOffset)) { | ||
| // we take the partition fetch size as upper bound when accumulating the bytes (skip if a throttled partition) | ||
| val bytesAvailable = math.min(endOffset.positionDiff(fetchOffset), fetchStatus.fetchInfo.maxBytes) | ||
| if (!params.isFromFollower || !replicaManager.shouldLeaderThrottle(quota, partition, params.replicaId)) | ||
| accumulatedSize += bytesAvailable | ||
| } | ||
| // Go directly to the check for Case G if the message offsets are the same. If the log segment | ||
| // has just rolled, then the high watermark offset will remain the same but be on the old segment, | ||
| // which would incorrectly be seen as an instance of Case F. | ||
| if (fetchOffset.messageOffset > endOffset.messageOffset) { | ||
| // Case F, this can happen when the new fetch operation is on a truncated leader | ||
| debug(s"Satisfying fetch $this since it is fetching later segments of partition $topicIdPartition.") | ||
| return forceComplete() | ||
| } else if (fetchOffset.messageOffset < endOffset.messageOffset) { | ||
| if (fetchOffset.onOlderSegment(endOffset)) { | ||
| // Case F, this can happen when the fetch operation is falling behind the current segment | ||
| // or the partition has just rolled a new segment | ||
| debug(s"Satisfying fetch $this immediately since it is fetching older segments.") | ||
| // We will not force complete the fetch request if a replica should be throttled. | ||
| if (!params.isFromFollower || !replicaManager.shouldLeaderThrottle(quota, partition, params.replicaId)) | ||
| return forceComplete() | ||
| } else if (fetchOffset.onSameSegment(endOffset)) { | ||
| // we take the partition fetch size as upper bound when accumulating the bytes (skip if a throttled partition) | ||
| val bytesAvailable = math.min(endOffset.positionDiff(fetchOffset), fetchStatus.fetchInfo.maxBytes) | ||
| if (!params.isFromFollower || !replicaManager.shouldLeaderThrottle(quota, partition, params.replicaId)) | ||
| accumulatedSize += bytesAvailable | ||
| } | ||
| } | ||
|
|
||
| // Case H: If truncation has caused diverging epoch while this request was in purgatory, return to trigger truncation | ||
| fetchStatus.fetchInfo.lastFetchedEpoch.ifPresent { fetchEpoch => | ||
| val epochEndOffset = partition.lastOffsetForLeaderEpoch(fetchLeaderEpoch, fetchEpoch, fetchOnlyFromLeader = false) | ||
| if (epochEndOffset.errorCode != Errors.NONE.code() | ||
| || epochEndOffset.endOffset == UNDEFINED_EPOCH_OFFSET | ||
| || epochEndOffset.leaderEpoch == UNDEFINED_EPOCH) { | ||
| debug(s"Could not obtain last offset for leader epoch for partition $topicIdPartition, epochEndOffset=$epochEndOffset.") | ||
| return forceComplete() | ||
| } else if (epochEndOffset.leaderEpoch < fetchEpoch || epochEndOffset.endOffset < fetchStatus.fetchInfo.fetchOffset) { | ||
| debug(s"Satisfying fetch $this since it has diverging epoch requiring truncation for partition " + | ||
| s"$topicIdPartition epochEndOffset=$epochEndOffset fetchEpoch=$fetchEpoch fetchOffset=${fetchStatus.fetchInfo.fetchOffset}.") | ||
| return forceComplete() | ||
| } | ||
| // Case H: If truncation has caused diverging epoch while this request was in purgatory, return to trigger truncation | ||
| fetchStatus.fetchInfo.lastFetchedEpoch.ifPresent { fetchEpoch => | ||
| val epochEndOffset = partition.lastOffsetForLeaderEpoch(fetchLeaderEpoch, fetchEpoch, fetchOnlyFromLeader = false) | ||
| if (epochEndOffset.errorCode != Errors.NONE.code() | ||
| || epochEndOffset.endOffset == UNDEFINED_EPOCH_OFFSET | ||
| || epochEndOffset.leaderEpoch == UNDEFINED_EPOCH) { | ||
| debug(s"Could not obtain last offset for leader epoch for partition $topicIdPartition, epochEndOffset=$epochEndOffset.") | ||
| return forceComplete() | ||
| } else if (epochEndOffset.leaderEpoch < fetchEpoch || epochEndOffset.endOffset < fetchStatus.fetchInfo.fetchOffset) { | ||
| debug(s"Satisfying fetch $this since it has diverging epoch requiring truncation for partition " + | ||
| s"$topicIdPartition epochEndOffset=$epochEndOffset fetchEpoch=$fetchEpoch fetchOffset=${fetchStatus.fetchInfo.fetchOffset}.") | ||
| return forceComplete() | ||
| } | ||
| } | ||
| } catch { | ||
| case _: NotLeaderOrFollowerException => // Case A or Case B | ||
| debug(s"Broker is no longer the leader or follower of $topicIdPartition, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: UnknownTopicOrPartitionException => // Case C | ||
| debug(s"Broker no longer knows of partition $topicIdPartition, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: KafkaStorageException => // Case D | ||
| debug(s"Partition $topicIdPartition is in an offline log directory, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: FencedLeaderEpochException => // Case E | ||
| debug(s"Broker is the leader of partition $topicIdPartition, but the requested epoch " + | ||
| s"$fetchLeaderEpoch is fenced by the latest leader epoch, satisfy $this immediately") | ||
| return forceComplete() | ||
| } | ||
| } catch { | ||
| case _: NotLeaderOrFollowerException => // Case A or Case B | ||
| debug(s"Broker is no longer the leader or follower of $topicIdPartition, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: UnknownTopicOrPartitionException => // Case C | ||
| debug(s"Broker no longer knows of partition $topicIdPartition, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: KafkaStorageException => // Case D | ||
| debug(s"Partition $topicIdPartition is in an offline log directory, satisfy $this immediately") | ||
| return forceComplete() | ||
| case _: FencedLeaderEpochException => // Case E | ||
| debug(s"Broker is the leader of partition $topicIdPartition, but the requested epoch " + | ||
| s"$fetchLeaderEpoch is fenced by the latest leader epoch, satisfy $this immediately") | ||
| return forceComplete() | ||
| } | ||
| } | ||
|
|
||
| // Case G | ||
| if (accumulatedSize >= params.minBytes) | ||
| forceComplete() | ||
| forceComplete() | ||
| else | ||
| false | ||
| } | ||
|
|
@@ -154,9 +154,9 @@ class DelayedFetch( | |
| * Upon completion, read whatever data is available and pass to the complete callback | ||
| */ | ||
| override def onComplete(): Unit = { | ||
| val fetchInfos = fetchPartitionStatus.map { case (tp, status) => | ||
| val fetchInfos = fetchPartitionStatus.asScala.iterator.map { case (tp, status) => | ||
| tp -> status.fetchInfo | ||
| } | ||
| }.toBuffer | ||
|
|
||
| val logReadResults = replicaManager.readFromLog( | ||
|
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Perhaps There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Iterators can be exhausted and hence are a bit more brittle. I would only use them as a method parameter if there is a meaningful difference in performance. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. fair enough |
||
| params, | ||
|
|
||
Uh oh!
There was an error while loading. Please reload this page.