forked from apache/kafka
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
KAFKA-14462; [14/N] Add PartitionWriter (apache#13675)
This patch introduces the `PartitionWriter` interface in the `group-coordinator` module. The `ReplicaManager` resides in the `core` module and it is thus not accessible from the `group-coordinator` one. The `CoordinatorPartitionWriter` is basically an implementation of the interface residing in `core` which interfaces with the `ReplicaManager`. One notable difference from the usual produce path is that the `PartitionWriter` returns the offset following the written records. This is then used by the coordinator runtime to track when the request associated with the write can be completed. Reviewers: Jeff Kim <[email protected]>, Justine Olshan <[email protected]>
- Loading branch information
Showing
13 changed files
with
755 additions
and
28 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
175 changes: 175 additions & 0 deletions
175
core/src/main/scala/kafka/coordinator/group/CoordinatorPartitionWriter.scala
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,175 @@ | ||
/* | ||
* Licensed to the Apache Software Foundation (ASF) under one or more | ||
* contributor license agreements. See the NOTICE file distributed with | ||
* this work for additional information regarding copyright ownership. | ||
* The ASF licenses this file to You under the Apache License, Version 2.0 | ||
* (the "License"); you may not use this file except in compliance with | ||
* the License. You may obtain a copy of the License at | ||
* | ||
* http:https://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
package kafka.coordinator.group | ||
|
||
import kafka.cluster.PartitionListener | ||
import kafka.server.{ActionQueue, ReplicaManager} | ||
import org.apache.kafka.common.TopicPartition | ||
import org.apache.kafka.common.errors.RecordTooLargeException | ||
import org.apache.kafka.common.protocol.Errors | ||
import org.apache.kafka.common.record.{CompressionType, MemoryRecords, TimestampType} | ||
import org.apache.kafka.common.record.Record.EMPTY_HEADERS | ||
import org.apache.kafka.common.requests.ProduceResponse.PartitionResponse | ||
import org.apache.kafka.common.utils.Time | ||
import org.apache.kafka.coordinator.group.runtime.PartitionWriter | ||
import org.apache.kafka.storage.internals.log.AppendOrigin | ||
|
||
import java.nio.ByteBuffer | ||
import java.util | ||
import scala.collection.Map | ||
|
||
/** | ||
* ListenerAdapter adapts the PartitionListener interface to the | ||
* PartitionWriter.Listener interface. | ||
*/ | ||
private[group] class ListenerAdapter( | ||
val listener: PartitionWriter.Listener | ||
) extends PartitionListener { | ||
override def onHighWatermarkUpdated( | ||
tp: TopicPartition, | ||
offset: Long | ||
): Unit = { | ||
listener.onHighWatermarkUpdated(tp, offset) | ||
} | ||
|
||
override def equals(that: Any): Boolean = that match { | ||
case other: ListenerAdapter => listener.equals(other.listener) | ||
case _ => false | ||
} | ||
|
||
override def hashCode(): Int = { | ||
listener.hashCode() | ||
} | ||
|
||
override def toString: String = { | ||
s"ListenerAdapter(listener=$listener)" | ||
} | ||
} | ||
|
||
class CoordinatorPartitionWriter[T]( | ||
replicaManager: ReplicaManager, | ||
serializer: PartitionWriter.Serializer[T], | ||
compressionType: CompressionType, | ||
time: Time | ||
) extends PartitionWriter[T] { | ||
// We use an action queue which directly executes actions. This is possible | ||
// here because we don't hold any conflicting locks. | ||
private val directActionQueue = new ActionQueue { | ||
override def add(action: () => Unit): Unit = { | ||
action() | ||
} | ||
|
||
override def tryCompleteActions(): Unit = {} | ||
} | ||
|
||
/** | ||
* Register a PartitionWriter.Listener. | ||
* | ||
* @param tp The partition to register the listener to. | ||
* @param listener The listener. | ||
*/ | ||
override def registerListener( | ||
tp: TopicPartition, | ||
listener: PartitionWriter.Listener | ||
): Unit = { | ||
replicaManager.maybeAddListener(tp, new ListenerAdapter(listener)) | ||
} | ||
|
||
/** | ||
* Deregister a PartitionWriter.Listener. | ||
* | ||
* @param tp The partition to deregister the listener from. | ||
* @param listener The listener. | ||
*/ | ||
override def deregisterListener( | ||
tp: TopicPartition, | ||
listener: PartitionWriter.Listener | ||
): Unit = { | ||
replicaManager.removeListener(tp, new ListenerAdapter(listener)) | ||
} | ||
|
||
/** | ||
* Write records to the partitions. Records are written in one batch so | ||
* atomicity is guaranteed. | ||
* | ||
* @param tp The partition to write records to. | ||
* @param records The list of records. The records are written in a single batch. | ||
* @return The log end offset right after the written records. | ||
* @throws KafkaException Any KafkaException caught during the write operation. | ||
*/ | ||
override def append( | ||
tp: TopicPartition, | ||
records: util.List[T] | ||
): Long = { | ||
if (records.isEmpty) throw new IllegalStateException("records must be non-empty.") | ||
|
||
replicaManager.getLogConfig(tp) match { | ||
case Some(logConfig) => | ||
val magic = logConfig.recordVersion.value | ||
val maxBatchSize = logConfig.maxMessageSize | ||
val currentTimeMs = time.milliseconds() | ||
|
||
val recordsBuilder = MemoryRecords.builder( | ||
ByteBuffer.allocate(math.min(16384, maxBatchSize)), | ||
magic, | ||
compressionType, | ||
TimestampType.CREATE_TIME, | ||
0L, | ||
maxBatchSize | ||
) | ||
|
||
records.forEach { record => | ||
val keyBytes = serializer.serializeKey(record) | ||
val valueBytes = serializer.serializeValue(record) | ||
|
||
if (recordsBuilder.hasRoomFor(currentTimeMs, keyBytes, valueBytes, EMPTY_HEADERS)) recordsBuilder.append( | ||
currentTimeMs, | ||
keyBytes, | ||
valueBytes, | ||
EMPTY_HEADERS | ||
) else throw new RecordTooLargeException(s"Message batch size is ${recordsBuilder.estimatedSizeInBytes()} bytes " + | ||
s"in append to partition $tp which exceeds the maximum configured size of $maxBatchSize.") | ||
} | ||
|
||
var appendResults: Map[TopicPartition, PartitionResponse] = Map.empty | ||
replicaManager.appendRecords( | ||
timeout = 0L, | ||
requiredAcks = 1, | ||
internalTopicsAllowed = true, | ||
origin = AppendOrigin.COORDINATOR, | ||
entriesPerPartition = Map(tp -> recordsBuilder.build()), | ||
responseCallback = results => appendResults = results, | ||
// We can directly complete the purgatories here because we don't hold | ||
// any conflicting locks. | ||
actionQueue = directActionQueue | ||
) | ||
|
||
val partitionResult = appendResults.getOrElse(tp, | ||
throw new IllegalStateException(s"Append status $appendResults should have partition $tp.")) | ||
|
||
if (partitionResult.error != Errors.NONE) { | ||
throw partitionResult.error.exception() | ||
} | ||
|
||
// Required offset. | ||
partitionResult.lastOffset + 1 | ||
|
||
case None => | ||
throw Errors.NOT_LEADER_OR_FOLLOWER.exception() | ||
} | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.