refactor(kafka-sink): change sequential await to group await when committing #12013

Merged · 20 commits · Sep 13, 2023
Changes from 7 commits
174 changes: 136 additions & 38 deletions src/connector/src/sink/kafka.rs
@@ -327,6 +327,11 @@ enum KafkaSinkState {
Running(u64),
}

/// The delivery buffer queue size.
/// When the number of `DeliveryFuture`s buffered in the current
/// `future_delivery_buffer` exceeds this size, a commit is enforced.
const KAFKA_WRITER_MAX_QUEUE_SIZE: usize = 10;

pub struct KafkaSinkWriter {
pub config: KafkaConfig,
pub inner: FutureProducer<PrivateLinkProducerContext>,
@@ -335,6 +340,7 @@ pub struct KafkaSinkWriter {
schema: Schema,
pk_indices: Vec<usize>,
is_append_only: bool,
future_delivery_buffer: Vec<DeliveryFuture>,
db_name: String,
sink_from_name: String,
}
@@ -382,6 +388,7 @@ impl KafkaSinkWriter {
schema,
pk_indices,
is_append_only,
future_delivery_buffer: Vec::new(),
db_name,
sink_from_name,
})
@@ -403,36 +410,49 @@ impl KafkaSinkWriter {

/// The actual `send_result` function, will be called when the `KafkaSinkWriter` needs to sink
/// messages
async fn send_result<'a, K, P>(&'a self, mut record: FutureRecord<'a, K, P>) -> KafkaResult<()>
async fn send_result<'a, K, P>(
&'a mut self,
mut record: FutureRecord<'a, K, P>,
) -> KafkaResult<()>
where
K: ToBytes + ?Sized,
P: ToBytes + ?Sized,
{
// The error to be returned
let mut err = KafkaError::Canceled;

// First take ownership of the existing buffer
Contributor:

The logic here is too complicated.

It can be as simple as

if self.future_buffer.len() == self.max_limit {
    // wait for some futures (not all) in future_buffer to finish to release the quota
} else {
    let future = self.send_result_inner(record);
    self.future_buffer.push(future);
}

For the step that waits for some futures to finish, you can use VecDeque instead of Vec to buffer the futures: always push to the back, pop from the front, and await the future at the queue head. You can also look into FuturesUnordered or FuturesOrdered.
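A minimal sketch of that shape, assuming rdkafka's `DeliveryFuture`/`KafkaResult` types as used elsewhere in this file; the function name and the way the caller obtains the new future are illustrative only:

use std::collections::VecDeque;

use rdkafka::error::{KafkaError, KafkaResult};
use rdkafka::producer::DeliveryFuture;

/// Sketch only: bound the number of in-flight deliveries. When the queue is at
/// capacity, await the oldest future (the queue head) to release one slot,
/// then push the new future to the back.
async fn buffer_delivery(
    buffer: &mut VecDeque<DeliveryFuture>,
    new_future: DeliveryFuture,
    max_in_flight: usize,
) -> KafkaResult<()> {
    if buffer.len() >= max_in_flight {
        if let Some(oldest) = buffer.pop_front() {
            match oldest.await {
                // Delivered: the (partition, offset) pair is not needed here
                Ok(Ok(_)) => {}
                // Delivery failed: surface the Kafka error
                Ok(Err((k_err, _msg))) => return Err(k_err),
                // Producer dropped before the delivery status was received
                Err(_) => return Err(KafkaError::Canceled),
            }
        }
    }
    buffer.push_back(new_future);
    Ok(())
}

With this shape, only one delivery is awaited per overflow instead of the whole buffer.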

Contributor Author (xzhseh):

The current approach is:

  1. Check if the buffer is full; if so, await all the current futures (which is self.commit).
  2. Otherwise, push the future into the buffer and return.
  3. If the enqueue buffer is full, retry until the preset limit.

I think this is reasonable, since we've already wrapped the delivery process into a commit per 10 futures, and with the current 10-future limit I think it's also efficient to just wait for the 10 buffered futures to be delivered and then begin the next turn.
Ultimately, if we ever encounter an error, we will change the state back to the latest checkpoint.

Contributor:

The logic makes some sense when the limit is 10, a relatively small value. If we decide to change to a larger value in the future, such as 65536, it makes no sense to still wait for all futures to finish.

Besides, it is discouraged to call commit inside send_result, since the commit method is one of the methods in the SinkWriter trait, and its semantics are that it is called on an externally triggered checkpoint, which is not the case in send_result. If we really want to reuse some logic, we can have a separate method named something like ensure_delivery, and call it in both send_result and commit.

Also, in the current code I am confused by the usage of commit_flag and push_flag. It seems that the logic can be implemented without taking out self.future_delivery_buffer and using the two flags.
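A rough sketch of that split, reusing the types already in this file (the crate's Result alias, SinkError, KafkaError, and the future_delivery_buffer field); ensure_delivery is the hypothetical name from the comment above, not something that exists at this commit:

impl KafkaSinkWriter {
    /// Hypothetical helper: await every buffered delivery and clear the buffer.
    async fn ensure_delivery(&mut self) -> Result<()> {
        for delivery_future in self.future_delivery_buffer.drain(..) {
            match delivery_future.await {
                // Delivered successfully; nothing to record here
                Ok(Ok(_)) => {}
                // Delivery failed: surface the Kafka error
                Ok(Err((k_err, _msg))) => return Err(SinkError::Kafka(k_err)),
                // Producer dropped before the delivery status was received
                Err(_) => return Err(SinkError::Kafka(KafkaError::Canceled)),
            }
        }
        Ok(())
    }
}

send_result would call ensure_delivery whenever the buffer reaches KAFKA_WRITER_MAX_QUEUE_SIZE, while SinkWriter::commit stays a thin wrapper around the same helper and keeps its checkpoint-only semantics.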

Contributor Author (xzhseh):

The commit I mentioned here is not actually SinkWriter::commit, but rather a wrapper function of KafkaSinkWriter::commit that will clear the current future_delivery_buffer and ensure delivery. (It's the function discussed below, the one to change to try_join_all; its semantics are essentially the same as the ensure_delivery wrapper function mentioned above.)
As for commit_flag and push_flag: the former checks whether the size has hit the limit, and the latter checks whether this call has successfully sent the data and pushed the future into the future_delivery_buffer; we then exchange the local future_buffer and the one in KafkaSinkWriter using std::mem::swap, in order to make the borrow checker happy.
And yes, for a rather large buffer value such as 65536, we could indeed adopt a non-blocking approach.
I've tried implementing the non-blocking logic, but it seems tricky and ambiguous (i.e., to wait for the release of quota we would typically await the future at the front of the deque, but should we launch a background thread as the consumer to keep awaiting whenever the buffer is not empty, or use some other approach to consume the buffer?), so it may be further reviewed & discussed.

Contributor:

Do we really need any non-blocking approach? The reason for a non-blocking approach is that while waiting for a message to be delivered, we have something else to do and don't want to be blocked. However, when the buffer is full, we have nothing else to do but wait for the release of quota. If so, we only need to take the future at the queue front and simply await it.

Actually, the functionality provided by the rdkafka client is already non-blocking: its implementation allows adding records to its inner queue, asynchronously delivering messages to external Kafka, and notifying of the delivery at the end. We don't need to implement any extra non-blocking logic.

Besides, the two flags can be avoided. We can update any state in place where the flags are set now, instead of setting flags and applying the updates afterward. If the borrow checker reports any error, we can resolve it together.

let mut future_buffer = std::mem::take(&mut self.future_delivery_buffer);

// Sanity check
debug_assert!(
self.future_delivery_buffer.is_empty(),
"future delivery buffer must be empty"
);

// The flag represents whether to commit
// This will happen when the number of buffered futures
// is greater than the preset limit
let mut commit_flag = false;

// To make borrow checker happy :)
let mut push_flag = false;

for _ in 0..self.config.max_retry_num {
match self.send_result_inner(record).await {
Ok(delivery_future) => match delivery_future.await {
Ok(delivery_future_result) => match delivery_future_result {
// Successfully sent the record
// Will return the partition and offset of the message (i32, i64)
Ok(_) => return Ok(()),
// If the message failed to be delivered. (i.e., flush)
// The error & the copy of the original message will be returned
// i.e., (KafkaError, OwnedMessage)
// We will just stop the loop, and return the error
// The sink executor will go back to the latest checkpoint
Err((k_err, _msg)) => {
err = k_err;
break;
}
},
// Nothing to do here, since the err has already been set to
// KafkaError::Canceled. This represents the producer is dropped
// before the delivery status is received
Err(_) => break,
},
// Add the future to the buffer
Ok(delivery_future) => {
// Push the future into the buffer
future_buffer.push(delivery_future);
push_flag = true;

// First see if the size is greater than the limit
if future_buffer.len() > KAFKA_WRITER_MAX_QUEUE_SIZE {
commit_flag = true;
break;
}
break;
}
// The enqueue buffer is full, `send_result` will immediately return
// We can retry for another round after sleeping for some time
Err((e, rec)) => {
@@ -449,32 +469,104 @@ impl KafkaSinkWriter {
}
}

if commit_flag {
// Give the buffer back to the origin
std::mem::swap(&mut future_buffer, &mut self.future_delivery_buffer);

// Sanity check
debug_assert!(
future_buffer.is_empty(),
"future buffer must be empty after swapping"
);

match self.commit().await {
// FIXME: Is this error handling enough?
Ok(_) => return Ok(()),
Err(_) => return Err(err),
}
}

if push_flag {
// Indicates success
std::mem::swap(&mut future_buffer, &mut self.future_delivery_buffer);

// Sanity check
debug_assert!(
future_buffer.is_empty(),
"future buffer must be empty after swapping"
);

return Ok(());
}

Err(err)
}

async fn write_json_objects(
&self,
&mut self,
event_key_object: Option<Value>,
event_object: Option<Value>,
) -> Result<()> {
let topic = self.config.common.topic.clone();
// here we assume the key part always exists and value part is optional.
// if value is None, we will skip the payload part.
let key_str = event_key_object.unwrap().to_string();
let mut record = FutureRecord::<[u8], [u8]>::to(self.config.common.topic.as_str())
.key(key_str.as_bytes());
let mut record = FutureRecord::<[u8], [u8]>::to(topic.as_str()).key(key_str.as_bytes());
let payload;
if let Some(value) = event_object {
payload = value.to_string();
record = record.payload(payload.as_bytes());
}
// Send the data but do not wait for it to finish sinking
// Will join all `DeliveryFuture` during commit
self.send_result(record).await?;
Ok(())
}

async fn debezium_update(&self, chunk: StreamChunk, ts_ms: u64) -> Result<()> {
async fn commit(&mut self) -> Result<()> {
// Get the ownership first
Contributor:

The code can be simplified into the following

try_join_all(self.future_delivery_buffer.drain(..).map(|kafka_result| kafka_result.and_then(|kafka_result| kafka_result))).await?

Contributor Author (xzhseh):

IIUC, there are two possible flaws with this approach.

  1. We cannot distinguish the error type (i.e., whether the error is due to the producer or to a failure during delivery).
  2. The and_then will produce Result<(i32, i64), (KafkaError, OwnedMessage)>, which is essentially not a future to be awaited, and try_join_all will produce a Vec containing all the successful results, which also is not compatible with the original return type.

Thus I'd prefer the current logic at present.

Contributor:

The general idea of the code snippet above is to first turn the return type of the future from the nested result Result<Result<(i32, i64), (KafkaError, OwnedMessage)>, Canceled> into Result<(i32, i64), SinkError>, and then do a try_join_all on the iterator of transformed futures, which is the same as the current logic, but in a more elegant way.

The return type of the future is changed via map on the future. The and_then is applied inside the closure of map, turning the nested result into a plain result.

Contributor Author (@xzhseh, Sep 5, 2023):

I guess below is the simplification you'd prefer.
(Tried many times; this is the most elegant solution I could come up with.)

async fn commit_inner(&mut self) -> Result<()> {
    let _v = try_join_all(
        self.future_delivery_buffer
            .drain(..)
            .map(|x| {
                x.map(|f| match f {
                    Ok(Ok(val)) => Ok(val),
                    Ok(Err((k_err, _msg))) => Err(SinkError::Kafka(k_err)),
                    Err(_) => Err(SinkError::Kafka(KafkaError::Canceled)),
                })
            }),
    )
    .await?;

    Ok(())
}

cc @tabVersion.
In addition, I'd prefer readability over an elegant but hard-to-follow code snippet 🤔️.

Contributor:

The code snippet LGTM, and I think the code is intuitive and not hard to follow. All the methods involved are commonly used library methods.

try_join_all is a commonly used util method for Rust async users when we want to join some result futures and either collect all ok results or stop when seeing any err. The current for loop is a full reimplementation of it, or even a worse one: if a future at the queue end completes with an err, we should stop polling the other futures at the queue front and return the error, but the current for loop has to wait for the completion of the futures at the queue front before seeing the err at the end. drain is also commonly used when we want to consume all items in a vector without taking ownership of it.

For readability, the snippet above is hard to read mainly because the closure parameters are the meaningless x and f. After renaming x to future and f to future_result, it becomes much more readable.

One more thing we can improve in the code snippet above: since we don't care about the value returned in the result, we'd better turn it into Ok(()) when we transform the return type of the future. The return type of try_join_all is a vector, and a vector of values involves unnecessary memory allocation, whereas () is zero-sized and Vec<()> will not involve any memory allocation.
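Applying both suggestions (meaningful closure names and mapping the delivered value to ()), the method might end up roughly like the sketch below, under the same assumptions as the snippet above (futures::future::try_join_all, FutureExt::map, SinkError::Kafka, and the crate's Result alias):

use futures::future::{try_join_all, FutureExt};

impl KafkaSinkWriter {
    async fn commit_inner(&mut self) -> Result<()> {
        try_join_all(self.future_delivery_buffer.drain(..).map(|future| {
            future.map(|future_result| match future_result {
                // Delivered: drop the (partition, offset) pair so `try_join_all`
                // only collects a Vec<()> and allocates nothing for the values
                Ok(Ok(_)) => Ok(()),
                // Delivery failed: surface the Kafka error
                Ok(Err((k_err, _msg))) => Err(SinkError::Kafka(k_err)),
                // Producer dropped before the delivery status was received
                Err(_) => Err(SinkError::Kafka(KafkaError::Canceled)),
            })
        }))
        .await?;

        Ok(())
    }
}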

Contributor:

Could we use VecDeque to replace Vec? I mean that we only need to control the length of this queue. If the future at the head of the queue is ready, we can pull more requests, rather than waiting for all the requests in the queue to finish.
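One possible sketch of that idea, written generically since it only relies on the buffered future type being Unpin (an assumption; a oneshot-backed DeliveryFuture would satisfy it): futures that are already complete at the queue head are drained without blocking, and the caller only has to await when the head is still pending.

use std::collections::VecDeque;
use std::future::Future;

use futures::FutureExt;

/// Sketch only: pop every future at the queue head that has already completed,
/// returning their outputs, and stop at the first head that is still pending.
/// `F: Unpin` is required so the head can be polled in place via `now_or_never`.
fn drain_ready_head<F: Future + Unpin>(queue: &mut VecDeque<F>) -> Vec<F::Output> {
    let mut finished = Vec::new();
    while let Some(head) = queue.front_mut() {
        match head.now_or_never() {
            // The head already resolved: record the result and drop the future
            Some(output) => {
                finished.push(output);
                queue.pop_front();
            }
            // The head is still pending: keep it and stop draining
            None => break,
        }
    }
    finished
}

The quota check in send_result could then call this first and only await the head if the queue is still full afterwards.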

// The buffer will automatically become an empty vector
let delivery_futures = std::mem::take(&mut self.future_delivery_buffer);

// Sanity check
debug_assert!(
self.future_delivery_buffer.is_empty(),
"The buffer must be empty"
);

// Commit all together
// FIXME: At present we cannot retry; do we actually need to?
for delivery_future in delivery_futures {
match delivery_future.await {
Ok(delivery_future_result) => match delivery_future_result {
// Successfully sent the record
// Will return the partition and offset of the message (i32, i64)
Ok(_) => continue,
// If the message failed to be delivered. (i.e., flush)
// The error & the copy of the original message will be returned
// i.e., (KafkaError, OwnedMessage)
// We will just stop the loop, and return the error
// The sink executor will go back to the latest checkpoint
Err((k_err, _msg)) => return Err(SinkError::Kafka(k_err)),
},
// This represents the producer is dropped
// before the delivery status is received
// Return `KafkaError::Canceled`
Err(_) => return Err(SinkError::Kafka(KafkaError::Canceled)),
}
}

Ok(())
}

async fn debezium_update(&mut self, chunk: StreamChunk, ts_ms: u64) -> Result<()> {
let schema = self.schema.clone();
let pk_indices = self.pk_indices.clone();

// Initialize the dbz_stream
let dbz_stream = gen_debezium_message_stream(
&self.schema,
&self.pk_indices,
&schema,
&pk_indices,
chunk,
ts_ms,
DebeziumAdapterOpts::default(),
@@ -491,13 +583,13 @@ impl KafkaSinkWriter {
Ok(())
}

async fn upsert(&self, chunk: StreamChunk) -> Result<()> {
let upsert_stream = gen_upsert_message_stream(
&self.schema,
&self.pk_indices,
chunk,
UpsertAdapterOpts::default(),
);
async fn upsert(&mut self, chunk: StreamChunk) -> Result<()> {
let schema = self.schema.clone();
let pk_indices = self.pk_indices.clone();

// Initialize the upsert_stream
let upsert_stream =
gen_upsert_message_stream(&schema, &pk_indices, chunk, UpsertAdapterOpts::default());

#[for_await]
for msg in upsert_stream {
Expand All @@ -508,10 +600,14 @@ impl KafkaSinkWriter {
Ok(())
}

async fn append_only(&self, chunk: StreamChunk) -> Result<()> {
async fn append_only(&mut self, chunk: StreamChunk) -> Result<()> {
let schema = self.schema.clone();
let pk_indices = self.pk_indices.clone();

// Initialize the append_only_stream
let append_only_stream = gen_append_only_message_stream(
&self.schema,
&self.pk_indices,
&schema,
&pk_indices,
chunk,
AppendOnlyAdapterOpts::default(),
);
@@ -561,6 +657,8 @@ impl SinkWriterV1 for KafkaSinkWriter {
}

async fn commit(&mut self) -> Result<()> {
// Group delivery (await the buffered `DeliveryFuture`s) here
self.commit().await?;
Ok(())
}

@@ -701,7 +799,7 @@ mod test {
}

/// Note: Please enable the kafka by running `./risedev configure` before commenting #[ignore]
/// to run the test
/// to run the test, also remember to modify `risedev.yml`
#[ignore]
#[tokio::test]
async fn test_kafka_producer() -> Result<()> {