1use std::collections::BTreeMap;
16use std::fmt::Debug;
17use std::sync::Arc;
18use std::time::Duration;
19
20use anyhow::anyhow;
21use futures::{Future, FutureExt, TryFuture};
22use rdkafka::ClientConfig;
23use rdkafka::error::KafkaError;
24use rdkafka::message::ToBytes;
25use rdkafka::producer::{DeliveryFuture, FutureProducer, FutureRecord};
26use rdkafka::types::RDKafkaErrorCode;
27use risingwave_common::array::StreamChunk;
28use risingwave_common::catalog::Schema;
29use serde::Deserialize;
30use serde_with::{DisplayFromStr, serde_as};
31use strum_macros::{Display, EnumString};
32use thiserror_ext::AsReport;
33use with_options::WithOptions;
34
35use super::catalog::{SinkFormat, SinkFormatDesc};
36use super::{Sink, SinkError, SinkParam};
37use crate::connector_common::{
38 AwsAuthProps, KafkaCommon, KafkaConnectionProps, KafkaPrivateLinkCommon,
39 RdKafkaPropertiesCommon, read_kafka_log_level,
40};
41use crate::enforce_secret::EnforceSecret;
42use crate::sink::formatter::SinkFormatterImpl;
43use crate::sink::log_store::DeliveryFutureManagerAddFuture;
44use crate::sink::writer::{
45 AsyncTruncateLogSinkerOf, AsyncTruncateSinkWriter, AsyncTruncateSinkWriterExt, FormattedSink,
46};
47use crate::sink::{Result, SinkWriterParam};
48use crate::source::kafka::{
49 KafkaContextCommon, KafkaProperties, KafkaSplitEnumerator, RwProducerContext,
50};
51use crate::source::{SourceEnumeratorContext, SplitEnumerator};
52use crate::{
53 deserialize_duration_from_string, deserialize_u32_from_string, dispatch_sink_formatter_impl,
54};
55
/// Connector name of the Kafka sink; also exposed as `KafkaSink::SINK_NAME`.
pub const KAFKA_SINK: &str = "kafka";
57
/// Serde default for `KafkaConfig::max_retry_num` (`properties.retry.max`).
const fn _default_max_retries() -> u32 {
    3
}
61
/// Serde default for `KafkaConfig::retry_interval` (`properties.retry.interval`): 100 ms.
const fn _default_retry_backoff() -> Duration {
    Duration::from_millis(100)
}
65
/// Serde default for
/// `RdKafkaPropertiesProducer::max_in_flight_requests_per_connection`
/// (`properties.max.in.flight.requests.per.connection`).
const fn _default_max_in_flight_requests_per_connection() -> usize {
    5
}
69
/// Value of the `properties.compression.codec` sink option.
///
/// `strum` renders and parses the variants in `snake_case` (e.g. `"zstd"` <-> `Zstd`);
/// the rendered string is what `RdKafkaPropertiesProducer::set_client` passes to the
/// client as `compression.codec`.
#[derive(Debug, Clone, PartialEq, Display, Deserialize, EnumString)]
#[strum(serialize_all = "snake_case")]
pub enum CompressionCodec {
    None,
    Gzip,
    Snappy,
    Lz4,
    Zstd,
}
79
/// Producer-side client properties accepted in the sink's `WITH` options.
///
/// Every field is read from a `properties.<name>` option as a string and parsed with
/// `FromStr` (via `DisplayFromStr`). `set_client` forwards each value that is present to
/// the rdkafka `ClientConfig` under `<name>` (without the `properties.` prefix).
/// The meaning of each property is defined by librdkafka, not by this file; consult its
/// configuration reference.
///
/// NOTE(review): fields tagged `#[with_option(allow_alter_on_fly)]` are presumably the
/// ones that may be changed on an existing sink — confirm against the `WithOptions` derive.
#[serde_as]
#[derive(Debug, Clone, Deserialize, WithOptions)]
pub struct RdKafkaPropertiesProducer {
    /// Optional boolean; forwarded as `allow.auto.create.topics`.
    #[serde(rename = "properties.allow.auto.create.topics")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    pub allow_auto_create_topics: Option<bool>,

    /// Optional unsigned integer; forwarded as `queue.buffering.max.messages`.
    /// Also used by `KafkaSink::new_log_sinker` to size the delivery-future buffer.
    #[serde(rename = "properties.queue.buffering.max.messages")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    pub queue_buffering_max_messages: Option<usize>,

    /// Optional unsigned integer; forwarded as `queue.buffering.max.kbytes`.
    #[serde(rename = "properties.queue.buffering.max.kbytes")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    queue_buffering_max_kbytes: Option<usize>,

    /// Optional floating-point value; forwarded as `queue.buffering.max.ms`.
    #[serde(rename = "properties.queue.buffering.max.ms")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    queue_buffering_max_ms: Option<f64>,

    /// Optional boolean; forwarded as `enable.idempotence`.
    #[serde(rename = "properties.enable.idempotence")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    enable_idempotence: Option<bool>,

    /// Optional unsigned integer; forwarded as `message.send.max.retries`.
    #[serde(rename = "properties.message.send.max.retries")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    message_send_max_retries: Option<usize>,

    /// Optional unsigned integer; forwarded as `retry.backoff.ms`.
    #[serde(rename = "properties.retry.backoff.ms")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    retry_backoff_ms: Option<usize>,

    /// Optional unsigned integer; forwarded as `batch.num.messages`.
    #[serde(rename = "properties.batch.num.messages")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    batch_num_messages: Option<usize>,

    /// Optional unsigned integer; forwarded as `batch.size`.
    #[serde(rename = "properties.batch.size")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    batch_size: Option<usize>,

    /// Optional [`CompressionCodec`]; forwarded as `compression.codec`.
    /// Unlike its siblings, this field is not tagged `allow_alter_on_fly`.
    #[serde(rename = "properties.compression.codec")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    compression_codec: Option<CompressionCodec>,

    /// Optional unsigned integer; forwarded as `message.timeout.ms`.
    #[serde(rename = "properties.message.timeout.ms")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    message_timeout_ms: Option<usize>,

    /// Unsigned integer, always forwarded as `max.in.flight.requests.per.connection`;
    /// defaults to `_default_max_in_flight_requests_per_connection()` when the option is absent.
    #[serde(
        rename = "properties.max.in.flight.requests.per.connection",
        default = "_default_max_in_flight_requests_per_connection"
    )]
    #[serde_as(as = "DisplayFromStr")]
    #[with_option(allow_alter_on_fly)]
    max_in_flight_requests_per_connection: usize,

    /// Optional signed integer (the unit test uses `-1`); forwarded as `request.required.acks`.
    #[serde(rename = "properties.request.required.acks")]
    #[serde_as(as = "Option<DisplayFromStr>")]
    #[with_option(allow_alter_on_fly)]
    request_required_acks: Option<i32>,
}
179
180impl RdKafkaPropertiesProducer {
181 pub(crate) fn set_client(&self, c: &mut rdkafka::ClientConfig) {
182 if let Some(v) = self.allow_auto_create_topics {
183 c.set("allow.auto.create.topics", v.to_string());
184 }
185 if let Some(v) = self.queue_buffering_max_messages {
186 c.set("queue.buffering.max.messages", v.to_string());
187 }
188 if let Some(v) = self.queue_buffering_max_kbytes {
189 c.set("queue.buffering.max.kbytes", v.to_string());
190 }
191 if let Some(v) = self.queue_buffering_max_ms {
192 c.set("queue.buffering.max.ms", v.to_string());
193 }
194 if let Some(v) = self.enable_idempotence {
195 c.set("enable.idempotence", v.to_string());
196 }
197 if let Some(v) = self.message_send_max_retries {
198 c.set("message.send.max.retries", v.to_string());
199 }
200 if let Some(v) = self.retry_backoff_ms {
201 c.set("retry.backoff.ms", v.to_string());
202 }
203 if let Some(v) = self.batch_num_messages {
204 c.set("batch.num.messages", v.to_string());
205 }
206 if let Some(v) = self.batch_size {
207 c.set("batch.size", v.to_string());
208 }
209 if let Some(v) = &self.compression_codec {
210 c.set("compression.codec", v.to_string());
211 }
212 if let Some(v) = self.request_required_acks {
213 c.set("request.required.acks", v.to_string());
214 }
215 if let Some(v) = self.message_timeout_ms {
216 c.set("message.timeout.ms", v.to_string());
217 }
218 c.set(
219 "max.in.flight.requests.per.connection",
220 self.max_in_flight_requests_per_connection.to_string(),
221 );
222 }
223}
224
/// Full set of options of a Kafka sink, deserialized from the sink's `WITH` properties
/// (see `KafkaConfig::from_btreemap`). Most of it is composed from option groups
/// flattened into the same key space.
#[serde_as]
#[derive(Debug, Clone, Deserialize, WithOptions)]
pub struct KafkaConfig {
    /// Common Kafka options; provides `topic`, the topic every record is produced to.
    #[serde(flatten)]
    pub common: KafkaCommon,

    /// Connection options; provides `brokers` (used as `bootstrap.servers`) and the
    /// security properties applied in `KafkaSinkWriter::new`.
    #[serde(flatten)]
    pub connection: KafkaConnectionProps,

    /// `properties.retry.max`: bounds the retry loop in `KafkaPayloadWriter::send_result`.
    /// Defaults to `_default_max_retries()`.
    #[serde(
        rename = "properties.retry.max",
        default = "_default_max_retries",
        deserialize_with = "deserialize_u32_from_string"
    )]
    pub max_retry_num: u32,

    /// `properties.retry.interval`: parsed from a duration string such as `500ms`.
    /// Defaults to `_default_retry_backoff()`.
    /// NOTE(review): not read by any code visible in this file — confirm where it is used.
    #[serde(
        rename = "properties.retry.interval",
        default = "_default_retry_backoff",
        deserialize_with = "deserialize_duration_from_string"
    )]
    pub retry_interval: Duration,

    /// Optional `primary_key` option. The error raised by `KafkaSink::validate` points
    /// users at this field; the code visible here does not read it directly.
    pub primary_key: Option<String>,

    /// rdkafka properties shared with the Kafka source; applied by `KafkaConfig::set_client`.
    #[serde(flatten)]
    pub rdkafka_properties_common: RdKafkaPropertiesCommon,

    /// Producer-only rdkafka properties; applied by `KafkaConfig::set_client`.
    #[serde(flatten)]
    pub rdkafka_properties_producer: RdKafkaPropertiesProducer,

    /// Private-link options; provides `broker_rewrite_map` for the producer context.
    #[serde(flatten)]
    pub privatelink_common: KafkaPrivateLinkCommon,

    /// AWS authentication options handed to the producer context.
    #[serde(flatten)]
    pub aws_auth_props: AwsAuthProps,
}
265
266impl EnforceSecret for KafkaConfig {
267 fn enforce_one(prop: &str) -> crate::error::ConnectorResult<()> {
268 KafkaConnectionProps::enforce_one(prop)?;
269 AwsAuthProps::enforce_one(prop)?;
270 Ok(())
271 }
272}
273
274impl KafkaConfig {
275 pub fn from_btreemap(values: BTreeMap<String, String>) -> Result<Self> {
276 let config = serde_json::from_value::<KafkaConfig>(serde_json::to_value(values).unwrap())
277 .map_err(|e| SinkError::Config(anyhow!(e)))?;
278
279 Ok(config)
280 }
281
282 pub(crate) fn set_client(&self, c: &mut rdkafka::ClientConfig) {
283 self.rdkafka_properties_common.set_client(c);
284 self.rdkafka_properties_producer.set_client(c);
285 }
286}
287
288impl From<KafkaConfig> for KafkaProperties {
289 fn from(val: KafkaConfig) -> Self {
290 KafkaProperties {
291 bytes_per_second: None,
292 max_num_messages: None,
293 scan_startup_mode: None,
294 time_offset: None,
295 upsert: None,
296 common: val.common,
297 connection: val.connection,
298 rdkafka_properties_common: val.rdkafka_properties_common,
299 rdkafka_properties_consumer: Default::default(),
300 privatelink_common: val.privatelink_common,
301 aws_auth_props: val.aws_auth_props,
302 group_id_prefix: None,
303 unknown_fields: Default::default(),
304 }
305 }
306}
307
/// Kafka sink built from a `SinkParam` (see the `TryFrom<SinkParam>` impl).
#[derive(Debug)]
pub struct KafkaSink {
    /// Parsed sink options.
    pub config: KafkaConfig,
    /// Schema of the sink input, taken from `SinkParam::schema`.
    schema: Schema,
    /// Downstream primary-key column indices; empty when none is defined.
    pk_indices: Vec<usize>,
    /// The `FORMAT ... ENCODE ...` description; mandatory for this sink.
    format_desc: SinkFormatDesc,
    /// Database name, passed through to the formatter.
    db_name: String,
    /// Name of the object the sink reads from, passed through to the formatter.
    sink_from_name: String,
}
317
318impl EnforceSecret for KafkaSink {
319 fn enforce_secret<'a>(
320 prop_iter: impl Iterator<Item = &'a str>,
321 ) -> crate::error::ConnectorResult<()> {
322 for prop in prop_iter {
323 KafkaConfig::enforce_one(prop)?;
324 }
325 Ok(())
326 }
327}
328
329impl TryFrom<SinkParam> for KafkaSink {
330 type Error = SinkError;
331
332 fn try_from(param: SinkParam) -> std::result::Result<Self, Self::Error> {
333 let schema = param.schema();
334 let pk_indices = param.downstream_pk_or_empty();
335 let config = KafkaConfig::from_btreemap(param.properties)?;
336 Ok(Self {
337 config,
338 schema,
339 pk_indices,
340 format_desc: param
341 .format_desc
342 .ok_or_else(|| SinkError::Config(anyhow!("missing FORMAT ... ENCODE ...")))?,
343 db_name: param.db_name,
344 sink_from_name: param.sink_from_name,
345 })
346 }
347}
348
349impl Sink for KafkaSink {
350 type LogSinker = AsyncTruncateLogSinkerOf<KafkaSinkWriter>;
351
352 const SINK_NAME: &'static str = KAFKA_SINK;
353
354 async fn new_log_sinker(&self, _writer_param: SinkWriterParam) -> Result<Self::LogSinker> {
355 let formatter = SinkFormatterImpl::new(
356 &self.format_desc,
357 self.schema.clone(),
358 self.pk_indices.clone(),
359 self.db_name.clone(),
360 self.sink_from_name.clone(),
361 &self.config.common.topic,
362 )
363 .await?;
364 let max_delivery_buffer_size = (self
365 .config
366 .rdkafka_properties_producer
367 .queue_buffering_max_messages
368 .as_ref()
369 .cloned()
370 .unwrap_or(KAFKA_WRITER_MAX_QUEUE_SIZE) as f32
371 * KAFKA_WRITER_MAX_QUEUE_SIZE_RATIO) as usize;
372
373 Ok(KafkaSinkWriter::new(self.config.clone(), formatter)
374 .await?
375 .into_log_sinker(max_delivery_buffer_size))
376 }
377
378 async fn validate(&self) -> Result<()> {
379 if self.format_desc.format != SinkFormat::AppendOnly && self.pk_indices.is_empty() {
381 return Err(SinkError::Config(anyhow!(
382 "primary key not defined for {:?} kafka sink (please define in `primary_key` field)",
383 self.format_desc.format
384 )));
385 }
386 SinkFormatterImpl::new(
388 &self.format_desc,
389 self.schema.clone(),
390 self.pk_indices.clone(),
391 self.db_name.clone(),
392 self.sink_from_name.clone(),
393 &self.config.common.topic,
394 )
395 .await?;
396
397 let check = KafkaSplitEnumerator::new(
401 KafkaProperties::from(self.config.clone()),
402 Arc::new(SourceEnumeratorContext::dummy()),
403 )
404 .await?;
405 if let Err(e) = check.check_reachability().await {
406 return Err(SinkError::Config(
407 anyhow!(
408 "cannot connect to kafka broker ({})",
409 self.config.connection.brokers,
410 )
411 .context(e),
412 ));
413 }
414 Ok(())
415 }
416
417 fn validate_alter_config(config: &BTreeMap<String, String>) -> Result<()> {
418 KafkaConfig::from_btreemap(config.clone())?;
419 Ok(())
420 }
421}
422
/// Factor by which `KafkaSink::new_log_sinker` scales the producer queue size to obtain
/// the maximum number of buffered delivery futures.
const KAFKA_WRITER_MAX_QUEUE_SIZE_RATIO: f32 = 1.2;
/// Producer queue size assumed by `KafkaSink::new_log_sinker` when
/// `properties.queue.buffering.max.messages` is not set.
/// NOTE(review): presumably mirrors librdkafka's default for
/// `queue.buffering.max.messages` — confirm against the linked librdkafka version.
const KAFKA_WRITER_MAX_QUEUE_SIZE: usize = 100000;
431
/// Short-lived writer created per chunk by `KafkaSinkWriter::write_chunk`; it borrows the
/// producer and the config and registers one delivery future per produced record.
struct KafkaPayloadWriter<'a> {
    /// Producer used to enqueue records.
    inner: &'a FutureProducer<RwProducerContext>,
    /// Handle through which delivery futures are added to (and awaited from) the manager.
    add_future: DeliveryFutureManagerAddFuture<'a, KafkaSinkDeliveryFuture>,
    /// Sink options; supplies the topic and the retry bound.
    config: &'a KafkaConfig,
}
437
/// Private module holding the opaque delivery-future type together with the one
/// function that defines it.
mod opaque_type {
    use super::*;
    /// Future resolving to the outcome of one produced record, with errors already
    /// converted to `SinkError`. The concrete type is fixed by `map_delivery_future`.
    pub type KafkaSinkDeliveryFuture = impl TryFuture<Ok = (), Error = SinkError> + Unpin + 'static;

    /// Wraps rdkafka's `DeliveryFuture`, mapping its output through
    /// `KafkaPayloadWriter::map_future_result`.
    #[define_opaque(KafkaSinkDeliveryFuture)]
    pub(super) fn map_delivery_future(future: DeliveryFuture) -> KafkaSinkDeliveryFuture {
        future.map(KafkaPayloadWriter::<'static>::map_future_result)
    }
}
447pub use opaque_type::KafkaSinkDeliveryFuture;
448use opaque_type::map_delivery_future;
449
/// Sink writer that formats stream chunks and produces them to Kafka.
pub struct KafkaSinkWriter {
    /// Turns chunk rows into key/value payloads.
    formatter: SinkFormatterImpl,
    /// Underlying rdkafka producer.
    inner: FutureProducer<RwProducerContext>,
    /// Sink options the producer was created from.
    config: KafkaConfig,
}
455
456impl KafkaSinkWriter {
457 async fn new(config: KafkaConfig, formatter: SinkFormatterImpl) -> Result<Self> {
458 let inner: FutureProducer<RwProducerContext> = {
459 let mut c = ClientConfig::new();
460
461 config.connection.set_security_properties(&mut c);
463 config.set_client(&mut c);
464
465 c.set("bootstrap.servers", &config.connection.brokers);
467
468 let broker_rewrite_map = config.privatelink_common.broker_rewrite_map.clone();
470 let ctx_common = KafkaContextCommon::new(
471 broker_rewrite_map,
472 None,
473 None,
474 config.aws_auth_props.clone(),
475 config.connection.is_aws_msk_iam(),
476 )
477 .await?;
478 let producer_ctx = RwProducerContext::new(ctx_common);
479 if let Some(log_level) = read_kafka_log_level() {
482 c.set_log_level(log_level);
483 }
484 c.create_with_context(producer_ctx).await?
485 };
486
487 Ok(KafkaSinkWriter {
488 formatter,
489 inner,
490 config: config.clone(),
491 })
492 }
493}
494
495impl AsyncTruncateSinkWriter for KafkaSinkWriter {
496 type DeliveryFuture = KafkaSinkDeliveryFuture;
497
498 async fn write_chunk<'a>(
499 &'a mut self,
500 chunk: StreamChunk,
501 add_future: DeliveryFutureManagerAddFuture<'a, Self::DeliveryFuture>,
502 ) -> Result<()> {
503 let mut payload_writer = KafkaPayloadWriter {
504 inner: &mut self.inner,
505 add_future,
506 config: &self.config,
507 };
508 dispatch_sink_formatter_impl!(&self.formatter, formatter, {
509 payload_writer.write_chunk(chunk, formatter).await
510 })
511 }
512}
513
514impl KafkaPayloadWriter<'_> {
515 async fn send_result<'a, K, P>(&'a mut self, mut record: FutureRecord<'a, K, P>) -> Result<()>
518 where
519 K: ToBytes + ?Sized,
520 P: ToBytes + ?Sized,
521 {
522 let mut success_flag = false;
523
524 let mut ret = Ok(());
525
526 for i in 0..self.config.max_retry_num {
527 match self.inner.send_result(record) {
528 Ok(delivery_future) => {
529 if self
530 .add_future
531 .add_future_may_await(map_delivery_future(delivery_future))
532 .await?
533 {
534 tracing::warn!(
535 "Number of records being delivered ({}) >= expected kafka producer queue size ({}).
536 This indicates the default value of queue.buffering.max.messages has changed.",
537 self.add_future.future_count(),
538 self.add_future.max_future_count()
539 );
540 }
541 success_flag = true;
542 break;
543 }
544 Err((e, rec)) => {
547 tracing::warn!(
548 error = %e.as_report(),
549 "producing message (key {:?}) to topic {} failed",
550 rec.key.map(|k| k.to_bytes()),
551 rec.topic,
552 );
553 record = rec;
554 match e {
555 KafkaError::MessageProduction(RDKafkaErrorCode::QueueFull) => {
556 tracing::warn!(
557 "Producer queue full. Delivery future buffer size={}. Await and retry #{}",
558 self.add_future.future_count(),
559 i
560 );
561 self.add_future.await_one_delivery().await?;
562 continue;
563 }
564 _ => return Err(e.into()),
565 }
566 }
567 }
568 }
569
570 if !success_flag {
571 ret = Err(KafkaError::MessageProduction(RDKafkaErrorCode::QueueFull).into());
574 }
575
576 ret
577 }
578
579 async fn write_inner(
580 &mut self,
581 event_key_object: Option<Vec<u8>>,
582 event_object: Option<Vec<u8>>,
583 ) -> Result<()> {
584 let topic = self.config.common.topic.clone();
585 let mut record = FutureRecord::<[u8], [u8]>::to(topic.as_str());
586 if let Some(key_str) = &event_key_object {
587 record = record.key(key_str);
588 }
589 if let Some(payload) = &event_object {
590 record = record.payload(payload);
591 }
592 self.send_result(record).await?;
595 Ok(())
596 }
597
598 fn map_future_result(delivery_future_result: <DeliveryFuture as Future>::Output) -> Result<()> {
599 match delivery_future_result {
600 Ok(Ok(_)) => Ok(()),
604 Ok(Err((k_err, _msg))) => Err(k_err.into()),
610 Err(_) => Err(KafkaError::Canceled.into()),
614 }
615 }
616}
617
/// Lets the formatter-driven `write_chunk` emit raw byte keys and values through this writer.
impl FormattedSink for KafkaPayloadWriter<'_> {
    type K = Vec<u8>;
    type V = Vec<u8>;

    /// Produces one record with the given optional key and optional value
    /// (delegates to `write_inner`).
    async fn write_one(&mut self, k: Option<Self::K>, v: Option<Self::V>) -> Result<()> {
        self.write_inner(k, v).await
    }
}
626
627#[cfg(test)]
628mod test {
629 use maplit::btreemap;
630 use risingwave_common::catalog::Field;
631 use risingwave_common::types::DataType;
632
633 use super::*;
634 use crate::sink::encoder::{
635 DateHandlingMode, JsonEncoder, JsonbHandlingMode, TimeHandlingMode, TimestampHandlingMode,
636 TimestamptzHandlingMode,
637 };
638 use crate::sink::formatter::AppendOnlyFormatter;
639
    /// Checks that the `properties.*` producer options are parsed into typed fields and
    /// that malformed values are rejected.
    #[test]
    fn parse_rdkafka_props() {
        let props: BTreeMap<String, String> = btreemap! {
            // Minimal options needed for the config to parse.
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            // Common rdkafka properties.
            "properties.message.max.bytes".to_owned() => "12345".to_owned(),
            "properties.receive.message.max.bytes".to_owned() => "54321".to_owned(),
            // Producer-specific rdkafka properties.
            "properties.queue.buffering.max.messages".to_owned() => "114514".to_owned(),
            "properties.queue.buffering.max.kbytes".to_owned() => "114514".to_owned(),
            "properties.queue.buffering.max.ms".to_owned() => "114.514".to_owned(),
            "properties.enable.idempotence".to_owned() => "false".to_owned(),
            "properties.message.send.max.retries".to_owned() => "114514".to_owned(),
            "properties.retry.backoff.ms".to_owned() => "114514".to_owned(),
            "properties.batch.num.messages".to_owned() => "114514".to_owned(),
            "properties.batch.size".to_owned() => "114514".to_owned(),
            "properties.compression.codec".to_owned() => "zstd".to_owned(),
            "properties.message.timeout.ms".to_owned() => "114514".to_owned(),
            "properties.max.in.flight.requests.per.connection".to_owned() => "114514".to_owned(),
            "properties.request.required.acks".to_owned() => "-1".to_owned(),
        };
        let c = KafkaConfig::from_btreemap(props).unwrap();
        assert_eq!(
            c.rdkafka_properties_producer.queue_buffering_max_ms,
            Some(114.514f64)
        );
        assert_eq!(
            c.rdkafka_properties_producer.compression_codec,
            Some(CompressionCodec::Zstd)
        );
        assert_eq!(
            c.rdkafka_properties_producer.message_timeout_ms,
            Some(114514)
        );
        assert_eq!(
            c.rdkafka_properties_producer
                .max_in_flight_requests_per_connection,
            114514
        );
        assert_eq!(
            c.rdkafka_properties_producer.request_required_acks,
            Some(-1)
        );

        let props: BTreeMap<String, String> = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "type".to_owned() => "append-only".to_owned(),

            // Capitalized `True` does not parse as a `bool`.
            "properties.enable.idempotence".to_owned() => "True".to_owned(),
        };
        assert!(KafkaConfig::from_btreemap(props).is_err());

        let props: BTreeMap<String, String> = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "type".to_owned() => "append-only".to_owned(),
            // A negative number does not parse as `usize`.
            "properties.queue.buffering.max.kbytes".to_owned() => "-114514".to_owned(),
        };
        assert!(KafkaConfig::from_btreemap(props).is_err());

        let props: BTreeMap<String, String> = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "type".to_owned() => "append-only".to_owned(),
            // Not a `CompressionCodec` variant.
            "properties.compression.codec".to_owned() => "notvalid".to_owned(),
        };
        assert!(KafkaConfig::from_btreemap(props).is_err());
    }
719
    /// Checks parsing of the sink-level options (brokers, topic, retry settings, broker
    /// rewrite map), their defaults, and rejection of malformed retry values.
    #[test]
    fn parse_kafka_config() {
        let properties: BTreeMap<String, String> = btreemap! {
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "properties.security.protocol".to_owned() => "SASL".to_owned(),
            "properties.sasl.mechanism".to_owned() => "SASL".to_owned(),
            "properties.sasl.username".to_owned() => "test".to_owned(),
            "properties.sasl.password".to_owned() => "test".to_owned(),
            "properties.retry.max".to_owned() => "20".to_owned(),
            "properties.retry.interval".to_owned() => "500ms".to_owned(),
            // The rewrite map is passed as a JSON object encoded in a string.
            "broker.rewrite.endpoints".to_owned() => "{\"broker1\": \"10.0.0.1:8001\"}".to_owned(),
        };
        let config = KafkaConfig::from_btreemap(properties).unwrap();
        assert_eq!(config.connection.brokers, "localhost:9092");
        assert_eq!(config.common.topic, "test");
        assert_eq!(config.max_retry_num, 20);
        assert_eq!(config.retry_interval, Duration::from_millis(500));

        // The JSON string must have been decoded into a proper map.
        let btreemap: BTreeMap<String, String> = btreemap! {
            "broker1".to_owned() => "10.0.0.1:8001".to_owned()
        };
        assert_eq!(config.privatelink_common.broker_rewrite_map, Some(btreemap));

        // Only the required options: retry settings fall back to their defaults.
        let properties: BTreeMap<String, String> = btreemap! {
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
        };
        let config = KafkaConfig::from_btreemap(properties).unwrap();
        assert_eq!(config.max_retry_num, 3);
        assert_eq!(config.retry_interval, Duration::from_millis(100));

        // A negative retry count is rejected.
        let properties: BTreeMap<String, String> = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "type".to_owned() => "upsert".to_owned(),
            "properties.retry.max".to_owned() => "-20".to_owned(),
        };
        assert!(KafkaConfig::from_btreemap(properties).is_err());

        // An unparsable duration is rejected.
        let properties: BTreeMap<String, String> = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:9092".to_owned(),
            "topic".to_owned() => "test".to_owned(),
            "type".to_owned() => "upsert".to_owned(),
            "properties.retry.interval".to_owned() => "500miiinutes".to_owned(),
        };
        assert!(KafkaConfig::from_btreemap(properties).is_err());
    }
780
    /// Produces 10 x 100 records through `KafkaPayloadWriter::send_result`.
    ///
    /// Ignored by default; NOTE(review): presumably because it needs a live broker at
    /// `localhost:29092` — confirm before enabling.
    #[ignore]
    #[tokio::test]
    async fn test_kafka_producer() -> Result<()> {
        let properties = btreemap! {
            "connector".to_owned() => "kafka".to_owned(),
            "properties.bootstrap.server".to_owned() => "localhost:29092".to_owned(),
            "type".to_owned() => "append-only".to_owned(),
            "topic".to_owned() => "test_topic".to_owned(),
            "properties.compression.codec".to_owned() => "zstd".to_owned(),
        };

        // Schema handed to the JSON encoder; the records below are built by hand and
        // do not go through the formatter.
        let schema = Schema::new(vec![
            Field {
                data_type: DataType::Int32,
                name: "id".into(),
            },
            Field {
                data_type: DataType::Varchar,
                name: "v2".into(),
            },
        ]);

        let kafka_config = KafkaConfig::from_btreemap(properties)?;

        let sink = KafkaSinkWriter::new(
            kafka_config.clone(),
            SinkFormatterImpl::AppendOnlyJson(AppendOnlyFormatter::new(
                None,
                JsonEncoder::new(
                    schema,
                    None,
                    DateHandlingMode::FromCe,
                    TimestampHandlingMode::Milli,
                    TimestamptzHandlingMode::UtcString,
                    TimeHandlingMode::Milli,
                    JsonbHandlingMode::String,
                ),
            )),
        )
        .await
        .unwrap();

        use crate::sink::log_store::DeliveryFutureManager;

        // `usize::MAX` as the manager's limit, so adding a future should never have to wait.
        let mut future_manager = DeliveryFutureManager::new(usize::MAX);

        for i in 0..10 {
            println!("epoch: {}", i);
            for j in 0..100 {
                // A fresh payload writer per record, mirroring `write_chunk`.
                let mut writer = KafkaPayloadWriter {
                    inner: &sink.inner,
                    add_future: future_manager.start_write_chunk(i, j),
                    config: &sink.config,
                };
                match writer
                    .send_result(
                        FutureRecord::to(kafka_config.common.topic.as_str())
                            .payload(format!("value-{}", j).as_bytes())
                            .key(format!("dummy_key_for_epoch-{}", i).as_bytes()),
                    )
                    .await
                {
                    Ok(_) => {}
                    Err(e) => {
                        // Stop this epoch on the first failure; the test itself still passes.
                        println!("{:?}", e);
                        break;
                    }
                };
            }
        }

        Ok(())
    }
860}