public class DeltaStreamerKafkaSource
extends org.apache.hudi.utilities.sources.KafkaSource<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>>
| Constructor and Description |
|---|
DeltaStreamerKafkaSource(org.apache.hudi.common.config.TypedProperties properties,
org.apache.spark.api.java.JavaSparkContext sparkContext,
org.apache.spark.sql.SparkSession sparkSession,
org.apache.hudi.utilities.ingestion.HoodieIngestionMetrics metrics,
org.apache.hudi.utilities.streamer.StreamContext streamContext) |
DeltaStreamerKafkaSource(org.apache.hudi.common.config.TypedProperties props,
org.apache.spark.api.java.JavaSparkContext sparkContext,
org.apache.spark.sql.SparkSession sparkSession,
org.apache.hudi.utilities.schema.SchemaProvider schemaProvider,
org.apache.hudi.utilities.ingestion.HoodieIngestionMetrics metrics) |
| Modifier and Type | Method and Description |
|---|---|
protected org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> |
maybeAppendKafkaOffsets(org.apache.spark.api.java.JavaRDD<org.apache.kafka.clients.consumer.ConsumerRecord<Object,Object>> kafkaRDd) |
void |
onCommit(String lastCkptStr) |
protected org.apache.hudi.utilities.sources.InputBatch<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>> |
readFromCheckpoint(org.apache.hudi.common.util.Option<org.apache.hudi.common.table.checkpoint.Checkpoint> lastCheckpointStr,
long sourceLimit) |
protected org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> |
toBatch(org.apache.spark.streaming.kafka010.OffsetRange[] offsetRanges) |
fetchNewData, getOffsetRangespublic DeltaStreamerKafkaSource(org.apache.hudi.common.config.TypedProperties props,
org.apache.spark.api.java.JavaSparkContext sparkContext,
org.apache.spark.sql.SparkSession sparkSession,
org.apache.hudi.utilities.schema.SchemaProvider schemaProvider,
org.apache.hudi.utilities.ingestion.HoodieIngestionMetrics metrics)
public DeltaStreamerKafkaSource(org.apache.hudi.common.config.TypedProperties properties,
org.apache.spark.api.java.JavaSparkContext sparkContext,
org.apache.spark.sql.SparkSession sparkSession,
org.apache.hudi.utilities.ingestion.HoodieIngestionMetrics metrics,
org.apache.hudi.utilities.streamer.StreamContext streamContext)
protected org.apache.hudi.utilities.sources.InputBatch<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>> readFromCheckpoint(org.apache.hudi.common.util.Option<org.apache.hudi.common.table.checkpoint.Checkpoint> lastCheckpointStr,
long sourceLimit)
readFromCheckpoint in class org.apache.hudi.utilities.sources.KafkaSource<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>>protected org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> maybeAppendKafkaOffsets(org.apache.spark.api.java.JavaRDD<org.apache.kafka.clients.consumer.ConsumerRecord<Object,Object>> kafkaRDd)
protected org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> toBatch(org.apache.spark.streaming.kafka010.OffsetRange[] offsetRanges)
toBatch in class org.apache.hudi.utilities.sources.KafkaSource<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>>public void onCommit(String lastCkptStr)
onCommit in interface org.apache.hudi.utilities.callback.SourceCommitCallbackonCommit in class org.apache.hudi.utilities.sources.KafkaSource<org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>>Copyright © 2025. All rights reserved.