public class DeltaGenerator extends Object implements Serializable
| 构造器和说明 |
|---|
| `DeltaGenerator(DFSDeltaConfig deltaOutputConfig, org.apache.spark.api.java.JavaSparkContext jsc, org.apache.spark.sql.SparkSession sparkSession, String schemaStr, org.apache.hudi.keygen.BuiltinKeyGenerator keyGenerator)` |
| 限定符和类型 | 方法和说明 |
|---|---|
| `org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>` | `adjustRDDToGenerateExactNumUpdates(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> updates, org.apache.spark.api.java.JavaSparkContext jsc, long totalRecordsRequired)` |
| `org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>` | `generateDeletes(DeltaConfig.Config config)` |
| `org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>` | `generateInserts(DeltaConfig.Config operation)` |
| `org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord>` | `generateUpdates(DeltaConfig.Config config)` |
| `Map<Integer,Long>` | `getAdjustedPartitionsCount(Map<Integer,Long> partitionCountMap, long recordsToRemove)` |
| `Map<Integer,Long>` | `getPartitionToCountMap(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)` |
| `org.apache.spark.api.java.JavaRDD<DeltaWriteStats>` | `writeRecords(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)` |
public DeltaGenerator(DFSDeltaConfig deltaOutputConfig, org.apache.spark.api.java.JavaSparkContext jsc, org.apache.spark.sql.SparkSession sparkSession, String schemaStr, org.apache.hudi.keygen.BuiltinKeyGenerator keyGenerator)
public org.apache.spark.api.java.JavaRDD<DeltaWriteStats> writeRecords(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> generateInserts(DeltaConfig.Config operation)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> generateUpdates(DeltaConfig.Config config) throws IOException
IOException
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> generateDeletes(DeltaConfig.Config config) throws IOException
IOException
public Map<Integer,Long> getPartitionToCountMap(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)
public Map<Integer,Long> getAdjustedPartitionsCount(Map<Integer,Long> partitionCountMap, long recordsToRemove)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> adjustRDDToGenerateExactNumUpdates(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> updates,
org.apache.spark.api.java.JavaSparkContext jsc,
long totalRecordsRequired)
Copyright © 2021 The Apache Software Foundation. All rights reserved.