public class DeltaGenerator extends Object implements Serializable
| Constructor and Description |
|---|
| DeltaGenerator(DeltaConfig deltaOutputConfig, org.apache.spark.api.java.JavaSparkContext jsc, org.apache.spark.sql.SparkSession sparkSession, String schemaStr, BuiltinKeyGenerator keyGenerator) |
| Modifier and Type | Method and Description |
|---|---|
| org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> | adjustRDDToGenerateExactNumUpdates(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> updates, org.apache.spark.api.java.JavaSparkContext jsc, long totalRecordsRequired) |
| org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> | generateInserts(DeltaConfig.Config operation) |
| org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> | generateUpdates(DeltaConfig.Config config) |
| Map<Integer,Long> | getAdjustedPartitionsCount(Map<Integer,Long> partitionCountMap, long recordsToRemove) |
| Map<Integer,Long> | getPartitionToCountMap(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records) |
| org.apache.spark.api.java.JavaRDD<DeltaWriteStats> | writeRecords(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records) |
public DeltaGenerator(DeltaConfig deltaOutputConfig, org.apache.spark.api.java.JavaSparkContext jsc, org.apache.spark.sql.SparkSession sparkSession, String schemaStr, BuiltinKeyGenerator keyGenerator)
public org.apache.spark.api.java.JavaRDD<DeltaWriteStats> writeRecords(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> generateInserts(DeltaConfig.Config operation)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> generateUpdates(DeltaConfig.Config config) throws IOException
Throws: IOException
public Map<Integer,Long> getPartitionToCountMap(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> records)
public Map<Integer,Long> getAdjustedPartitionsCount(Map<Integer,Long> partitionCountMap, long recordsToRemove)
public org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> adjustRDDToGenerateExactNumUpdates(org.apache.spark.api.java.JavaRDD<org.apache.avro.generic.GenericRecord> updates,
org.apache.spark.api.java.JavaSparkContext jsc,
long totalRecordsRequired)
Copyright © 2020 The Apache Software Foundation. All rights reserved.