public class SparkSortStrategy
extends org.apache.iceberg.actions.SortStrategy
| Modifier and Type | Field and Description |
|---|---|
| static java.lang.String | COMPRESSION_FACTOR: The number of shuffle partitions, and consequently the number of output files created by the Spark Sort, are based on the size of the input data files used in this rewrite operation. |
| Constructor and Description |
|---|
| SparkSortStrategy(org.apache.iceberg.Table table, org.apache.spark.sql.SparkSession spark) |
| Modifier and Type | Method and Description |
|---|---|
| protected FileScanTaskSetManager | manager() |
| org.apache.iceberg.actions.RewriteStrategy | options(java.util.Map<java.lang.String,java.lang.String> options) |
| protected FileRewriteCoordinator | rewriteCoordinator() |
| java.util.Set<org.apache.iceberg.DataFile> | rewriteFiles(java.util.List<org.apache.iceberg.FileScanTask> filesToRewrite) |
| protected double | sizeEstimateMultiple() |
| protected org.apache.spark.sql.catalyst.plans.logical.LogicalPlan | sortPlan(org.apache.spark.sql.connector.distributions.Distribution distribution, org.apache.spark.sql.connector.expressions.SortOrder[] ordering, org.apache.spark.sql.catalyst.plans.logical.LogicalPlan plan, org.apache.spark.sql.internal.SQLConf conf) |
| protected org.apache.spark.sql.SparkSession | spark() |
| org.apache.iceberg.Table | table() |
| protected SparkTableCache | tableCache() |
| java.util.Set<java.lang.String> | validOptions() |
name, sortOrder, sortOrder, validateOptions
public static final java.lang.String COMPRESSION_FACTOR
public SparkSortStrategy(org.apache.iceberg.Table table,
org.apache.spark.sql.SparkSession spark)
public org.apache.iceberg.Table table()
public java.util.Set<java.lang.String> validOptions()
validOptions in interface org.apache.iceberg.actions.RewriteStrategy
validOptions in class org.apache.iceberg.actions.SortStrategy
public org.apache.iceberg.actions.RewriteStrategy options(java.util.Map<java.lang.String,java.lang.String> options)
options in interface org.apache.iceberg.actions.RewriteStrategy
options in class org.apache.iceberg.actions.SortStrategy
public java.util.Set<org.apache.iceberg.DataFile> rewriteFiles(java.util.List<org.apache.iceberg.FileScanTask> filesToRewrite)
protected org.apache.spark.sql.SparkSession spark()
protected org.apache.spark.sql.catalyst.plans.logical.LogicalPlan sortPlan(org.apache.spark.sql.connector.distributions.Distribution distribution,
org.apache.spark.sql.connector.expressions.SortOrder[] ordering,
org.apache.spark.sql.catalyst.plans.logical.LogicalPlan plan,
org.apache.spark.sql.internal.SQLConf conf)
protected double sizeEstimateMultiple()
protected SparkTableCache tableCache()
protected FileScanTaskSetManager manager()
protected FileRewriteCoordinator rewriteCoordinator()