public class MigrateTableSparkAction
extends java.lang.Object
implements org.apache.iceberg.actions.MigrateTable
| Modifier and Type | Field and Description |
|---|---|
protected static org.apache.iceberg.relocated.com.google.common.base.Joiner |
COMMA_JOINER |
protected static org.apache.iceberg.relocated.com.google.common.base.Splitter |
COMMA_SPLITTER |
protected static java.util.List<java.lang.String> |
EXCLUDED_PROPERTIES |
protected static java.lang.String |
FILE_PATH |
protected static java.lang.String |
ICEBERG_METADATA_FOLDER |
protected static java.lang.String |
LAST_MODIFIED |
protected static java.lang.String |
LOCATION |
protected static java.lang.String |
MANIFEST |
protected static java.lang.String |
MANIFEST_LIST |
protected static java.lang.String |
OTHERS |
protected static java.lang.String |
STATISTICS_FILES |
| Modifier and Type | Method and Description |
|---|---|
protected java.util.Map<java.lang.String,java.lang.String> |
additionalProperties() |
protected org.apache.spark.sql.Dataset<FileInfo> |
allReachableOtherMetadataFileDS(org.apache.iceberg.Table table) |
MigrateTableSparkAction |
backupTableName(java.lang.String tableName) |
protected org.apache.spark.sql.connector.catalog.StagingTableCatalog |
checkDestinationCatalog(org.apache.spark.sql.connector.catalog.CatalogPlugin catalog) |
protected org.apache.spark.sql.connector.catalog.TableCatalog |
checkSourceCatalog(org.apache.spark.sql.connector.catalog.CatalogPlugin catalog) |
protected org.apache.spark.sql.Dataset<FileInfo> |
contentFileDS(org.apache.iceberg.Table table) |
protected org.apache.spark.sql.Dataset<FileInfo> |
contentFileDS(org.apache.iceberg.Table table,
java.util.Set<java.lang.Long> snapshotIds) |
protected org.apache.iceberg.spark.actions.BaseSparkAction.DeleteSummary |
deleteFiles(java.util.concurrent.ExecutorService executorService,
java.util.function.Consumer<java.lang.String> deleteFunc,
java.util.Iterator<FileInfo> files)
Deletes files and keeps track of how many files were removed for each file type.
|
protected org.apache.iceberg.spark.actions.BaseSparkAction.DeleteSummary |
deleteFiles(org.apache.iceberg.io.SupportsBulkOperations io,
java.util.Iterator<FileInfo> files) |
protected org.apache.spark.sql.connector.catalog.StagingTableCatalog |
destCatalog() |
protected org.apache.spark.sql.connector.catalog.Identifier |
destTableIdent() |
protected java.util.Map<java.lang.String,java.lang.String> |
destTableProps() |
MigrateTableSparkAction |
dropBackup() |
protected void |
ensureNameMappingPresent(org.apache.iceberg.Table table) |
org.apache.iceberg.actions.MigrateTable.Result |
execute() |
MigrateTableSparkAction |
executeWith(java.util.concurrent.ExecutorService service) |
protected java.lang.String |
getMetadataLocation(org.apache.iceberg.Table table) |
protected org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> |
loadMetadataTable(org.apache.iceberg.Table table,
org.apache.iceberg.MetadataTableType type) |
protected org.apache.spark.sql.Dataset<FileInfo> |
manifestDS(org.apache.iceberg.Table table) |
protected org.apache.spark.sql.Dataset<FileInfo> |
manifestDS(org.apache.iceberg.Table table,
java.util.Set<java.lang.Long> snapshotIds) |
protected org.apache.spark.sql.Dataset<FileInfo> |
manifestListDS(org.apache.iceberg.Table table) |
protected org.apache.spark.sql.Dataset<FileInfo> |
manifestListDS(org.apache.iceberg.Table table,
java.util.Set<java.lang.Long> snapshotIds) |
protected JobGroupInfo |
newJobGroupInfo(java.lang.String groupId,
java.lang.String desc) |
protected org.apache.iceberg.Table |
newStaticTable(org.apache.iceberg.TableMetadata metadata,
org.apache.iceberg.io.FileIO io) |
ThisT |
option(java.lang.String name,
java.lang.String value) |
protected java.util.Map<java.lang.String,java.lang.String> |
options() |
ThisT |
options(java.util.Map<java.lang.String,java.lang.String> newOptions) |
protected org.apache.spark.sql.Dataset<FileInfo> |
otherMetadataFileDS(org.apache.iceberg.Table table) |
protected MigrateTableSparkAction |
self() |
protected void |
setProperties(java.util.Map<java.lang.String,java.lang.String> properties) |
protected void |
setProperty(java.lang.String key,
java.lang.String value) |
protected org.apache.spark.sql.connector.catalog.TableCatalog |
sourceCatalog() |
protected org.apache.spark.sql.connector.catalog.Identifier |
sourceTableIdent() |
protected java.lang.String |
sourceTableLocation() |
protected org.apache.spark.sql.SparkSession |
spark() |
protected org.apache.spark.api.java.JavaSparkContext |
sparkContext() |
protected StagedSparkTable |
stageDestTable() |
protected org.apache.spark.sql.Dataset<FileInfo> |
statisticsFileDS(org.apache.iceberg.Table table,
java.util.Set<java.lang.Long> snapshotIds) |
MigrateTableSparkAction |
tableProperties(java.util.Map<java.lang.String,java.lang.String> properties) |
MigrateTableSparkAction |
tableProperty(java.lang.String property,
java.lang.String value) |
protected org.apache.spark.sql.catalyst.catalog.CatalogTable |
v1SourceTable() |
protected <T> T |
withJobGroupInfo(JobGroupInfo info,
java.util.function.Supplier<T> supplier) |
protected static final java.lang.String LOCATION
protected static final java.lang.String ICEBERG_METADATA_FOLDER
protected static final java.util.List<java.lang.String> EXCLUDED_PROPERTIES
protected static final java.lang.String MANIFEST
protected static final java.lang.String MANIFEST_LIST
protected static final java.lang.String STATISTICS_FILES
protected static final java.lang.String OTHERS
protected static final java.lang.String FILE_PATH
protected static final java.lang.String LAST_MODIFIED
protected static final org.apache.iceberg.relocated.com.google.common.base.Splitter COMMA_SPLITTER
protected static final org.apache.iceberg.relocated.com.google.common.base.Joiner COMMA_JOINER
protected MigrateTableSparkAction self()
protected org.apache.spark.sql.connector.catalog.StagingTableCatalog destCatalog()
protected org.apache.spark.sql.connector.catalog.Identifier destTableIdent()
public MigrateTableSparkAction tableProperties(java.util.Map<java.lang.String,java.lang.String> properties)
Specified by: tableProperties in interface org.apache.iceberg.actions.MigrateTable
public MigrateTableSparkAction tableProperty(java.lang.String property, java.lang.String value)
Specified by: tableProperty in interface org.apache.iceberg.actions.MigrateTable
public MigrateTableSparkAction dropBackup()
Specified by: dropBackup in interface org.apache.iceberg.actions.MigrateTable
public MigrateTableSparkAction backupTableName(java.lang.String tableName)
Specified by: backupTableName in interface org.apache.iceberg.actions.MigrateTable
public MigrateTableSparkAction executeWith(java.util.concurrent.ExecutorService service)
Specified by: executeWith in interface org.apache.iceberg.actions.MigrateTable
public org.apache.iceberg.actions.MigrateTable.Result execute()
Specified by: execute in interface org.apache.iceberg.actions.Action<org.apache.iceberg.actions.MigrateTable,org.apache.iceberg.actions.MigrateTable.Result>
protected java.util.Map<java.lang.String,java.lang.String> destTableProps()
protected org.apache.spark.sql.connector.catalog.TableCatalog checkSourceCatalog(org.apache.spark.sql.connector.catalog.CatalogPlugin catalog)
protected java.lang.String sourceTableLocation()
protected org.apache.spark.sql.catalyst.catalog.CatalogTable v1SourceTable()
protected org.apache.spark.sql.connector.catalog.TableCatalog sourceCatalog()
protected org.apache.spark.sql.connector.catalog.Identifier sourceTableIdent()
protected void setProperties(java.util.Map<java.lang.String,java.lang.String> properties)
protected void setProperty(java.lang.String key,
java.lang.String value)
protected java.util.Map<java.lang.String,java.lang.String> additionalProperties()
protected org.apache.spark.sql.connector.catalog.StagingTableCatalog checkDestinationCatalog(org.apache.spark.sql.connector.catalog.CatalogPlugin catalog)
protected StagedSparkTable stageDestTable()
protected void ensureNameMappingPresent(org.apache.iceberg.Table table)
protected java.lang.String getMetadataLocation(org.apache.iceberg.Table table)
protected org.apache.spark.sql.SparkSession spark()
protected org.apache.spark.api.java.JavaSparkContext sparkContext()
public ThisT option(java.lang.String name,
java.lang.String value)
public ThisT options(java.util.Map<java.lang.String,java.lang.String> newOptions)
protected java.util.Map<java.lang.String,java.lang.String> options()
protected <T> T withJobGroupInfo(JobGroupInfo info, java.util.function.Supplier<T> supplier)
protected JobGroupInfo newJobGroupInfo(java.lang.String groupId, java.lang.String desc)
protected org.apache.iceberg.Table newStaticTable(org.apache.iceberg.TableMetadata metadata,
org.apache.iceberg.io.FileIO io)
protected org.apache.spark.sql.Dataset<FileInfo> contentFileDS(org.apache.iceberg.Table table)
protected org.apache.spark.sql.Dataset<FileInfo> contentFileDS(org.apache.iceberg.Table table, java.util.Set<java.lang.Long> snapshotIds)
protected org.apache.spark.sql.Dataset<FileInfo> manifestDS(org.apache.iceberg.Table table)
protected org.apache.spark.sql.Dataset<FileInfo> manifestDS(org.apache.iceberg.Table table, java.util.Set<java.lang.Long> snapshotIds)
protected org.apache.spark.sql.Dataset<FileInfo> manifestListDS(org.apache.iceberg.Table table)
protected org.apache.spark.sql.Dataset<FileInfo> manifestListDS(org.apache.iceberg.Table table, java.util.Set<java.lang.Long> snapshotIds)
protected org.apache.spark.sql.Dataset<FileInfo> statisticsFileDS(org.apache.iceberg.Table table, java.util.Set<java.lang.Long> snapshotIds)
protected org.apache.spark.sql.Dataset<FileInfo> otherMetadataFileDS(org.apache.iceberg.Table table)
protected org.apache.spark.sql.Dataset<FileInfo> allReachableOtherMetadataFileDS(org.apache.iceberg.Table table)
protected org.apache.spark.sql.Dataset<org.apache.spark.sql.Row> loadMetadataTable(org.apache.iceberg.Table table,
org.apache.iceberg.MetadataTableType type)
protected org.apache.iceberg.spark.actions.BaseSparkAction.DeleteSummary deleteFiles(java.util.concurrent.ExecutorService executorService,
java.util.function.Consumer<java.lang.String> deleteFunc,
java.util.Iterator<FileInfo> files)
Parameters:
executorService - an executor service to use for parallel deletes
deleteFunc - a delete func
files - an iterator of Spark rows of the structure (path: String, type: String)
protected org.apache.iceberg.spark.actions.BaseSparkAction.DeleteSummary deleteFiles(org.apache.iceberg.io.SupportsBulkOperations io,
java.util.Iterator<FileInfo> files)