Class TransactionLogAccess
- java.lang.Object
-
- io.trino.plugin.deltalake.transactionlog.TransactionLogAccess
-
public class TransactionLogAccess extends Object
-
-
Constructor Summary
Constructors
Constructor Description
TransactionLogAccess(TypeManager typeManager, CheckpointSchemaManager checkpointSchemaManager, DeltaLakeConfig deltaLakeConfig, FileFormatDataSourceStats fileFormatDataSourceStats, HdfsEnvironment hdfsEnvironment, ParquetReaderConfig parquetReaderConfig)
-
Method Summary
All Methods Static Methods Instance Methods Concrete Methods Deprecated Methods
Modifier and Type Method Description
static <T> String canonicalizeColumnName(String columnName)
static List<ColumnMetadata> columnsWithStats(MetadataEntry metadataEntry, TypeManager typeManager)
static com.google.common.collect.ImmutableList<ColumnMetadata> columnsWithStats(List<ColumnMetadata> schema, List<String> partitionColumns)
List<AddFileEntry> getActiveFiles(TableSnapshot tableSnapshot, ConnectorSession session)
Stream<CommitInfoEntry> getCommitInfoEntries(TableSnapshot tableSnapshot, ConnectorSession session)
io.airlift.jmx.CacheStatsMBean getDataFileMetadataCacheStats()
protected org.apache.hadoop.fs.FileSystem getFileSystem(org.apache.hadoop.fs.Path tableLocation, SchemaTableName table, ConnectorSession session)
Stream<DeltaLakeTransactionLogEntry> getJsonEntries(org.apache.hadoop.fs.FileSystem fileSystem, org.apache.hadoop.fs.Path transactionLogDir, List<Long> forVersions)
io.airlift.jmx.CacheStatsMBean getMetadataCacheStats()
Optional<MetadataEntry> getMetadataEntry(TableSnapshot tableSnapshot, ConnectorSession session)
List<Long> getPastTableVersions(org.apache.hadoop.fs.FileSystem fileSystem, org.apache.hadoop.fs.Path transactionLogDir, Instant startAt, long lastVersion) Returns a stream of transaction log versions between startAt point in time and lastVersion.
Stream<ProtocolEntry> getProtocolEntries(TableSnapshot tableSnapshot, ConnectorSession session)
Stream<RemoveFileEntry> getRemoveEntries(TableSnapshot tableSnapshot, ConnectorSession session)
void invalidateCaches(String tableLocation)
TableSnapshot loadSnapshot(SchemaTableName table, org.apache.hadoop.fs.Path tableLocation, ConnectorSession session)
static <T> Map<CanonicalColumnName,T> toCanonicalNameKeyedMap(Map<String,T> map)
static <T> Map<CanonicalColumnName,T> toCanonicalNameKeyedMap(Map<String,T> map, Map<String,CanonicalColumnName> canonicalColumnNames)
static <T> Map<String,T> toOriginalNameKeyedMap(Map<CanonicalColumnName,T> map) Deprecated.
-
-
-
Constructor Detail
-
TransactionLogAccess
@Inject public TransactionLogAccess(TypeManager typeManager, CheckpointSchemaManager checkpointSchemaManager, DeltaLakeConfig deltaLakeConfig, FileFormatDataSourceStats fileFormatDataSourceStats, HdfsEnvironment hdfsEnvironment, ParquetReaderConfig parquetReaderConfig)
-
-
Method Detail
-
getDataFileMetadataCacheStats
public io.airlift.jmx.CacheStatsMBean getDataFileMetadataCacheStats()
-
getMetadataCacheStats
public io.airlift.jmx.CacheStatsMBean getMetadataCacheStats()
-
loadSnapshot
public TableSnapshot loadSnapshot(SchemaTableName table, org.apache.hadoop.fs.Path tableLocation, ConnectorSession session) throws IOException
- Throws:
IOException
-
invalidateCaches
public void invalidateCaches(String tableLocation)
-
getMetadataEntry
public Optional<MetadataEntry> getMetadataEntry(TableSnapshot tableSnapshot, ConnectorSession session)
-
getActiveFiles
public List<AddFileEntry> getActiveFiles(TableSnapshot tableSnapshot, ConnectorSession session)
-
columnsWithStats
public static List<ColumnMetadata> columnsWithStats(MetadataEntry metadataEntry, TypeManager typeManager)
-
columnsWithStats
public static com.google.common.collect.ImmutableList<ColumnMetadata> columnsWithStats(List<ColumnMetadata> schema, List<String> partitionColumns)
-
getRemoveEntries
public Stream<RemoveFileEntry> getRemoveEntries(TableSnapshot tableSnapshot, ConnectorSession session)
-
getProtocolEntries
public Stream<ProtocolEntry> getProtocolEntries(TableSnapshot tableSnapshot, ConnectorSession session)
-
getCommitInfoEntries
public Stream<CommitInfoEntry> getCommitInfoEntries(TableSnapshot tableSnapshot, ConnectorSession session)
-
getJsonEntries
public Stream<DeltaLakeTransactionLogEntry> getJsonEntries(org.apache.hadoop.fs.FileSystem fileSystem, org.apache.hadoop.fs.Path transactionLogDir, List<Long> forVersions)
-
getPastTableVersions
public List<Long> getPastTableVersions(org.apache.hadoop.fs.FileSystem fileSystem, org.apache.hadoop.fs.Path transactionLogDir, Instant startAt, long lastVersion)
Returns a stream of transaction log versions between startAt point in time and lastVersion.
-
getFileSystem
protected org.apache.hadoop.fs.FileSystem getFileSystem(org.apache.hadoop.fs.Path tableLocation, SchemaTableName table, ConnectorSession session)
-
toCanonicalNameKeyedMap
public static <T> Map<CanonicalColumnName,T> toCanonicalNameKeyedMap(Map<String,T> map)
-
toCanonicalNameKeyedMap
public static <T> Map<CanonicalColumnName,T> toCanonicalNameKeyedMap(Map<String,T> map, Map<String,CanonicalColumnName> canonicalColumnNames)
-
toOriginalNameKeyedMap
@Deprecated public static <T> Map<String,T> toOriginalNameKeyedMap(Map<CanonicalColumnName,T> map)
Deprecated.
-
-