case class TahoeLogFileIndex(spark: SparkSession, deltaLog: DeltaLog, path: Path, snapshotAtAnalysis: SnapshotDescriptor, partitionFilters: Seq[Expression], isTimeTravelQuery: Boolean) extends TahoeFileIndex with Product with Serializable
A TahoeFileIndex that generates the list of files from DeltaLog with given partition filters.
NOTE: This is NOT a TahoeFileIndexWithSnapshotDescriptor because we only use snapshotAtAnalysis for actual data skipping if this is a time travel query.
- Alphabetic
- By Inheritance
- TahoeLogFileIndex
- Serializable
- Serializable
- Product
- Equals
- TahoeFileIndex
- SnapshotDescriptor
- SupportsRowIndexFilters
- FileIndex
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Instance Constructors
- new TahoeLogFileIndex(spark: SparkSession, deltaLog: DeltaLog, path: Path, snapshotAtAnalysis: Snapshot, partitionFilters: Seq[Expression] = Nil, isTimeTravelQuery: Boolean = false)
- new TahoeLogFileIndex(spark: SparkSession, deltaLog: DeltaLog, path: Path, snapshotAtAnalysis: SnapshotDescriptor, partitionFilters: Seq[Expression], isTimeTravelQuery: Boolean)
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
def
absolutePath(child: String): Path
- Definition Classes
- TahoeFileIndex
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
val
deltaLog: DeltaLog
- Definition Classes
- TahoeLogFileIndex → TahoeFileIndex → SnapshotDescriptor
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(that: Any): Boolean
- Definition Classes
- TahoeLogFileIndex → Equals → AnyRef → Any
-
def
fileStatusWithMetadataFromAddFile(addFile: AddFile): FileStatusWithMetadata
Generates a FileStatusWithMetadata using data extracted from a given AddFile.
- Definition Classes
- TahoeFileIndex
-
def
finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] )
-
def
getBasePath(filePath: Path): Option[Path]
Returns the path of the base directory of the given file path (i.e. its parent directory with all the partition directories stripped off).
- Definition Classes
- TahoeFileIndex
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
def
getPartitionValuesRow(partitionValues: Map[String, String]): GenericInternalRow
- Attributes
- protected
- Definition Classes
- TahoeFileIndex
- def getSnapshot: Snapshot
-
def
getSnapshotToScan: Snapshot
- Attributes
- protected
-
def
hashCode(): Int
- Definition Classes
- TahoeLogFileIndex → AnyRef → Any
-
def
inputFiles: Array[String]
- Definition Classes
- TahoeLogFileIndex → FileIndex
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
- val isTimeTravelQuery: Boolean
-
def
listFiles(partitionFilters: Seq[Expression], dataFilters: Seq[Expression]): Seq[PartitionDirectory]
- Definition Classes
- TahoeFileIndex → FileIndex
-
def
listPartitionsAsAddFiles(partitionFilters: Seq[Expression], dataFilters: Seq[Expression]): (Seq[(InternalRow, Seq[AddFile])], Seq[AddFile])
Returns (i) tuples of partition directories to their respective AddFile actions and (ii) a collection of matched AddFiles. The matched AddFiles are those that meet the criteria set by the partition and data filters. Essentially, this is a collection of all the files associated with the identified partitions.
- Definition Classes
- TahoeFileIndex
-
def
makePartitionDirectories(partitionValuesToFiles: Seq[(InternalRow, Seq[AddFile])]): Seq[PartitionDirectory]
- Definition Classes
- TahoeFileIndex
-
def
matchingFiles(partitionFilters: Seq[Expression], dataFilters: Seq[Expression]): Seq[AddFile]
Returns all matching/valid files by the given partitionFilters and dataFilters. Implementations may avoid evaluating data filters when doing so would be expensive, but *must* evaluate the partition filters; wrong results will be produced if AddFile entries which don't match the partition filters are returned.
- Definition Classes
- TahoeLogFileIndex → TahoeFileIndex
-
def
metadata: Metadata
- Definition Classes
- TahoeLogFileIndex → SnapshotDescriptor
-
def
metadataOpsTimeNs: Option[Long]
- Definition Classes
- FileIndex
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
def
numOfFilesIfKnown: Option[Long]
- Attributes
- protected[delta]
- Definition Classes
- TahoeLogFileIndex → SnapshotDescriptor
- val partitionFilters: Seq[Expression]
-
def
partitionSchema: StructType
- Definition Classes
- TahoeFileIndex → FileIndex
-
val
path: Path
- Definition Classes
- TahoeLogFileIndex → TahoeFileIndex
-
def
protocol: Protocol
- Definition Classes
- TahoeLogFileIndex → SnapshotDescriptor
-
def
refresh(): Unit
- Definition Classes
- TahoeLogFileIndex → FileIndex
-
def
rootPaths: Seq[Path]
- Definition Classes
- TahoeFileIndex → FileIndex
-
def
rowIndexFilters: Option[Map[String, RowIndexFilterType]]
If we know a-priori which exact rows we want to read (e.g., from a previous scan) find the per-file filter here, which must be passed down to the appropriate reader.
- returns
a mapping from file names to the row index filter for that file.
- Definition Classes
- SupportsRowIndexFilters
-
def
schema: StructType
- Definition Classes
- SnapshotDescriptor
-
def
sizeInBytes: Long
- Definition Classes
- TahoeLogFileIndex → FileIndex
-
def
sizeInBytesIfKnown: Option[Long]
- Attributes
- protected[delta]
- Definition Classes
- TahoeLogFileIndex → SnapshotDescriptor
- val snapshotAtAnalysis: SnapshotDescriptor
-
val
spark: SparkSession
- Definition Classes
- TahoeLogFileIndex → TahoeFileIndex
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
def
toString(): String
- Definition Classes
- TahoeFileIndex → FileIndex → AnyRef → Any
-
def
version: Long
- Definition Classes
- TahoeLogFileIndex → SnapshotDescriptor
-
def
versionToUse: Option[Long]
Provides the version that's being used as part of the scan if this is a time travel query.
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()