public class Spark24HoodieVectorizedParquetRecordReader
extends org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

从类继承的嵌套类/接口: org.apache.spark.sql.execution.datasources.parquet.SpecificParquetRecordReaderBase.NullIntIterator, org.apache.spark.sql.execution.datasources.parquet.SpecificParquetRecordReaderBase.RLEIntIterator, org.apache.spark.sql.execution.datasources.parquet.SpecificParquetRecordReaderBase.ValuesReaderIntIterator

| 构造器和说明 |
|---|
| `Spark24HoodieVectorizedParquetRecordReader(TimeZone convertTz, boolean useOffHeap, int capacity, Map<Integer,Pair<org.apache.spark.sql.types.DataType,org.apache.spark.sql.types.DataType>> typeChangeInfos)` |

| 限定符和类型 | 方法和说明 |
|---|---|
| `void` | `close()` |
| `void` | `enableReturningBatches()` |
| `Object` | `getCurrentValue()` |
| `void` | `initBatch(org.apache.spark.sql.types.StructType partitionColumns, org.apache.spark.sql.catalyst.InternalRow partitionValues)` |
| `void` | `initialize(org.apache.hadoop.mapreduce.InputSplit inputSplit, org.apache.hadoop.mapreduce.TaskAttemptContext taskAttemptContext)` |
| `boolean` | `nextBatch()` |
| `boolean` | `nextKeyValue()` |
| `org.apache.spark.sql.vectorized.ColumnarBatch` | `resultBatch()` |

继承的方法: getProgress, initialize

public void initBatch(org.apache.spark.sql.types.StructType partitionColumns,
org.apache.spark.sql.catalyst.InternalRow partitionValues)

覆盖: initBatch 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

public void initialize(org.apache.hadoop.mapreduce.InputSplit inputSplit,
org.apache.hadoop.mapreduce.TaskAttemptContext taskAttemptContext)
throws IOException,
InterruptedException,
UnsupportedOperationException

覆盖: initialize 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

抛出: IOException, InterruptedException, UnsupportedOperationException

public void close()
throws IOException

指定者: close 在接口中 Closeable

指定者: close 在接口中 AutoCloseable

覆盖: close 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

抛出: IOException

public org.apache.spark.sql.vectorized.ColumnarBatch resultBatch()

覆盖: resultBatch 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

public boolean nextBatch()
throws IOException

覆盖: nextBatch 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

抛出: IOException

public void enableReturningBatches()

覆盖: enableReturningBatches 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

public Object getCurrentValue()

覆盖: getCurrentValue 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

public boolean nextKeyValue()
throws IOException

覆盖: nextKeyValue 在类中 org.apache.spark.sql.execution.datasources.parquet.VectorizedParquetRecordReader

抛出: IOException

Copyright © 2023 The Apache Software Foundation. All rights reserved.