final class VectorizedRleValuesReader extends ValuesReader with VectorizedValuesReader
A values reader for Parquet's run-length encoded data. This is based on the version in parquet-mr, with the following changes:
- Supports the vectorized interface.
- Works on byte arrays (byte[]) instead of making byte streams.
This encoding is used in multiple places:
- Definition/Repetition levels
- Dictionary ids.
- Boolean type values of Parquet DataPageV2
- Alphabetic
- By Inheritance
- VectorizedRleValuesReader
- VectorizedValuesReader
- ValuesReader
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Instance Constructors
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native() @HotSpotIntrinsicCandidate()
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
def
hashCode(): Int
- Definition Classes
- AnyRef → Any
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
def
initFromPage(valueCount: Int, in: ByteBufferInputStream): Unit
- Definition Classes
- VectorizedRleValuesReader → ValuesReader
- Annotations
- @Override()
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
def
readBatch(state: ParquetReadState, values: WritableColumnVector, defLevels: WritableColumnVector, valueReader: VectorizedValuesReader, updater: ParquetVectorUpdater): Unit
Reads a batch of definition levels and values into vector 'defLevels' and 'values' respectively.
Reads a batch of definition levels and values into vector 'defLevels' and 'values' respectively. The values are read using 'valueReader'.
The related states such as row index, offset, number of values left in the batch and page, are tracked by 'state'. The type-specific 'updater' is used to update or skip values.
This reader first reads the definition levels and then reads from 'valueReader' for the non-null values. If a value is null, 'values' is populated with a null value.
-
def
readBatchRepeated(state: ParquetReadState, repLevels: WritableColumnVector, defLevelsReader: VectorizedRleValuesReader, defLevels: WritableColumnVector, values: WritableColumnVector, valueReader: VectorizedValuesReader, updater: ParquetVectorUpdater): Unit
Reads a batch of repetition levels, definition levels and values into 'repLevels', 'defLevels' and 'values' respectively.
Reads a batch of repetition levels, definition levels and values into 'repLevels', 'defLevels' and 'values' respectively. The definition levels and values are read via 'defLevelsReader' and 'valueReader' respectively.
The related states such as row index, offset, number of rows left in the batch and page, are tracked by 'state'. The type-specific 'updater' is used to update or skip values.
-
def
readBatchRepeatedInternal(state: ParquetReadState, repLevels: WritableColumnVector, defLevelsReader: VectorizedRleValuesReader, defLevels: WritableColumnVector, values: WritableColumnVector, nulls: WritableColumnVector, valuesReused: Boolean, valueReader: VectorizedValuesReader, updater: ParquetVectorUpdater): Unit
Keep reading repetition level values from the page until either: 1) we've read enough top-level rows to fill the current batch, or 2) we've drained the data page completely.
Keep reading repetition level values from the page until either: 1) we've read enough top-level rows to fill the current batch, or 2) we've drained the data page completely.
- valuesReused
whether 'values' vector is reused for 'nulls'
-
def
readBinary(len: Int): Binary
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readBinary(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readBoolean(): Boolean
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader → ValuesReader
- Annotations
- @Override()
-
def
readBooleans(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readByte(): Byte
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readBytes(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readBytes(): Binary
- Definition Classes
- ValuesReader
-
def
readDouble(): Double
- Definition Classes
- ValuesReader
-
def
readDoubles(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readFloat(): Float
- Definition Classes
- ValuesReader
-
def
readFloats(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readInteger(): Int
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader → ValuesReader
- Annotations
- @Override()
-
def
readIntegers(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readIntegers(state: ParquetReadState, values: WritableColumnVector, nulls: WritableColumnVector, defLevels: WritableColumnVector, valueReader: VectorizedValuesReader): Unit
Decoding for dictionary ids.
Decoding for dictionary ids. The IDs are populated into 'values' and the nullability is populated into 'nulls'.
-
def
readIntegersRepeated(state: ParquetReadState, repLevels: WritableColumnVector, defLevelsReader: VectorizedRleValuesReader, defLevels: WritableColumnVector, values: WritableColumnVector, nulls: WritableColumnVector, valueReader: VectorizedValuesReader): Unit
Reads a batch of repetition levels, definition levels and integer values into 'repLevels', 'defLevels', 'values' and 'nulls' respectively.
Reads a batch of repetition levels, definition levels and integer values into 'repLevels', 'defLevels', 'values' and 'nulls' respectively. The definition levels and values are read via 'defLevelsReader' and 'valueReader' respectively.
The 'values' vector is used to hold non-null values, while the 'nulls' vector is used to hold null values.
The related states such as row index, offset, number of rows left in the batch and page, are tracked by 'state'.
Unlike 'readBatchRepeated', this is used to decode dictionary indices in dictionary encoding.
-
def
readIntegersWithRebase(total: Int, c: WritableColumnVector, rowId: Int, failIfRebase: Boolean): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readLong(): Long
- Definition Classes
- ValuesReader
-
def
readLongs(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readLongsWithRebase(total: Int, c: WritableColumnVector, rowId: Int, failIfRebase: Boolean, timeZone: String): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readShort(): Short
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readShorts(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readUnsignedIntegers(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readUnsignedLongs(total: Int, c: WritableColumnVector, rowId: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
readValueDictionaryId(): Int
- Definition Classes
- VectorizedRleValuesReader → ValuesReader
- Annotations
- @Override()
-
def
skip(): Unit
- Definition Classes
- VectorizedRleValuesReader → ValuesReader
- Annotations
- @Override()
-
def
skip(arg0: Int): Unit
- Definition Classes
- ValuesReader
-
def
skipBinary(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipBooleans(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipBytes(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipDoubles(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipFixedLenByteArray(total: Int, len: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipFloats(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipIntegers(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipLongs(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
def
skipShorts(total: Int): Unit
- Definition Classes
- VectorizedRleValuesReader → VectorizedValuesReader
- Annotations
- @Override()
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
def
toString(): String
- Definition Classes
- AnyRef → Any
-
def
updateNextOffset(arg0: Int): Unit
- Attributes
- protected[values]
- Definition Classes
- ValuesReader
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
Deprecated Value Members
-
def
finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] ) @Deprecated
- Deprecated
-
def
getNextOffset(): Int
- Definition Classes
- ValuesReader
- Annotations
- @Deprecated
- Deprecated
-
def
initFromPage(arg0: Int, arg1: Array[Byte], arg2: Int): Unit
- Definition Classes
- ValuesReader
- Annotations
- @throws( classOf[java.io.IOException] ) @Deprecated
- Deprecated
-
def
initFromPage(arg0: Int, arg1: ByteBuffer, arg2: Int): Unit
- Definition Classes
- ValuesReader
- Annotations
- @throws( classOf[java.io.IOException] ) @Deprecated
- Deprecated