class GpuColumnarBatchSerializer extends Serializer with Serializable
Serializer for serializing ColumnarBatch instances for use during normal shuffle.
The serialization write path takes the cudf Table that is described by the ColumnarBatch
and uses cudf APIs to serialize the data into a sequence of bytes on the host. The data is
returned to the Spark shuffle code where it is compressed by the CPU and written to disk.
The serialization read path is notably different. The sequence of serialized bytes IS NOT
deserialized into a cudf Table but is instead tracked in host memory by a ColumnarBatch
that contains a SerializedTableColumn. During query planning, each GPU columnar shuffle
exchange is followed by a GpuShuffleCoalesceExec that expects to receive only these
custom batches of SerializedTableColumn. GpuShuffleCoalesceExec coalesces the smaller
shuffle partitions into larger tables before placing them on the GPU for further processing.
- Note
The RAPIDS shuffle does not use this code.
- Alphabetic
- By Inheritance
- GpuColumnarBatchSerializer
- Serializable
- Serializer
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native() @HotSpotIntrinsicCandidate()
-
var
defaultClassLoader: Option[ClassLoader]
- Attributes
- protected
- Definition Classes
- Serializer
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
def
hashCode(): Int
- Definition Classes
- AnyRef → Any
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
newInstance(): SerializerInstance
- Definition Classes
- GpuColumnarBatchSerializer → Serializer
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native() @HotSpotIntrinsicCandidate()
-
def
setDefaultClassLoader(classLoader: ClassLoader): Serializer
- Definition Classes
- Serializer
-
def
supportsRelocationOfSerializedObjects: Boolean
- Definition Classes
- GpuColumnarBatchSerializer → Serializer
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
def
toString(): String
- Definition Classes
- AnyRef → Any
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )