Packages

c

org.apache.spark.sql.execution.python

CoGroupedArrowPythonRunner

class CoGroupedArrowPythonRunner extends BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch] with BasicPythonArrowOutput

Python UDF Runner for cogrouped UDFs. It sends Arrow batches from two different DataFrames, groups them in Python, and receives the result back in the JVM as batches of a single DataFrame.

Linear Supertypes
BasicPythonArrowOutput, PythonArrowOutput[ColumnarBatch], BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch], Logging, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. CoGroupedArrowPythonRunner
  2. BasicPythonArrowOutput
  3. PythonArrowOutput
  4. BasePythonRunner
  5. Logging
  6. AnyRef
  7. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. Protected

Instance Constructors

  1. new CoGroupedArrowPythonRunner(funcs: Seq[(ChainedPythonFunctions, Long)], evalType: Int, argOffsets: Array[Array[Int]], leftSchema: StructType, rightSchema: StructType, timeZoneId: String, largeVarTypes: Boolean, conf: Map[String, String], pythonMetrics: Map[String, SQLMetric], jobArtifactUUID: Option[String], sessionUUID: Option[String], profiler: Option[String])

Type Members

  1. implicit class LogStringContext extends AnyRef
    Definition Classes
    Logging
  2. class MonitorThread extends Thread
    Definition Classes
    BasePythonRunner
  3. class ReaderInputStream extends InputStream
    Definition Classes
    BasePythonRunner
  4. abstract class ReaderIterator extends Iterator[OUT]
    Definition Classes
    BasePythonRunner
  5. abstract class Writer extends AnyRef
    Definition Classes
    BasePythonRunner

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##: Int
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  4. def MDC(key: LogKey, value: Any): MDC
    Attributes
    protected
    Definition Classes
    Logging
  5. val accumulator: PythonAccumulator
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  6. val argOffsets: Array[Array[Int]]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  7. def arrowMaxBytesPerOutputBatch: Int
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  8. def arrowMaxRecordsPerOutputBatch: Int
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  9. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  10. val authSocketTimeout: Long
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  11. val batchSizeForPythonUDF: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  12. val bufferSize: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  13. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.CloneNotSupportedException]) @IntrinsicCandidate() @native()
  14. def compute(inputIterator: Iterator[(Iterator[InternalRow], Iterator[InternalRow])], partitionIndex: Int, context: TaskContext): Iterator[ColumnarBatch]
    Definition Classes
    BasePythonRunner
  15. def deserializeColumnarBatch(batch: ColumnarBatch, schema: StructType): ColumnarBatch
    Attributes
    protected
    Definition Classes
    BasicPythonArrowOutput → PythonArrowOutput
  16. val envVars: Map[String, String]
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  17. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  18. def equals(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef → Any
  19. val evalType: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  20. val faultHandlerEnabled: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  21. val funcs: Seq[ChainedPythonFunctions]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  22. final def getClass(): Class[_ <: AnyRef]
    Definition Classes
    AnyRef → Any
    Annotations
    @IntrinsicCandidate() @native()
  23. def handleMetadataAfterExec(stream: DataInputStream): Unit
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  24. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @IntrinsicCandidate() @native()
  25. val hideTraceback: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  26. val idleTimeoutSeconds: Long
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  27. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  28. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  29. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  30. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  31. val jobArtifactUUID: Option[String]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  32. val killOnIdleTimeout: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  33. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  34. def logBasedOnLevel(level: Level)(f: => MessageWithContext): Unit
    Attributes
    protected
    Definition Classes
    Logging
  35. def logDebug(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  36. def logDebug(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  37. def logDebug(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  38. def logDebug(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  39. def logError(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  40. def logError(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  41. def logError(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  42. def logError(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  43. def logInfo(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  44. def logInfo(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  45. def logInfo(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  46. def logInfo(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  47. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  48. def logTrace(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  49. def logTrace(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  50. def logTrace(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  51. def logTrace(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  52. def logWarning(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  53. def logWarning(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  54. def logWarning(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  55. def logWarning(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  56. val metrics: Map[String, AccumulatorV2[Long, Long]]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  57. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  58. def newReaderIterator(stream: DataInputStream, writer: Writer, startTime: Long, env: SparkEnv, worker: PythonWorker, pid: Option[Int], releasedOrClosed: AtomicBoolean, context: TaskContext): Iterator[ColumnarBatch]
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  59. def newWriter(env: SparkEnv, worker: PythonWorker, inputIterator: Iterator[(Iterator[InternalRow], Iterator[InternalRow])], partitionIndex: Int, context: TaskContext): Writer
    Attributes
    protected
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  60. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @IntrinsicCandidate() @native()
  61. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @IntrinsicCandidate() @native()
  62. val pythonExec: String
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  63. val pythonMetrics: Map[String, SQLMetric]
    Definition Classes
    CoGroupedArrowPythonRunner → PythonArrowOutput
  64. val pythonVer: String
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  65. val simplifiedTraceback: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  66. final def synchronized[T0](arg0: => T0): T0
    Definition Classes
    AnyRef
  67. val timelyFlushEnabled: Boolean
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  68. val timelyFlushTimeoutNanos: Long
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  69. def toString(): String
    Definition Classes
    AnyRef → Any
  70. val tracebackDumpIntervalSeconds: Long
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  71. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException])
  72. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException]) @native()
  73. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException])
  74. def withLogContext(context: Map[String, String])(body: => Unit): Unit
    Attributes
    protected
    Definition Classes
    Logging

Deprecated Value Members

  1. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.Throwable]) @Deprecated
    Deprecated

    (Since version 9)

Inherited from BasicPythonArrowOutput

Inherited from PythonArrowOutput[ColumnarBatch]

Inherited from BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch]

Inherited from Logging

Inherited from AnyRef

Inherited from Any

Ungrouped