Packages

c

org.apache.spark.sql.execution.python

CoGroupedArrowPythonRunner

class CoGroupedArrowPythonRunner extends BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch] with BasicPythonArrowOutput

Python UDF Runner for cogrouped UDFs. It sends Arrow batches from two different DataFrames, groups them in Python, and receives them back in the JVM as batches of a single DataFrame.

Linear Supertypes
BasicPythonArrowOutput, PythonArrowOutput[ColumnarBatch], BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch], Logging, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. CoGroupedArrowPythonRunner
  2. BasicPythonArrowOutput
  3. PythonArrowOutput
  4. BasePythonRunner
  5. Logging
  6. AnyRef
  7. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. Protected

Instance Constructors

  1. new CoGroupedArrowPythonRunner(funcs: Seq[(ChainedPythonFunctions, Long)], evalType: Int, argOffsets: Array[Array[Int]], leftSchema: StructType, rightSchema: StructType, timeZoneId: String, largeVarTypes: Boolean, conf: Map[String, String], pythonMetrics: Map[String, SQLMetric], jobArtifactUUID: Option[String], profiler: Option[String])

Type Members

  1. implicit class LogStringContext extends AnyRef
    Definition Classes
    Logging
  2. class MonitorThread extends Thread
    Definition Classes
    BasePythonRunner
  3. class ReaderInputStream extends InputStream
    Definition Classes
    BasePythonRunner
  4. abstract class ReaderIterator extends Iterator[OUT]
    Definition Classes
    BasePythonRunner
  5. abstract class Writer extends AnyRef
    Definition Classes
    BasePythonRunner

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##: Int
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  4. val accumulator: PythonAccumulator
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  5. val argOffsets: Array[Array[Int]]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  6. def arrowMaxBytesPerOutputBatch: Int
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  7. def arrowMaxRecordsPerOutputBatch: Int
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  8. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  9. val authSocketTimeout: Long
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  10. val batchSizeForPythonUDF: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  11. val bufferSize: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  12. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.CloneNotSupportedException]) @IntrinsicCandidate() @native()
  13. def compute(inputIterator: Iterator[(Iterator[InternalRow], Iterator[InternalRow])], partitionIndex: Int, context: TaskContext): Iterator[ColumnarBatch]
    Definition Classes
    BasePythonRunner
  14. def deserializeColumnarBatch(batch: ColumnarBatch, schema: StructType): ColumnarBatch
    Attributes
    protected
    Definition Classes
    BasicPythonArrowOutput → PythonArrowOutput
  15. val envVars: Map[String, String]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  16. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  17. def equals(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef → Any
  18. val evalType: Int
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  19. val faultHandlerEnabled: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  20. val funcs: Seq[ChainedPythonFunctions]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  21. final def getClass(): Class[_ <: AnyRef]
    Definition Classes
    AnyRef → Any
    Annotations
    @IntrinsicCandidate() @native()
  22. def handleMetadataAfterExec(stream: DataInputStream): Unit
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  23. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @IntrinsicCandidate() @native()
  24. val hideTraceback: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  25. val idleTimeoutSeconds: Long
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  26. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  27. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  28. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  29. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  30. val jobArtifactUUID: Option[String]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  31. val killOnIdleTimeout: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  32. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  33. def logBasedOnLevel(level: Level)(f: => MessageWithContext): Unit
    Attributes
    protected
    Definition Classes
    Logging
  34. def logDebug(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  35. def logDebug(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  36. def logDebug(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  37. def logDebug(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  38. def logError(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  39. def logError(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  40. def logError(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  41. def logError(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  42. def logInfo(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  43. def logInfo(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  44. def logInfo(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  45. def logInfo(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  46. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  47. def logTrace(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  48. def logTrace(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  49. def logTrace(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  50. def logTrace(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  51. def logWarning(msg: => String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  52. def logWarning(entry: LogEntry, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  53. def logWarning(entry: LogEntry): Unit
    Attributes
    protected
    Definition Classes
    Logging
  54. def logWarning(msg: => String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  55. val metrics: Map[String, AccumulatorV2[Long, Long]]
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  56. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  57. def newReaderIterator(stream: DataInputStream, writer: Writer, startTime: Long, env: SparkEnv, worker: PythonWorker, pid: Option[Int], releasedOrClosed: AtomicBoolean, context: TaskContext): Iterator[ColumnarBatch]
    Attributes
    protected
    Definition Classes
    PythonArrowOutput
  58. def newWriter(env: SparkEnv, worker: PythonWorker, inputIterator: Iterator[(Iterator[InternalRow], Iterator[InternalRow])], partitionIndex: Int, context: TaskContext): Writer
    Attributes
    protected
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  59. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @IntrinsicCandidate() @native()
  60. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @IntrinsicCandidate() @native()
  61. val pythonExec: String
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  62. val pythonMetrics: Map[String, SQLMetric]
    Definition Classes
    CoGroupedArrowPythonRunner → PythonArrowOutput
  63. val pythonVer: String
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  64. val simplifiedTraceback: Boolean
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  65. final def synchronized[T0](arg0: => T0): T0
    Definition Classes
    AnyRef
  66. val timelyFlushEnabled: Boolean
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  67. val timelyFlushTimeoutNanos: Long
    Attributes
    protected
    Definition Classes
    BasePythonRunner
  68. def toString(): String
    Definition Classes
    AnyRef → Any
  69. val tracebackDumpIntervalSeconds: Long
    Definition Classes
    CoGroupedArrowPythonRunner → BasePythonRunner
  70. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException])
  71. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException]) @native()
  72. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.InterruptedException])
  73. def withLogContext(context: Map[String, String])(body: => Unit): Unit
    Attributes
    protected
    Definition Classes
    Logging

Deprecated Value Members

  1. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws(classOf[java.lang.Throwable]) @Deprecated
    Deprecated

    (Since version 9)

Inherited from BasicPythonArrowOutput

Inherited from PythonArrowOutput[ColumnarBatch]

Inherited from BasePythonRunner[(Iterator[InternalRow], Iterator[InternalRow]), ColumnarBatch]

Inherited from Logging

Inherited from AnyRef

Inherited from Any

Ungrouped