Applies the given function to each input row, appending the encoded result at the end of the row.
An optimized version of AppendColumnsExec that can be executed directly on deserialized objects.
Helper trait which defines methods that are shared by both LocalLimitExec and GlobalLimitExec.
Physical plan node for scanning data from a batched relation.
Provides support in a SQLContext for caching query results and automatically using these cached results when subsequent queries are executed.
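A minimal sketch of the user-facing side of this caching, assuming a local SparkSession; calling `cache()` registers the plan with the cache manager so later queries over the same plan can reuse the cached data:

```scala
import org.apache.spark.sql.SparkSession

val spark = SparkSession.builder.master("local[*]").appName("cache-sketch").getOrCreate()
import spark.implicits._

val df = spark.range(0, 1000).toDF("id")
df.cache()                      // register the logical plan for caching
df.count()                      // materialize the cached data
df.filter($"id" > 10).count()   // subsequent queries can reuse the cached results
```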
Holds a cached logical plan and its data.
Co-groups the data from the left and right children, and calls the function with each group and two iterators containing all elements in the group from the left and right sides.
Iterates over GroupedIterators and returns the cogrouped data, i.e. each grouping key paired with the rows for that key from every input iterator.
Physical plan for returning a new RDD that has exactly numPartitions partitions.
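A small illustrative example, assuming a local SparkSession named `spark`; `coalesce` and `repartition` are the Dataset operations that request an exact number of output partitions:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val df = spark.range(0, 1000, 1, 8)     // start with 8 partitions
val narrowed = df.coalesce(2)           // reduce to exactly 2 partitions without a shuffle
println(narrowed.rdd.getNumPartitions)  // 2
```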
A Partitioner that might group together one or more partitions from the parent.
An interface for those physical operators that support codegen.
Finds chained plans that support codegen and collapses them together into a WholeStageCodegen.
Take the first limit elements and collect them to a single partition.
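As a hedged sketch (assuming a local SparkSession `spark`), a `limit` followed by an action such as `collect` is the typical way this operator ends up in a plan:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val firstFive = spark.range(0, 1000).limit(5).collect()
println(firstFive.mkString(", "))
```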
Takes the input row from child and turns it into an object using the given deserializer expression.
Applies all of the GroupExpressions to every input row, so a single input row may produce multiple output rows.
An interface for relations that are backed by files.
Physical plan for Filter.
Groups the input rows together and calls the R function with each group and an iterator containing all elements in the group.
Applies a Generator to a stream of input rows, combining the output of each into a new stream of rows.
Take the first limit elements of the child's single output partition.
Iterates over a presorted set of rows, chunking it up by the grouping expression.
InputAdapter is used to hide a SparkPlan from a subtree that supports codegen.
Take the first limit elements of each child partition, but do not collect or shuffle them.
Physical plan node for scanning data from a local collection.
Logical plan node for scanning data from an RDD.
Applies the given function to each input object.
Groups the input rows together and calls the function with each group and an iterator containing all elements in the group.
Applies the given function to input object iterator.
Physical version of ObjectConsumer.
Physical version of ObjectProducer.
A plan node that does nothing but lie about the output of its child.
Plans scalar subqueries that are present in the given SparkPlan.
Physical plan for Project.
The primary workflow for executing relational queries using Spark.
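A short sketch of how the intermediate phases of this workflow can be inspected from a Dataset, assuming a local SparkSession `spark`:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val df = spark.range(0, 100).filter("id % 2 = 0")
val qe = df.queryExecution
println(qe.logical)        // parsed logical plan
println(qe.analyzed)       // analyzed logical plan
println(qe.optimizedPlan)  // optimized logical plan
println(qe.sparkPlan)      // selected physical plan
println(qe.executedPlan)   // physical plan after preparation rules
```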
Physical plan node for scanning data from an RDD.
Physical plan for range (generating a range of 64 bit numbers).
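A minimal example, assuming a local SparkSession `spark`, of the Dataset API that produces this range-generating plan:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val ids = spark.range(0L, 10L, 2L, 2)  // start, end, step, number of partitions
ids.explain()                           // the physical plan contains a Range node
ids.show()
```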
Physical plan node for scanning data from a relation.
An internal iterator interface which presents a more restrictive API than scala.collection.Iterator.
Physical plan for sampling the dataset.
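A small hedged example of the sampling API that this plan implements, assuming a local SparkSession `spark`:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val df = spark.range(0, 1000)
val sampled = df.sample(withReplacement = false, fraction = 0.1, seed = 42L)
println(sampled.count())  // roughly 100 rows
```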
A subquery that will return only one row and one column.
Takes the input object from child and turns it into an unsafe row using the given serializer expression.
This is a specialized version of org.apache.spark.rdd.ShuffledRDD that is optimized for shuffling rows instead of Java key-value pairs.
Performs (external) sorting.
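A brief sketch of the Dataset operations that plan a sort, assuming a local SparkSession `spark`; `orderBy` produces a global sort while `sortWithinPartitions` sorts each partition independently:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()
import spark.implicits._

val df = spark.range(0, 100).withColumn("rev", -$"id")
df.orderBy($"rev").show(5)               // global sort (may spill to disk for large inputs)
df.sortWithinPartitions($"rev").show(5)  // per-partition sort, no shuffle
```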
The base class for physical operators.
:: DeveloperApi :: Stores information about a SQL SparkPlan.
Builder that converts an ANTLR ParseTree into a LogicalPlan/Expression/TableIdentifier.
Concrete parser for Spark SQL statements.
Converts a logical plan into zero or more SparkPlans.
Physical plan for a subquery.
Take the first limit elements as defined by the sortOrder, and do projection if needed.
Physical plan for unioning two plans, without a distinct.
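A minimal example of unioning two Datasets, assuming a local SparkSession `spark`; note that `union` keeps duplicates, matching the "without a distinct" behavior described above:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val a = spark.range(0, 5)
val b = spark.range(3, 8)
val u = a.union(b)   // duplicates (3 and 4) are kept
println(u.count())   // 10
```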
Serializer for serializing UnsafeRows during shuffle.
WholeStageCodegen compiles a subtree of plans that support codegen together into a single Java function.
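As a hedged sketch (local SparkSession `spark` assumed), `explain` makes the whole-stage-codegen boundaries visible in the printed physical plan:

```scala
val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val df = spark.range(0, 1000).filter("id % 2 = 0").selectExpr("id * 3 as tripled")
df.explain()  // operators fused into a whole-stage-codegen block are marked in the output
```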
This class calculates and outputs (windowed) aggregates over the rows in a single (sorted) partition.
Helper functions for physical operators that work with user defined objects.
Contains methods for debugging query execution.
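A small example of the debugging helpers in this package, assuming a local SparkSession `spark`; the `debug` and `debugCodegen` extension methods are brought in by importing the package object:

```scala
import org.apache.spark.sql.execution.debug._

val spark = org.apache.spark.sql.SparkSession.builder.master("local[*]").getOrCreate()

val df = spark.range(0, 100).filter("id % 2 = 0")
df.debug()        // runs the query and prints per-operator row counts
df.debugCodegen() // prints the generated Java code for codegen'd subtrees
```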
Physical execution operators for join operations.
The physical execution component of Spark SQL. Note that this is a private package. All classes in catalyst are considered an internal API to Spark SQL and are subject to change between minor releases.