Spark DataFrame to be processed. The DataFrame must not be saved to state, so the field is marked @transient.
Id of the DataObject this SubFeed corresponds to.
Partition values transported by this SubFeed.
True if this SubFeed is a start node of the DAG.
True if this SubFeed only contains a dummy DataFrame. Dummy DataFrames can be used to validate the lineage in the init phase, but not in the exec phase.
A Spark SQL filter expression. This is used by SparkIncrementalMode.
Break lineage. This discards an existing DataFrame or list of FileRefs so that it is requested again from the DataObject. It can be used to break long DataFrame lineages spanning multiple Actions and instead reread the data from an intermediate table.
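A minimal sketch of what breaking the lineage could look like. This assumes the SubFeed carries its DataFrame in an `Option[DataFrame]` field named `dataFrame`; the method name and fields are illustrative, not the exact production signature:

```scala
// Sketch: discard the transported DataFrame so the next Action requests
// it again from the DataObject instead of extending the Spark lineage.
// `copy` comes for free on a case class and leaves all other fields intact.
def breakLineage: SparkSubFeed =
  this.copy(dataFrame = None)
```

Because only the reference to the DataFrame is dropped, the DataObject remains responsible for re-producing the data, typically by rereading the intermediate table it was written to.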
A SparkSubFeed is used to transport DataFrames between Actions.
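Taken together, the fields described above can be sketched as a Scala case class. The field names follow the descriptions in this section; the exact signature in the real codebase may differ, so treat this as an illustrative assumption:

```scala
// Illustrative sketch of a SparkSubFeed; DataObjectId and PartitionValues
// are assumed to be types defined elsewhere in the codebase.
case class SparkSubFeed(
  @transient dataFrame: Option[DataFrame], // not saved to state
  dataObjectId: DataObjectId,              // DataObject this SubFeed corresponds to
  partitionValues: Seq[PartitionValues],   // partition values transported
  isDAGStart: Boolean = false,             // true if start node of the DAG
  isDummy: Boolean = false,                // dummy DataFrame for init-phase lineage validation
  filter: Option[String] = None            // Spark SQL filter expr, used by SparkIncrementalMode
)
```

Modelling the SubFeed as an immutable case class means state transitions such as breaking the lineage or marking the DataFrame as a dummy can be expressed as `copy` calls rather than mutation.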