Add an artifact to stage in workers. An artifact can be a JAR, a text file, etc. NOTE: currently artifacts can only be added before the pipeline object is created.
Get an SCollection for an Avro file. The schema must not be null if T is of type GenericRecord.
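A minimal sketch of reading GenericRecord Avro, assuming the Scio and Avro APIs described above (the bucket path and the inline schema are illustrative placeholders):

```scala
import org.apache.avro.Schema
import org.apache.avro.generic.GenericRecord
import com.spotify.scio.ScioContext

val sc = ScioContext()

// GenericRecord reads require an explicit, non-null schema.
// This inline schema is a made-up example.
val schema: Schema = new Schema.Parser().parse(
  """{"type":"record","name":"User","fields":[{"name":"id","type":"long"}]}""")

val records = sc.avroFile[GenericRecord]("gs://my-bucket/users/*.avro", schema)
```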
Get an SCollection for a BigQuery SELECT query.
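For illustration, a sketch of a SELECT-query read, assuming the public Shakespeare sample dataset; rows come back as TableRow values keyed by column name:

```scala
import com.spotify.scio.ScioContext

val sc = ScioContext()

// Legacy-SQL style table reference, as used elsewhere in these docs.
val query = "SELECT word, word_count FROM [bigquery-public-data:samples.shakespeare] LIMIT 10"

val rows = sc.bigQuerySelect(query)
// TableRow fields are accessed by column name.
val words = rows.map(r => r.get("word").toString)
```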
Get an SCollection for a BigQuery table.
Close the context. No operation can be performed once the context is closed.
Get an SCollection with a custom input transform. The transform should have a unique name.
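A sketch of a custom input, shown here wrapping Beam's TextIO read transform; the exact transform class depends on the Scio/SDK version, and the name and path are placeholders:

```scala
import com.spotify.scio.ScioContext
import org.apache.beam.sdk.io.TextIO

val sc = ScioContext()

// The transform name ("ReadLines") must be unique within the pipeline.
val lines = sc.customInput("ReadLines", TextIO.read().from("gs://my-bucket/input.txt"))
```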
Get an SCollection for a Datastore query.
Whether the context is closed.
Whether this is a test context.
Create a new Accumulator that keeps track of the maximum value. See SCollection.withAccumulator for examples.
Create a new Accumulator that keeps track of the minimum value. See SCollection.withAccumulator for examples.
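A sketch of the accumulator API referenced above, assuming the SCollection.withAccumulator usage pattern; the accumulator names and input data are illustrative:

```scala
import com.spotify.scio.ScioContext

val sc = ScioContext()
val maxLen = sc.maxAccumulator[Int]("maxLineLength")
val minLen = sc.minAccumulator[Int]("minLineLength")

sc.parallelize(Seq("a", "abc", "ab"))
  .withAccumulator(maxLen, minLen)
  .map { (line, ctx) =>
    // Feed each element's length into both accumulators.
    ctx.addValue(maxLen, line.length)
    ctx.addValue(minLen, line.length)
    line
  }
  .toSCollection  // drop the accumulator context and continue as a plain SCollection
```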
Get an SCollection for an object file using default serialization. Serialized objects are stored in Avro files to leverage Avro's block file format. Note that serialization is not guaranteed to be compatible across Scio releases.
Get PipelineOptions as a more specific sub-type.
Distribute a local Scala Map to form an SCollection.
Distribute a local Scala Iterable to form an SCollection.
Distribute a local Scala Iterable with timestamps to form an SCollection.
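The distribute methods above can be sketched as follows; the element values are arbitrary examples:

```scala
import com.spotify.scio.ScioContext
import org.joda.time.Instant

val sc = ScioContext()

// From an in-memory Iterable...
val nums = sc.parallelize(Seq(1, 2, 3, 4))

// ...from a Map, yielding key-value pairs...
val pairs = sc.parallelize(Map("a" -> 1, "b" -> 2))

// ...or with explicit per-element timestamps.
val stamped = sc.parallelizeTimestamped(
  Seq(("a", new Instant(0L)), ("b", new Instant(1000L))))
```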
Underlying pipeline.
Get an SCollection for a Protobuf file. Protobuf messages are serialized into Array[Byte] and stored in Avro files to leverage Avro's block file format.
Get an SCollection for a Pub/Sub subscription.
Get an SCollection for a Pub/Sub topic.
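The two Pub/Sub reads above can be sketched as follows; the project, topic, and subscription names are placeholders:

```scala
import com.spotify.scio.ScioContext

val sc = ScioContext()

// Read messages published to a topic...
val fromTopic = sc.pubsubTopic("projects/my-project/topics/my-topic")

// ...or from an existing subscription.
val fromSub = sc.pubsubSubscription("projects/my-project/subscriptions/my-sub")
```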
Set the application name for the context.
Set the job name for the context (Dataflow only).
Create a new Accumulator that keeps track of the sum of values. See SCollection.withAccumulator for examples.
Get an SCollection for a BigQuery TableRow JSON file.
Get an SCollection for a text file.
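As a usage sketch, a text-file read feeding a simple word count; the input path is a placeholder:

```scala
import com.spotify.scio.ScioContext

val sc = ScioContext()

val counts = sc.textFile("gs://my-bucket/input/*.txt")
  // Split each line on whitespace and drop empty tokens.
  .flatMap(_.split("\\s+").filter(_.nonEmpty))
  // Count occurrences of each distinct word.
  .countByValue
```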
Get an SCollection for a TensorFlow TFRecord file. Note that TFRecord files are not splittable.
Get a typed SCollection for a BigQuery SELECT query or table. Note that T must be annotated with BigQueryType.fromSchema, BigQueryType.fromTable, BigQueryType.fromQuery, or BigQueryType.toTable. By default the source (table or query) specified in the annotation will be used, but it can be overridden with the newSource parameter. For example:

@BigQueryType.fromTable("publicdata:samples.gsod")
class Row

// Read from [publicdata:samples.gsod] as specified in the annotation.
sc.typedBigQuery[Row]()

// Read from [myproject:samples.gsod] instead.
sc.typedBigQuery[Row]("myproject:samples.gsod")

// Read from a query instead.
sc.typedBigQuery[Row]("SELECT * FROM [publicdata:samples.gsod] LIMIT 1000")
Set a custom name for the next transform to be applied.
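A brief sketch of naming the next transform; the name and path are illustrative:

```scala
import com.spotify.scio.ScioContext

val sc = ScioContext()

// "ReadEvents" names only the immediately following transform;
// later steps fall back to default names.
val events = sc.withName("ReadEvents").textFile("gs://my-bucket/events/*.txt")
```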
Wrap a PCollection.
Main entry point for Scio functionality. A ScioContext represents a pipeline and can be used to create SCollections and distributed caches on that cluster.