ScioContext

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
def addArtifacts(extraLocalArtifacts: List[String]): Unit

Add artifacts to be staged in Dataflow - an artifact can be a jar, a text file, etc.
Add artifacts to be staged in Dataflow - an artifact can be a jar, a text file, etc. NOTE: currently artifacts can only be added before the pipeline object is created.
final def asInstanceOf[T0]: T0

Definition Classes
Any
def avroFile[T](path: String, schema: Schema = null)(implicit arg0: ClassTag[T]): SCollection[T]

Get an SCollection for an Avro file.
def bigQuerySelect(sqlQuery: String): SCollection[TableRow]

Get an SCollection for a BigQuery SELECT query.
def bigQueryTable(tableSpec: String): SCollection[TableRow]

Get an SCollection for a BigQuery table.
def bigQueryTable(table: TableReference): SCollection[TableRow]

Get an SCollection for a BigQuery table.
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
def close(): ScioResult

Close the context.
Close the context. No operation can be performed once the context is closed.
def datastore(datasetId: String, query: Query): SCollection[Entity]

Get an SCollection for a Datastore query.
def distCache[F](uris: Seq[String])(initFn: (Seq[File]) ⇒ F): DistCache[F]

Create a new DistCache instance.
Create a new DistCache instance.
uris
Google Cloud Storage URIs of the files to be distributed to all workers
initFn
function to initialize the distributed files

def distCache[F](uri: String)(initFn: (File) ⇒ F): DistCache[F]

Create a new DistCache instance.

uri

Google Cloud Storage URI of the file to be distributed to all workers

initFn

function to initialize the distributed file

// Prepare distributed cache as Map[Int, String]
val dc = sc.distCache("gs://dataflow-samples/samples/misc/months.txt") { f =>
  scala.io.Source.fromFile(f).getLines().map { s =>
    val t = s.split(" ")
    (t(0).toInt, t(1))
  }.toMap
}

val p: SCollection[Int] = // ...
// Extract distributed cache inside a transform
p.map(x => dc().getOrElse(x, "unknown"))

final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
def isClosed: Boolean

Whether the context is closed.
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def maxAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

Create a new Accumulator that keeps track of the maximum value.
Create a new Accumulator that keeps track of the maximum value. See SCollection.withAccumulator for examples.
def minAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

Create a new Accumulator that keeps track of the minimum value.
Create a new Accumulator that keeps track of the minimum value. See SCollection.withAccumulator for examples.
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def objectFile[T](path: String)(implicit arg0: ClassTag[T]): SCollection[T]

Get an SCollection for an object file.
val options: DataflowPipelineOptions
def parallelize[K, V](elems: Map[K, V])(implicit arg0: ClassTag[K], arg1: ClassTag[V]): SCollection[(K, V)]

Distribute a local Scala Map to form an SCollection.
def parallelize[T](elems: Iterable[T])(implicit arg0: ClassTag[T]): SCollection[T]

Distribute a local Scala Iterable to form an SCollection.
def parallelizeTimestamped[T](elems: Iterable[T], timestamps: Iterable[Instant])(implicit arg0: ClassTag[T]): SCollection[T]

Distribute a local Scala Iterable with timestamps to form an SCollection.
def parallelizeTimestamped[T](elems: Iterable[(T, Instant)])(implicit arg0: ClassTag[T]): SCollection[T]

Distribute a local Scala Iterable with timestamps to form an SCollection.
def pipeline: Pipeline

Dataflow pipeline.
def pubsubSubscription(sub: String, idLabel: String = null, timestampLabel: String = null): SCollection[String]

Get an SCollection for a Pub/Sub subscription.
def pubsubTopic(topic: String, idLabel: String = null, timestampLabel: String = null): SCollection[String]

Get an SCollection for a Pub/Sub topic.
def setName(name: String): Unit

Set name for the context.
def sumAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

Create a new Accumulator that keeps track of the sum of values.
Create a new Accumulator that keeps track of the sum of values. See SCollection.withAccumulator for examples.
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def tableRowJsonFile(path: String): SCollection[TableRow]

Get an SCollection of TableRow for a JSON file.
def textFile(path: String): SCollection[String]

Get an SCollection for a text file.
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
def wrap[T](p: PCollection[T])(implicit arg0: ClassTag[T]): SCollection[T]

Wrap a PCollection.

class ScioContext extends AnyRef

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

def addArtifacts(extraLocalArtifacts: List[String]): Unit

final def asInstanceOf[T0]: T0

def avroFile[T](path: String, schema: Schema = null)(implicit arg0: ClassTag[T]): SCollection[T]

def bigQuerySelect(sqlQuery: String): SCollection[TableRow]

def bigQueryTable(tableSpec: String): SCollection[TableRow]

def bigQueryTable(table: TableReference): SCollection[TableRow]

def clone(): AnyRef

def close(): ScioResult

def datastore(datasetId: String, query: Query): SCollection[Entity]

def distCache[F](uris: Seq[String])(initFn: (Seq[File]) ⇒ F): DistCache[F]

def distCache[F](uri: String)(initFn: (File) ⇒ F): DistCache[F]

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

def isClosed: Boolean

final def isInstanceOf[T0]: Boolean

def maxAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

def minAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def objectFile[T](path: String)(implicit arg0: ClassTag[T]): SCollection[T]

val options: DataflowPipelineOptions

def parallelize[K, V](elems: Map[K, V])(implicit arg0: ClassTag[K], arg1: ClassTag[V]): SCollection[(K, V)]

def parallelize[T](elems: Iterable[T])(implicit arg0: ClassTag[T]): SCollection[T]

def parallelizeTimestamped[T](elems: Iterable[T], timestamps: Iterable[Instant])(implicit arg0: ClassTag[T]): SCollection[T]

def parallelizeTimestamped[T](elems: Iterable[(T, Instant)])(implicit arg0: ClassTag[T]): SCollection[T]

def pipeline: Pipeline

def pubsubSubscription(sub: String, idLabel: String = null, timestampLabel: String = null): SCollection[String]

def pubsubTopic(topic: String, idLabel: String = null, timestampLabel: String = null): SCollection[String]

def setName(name: String): Unit

def sumAccumulator[T](n: String)(implicit at: AccumulatorType[T]): Accumulator[T]

final def synchronized[T0](arg0: ⇒ T0): T0

def tableRowJsonFile(path: String): SCollection[TableRow]

def textFile(path: String): SCollection[String]

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

def wrap[T](p: PCollection[T])(implicit arg0: ClassTag[T]): SCollection[T]

Inherited from AnyRef

Inherited from Any

Accumulators

Distributed Cache

In-memory Collections

Input Sources

Other Members