rdd

Type Members

class ADAMContext extends Serializable with Logging

The ADAMContext provides functions on top of a SparkContext for loading genomic data.
trait ADAMSaveAnyArgs extends SaveArgs

Argument configuration for saving any output format.
abstract class AvroGenomicRDD[T, U <: Product, V <: AvroGenomicRDD[T, U, V]] extends ADAMRDDFunctions[T] with GenomicDataset[T, U, V]

An abstract class that extends GenomicRDD, where the underlying data are Avro IndexedRecords.
abstract class AvroRecordGroupGenomicRDD[T, U <: Product, V <: AvroRecordGroupGenomicRDD[T, U, V]] extends AvroGenomicRDD[T, U, V] with GenomicRDDWithLineage[T, V]

An abstract class describing a GenomicRDD that extends AvroGenomicRDD and mixes in GenomicRDDWithLineage.
case class FullOuterShuffleRegionJoin[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$11: ClassTag[T], evidence$12: ClassTag[U]) extends ShuffleRegionJoin[T, U, Option[T], Option[U]] with SortedIntervalPartitionJoinWithVictims[T, U, Option[T], Option[U]] with Product with Serializable
case class GenericGenomicRDD[T](rdd: RDD[T], sequences: SequenceDictionary, regionFn: (T) ⇒ Seq[ReferenceRegion], optPartitionMap: Option[Array[Option[(ReferenceRegion, ReferenceRegion)]]] = scala.None)(implicit tTag: ClassTag[T]) extends GenomicRDD[T, GenericGenomicRDD[T]] with Product with Serializable
case class GenomeBins(binSize: Long, seqLengths: Map[String, Long]) extends Serializable with Product

Partition a genome into a set of bins.
trait GenomicDataset[T, U <: Product, V <: GenomicDataset[T, U, V]] extends GenomicRDD[T, V]

A trait describing a GenomicRDD that also supports the Spark SQL APIs.
trait GenomicDatasetConversion[T <: Product, U <: GenomicDataset[_, T, U], X <: Product, Y <: GenomicDataset[_, X, Y]] extends Function2[U, Dataset[X], Y]
case class GenomicPositionPartitioner(numParts: Int, seqLengths: Map[String, Long]) extends Partitioner with Logging with Product with Serializable

GenomicPositionPartitioner partitions ReferencePosition objects into separate, spatially-coherent regions of the genome.
trait GenomicRDD[T, U <: GenomicRDD[T, U]] extends Logging

A trait that wraps an RDD of genomic data with helpful metadata.
trait GenomicRDDWithLineage[T, U <: GenomicRDDWithLineage[T, U]] extends GenomicRDD[T, U]
case class GenomicRegionPartitioner(partitionSize: Long, seqLengths: Map[String, Long], start: Boolean = true) extends Partitioner with Logging with Product with Serializable

A partitioner for ReferenceRegion-keyed data.
trait InFormatter[T, U <: GenomicRDD[T, U], V <: InFormatter[T, U, V]] extends Serializable

Formats data going into a pipe to an invoked process.
trait InFormatterCompanion[T, U <: GenomicRDD[T, U], V <: InFormatter[T, U, V]] extends AnyRef

A trait for singleton objects that build an InFormatter from a GenomicRDD.
case class InnerShuffleRegionJoin[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$3: ClassTag[T], evidence$4: ClassTag[U]) extends ShuffleRegionJoin[T, U, T, U] with VictimlessSortedIntervalPartitionJoin[T, U, T, U] with Product with Serializable
case class InnerShuffleRegionJoinAndGroupByLeft[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$5: ClassTag[T], evidence$6: ClassTag[U]) extends ShuffleRegionJoin[T, U, T, Iterable[U]] with VictimlessSortedIntervalPartitionJoin[T, U, T, Iterable[U]] with Product with Serializable
case class InnerTreeRegionJoin[T, U]()(implicit evidence$1: ClassTag[T], evidence$2: ClassTag[U]) extends RegionJoin[T, U, T, U] with TreeRegionJoin[T, U, T, U] with Product with Serializable

Implements an inner region join where the left side of the join is broadcast.
case class InnerTreeRegionJoinAndGroupByRight[T, U]()(implicit evidence$5: ClassTag[T], evidence$6: ClassTag[U]) extends RegionJoin[T, U, Iterable[T], U] with TreeRegionJoin[T, U, Iterable[T], U] with Product with Serializable

Performs an inner region join, followed logically by grouping by the right value.
case class LeftOuterShuffleRegionJoin[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$7: ClassTag[T], evidence$8: ClassTag[U]) extends ShuffleRegionJoin[T, U, T, Option[U]] with VictimlessSortedIntervalPartitionJoin[T, U, T, Option[U]] with Product with Serializable
case class LeftOuterShuffleRegionJoinAndGroupByLeft[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$9: ClassTag[T], evidence$10: ClassTag[U]) extends ShuffleRegionJoin[T, U, T, Iterable[U]] with VictimlessSortedIntervalPartitionJoin[T, U, T, Iterable[U]] with Product with Serializable
abstract class MultisampleAvroGenomicRDD[T, U <: Product, V <: MultisampleAvroGenomicRDD[T, U, V]] extends AvroGenomicRDD[T, U, V] with MultisampleGenomicRDD[T, V]

An abstract class that extends the MultisampleGenomicRDD trait, where the data are Avro IndexedRecords.
trait MultisampleGenomicRDD[T, U <: MultisampleGenomicRDD[T, U]] extends GenomicRDD[T, U]

A trait describing a GenomicRDD with data from multiple samples.
trait OutFormatter[T] extends Serializable

Deserializes data coming out of a pipe from an invoked process.
case class ReferencePartitioner(sd: SequenceDictionary) extends Partitioner with Product with Serializable

Repartitions objects that are keyed by a ReferencePosition or ReferenceRegion into a single partition per contig.
abstract class RegionJoin[T, U, RT, RU] extends Serializable

An abstract class describing a join in the genomic coordinate space between two RDDs where the values are keyed by a ReferenceRegion.
case class RightOuterShuffleRegionJoinAndGroupByLeft[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$13: ClassTag[T], evidence$14: ClassTag[U]) extends ShuffleRegionJoin[T, U, Option[T], Iterable[U]] with SortedIntervalPartitionJoinWithVictims[T, U, Option[T], Iterable[U]] with Product with Serializable
case class RightOuterTreeRegionJoin[T, U]()(implicit evidence$3: ClassTag[T], evidence$4: ClassTag[U]) extends RegionJoin[T, U, Option[T], U] with TreeRegionJoin[T, U, Option[T], U] with Product with Serializable

Implements a right outer region join where the left side of the join is broadcast.
case class RightOuterTreeRegionJoinAndGroupByRight[T, U]()(implicit evidence$7: ClassTag[T], evidence$8: ClassTag[U]) extends RegionJoin[T, U, Iterable[T], U] with TreeRegionJoin[T, U, Iterable[T], U] with Product with Serializable

Performs a right outer region join, followed logically by grouping by the right value.
sealed abstract class ShuffleRegionJoin[T, U, RT, RU] extends RegionJoin[T, U, RT, RU]

An abstract class describing join implementations that are based on a sort-merge join.
sealed trait SortedIntervalPartitionJoinWithVictims[T, U, RT, RU] extends ShuffleRegionJoin[T, U, RT, RU]
trait TreeRegionJoin[T, U, RT, RU] extends RegionJoin[T, U, RT, RU]

Implements a shuffle-free (broadcast) region join.
sealed trait VictimlessSortedIntervalPartitionJoin[T, U, RT, RU] extends ShuffleRegionJoin[T, U, RT, RU]

Value Members

object ADAMContext extends Serializable

This singleton provides an implicit conversion from a SparkContext to the ADAMContext, as well as implicit functions for the Pipe API.
object GenomicPositionPartitioner extends Serializable

Helper for creating genomic position partitioners.
object GenomicRegionPartitioner extends Serializable

Helper object for creating GenomicRegionPartitioners.
package contig
package feature
package fragment
package read
package variant

package rdd

Type Members

class ADAMContext extends Serializable with Logging

trait ADAMSaveAnyArgs extends SaveArgs

abstract class AvroGenomicRDD[T, U <: Product, V <: AvroGenomicRDD[T, U, V]] extends ADAMRDDFunctions[T] with GenomicDataset[T, U, V]

abstract class AvroRecordGroupGenomicRDD[T, U <: Product, V <: AvroRecordGroupGenomicRDD[T, U, V]] extends AvroGenomicRDD[T, U, V] with GenomicRDDWithLineage[T, V]

case class GenomeBins(binSize: Long, seqLengths: Map[String, Long]) extends Serializable with Product

trait GenomicDataset[T, U <: Product, V <: GenomicDataset[T, U, V]] extends GenomicRDD[T, V]

trait GenomicDatasetConversion[T <: Product, U <: GenomicDataset[_, T, U], X <: Product, Y <: GenomicDataset[_, X, Y]] extends Function2[U, Dataset[X], Y]

case class GenomicPositionPartitioner(numParts: Int, seqLengths: Map[String, Long]) extends Partitioner with Logging with Product with Serializable

trait GenomicRDD[T, U <: GenomicRDD[T, U]] extends Logging

trait GenomicRDDWithLineage[T, U <: GenomicRDDWithLineage[T, U]] extends GenomicRDD[T, U]

case class GenomicRegionPartitioner(partitionSize: Long, seqLengths: Map[String, Long], start: Boolean = true) extends Partitioner with Logging with Product with Serializable

trait InFormatter[T, U <: GenomicRDD[T, U], V <: InFormatter[T, U, V]] extends Serializable

trait InFormatterCompanion[T, U <: GenomicRDD[T, U], V <: InFormatter[T, U, V]] extends AnyRef

case class InnerShuffleRegionJoin[T, U](leftRdd: RDD[(ReferenceRegion, T)], rightRdd: RDD[(ReferenceRegion, U)])(implicit evidence$3: ClassTag[T], evidence$4: ClassTag[U]) extends ShuffleRegionJoin[T, U, T, U] with VictimlessSortedIntervalPartitionJoin[T, U, T, U] with Product with Serializable

case class InnerTreeRegionJoin[T, U]()(implicit evidence$1: ClassTag[T], evidence$2: ClassTag[U]) extends RegionJoin[T, U, T, U] with TreeRegionJoin[T, U, T, U] with Product with Serializable

case class InnerTreeRegionJoinAndGroupByRight[T, U]()(implicit evidence$5: ClassTag[T], evidence$6: ClassTag[U]) extends RegionJoin[T, U, Iterable[T], U] with TreeRegionJoin[T, U, Iterable[T], U] with Product with Serializable

abstract class MultisampleAvroGenomicRDD[T, U <: Product, V <: MultisampleAvroGenomicRDD[T, U, V]] extends AvroGenomicRDD[T, U, V] with MultisampleGenomicRDD[T, V]

trait MultisampleGenomicRDD[T, U <: MultisampleGenomicRDD[T, U]] extends GenomicRDD[T, U]

trait OutFormatter[T] extends Serializable

case class ReferencePartitioner(sd: SequenceDictionary) extends Partitioner with Product with Serializable

abstract class RegionJoin[T, U, RT, RU] extends Serializable

case class RightOuterTreeRegionJoin[T, U]()(implicit evidence$3: ClassTag[T], evidence$4: ClassTag[U]) extends RegionJoin[T, U, Option[T], U] with TreeRegionJoin[T, U, Option[T], U] with Product with Serializable

case class RightOuterTreeRegionJoinAndGroupByRight[T, U]()(implicit evidence$7: ClassTag[T], evidence$8: ClassTag[U]) extends RegionJoin[T, U, Iterable[T], U] with TreeRegionJoin[T, U, Iterable[T], U] with Product with Serializable

sealed abstract class ShuffleRegionJoin[T, U, RT, RU] extends RegionJoin[T, U, RT, RU]

sealed trait SortedIntervalPartitionJoinWithVictims[T, U, RT, RU] extends ShuffleRegionJoin[T, U, RT, RU]

trait TreeRegionJoin[T, U, RT, RU] extends RegionJoin[T, U, RT, RU]

sealed trait VictimlessSortedIntervalPartitionJoin[T, U, RT, RU] extends ShuffleRegionJoin[T, U, RT, RU]

Value Members

object ADAMContext extends Serializable

object GenomicPositionPartitioner extends Serializable

object GenomicRegionPartitioner extends Serializable

package contig

package feature

package fragment

package read

package variant

Ungrouped