Creates ReadConf based on an externally provided map of properties, which overrides the defaults taken from SparkConf.
SparkConf of the Spark context, taken as defaults
externally provided map of properties
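A minimal sketch of how such a factory might merge the two sources, assuming a simplified ReadConf case class and illustrative property keys (the connector's real fields and keys may differ):

```scala
import org.apache.spark.SparkConf

// Simplified stand-in for the connector's ReadConf; fields are illustrative.
case class ReadConf(fetchSize: Int, splitCount: Int)

object ReadConf {
  private val DefaultFetchSize  = 1000
  private val DefaultSplitCount = 10

  // Values from the externally provided map take precedence over SparkConf,
  // which in turn takes precedence over the hard-coded defaults.
  def apply(conf: SparkConf, options: Map[String, String]): ReadConf = {
    def prop(key: String, default: Int): Int =
      options.get(key)
        .orElse(conf.getOption(key))
        .map(_.toInt)
        .getOrElse(default)

    ReadConf(
      fetchSize  = prop("spark.riak.input.fetch-size", DefaultFetchSize),
      splitCount = prop("spark.riak.input.split.count", DefaultSplitCount)
    )
  }
}
```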
Creates ReadConf based on properties provided to SparkConf.
SparkConf of the Spark context containing the Riak-related properties
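Building on the sketch above, the SparkConf-only variant can simply delegate to the map-based factory with an empty override map, so every Riak-related property comes from the Spark context's configuration (the property key is again an illustrative placeholder):

```scala
import org.apache.spark.SparkConf

object ReadConfFromSparkConf {
  // Delegates to the map-based factory with no overrides.
  def apply(conf: SparkConf): ReadConf = ReadConf(conf, Map.empty[String, String])

  def main(args: Array[String]): Unit = {
    val conf = new SparkConf()
      .setAppName("riak-read-example")
      .set("spark.riak.input.fetch-size", "500") // illustrative key
    println(ReadConfFromSparkConf(conf))
  }
}
```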
The Spark docs recommend setting the number of partitions to 3 or 4 times the number of CPUs in your cluster so that work is distributed more evenly among the CPUs. With only 1 partition per core, the job has to wait for the single longest-running task to complete; breaking the work down further lets fast and slow tasks even out, balancing the workload.
Since there is not enough information about the available Spark resources, such as the real number of cores, a 3x multiplier will be used.
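A sketch of that fallback, assuming Spark's defaultParallelism is the best available proxy for the number of cores (the object, constant, and parameter names are illustrative, not the connector's actual API):

```scala
import org.apache.spark.SparkContext

object SmartSplitCount {
  // 3x multiplier applied when the real number of cores is unknown.
  val SmartSplitMultiplier = 3

  // Prefer an explicitly configured split count; otherwise derive one
  // from the default parallelism reported by the Spark context.
  def apply(sc: SparkContext, explicitSplitCount: Option[Int]): Int =
    explicitSplitCount.getOrElse(sc.defaultParallelism * SmartSplitMultiplier)
}
```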