DSVRGD

Instance Constructors

new DSVRGD(uid: String)

Abstract Value Members

abstract def addGradient(weights: Matrix, features: DenseMatrix, labels: DenseMatrix, updateTerm: DenseMatrix, marginCache: DenseMatrix, lossCache: DenseVector): Unit

For a single instance and weights, calculates the gradient and loss.
For a single instance and weights, calculates the gradient and loss. Depending on the direction, adds the gradient and loss to the accumulated data.
weights
Weights to evaluate gradient at
features
Features of the instance to evaluate gradient at
labels
Labels of the instance to evaluate gradient at
updateTerm
Update term to store gradient at
lossCache
Loss vector to record resulting loss values.

Attributes
protected
abstract def extractModel(labelAttributeGroup: AttributeGroup, numLabels: Int, weights: Matrix, dataset: DataFrame): M

Given labels info and the weights matrix, creates appropriate ML models.
Given labels info and the weights matrix, creates appropriate ML models.

Attributes
protected
abstract def weightsDistanceForLabel(oldWeights: Matrix, newWeights: DenseMatrix, label: Int): Double

Evaluates weight distance based on old and new weights images.
Evaluates weight distance based on old and new weights images.
oldWeights
Weights from the previous epoch
newWeights
Weights from the current epoch.
label
Label to check for convergence.
returns
Distance between old and new weights.

Attributes
protected

Concrete Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def $[T](param: Param[T]): T

Attributes
protected
Definition Classes
Params
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
def addL1Reg(l1regParam: Vector, weights: DenseMatrix, updateTerm: DenseMatrix, lossCache: DenseVector, skipRegFeature: Int): DenseMatrix

Attributes
protected
def addL2Reg(l2regParam: Vector, weights: DenseMatrix, updateTerm: DenseMatrix, lossCache: DenseVector, skipRegFeature: Int): DenseMatrix

Adds L2 regularization part to the gradient and loss.
Adds L2 regularization part to the gradient and loss.

Attributes
protected
def adjust(direction: Int, learningRates: DenseMatrix, updateTerm: DenseMatrix, weights: DenseMatrix): DenseMatrix
def applyL1Shrinkage(regParam: Vector, weights: DenseMatrix, skipRegFeature: Int, notDegraded: Set[Int]): DenseMatrix

Apply L1 shrinkage to the updated weights.
Apply L1 shrinkage to the updated weights.

Attributes
protected
final def asInstanceOf[T0]: T0

Definition Classes
Any
def axpy(a: Double, x: Vector, y: Array[Double]): Unit

Definition Classes
HasNetlibBlas
def axpy(a: Double, x: Array[Double], y: Array[Double]): Unit

Definition Classes
HasNetlibBlas
def axpyCompensated(updateTerm: Array[Double], sum: Array[Double], compensator: Array[Double], y: Array[Double], t: Array[Double]): Unit
def blas: BLAS

Definition Classes
HasNetlibBlas
final val cacheTrainData: BooleanParam

Definition Classes
HasCacheTrainData
final def clear(param: Param[_]): DSVRGD.this.type

Definition Classes
Params
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
val convergenceMode: Param[String]
def copy(extra: ParamMap): DSVRGD[M]

Definition Classes
DSVRGD → SummarizableEstimator → Estimator → PipelineStage → Params
def copy(x: Array[Double], y: Array[Double]): Unit

Definition Classes
HasNetlibBlas
def copyValues[T <: Params](to: T, extra: ParamMap): T

Attributes
protected
Definition Classes
Params
final def defaultCopy[T <: Params](extra: ParamMap): T

Attributes
protected
Definition Classes
Params
def dscal(a: Double, data: Array[Double]): Unit

Definition Classes
HasNetlibBlas
final val elasticNetParam: DoubleParam

Definition Classes
HasElasticNetParam
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def evaluateL1Regularization(data: DataFrame, l1Scalar: Double, numLabels: Int): Vector

Given L1 regularization config create a vector with per-label reg param (by default - constant).
Given L1 regularization config create a vector with per-label reg param (by default - constant).

Attributes
protected
def evaluateL2Regularization(data: DataFrame, l2Scalar: Double, numLabels: Int): Vector

Given L2 regularization config create a vector with per-label reg param (by default - constant).
Given L2 regularization config create a vector with per-label reg param (by default - constant).

Attributes
protected
def explainParam(param: Param[_]): String

Definition Classes
Params
def explainParams(): String

Definition Classes
Params
def extractBlock(lossHistory: Array[CompactBuffer[Double]], dataset: DataFrame, names: Map[Int, String], sc: SparkContext): DataFrame
def extractLabelVectors(labelAttributeGroup: AttributeGroup, numLabels: Int, weights: Matrix): Map[String, Vector]

Utility used to split the weights matrix into a label -> vector map.
Utility used to split the weights matrix into a label -> vector map.

Attributes
protected
final def extractParamMap(): ParamMap

Definition Classes
Params
final def extractParamMap(extra: ParamMap): ParamMap

Definition Classes
Params
def extractRow(label: Int, weights: Matrix): Vector

Extracts a single row from a matrix.
Extracts a single row from a matrix.

Attributes
protected
def extractSummaryBlocks(lossHistory: Array[CompactBuffer[Double]], weightDiffHistory: Array[CompactBuffer[Double]], weightNormHistory: Array[CompactBuffer[Double]], dataset: DataFrame, labelAttributeGroup: AttributeGroup): Map[Block, DataFrame]

Extracts summary blocks from iterations loss history.
Extracts summary blocks from iterations loss history.

Attributes
protected
def f2jBLAS: BLAS

Definition Classes
HasNetlibBlas
final val featuresCol: Param[String]

Definition Classes
HasFeaturesCol
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
def fit(dataset: Dataset[_]): M

Definition Classes
DSVRGD → Estimator
def fit(dataset: Dataset[_], paramMaps: Array[ParamMap]): Seq[M]

Definition Classes
Estimator
Annotations
@Since( "2.0.0" )
def fit(dataset: Dataset[_], paramMap: ParamMap): M

Definition Classes
Estimator
Annotations
@Since( "2.0.0" )
def fit(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): M

Definition Classes
Estimator
Annotations
@Since( "2.0.0" ) @varargs()
def fullGradientAndLoss(l1regParam: Vector, l2regParam: Vector, localWeights: DenseMatrix, marginCache: DenseMatrix, lossCache: DenseVector, updateTerm: DenseMatrix, skipRegFeature: Int, features: DenseMatrix, labels: DenseMatrix): Any
final def get[T](param: Param[T]): Option[T]

Definition Classes
Params
final def getCacheTrainData: Boolean

Definition Classes
HasCacheTrainData
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
final def getDefault[T](param: Param[T]): Option[T]

Definition Classes
Params
final def getElasticNetParam: Double

Definition Classes
HasElasticNetParam
final def getFeaturesCol: String

Definition Classes
HasFeaturesCol
final def getLabelCol: String

Definition Classes
HasLabelCol
final def getMaxIter: Int

Definition Classes
HasMaxIter
def getNotConverged(activeLabels: Map[Int, Int], lossHistory: Array[CompactBuffer[Double]], weightDiffHistory: Array[CompactBuffer[Double]], weightNormHistory: Array[CompactBuffer[Double]], tolerance: Double): Array[Int]

Extracts not converged labels based on actual and previous weights and on the loss history.
Extracts not converged labels based on actual and previous weights and on the loss history.

Attributes
protected
final def getOrDefault[T](param: Param[T]): T

Definition Classes
Params
def getParam(paramName: String): Param[Any]

Definition Classes
Params
final def getPredictionCol: String

Definition Classes
HasPredictionCol
final def getRegParam: Double

Definition Classes
HasRegParam
final def getTol: Double

Definition Classes
HasTol
final def hasDefault[T](param: Param[T]): Boolean

Definition Classes
Params
def hasParam(paramName: String): Boolean

Definition Classes
Params
def hashCode(): Int

Definition Classes
AnyRef → Any
def initializeLogIfNecessary(isInterpreter: Boolean): Unit

Attributes
protected
Definition Classes
Logging
def initializeWeights(data: DataFrame, numLabels: Int, numFeatures: Int): Matrix
final def isDefined(param: Param[_]): Boolean

Definition Classes
Params
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
final def isSet(param: Param[_]): Boolean

Definition Classes
Params
def isTraceEnabled(): Boolean

Attributes
protected
Definition Classes
Logging
final val labelCol: Param[String]

Definition Classes
HasLabelCol
val lastIsIntercept: BooleanParam
val learningRate: DoubleParam
val localMinibatchSize: Param[Int]
def log: Logger

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logName: String

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def lossDifferenceForLabel(lossHistory: Array[CompactBuffer[Double]], label: Int): Double

Evaluates loss difference simply as relative change
val lossIncreaseTolerance: DoubleParam
final val maxIter: IntParam

Definition Classes
HasMaxIter
def merge(labelsMap: Map[Int, Int], weights: Matrix, newWeights: DenseMatrix): DenseMatrix

Merges weights from the new epoch with the overall weights.
Merges weights from the new epoch with the overall weights. Dimensions of the weight matrices might differ when some of the labels have already converged and no longer participate in the descent.

Attributes
protected
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
lazy val params: Array[Param[_]]

Definition Classes
Params
final val predictionCol: Param[String]

Definition Classes
HasPredictionCol
final val regParam: DoubleParam

Definition Classes
HasRegParam
def relabel(activeLabels: Array[Int], labels: Vector): DenseVector

Used to preserve only active (not yet converged) labels into a vector
Used to preserve only active (not yet converged) labels into a vector

Attributes
protected
def relabelMatrix(activeLabels: Array[Int], matrix: Matrix): Matrix

Used to preserve only active (not yet converged) labels into a matrix
Used to preserve only active (not yet converged) labels into a matrix

Attributes
protected
final def set(paramPair: ParamPair[_]): DSVRGD.this.type

Attributes
protected
Definition Classes
Params
final def set(param: String, value: Any): DSVRGD.this.type

Attributes
protected
Definition Classes
Params
final def set[T](param: Param[T], value: T): DSVRGD.this.type

Definition Classes
Params
def setCacheTrainData(value: Boolean): DSVRGD.this.type

Definition Classes
HasCacheTrainData
def setConvergenceMode(value: String): DSVRGD.this.type
final def setDefault(paramPairs: ParamPair[_]*): DSVRGD.this.type

Attributes
protected
Definition Classes
Params
final def setDefault[T](param: Param[T], value: T): DSVRGD.this.type

Attributes
protected
Definition Classes
Params
def setElasticNetParam(value: Double): DSVRGD.this.type
def setLastIsIntercept(value: Boolean): DSVRGD.this.type
def setLearningRate(value: Double): DSVRGD.this.type
def setLocalMinibatchSize(value: Int): DSVRGD.this.type
def setMaxIter(value: Int): DSVRGD.this.type
def setRegParam(value: Double): DSVRGD.this.type
def setSlowDownFactor(value: Double): DSVRGD.this.type
def setSpeedUpFactor(value: Double): DSVRGD.this.type
def setTol(value: Double): DSVRGD.this.type
def singleStep(data: RDD[(Vector, DenseVector)], weights: Broadcast[Matrix], avgWeights: Broadcast[Matrix], avgGradient: Broadcast[Matrix], l1regParam: Vector, l2regParam: Vector, stepNum: Int, labelLearningRates: DenseVector): DistributedSgdState

Single epoch of the descent.
Single epoch of the descent.
data
Data with features and labels
weights
Weights matrix to start with.
avgWeights
Average of the weights visited during the previous epoch.
avgGradient
Average of the gradients seen during the previous epoch.
l1regParam
Vector with the strength of L1 regularization (null if disabled)
l2regParam
Vector with the strength of L2 regularization (null if disabled)
stepNum
Number of epoch
returns
State with weights, averages and loss from this epoch

Attributes
protected
val slowDownFactor: DoubleParam
val speedUpFactor: DoubleParam
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toDense(weights: Broadcast[Matrix]): DenseMatrix
def toString(): String

Definition Classes
Identifiable → AnyRef → Any
final val tol: DoubleParam

Definition Classes
HasTol
def transformSchema(schema: StructType): StructType

Definition Classes
DSVRGD → PipelineStage
Annotations
@DeveloperApi()
def transformSchema(schema: StructType, logging: Boolean): StructType

Attributes
protected
Definition Classes
PipelineStage
Annotations
@DeveloperApi()
val uid: String

Definition Classes
DSVRGD → Identifiable
def updateWeights(stepSize: Double, updateTerm: DenseMatrix, weights: DenseMatrix): Unit

Updates the weights given update term and current value.
Updates the weights given update term and current value.

Attributes
protected
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
def weightNorm(newWeights: Matrix, label: Int, skipRegFeature: Int): Double

Evaluates weight norm for a given label.
Evaluates weight norm for a given label.
newWeights
Weights matrix
label
Label to evaluate weights
returns
Weights norm.

Attributes
protected

abstract class DSVRGD[M <: ModelWithSummary[M]] extends Estimator[M] with SummarizableEstimator[M] with HasPredictionCol with HasFeaturesCol with HasLabelCol with HasRegParam with HasElasticNetParam with HasNetlibBlas with HasMaxIter with HasTol with HasCacheTrainData

Instance Constructors

new DSVRGD(uid: String)

Abstract Value Members

abstract def addGradient(weights: Matrix, features: DenseMatrix, labels: DenseMatrix, updateTerm: DenseMatrix, marginCache: DenseMatrix, lossCache: DenseVector): Unit

abstract def extractModel(labelAttributeGroup: AttributeGroup, numLabels: Int, weights: Matrix, dataset: DataFrame): M

abstract def weightsDistanceForLabel(oldWeights: Matrix, newWeights: DenseMatrix, label: Int): Double

Concrete Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def $[T](param: Param[T]): T

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

def addL1Reg(l1regParam: Vector, weights: DenseMatrix, updateTerm: DenseMatrix, lossCache: DenseVector, skipRegFeature: Int): DenseMatrix

def addL2Reg(l2regParam: Vector, weights: DenseMatrix, updateTerm: DenseMatrix, lossCache: DenseVector, skipRegFeature: Int): DenseMatrix

def adjust(direction: Int, learningRates: DenseMatrix, updateTerm: DenseMatrix, weights: DenseMatrix): DenseMatrix

def applyL1Shrinkage(regParam: Vector, weights: DenseMatrix, skipRegFeature: Int, notDegraded: Set[Int]): DenseMatrix

final def asInstanceOf[T0]: T0

def axpy(a: Double, x: Vector, y: Array[Double]): Unit

def axpy(a: Double, x: Array[Double], y: Array[Double]): Unit

def axpyCompensated(updateTerm: Array[Double], sum: Array[Double], compensator: Array[Double], y: Array[Double], t: Array[Double]): Unit

def blas: BLAS

final val cacheTrainData: BooleanParam

final def clear(param: Param[_]): DSVRGD.this.type

def clone(): AnyRef

val convergenceMode: Param[String]

def copy(extra: ParamMap): DSVRGD[M]

def copy(x: Array[Double], y: Array[Double]): Unit

def copyValues[T <: Params](to: T, extra: ParamMap): T

final def defaultCopy[T <: Params](extra: ParamMap): T

def dscal(a: Double, data: Array[Double]): Unit

final val elasticNetParam: DoubleParam

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def evaluateL1Regularization(data: DataFrame, l1Scalar: Double, numLabels: Int): Vector

def evaluateL2Regularization(data: DataFrame, l2Scalar: Double, numLabels: Int): Vector

def explainParam(param: Param[_]): String

def explainParams(): String

def extractBlock(lossHistory: Array[CompactBuffer[Double]], dataset: DataFrame, names: Map[Int, String], sc: SparkContext): DataFrame

def extractLabelVectors(labelAttributeGroup: AttributeGroup, numLabels: Int, weights: Matrix): Map[String, Vector]

final def extractParamMap(): ParamMap

final def extractParamMap(extra: ParamMap): ParamMap

def extractRow(label: Int, weights: Matrix): Vector

def extractSummaryBlocks(lossHistory: Array[CompactBuffer[Double]], weightDiffHistory: Array[CompactBuffer[Double]], weightNormHistory: Array[CompactBuffer[Double]], dataset: DataFrame, labelAttributeGroup: AttributeGroup): Map[Block, DataFrame]

def f2jBLAS: BLAS

final val featuresCol: Param[String]

def finalize(): Unit

def fit(dataset: Dataset[_]): M

def fit(dataset: Dataset[_], paramMaps: Array[ParamMap]): Seq[M]

def fit(dataset: Dataset[_], paramMap: ParamMap): M

def fit(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): M

def fullGradientAndLoss(l1regParam: Vector, l2regParam: Vector, localWeights: DenseMatrix, marginCache: DenseMatrix, lossCache: DenseVector, updateTerm: DenseMatrix, skipRegFeature: Int, features: DenseMatrix, labels: DenseMatrix): Any

final def get[T](param: Param[T]): Option[T]

final def getCacheTrainData: Boolean

final def getClass(): Class[_]

final def getDefault[T](param: Param[T]): Option[T]

final def getElasticNetParam: Double

final def getFeaturesCol: String

final def getLabelCol: String

final def getMaxIter: Int

def getNotConverged(activeLabels: Map[Int, Int], lossHistory: Array[CompactBuffer[Double]], weightDiffHistory: Array[CompactBuffer[Double]], weightNormHistory: Array[CompactBuffer[Double]], tolerance: Double): Array[Int]

final def getOrDefault[T](param: Param[T]): T

def getParam(paramName: String): Param[Any]

final def getPredictionCol: String

final def getRegParam: Double

final def getTol: Double

final def hasDefault[T](param: Param[T]): Boolean

def hasParam(paramName: String): Boolean

def hashCode(): Int

def initializeLogIfNecessary(isInterpreter: Boolean): Unit

def initializeWeights(data: DataFrame, numLabels: Int, numFeatures: Int): Matrix

final def isDefined(param: Param[_]): Boolean

final def isInstanceOf[T0]: Boolean

final def isSet(param: Param[_]): Boolean

def isTraceEnabled(): Boolean

final val labelCol: Param[String]

val lastIsIntercept: BooleanParam

val learningRate: DoubleParam