LDA

Value Members

final def !=(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def !=(arg0: Any): Boolean

Definition Classes
Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def ==(arg0: Any): Boolean

Definition Classes
Any
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
def incrementalTrain(docs: RDD[(Long, Vector)], computedModel: LocalLDAModel, alphaAS: Double = 0.1, totalIter: Int = 150, useLightLDA: Boolean = false): DistributedLDAModel

Incremental training.
Incrementally trains an LDA model on docs, starting from the previously computed model computedModel.
docs
computedModel
alphaAS
totalIter
useLightLDA
returns
DistributedLDAModel
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
def train(docs: RDD[(Long, Vector)], totalIter: Int = 150, numTopics: Int = 2048, alpha: Double = 0.001, beta: Double = 0.01, alphaAS: Double = 0.1, useLightLDA: Boolean = false): DistributedLDAModel

LDA training.
Trains an LDA topic model on the given documents.
docs
RDD of documents, which are term (word) count vectors paired with IDs. The term count vectors are "bags of words" with a fixed-size vocabulary (where the vocabulary size is the length of the vector). Document IDs must be unique and >= 0.
totalIter
the number of iterations
numTopics
the number of topics (5000+ for large data)
alpha
recommended value: 5.0 / numTopics
beta
recommended range: 0.001 to 0.1
alphaAS
recommended range: 0.01 to 1.0
useLightLDA
whether to use the LightLDA sampling algorithm; false is recommended for short text
returns
DistributedLDAModel
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

object LDA extends Serializable

Value Members

final def !=(arg0: AnyRef): Boolean

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: AnyRef): Boolean

final def ==(arg0: Any): Boolean

final def asInstanceOf[T0]: T0

def clone(): AnyRef

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

def incrementalTrain(docs: RDD[(Long, Vector)], computedModel: LocalLDAModel, alphaAS: Double = 0.1, totalIter: Int = 150, useLightLDA: Boolean = false): DistributedLDAModel

final def isInstanceOf[T0]: Boolean

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

def train(docs: RDD[(Long, Vector)], totalIter: Int = 150, numTopics: Int = 2048, alpha: Double = 0.001, beta: Double = 0.01, alphaAS: Double = 0.1, useLightLDA: Boolean = false): DistributedLDAModel

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from Serializable

Inherited from Serializable

Inherited from AnyRef

Inherited from Any

Ungrouped