Class

com.salesforce.op.stages.impl.feature

TextMapHashingVectorizerModel

Related Doc: package feature

Permalink

final class TextMapHashingVectorizerModel[T <: OPMap[String]] extends OPMapVectorizerModel[String, T] with TextTokenizerParams with HashingFun

Linear Supertypes
HashingFun, TextTokenizerParams, LanguageDetectionParams, OPMapVectorizerModel[String, T], CleanTextMapFun, CleanTextFun, SequenceModel[T, OPVector], OpTransformerN[T, OPVector], OpTransformer, OpPipelineStageN[T, OPVector], HasInN, OpPipelineStage[OPVector], OpPipelineStageBase, MLWritable, OpPipelineStageParams, InputParams, Model[SequenceModel[T, OPVector]], Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. TextMapHashingVectorizerModel
  2. HashingFun
  3. TextTokenizerParams
  4. LanguageDetectionParams
  5. OPMapVectorizerModel
  6. CleanTextMapFun
  7. CleanTextFun
  8. SequenceModel
  9. OpTransformerN
  10. OpTransformer
  11. OpPipelineStageN
  12. HasInN
  13. OpPipelineStage
  14. OpPipelineStageBase
  15. MLWritable
  16. OpPipelineStageParams
  17. InputParams
  18. Model
  19. Transformer
  20. PipelineStage
  21. Logging
  22. Params
  23. Serializable
  24. Serializable
  25. Identifiable
  26. AnyRef
  27. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Type Members

  1. final type InputFeatures = Array[FeatureLike[T]]

    Permalink
    Definition Classes
    OpPipelineStageN → OpPipelineStage → InputParams
  2. type KeyValue = (String) ⇒ Any

    Permalink
    Definition Classes
    OpTransformer
  3. final type OutputFeatures = FeatureLike[OPVector]

    Permalink
    Definition Classes
    OpPipelineStage → OpPipelineStageBase

Value Members

  1. final def !=(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  3. final def $[T](param: Param[T]): T

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  4. final def ==(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  5. val args: OPMapVectorizerModelArgs

    Permalink
    Definition Classes
    OPMapVectorizerModel
  6. final def asInstanceOf[T0]: T0

    Permalink
    Definition Classes
    Any
  7. final val autoDetectLanguage: BooleanParam

    Permalink

    Indicates whether to attempt language detection.

    Indicates whether to attempt language detection.

    Definition Classes
    LanguageDetectionParams
  8. final val autoDetectThreshold: DoubleParam

    Permalink

    Language detection threshold.

    Language detection threshold. If none of the detected languages have confidence greater than the threshold then defaultLanguage is used.

    Definition Classes
    LanguageDetectionParams
  9. final def checkInputLength(features: Array[_]): Boolean

    Permalink
    Definition Classes
    OpPipelineStageN → InputParams
  10. final def checkSerializable: Try[Unit]

    Permalink
    Definition Classes
    OpTransformerN → OpPipelineStageBase
  11. def cleanMap[V](m: Map[String, V], shouldCleanKey: Boolean, shouldCleanValue: Boolean): Map[String, V]

    Permalink
    Definition Classes
    CleanTextMapFun
  12. def cleanTextFn(s: String, shouldClean: Boolean): String

    Permalink
    Definition Classes
    CleanTextFun
  13. final def clear(param: Param[_]): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    Params
  14. def clone(): AnyRef

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  15. def convertFn: (Map[String, String]) ⇒ Map[String, Double]

    Permalink
  16. final def copy(extra: ParamMap): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    OpPipelineStageBase → Params
  17. def copyValues[T <: Params](to: T, extra: ParamMap): T

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  18. final def defaultCopy[T <: Params](extra: ParamMap): T

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  19. final val defaultLanguage: Param[String]

    Permalink

    Default language to assume in case autoDetectLanguage is disabled or failed to make a good enough prediction.

    Default language to assume in case autoDetectLanguage is disabled or failed to make a good enough prediction.

    Definition Classes
    LanguageDetectionParams
  20. final def eq(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  21. def equals(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  22. def explainParam(param: Param[_]): String

    Permalink
    Definition Classes
    Params
  23. def explainParams(): String

    Permalink
    Definition Classes
    Params
  24. final def extractParamMap(): ParamMap

    Permalink
    Definition Classes
    Params
  25. final def extractParamMap(extra: ParamMap): ParamMap

    Permalink
    Definition Classes
    Params
  26. def finalize(): Unit

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  27. final def get[T](param: Param[T]): Option[T]

    Permalink
    Definition Classes
    Params
  28. def getAutoDetectLanguage: Boolean

    Permalink
    Definition Classes
    LanguageDetectionParams
  29. def getAutoDetectThreshold: Double

    Permalink
    Definition Classes
    LanguageDetectionParams
  30. final def getClass(): Class[_]

    Permalink
    Definition Classes
    AnyRef → Any
  31. final def getDefault[T](param: Param[T]): Option[T]

    Permalink
    Definition Classes
    Params
  32. def getDefaultLanguage: Language

    Permalink
    Definition Classes
    LanguageDetectionParams
  33. final def getInputFeature[T <: FeatureType](i: Int): Option[FeatureLike[T]]

    Permalink
    Definition Classes
    InputParams
  34. final def getInputFeatures(): Array[OPFeature]

    Permalink
    Definition Classes
    InputParams
  35. final def getInputSchema(): StructType

    Permalink
    Definition Classes
    OpPipelineStageParams
  36. final def getMetadata(): Metadata

    Permalink
    Definition Classes
    OpPipelineStageParams
  37. def getMinTokenLength: Int

    Permalink
    Definition Classes
    TextTokenizerParams
  38. final def getOrDefault[T](param: Param[T]): T

    Permalink
    Definition Classes
    Params
  39. def getOutput(): FeatureLike[OPVector]

    Permalink
    Definition Classes
    OpPipelineStageN → OpPipelineStageBase
  40. final def getOutputFeatureName: String

    Permalink
    Definition Classes
    OpPipelineStage
  41. def getParam(paramName: String): Param[Any]

    Permalink
    Definition Classes
    Params
  42. def getToLowercase: Boolean

    Permalink
    Definition Classes
    TextTokenizerParams
  43. final def getTransientFeature(i: Int): Option[TransientFeature]

    Permalink
    Definition Classes
    InputParams
  44. final def getTransientFeatures(): Array[TransientFeature]

    Permalink
    Definition Classes
    InputParams
  45. final def hasDefault[T](param: Param[T]): Boolean

    Permalink
    Definition Classes
    Params
  46. def hasParam(paramName: String): Boolean

    Permalink
    Definition Classes
    Params
  47. def hasParent: Boolean

    Permalink
    Definition Classes
    Model
  48. def hash[T <: OPCollection](in: Seq[T], features: Array[TransientFeature], params: HashingFunctionParams): OPVector

    Permalink

    Hashes input sequence of values into OPVector using the supplied hashing params

    Hashes input sequence of values into OPVector using the supplied hashing params

    Attributes
    protected
    Definition Classes
    HashingFun
  49. def hashCode(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  50. val hashSpaceStrategy: HashSpaceStrategy

    Permalink
  51. def hashingTF(params: HashingFunctionParams): HashingTF

    Permalink

    HashingTF instance

    HashingTF instance

    Attributes
    protected
    Definition Classes
    HashingFun
  52. final def inN: Array[TransientFeature]

    Permalink
    Attributes
    protected
    Definition Classes
    HasInN
  53. def initializeLogIfNecessary(isInterpreter: Boolean): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  54. final def inputAsArray(in: InputFeatures): Array[OPFeature]

    Permalink
    Definition Classes
    OpPipelineStageN → InputParams
  55. final def isDefined(param: Param[_]): Boolean

    Permalink
    Definition Classes
    Params
  56. final def isInstanceOf[T0]: Boolean

    Permalink
    Definition Classes
    Any
  57. final def isSet(param: Param[_]): Boolean

    Permalink
    Definition Classes
    Params
  58. def isSharedHashSpace(p: HashingFunctionParams, numFeatures: Option[Int] = None): Boolean

    Permalink

    Determine if the transformer should use a shared hash space for all features or not

    Determine if the transformer should use a shared hash space for all features or not

    returns

    true if the shared hashing space is to be used, false otherwise

    Attributes
    protected
    Definition Classes
    HashingFun
  59. def isTraceEnabled(): Boolean

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  60. def log: Logger

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  61. def logDebug(msg: ⇒ String, throwable: Throwable): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  62. def logDebug(msg: ⇒ String): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  63. def logError(msg: ⇒ String, throwable: Throwable): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  64. def logError(msg: ⇒ String): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  65. def logInfo(msg: ⇒ String, throwable: Throwable): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  66. def logInfo(msg: ⇒ String): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  67. def logName: String

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  68. def logTrace(msg: ⇒ String, throwable: Throwable): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  69. def logTrace(msg: ⇒ String): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  70. def logWarning(msg: ⇒ String, throwable: Throwable): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  71. def logWarning(msg: ⇒ String): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    Logging
  72. def makeVectorColumnMetadata(features: Array[TransientFeature], params: HashingFunctionParams): Array[OpVectorColumnMetadata]

    Permalink
    Attributes
    protected
    Definition Classes
    HashingFun
  73. def makeVectorMetadata(features: Array[TransientFeature], params: HashingFunctionParams, outputName: String): OpVectorMetadata

    Permalink
    Attributes
    protected
    Definition Classes
    HashingFun
  74. final val minTokenLength: IntParam

    Permalink

    Minimum token length, >= 1.

    Minimum token length, >= 1.

    Definition Classes
    TextTokenizerParams
  75. final def ne(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  76. final def notify(): Unit

    Permalink
    Definition Classes
    AnyRef
  77. final def notifyAll(): Unit

    Permalink
    Definition Classes
    AnyRef
  78. val numFeatures: Int

    Permalink
  79. def onGetMetadata(): Unit

    Permalink
    Definition Classes
    TextMapHashingVectorizerModel → OpPipelineStageParams
  80. def onSetInput(): Unit

    Permalink
    Attributes
    protected
    Definition Classes
    OpPipelineStageBase
  81. val operationName: String

    Permalink
    Definition Classes
    SequenceModel → OpPipelineStageBase
  82. final def outputAsArray(out: OutputFeatures): Array[OPFeature]

    Permalink
    Definition Classes
    OpPipelineStage → OpPipelineStageBase
  83. def outputFeatureUid: String

    Permalink
    Attributes
    protected[com.salesforce.op]
    Definition Classes
    OpPipelineStageN → OpPipelineStage
  84. def outputIsResponse: Boolean

    Permalink
    Definition Classes
    OpPipelineStage
  85. lazy val params: Array[Param[_]]

    Permalink
    Definition Classes
    Params
  86. var parent: Estimator[SequenceModel[T, OPVector]]

    Permalink
    Definition Classes
    Model
  87. def prepare[T <: OPCollection](el: T, shouldHashWithIndex: Boolean, shouldPrependFeatureName: Boolean, featureNameHash: Int): Iterable[Any]

    Permalink

    Function that prepares the input columns to be hashed. Note that the Murmur3 hashing algorithm is only defined for primitive types, so tuples need to be converted to strings.

    Function that prepares the input columns to be hashed. Note that the Murmur3 hashing algorithm is only defined for primitive types, so tuples need to be converted to strings. MultiPickList sets are hashed as is, since there is no meaningful order in the selected choices. Lists and vectors can be hashed with or without their indices, since order may be important. Maps are hashed as (key,value) strings.

    el

    element we are hashing (eg. an OPList, OPMap, etc.)

    returns

    an Iterable object corresponding to the hashed element

    Attributes
    protected
    Definition Classes
    HashingFun
  88. def save(path: String): Unit

    Permalink
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  89. final def set(paramPair: ParamPair[_]): TextMapHashingVectorizerModel.this.type

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  90. final def set(param: String, value: Any): TextMapHashingVectorizerModel.this.type

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  91. final def set[T](param: Param[T], value: T): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    Params
  92. def setAutoDetectLanguage(value: Boolean): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    LanguageDetectionParams
  93. def setAutoDetectThreshold(value: Double): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    LanguageDetectionParams
  94. final def setDefault(paramPairs: ParamPair[_]*): TextMapHashingVectorizerModel.this.type

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  95. final def setDefault[T](param: Param[T], value: T): TextMapHashingVectorizerModel.this.type

    Permalink
    Attributes
    protected
    Definition Classes
    Params
  96. def setDefaultLanguage(value: Language): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    LanguageDetectionParams
  97. final def setInput(features: FeatureLike[T]*): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    OpPipelineStageN
  98. final def setInput(features: InputFeatures): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    OpPipelineStageBase
  99. final def setInputFeatures[S <: OPFeature](features: Array[S]): TextMapHashingVectorizerModel.this.type

    Permalink
    Attributes
    protected
    Definition Classes
    InputParams
  100. final def setMetadata(m: Metadata): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    OpPipelineStageParams
  101. def setMinTokenLength(value: Int): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    TextTokenizerParams
  102. def setOutputFeatureName(name: String): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    OpPipelineStage
  103. def setParent(parent: Estimator[SequenceModel[T, OPVector]]): SequenceModel[T, OPVector]

    Permalink
    Definition Classes
    Model
  104. def setToLowercase(value: Boolean): TextMapHashingVectorizerModel.this.type

    Permalink
    Definition Classes
    TextTokenizerParams
  105. val shouldPrependFeatureName: Boolean

    Permalink
  106. final def stageName: String

    Permalink
    Definition Classes
    OpPipelineStageBase
  107. final def synchronized[T0](arg0: ⇒ T0): T0

    Permalink
    Definition Classes
    AnyRef
  108. final val toLowercase: BooleanParam

    Permalink

    Indicates whether to convert all characters to lowercase before tokenizing.

    Indicates whether to convert all characters to lowercase before tokenizing.

    Definition Classes
    TextTokenizerParams
  109. def toString(): String

    Permalink
    Definition Classes
    Identifiable → AnyRef → Any
  110. def tokenize(text: Text, languageDetector: LanguageDetector = TextTokenizer.LanguageDetector, analyzer: TextAnalyzer = TextTokenizer.Analyzer): TextTokenizerResult

    Permalink
    Definition Classes
    TextTokenizerParams
  111. def transform(dataset: Dataset[_]): DataFrame

    Permalink
    Definition Classes
    OpTransformerN → Transformer
  112. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame

    Permalink
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  113. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame

    Permalink
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  114. def transformFn: (Seq[T]) ⇒ OPVector

    Permalink
    Definition Classes
    TextMapHashingVectorizerModel → OPMapVectorizerModel → OpTransformerN
  115. lazy val transformKeyValue: (KeyValue) ⇒ Any

    Permalink
    Definition Classes
    OpTransformerN → OpTransformer
  116. def transformMap: (Map[String, Any]) ⇒ Any

    Permalink
    Definition Classes
    OpTransformer
  117. def transformRow: (Row) ⇒ Any

    Permalink
    Definition Classes
    OpTransformer
  118. final def transformSchema(schema: StructType): StructType

    Permalink
    Definition Classes
    OpPipelineStageBase
  119. def transformSchema(schema: StructType, logging: Boolean): StructType

    Permalink
    Attributes
    protected
    Definition Classes
    PipelineStage
    Annotations
    @DeveloperApi()
  120. implicit val tti: scala.reflect.api.JavaUniverse.TypeTag[T]

    Permalink
    Definition Classes
    SequenceModel → OpTransformerN
  121. implicit val tto: scala.reflect.api.JavaUniverse.TypeTag[OPVector]

    Permalink
    Definition Classes
    SequenceModel → OpPipelineStageN
  122. implicit val ttov: scala.reflect.api.JavaUniverse.TypeTag[Value]

    Permalink
    Definition Classes
    SequenceModel → OpPipelineStageN
  123. val uid: String

    Permalink
    Definition Classes
    SequenceModel → Identifiable
  124. final def wait(): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  125. final def wait(arg0: Long, arg1: Int): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  126. final def wait(arg0: Long): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  127. final def write: MLWriter

    Permalink
    Definition Classes
    OpPipelineStageBase → MLWritable

Inherited from HashingFun

Inherited from TextTokenizerParams

Inherited from LanguageDetectionParams

Inherited from OPMapVectorizerModel[String, T]

Inherited from CleanTextMapFun

Inherited from CleanTextFun

Inherited from SequenceModel[T, OPVector]

Inherited from OpTransformerN[T, OPVector]

Inherited from OpTransformer

Inherited from OpPipelineStageN[T, OPVector]

Inherited from HasInN

Inherited from OpPipelineStage[OPVector]

Inherited from OpPipelineStageBase

Inherited from MLWritable

Inherited from OpPipelineStageParams

Inherited from InputParams

Inherited from Model[SequenceModel[T, OPVector]]

Inherited from Transformer

Inherited from PipelineStage

Inherited from Logging

Inherited from Params

Inherited from Serializable

Inherited from Serializable

Inherited from Identifiable

Inherited from AnyRef

Inherited from Any

Ungrouped