Class

com.databricks.labs.automl.sanitize

PearsonFiltering

Related Doc: package sanitize

Permalink

class PearsonFiltering extends DataValidation with SanitizerDefaults

Linear Supertypes
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. PearsonFiltering
  2. SanitizerDefaults
  3. DataValidation
  4. AnyRef
  5. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new PearsonFiltering(df: DataFrame, featureColumnListing: Array[String], modelType: String)

    Permalink

    df

    : DataFrame -> Dataset with a vectorized field of features, the feature columns, and a label column.

    featureColumnListing

    : Array[String] -> List of all fields that make up the feature vector.

    Usage:

        val autoFiltered = new PearsonFiltering(featurizedData, fields, modelType)
          .setLabelCol("label")
          .setFeaturesCol("features")
          .setFilterStatistic("pearsonStat")
          .setFilterDirection("greater")
          .setFilterMode("auto")
          .setAutoFilterNTile(0.5)
          .filterFields()

Value Members

  1. final def !=(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  4. def _allowableCardinalilties: List[String]

    Permalink
    Definition Classes
    DataValidation
  5. def _allowableCategoricalFilterModes: List[String]

    Permalink
    Definition Classes
    DataValidation
  6. def _allowableDateTimeConversions: List[String]

    Permalink
    Definition Classes
    DataValidation
  7. final val _allowedFilterDirections: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  8. final val _allowedFilterModes: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  9. final val _allowedStats: Array[String]

    Permalink

    Pearson Defaults

    Pearson Defaults

    Definition Classes
    SanitizerDefaults
  10. final val allowableScalers: Array[String]

    Permalink

    Scaler Defaults

    Scaler Defaults

    Definition Classes
    SanitizerDefaults
  11. final def asInstanceOf[T0]: T0

    Permalink
    Definition Classes
    Any
  12. def clone(): AnyRef

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  13. def convertDateAndTime(df: DataFrame, dateFields: List[String], timeFields: List[String], mode: String): (DataFrame, List[String])

    Permalink
    Definition Classes
    DataValidation
  14. def defaultFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  15. def defaultLabelCol: String

    Permalink

    Global Defaults

    Global Defaults

    Definition Classes
    SanitizerDefaults
  16. def defaultPNorm: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  17. def defaultPearsonAutoFilterNTile: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  18. def defaultPearsonFilterDirection: String

    Permalink
    Definition Classes
    SanitizerDefaults
  19. def defaultPearsonFilterManualValue: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  20. def defaultPearsonFilterMode: String

    Permalink
    Definition Classes
    SanitizerDefaults
  21. def defaultPearsonFilterStatistic: String

    Permalink
    Definition Classes
    SanitizerDefaults
  22. def defaultRenamedFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  23. def defaultScalerMax: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  24. def defaultScalerMin: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  25. def defaultScalerType: String

    Permalink
    Definition Classes
    SanitizerDefaults
  26. def defaultStandardScalerMeanFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  27. def defaultStandardScalerStdDevFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  28. final def eq(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  29. def equals(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  30. def filterFields(ignoreFields: Array[String] = Array.empty[String]): DataFrame

    Permalink

    Main entry point for Pearson Filtering

    Main entry point for Pearson Filtering

    ignoreFields

    Fields to exclude from Pearson filtering; these fields are not evaluated by the filter.

  31. def finalize(): Unit

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  32. def generateAssembly(numericColumns: List[String], characterColumns: List[String], featureCol: String): (Array[StringIndexer], Array[String], VectorAssembler)

    Permalink
    Definition Classes
    DataValidation
  33. def getAutoFilterNTile: Double

    Permalink
  34. final def getClass(): Class[_]

    Permalink
    Definition Classes
    AnyRef → Any
  35. def getFeaturesCol: String

    Permalink
  36. def getFilterDirection: String

    Permalink
  37. def getFilterManualValue: Double

    Permalink
  38. def getFilterMode: String

    Permalink
  39. def getFilterStatistic: String

    Permalink
  40. def getLabelCol: String

    Permalink
  41. def getParallelism: Int

    Permalink
  42. def hashCode(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  43. def indexStrings(categoricalFields: List[String]): (Array[StringIndexer], Array[String])

    Permalink
    Definition Classes
    DataValidation
  44. def invalidateSelection(value: String, allowances: Seq[String]): String

    Permalink
    Definition Classes
    DataValidation
  45. final def isInstanceOf[T0]: Boolean

    Permalink
    Definition Classes
    Any
  46. final def ne(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  47. final def notify(): Unit

    Permalink
    Definition Classes
    AnyRef
  48. final def notifyAll(): Unit

    Permalink
    Definition Classes
    AnyRef
  49. def oneHotEncodeStrings(stringIndexedFields: List[String]): (OneHotEncoderEstimator, Array[String])

    Permalink
    Definition Classes
    DataValidation
  50. def setAutoFilterNTile(value: Double): PearsonFiltering.this.type

    Permalink
  51. def setFeaturesCol(value: String): PearsonFiltering.this.type

    Permalink
  52. def setFilterDirection(value: String): PearsonFiltering.this.type

    Permalink
  53. def setFilterManualValue(value: Int): PearsonFiltering.this.type

    Permalink
  54. def setFilterManualValue(value: Double): PearsonFiltering.this.type

    Permalink
  55. def setFilterMode(value: String): PearsonFiltering.this.type

    Permalink
  56. def setFilterStatistic(value: String): PearsonFiltering.this.type

    Permalink
  57. def setLabelCol(value: String): PearsonFiltering.this.type

    Permalink
  58. def setParallelism(value: Int): PearsonFiltering.this.type

    Permalink
  59. final def synchronized[T0](arg0: ⇒ T0): T0

    Permalink
    Definition Classes
    AnyRef
  60. def toString(): String

    Permalink
    Definition Classes
    AnyRef → Any
  61. def validateCardinality(df: DataFrame, stringFields: List[String], cardinalityLimit: Int = 500, parallelism: Int = 20): ValidatedCategoricalFields

    Permalink
    Definition Classes
    DataValidation
  62. def validateFieldPresence(df: DataFrame, column: String): Unit

    Permalink
    Definition Classes
    DataValidation
  63. def validateInputDataframe(df: DataFrame): Unit

    Permalink
    Definition Classes
    DataValidation
  64. def validateLabelAndFeatures(df: DataFrame, labelCol: String, featureCol: String): Unit

    Permalink
    Definition Classes
    DataValidation
  65. final def wait(): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  66. final def wait(arg0: Long, arg1: Int): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  67. final def wait(arg0: Long): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )

Inherited from SanitizerDefaults

Inherited from DataValidation

Inherited from AnyRef

Inherited from Any

Ungrouped