Class

com.databricks.labs.automl.inference

InferencePipeline

Related Doc: package inference

Permalink

class InferencePipeline extends AutomationConfig with AutomationTools with DataValidation with InferenceTools

Linear Supertypes
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. InferencePipeline
  2. InferenceTools
  3. DataValidation
  4. AutomationTools
  5. SparkSessionWrapper
  6. Serializable
  7. Serializable
  8. AutomationConfig
  9. SanitizerDefaults
  10. Defaults
  11. AnyRef
  12. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new InferencePipeline(df: DataFrame)

    Permalink

Value Members

  1. final def !=(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  4. def _allowableCardinalilties: List[String]

    Permalink
    Definition Classes
    DataValidation
  5. def _allowableCategoricalFilterModes: List[String]

    Permalink
    Definition Classes
    DataValidation
  6. def _allowableDateTimeConversions: List[String]

    Permalink
    Definition Classes
    DataValidation
  7. final val _allowableEvolutionStrategies: List[String]

    Permalink
    Definition Classes
    Defaults
  8. final val _allowableInitialGenerationIndexMixingModes: List[String]

    Permalink
    Definition Classes
    Defaults
  9. final val _allowableInitialGenerationModes: List[String]

    Permalink
    Definition Classes
    Defaults
  10. final val _allowableMlFlowLoggingModes: List[String]

    Permalink
    Definition Classes
    Defaults
  11. final val _allowableNAFillModes: List[String]

    Permalink
    Definition Classes
    Defaults
  12. final val _allowedFilterDirections: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  13. final val _allowedFilterModes: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  14. final val _allowedStats: Array[String]

    Permalink

    Pearson Defaults

    Pearson Defaults

    Definition Classes
    SanitizerDefaults
  15. var _autoStoppingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  16. var _autoStoppingScore: Double

    Permalink
    Definition Classes
    AutomationConfig
  17. var _cardinalityCheckMode: String

    Permalink
    Definition Classes
    AutomationConfig
  18. var _cardinalityLimit: Int

    Permalink
    Definition Classes
    AutomationConfig
  19. var _cardinalityPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  20. var _cardinalitySwitchFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  21. var _cardinalityThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  22. var _cardinalityType: String

    Permalink
    Definition Classes
    AutomationConfig
  23. var _categoricalNAFillMap: Map[String, String]

    Permalink
    Definition Classes
    AutomationConfig
  24. var _characterFillStat: String

    Permalink
    Definition Classes
    AutomationConfig
  25. var _characterNABlanketFillValue: String

    Permalink
    Definition Classes
    AutomationConfig
  26. var _continuousDataThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  27. var _continuousEvolutionGeneticMixing: Double

    Permalink
    Definition Classes
    AutomationConfig
  28. var _continuousEvolutionImprovementThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  29. var _continuousEvolutionMaxIterations: Int

    Permalink
    Definition Classes
    AutomationConfig
  30. var _continuousEvolutionMutationAggressiveness: Int

    Permalink
    Definition Classes
    AutomationConfig
  31. var _continuousEvolutionParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  32. var _continuousEvolutionRollingImprovementCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  33. var _continuousEvolutionStoppingScore: Double

    Permalink
    Definition Classes
    AutomationConfig
  34. var _correlationCutoffHigh: Double

    Permalink
    Definition Classes
    AutomationConfig
  35. var _correlationCutoffLow: Double

    Permalink
    Definition Classes
    AutomationConfig
  36. var _covarianceConfig: CovarianceConfig

    Permalink
    Definition Classes
    AutomationConfig
  37. def _covarianceConfigDefaults: CovarianceConfig

    Permalink
    Definition Classes
    Defaults
  38. var _covarianceFilterFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  39. var _dataPrepCachingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  40. def _dataPrepConfigDefaults: DataPrepConfig

    Permalink
    Definition Classes
    Defaults
  41. var _dataPrepParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  42. var _dataReductionFactor: Double

    Permalink
    Definition Classes
    AutomationConfig
  43. var _dateTimeConversionType: String

    Permalink
    Definition Classes
    AutomationConfig
  44. def _defaultAutoStoppingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  45. def _defaultAutoStoppingScore: Double

    Permalink
    Definition Classes
    Defaults
  46. def _defaultCovarianceFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  47. def _defaultDataPrepCachingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  48. def _defaultDataPrepParallelism: Int

    Permalink
    Definition Classes
    Defaults
  49. def _defaultDataReductionFactor: Double

    Permalink
    Definition Classes
    Defaults
  50. def _defaultDateTimeConversionType: String

    Permalink
    Definition Classes
    Defaults
  51. def _defaultFeatureImportanceCutoffType: String

    Permalink
    Definition Classes
    Defaults
  52. def _defaultFeatureImportanceCutoffValue: Double

    Permalink
    Definition Classes
    Defaults
  53. def _defaultFeatureInteractionConfig: params.FeatureInteractionConfig

    Permalink
    Definition Classes
    Defaults
  54. def _defaultFeatureInteractionFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  55. def _defaultFeaturesCol: String

    Permalink
    Definition Classes
    Defaults
  56. def _defaultFieldsToIgnoreInVector: Array[String]

    Permalink
    Definition Classes
    Defaults
  57. def _defaultFirstGenerationConfig: FirstGenerationConfig

    Permalink
    Definition Classes
    Defaults
  58. def _defaultHyperSpaceInference: Boolean

    Permalink
    Definition Classes
    Defaults
  59. def _defaultHyperSpaceInferenceCount: Int

    Permalink
    Definition Classes
    Defaults
  60. def _defaultHyperSpaceModelCount: Int

    Permalink
    Definition Classes
    Defaults
  61. def _defaultHyperSpaceModelType: String

    Permalink
    Definition Classes
    Defaults
  62. def _defaultInitialGenerationMode: String

    Permalink
    Definition Classes
    Defaults
  63. def _defaultKSampleConfig: KSampleConfig

    Permalink
    Definition Classes
    Defaults
  64. def _defaultLabelCol: String

    Permalink
    Definition Classes
    Defaults
  65. def _defaultMlFlowArtifactsFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  66. def _defaultMlFlowLoggingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  67. def _defaultModelingFamily: String

    Permalink
    Definition Classes
    Defaults
  68. def _defaultNAFillFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  69. def _defaultOneHotEncodeFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  70. def _defaultOutlierFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  71. def _defaultPearsonFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  72. def _defaultPipelineDebugFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  73. def _defaultPipelineId: String

    Permalink
    Definition Classes
    Defaults
  74. def _defaultScalingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  75. def _defaultVarianceFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  76. var _deltaCacheBackingDirectory: String

    Permalink
    Definition Classes
    AutomationConfig
  77. var _deltaCacheBackingDirectoryRemovalFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  78. var _evolutionStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  79. var _featureImportanceCutoffType: String

    Permalink
    Definition Classes
    AutomationConfig
  80. var _featureImportanceCutoffValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  81. var _featureImportancesConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  82. def _featureImportancesDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  83. var _featureInteractionConfig: params.FeatureInteractionConfig

    Permalink
    Definition Classes
    AutomationConfig
  84. var _featureInteractionContinuousDiscretizerBucketCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  85. var _featureInteractionFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  86. var _featureInteractionParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  87. var _featureInteractionRetentionMode: String

    Permalink
    Definition Classes
    AutomationConfig
  88. var _featureInteractionTargetInteractionPercentage: Double

    Permalink
    Definition Classes
    AutomationConfig
  89. var _featuresCol: String

    Permalink
    Definition Classes
    AutomationConfig
  90. var _fieldsToIgnore: Array[String]

    Permalink
    Definition Classes
    AutomationConfig
  91. var _fieldsToIgnoreInVector: Array[String]

    Permalink
    Definition Classes
    AutomationConfig
  92. var _fillConfig: FillConfig

    Permalink
    Definition Classes
    AutomationConfig
  93. def _fillConfigDefaults: FillConfig

    Permalink
    Definition Classes
    Defaults
  94. var _filterBounds: String

    Permalink
    Definition Classes
    AutomationConfig
  95. var _filterPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  96. var _firstGenerationArraySeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  97. var _firstGenerationConfig: FirstGenerationConfig

    Permalink
    Definition Classes
    AutomationConfig
  98. var _firstGenerationGenePool: Int

    Permalink
    Definition Classes
    AutomationConfig
  99. var _firstGenerationIndexMixingMode: String

    Permalink
    Definition Classes
    AutomationConfig
  100. var _firstGenerationMode: String

    Permalink
    Definition Classes
    AutomationConfig
  101. var _firstGenerationPermutationCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  102. var _fixedMutationValue: Int

    Permalink
    Definition Classes
    AutomationConfig
  103. def _gbtDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  104. def _gbtDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  105. var _generationalMutationStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  106. var _geneticConfig: GeneticConfig

    Permalink
    Definition Classes
    AutomationConfig
  107. var _geneticMBOCandidateFactor: Int

    Permalink
    Definition Classes
    AutomationConfig
  108. var _geneticMBORegressorType: String

    Permalink
    Definition Classes
    AutomationConfig
  109. var _geneticMixing: Double

    Permalink
    Definition Classes
    AutomationConfig
  110. def _geneticTunerDefaults: GeneticConfig

    Permalink
    Definition Classes
    Defaults
  111. var _hyperSpaceInference: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  112. var _hyperSpaceInferenceCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  113. var _hyperSpaceModelCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  114. var _hyperSpaceModelType: String

    Permalink
    Definition Classes
    AutomationConfig
  115. var _inferenceConfigSaveLocation: String

    Permalink
    Definition Classes
    AutomationConfig
  116. def _inferenceConfigSaveLocationDefault: String

    Permalink
    Definition Classes
    Defaults
  117. var _kFold: Int

    Permalink
    Definition Classes
    AutomationConfig
  118. var _kGroups: Int

    Permalink
    Definition Classes
    AutomationConfig
  119. var _kMeansDistanceMeasurement: String

    Permalink
    Definition Classes
    AutomationConfig
  120. var _kMeansMaxIter: Int

    Permalink
    Definition Classes
    AutomationConfig
  121. var _kMeansPredictionCol: String

    Permalink
    Definition Classes
    AutomationConfig
  122. var _kMeansSeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  123. var _kMeansTolerance: Double

    Permalink
    Definition Classes
    AutomationConfig
  124. var _kSampleConfig: KSampleConfig

    Permalink
    Definition Classes
    AutomationConfig
  125. var _labelBalanceMode: String

    Permalink
    Definition Classes
    AutomationConfig
  126. var _labelCol: String

    Permalink
    Definition Classes
    AutomationConfig
  127. def _lightGBMDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  128. def _lightGBMDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  129. def _linearRegressionDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  130. def _linearRegressionDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  131. def _logisticRegressionDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  132. def _logisticRegressionDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  133. var _lowerFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  134. var _lshHashTables: Int

    Permalink
    Definition Classes
    AutomationConfig
  135. var _lshOutputCol: String

    Permalink
    Definition Classes
    AutomationConfig
  136. var _lshSeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  137. var _mainConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  138. def _mainConfigDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  139. var _minimumVectorCountToMutate: Int

    Permalink
    Definition Classes
    AutomationConfig
  140. var _mlFlowAPIToken: String

    Permalink
    Definition Classes
    AutomationConfig
  141. var _mlFlowArtifactsFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  142. var _mlFlowBestSuffix: String

    Permalink
    Definition Classes
    AutomationConfig
  143. var _mlFlowConfig: MLFlowConfig

    Permalink
    Definition Classes
    AutomationConfig
  144. def _mlFlowConfigDefaults: MLFlowConfig

    Permalink
    Definition Classes
    Defaults
  145. var _mlFlowCustomRunTags: Map[String, String]

    Permalink
    Definition Classes
    AutomationConfig
  146. var _mlFlowExperimentName: String

    Permalink
    Definition Classes
    AutomationConfig
  147. var _mlFlowLoggingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  148. var _mlFlowLoggingMode: String

    Permalink
    Definition Classes
    AutomationConfig
  149. var _mlFlowModelSaveDirectory: String

    Permalink
    Definition Classes
    AutomationConfig
  150. var _mlFlowTrackingURI: String

    Permalink
    Definition Classes
    AutomationConfig
  151. def _mlpcDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  152. def _mlpcDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  153. var _modelSeedMap: Map[String, Any]

    Permalink
    Definition Classes
    AutomationConfig
  154. var _modelSeedSetStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  155. var _modelSelectionDistinctThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  156. def _modelTypeDefault: String

    Permalink
    Definition Classes
    Defaults
  157. var _modelingFamily: String

    Permalink
    Definition Classes
    AutomationConfig
  158. var _mutationMagnitudeMode: String

    Permalink
    Definition Classes
    AutomationConfig
  159. var _mutationMode: String

    Permalink
    Definition Classes
    AutomationConfig
  160. var _mutationValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  161. var _naFillFilterPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  162. var _naFillFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  163. var _naFillMode: String

    Permalink
    Definition Classes
    AutomationConfig
  164. def _naiveBayesDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  165. def _naiveBayesDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  166. var _numberOfGenerations: Int

    Permalink
    Definition Classes
    AutomationConfig
  167. var _numberOfMutationsPerGeneration: Int

    Permalink
    Definition Classes
    AutomationConfig
  168. var _numberOfParentsToRetain: Int

    Permalink
    Definition Classes
    AutomationConfig
  169. var _numericBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    AutomationConfig
  170. var _numericFillStat: String

    Permalink
    Definition Classes
    AutomationConfig
  171. var _numericNABlanketFillValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  172. var _numericNAFillMap: Map[String, AnyVal]

    Permalink
    Definition Classes
    AutomationConfig
  173. var _numericRatio: Double

    Permalink
    Definition Classes
    AutomationConfig
  174. var _numericTarget: Int

    Permalink
    Definition Classes
    AutomationConfig
  175. var _oneHotEncodeFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  176. var _outlierConfig: OutlierConfig

    Permalink
    Definition Classes
    AutomationConfig
  177. def _outlierConfigDefaults: OutlierConfig

    Permalink
    Definition Classes
    Defaults
  178. var _outlierFilterFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  179. var _outputDfRepartitionScaleFactor: Int

    Permalink
    Definition Classes
    AutomationConfig
  180. var _pNorm: Double

    Permalink
    Definition Classes
    AutomationConfig
  181. var _parallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  182. var _pearsonAutoFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  183. var _pearsonConfig: PearsonConfig

    Permalink
    Definition Classes
    AutomationConfig
  184. def _pearsonConfigDefaults: PearsonConfig

    Permalink
    Definition Classes
    Defaults
  185. var _pearsonFilterDirection: String

    Permalink
    Definition Classes
    AutomationConfig
  186. var _pearsonFilterFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  187. var _pearsonFilterManualValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  188. var _pearsonFilterMode: String

    Permalink
    Definition Classes
    AutomationConfig
  189. var _pearsonFilterStatistic: String

    Permalink
    Definition Classes
    AutomationConfig
  190. var _pipelineDebugFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  191. var _pipelineId: String

    Permalink
    Definition Classes
    AutomationConfig
  192. var _quorumCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  193. def _rfDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  194. def _rfDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  195. var _scalerMax: Double

    Permalink
    Definition Classes
    AutomationConfig
  196. var _scalerMin: Double

    Permalink
    Definition Classes
    AutomationConfig
  197. var _scalerType: String

    Permalink
    Definition Classes
    AutomationConfig
  198. var _scalingConfig: ScalingConfig

    Permalink
    Definition Classes
    AutomationConfig
  199. def _scalingConfigDefaults: ScalingConfig

    Permalink
    Definition Classes
    Defaults
  200. var _scalingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  201. def _scoringDefaultClassifier: String

    Permalink
    Definition Classes
    Defaults
  202. def _scoringDefaultRegressor: String

    Permalink
    Definition Classes
    Defaults
  203. var _scoringMetric: String

    Permalink
    Definition Classes
    AutomationConfig
  204. var _scoringOptimizationStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  205. def _scoringOptimizationStrategyClassifier: String

    Permalink
    Definition Classes
    Defaults
  206. def _scoringOptimizationStrategyRegressor: String

    Permalink
    Definition Classes
    Defaults
  207. var _seed: Long

    Permalink
    Definition Classes
    AutomationConfig
  208. var _splitCachingStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  209. var _standardScalerMeanFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  210. var _standardScalerStdDevFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  211. var _stringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    AutomationConfig
  212. final val _supportedFeatureImportanceCutoffTypes: List[String]

    Permalink
    Definition Classes
    Defaults
  213. final val _supportedModels: Array[String]

    Permalink
    Definition Classes
    Defaults
  214. def _svmDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  215. def _svmDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  216. var _syntheticCol: String

    Permalink
    Definition Classes
    AutomationConfig
  217. var _trainPortion: Double

    Permalink
    Definition Classes
    AutomationConfig
  218. var _trainSplitChronologicalColumn: String

    Permalink
    Definition Classes
    AutomationConfig
  219. var _trainSplitChronologicalRandomPercentage: Double

    Permalink
    Definition Classes
    AutomationConfig
  220. var _trainSplitColumnSet: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  221. var _trainSplitMethod: String

    Permalink
    Definition Classes
    AutomationConfig
  222. def _treeSplitDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  223. var _treeSplitsConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  224. def _treesDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  225. def _treesDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  226. var _upperFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  227. var _varianceFilterFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  228. var _vectorMutationMethod: String

    Permalink
    Definition Classes
    AutomationConfig
  229. def _xgboostDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  230. final val allowableCardinalilties: List[String]

    Permalink
    Definition Classes
    Defaults
  231. final val allowableCategoricalFilterModes: List[String]

    Permalink
    Definition Classes
    Defaults
  232. final val allowableDateTimeConversions: List[String]

    Permalink
    Definition Classes
    Defaults
  233. final val allowableFeatureInteractionModes: List[String]

    Permalink
    Definition Classes
    Defaults
  234. final val allowableKMeansDistanceMeasurements: List[String]

    Permalink
    Definition Classes
    Defaults
  235. final val allowableLabelBalanceModes: List[String]

    Permalink
    Definition Classes
    Defaults
  236. final val allowableMBORegressorTypes: List[String]

    Permalink
    Definition Classes
    Defaults
  237. final val allowableMutationModes: List[String]

    Permalink
    Definition Classes
    Defaults
  238. final val allowableScalers: Array[String]

    Permalink

    Scaler Defaults

    Scaler Defaults

    Definition Classes
    SanitizerDefaults
  239. final val allowableVectorMutationMethods: List[String]

    Permalink
    Definition Classes
    Defaults
  240. final def asInstanceOf[T0]: T0

    Permalink
    Definition Classes
    Any
  241. def autoStoppingOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  242. def autoStoppingOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  243. def cardinalitySwitchOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  244. def cardinalitySwitchOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  245. def clone(): AnyRef

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.CloneNotSupportedException] )
  246. def convertDateAndTime(df: DataFrame, dateFields: List[String], timeFields: List[String], mode: String): (DataFrame, List[String])

    Permalink
    Definition Classes
    DataValidation
  247. def convertInferenceConfigToDataFrame(config: InferenceMainConfig): DataFrame

    Permalink

    Converting the config to a DataFrame may seem counter-intuitive, but it allows for cloud-agnostic storage of the config.

    Converting the config to a DataFrame may seem counter-intuitive, but it allows for cloud-agnostic storage of the config. Otherwise, additional configuration would be needed to track which cloud the pipeline is operating on and to handle that cloud's native SDK object writers. Instead of re-inventing the wheel here, a DataFrame can be serialized to any cloud-native storage medium with very little difficulty.

    config

    The inference configuration generated for a particular modeling run

    returns

    A DataFrame consisting of a single row and a single field. Cell 1:1 (first row, first column) contains the JSON string.

    Definition Classes
    InferenceTools
  248. def convertInferenceConfigToJson(config: InferenceMainConfig): InferenceJsonReturn

    Permalink

    Handler method for converting the InferenceMainConfig object to a serializable JSON string with correct Scala-compatible data structures.

    Handler method for converting the InferenceMainConfig object to a serializable JSON string with correct Scala-compatible data structures.

    config

    instance of InferenceMainConfig

    returns

    [InferenceJsonReturn] consisting of a compact form (for logging) and a pretty-printed form (human readable)

    Definition Classes
    InferenceTools
  249. def convertJsonConfigToClass(jsonConfig: String): InferenceMainConfig

    Permalink

    Handler method for converting a read-in JSON config String to an instance of InferenceMainConfig

    Handler method for converting a read-in JSON config String to an instance of InferenceMainConfig

    jsonConfig

    the config as a JSON-formatted String

    returns

    the config as an instance of InferenceMainConfig

    Definition Classes
    InferenceTools
  250. def convertMainConfigToJson(config: MainConfig): MainJsonReturn

    Permalink
    Definition Classes
    InferenceTools
  251. def covarianceFilterOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  252. def covarianceFilterOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  253. def createInferencePayload(dataFrame: DataFrame, modelingColumnsPayload: Array[String], allColumnsPayload: Array[String]): InferencePayload

    Permalink

    Definition Classes
    InferenceTools
  254. def dataPersist(preDF: DataFrame, postDF: DataFrame, cacheLevel: StorageLevel, blockUnpersist: Boolean): (DataFrame, String)

    Permalink
    Definition Classes
    AutomationTools
  255. def dataPrepCachingOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  256. def dataPrepCachingOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  257. def defaultFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  258. def defaultLabelCol: String

    Permalink

    Global Defaults

    Global Defaults

    Definition Classes
    SanitizerDefaults
  259. def defaultPNorm: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  260. def defaultPearsonAutoFilterNTile: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  261. def defaultPearsonFilterDirection: String

    Permalink
    Definition Classes
    SanitizerDefaults
  262. def defaultPearsonFilterManualValue: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  263. def defaultPearsonFilterMode: String

    Permalink
    Definition Classes
    SanitizerDefaults
  264. def defaultPearsonFilterStatistic: String

    Permalink
    Definition Classes
    SanitizerDefaults
  265. def defaultRenamedFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  266. def defaultScalerMax: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  267. def defaultScalerMin: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  268. def defaultScalerType: String

    Permalink
    Definition Classes
    SanitizerDefaults
  269. def defaultStandardScalerMeanFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  270. def defaultStandardScalerStdDevFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  271. def deltaCheckBackingDirectoryRemovalOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  272. def deltaCheckBackingDirectoryRemovalOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  273. final def eq(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  274. def equals(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  275. def extractGenerationData(payload: Array[GenericModelReturn]): Map[Int, (Double, Double)]

    Permalink
    Definition Classes
    AutomationTools
  276. def extractGenerationalScores(payload: Array[GenericModelReturn], scoringOptimizationStrategy: String, modelFamily: String, modelType: String): Array[GenerationalReport]

    Permalink
    Definition Classes
    AutomationTools
  277. def extractInferenceConfigFromDataFrame(configDataFrame: DataFrame): InferenceMainConfig

    Permalink

    Extract the InferenceMainConfig from a stored DataFrame containing the string-encoded JSON in row 1, column 1

    Extract the InferenceMainConfig from a stored DataFrame containing the string-encoded JSON in row 1, column 1

    configDataFrame

    A DataFrame that contains the configuration for the Inference run.

    returns

    an instance of InferenceMainConfig

    Definition Classes
    InferenceTools
  278. def extractInferenceJsonFromDataFrame(configDataFrame: DataFrame): String

    Permalink

    From a supplied DataFrame that contains the configuration in cell 1:1 (row 1, column 1), get the JSON string

    From a supplied DataFrame that contains the configuration in cell 1:1 (row 1, column 1), get the JSON string

    configDataFrame

    A Dataframe that contains the configuration for the Inference run.

    returns

    The string-encoded json payload for InferenceMainConfig

    Definition Classes
    InferenceTools
  279. def extractMLPCPayload(payload: MLPCConfig): Map[String, Any]

    Permalink
    Definition Classes
    AutomationTools
  280. def extractPayload(cc: Product): Map[String, Any]

    Permalink
    Definition Classes
    AutomationTools
  281. def featureInteractionOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  282. def featureInteractionOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  283. def fieldRemovalCompare(preFilterFields: Array[String], postFilterFields: Array[String]): List[String]

    Permalink
    Definition Classes
    AutomationTools
  284. def finalize(): Unit

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  285. def generateAssembly(numericColumns: List[String], characterColumns: List[String], featureCol: String): (Array[StringIndexer], Array[String], VectorAssembler)

    Permalink
    Definition Classes
    DataValidation
  286. def generationDataFrameReport(generationalData: Array[GenerationalReport], sortingStrategy: String): DataFrame

    Permalink
    Definition Classes
    AutomationTools
  287. def getAutoStoppingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  288. def getAutoStoppingScore: Double

    Permalink
    Definition Classes
    AutomationConfig
  289. def getCardinalityCheckMode: String

    Permalink
    Definition Classes
    AutomationConfig
  290. def getCardinalityLimit: Int

    Permalink
    Definition Classes
    AutomationConfig
  291. def getCardinalityPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  292. def getCardinalitySwitch: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  293. def getCardinalityType: String

    Permalink
    Definition Classes
    AutomationConfig
  294. def getCategoricalNAFillMap: Map[String, String]

    Permalink
    Definition Classes
    AutomationConfig
  295. def getCharacterFillStat: String

    Permalink
    Definition Classes
    AutomationConfig
  296. def getCharacterNABlanketFillValue: String

    Permalink
    Definition Classes
    AutomationConfig
  297. final def getClass(): Class[_]

    Permalink
    Definition Classes
    AnyRef → Any
  298. def getContinuousDataThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  299. def getContinuousEvolutionGeneticMixing: Double

    Permalink
    Definition Classes
    AutomationConfig
  300. def getContinuousEvolutionMaxIterations: Int

    Permalink
    Definition Classes
    AutomationConfig
  301. def getContinuousEvolutionMutationAggressiveness: Int

    Permalink
    Definition Classes
    AutomationConfig
  302. def getContinuousEvolutionParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  303. def getContinuousEvolutionRollingImporvementCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  304. def getContinuousEvolutionStoppingScore: Double

    Permalink
    Definition Classes
    AutomationConfig
  305. def getCorrelationCutoffHigh: Double

    Permalink
    Definition Classes
    AutomationConfig
  306. def getCorrelationCutoffLow: Double

    Permalink
    Definition Classes
    AutomationConfig
  307. def getCovarianceConfig: CovarianceConfig

    Permalink
    Definition Classes
    AutomationConfig
  308. def getCovarianceFilterStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  309. def getDataPrepCachingStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  310. def getDataPrepParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  311. def getDataReductionFactor: Double

    Permalink
    Definition Classes
    AutomationConfig
  312. def getDateTimeConversionType: String

    Permalink
    Definition Classes
    AutomationConfig
  313. def getDeltaCacheBackingDirectory: String

    Permalink
    Definition Classes
    AutomationConfig
  314. def getDeltaCacheBackingDirectoryRemovalFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  315. def getEvolutionStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  316. def getFeatConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  317. def getFeatureImportanceCutoffType: String

    Permalink
    Definition Classes
    AutomationConfig
  318. def getFeatureImportanceCutoffValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  319. def getFeatureInteractionConfig: params.FeatureInteractionConfig

    Permalink
    Definition Classes
    AutomationConfig
  320. def getFeatureInteractionContinuousDiscretizerBucketCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  321. def getFeatureInteractionParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  322. def getFeatureInteractionRetentionMode: String

    Permalink
    Definition Classes
    AutomationConfig
  323. def getFeatureInteractionStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  324. def getFeatureInteractionTargetInteractionPercentage: Double

    Permalink
    Definition Classes
    AutomationConfig
  325. def getFeaturesCol: String

    Permalink
    Definition Classes
    AutomationConfig
  326. def getFieldsToIgnore: Array[String]

    Permalink
    Definition Classes
    AutomationConfig
  327. def getFieldsToIgnoreInVector: Array[String]

    Permalink
    Definition Classes
    AutomationConfig
  328. def getFillConfig: FillConfig

    Permalink
    Definition Classes
    AutomationConfig
  329. def getFilterBounds: String

    Permalink
    Definition Classes
    AutomationConfig
  330. def getFilterPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  331. def getFirstGenerationArraySeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  332. def getFirstGenerationConfig: FirstGenerationConfig

    Permalink
    Definition Classes
    AutomationConfig
  333. def getFirstGenerationGenePool: Int

    Permalink
    Definition Classes
    AutomationConfig
  334. def getFirstGenerationIndexMixingMode: String

    Permalink
    Definition Classes
    AutomationConfig
  335. def getFirstGenerationMode: String

    Permalink
    Definition Classes
    AutomationConfig
  336. def getFirstGenerationPermutationCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  337. def getFixedMutationValue: Int

    Permalink
    Definition Classes
    AutomationConfig
  338. def getGenerationalMutationStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  339. def getGeneticConfig: GeneticConfig

    Permalink
    Definition Classes
    AutomationConfig
  340. def getGeneticMixing: Double

    Permalink
    Definition Classes
    AutomationConfig
  341. def getHyperSpaceInferenceCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  342. def getHyperSpaceInferenceStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  343. def getHyperSpaceModelCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  344. def getHyperSpaceModelType: String

    Permalink
    Definition Classes
    AutomationConfig
  345. def getInferenceConfig: InferenceMainConfig

    Permalink
  346. def getInferenceConfigSaveLocation: String

    Permalink
    Definition Classes
    AutomationConfig
  347. def getKFold: Int

    Permalink
    Definition Classes
    AutomationConfig
  348. def getKGroups: Int

    Permalink
    Definition Classes
    AutomationConfig
  349. def getKMeansDistanceMeasurement: String

    Permalink
    Definition Classes
    AutomationConfig
  350. def getKMeansMaxIter: Int

    Permalink
    Definition Classes
    AutomationConfig
  351. def getKMeansPredictionCol: String

    Permalink
    Definition Classes
    AutomationConfig
  352. def getKMeansSeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  353. def getKMeansTolerance: Double

    Permalink
    Definition Classes
    AutomationConfig
  354. def getKSampleConfig: KSampleConfig

    Permalink
    Definition Classes
    AutomationConfig
  355. def getLSHHashTables: Int

    Permalink
    Definition Classes
    AutomationConfig
  356. def getLSHOutputCol: String

    Permalink
    Definition Classes
    AutomationConfig
  357. def getLabelCol: String

    Permalink
    Definition Classes
    AutomationConfig
  358. def getLowerFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  359. def getMainConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  360. def getMinimumVectorCountToMutate: Int

    Permalink
    Definition Classes
    AutomationConfig
  361. def getMlFlowBestSuffix: String

    Permalink
    Definition Classes
    AutomationConfig
  362. def getMlFlowConfig: MLFlowConfig

    Permalink
    Definition Classes
    AutomationConfig
  363. def getMlFlowCustomRunTags: Map[String, String]

    Permalink
    Definition Classes
    AutomationConfig
  364. def getMlFlowExperimentName: String

    Permalink
    Definition Classes
    AutomationConfig
  365. def getMlFlowLogArtifactsFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  366. def getMlFlowLoggingFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  367. def getMlFlowLoggingMode: String

    Permalink
    Definition Classes
    AutomationConfig
  368. def getMlFlowModelSaveDirectory: String

    Permalink
    Definition Classes
    AutomationConfig
  369. def getMlFlowTrackingURI: String

    Permalink
    Definition Classes
    AutomationConfig
  370. def getModelSeedMap: Map[String, Any]

    Permalink
    Definition Classes
    AutomationConfig
  371. def getModelSeedSetStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  372. def getModelSelectionDistinctThreshold: Int

    Permalink
    Definition Classes
    AutomationConfig
  373. def getModelingFamily: String

    Permalink
    Definition Classes
    AutomationConfig
  374. def getMutationMagnitudeMode: String

    Permalink
    Definition Classes
    AutomationConfig
  375. def getMutationMode: String

    Permalink
    Definition Classes
    AutomationConfig
  376. def getMutationValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  377. def getNAFillFilterPrecision: Double

    Permalink
    Definition Classes
    AutomationConfig
  378. def getNAFillMode: String

    Permalink
    Definition Classes
    AutomationConfig
  379. def getNaFillStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  380. def getNumberOfGenerations: Int

    Permalink
    Definition Classes
    AutomationConfig
  381. def getNumberOfMutationsPerGeneration: Int

    Permalink
    Definition Classes
    AutomationConfig
  382. def getNumberOfParentsToRetain: Int

    Permalink
    Definition Classes
    AutomationConfig
  383. def getNumericBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    AutomationConfig
  384. def getNumericFillStat: String

    Permalink
    Definition Classes
    AutomationConfig
  385. def getNumericNABlanketFillValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  386. def getNumericNAFillMap: Map[String, AnyVal]

    Permalink
    Definition Classes
    AutomationConfig
  387. def getOneHotEncodingStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  388. def getOutlierConfig: OutlierConfig

    Permalink
    Definition Classes
    AutomationConfig
  389. def getOutlierFilterStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  390. def getPNorm: Double

    Permalink
    Definition Classes
    AutomationConfig
  391. def getParallelism: Int

    Permalink
    Definition Classes
    AutomationConfig
  392. def getPearsonAutoFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  393. def getPearsonConfig: PearsonConfig

    Permalink
    Definition Classes
    AutomationConfig
  394. def getPearsonFilterDirection: String

    Permalink
    Definition Classes
    AutomationConfig
  395. def getPearsonFilterManualValue: Double

    Permalink
    Definition Classes
    AutomationConfig
  396. def getPearsonFilterMode: String

    Permalink
    Definition Classes
    AutomationConfig
  397. def getPearsonFilterStatistic: String

    Permalink
    Definition Classes
    AutomationConfig
  398. def getPearsonFilterStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  399. def getPipelineId: String

    Permalink
    Definition Classes
    AutomationConfig
  400. def getQuorumCount: Int

    Permalink
    Definition Classes
    AutomationConfig
  401. def getScalerMax: Double

    Permalink
    Definition Classes
    AutomationConfig
  402. def getScalerMin: Double

    Permalink
    Definition Classes
    AutomationConfig
  403. def getScalerType: String

    Permalink
    Definition Classes
    AutomationConfig
  404. def getScalingConfig: ScalingConfig

    Permalink
    Definition Classes
    AutomationConfig
  405. def getScalingStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  406. def getScoringMetric: String

    Permalink
    Definition Classes
    AutomationConfig
  407. def getScoringOptimizationStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  408. def getSeed: Long

    Permalink
    Definition Classes
    AutomationConfig
  409. def getSplitCachingStrategy: String

    Permalink
    Definition Classes
    AutomationConfig
  410. def getStandardScalingMeanFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  411. def getStandardScalingStdDevFlag: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  412. def getStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    AutomationConfig
  413. def getSyntheticCol: String

    Permalink
    Definition Classes
    AutomationConfig
  414. def getTrainPortion: Double

    Permalink
    Definition Classes
    AutomationConfig
  415. def getTrainSplitChronologicalColumn: String

    Permalink
    Definition Classes
    AutomationConfig
  416. def getTrainSplitChronologicalRandomPercentage: Double

    Permalink
    Definition Classes
    AutomationConfig
  417. def getTrainSplitMethod: String

    Permalink
    Definition Classes
    AutomationConfig
  418. def getTreeSplitsConfig: MainConfig

    Permalink
    Definition Classes
    AutomationConfig
  419. def getUpperFilterNTile: Double

    Permalink
    Definition Classes
    AutomationConfig
  420. def getVarianceFilterStatus: Boolean

    Permalink
    Definition Classes
    AutomationConfig
  421. def getVectorMutationMethod: String

    Permalink
    Definition Classes
    AutomationConfig
  422. def hashCode(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  423. def hyperSpaceInferenceOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  424. def hyperSpaceInferenceOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  425. def indexStrings(categoricalFields: List[String]): (Array[StringIndexer], Array[String])

    Permalink
    Definition Classes
    DataValidation
  426. def invalidateSelection(value: String, allowances: Seq[String]): String

    Permalink
    Definition Classes
    DataValidation
  427. final def isInstanceOf[T0]: Boolean

    Permalink
    Definition Classes
    Any
  428. def mlFlowLogArtifactsOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  429. def mlFlowLogArtifactsOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  430. def mlFlowLoggingOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  431. def mlFlowLoggingOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  432. def naFillOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  433. def naFillOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  434. final def ne(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  435. final def notify(): Unit

    Permalink
    Definition Classes
    AnyRef
  436. final def notifyAll(): Unit

    Permalink
    Definition Classes
    AnyRef
  437. def oneHotEncodeStrings(stringIndexedFields: List[String]): (OneHotEncoderEstimator, Array[String])

    Permalink
    Definition Classes
    DataValidation
  438. def oneHotEncodingOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  439. def oneHotEncodingOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  440. def outlierFilterOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  441. def outlierFilterOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  442. def pearsonFilterOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  443. def pearsonFilterOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  444. def prettyPrintConfig(config: AnyRef): String

    Permalink

    Provide a human-readable report to stdout and in the logs that shows the configuration for a model run with the key -> value relationship shown as json

    Provide a human-readable report to stdout and in the logs that shows the configuration for a model run with the key -> value relationship shown as json

    config

    AnyRef -> a defined case class

    returns

    String in the form of pretty print syntax

    Definition Classes
    AutomationTools
  445. def printSchema(schema: Array[String], dataName: String): String

    Permalink
    Definition Classes
    AutomationTools
  446. def printSchema(df: DataFrame, dataName: String): String

    Permalink
    Definition Classes
    AutomationTools
  447. def recordInferenceDataConfig(config: MainConfig, startingFields: Array[String]): InferenceDataConfig

    Permalink

    Helper method for generating the Inference Config object for the data configuration steps needed to perform to reproduce the modeling for subsequent inference runs.

    Helper method for generating the Inference Config object for the data configuration steps needed to perform to reproduce the modeling for subsequent inference runs.

    config

    The full main Config that is utilized for the execution of the run.

    startingFields

    The fields that are returned from type casting and validation (may contain artificial suffixes for StringIndexer (_si) and OneHotEncoder (_oh)). These will be removed before recording.

    returns

    An instance of InferenceDataConfig

    Definition Classes
    AutomationTools
    Since

    0.4.0

  448. def recordInferenceSwitchSettings(config: MainConfig): InferenceSwitchSettings

    Permalink

    Single-pass method for recording all switch settings to the InferenceConfig Object.

    Single-pass method for recording all switch settings to the InferenceConfig Object.

    config

    MainConfig used for starting the training AutoML run

    Definition Classes
    AutomationTools
  449. def removeArrayOfColumns(payload: InferencePayload, removalArray: Array[String]): InferencePayload

    Permalink

    Definition Classes
    InferenceTools
  450. def runInferenceFromJSONConfig(jsonConfig: String): DataFrame

    Permalink

    Public method for performing an inference run from a supplied inference config string.

    Public method for performing an inference run from a supplied inference config string.

    jsonConfig

    the saved inference config from a previous run as string-encoded json

    returns

    A Dataframe with predictions based on a pre-trained model.

  451. def runInferenceFromStoredDataFrame(inferenceConfigDFPath: String): DataFrame

    Permalink

    Public method for performing an inference run from a stored InferenceConfig Dataframe location.

    Public method for performing an inference run from a stored InferenceConfig Dataframe location.

    inferenceConfigDFPath

    Path on storage of where the Dataframe was written during the training run.

    returns

    A Dataframe with predictions based on a pre-trained model.

  452. lazy val sc: SparkContext

    Permalink
    Definition Classes
    SparkSessionWrapper
  453. def scalingOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  454. def scalingOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  455. def setAutoStoppingScore(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  456. def setCardinalityCheckMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[AssertionError] )
  457. def setCardinalityLimit(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
  458. def setCardinalityPrecision(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
  459. def setCardinalitySwitch(value: Boolean): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  460. def setCardinalityThreshold(value: Int): InferencePipeline.this.type

    Permalink

    Setter - for overriding the cardinality threshold exception threshold.

    Setter - for overriding the cardinality threshold exception threshold. [WARNING] increasing this value on a sufficiently large data set could incur, during runtime, excessive memory and cpu pressure on the cluster.

    value

    Int: the limit above which an exception will be thrown for a classification problem wherein the label distinct count is too large to successfully generate synthetic data.

    Definition Classes
    AutomationConfig
    Since

    0.5.1

    Note

    Default: 20

  461. def setCardinalityType(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[AssertionError] )
  462. def setCategoricalNAFillMap(value: Map[String, String]): InferencePipeline.this.type

    Permalink

    Setter for providing a map of [Column Name -> String Fill Value] for manual by-column overrides.

    Setter for providing a map of [Column Name -> String Fill Value] for manual by-column overrides. Any non-specified fields in this map will utilize the "auto" statistics-based fill paradigm to calculate and fill any NA values in non-numeric columns.

    value

    Map[String, String]: Column Name as String -> Fill Value as String

    Definition Classes
    AutomationConfig
    Since

    0.5.2

    Note

    If fields are specified in here that are not part of the DataFrame's schema, an exception will be thrown.

    If naFillMode is specified as using Map Fill modes, this setter or the numeric na fill map MUST be set.

  463. def setCharacterFillStat(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  464. def setCharacterNABlanketFillValue(value: String): InferencePipeline.this.type

    Permalink

    Setter for providing a 'blanket override' value (fill all found categorical columns' missing values with this specified value).

    Setter for providing a 'blanket override' value (fill all found categorical columns' missing values with this specified value).

    value

    String: A value to fill all categorical na values in the DataFrame with.

    Definition Classes
    AutomationConfig
    Since

    0.5.2

  465. def setContinuousDataThreshold(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  466. def setContinuousEvolutionGeneticMixing(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  467. def setContinuousEvolutionImprovementThreshold(value: Int): InferencePipeline.this.type

    Permalink

    Setter for defining the secondary stopping criteria for continuous training mode (number of consistently not-improving runs to terminate the learning algorithm due to diminishing returns).

    Setter for defining the secondary stopping criteria for continuous training mode (number of consistently not-improving runs to terminate the learning algorithm due to diminishing returns).

    value

    Negative Integer (an improvement to a priori will reset the counter and subsequent non-improvements will decrement a mutable counter. If the counter hits this limit specified in value, the continuous mode algorithm will stop).

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is positive.

  468. def setContinuousEvolutionMaxIterations(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  469. def setContinuousEvolutionMutationAggressiveness(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  470. def setContinuousEvolutionParallelism(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  471. def setContinuousEvolutionRollingImprovementCount(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  472. def setContinuousEvolutionStoppingScore(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  473. def setCorrelationCutoffHigh(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  474. def setCorrelationCutoffLow(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  475. def setDataPrepParallelism(value: Int): InferencePipeline.this.type

    Permalink

    Setter for defining the number of concurrent threads allocated to performing asynchronous data prep tasks within the feature engineering aspect of this application.

    Setter for defining the number of concurrent threads allocated to performing asynchronous data prep tasks within the feature engineering aspect of this application.

    value

    Int: A value that must be greater than zero.

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if a value less than or equal to zero is supplied.

    Note

    This value has an upper limit, depending on driver size, that will restrict the efficacy of the asynchronous tasks within the pool. Setting this too high may cause cluster instability.

  476. def setDataReductionFactor(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  477. def setDateTimeConversionType(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  478. def setDeltaCacheBackingDirectory(value: String): InferencePipeline.this.type

    Permalink

    Setter for providing a path to write the kfold train/test splits as Delta data sets to (useful for extremely large data sets or a situation where using local disk storage might be prohibitively expensive)

    Setter for providing a path to write the kfold train/test splits as Delta data sets to (useful for extremely large data sets or a situation where using local disk storage might be prohibitively expensive)

    value

    String path to a dbfs location for creating the temporary (or persisted) Delta data sets of the kfold train/test splits.

    Definition Classes
    AutomationConfig
    Since

    0.7.1

  479. def setDeltaCacheBackingDirectoryRemovalFlag(value: Boolean): InferencePipeline.this.type

    Permalink

    Setter for whether or not to delete the written train/test splits for the run in Delta.

    Setter for whether or not to delete the written train/test splits for the run in Delta. Defaulted to true which means that the job will delete the data on Object store to clean itself up after the run is completed if the splitCachingStrategy is set to 'delta'

    value

    Boolean - true => delete; false => leave on Object Store

    Definition Classes
    AutomationConfig
    Since

    0.7.1

  480. def setEvolutionStrategy(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  481. def setFeatConfig(value: MainConfig): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  482. def setFeatConfig(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  483. def setFeatureImportanceCutoffType(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  484. def setFeatureImportanceCutoffValue(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  485. def setFeatureInteractionContinuousDiscretizerBucketCount(value: Int): InferencePipeline.this.type

    Permalink

    Setter for determining the behavior of continuous feature columns.

    Setter for determining the behavior of continuous feature columns. In order to calculate Entropy for a continuous variable, the distribution must be converted to nominal values for estimation of per-split information gain. This setting defines how many nominal categorical values to create out of a continuously distributed feature in order to calculate Entropy.

    value

    Int -> must be greater than 1

    Definition Classes
    AutomationConfig
    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the value specified is <= 1

  486. def setFeatureInteractionParallelism(value: Int): InferencePipeline.this.type

    Permalink

    Setter for configuring the concurrent count for scoring of feature interaction candidates.

    Setter for configuring the concurrent count for scoring of feature interaction candidates. Due to the nature of these operations, the configuration here may need to be set differently to that of the modeling and general feature engineering phases of the toolkit. This is highly dependent on the row count of the data set being submitted.

    value

    Int -> must be greater than 0

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the value is < 1

  487. def setFeatureInteractionRetentionMode(value: String): InferencePipeline.this.type

    Permalink

    Setter for determining the mode of operation for inclusion of interacted features.

    Setter for determining the mode of operation for inclusion of interacted features. Modes are:

    • all -> Includes all interactions between all features (after string indexing of categorical values)
    • optimistic -> If the Information Gain / Variance, as compared to at least ONE of the parents of the interaction is above the threshold set by featureInteractionTargetInteractionPercentage (e.g. if IG of left parent is 0.5 and right parent is 0.9, with threshold set at 10, if the interaction between these two parents has an IG of 0.42, it would be rejected, but if it was 0.46, it would be kept)
    • strict -> the threshold percentage must be met for BOTH parents. (in the above example, the IG for the interaction would have to be > 0.81 in order to be included in the feature vector).
    value

    String -> one of: 'all', 'optimistic', or 'strict'

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the specified value submitted is not permitted

  488. def setFeatureInteractionTargetInteractionPercentage(value: Double): InferencePipeline.this.type

    Permalink

    Setter for establishing the minimum acceptable InformationGain or Variance allowed for an interaction candidate based on comparison to the scores of its parents.

    Setter for establishing the minimum acceptable InformationGain or Variance allowed for an interaction candidate based on comparison to the scores of its parents.

    value

    Double in range of -inf -> inf

    Definition Classes
    AutomationConfig
    Since

    0.6.2

  489. def setFeaturesCol(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  490. def setFieldsToIgnore(value: Array[String]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  491. def setFieldsToIgnoreInVector(value: Array[String]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  492. def setFilterBounds(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  493. def setFilterPrecision(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  494. def setFirstGenerationArraySeed(value: Long): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  495. def setFirstGenerationGenePool(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  496. def setFirstGenerationIndexMixingMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  497. def setFirstGenerationMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  498. def setFirstGenerationPermutationCount(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  499. def setFixedMutationValue(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  500. def setGenerationalMutationStrategy(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  501. def setGeneticMBOCandidateFactor(value: Int): InferencePipeline.this.type

    Permalink

    Setter for defining the factor to be applied to the candidate listing of hyperparameters to generate through mutation for each generation other than the initial and post-modeling optimization phases.

    Setter for defining the factor to be applied to the candidate listing of hyperparameters to generate through mutation for each generation other than the initial and post-modeling optimization phases. The larger this value (default: 10), the more potential space can be searched. There is not a large performance hit to this, and as such, values in excess of 100 are viable.

    value

    Int - a factor to multiply the numberOfMutationsPerGeneration by to generate a count of potential candidates.

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is not greater than zero.

  502. def setGeneticMBORegressorType(value: String): InferencePipeline.this.type

    Permalink

    Setter for selecting the type of Regressor to use for the within-epoch generation MBO of candidates

    Setter for selecting the type of Regressor to use for the within-epoch generation MBO of candidates

    value

    String - one of "XGBoost", "LinearRegression" or "RandomForest"

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is not supported

  503. def setGeneticMixing(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  504. def setHyperSpaceInferenceCount(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  505. def setHyperSpaceModelCount(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  506. def setHyperSpaceModelType(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  507. def setInferenceConfigSaveLocation(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
  508. def setKFold(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  509. def setKGroups(value: Int): InferencePipeline.this.type

    Permalink

    Setter for specifying the number of K-Groups to generate in the KMeans model

    Setter for specifying the number of K-Groups to generate in the KMeans model

    value

    Int: number of k groups to generate

    returns

    this

    Definition Classes
    AutomationConfig
  510. def setKMeansDistanceMeasurement(value: String): InferencePipeline.this.type

    Permalink

    Setter for which distance measurement to use to calculate the nearness of vectors to a centroid

    Setter for which distance measurement to use to calculate the nearness of vectors to a centroid

    value

    String: Options -> "euclidean" or "cosine". Default: "euclidean"

    returns

    this

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if an invalid value is entered

  511. def setKMeansMaxIter(value: Int): InferencePipeline.this.type

    Permalink

    Setter for specifying the maximum number of iterations for the KMeans model to go through to converge

    Setter for specifying the maximum number of iterations for the KMeans model to go through to converge

    value

    Int: Maximum limit on iterations

    returns

    this

    Definition Classes
    AutomationConfig
  512. def setKMeansPredictionCol(value: String): InferencePipeline.this.type

    Permalink

    Setter for the internal KMeans column for cluster membership attribution

    Setter for the internal KMeans column for cluster membership attribution

    value

    String: column name for internal algorithm column for group membership

    returns

    this

    Definition Classes
    AutomationConfig
  513. def setKMeansSeed(value: Long): InferencePipeline.this.type

    Permalink

    Setter for a KMeans seed for the clustering algorithm

    Setter for a KMeans seed for the clustering algorithm

    value

    Long: Seed value

    returns

    this

    Definition Classes
    AutomationConfig
  514. def setKMeansTolerance(value: Double): InferencePipeline.this.type

    Permalink

    Setter for setting the tolerance for KMeans (must be >0)

    Setter for setting the tolerance for KMeans (must be >0)

    value

    The tolerance value setting for KMeans

    returns

    this

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if a value that is not greater than 0 is entered

    See also

    reference: http://spark.apache.org/docs/latest/api/scala/index.html#org.apache.spark.ml.clustering.KMeans for further details.

  515. def setKSampleConfig(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  516. def setLSHHashTables(value: Int): InferencePipeline.this.type

    Permalink

    Setter for Configuring the number of Hash Tables to use for MinHashLSH

    Setter for Configuring the number of Hash Tables to use for MinHashLSH

    value

    Int: Count of hash tables to use

    returns

    this

    Definition Classes
    AutomationConfig
    See also

    http://spark.apache.org/docs/latest/api/scala/index.html#org.apache.spark.ml.feature.MinHashLSH for more information

  517. def setLSHOutputCol(value: String): InferencePipeline.this.type

    Permalink

    Setter for the internal LSH output hash information column

    Setter for the internal LSH output hash information column

    value

    String: column name for the internal MinHashLSH Model transformation value

    returns

    this

    Definition Classes
    AutomationConfig
  518. def setLSHSeed(value: Long): InferencePipeline.this.type

    Permalink

    Setter for Configuring the Seed value for the LSH MinHash model

    Setter for Configuring the Seed value for the LSH MinHash model

    value

    Long: A Seed value

    Definition Classes
    AutomationConfig
    Since

    0.5.1

  519. def setLabelBalanceMode(value: String): InferencePipeline.this.type

    Permalink

    Setter - for determining the label balance approach mode.

    Setter - for determining the label balance approach mode.

    value

    String: one of: 'match', 'percentage' or 'target'

    Definition Classes
    AutomationConfig
    Annotations
    @throws( ... )
    Since

    0.5.1

    Exceptions thrown

    UnsupportedOperationException() if the provided mode is not supported.

    Note

    Default: "percentage"

    ,

    Available modes:
    'match': Will match all smaller class counts to the largest class count. [WARNING] - May significantly increase memory pressure!
    'percentage': Will adjust smaller classes to a percentage value of the largest class count.
    'target': Will increase smaller class counts to a fixed numeric target of rows.

  520. def setLabelCol(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  521. def setLowerFilterNTile(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  522. def setMainConfig(value: MainConfig): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  523. def setMainConfig(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  524. def setMinimumVectorCountToMutate(value: Int): InferencePipeline.this.type

    Permalink

    Setter for minimum threshold for vector indexes to mutate within the feature vector.

    Setter for minimum threshold for vector indexes to mutate within the feature vector.

    value

    The minimum (or fixed) number of indexes to mutate.

    returns

    this

    Definition Classes
    AutomationConfig
    Note

    In vectorMutationMethod "fixed" this sets the fixed count of how many vector positions to mutate. In vectorMutationMethod "random" this sets the lower threshold for 'at least this many indexes will be mutated'

  525. def setMlFlowAPIToken(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  526. def setMlFlowBestSuffix(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  527. def setMlFlowConfig(value: MLFlowConfig): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  528. def setMlFlowCustomRunTags(value: Map[String, String]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  529. def setMlFlowExperimentName(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  530. def setMlFlowLoggingMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  531. def setMlFlowModelSaveDirectory(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
  532. def setMlFlowTrackingURI(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  533. def setModelSeedMap(value: Map[String, Any]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  534. def setModelSeedString(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  535. def setModelSelectionDistinctThreshold(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  536. def setModelingFamily(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  537. def setMutationMagnitudeMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  538. def setMutationMode(value: String): InferencePipeline.this.type

    Permalink

    Setter for the Mutation Mode of the feature vector individual values

    Setter for the Mutation Mode of the feature vector individual values

    value

    String: the mode to use.

    returns

    this

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the mode is not supported.

    Note

    Options: "weighted" - uses weighted averaging to scale the euclidean distance between the centroid vector and mutation candidate vectors; "random" - randomly selects a position on the euclidean vector between the centroid vector and the candidate mutation vectors; "ratio" - uses a ratio between the values of the centroid vector and the mutation vector.

  539. def setMutationValue(value: Double): InferencePipeline.this.type

    Permalink

    Setter for specifying the mutation magnitude for the modes 'weighted' and 'ratio' in mutationMode

    Setter for specifying the mutation magnitude for the modes 'weighted' and 'ratio' in mutationMode

    value

    Double: value between 0 and 1 for mutation magnitude adjustment.

    returns

    this

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the value specified is outside of the range (0, 1)

    Note

    the higher this value, the closer to the centroid vector vs. the candidate mutation vector the synthetic row data will be.

  540. def setNAFillFilterPrecision(value: Double): InferencePipeline.this.type

    Permalink

    Setter for defining the precision for calculating the model type as per the label column

    Setter for defining the precision for calculating the model type as per the label column

    value

    Double: Precision accuracy for approximate distinct calculation.

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[AssertionError] )
    Since

    0.5.2

    Exceptions thrown

    java.lang.AssertionError if the value is outside of the allowable range of 0 to 1

    Note

    setting this value to zero (0) for a large regression problem will incur a long processing time and an expensive shuffle.

  541. def setNAFillMode(value: String): InferencePipeline.this.type

    Permalink

    Mode for na fill
    Available modes:
    auto : Stats-based na fill for fields.

    Mode for na fill
    Available modes:
    auto : Stats-based na fill for fields. Usage of .setNumericFillStat and .setCharacterFillStat will inform the type of statistics that will be used to fill.
    mapFill : Custom by-column overrides to 'blanket fill' na values on a per-column basis. The categorical (string) fields are set via .setCategoricalNAFillMap while the numeric fields are set via .setNumericNAFillMap.
    blanketFillAll : Fills all fields based on the values specified by .setCharacterNABlanketFillValue and .setNumericNABlanketFillValue. All NA's for the appropriate types will be filled in accordingly throughout all columns.
    blanketFillCharOnly : Will use statistics to fill in numeric fields, but will replace all categorical character fields na values with a blanket fill value.
    blanketFillNumOnly : Will use statistics to fill in character fields, but will replace all numeric fields na values with a blanket value.

    value

    String: Mode for NA Fill

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.5.2

    Exceptions thrown

    IllegalArgumentException if the mode specified is not supported.

  542. def setNumberOfGenerations(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  543. def setNumberOfMutationsPerGeneration(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  544. def setNumberOfParentsToRetain(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  545. def setNumericBoundaries(value: Map[String, (Double, Double)]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  546. def setNumericFillStat(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  547. def setNumericNABlanketFillValue(value: Double): InferencePipeline.this.type

    Permalink

    Setter for providing a 'blanket override' value (fill all found numeric columns' missing values with this specified value)

    Setter for providing a 'blanket override' value (fill all found numeric columns' missing values with this specified value)

    value

    Double: A value to fill all numeric na values in the DataFrame with.

    Definition Classes
    AutomationConfig
    Since

    0.5.2

  548. def setNumericNAFillMap(value: Map[String, AnyVal]): InferencePipeline.this.type

    Permalink

    Setter for providing a map of [Column Name -> AnyVal Fill Value] (must be numeric).

    Setter for providing a map of [Column Name -> AnyVal Fill Value] (must be numeric). Any non-specified fields in this map will utilize the "auto" statistics-based fill paradigm to calculate and fill any NA values in numeric columns.

    value

    Map[String, AnyVal]: Column Name as String -> Fill Numeric Type Value

    Definition Classes
    AutomationConfig
    Since

    0.5.2

    Note

    If fields are specified in here that are not part of the DataFrame's schema, an exception will be thrown.

    ,

    if naFillMode is specified as using Map Fill modes, this setter or the categorical na fill map MUST be set.

  549. def setNumericRatio(value: Double): InferencePipeline.this.type

    Permalink

    Setter - for specifying the percentage ratio for the mode 'percentage' in setLabelBalanceMode()

    Setter - for specifying the percentage ratio for the mode 'percentage' in setLabelBalanceMode()

    value

    Double: A fractional double in the range of 0.0 to 1.0.

    Definition Classes
    AutomationConfig
    Annotations
    @throws( ... )
    Since

    0.5.1

    Exceptions thrown

    UnsupportedOperationException() if the provided value is outside of the range of 0.0 -> 1.0

    Note

    Default: 0.2

    ,

    Setting this value to 1.0 is equivalent to setting the label balance mode to 'match'

  550. def setNumericTarget(value: Int): InferencePipeline.this.type

    Permalink

    Setter - for specifying the target row count to generate for 'target' mode in setLabelBalanceMode()

    Setter - for specifying the target row count to generate for 'target' mode in setLabelBalanceMode()

    value

    Int: The desired final number of rows per minority class label

    Definition Classes
    AutomationConfig
    Since

    0.5.1

    Note

    [WARNING] Setting this value to too high of a number will greatly increase runtime and memory pressure.

  551. def setPNorm(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  552. def setParallelism(value: Int): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  553. def setPearsonAutoFilterNTile(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  554. def setPearsonFilterDirection(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  555. def setPearsonFilterManualValue(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  556. def setPearsonFilterMode(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  557. def setPearsonFilterStatistic(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  558. def setPipelineId(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  559. def setQuorumCount(value: Int): InferencePipeline.this.type

    Permalink

    Setter for how many vectors to find in adjacency to the centroid for generation of synthetic data

    Setter for how many vectors to find in adjacency to the centroid for generation of synthetic data

    value

    Int: Number of vectors to find nearest each centroid within the class

    returns

    this

    Definition Classes
    AutomationConfig
    Note

    the higher the value set here, the higher the variance in synthetic data generation

  560. def setScalerMax(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  561. def setScalerMin(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  562. def setScalerType(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  563. def setScoringMetric(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  564. def setScoringOptimizationStrategy(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  565. def setSeed(value: Long): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  566. def setSplitCachingStrategy(value: String): InferencePipeline.this.type

    Permalink

    Setter for determining the split caching strategy (either persist to disk for each kfold split or backing to Delta)

    Setter for determining the split caching strategy (either persist to disk for each kfold split or backing to Delta)

    value

    Configuration string either 'persist' or 'delta'

    Definition Classes
    AutomationConfig
    Since

    0.7.1

  567. def setStandardScalerMeanFlagOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  568. def setStandardScalerMeanFlagOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  569. def setStandardScalerStdDevFlagOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  570. def setStandardScalerStdDevFlagOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  571. def setStringBoundaries(value: Map[String, List[String]]): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  572. def setSyntheticCol(value: String): InferencePipeline.this.type

    Permalink

    Setter - for setting the name of the Synthetic column

    Setter - for setting the name of the Synthetic column

    value

    String: A unique column name that is not part of the main DataFrame

    Definition Classes
    AutomationConfig
    Since

    0.5.1

  573. def setTrainPortion(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  574. def setTrainSplitChronologicalColumn(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  575. def setTrainSplitChronologicalRandomPercentage(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  576. def setTrainSplitMethod(value: String): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  577. def setTreeSplitsConfig(value: MainConfig): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  578. def setTreeSplitsConfig(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  579. def setUpperFilterNTile(value: Double): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  580. def setVectorMutationMethod(value: String): InferencePipeline.this.type

    Permalink

    Setter for the Vector Mutation Method

    Setter for the Vector Mutation Method

    value

    String - the mode to use.

    returns

    this

    Definition Classes
    AutomationConfig
    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the mode is not supported.

    Note

    Options: "fixed" - will use the value of minimumVectorCountToMutate to select that many random indexes. "random" - will use this number as a lower bound on a random selection of indexes between this and the vector length. "all" - will mutate all of the vectors.

  581. lazy val spark: SparkSession

    Permalink
    Definition Classes
    SparkSessionWrapper
  582. final def synchronized[T0](arg0: ⇒ T0): T0

    Permalink
    Definition Classes
    AnyRef
  583. def toString(): String

    Permalink
    Definition Classes
    AnyRef → Any
  584. final val trainSplitMethods: List[String]

    Permalink
    Definition Classes
    Defaults
  585. def trainSplitValidation(trainSplitMethod: String, modelSelection: String): String

    Permalink
    Definition Classes
    AutomationTools
  586. def validateCardinality(df: DataFrame, stringFields: List[String], cardinalityLimit: Int = 500, parallelism: Int = 20): ValidatedCategoricalFields

    Permalink
    Definition Classes
    DataValidation
  587. def validateFieldPresence(df: DataFrame, column: String): Unit

    Permalink
    Definition Classes
    DataValidation
  588. def validateInputDataframe(df: DataFrame): Unit

    Permalink
    Definition Classes
    DataValidation
  589. def validateLabelAndFeatures(df: DataFrame, labelCol: String, featureCol: String): Unit

    Permalink
    Definition Classes
    DataValidation
  590. def varianceFilterOff(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  591. def varianceFilterOn(): InferencePipeline.this.type

    Permalink
    Definition Classes
    AutomationConfig
  592. final def wait(): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  593. final def wait(arg0: Long, arg1: Int): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  594. final def wait(arg0: Long): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )

Inherited from InferenceTools

Inherited from DataValidation

Inherited from AutomationTools

Inherited from SparkSessionWrapper

Inherited from Serializable

Inherited from Serializable

Inherited from AutomationConfig

Inherited from SanitizerDefaults

Inherited from Defaults

Inherited from AnyRef

Inherited from Any

Ungrouped