Trait

com.databricks.labs.automl.executor

AutomationConfig

Related Doc: package executor

Permalink

trait AutomationConfig extends Defaults with SanitizerDefaults

Linear Supertypes
Known Subclasses
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. AutomationConfig
  2. SanitizerDefaults
  3. Defaults
  4. AnyRef
  5. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Value Members

  1. final def !=(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  4. final val _allowableEvolutionStrategies: List[String]

    Permalink
    Definition Classes
    Defaults
  5. final val _allowableInitialGenerationIndexMixingModes: List[String]

    Permalink
    Definition Classes
    Defaults
  6. final val _allowableInitialGenerationModes: List[String]

    Permalink
    Definition Classes
    Defaults
  7. final val _allowableMlFlowLoggingModes: List[String]

    Permalink
    Definition Classes
    Defaults
  8. final val _allowableNAFillModes: List[String]

    Permalink
    Definition Classes
    Defaults
  9. final val _allowedFilterDirections: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  10. final val _allowedFilterModes: Array[String]

    Permalink
    Definition Classes
    SanitizerDefaults
  11. final val _allowedStats: Array[String]

    Permalink

    Pearson Defaults

    Pearson Defaults

    Definition Classes
    SanitizerDefaults
  12. var _autoStoppingFlag: Boolean

    Permalink
  13. var _autoStoppingScore: Double

    Permalink
  14. var _cardinalityCheckMode: String

    Permalink
  15. var _cardinalityLimit: Int

    Permalink
  16. var _cardinalityPrecision: Double

    Permalink
  17. var _cardinalitySwitchFlag: Boolean

    Permalink
  18. var _cardinalityThreshold: Int

    Permalink
  19. var _cardinalityType: String

    Permalink
  20. var _categoricalNAFillMap: Map[String, String]

    Permalink
  21. var _characterFillStat: String

    Permalink
  22. var _characterNABlanketFillValue: String

    Permalink
  23. var _continuousDataThreshold: Int

    Permalink
  24. var _continuousEvolutionGeneticMixing: Double

    Permalink
  25. var _continuousEvolutionImprovementThreshold: Int

    Permalink
  26. var _continuousEvolutionMaxIterations: Int

    Permalink
  27. var _continuousEvolutionMutationAggressiveness: Int

    Permalink
  28. var _continuousEvolutionParallelism: Int

    Permalink
  29. var _continuousEvolutionRollingImprovementCount: Int

    Permalink
  30. var _continuousEvolutionStoppingScore: Double

    Permalink
  31. var _correlationCutoffHigh: Double

    Permalink
  32. var _correlationCutoffLow: Double

    Permalink
  33. var _covarianceConfig: CovarianceConfig

    Permalink
  34. def _covarianceConfigDefaults: CovarianceConfig

    Permalink
    Definition Classes
    Defaults
  35. var _covarianceFilterFlag: Boolean

    Permalink
  36. var _dataPrepCachingFlag: Boolean

    Permalink
  37. def _dataPrepConfigDefaults: DataPrepConfig

    Permalink
    Definition Classes
    Defaults
  38. var _dataPrepParallelism: Int

    Permalink
  39. var _dataReductionFactor: Double

    Permalink
  40. var _dateTimeConversionType: String

    Permalink
  41. def _defaultAutoStoppingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  42. def _defaultAutoStoppingScore: Double

    Permalink
    Definition Classes
    Defaults
  43. def _defaultCovarianceFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  44. def _defaultDataPrepCachingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  45. def _defaultDataPrepParallelism: Int

    Permalink
    Definition Classes
    Defaults
  46. def _defaultDataReductionFactor: Double

    Permalink
    Definition Classes
    Defaults
  47. def _defaultDateTimeConversionType: String

    Permalink
    Definition Classes
    Defaults
  48. def _defaultFeatureImportanceCutoffType: String

    Permalink
    Definition Classes
    Defaults
  49. def _defaultFeatureImportanceCutoffValue: Double

    Permalink
    Definition Classes
    Defaults
  50. def _defaultFeatureInteractionConfig: FeatureInteractionConfig

    Permalink
    Definition Classes
    Defaults
  51. def _defaultFeatureInteractionFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  52. def _defaultFeaturesCol: String

    Permalink
    Definition Classes
    Defaults
  53. def _defaultFieldsToIgnoreInVector: Array[String]

    Permalink
    Definition Classes
    Defaults
  54. def _defaultFirstGenerationConfig: FirstGenerationConfig

    Permalink
    Definition Classes
    Defaults
  55. def _defaultHyperSpaceInference: Boolean

    Permalink
    Definition Classes
    Defaults
  56. def _defaultHyperSpaceInferenceCount: Int

    Permalink
    Definition Classes
    Defaults
  57. def _defaultHyperSpaceModelCount: Int

    Permalink
    Definition Classes
    Defaults
  58. def _defaultHyperSpaceModelType: String

    Permalink
    Definition Classes
    Defaults
  59. def _defaultInitialGenerationMode: String

    Permalink
    Definition Classes
    Defaults
  60. def _defaultKSampleConfig: KSampleConfig

    Permalink
    Definition Classes
    Defaults
  61. def _defaultLabelCol: String

    Permalink
    Definition Classes
    Defaults
  62. def _defaultMlFlowArtifactsFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  63. def _defaultMlFlowLoggingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  64. def _defaultModelingFamily: String

    Permalink
    Definition Classes
    Defaults
  65. def _defaultNAFillFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  66. def _defaultOneHotEncodeFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  67. def _defaultOutlierFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  68. def _defaultPearsonFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  69. def _defaultPipelineDebugFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  70. def _defaultPipelineId: String

    Permalink
    Definition Classes
    Defaults
  71. def _defaultScalingFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  72. def _defaultVarianceFilterFlag: Boolean

    Permalink
    Definition Classes
    Defaults
  73. var _deltaCacheBackingDirectory: String

    Permalink
  74. var _deltaCacheBackingDirectoryRemovalFlag: Boolean

    Permalink
  75. var _evolutionStrategy: String

    Permalink
  76. var _featureImportanceCutoffType: String

    Permalink
  77. var _featureImportanceCutoffValue: Double

    Permalink
  78. var _featureImportancesConfig: MainConfig

    Permalink
  79. def _featureImportancesDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  80. var _featureInteractionConfig: FeatureInteractionConfig

    Permalink
  81. var _featureInteractionContinuousDiscretizerBucketCount: Int

    Permalink
  82. var _featureInteractionFlag: Boolean

    Permalink
  83. var _featureInteractionParallelism: Int

    Permalink
  84. var _featureInteractionRetentionMode: String

    Permalink
  85. var _featureInteractionTargetInteractionPercentage: Double

    Permalink
  86. var _featuresCol: String

    Permalink
  87. var _fieldsToIgnore: Array[String]

    Permalink
  88. var _fieldsToIgnoreInVector: Array[String]

    Permalink
  89. var _fillConfig: FillConfig

    Permalink
  90. def _fillConfigDefaults: FillConfig

    Permalink
    Definition Classes
    Defaults
  91. var _filterBounds: String

    Permalink
  92. var _filterPrecision: Double

    Permalink
  93. var _firstGenerationArraySeed: Long

    Permalink
  94. var _firstGenerationConfig: FirstGenerationConfig

    Permalink
  95. var _firstGenerationGenePool: Int

    Permalink
  96. var _firstGenerationIndexMixingMode: String

    Permalink
  97. var _firstGenerationMode: String

    Permalink
  98. var _firstGenerationPermutationCount: Int

    Permalink
  99. var _fixedMutationValue: Int

    Permalink
  100. def _gbtDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  101. def _gbtDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  102. var _generationalMutationStrategy: String

    Permalink
  103. var _geneticConfig: GeneticConfig

    Permalink
  104. var _geneticMBOCandidateFactor: Int

    Permalink
  105. var _geneticMBORegressorType: String

    Permalink
  106. var _geneticMixing: Double

    Permalink
  107. def _geneticTunerDefaults: GeneticConfig

    Permalink
    Definition Classes
    Defaults
  108. var _hyperSpaceInference: Boolean

    Permalink
  109. var _hyperSpaceInferenceCount: Int

    Permalink
  110. var _hyperSpaceModelCount: Int

    Permalink
  111. var _hyperSpaceModelType: String

    Permalink
  112. var _inferenceConfigSaveLocation: String

    Permalink
  113. def _inferenceConfigSaveLocationDefault: String

    Permalink
    Definition Classes
    Defaults
  114. var _kFold: Int

    Permalink
  115. var _kGroups: Int

    Permalink
  116. var _kMeansDistanceMeasurement: String

    Permalink
  117. var _kMeansMaxIter: Int

    Permalink
  118. var _kMeansPredictionCol: String

    Permalink
  119. var _kMeansSeed: Long

    Permalink
  120. var _kMeansTolerance: Double

    Permalink
  121. var _kSampleConfig: KSampleConfig

    Permalink
  122. var _labelBalanceMode: String

    Permalink
  123. var _labelCol: String

    Permalink
  124. def _lightGBMDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  125. def _lightGBMDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  126. def _linearRegressionDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  127. def _linearRegressionDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  128. def _logisticRegressionDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  129. def _logisticRegressionDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  130. var _lowerFilterNTile: Double

    Permalink
  131. var _lshHashTables: Int

    Permalink
  132. var _lshOutputCol: String

    Permalink
  133. var _lshSeed: Long

    Permalink
  134. var _mainConfig: MainConfig

    Permalink
  135. def _mainConfigDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  136. var _minimumVectorCountToMutate: Int

    Permalink
  137. var _mlFlowAPIToken: String

    Permalink
  138. var _mlFlowArtifactsFlag: Boolean

    Permalink
  139. var _mlFlowBestSuffix: String

    Permalink
  140. var _mlFlowConfig: MLFlowConfig

    Permalink
  141. def _mlFlowConfigDefaults: MLFlowConfig

    Permalink
    Definition Classes
    Defaults
  142. var _mlFlowCustomRunTags: Map[String, String]

    Permalink
  143. var _mlFlowExperimentName: String

    Permalink
  144. var _mlFlowLoggingFlag: Boolean

    Permalink
  145. var _mlFlowLoggingMode: String

    Permalink
  146. var _mlFlowModelSaveDirectory: String

    Permalink
  147. var _mlFlowTrackingURI: String

    Permalink
  148. def _mlpcDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  149. def _mlpcDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  150. var _modelSeedMap: Map[String, Any]

    Permalink
  151. var _modelSeedSetStatus: Boolean

    Permalink
  152. var _modelSelectionDistinctThreshold: Int

    Permalink
  153. def _modelTypeDefault: String

    Permalink
    Definition Classes
    Defaults
  154. var _modelingFamily: String

    Permalink
  155. var _mutationMagnitudeMode: String

    Permalink
  156. var _mutationMode: String

    Permalink
  157. var _mutationValue: Double

    Permalink
  158. var _naFillFilterPrecision: Double

    Permalink
  159. var _naFillFlag: Boolean

    Permalink
  160. var _naFillMode: String

    Permalink
  161. def _naiveBayesDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  162. def _naiveBayesDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  163. var _numberOfGenerations: Int

    Permalink
  164. var _numberOfMutationsPerGeneration: Int

    Permalink
  165. var _numberOfParentsToRetain: Int

    Permalink
  166. var _numericBoundaries: Map[String, (Double, Double)]

    Permalink
  167. var _numericFillStat: String

    Permalink
  168. var _numericNABlanketFillValue: Double

    Permalink
  169. var _numericNAFillMap: Map[String, AnyVal]

    Permalink
  170. var _numericRatio: Double

    Permalink
  171. var _numericTarget: Int

    Permalink
  172. var _oneHotEncodeFlag: Boolean

    Permalink
  173. var _outlierConfig: OutlierConfig

    Permalink
  174. def _outlierConfigDefaults: OutlierConfig

    Permalink
    Definition Classes
    Defaults
  175. var _outlierFilterFlag: Boolean

    Permalink
  176. var _outputDfRepartitionScaleFactor: Int

    Permalink
  177. var _pNorm: Double

    Permalink
  178. var _parallelism: Int

    Permalink
  179. var _pearsonAutoFilterNTile: Double

    Permalink
  180. var _pearsonConfig: PearsonConfig

    Permalink
  181. def _pearsonConfigDefaults: PearsonConfig

    Permalink
    Definition Classes
    Defaults
  182. var _pearsonFilterDirection: String

    Permalink
  183. var _pearsonFilterFlag: Boolean

    Permalink
  184. var _pearsonFilterManualValue: Double

    Permalink
  185. var _pearsonFilterMode: String

    Permalink
  186. var _pearsonFilterStatistic: String

    Permalink
  187. var _pipelineDebugFlag: Boolean

    Permalink
  188. var _pipelineId: String

    Permalink
  189. var _quorumCount: Int

    Permalink
  190. def _rfDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  191. def _rfDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  192. var _scalerMax: Double

    Permalink
  193. var _scalerMin: Double

    Permalink
  194. var _scalerType: String

    Permalink
  195. var _scalingConfig: ScalingConfig

    Permalink
  196. def _scalingConfigDefaults: ScalingConfig

    Permalink
    Definition Classes
    Defaults
  197. var _scalingFlag: Boolean

    Permalink
  198. def _scoringDefaultClassifier: String

    Permalink
    Definition Classes
    Defaults
  199. def _scoringDefaultRegressor: String

    Permalink
    Definition Classes
    Defaults
  200. var _scoringMetric: String

    Permalink
  201. var _scoringOptimizationStrategy: String

    Permalink
  202. def _scoringOptimizationStrategyClassifier: String

    Permalink
    Definition Classes
    Defaults
  203. def _scoringOptimizationStrategyRegressor: String

    Permalink
    Definition Classes
    Defaults
  204. var _seed: Long

    Permalink
  205. var _splitCachingStrategy: String

    Permalink
  206. var _standardScalerMeanFlag: Boolean

    Permalink
  207. var _standardScalerStdDevFlag: Boolean

    Permalink
  208. var _stringBoundaries: Map[String, List[String]]

    Permalink
  209. final val _supportedFeatureImportanceCutoffTypes: List[String]

    Permalink
    Definition Classes
    Defaults
  210. final val _supportedModels: Array[String]

    Permalink
    Definition Classes
    Defaults
  211. def _svmDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  212. def _svmDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  213. var _syntheticCol: String

    Permalink
  214. var _trainPortion: Double

    Permalink
  215. var _trainSplitChronologicalColumn: String

    Permalink
  216. var _trainSplitChronologicalRandomPercentage: Double

    Permalink
  217. var _trainSplitColumnSet: Boolean

    Permalink
  218. var _trainSplitMethod: String

    Permalink
  219. def _treeSplitDefaults: MainConfig

    Permalink
    Definition Classes
    Defaults
  220. var _treeSplitsConfig: MainConfig

    Permalink
  221. def _treesDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  222. def _treesDefaultStringBoundaries: Map[String, List[String]]

    Permalink
    Definition Classes
    Defaults
  223. var _upperFilterNTile: Double

    Permalink
  224. var _varianceFilterFlag: Boolean

    Permalink
  225. var _vectorMutationMethod: String

    Permalink
  226. def _xgboostDefaultNumBoundaries: Map[String, (Double, Double)]

    Permalink
    Definition Classes
    Defaults
  227. final val allowableCardinalilties: List[String]

    Permalink
    Definition Classes
    Defaults
  228. final val allowableCategoricalFilterModes: List[String]

    Permalink
    Definition Classes
    Defaults
  229. final val allowableDateTimeConversions: List[String]

    Permalink
    Definition Classes
    Defaults
  230. final val allowableFeatureInteractionModes: List[String]

    Permalink
    Definition Classes
    Defaults
  231. final val allowableKMeansDistanceMeasurements: List[String]

    Permalink
    Definition Classes
    Defaults
  232. final val allowableLabelBalanceModes: List[String]

    Permalink
    Definition Classes
    Defaults
  233. final val allowableMBORegressorTypes: List[String]

    Permalink
    Definition Classes
    Defaults
  234. final val allowableMutationModes: List[String]

    Permalink
    Definition Classes
    Defaults
  235. final val allowableScalers: Array[String]

    Permalink

    Scaler Defaults

    Scaler Defaults

    Definition Classes
    SanitizerDefaults
  236. final val allowableVectorMutationMethods: List[String]

    Permalink
    Definition Classes
    Defaults
  237. final def asInstanceOf[T0]: T0

    Permalink
    Definition Classes
    Any
  238. def autoStoppingOff(): AutomationConfig.this.type

    Permalink
  239. def autoStoppingOn(): AutomationConfig.this.type

    Permalink
  240. def cardinalitySwitchOff(): AutomationConfig.this.type

    Permalink
  241. def cardinalitySwitchOn(): AutomationConfig.this.type

    Permalink
  242. def clone(): AnyRef

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  243. def covarianceFilterOff(): AutomationConfig.this.type

    Permalink
  244. def covarianceFilterOn(): AutomationConfig.this.type

    Permalink
  245. def dataPrepCachingOff(): AutomationConfig.this.type

    Permalink
  246. def dataPrepCachingOn(): AutomationConfig.this.type

    Permalink
  247. def defaultFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  248. def defaultLabelCol: String

    Permalink

    Global Defaults

    Global Defaults

    Definition Classes
    SanitizerDefaults
  249. def defaultPNorm: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  250. def defaultPearsonAutoFilterNTile: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  251. def defaultPearsonFilterDirection: String

    Permalink
    Definition Classes
    SanitizerDefaults
  252. def defaultPearsonFilterManualValue: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  253. def defaultPearsonFilterMode: String

    Permalink
    Definition Classes
    SanitizerDefaults
  254. def defaultPearsonFilterStatistic: String

    Permalink
    Definition Classes
    SanitizerDefaults
  255. def defaultRenamedFeaturesCol: String

    Permalink
    Definition Classes
    SanitizerDefaults
  256. def defaultScalerMax: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  257. def defaultScalerMin: Double

    Permalink
    Definition Classes
    SanitizerDefaults
  258. def defaultScalerType: String

    Permalink
    Definition Classes
    SanitizerDefaults
  259. def defaultStandardScalerMeanFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  260. def defaultStandardScalerStdDevFlag: Boolean

    Permalink
    Definition Classes
    SanitizerDefaults
  261. def deltaCheckBackingDirectoryRemovalOff(): AutomationConfig.this.type

    Permalink
  262. def deltaCheckBackingDirectoryRemovalOn(): AutomationConfig.this.type

    Permalink
  263. final def eq(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  264. def equals(arg0: Any): Boolean

    Permalink
    Definition Classes
    AnyRef → Any
  265. def featureInteractionOff(): AutomationConfig.this.type

    Permalink
  266. def featureInteractionOn(): AutomationConfig.this.type

    Permalink
  267. def finalize(): Unit

    Permalink
    Attributes
    protected[java.lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  268. def getAutoStoppingFlag: Boolean

    Permalink
  269. def getAutoStoppingScore: Double

    Permalink
  270. def getCardinalityCheckMode: String

    Permalink
  271. def getCardinalityLimit: Int

    Permalink
  272. def getCardinalityPrecision: Double

    Permalink
  273. def getCardinalitySwitch: Boolean

    Permalink
  274. def getCardinalityType: String

    Permalink
  275. def getCategoricalNAFillMap: Map[String, String]

    Permalink
  276. def getCharacterFillStat: String

    Permalink
  277. def getCharacterNABlanketFillValue: String

    Permalink
  278. final def getClass(): Class[_]

    Permalink
    Definition Classes
    AnyRef → Any
  279. def getContinuousDataThreshold: Int

    Permalink
  280. def getContinuousEvolutionGeneticMixing: Double

    Permalink
  281. def getContinuousEvolutionMaxIterations: Int

    Permalink
  282. def getContinuousEvolutionMutationAggressiveness: Int

    Permalink
  283. def getContinuousEvolutionParallelism: Int

    Permalink
  284. def getContinuousEvolutionRollingImporvementCount: Int

    Permalink
  285. def getContinuousEvolutionStoppingScore: Double

    Permalink
  286. def getCorrelationCutoffHigh: Double

    Permalink
  287. def getCorrelationCutoffLow: Double

    Permalink
  288. def getCovarianceConfig: CovarianceConfig

    Permalink
  289. def getCovarianceFilterStatus: Boolean

    Permalink
  290. def getDataPrepCachingStatus: Boolean

    Permalink
  291. def getDataPrepParallelism: Int

    Permalink
  292. def getDataReductionFactor: Double

    Permalink
  293. def getDateTimeConversionType: String

    Permalink
  294. def getDeltaCacheBackingDirectory: String

    Permalink
  295. def getDeltaCacheBackingDirectoryRemovalFlag: Boolean

    Permalink
  296. def getEvolutionStrategy: String

    Permalink
  297. def getFeatConfig: MainConfig

    Permalink
  298. def getFeatureImportanceCutoffType: String

    Permalink
  299. def getFeatureImportanceCutoffValue: Double

    Permalink
  300. def getFeatureInteractionConfig: FeatureInteractionConfig

    Permalink
  301. def getFeatureInteractionContinuousDiscretizerBucketCount: Int

    Permalink
  302. def getFeatureInteractionParallelism: Int

    Permalink
  303. def getFeatureInteractionRetentionMode: String

    Permalink
  304. def getFeatureInteractionStatus: Boolean

    Permalink
  305. def getFeatureInteractionTargetInteractionPercentage: Double

    Permalink
  306. def getFeaturesCol: String

    Permalink
  307. def getFieldsToIgnore: Array[String]

    Permalink
  308. def getFieldsToIgnoreInVector: Array[String]

    Permalink
  309. def getFillConfig: FillConfig

    Permalink
  310. def getFilterBounds: String

    Permalink
  311. def getFilterPrecision: Double

    Permalink
  312. def getFirstGenerationArraySeed: Long

    Permalink
  313. def getFirstGenerationConfig: FirstGenerationConfig

    Permalink
  314. def getFirstGenerationGenePool: Int

    Permalink
  315. def getFirstGenerationIndexMixingMode: String

    Permalink
  316. def getFirstGenerationMode: String

    Permalink
  317. def getFirstGenerationPermutationCount: Int

    Permalink
  318. def getFixedMutationValue: Int

    Permalink
  319. def getGenerationalMutationStrategy: String

    Permalink
  320. def getGeneticConfig: GeneticConfig

    Permalink
  321. def getGeneticMixing: Double

    Permalink
  322. def getHyperSpaceInferenceCount: Int

    Permalink
  323. def getHyperSpaceInferenceStatus: Boolean

    Permalink
  324. def getHyperSpaceModelCount: Int

    Permalink
  325. def getHyperSpaceModelType: String

    Permalink
  326. def getInferenceConfigSaveLocation: String

    Permalink
  327. def getKFold: Int

    Permalink
  328. def getKGroups: Int

    Permalink
  329. def getKMeansDistanceMeasurement: String

    Permalink
  330. def getKMeansMaxIter: Int

    Permalink
  331. def getKMeansPredictionCol: String

    Permalink
  332. def getKMeansSeed: Long

    Permalink
  333. def getKMeansTolerance: Double

    Permalink
  334. def getKSampleConfig: KSampleConfig

    Permalink
  335. def getLSHHashTables: Int

    Permalink
  336. def getLSHOutputCol: String

    Permalink
  337. def getLabelCol: String

    Permalink
  338. def getLowerFilterNTile: Double

    Permalink
  339. def getMainConfig: MainConfig

    Permalink
  340. def getMinimumVectorCountToMutate: Int

    Permalink
  341. def getMlFlowBestSuffix: String

    Permalink
  342. def getMlFlowConfig: MLFlowConfig

    Permalink
  343. def getMlFlowCustomRunTags: Map[String, String]

    Permalink
  344. def getMlFlowExperimentName: String

    Permalink
  345. def getMlFlowLogArtifactsFlag: Boolean

    Permalink
  346. def getMlFlowLoggingFlag: Boolean

    Permalink
  347. def getMlFlowLoggingMode: String

    Permalink
  348. def getMlFlowModelSaveDirectory: String

    Permalink
  349. def getMlFlowTrackingURI: String

    Permalink
  350. def getModelSeedMap: Map[String, Any]

    Permalink
  351. def getModelSeedSetStatus: Boolean

    Permalink
  352. def getModelSelectionDistinctThreshold: Int

    Permalink
  353. def getModelingFamily: String

    Permalink
  354. def getMutationMagnitudeMode: String

    Permalink
  355. def getMutationMode: String

    Permalink
  356. def getMutationValue: Double

    Permalink
  357. def getNAFillFilterPrecision: Double

    Permalink
  358. def getNAFillMode: String

    Permalink
  359. def getNaFillStatus: Boolean

    Permalink
  360. def getNumberOfGenerations: Int

    Permalink
  361. def getNumberOfMutationsPerGeneration: Int

    Permalink
  362. def getNumberOfParentsToRetain: Int

    Permalink
  363. def getNumericBoundaries: Map[String, (Double, Double)]

    Permalink
  364. def getNumericFillStat: String

    Permalink
  365. def getNumericNABlanketFillValue: Double

    Permalink
  366. def getNumericNAFillMap: Map[String, AnyVal]

    Permalink
  367. def getOneHotEncodingStatus: Boolean

    Permalink
  368. def getOutlierConfig: OutlierConfig

    Permalink
  369. def getOutlierFilterStatus: Boolean

    Permalink
  370. def getPNorm: Double

    Permalink
  371. def getParallelism: Int

    Permalink
  372. def getPearsonAutoFilterNTile: Double

    Permalink
  373. def getPearsonConfig: PearsonConfig

    Permalink
  374. def getPearsonFilterDirection: String

    Permalink
  375. def getPearsonFilterManualValue: Double

    Permalink
  376. def getPearsonFilterMode: String

    Permalink
  377. def getPearsonFilterStatistic: String

    Permalink
  378. def getPearsonFilterStatus: Boolean

    Permalink
  379. def getPipelineId: String

    Permalink
  380. def getQuorumCount: Int

    Permalink
  381. def getScalerMax: Double

    Permalink
  382. def getScalerMin: Double

    Permalink
  383. def getScalerType: String

    Permalink
  384. def getScalingConfig: ScalingConfig

    Permalink
  385. def getScalingStatus: Boolean

    Permalink
  386. def getScoringMetric: String

    Permalink
  387. def getScoringOptimizationStrategy: String

    Permalink
  388. def getSeed: Long

    Permalink
  389. def getSplitCachingStrategy: String

    Permalink
  390. def getStandardScalingMeanFlag: Boolean

    Permalink
  391. def getStandardScalingStdDevFlag: Boolean

    Permalink
  392. def getStringBoundaries: Map[String, List[String]]

    Permalink
  393. def getSyntheticCol: String

    Permalink
  394. def getTrainPortion: Double

    Permalink
  395. def getTrainSplitChronologicalColumn: String

    Permalink
  396. def getTrainSplitChronologicalRandomPercentage: Double

    Permalink
  397. def getTrainSplitMethod: String

    Permalink
  398. def getTreeSplitsConfig: MainConfig

    Permalink
  399. def getUpperFilterNTile: Double

    Permalink
  400. def getVarianceFilterStatus: Boolean

    Permalink
  401. def getVectorMutationMethod: String

    Permalink
  402. def hashCode(): Int

    Permalink
    Definition Classes
    AnyRef → Any
  403. def hyperSpaceInferenceOff(): AutomationConfig.this.type

    Permalink
  404. def hyperSpaceInferenceOn(): AutomationConfig.this.type

    Permalink
  405. final def isInstanceOf[T0]: Boolean

    Permalink
    Definition Classes
    Any
  406. def mlFlowLogArtifactsOff(): AutomationConfig.this.type

    Permalink
  407. def mlFlowLogArtifactsOn(): AutomationConfig.this.type

    Permalink
  408. def mlFlowLoggingOff(): AutomationConfig.this.type

    Permalink
  409. def mlFlowLoggingOn(): AutomationConfig.this.type

    Permalink
  410. def naFillOff(): AutomationConfig.this.type

    Permalink
  411. def naFillOn(): AutomationConfig.this.type

    Permalink
  412. final def ne(arg0: AnyRef): Boolean

    Permalink
    Definition Classes
    AnyRef
  413. final def notify(): Unit

    Permalink
    Definition Classes
    AnyRef
  414. final def notifyAll(): Unit

    Permalink
    Definition Classes
    AnyRef
  415. def oneHotEncodingOff(): AutomationConfig.this.type

    Permalink
  416. def oneHotEncodingOn(): AutomationConfig.this.type

    Permalink
  417. def outlierFilterOff(): AutomationConfig.this.type

    Permalink
  418. def outlierFilterOn(): AutomationConfig.this.type

    Permalink
  419. def pearsonFilterOff(): AutomationConfig.this.type

    Permalink
  420. def pearsonFilterOn(): AutomationConfig.this.type

    Permalink
  421. def scalingOff(): AutomationConfig.this.type

    Permalink
  422. def scalingOn(): AutomationConfig.this.type

    Permalink
  423. def setAutoStoppingScore(value: Double): AutomationConfig.this.type

    Permalink
  424. def setCardinalityCheckMode(value: String): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[AssertionError] )
  425. def setCardinalityLimit(value: Int): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[IllegalArgumentException] )
  426. def setCardinalityPrecision(value: Double): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[IllegalArgumentException] )
  427. def setCardinalitySwitch(value: Boolean): AutomationConfig.this.type

    Permalink
  428. def setCardinalityThreshold(value: Int): AutomationConfig.this.type

    Permalink

    Setter - for overriding the cardinality threshold exception threshold.

    Setter - for overriding the cardinality threshold exception threshold. [WARNING] Increasing this value on a sufficiently large data set could incur excessive memory and CPU pressure on the cluster at runtime.

    value

    Int: the limit above which an exception will be thrown for a classification problem wherein the label distinct count is too large to successfully generate synthetic data.

    Since

    0.5.1

    Note

    Default: 20

  429. def setCardinalityType(value: String): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[AssertionError] )
  430. def setCategoricalNAFillMap(value: Map[String, String]): AutomationConfig.this.type

    Permalink

    Setter for providing a map of [Column Name -> String Fill Value] for manual by-column overrides.

    Setter for providing a map of [Column Name -> String Fill Value] for manual by-column overrides. Any non-specified fields in this map will utilize the "auto" statistics-based fill paradigm to calculate and fill any NA values in non-numeric columns.

    value

    Map[String, String]: Column Name as String -> Fill Value as String

    Since

    0.5.2

    Note

    If fields are specified in here that are not part of the DataFrame's schema, an exception will be thrown.

    ,

    if naFillMode is specified as using Map Fill modes, this setter or the numeric na fill map MUST be set.

  431. def setCharacterFillStat(value: String): AutomationConfig.this.type

    Permalink
  432. def setCharacterNABlanketFillValue(value: String): AutomationConfig.this.type

    Permalink

    Setter for providing a 'blanket override' value (fill all found categorical columns' missing values with this specified value).

    Setter for providing a 'blanket override' value (fill all found categorical columns' missing values with this specified value).

    value

    String: A value to fill all categorical na values in the DataFrame with.

    Since

    0.5.2

  433. def setContinuousDataThreshold(value: Int): AutomationConfig.this.type

    Permalink
  434. def setContinuousEvolutionGeneticMixing(value: Double): AutomationConfig.this.type

    Permalink
  435. def setContinuousEvolutionImprovementThreshold(value: Int): AutomationConfig.this.type

    Permalink

    Setter for defining the secondary stopping criteria for continuous training mode (the number of consistently non-improving runs after which the learning algorithm is terminated due to diminishing returns).

    Setter for defining the secondary stopping criteria for continuous training mode (the number of consistently non-improving runs after which the learning algorithm is terminated due to diminishing returns).

    value

    Negative Integer (an improvement to a priori will reset the counter and subsequent non-improvements will decrement a mutable counter. If the counter hits this limit specified in value, the continuous mode algorithm will stop).

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is positive.

  436. def setContinuousEvolutionMaxIterations(value: Int): AutomationConfig.this.type

    Permalink
  437. def setContinuousEvolutionMutationAggressiveness(value: Int): AutomationConfig.this.type

    Permalink
  438. def setContinuousEvolutionParallelism(value: Int): AutomationConfig.this.type

    Permalink
  439. def setContinuousEvolutionRollingImprovementCount(value: Int): AutomationConfig.this.type

    Permalink
  440. def setContinuousEvolutionStoppingScore(value: Double): AutomationConfig.this.type

    Permalink
  441. def setCorrelationCutoffHigh(value: Double): AutomationConfig.this.type

    Permalink
  442. def setCorrelationCutoffLow(value: Double): AutomationConfig.this.type

    Permalink
  443. def setDataPrepParallelism(value: Int): AutomationConfig.this.type

    Permalink

    Setter for defining the number of concurrent threads allocated to performing asynchronous data prep tasks within the feature engineering aspect of this application.

    Setter for defining the number of concurrent threads allocated to performing asynchronous data prep tasks within the feature engineering aspect of this application.

    value

    Int: A value that must be greater than zero.

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if a value less than or equal to zero is supplied.

    Note

    This value has an upper limit, depending on driver size, that will restrict the efficacy of the asynchronous tasks within the pool. Setting this too high may cause cluster instability.

  444. def setDataReductionFactor(value: Double): AutomationConfig.this.type

    Permalink
  445. def setDateTimeConversionType(value: String): AutomationConfig.this.type

    Permalink
  446. def setDeltaCacheBackingDirectory(value: String): AutomationConfig.this.type

    Permalink

    Setter for providing a path to write the kfold train/test splits as Delta data sets to (useful for extremely large data sets or a situation where using local disk storage might be prohibitively expensive)

    Setter for providing a path to write the kfold train/test splits as Delta data sets to (useful for extremely large data sets or a situation where using local disk storage might be prohibitively expensive)

    value

    String path to a dbfs location for creating the temporary (or persisted) Delta data sets of the kfold train/test splits.

    Since

    0.7.1

  447. def setDeltaCacheBackingDirectoryRemovalFlag(value: Boolean): AutomationConfig.this.type

    Permalink

    Setter for whether or not to delete the written train/test splits for the run in Delta.

    Setter for whether or not to delete the written train/test splits for the run in Delta. Defaulted to true which means that the job will delete the data on Object store to clean itself up after the run is completed if the splitCachingStrategy is set to 'delta'

    value

    Boolean - true => delete false => leave on Object Store

    Since

    0.7.1

  448. def setEvolutionStrategy(value: String): AutomationConfig.this.type

    Permalink
  449. def setFeatConfig(value: MainConfig): AutomationConfig.this.type

    Permalink
  450. def setFeatConfig(): AutomationConfig.this.type

    Permalink
  451. def setFeatureImportanceCutoffType(value: String): AutomationConfig.this.type

    Permalink
  452. def setFeatureImportanceCutoffValue(value: Double): AutomationConfig.this.type

    Permalink
  453. def setFeatureInteractionContinuousDiscretizerBucketCount(value: Int): AutomationConfig.this.type

    Permalink

    Setter for determining the behavior of continuous feature columns.

    Setter for determining the behavior of continuous feature columns. In order to calculate Entropy for a continuous variable, the distribution must be converted to nominal values for estimation of per-split information gain. This setting defines how many nominal categorical values to create out of a continuously distributed feature in order to calculate Entropy.

    value

    Int -> must be greater than 1

    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the value specified is <= 1

  454. def setFeatureInteractionParallelism(value: Int): AutomationConfig.this.type

    Permalink

    Setter for configuring the concurrent count for scoring of feature interaction candidates.

    Setter for configuring the concurrent count for scoring of feature interaction candidates. Due to the nature of these operations, the configuration here may need to be set differently to that of the modeling and general feature engineering phases of the toolkit. This is highly dependent on the row count of the data set being submitted.

    value

    Int -> must be greater than 0

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the value is < 1

  455. def setFeatureInteractionRetentionMode(value: String): AutomationConfig.this.type

    Permalink

    Setter for determining the mode of operation for inclusion of interacted features.

    Setter for determining the mode of operation for inclusion of interacted features. Modes are:

    • all -> Includes all interactions between all features (after string indexing of categorical values)
    • optimistic -> If the Information Gain / Variance, as compared to at least ONE of the parents of the interaction is above the threshold set by featureInteractionTargetInteractionPercentage (e.g. if IG of left parent is 0.5 and right parent is 0.9, with threshold set at 10, if the interaction between these two parents has an IG of 0.42, it would be rejected, but if it was 0.46, it would be kept)
    • strict -> the threshold percentage must be met for BOTH parents. (in the above example, the IG for the interaction would have to be > 0.81 in order to be included in the feature vector).
    value

    String -> one of: 'all', 'optimistic', or 'strict'

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.2

    Exceptions thrown

    IllegalArgumentException if the specified value submitted is not permitted

  456. def setFeatureInteractionTargetInteractionPercentage(value: Double): AutomationConfig.this.type

    Permalink

    Setter for establishing the minimum acceptable InformationGain or Variance allowed for an interaction candidate based on comparison to the scores of its parents.

    Setter for establishing the minimum acceptable InformationGain or Variance allowed for an interaction candidate based on comparison to the scores of its parents.

    value

    Double in range of -inf -> inf

    Since

    0.6.2

  457. def setFeaturesCol(value: String): AutomationConfig.this.type

    Permalink
  458. def setFieldsToIgnore(value: Array[String]): AutomationConfig.this.type

    Permalink
  459. def setFieldsToIgnoreInVector(value: Array[String]): AutomationConfig.this.type

    Permalink
  460. def setFilterBounds(value: String): AutomationConfig.this.type

    Permalink
  461. def setFilterPrecision(value: Double): AutomationConfig.this.type

    Permalink
  462. def setFirstGenerationArraySeed(value: Long): AutomationConfig.this.type

    Permalink
  463. def setFirstGenerationGenePool(value: Int): AutomationConfig.this.type

    Permalink
  464. def setFirstGenerationIndexMixingMode(value: String): AutomationConfig.this.type

    Permalink
  465. def setFirstGenerationMode(value: String): AutomationConfig.this.type

    Permalink
  466. def setFirstGenerationPermutationCount(value: Int): AutomationConfig.this.type

    Permalink
  467. def setFixedMutationValue(value: Int): AutomationConfig.this.type

    Permalink
  468. def setGenerationalMutationStrategy(value: String): AutomationConfig.this.type

    Permalink
  469. def setGeneticMBOCandidateFactor(value: Int): AutomationConfig.this.type

    Permalink

    Setter for defining the factor to be applied to the candidate listing of hyperparameters to generate through mutation for each generation other than the initial and post-modeling optimization phases.

    Setter for defining the factor to be applied to the candidate listing of hyperparameters to generate through mutation for each generation other than the initial and post-modeling optimization phases. The larger this value (default: 10), the more potential space can be searched. There is not a large performance hit to this, and as such, values in excess of 100 are viable.

    value

    Int - a factor to multiply the numberOfMutationsPerGeneration by to generate a count of potential candidates.

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is not greater than zero.

  470. def setGeneticMBORegressorType(value: String): AutomationConfig.this.type

    Permalink

    Setter for selecting the type of Regressor to use for the within-epoch generation MBO of candidates

    Setter for selecting the type of Regressor to use for the within-epoch generation MBO of candidates

    value

    String - one of "XGBoost", "LinearRegression" or "RandomForest"

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.6.0

    Exceptions thrown

    IllegalArgumentException if the value is not supported

  471. def setGeneticMixing(value: Double): AutomationConfig.this.type

    Permalink
  472. def setHyperSpaceInferenceCount(value: Int): AutomationConfig.this.type

    Permalink
  473. def setHyperSpaceModelCount(value: Int): AutomationConfig.this.type

    Permalink
  474. def setHyperSpaceModelType(value: String): AutomationConfig.this.type

    Permalink
  475. def setInferenceConfigSaveLocation(value: String): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[IllegalArgumentException] )
  476. def setKFold(value: Int): AutomationConfig.this.type

    Permalink
  477. def setKGroups(value: Int): AutomationConfig.this.type

    Permalink

    Setter for specifying the number of K-Groups to generate in the KMeans model

    Setter for specifying the number of K-Groups to generate in the KMeans model

    value

    Int: number of k groups to generate

    returns

    this

  478. def setKMeansDistanceMeasurement(value: String): AutomationConfig.this.type

    Permalink

    Setter for which distance measurement to use to calculate the nearness of vectors to a centroid

    Setter for which distance measurement to use to calculate the nearness of vectors to a centroid

    value

    String: Options -> "euclidean" or "cosine" Default: "euclidean"

    returns

    this

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if an invalid value is entered

  479. def setKMeansMaxIter(value: Int): AutomationConfig.this.type

    Permalink

    Setter for specifying the maximum number of iterations for the KMeans model to go through to converge

    Setter for specifying the maximum number of iterations for the KMeans model to go through to converge

    value

    Int: Maximum limit on iterations

    returns

    this

  480. def setKMeansPredictionCol(value: String): AutomationConfig.this.type

    Permalink

    Setter for the internal KMeans column for cluster membership attribution

    Setter for the internal KMeans column for cluster membership attribution

    value

    String: column name for internal algorithm column for group membership

    returns

    this

  481. def setKMeansSeed(value: Long): AutomationConfig.this.type

    Permalink

    Setter for a KMeans seed for the clustering algorithm

    Setter for a KMeans seed for the clustering algorithm

    value

    Long: Seed value

    returns

    this

  482. def setKMeansTolerance(value: Double): AutomationConfig.this.type

    Permalink

    Setter for the tolerance for KMeans (must be >0)

    Setter for the tolerance for KMeans (must be >0)

    value

    The tolerance value setting for KMeans

    returns

    this

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if a value less than 0 is entered

    See also

    reference: http://spark.apache.org/docs/latest/api/scala/index.html#org.apache.spark.ml.clustering.KMeans for further details.

  483. def setKSampleConfig(): AutomationConfig.this.type

    Permalink
  484. def setLSHHashTables(value: Int): AutomationConfig.this.type

    Permalink

    Setter for Configuring the number of Hash Tables to use for MinHashLSH

    Setter for Configuring the number of Hash Tables to use for MinHashLSH

    value

    Int: Count of hash tables to use

    returns

    this

    See also

    http://spark.apache.org/docs/latest/api/scala/index.html#org.apache.spark.ml.feature.MinHashLSH for more information

  485. def setLSHOutputCol(value: String): AutomationConfig.this.type

    Permalink

    Setter for the internal LSH output hash information column

    Setter for the internal LSH output hash information column

    value

    String: column name for the internal MinHashLSH Model transformation value

    returns

    this

  486. def setLSHSeed(value: Long): AutomationConfig.this.type

    Permalink

    Setter for Configuring the Seed value for the LSH MinHash model

    Setter for Configuring the Seed value for the LSH MinHash model

    value

    Long: A Seed value

    Since

    0.5.1

  487. def setLabelBalanceMode(value: String): AutomationConfig.this.type

    Permalink

    Setter - for determining the label balance approach mode.

    Setter - for determining the label balance approach mode.

    value

    String: one of: 'match', 'percentage' or 'target'

    Annotations
    @throws( ... )
    Since

    0.5.1

    Exceptions thrown

    UnsupportedOperationException() if the provided mode is not supported.

    Note

    Default: "percentage"

    ,

    Available modes:
    'match': Will match all smaller class counts to largest class count. [WARNING] - May significantly increase memory pressure!
    'percentage': Will adjust smaller classes to a percentage value of the largest class count.
    'target': Will increase smaller class counts to a fixed numeric target of rows.

  488. def setLabelCol(value: String): AutomationConfig.this.type

    Permalink
  489. def setLowerFilterNTile(value: Double): AutomationConfig.this.type

    Permalink
  490. def setMainConfig(value: MainConfig): AutomationConfig.this.type

    Permalink
  491. def setMainConfig(): AutomationConfig.this.type

    Permalink
  492. def setMinimumVectorCountToMutate(value: Int): AutomationConfig.this.type

    Permalink

    Setter for minimum threshold for vector indexes to mutate within the feature vector.

    Setter for minimum threshold for vector indexes to mutate within the feature vector.

    value

    The minimum (or fixed) number of indexes to mutate.

    returns

    this

    Note

    In vectorMutationMethod "fixed" this sets the fixed count of how many vector positions to mutate. In vectorMutationMethod "random" this sets the lower threshold for 'at least this many indexes will be mutated'

  493. def setMlFlowAPIToken(value: String): AutomationConfig.this.type

    Permalink
  494. def setMlFlowBestSuffix(value: String): AutomationConfig.this.type

    Permalink
  495. def setMlFlowConfig(value: MLFlowConfig): AutomationConfig.this.type

    Permalink
  496. def setMlFlowCustomRunTags(value: Map[String, String]): AutomationConfig.this.type

    Permalink
  497. def setMlFlowExperimentName(value: String): AutomationConfig.this.type

    Permalink
  498. def setMlFlowLoggingMode(value: String): AutomationConfig.this.type

    Permalink
  499. def setMlFlowModelSaveDirectory(value: String): AutomationConfig.this.type

    Permalink
    Annotations
    @throws( classOf[IllegalArgumentException] )
  500. def setMlFlowTrackingURI(value: String): AutomationConfig.this.type

    Permalink
  501. def setModelSeedMap(value: Map[String, Any]): AutomationConfig.this.type

    Permalink
  502. def setModelSeedString(value: String): AutomationConfig.this.type

    Permalink
  503. def setModelSelectionDistinctThreshold(value: Int): AutomationConfig.this.type

    Permalink
  504. def setModelingFamily(value: String): AutomationConfig.this.type

    Permalink
  505. def setMutationMagnitudeMode(value: String): AutomationConfig.this.type

    Permalink
  506. def setMutationMode(value: String): AutomationConfig.this.type

    Permalink

    Setter for the Mutation Mode of the feature vector individual values

    Setter for the Mutation Mode of the feature vector individual values

    value

    String: the mode to use.

    returns

    this

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the mode is not supported.

    Note

    Options: "weighted" - uses weighted averaging to scale the euclidean distance between the centroid vector and mutation candidate vectors; "random" - randomly selects a position on the euclidean vector between the centroid vector and the candidate mutation vectors; "ratio" - uses a ratio between the values of the centroid vector and the mutation vector.

  507. def setMutationValue(value: Double): AutomationConfig.this.type

    Permalink

    Setter for specifying the mutation magnitude for the modes 'weighted' and 'ratio' in mutationMode

    Setter for specifying the mutation magnitude for the modes 'weighted' and 'ratio' in mutationMode

    value

    Double: value between 0 and 1 for mutation magnitude adjustment.

    returns

    this

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the value specified is outside of the range (0, 1)

    Note

    the higher this value, the closer to the centroid vector vs. the candidate mutation vector the synthetic row data will be.

  508. def setNAFillFilterPrecision(value: Double): AutomationConfig.this.type

    Permalink

    Setter for defining the precision for calculating the model type as per the label column

    Setter for defining the precision for calculating the model type as per the label column

    value

    Double: Precision accuracy for approximate distinct calculation.

    Annotations
    @throws( classOf[AssertionError] )
    Since

    0.5.2

    Exceptions thrown

    java.lang.AssertionError If the value is outside of the allowable range of {0, 1}

    Note

    setting this value to zero (0) for a large regression problem will incur a long processing time and an expensive shuffle.

  509. def setNAFillMode(value: String): AutomationConfig.this.type

    Permalink

    Mode for na fill
    Available modes:
    auto : Stats-based na fill for fields.

    Mode for na fill
    Available modes:
    auto : Stats-based na fill for fields. Usage of .setNumericFillStat and .setCharacterFillStat will inform the type of statistics that will be used to fill.
    mapFill : Custom by-column overrides to 'blanket fill' na values on a per-column basis. The categorical (string) fields are set via .setCategoricalNAFillMap while the numeric fields are set via .setNumericNAFillMap.
    blanketFillAll : Fills all fields based on the values specified by .setCharacterNABlanketFillValue and .setNumericNABlanketFillValue. All NA's for the appropriate types will be filled in accordingly throughout all columns.
    blanketFillCharOnly : Will use statistics to fill in numeric fields, but will replace all categorical character fields na values with a blanket fill value.
    blanketFillNumOnly : Will use statistics to fill in character fields, but will replace all numeric fields na values with a blanket value.

    value

    String: Mode for NA Fill

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Since

    0.5.2

    Exceptions thrown

    IllegalArgumentException if the mode specified is not supported.

  510. def setNumberOfGenerations(value: Int): AutomationConfig.this.type

    Permalink
  511. def setNumberOfMutationsPerGeneration(value: Int): AutomationConfig.this.type

    Permalink
  512. def setNumberOfParentsToRetain(value: Int): AutomationConfig.this.type

    Permalink
  513. def setNumericBoundaries(value: Map[String, (Double, Double)]): AutomationConfig.this.type

    Permalink
  514. def setNumericFillStat(value: String): AutomationConfig.this.type

    Permalink
  515. def setNumericNABlanketFillValue(value: Double): AutomationConfig.this.type

    Permalink

    Setter for providing a 'blanket override' value (fill all found numeric columns' missing values with this specified value)

    Setter for providing a 'blanket override' value (fill all found numeric columns' missing values with this specified value)

    value

    Double: A value to fill all numeric na values in the DataFrame with.

    Since

    0.5.2

  516. def setNumericNAFillMap(value: Map[String, AnyVal]): AutomationConfig.this.type

    Permalink

    Setter for providing a map of [Column Name -> AnyVal Fill Value] (must be numeric).

    Setter for providing a map of [Column Name -> AnyVal Fill Value] (must be numeric). Any non-specified fields in this map will utilize the "auto" statistics-based fill paradigm to calculate and fill any NA values in numeric columns.

    value

    Map[String, AnyVal]: Column Name as String -> Fill Numeric Type Value

    Since

    0.5.2

    Note

    If fields are specified in here that are not part of the DataFrame's schema, an exception will be thrown.

    ,

    if naFillMode is specified as using Map Fill modes, this setter or the categorical na fill map MUST be set.

  517. def setNumericRatio(value: Double): AutomationConfig.this.type

    Permalink

    Setter - for specifying the percentage ratio for the mode 'percentage' in setLabelBalanceMode()

    Setter - for specifying the percentage ratio for the mode 'percentage' in setLabelBalanceMode()

    value

    Double: A fractional double in the range of 0.0 to 1.0.

    Annotations
    @throws( ... )
    Since

    0.5.1

    Exceptions thrown

    UnsupportedOperationException() if the provided value is outside of the range of 0.0 -> 1.0

    Note

    Default: 0.2

    ,

    Setting this value to 1.0 is equivalent to setting the label balance mode to 'match'

  518. def setNumericTarget(value: Int): AutomationConfig.this.type

    Permalink

    Setter - for specifying the target row count to generate for 'target' mode in setLabelBalanceMode()

    Setter - for specifying the target row count to generate for 'target' mode in setLabelBalanceMode()

    value

    Int: The desired final number of rows per minority class label

    Since

    0.5.1

    Note

    [WARNING] Setting this value to too high of a number will greatly increase runtime and memory pressure.

  519. def setPNorm(value: Double): AutomationConfig.this.type

    Permalink
  520. def setParallelism(value: Int): AutomationConfig.this.type

    Permalink
  521. def setPearsonAutoFilterNTile(value: Double): AutomationConfig.this.type

    Permalink
  522. def setPearsonFilterDirection(value: String): AutomationConfig.this.type

    Permalink
  523. def setPearsonFilterManualValue(value: Double): AutomationConfig.this.type

    Permalink
  524. def setPearsonFilterMode(value: String): AutomationConfig.this.type

    Permalink
  525. def setPearsonFilterStatistic(value: String): AutomationConfig.this.type

    Permalink
  526. def setPipelineId(value: String): AutomationConfig.this.type

    Permalink
  527. def setQuorumCount(value: Int): AutomationConfig.this.type

    Permalink

    Setter for how many vectors to find in adjacency to the centroid for generation of synthetic data

    Setter for how many vectors to find in adjacency to the centroid for generation of synthetic data

    value

    Int: Number of vectors to find nearest each centroid within the class

    returns

    this

    Note

    the higher the value set here, the higher the variance in synthetic data generation

  528. def setScalerMax(value: Double): AutomationConfig.this.type

    Permalink
  529. def setScalerMin(value: Double): AutomationConfig.this.type

    Permalink
  530. def setScalerType(value: String): AutomationConfig.this.type

    Permalink
  531. def setScoringMetric(value: String): AutomationConfig.this.type

    Permalink
  532. def setScoringOptimizationStrategy(value: String): AutomationConfig.this.type

    Permalink
  533. def setSeed(value: Long): AutomationConfig.this.type

    Permalink
  534. def setSplitCachingStrategy(value: String): AutomationConfig.this.type

    Permalink

    Setter for determining the split caching strategy (either persist to disk for each kfold split or backing to Delta)

    Setter for determining the split caching strategy (either persist to disk for each kfold split or backing to Delta)

    value

    Configuration string either 'persist' or 'delta'

    Since

    0.7.1

  535. def setStandardScalerMeanFlagOff(): AutomationConfig.this.type

    Permalink
  536. def setStandardScalerMeanFlagOn(): AutomationConfig.this.type

    Permalink
  537. def setStandardScalerStdDevFlagOff(): AutomationConfig.this.type

    Permalink
  538. def setStandardScalerStdDevFlagOn(): AutomationConfig.this.type

    Permalink
  539. def setStringBoundaries(value: Map[String, List[String]]): AutomationConfig.this.type

    Permalink
  540. def setSyntheticCol(value: String): AutomationConfig.this.type

    Permalink

    Setter - for setting the name of the Synthetic column

    Setter - for setting the name of the Synthetic column

    value

    String: A column name that is uniquely not part of the main DataFrame

    Since

    0.5.1

  541. def setTrainPortion(value: Double): AutomationConfig.this.type

    Permalink
  542. def setTrainSplitChronologicalColumn(value: String): AutomationConfig.this.type

    Permalink
  543. def setTrainSplitChronologicalRandomPercentage(value: Double): AutomationConfig.this.type

    Permalink
  544. def setTrainSplitMethod(value: String): AutomationConfig.this.type

    Permalink
  545. def setTreeSplitsConfig(value: MainConfig): AutomationConfig.this.type

    Permalink
  546. def setTreeSplitsConfig(): AutomationConfig.this.type

    Permalink
  547. def setUpperFilterNTile(value: Double): AutomationConfig.this.type

    Permalink
  548. def setVectorMutationMethod(value: String): AutomationConfig.this.type

    Permalink

    Setter for the Vector Mutation Method

    Setter for the Vector Mutation Method

    value

    String - the mode to use.

    returns

    this

    Annotations
    @throws( classOf[IllegalArgumentException] )
    Exceptions thrown

    IllegalArgumentException() if the mode is not supported.

    Note

    Options: "fixed" - will use the value of minimumVectorCountToMutate to select random indexes of this number of indexes. "random" - will use this number as a lower bound on a random selection of indexes between this and the vector length. "all" - will mutate all of the vectors.

  549. final def synchronized[T0](arg0: ⇒ T0): T0

    Permalink
    Definition Classes
    AnyRef
  550. def toString(): String

    Permalink
    Definition Classes
    AnyRef → Any
  551. final val trainSplitMethods: List[String]

    Permalink
    Definition Classes
    Defaults
  552. def varianceFilterOff(): AutomationConfig.this.type

    Permalink
  553. def varianceFilterOn(): AutomationConfig.this.type

    Permalink
  554. final def wait(): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  555. final def wait(arg0: Long, arg1: Int): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  556. final def wait(arg0: Long): Unit

    Permalink
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )

Inherited from SanitizerDefaults

Inherited from Defaults

Inherited from AnyRef

Inherited from Any

Ungrouped