Packages

class Featurize extends Estimator[PipelineModel] with Wrappable with DefaultParamsWritable with HasOutputCol with HasInputCols with BasicLogging

Featurizes a dataset. Converts the specified columns to feature columns.

Linear Supertypes
BasicLogging, HasInputCols, HasOutputCol, DefaultParamsWritable, MLWritable, Wrappable, DotnetWrappable, RWrappable, PythonWrappable, BaseWrappable, Estimator[PipelineModel], PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. Featurize
  2. BasicLogging
  3. HasInputCols
  4. HasOutputCol
  5. DefaultParamsWritable
  6. MLWritable
  7. Wrappable
  8. DotnetWrappable
  9. RWrappable
  10. PythonWrappable
  11. BaseWrappable
  12. Estimator
  13. PipelineStage
  14. Logging
  15. Params
  16. Serializable
  17. Serializable
  18. Identifiable
  19. AnyRef
  20. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new Featurize()
  2. new Featurize(uid: String)

Value Members

  1. final def clear(param: Param[_]): Featurize.this.type
    Definition Classes
    Params
  2. def copy(extra: ParamMap): Estimator[PipelineModel]
    Definition Classes
    Featurize → Estimator → PipelineStage → Params
  3. def dotnetAdditionalMethods: String
    Definition Classes
    DotnetWrappable
  4. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  5. def explainParams(): String
    Definition Classes
    Params
  6. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  7. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  8. def fit(dataset: Dataset[_]): PipelineModel

    Featurizes the dataset.

    Featurizes the dataset.

    dataset

    The input dataset to train.

    returns

    The featurized model.

    Definition Classes
    Featurize → Estimator
  9. def fit(dataset: Dataset[_], paramMaps: Seq[ParamMap]): Seq[PipelineModel]
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" )
  10. def fit(dataset: Dataset[_], paramMap: ParamMap): PipelineModel
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" )
  11. def fit(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): PipelineModel
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" ) @varargs()
  12. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  13. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  14. final def getImputeMissing: Boolean

  15. def getInputCols: Array[String]

    Definition Classes
    HasInputCols
  16. final def getNumFeatures: Int

  17. final def getOneHotEncodeCategoricals: Boolean

  18. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  19. def getOutputCol: String

    Definition Classes
    HasOutputCol
  20. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  21. def getParamInfo(p: Param[_]): ParamInfo[_]
    Definition Classes
    BaseWrappable
  22. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  23. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  24. val imputeMissing: Param[Boolean]
  25. val inputCols: StringArrayParam

    The names of the inputColumns

    The names of the inputColumns

    Definition Classes
    HasInputCols
  26. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  27. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  28. def logClass(): Unit
    Definition Classes
    BasicLogging
  29. def logFit[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  30. def logPredict[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  31. def logTrain[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  32. def logTransform[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  33. def logVerb[T](verb: String, f: ⇒ T): T
    Definition Classes
    BasicLogging
  34. def makeDotnetFile(conf: CodegenConfig): Unit
    Definition Classes
    DotnetWrappable
  35. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  36. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  37. val numFeatures: IntParam

    Number of features to hash string columns to

  38. val oneHotEncodeCategoricals: Param[Boolean]

    One hot encode categorical columns when true; default is true

  39. val outputCol: Param[String]

    The name of the output column

    The name of the output column

    Definition Classes
    HasOutputCol
  40. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  41. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  42. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  43. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  44. final def set[T](param: Param[T], value: T): Featurize.this.type
    Definition Classes
    Params
  45. def setImputeMissing(value: Boolean): Featurize.this.type

  46. def setInputCols(value: Array[String]): Featurize.this.type

    Definition Classes
    HasInputCols
  47. def setNumFeatures(value: Int): Featurize.this.type

  48. def setOneHotEncodeCategoricals(value: Boolean): Featurize.this.type

  49. def setOutputCol(value: String): Featurize.this.type

    Definition Classes
    HasOutputCol
  50. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  51. def transformSchema(schema: StructType): StructType
    Definition Classes
    Featurize → PipelineStage
  52. val uid: String
    Definition Classes
    FeaturizeBasicLogging → Identifiable
  53. val ver: String
    Definition Classes
    BasicLogging
  54. def write: MLWriter
    Definition Classes
    DefaultParamsWritable → MLWritable