class TextPreprocessor extends Transformer with HasInputCol with HasOutputCol with Wrappable with ComplexParamsWritable with BasicLogging

TextPreprocessor takes a DataFrame and a dictionary that maps text to replacement text (text -> replacement text). It scans each cell in the input column and replaces all substring matches with the corresponding value. Priority is given to longer keys, and matches are applied from left to right.

Linear Supertypes
BasicLogging, ComplexParamsWritable, MLWritable, Wrappable, RWrappable, PythonWrappable, BaseWrappable, HasOutputCol, HasInputCol, Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. TextPreprocessor
  2. BasicLogging
  3. ComplexParamsWritable
  4. MLWritable
  5. Wrappable
  6. RWrappable
  7. PythonWrappable
  8. BaseWrappable
  9. HasOutputCol
  10. HasInputCol
  11. Transformer
  12. PipelineStage
  13. Logging
  14. Params
  15. Serializable
  16. Serializable
  17. Identifiable
  18. AnyRef
  19. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new TextPreprocessor()
  2. new TextPreprocessor(uid: String)

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def $[T](param: Param[T]): T
    Attributes
    protected
    Definition Classes
    Params
  4. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  5. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  6. lazy val classNameHelper: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  7. final def clear(param: Param[_]): TextPreprocessor.this.type
    Definition Classes
    Params
  8. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  9. def companionModelClassName: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  10. def copy(extra: ParamMap): TextPreprocessor
    Definition Classes
    TextPreprocessor → Transformer → PipelineStage → Params
  11. def copyValues[T <: Params](to: T, extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  12. lazy val copyrightLines: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  13. final def defaultCopy[T <: Params](extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  14. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  15. def equals(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  16. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  17. def explainParams(): String
    Definition Classes
    Params
  18. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  19. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  20. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  21. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  22. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  23. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  24. def getInputCol: String

    Definition Classes
    HasInputCol
  25. def getMap: Map[String, String]

  26. def getNormFunc: String

  27. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  28. def getOutputCol: String

    Definition Classes
    HasOutputCol
  29. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  30. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  31. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  32. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  33. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  34. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  35. val inputCol: Param[String]

    The name of the input column

    Definition Classes
    HasInputCol
  36. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  37. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  38. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  39. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  40. def isValidNormFunc(normFuncName: String): Boolean
  41. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  42. def logBase(methodName: String): Unit
    Attributes
    protected
    Definition Classes
    BasicLogging
  43. def logClass(): Unit
    Definition Classes
    BasicLogging
  44. def logDebug(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  45. def logDebug(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  46. def logError(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  47. def logError(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  48. def logErrorBase(methodName: String, e: Exception): Unit
    Attributes
    protected
    Definition Classes
    BasicLogging
  49. def logFit[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  50. def logInfo(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  51. def logInfo(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  52. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  53. def logPredict[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  54. def logTrace(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  55. def logTrace(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  56. def logTrain[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  57. def logTransform[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  58. def logVerb[T](verb: String, f: ⇒ T): T
    Definition Classes
    BasicLogging
  59. def logWarning(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  60. def logWarning(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  61. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  62. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  63. val map: MapParam[String, String]
  64. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  65. val normFunc: Param[String]
  66. val normFuncs: Map[String, (Char) ⇒ Char]
  67. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  68. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  69. val outputCol: Param[String]

    The name of the output column

    Definition Classes
    HasOutputCol
  70. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  71. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  72. lazy val pyClassDoc: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  73. lazy val pyClassName: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  74. def pyExtraEstimatorImports: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  75. def pyExtraEstimatorMethods: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  76. lazy val pyInheritedClasses: Seq[String]
    Attributes
    protected
    Definition Classes
    PythonWrappable
  77. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  78. lazy val pyInternalWrapper: Boolean
    Attributes
    protected
    Definition Classes
    PythonWrappable
  79. lazy val pyObjectBaseClass: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  80. def pyParamArg[T](p: Param[T]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  81. def pyParamDefault[T](p: Param[T]): Option[String]
    Attributes
    protected
    Definition Classes
    PythonWrappable
  82. def pyParamGetter(p: Param[_]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  83. def pyParamSetter(p: Param[_]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  84. def pyParamsArgs: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  85. def pyParamsDefaults: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  86. lazy val pyParamsDefinitions: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  87. def pyParamsGetters: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  88. def pyParamsSetters: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  89. def pythonClass(): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  90. def rClass(): String
    Attributes
    protected
    Definition Classes
    RWrappable
  91. def rDocString: String
    Attributes
    protected
    Definition Classes
    RWrappable
  92. def rExtraBodyLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  93. def rExtraInitLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  94. lazy val rFuncName: String
    Attributes
    protected
    Definition Classes
    RWrappable
  95. lazy val rInternalWrapper: Boolean
    Attributes
    protected
    Definition Classes
    RWrappable
  96. def rParamArg[T](p: Param[T]): String
    Attributes
    protected
    Definition Classes
    RWrappable
  97. def rParamsArgs: String
    Attributes
    protected
    Definition Classes
    RWrappable
  98. def rSetterLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  99. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  100. final def set(paramPair: ParamPair[_]): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  101. final def set(param: String, value: Any): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  102. final def set[T](param: Param[T], value: T): TextPreprocessor.this.type
    Definition Classes
    Params
  103. final def setDefault(paramPairs: ParamPair[_]*): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  104. final def setDefault[T](param: Param[T], value: T): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  105. def setInputCol(value: String): TextPreprocessor.this.type

    Definition Classes
    HasInputCol
  106. def setMap(value: Map[String, String]): TextPreprocessor.this.type

  107. def setNormFunc(value: String): TextPreprocessor.this.type

  108. def setOutputCol(value: String): TextPreprocessor.this.type

    Definition Classes
    HasOutputCol
  109. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  110. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  111. def transform(dataset: Dataset[_]): DataFrame

    dataset

    - The input dataset, to be transformed

    returns

    The DataFrame that results from applying the text replacements

    Definition Classes
    TextPreprocessor → Transformer
  112. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  113. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  114. def transformSchema(schema: StructType): StructType
    Definition Classes
    TextPreprocessor → PipelineStage
  115. def transformSchema(schema: StructType, logging: Boolean): StructType
    Attributes
    protected
    Definition Classes
    PipelineStage
    Annotations
    @DeveloperApi()
  116. val uid: String
    Definition Classes
    TextPreprocessor → BasicLogging → Identifiable
  117. val ver: String
    Definition Classes
    BasicLogging
  118. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  119. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  120. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  121. def write: MLWriter
    Definition Classes
    ComplexParamsWritable → MLWritable

Inherited from BasicLogging

Inherited from ComplexParamsWritable

Inherited from MLWritable

Inherited from Wrappable

Inherited from RWrappable

Inherited from PythonWrappable

Inherited from BaseWrappable

Inherited from HasOutputCol

Inherited from HasInputCol

Inherited from Transformer

Inherited from PipelineStage

Inherited from Logging

Inherited from Params

Inherited from Serializable

Inherited from Serializable

Inherited from Identifiable

Inherited from AnyRef

Inherited from Any

getParam

param

setParam

Ungrouped