class TextPreprocessor extends Transformer with HasInputCol with HasOutputCol with Wrappable with ComplexParamsWritable with SynapseMLLogging

TextPreprocessor takes a DataFrame and a dictionary that maps (text -> replacement text), scans each cell in the input column, and replaces all substring matches with the corresponding value. When several keys could match, priority is given to longer keys, and matches are resolved from left to right.

Linear Supertypes
SynapseMLLogging, ComplexParamsWritable, MLWritable, Wrappable, RWrappable, PythonWrappable, BaseWrappable, HasOutputCol, HasInputCol, Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. TextPreprocessor
  2. SynapseMLLogging
  3. ComplexParamsWritable
  4. MLWritable
  5. Wrappable
  6. RWrappable
  7. PythonWrappable
  8. BaseWrappable
  9. HasOutputCol
  10. HasInputCol
  11. Transformer
  12. PipelineStage
  13. Logging
  14. Params
  15. Serializable
  16. Serializable
  17. Identifiable
  18. AnyRef
  19. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new TextPreprocessor()
  2. new TextPreprocessor(uid: String)

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def $[T](param: Param[T]): T
    Attributes
    protected
    Definition Classes
    Params
  4. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  5. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  6. lazy val classNameHelper: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  7. final def clear(param: Param[_]): TextPreprocessor.this.type
    Definition Classes
    Params
  8. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  9. def companionModelClassName: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  10. def copy(extra: ParamMap): TextPreprocessor
    Definition Classes
    TextPreprocessor → Transformer → PipelineStage → Params
  11. def copyValues[T <: Params](to: T, extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  12. lazy val copyrightLines: String
    Attributes
    protected
    Definition Classes
    BaseWrappable
  13. final def defaultCopy[T <: Params](extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  14. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  15. def equals(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  16. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  17. def explainParams(): String
    Definition Classes
    Params
  18. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  19. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  20. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  21. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  22. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  23. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  24. def getInputCol: String

    Definition Classes
    HasInputCol
  25. def getMap: Map[String, String]

  26. def getNormFunc: String

  27. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  28. def getOutputCol: String

    Definition Classes
    HasOutputCol
  29. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  30. def getParamInfo(p: Param[_]): ParamInfo[_]
    Definition Classes
    BaseWrappable
  31. def getPayload(methodName: String, numCols: Option[Int], executionSeconds: Option[Double], exception: Option[Exception]): Map[String, String]
    Attributes
    protected
    Definition Classes
    SynapseMLLogging
  32. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  33. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  34. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  35. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  36. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  37. val inputCol: Param[String]

    The name of the input column

    Definition Classes
    HasInputCol
  38. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  39. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  40. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  41. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  42. def isValidNormFunc(normFuncName: String): Boolean
  43. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  44. def logBase(info: Map[String, String], featureName: Option[String]): Unit
    Attributes
    protected
    Definition Classes
    SynapseMLLogging
  45. def logBase(methodName: String, numCols: Option[Int], executionSeconds: Option[Double], featureName: Option[String]): Unit
    Attributes
    protected
    Definition Classes
    SynapseMLLogging
  46. def logClass(featureName: String): Unit
    Definition Classes
    SynapseMLLogging
  47. def logDebug(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  48. def logDebug(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  49. def logError(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  50. def logError(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  51. def logErrorBase(methodName: String, e: Exception): Unit
    Attributes
    protected
    Definition Classes
    SynapseMLLogging
  52. def logFit[T](f: ⇒ T, columns: Int): T
    Definition Classes
    SynapseMLLogging
  53. def logInfo(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  54. def logInfo(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  55. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  56. def logTrace(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  57. def logTrace(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  58. def logTransform[T](f: ⇒ T, columns: Int): T
    Definition Classes
    SynapseMLLogging
  59. def logVerb[T](verb: String, f: ⇒ T, columns: Option[Int] = None): T
    Definition Classes
    SynapseMLLogging
  60. def logWarning(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  61. def logWarning(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  62. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  63. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  64. val map: StringStringMapParam
  65. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  66. val normFunc: Param[String]
  67. val normFuncs: Map[String, (Char) ⇒ Char]
  68. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  69. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  70. val outputCol: Param[String]

    The name of the output column

    Definition Classes
    HasOutputCol
  71. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  72. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  73. lazy val pyClassDoc: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  74. lazy val pyClassName: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  75. def pyExtraEstimatorImports: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  76. def pyExtraEstimatorMethods: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  77. lazy val pyInheritedClasses: Seq[String]
    Attributes
    protected
    Definition Classes
    PythonWrappable
  78. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  79. lazy val pyInternalWrapper: Boolean
    Attributes
    protected
    Definition Classes
    PythonWrappable
  80. lazy val pyObjectBaseClass: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  81. def pyParamArg[T](p: Param[T]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  82. def pyParamDefault[T](p: Param[T]): Option[String]
    Attributes
    protected
    Definition Classes
    PythonWrappable
  83. def pyParamGetter(p: Param[_]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  84. def pyParamSetter(p: Param[_]): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  85. def pyParamsArgs: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  86. def pyParamsDefaults: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  87. lazy val pyParamsDefinitions: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  88. def pyParamsGetters: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  89. def pyParamsSetters: String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  90. def pythonClass(): String
    Attributes
    protected
    Definition Classes
    PythonWrappable
  91. def rClass(): String
    Attributes
    protected
    Definition Classes
    RWrappable
  92. def rDocString: String
    Attributes
    protected
    Definition Classes
    RWrappable
  93. def rExtraBodyLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  94. def rExtraInitLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  95. lazy val rFuncName: String
    Attributes
    protected
    Definition Classes
    RWrappable
  96. lazy val rInternalWrapper: Boolean
    Attributes
    protected
    Definition Classes
    RWrappable
  97. def rParamArg[T](p: Param[T]): String
    Attributes
    protected
    Definition Classes
    RWrappable
  98. def rParamsArgs: String
    Attributes
    protected
    Definition Classes
    RWrappable
  99. def rSetterLines: String
    Attributes
    protected
    Definition Classes
    RWrappable
  100. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  101. final def set(paramPair: ParamPair[_]): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  102. final def set(param: String, value: Any): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  103. final def set[T](param: Param[T], value: T): TextPreprocessor.this.type
    Definition Classes
    Params
  104. final def setDefault(paramPairs: ParamPair[_]*): TextPreprocessor.this.type
    Attributes
    protected
    Definition Classes
    Params
  105. final def setDefault[T](param: Param[T], value: T): TextPreprocessor.this.type
    Attributes
    protected[org.apache.spark.ml]
    Definition Classes
    Params
  106. def setInputCol(value: String): TextPreprocessor.this.type

    Definition Classes
    HasInputCol
  107. def setMap(value: Map[String, String]): TextPreprocessor.this.type

  108. def setNormFunc(value: String): TextPreprocessor.this.type

  109. def setOutputCol(value: String): TextPreprocessor.this.type

    Definition Classes
    HasOutputCol
  110. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  111. val thisStage: Params
    Attributes
    protected
    Definition Classes
    BaseWrappable
  112. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  113. def transform(dataset: Dataset[_]): DataFrame

    dataset

    The input dataset to be transformed

    returns

    The DataFrame that results from applying the text replacements to the input column

    Definition Classes
    TextPreprocessor → Transformer
  114. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  115. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  116. def transformSchema(schema: StructType): StructType
    Definition Classes
    TextPreprocessor → PipelineStage
  117. def transformSchema(schema: StructType, logging: Boolean): StructType
    Attributes
    protected
    Definition Classes
    PipelineStage
    Annotations
    @DeveloperApi()
  118. val uid: String
    Definition Classes
    TextPreprocessor → SynapseMLLogging → Identifiable
  119. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  120. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  121. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  122. def write: MLWriter
    Definition Classes
    ComplexParamsWritable → MLWritable

Inherited from SynapseMLLogging

Inherited from ComplexParamsWritable

Inherited from MLWritable

Inherited from Wrappable

Inherited from RWrappable

Inherited from PythonWrappable

Inherited from BaseWrappable

Inherited from HasOutputCol

Inherited from HasInputCol

Inherited from Transformer

Inherited from PipelineStage

Inherited from Logging

Inherited from Params

Inherited from Serializable

Inherited from Serializable

Inherited from Identifiable

Inherited from AnyRef

Inherited from Any

getParam

param

setParam

Ungrouped