Packages

class PageSplitter extends Transformer with HasInputCol with HasOutputCol with Wrappable with DefaultParamsWritable with SynapseMLLogging

Splits text into chunks (pages) of at most maximumPageLength characters

Linear Supertypes
SynapseMLLogging, DefaultParamsWritable, MLWritable, Wrappable, DotnetWrappable, RWrappable, PythonWrappable, BaseWrappable, HasOutputCol, HasInputCol, Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. PageSplitter
  2. SynapseMLLogging
  3. DefaultParamsWritable
  4. MLWritable
  5. Wrappable
  6. DotnetWrappable
  7. RWrappable
  8. PythonWrappable
  9. BaseWrappable
  10. HasOutputCol
  11. HasInputCol
  12. Transformer
  13. PipelineStage
  14. Logging
  15. Params
  16. Serializable
  17. Serializable
  18. Identifiable
  19. AnyRef
  20. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new PageSplitter()
  2. new PageSplitter(uid: String)

    uid

    The id of the module

Value Members

  1. val boundaryRegex: Param[String]
  2. final def clear(param: Param[_]): PageSplitter.this.type
    Definition Classes
    Params
  3. def copy(extra: ParamMap): PageSplitter
    Definition Classes
    PageSplitter → Transformer → PipelineStage → Params
  4. def dotnetAdditionalMethods: String
    Definition Classes
    DotnetWrappable
  5. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  6. def explainParams(): String
    Definition Classes
    Params
  7. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  8. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  9. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  10. def getBoundaryRegex: String
  11. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  12. def getInputCol: String

    Definition Classes
    HasInputCol
  13. def getMaximumPageLength: Int
  14. def getMinimumPageLength: Int
  15. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  16. def getOutputCol: String

    Definition Classes
    HasOutputCol
  17. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  18. def getParamInfo(p: Param[_]): ParamInfo[_]
    Definition Classes
    BaseWrappable
  19. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  20. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  21. val inputCol: Param[String]

    The name of the input column

    Definition Classes
    HasInputCol
  22. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  23. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  24. def logClass(featureName: String): Unit
    Definition Classes
    SynapseMLLogging
  25. def logFit[T](f: ⇒ T, columns: Int): T
    Definition Classes
    SynapseMLLogging
  26. def logTransform[T](f: ⇒ T, columns: Int): T
    Definition Classes
    SynapseMLLogging
  27. def logVerb[T](verb: String, f: ⇒ T, columns: Option[Int] = None): T
    Definition Classes
    SynapseMLLogging
  28. def makeDotnetFile(conf: CodegenConfig): Unit
    Definition Classes
    DotnetWrappable
  29. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  30. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  31. val maximumPageLength: IntParam
  32. val minimumPageLength: IntParam
  33. val outputCol: Param[String]

    The name of the output column

    Definition Classes
    HasOutputCol
  34. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  35. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  36. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  37. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  38. final def set[T](param: Param[T], value: T): PageSplitter.this.type
    Definition Classes
    Params
  39. def setBoundaryRegex(v: String): PageSplitter.this.type
  40. def setInputCol(value: String): PageSplitter.this.type

    Definition Classes
    HasInputCol
  41. def setMaximumPageLength(v: Int): PageSplitter.this.type
  42. def setMinimumPageLength(v: Int): PageSplitter.this.type
  43. def setOutputCol(value: String): PageSplitter.this.type

    Definition Classes
    HasOutputCol
  44. def split(textOpt: String): Seq[String]
  45. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  46. def transform(dataset: Dataset[_]): DataFrame
    Definition Classes
    PageSplitter → Transformer
  47. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  48. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  49. def transformSchema(schema: StructType): StructType
    Definition Classes
    PageSplitter → PipelineStage
  50. val uid: String
    Definition Classes
    PageSplitter → SynapseMLLogging → Identifiable
  51. def write: MLWriter
    Definition Classes
    DefaultParamsWritable → MLWritable