Packages

class PageSplitter extends Transformer with HasInputCol with HasOutputCol with Wrappable with DefaultParamsWritable with BasicLogging

Splits text into chunks of at most n characters, where n is the value of the maximumPageLength parameter.

Linear Supertypes
BasicLogging, DefaultParamsWritable, MLWritable, Wrappable, DotnetWrappable, RWrappable, PythonWrappable, BaseWrappable, HasOutputCol, HasInputCol, Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. PageSplitter
  2. BasicLogging
  3. DefaultParamsWritable
  4. MLWritable
  5. Wrappable
  6. DotnetWrappable
  7. RWrappable
  8. PythonWrappable
  9. BaseWrappable
  10. HasOutputCol
  11. HasInputCol
  12. Transformer
  13. PipelineStage
  14. Logging
  15. Params
  16. Serializable
  17. Serializable
  18. Identifiable
  19. AnyRef
  20. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new PageSplitter()
  2. new PageSplitter(uid: String)

    uid

    The id of the module

Value Members

  1. val boundaryRegex: Param[String]
  2. final def clear(param: Param[_]): PageSplitter.this.type
    Definition Classes
    Params
  3. def copy(extra: ParamMap): MultiNGram
    Definition Classes
    PageSplitter → Transformer → PipelineStage → Params
  4. def dotnetAdditionalMethods: String
    Definition Classes
    DotnetWrappable
  5. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  6. def explainParams(): String
    Definition Classes
    Params
  7. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  8. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  9. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  10. def getBoundaryRegex: String
  11. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  12. def getInputCol: String

    Definition Classes
    HasInputCol
  13. def getMaximumPageLength: Int
  14. def getMinimumPageLength: Int
  15. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  16. def getOutputCol: String

    Definition Classes
    HasOutputCol
  17. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  18. def getParamInfo(p: Param[_]): ParamInfo[_]
    Definition Classes
    BaseWrappable
  19. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  20. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  21. val inputCol: Param[String]

    The name of the input column

    The name of the input column

    Definition Classes
    HasInputCol
  22. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  23. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  24. def logClass(): Unit
    Definition Classes
    BasicLogging
  25. def logFit[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  26. def logPredict[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  27. def logTrain[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  28. def logTransform[T](f: ⇒ T): T
    Definition Classes
    BasicLogging
  29. def logVerb[T](verb: String, f: ⇒ T): T
    Definition Classes
    BasicLogging
  30. def makeDotnetFile(conf: CodegenConfig): Unit
    Definition Classes
    DotnetWrappable
  31. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  32. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  33. val maximumPageLength: IntParam
  34. val minimumPageLength: IntParam
  35. val outputCol: Param[String]

    The name of the output column

    The name of the output column

    Definition Classes
    HasOutputCol
  36. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  37. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  38. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  39. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  40. final def set[T](param: Param[T], value: T): PageSplitter.this.type
    Definition Classes
    Params
  41. def setBoundaryRegex(v: String): PageSplitter.this.type
  42. def setInputCol(value: String): PageSplitter.this.type

    Definition Classes
    HasInputCol
  43. def setMaximumPageLength(v: Int): PageSplitter.this.type
  44. def setMinimumPageLength(v: Int): PageSplitter.this.type
  45. def setOutputCol(value: String): PageSplitter.this.type

    Definition Classes
    HasOutputCol
  46. def split(textOpt: String): Seq[String]
  47. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  48. def transform(dataset: Dataset[_]): DataFrame
    Definition Classes
    PageSplitter → Transformer
  49. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  50. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  51. def transformSchema(schema: StructType): StructType
    Definition Classes
    PageSplitter → PipelineStage
  52. val uid: String
    Definition Classes
    PageSplitter → BasicLogging → Identifiable
  53. val ver: String
    Definition Classes
    BasicLogging
  54. def write: MLWriter
    Definition Classes
    DefaultParamsWritable → MLWritable