Packages

t

com.microsoft.azure.synapse.ml.featurize.text

TextFeaturizerParams

trait TextFeaturizerParams extends Wrappable with DefaultParamsWritable

Linear Supertypes
DefaultParamsWritable, MLWritable, Wrappable, DotnetWrappable, RWrappable, PythonWrappable, BaseWrappable, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Known Subclasses
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. TextFeaturizerParams
  2. DefaultParamsWritable
  3. MLWritable
  4. Wrappable
  5. DotnetWrappable
  6. RWrappable
  7. PythonWrappable
  8. BaseWrappable
  9. Params
  10. Serializable
  11. Serializable
  12. Identifiable
  13. AnyRef
  14. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Abstract Value Members

  1. abstract def copy(extra: ParamMap): Params
    Definition Classes
    Params
  2. abstract val uid: String
    Definition Classes
    Identifiable

Concrete Value Members

  1. val binary: BooleanParam

    All nonzero word counts are set to 1 when set to true

  2. val caseSensitiveStopWords: BooleanParam

    Indicates whether a case sensitive comparison is performed on stop words.

  3. final def clear(param: Param[_]): TextFeaturizerParams.this.type
    Definition Classes
    Params
  4. val defaultStopWordLanguage: Param[String]

    Specify the language to use for stop word removal.

    Specify the language to use for stop word removal. Use the custom setting when using the stopWords input.

  5. def dotnetAdditionalMethods: String
    Definition Classes
    DotnetWrappable
  6. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  7. def explainParams(): String
    Definition Classes
    Params
  8. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  9. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  10. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  11. final def getBinary: Boolean

  12. final def getCaseSensitiveStopWords: Boolean

  13. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  14. final def getDefaultStopWordLanguage: String

  15. final def getMinDocFreq: Int

  16. final def getMinTokenLength: Int

  17. final def getNGramLength: Int

  18. final def getNumFeatures: Int

  19. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  20. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  21. def getParamInfo(p: Param[_]): ParamInfo[_]
    Definition Classes
    BaseWrappable
  22. final def getStopWords: String

  23. final def getToLowercase: Boolean

  24. final def getTokenizerGaps: Boolean

  25. final def getTokenizerPattern: String

  26. final def getUseIDF: Boolean

  27. final def getUseNGram: Boolean

  28. final def getUseStopWordsRemover: Boolean

  29. final def getUseTokenizer: Boolean

  30. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  31. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  32. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  33. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  34. def makeDotnetFile(conf: CodegenConfig): Unit
    Definition Classes
    DotnetWrappable
  35. def makePyFile(conf: CodegenConfig): Unit
    Definition Classes
    PythonWrappable
  36. def makeRFile(conf: CodegenConfig): Unit
    Definition Classes
    RWrappable
  37. val minDocFreq: IntParam

    Minimum number of documents in which a term should appear.

  38. val minTokenLength: IntParam

    Minimum token length; must be 0 or greater.

  39. val nGramLength: IntParam

    The size of the n-grams

  40. val numFeatures: IntParam

    Set the number of features to hash each document to

  41. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  42. def pyAdditionalMethods: String
    Definition Classes
    PythonWrappable
  43. def pyInitFunc(): String
    Definition Classes
    PythonWrappable
  44. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  45. final def set[T](param: Param[T], value: T): TextFeaturizerParams.this.type
    Definition Classes
    Params
  46. val stopWords: Param[String]

    The words to be filtered out.

    The words to be filtered out. This is a comma separated list of words, encoded as a single string. For example, "a, the, and"

  47. val toLowercase: BooleanParam

    Indicates whether to convert all characters to lowercase before tokenizing.

  48. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  49. val tokenizerGaps: BooleanParam

    Indicates whether the regex splits on gaps (true) or matches tokens (false)

  50. val tokenizerPattern: Param[String]

    Regex pattern used to match delimiters if gaps (true) or tokens (false)

  51. val useIDF: BooleanParam

    Scale the Term Frequencies by IDF when set to true

  52. val useNGram: BooleanParam

    Enumerate n-grams when set to true

  53. val useStopWordsRemover: BooleanParam

    Indicates whether to remove stop words from tokenized data.

  54. val useTokenizer: BooleanParam

    Tokenize the input when set to true

  55. def write: MLWriter
    Definition Classes
    DefaultParamsWritable → MLWritable