Packages

c

com.microsoft.azure.synapse.ml.io.binary

BinaryFileFormat

class BinaryFileFormat extends TextBasedFileFormat with DataSourceRegister

File format used for Structured Streaming of binary files.

Linear Supertypes
DataSourceRegister, TextBasedFileFormat, FileFormat, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. BinaryFileFormat
  2. DataSourceRegister
  3. TextBasedFileFormat
  4. FileFormat
  5. AnyRef
  6. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new BinaryFileFormat()

Value Members

  1. def buildReader(sparkSession: SparkSession, dataSchema: StructType, partitionSchema: StructType, requiredSchema: StructType, filters: Seq[Filter], options: Map[String, String], hadoopConf: Configuration): (PartitionedFile) ⇒ Iterator[InternalRow]
    Definition Classes
    BinaryFileFormat → FileFormat
  2. def buildReaderWithPartitionValues(sparkSession: SparkSession, dataSchema: StructType, partitionSchema: StructType, requiredSchema: StructType, filters: Seq[Filter], options: Map[String, String], hadoopConf: Configuration): (PartitionedFile) ⇒ Iterator[InternalRow]
    Definition Classes
    FileFormat
  3. def equals(other: Any): Boolean
    Definition Classes
    BinaryFileFormat → AnyRef → Any
  4. def hashCode(): Int
    Definition Classes
    BinaryFileFormat → AnyRef → Any
  5. def inferSchema(sparkSession: SparkSession, options: Map[String, String], files: Seq[FileStatus]): Option[StructType]
    Definition Classes
    BinaryFileFormat → FileFormat
  6. def isSplitable(sparkSession: SparkSession, options: Map[String, String], path: Path): Boolean
    Definition Classes
    BinaryFileFormat → TextBasedFileFormat → FileFormat
  7. def prepareWrite(sparkSession: SparkSession, job: Job, options: Map[String, String], dataSchema: StructType): OutputWriterFactory
    Definition Classes
    BinaryFileFormat → FileFormat
  8. def shortName(): String
    Definition Classes
    BinaryFileFormat → DataSourceRegister
  9. def supportBatch(sparkSession: SparkSession, dataSchema: StructType): Boolean
    Definition Classes
    FileFormat
  10. def supportDataType(dataType: DataType): Boolean
    Definition Classes
    FileFormat
  11. def supportFieldName(name: String): Boolean
    Definition Classes
    FileFormat
  12. def toString(): String
    Definition Classes
    BinaryFileFormat → AnyRef → Any
  13. def vectorTypes(requiredSchema: StructType, partitionSchema: StructType, sqlConf: SQLConf): Option[Seq[String]]
    Definition Classes
    FileFormat