Packages

io.dataos.spark.readers.file

FileStreamInput

case class FileStreamInput(name: String, path: String, warehousePath: Option[String], catalogName: Option[String], schemaName: Option[String], tableName: Option[String], metastoreUris: Option[String], options: Option[Map[String, String]], format: Option[String], icebergCatalogType: Option[String], isMetric: Option[Boolean], schema: Option[Schema]) extends IncrementalReader with DatasourceReader with FileInputBase with Product with Serializable

Represents a file stream-based input configuration.

name

The name of the file stream input.

path

The path of the file stream input.

warehousePath

An optional warehouse path for the input.

catalogName

An optional catalog name for the input.

schemaName

An optional schema name for the input.

tableName

An optional table name for the input.

metastoreUris

An optional string representing metastore URIs for the input.

options

An optional map of options for the input.

format

An optional string representing the format of the input.

icebergCatalogType

An optional string representing the catalog type for Iceberg format.

isMetric

An optional flag indicating whether the input is for metrics.

schema

An optional Schema for the input.
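
Putting the parameters together, a configuration might be constructed as below. This is a minimal sketch: the field values (paths, names, options) are illustrative, not taken from a real deployment, and `Schema` is left unset.

```scala
import io.dataos.spark.readers.file.FileStreamInput

// Hypothetical configuration: stream CSV files from a landing directory.
// Any Option-typed field that is not needed can simply be None.
val input = FileStreamInput(
  name = "ordersStream",
  path = "/data/landing/orders",
  warehousePath = None,
  catalogName = None,
  schemaName = None,
  tableName = None,
  metastoreUris = None,
  options = Some(Map("header" -> "true")),
  format = Some("csv"),
  icebergCatalogType = None,
  isMetric = Some(false),
  schema = None
)
```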

Linear Supertypes
Serializable, Serializable, Product, Equals, FileInputBase, DatasourceReader, Reader, IncrementalReader, AnyRef, Any

Instance Constructors

  1. new FileStreamInput(name: String, path: String, warehousePath: Option[String], catalogName: Option[String], schemaName: Option[String], tableName: Option[String], metastoreUris: Option[String], options: Option[Map[String, String]], format: Option[String], icebergCatalogType: Option[String], isMetric: Option[Boolean], schema: Option[Schema])

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  4. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  5. val catalogName: Option[String]
  6. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  7. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  8. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  9. val format: Option[String]
  10. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  11. def getFormat(format: Option[String], path: String): String

    Determines the file format based on the specified format option or file path.

    format

    The optional format specified by the user.

    path

    The file path.

    returns

    The determined file format.

    Definition Classes
    FileInputBase
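
    The logic described above can be sketched as follows. This is an assumption about the behavior, not the actual implementation: an explicit `format` wins, and otherwise the format is inferred from the path's file extension (the fallback default here is hypothetical).

    ```scala
    // Sketch: explicit format takes precedence; otherwise infer from the
    // file extension of the path. The "parquet" fallback is an assumption.
    def inferFormat(format: Option[String], path: String): String =
      format.getOrElse {
        val dot = path.lastIndexOf('.')
        if (dot >= 0) path.substring(dot + 1).toLowerCase else "parquet"
      }

    inferFormat(Some("json"), "/data/in/file.csv") // "json": explicit format wins
    inferFormat(None, "/data/in/file.csv")         // "csv": inferred from extension
    ```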
  12. def getOptions(readFormat: String, options: Option[Map[String, String]]): Option[Map[String, String]]

    Retrieves the options for reading files based on the file format.

    readFormat

    The file format.

    options

    The optional user-provided options.

    returns

    The options for reading files.

    Definition Classes
    FileInputBase
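
    A common shape for this kind of method is to merge per-format defaults with the user-supplied options, letting user keys win. The sketch below illustrates that pattern; the specific default keys are assumptions, not the library's actual defaults.

    ```scala
    // Sketch: merge hypothetical per-format defaults with user options;
    // user-provided keys override the defaults.
    def mergeOptions(readFormat: String,
                     options: Option[Map[String, String]]): Option[Map[String, String]] = {
      val defaults = readFormat match {
        case "csv" => Map("header" -> "true", "inferSchema" -> "false") // assumed defaults
        case _     => Map.empty[String, String]
      }
      Some(defaults ++ options.getOrElse(Map.empty))
    }
    ```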
  13. def getSchemaStruct(schema: Option[Schema], sparkSession: SparkSession): Option[StructType]

    Retrieves the schema structure based on the provided schema path, schema string, and schema type.

    schema

    Schema info

    sparkSession

    The Spark session.

    returns

    The schema structure as a StructType.

    Definition Classes
    FileInputBase
  14. def getTable: String

    Generates the fully qualified table name in the format: catalogName.schemaName.tableName.

    returns

    The fully qualified table name.

  15. val icebergCatalogType: Option[String]
  16. def isHiveCatalog(format: String): Boolean

    Checks if the specified file format corresponds to a Hive catalog.

    format

    The file format.

    returns

    true if the format corresponds to a Hive catalog, false otherwise.
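
    As a rough sketch of such a predicate: a format maps to a Hive catalog when it is a metastore-backed table format. Treating only `"iceberg"` this way is an assumption for illustration, not the library's actual rule.

    ```scala
    // Sketch: a format is Hive-catalog-backed when it is a table format
    // that uses a metastore ("iceberg" here is an assumed example).
    def usesHiveCatalog(format: String): Boolean =
      format.toLowerCase == "iceberg"
    ```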

  17. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  18. val isMetric: Option[Boolean]
  19. val metastoreUris: Option[String]
  20. val name: String

    The name of the data reader.

    Definition Classes
    FileStreamInput → Reader
  21. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  22. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  23. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  24. val options: Option[Map[String, String]]
  25. val path: String
  26. def persistIncrementalState(): Unit

    Persists the incremental state if any.

    Definition Classes
    IncrementalReader
  27. def read(sparkSession: SparkSession): DataFrame

    Reads the file stream using the specified SparkSession and returns the resulting DataFrame.

    sparkSession

    The SparkSession.

    returns

    The DataFrame containing the read data.

    Definition Classes
    FileStreamInput → Reader
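
    For orientation, a file-stream read in Spark is typically issued through the Structured Streaming API as sketched below. This shows the general pattern only, not the internals of `read()`; the helper name and parameters are hypothetical.

    ```scala
    import org.apache.spark.sql.{DataFrame, SparkSession}

    // Sketch of how a streaming file read is usually expressed with
    // Spark Structured Streaming (format, options, then load the path).
    def readStreamSketch(spark: SparkSession,
                         path: String,
                         fmt: String,
                         opts: Map[String, String]): DataFrame =
      spark.readStream
        .format(fmt)
        .options(opts)
        .load(path)
    ```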
  28. def readIncremental(df: DataFrame, incremental: Option[Incremental]): DataFrame

    Reads data from a DataFrame with optional incremental settings.

    df

    The DataFrame to read data from.

    incremental

    Optional Incremental settings to apply.

    returns

    A new DataFrame after applying incremental settings if provided, otherwise the original DataFrame.

    Definition Classes
    IncrementalReader
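
    The Option-handling pattern described here can be sketched as follows. `IncrementalLike` and its `condition` field are hypothetical stand-ins for the real `Incremental` type, which is not shown in this page.

    ```scala
    import org.apache.spark.sql.DataFrame

    // Hypothetical stand-in for the Incremental settings type.
    case class IncrementalLike(condition: String)

    // Sketch: apply incremental settings when present, otherwise
    // return the DataFrame unchanged.
    def applyIncremental(df: DataFrame, incremental: Option[IncrementalLike]): DataFrame =
      incremental.fold(df)(inc => df.where(inc.condition))
    ```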
  29. val schema: Option[Schema]
  30. val schemaName: Option[String]
  31. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  32. val tableName: Option[String]
  33. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  34. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  35. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  36. val warehousePath: Option[String]

Inherited from Serializable

Inherited from Serializable

Inherited from Product

Inherited from Equals

Inherited from FileInputBase

Inherited from DatasourceReader

Inherited from Reader

Inherited from IncrementalReader

Inherited from AnyRef

Inherited from Any
