FileStreamSinkLog

Instance Constructors

new FileStreamSinkLog(sparkSession: SparkSession, path: String)

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def add(batchId: Long, logs: Seq[SinkFileStatus]): Boolean

Store the metadata for the specified batchId and return true if successful. If the batchId's metadata has already been stored, this method will return false.
Note that this method must be called on an org.apache.spark.util.UninterruptibleThread so that interrupts can be disabled while writing the batch file. This is because there is a potential deadlock in Hadoop "Shell.runCommand" before 2.5.0 (HADOOP-10622). If the thread running "Shell.runCommand" is interrupted, then the thread can get deadlocked. In our case, writeBatch creates a file using the HDFS API and calls "Shell.runCommand" to set the file permissions, and can get deadlocked if the stream execution thread is stopped by an interrupt. Hence, we make sure that this method is called on UninterruptibleThread, which allows us to disable interrupts here. Also see SPARK-14131.

Definition Classes
FileStreamSinkLog → HDFSMetadataLog → MetadataLog
def allFiles(): Array[SinkFileStatus]

Returns all files except the deleted ones.
final def asInstanceOf[T0]: T0

Definition Classes
Any
def batchIdToPath(batchId: Long): Path

Definition Classes
FileStreamSinkLog → HDFSMetadataLog
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
def deserialize(bytes: Array[Byte]): Seq[SinkFileStatus]

Definition Classes
FileStreamSinkLog → HDFSMetadataLog
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
val fileManager: FileManager

Attributes
protected
Definition Classes
HDFSMetadataLog
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
def get(startId: Option[Long], endId: Option[Long]): Array[(Long, Seq[SinkFileStatus])]

Return metadata for batches between startId (inclusive) and endId (inclusive). If startId is None, just return all batches before endId (inclusive).

Definition Classes
HDFSMetadataLog → MetadataLog
def get(batchId: Long): Option[Seq[SinkFileStatus]]

Return the metadata for the specified batchId if it's stored. Otherwise, return None.

Definition Classes
HDFSMetadataLog → MetadataLog
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def getLatest(): Option[(Long, Seq[SinkFileStatus])]

Return the latest batch ID and its metadata, if any exist.

Definition Classes
HDFSMetadataLog → MetadataLog
def hashCode(): Int

Definition Classes
AnyRef → Any
def initializeLogIfNecessary(isInterpreter: Boolean): Unit

Attributes
protected
Definition Classes
Logging
def isBatchFile(path: Path): Boolean

Definition Classes
FileStreamSinkLog → HDFSMetadataLog
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def isTraceEnabled(): Boolean

Attributes
protected
Definition Classes
Logging
def log: Logger

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logDebug(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logError(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logInfo(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logName: String

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logTrace(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String, throwable: Throwable): Unit

Attributes
protected
Definition Classes
Logging
def logWarning(msg: ⇒ String): Unit

Attributes
protected
Definition Classes
Logging
val metadataPath: Path

Definition Classes
HDFSMetadataLog
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
def pathToBatchId(path: Path): Long

Definition Classes
FileStreamSinkLog → HDFSMetadataLog
def serialize(logData: Seq[SinkFileStatus]): Array[Byte]

Definition Classes
FileStreamSinkLog → HDFSMetadataLog
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

Related Docs: object FileStreamSinkLog | package streaming

class FileStreamSinkLog extends HDFSMetadataLog[Seq[SinkFileStatus]]

Instance Constructors

new FileStreamSinkLog(sparkSession: SparkSession, path: String)

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

def add(batchId: Long, logs: Seq[SinkFileStatus]): Boolean

def allFiles(): Array[SinkFileStatus]

final def asInstanceOf[T0]: T0

def batchIdToPath(batchId: Long): Path

def clone(): AnyRef

def deserialize(bytes: Array[Byte]): Seq[SinkFileStatus]

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

val fileManager: FileManager

def finalize(): Unit

def get(startId: Option[Long], endId: Option[Long]): Array[(Long, Seq[SinkFileStatus])]

def get(batchId: Long): Option[Seq[SinkFileStatus]]

final def getClass(): Class[_]

def getLatest(): Option[(Long, Seq[SinkFileStatus])]

def hashCode(): Int

def initializeLogIfNecessary(isInterpreter: Boolean): Unit

def isBatchFile(path: Path): Boolean

final def isInstanceOf[T0]: Boolean

def isTraceEnabled(): Boolean

def log: Logger

def logDebug(msg: ⇒ String, throwable: Throwable): Unit

def logDebug(msg: ⇒ String): Unit

def logError(msg: ⇒ String, throwable: Throwable): Unit

def logError(msg: ⇒ String): Unit

def logInfo(msg: ⇒ String, throwable: Throwable): Unit

def logInfo(msg: ⇒ String): Unit

def logName: String

def logTrace(msg: ⇒ String, throwable: Throwable): Unit

def logTrace(msg: ⇒ String): Unit

def logWarning(msg: ⇒ String, throwable: Throwable): Unit

def logWarning(msg: ⇒ String): Unit

val metadataPath: Path

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

def pathToBatchId(path: Path): Long

def serialize(logData: Seq[SinkFileStatus]): Array[Byte]

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from HDFSMetadataLog[Seq[SinkFileStatus]]

Inherited from Logging

Inherited from MetadataLog[Seq[SinkFileStatus]]

Inherited from AnyRef

Inherited from Any

Ungrouped