: Domain name
: Schema
: stage
: Storage Handler
Function that retrieves the full metrics dataframe, combining the discrete and continuous metrics
: dataframe obtained from computeDiscretMetric() or computeContinuiousMetric()
: list of all variables
: list of columns
Dataframe : dataframe that contains the full metrics, with all variables and all metrics
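As a rough illustration of the combining step, here is a pandas sketch (the original operates on Spark DataFrames; the function and column names `full_metric`, `variableName`, `countDistinct`, `mean` are assumptions):

```python
import pandas as pd

def full_metric(discrete: pd.DataFrame, continuous: pd.DataFrame,
                variables: list, columns: list) -> pd.DataFrame:
    """Combine the discrete and continuous metrics dataframes into one,
    keeping only the requested variables and metric columns."""
    combined = pd.concat([discrete, continuous], ignore_index=True, sort=False)
    # keep rows for the requested variables only
    combined = combined[combined["variableName"].isin(variables)]
    # keep the requested metric columns that actually exist
    keep = [c for c in columns if c in combined.columns]
    return combined[keep]
```

Metrics a column does not define (e.g. `mean` for a discrete variable) simply come out as missing values in the unified frame.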
Function that builds the metrics save path
: path where metrics are stored
: path where the metrics for the specified schema are stored
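A minimal sketch of the path-building logic, assuming a `base/domain/schema` layout (the layout and the name `metrics_path` are assumptions for illustration):

```python
from pathlib import PurePosixPath

def metrics_path(base_path: str, domain: str, schema: str) -> PurePosixPath:
    """Build the directory where the metrics for a given
    domain/schema are stored."""
    return PurePosixPath(base_path) / domain / schema
```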
Partition a dataset using dataset columns. To partition the dataset using the ingestion time, use the reserved column names :
: Input dataset
: list of columns to use for partitioning.
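The partitioning step can be sketched in pandas as splitting the dataset by the distinct values of the partition columns (the original works on Spark DataFrames and additionally special-cases the reserved ingestion-time column names; `partition_dataset` as written here is an assumption):

```python
import pandas as pd

def partition_dataset(dataset: pd.DataFrame, partition_cols: list) -> dict:
    """Split a dataset into one sub-frame per distinct combination
    of the partition columns."""
    if not partition_cols:
        # no partitioning requested: single partition with everything
        return {(): dataset}
    return {key: group for key, group in dataset.groupby(partition_cols)}
```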
The Spark session used to run this job
Forces any Spark job to implement its entry point within the "run" method
: Spark session used for the job
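The pattern of forcing every job to define its entry point in "run" can be sketched with an abstract base class (the original is presumably a Scala trait; this Python version is illustrative):

```python
from abc import ABC, abstractmethod

class SparkJob(ABC):
    """Base class forcing every concrete job to implement
    its entry point in run()."""

    @abstractmethod
    def run(self):
        """Entry point of the job."""

class MyJob(SparkJob):
    def run(self):
        return "done"
```

Instantiating `SparkJob` directly fails, so a job without a `run` implementation cannot be created.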
Saves a dataset. If the path is empty (the first time metrics are computed for the schema), write directly.
If parquet files are already stored there, create a temporary directory to compute in, then flush the path and move the updated metrics into it
: dataset to be saved
: Path to save the file at
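The write-or-replace logic above can be sketched with plain filesystem operations (the original writes Spark parquet files; `save`, `_write` and the `part-0000.txt` name are assumptions for illustration):

```python
import os
import shutil
import tempfile

def _write(rows: list, directory: str) -> None:
    """Hypothetical writer standing in for the parquet write."""
    with open(os.path.join(directory, "part-0000.txt"), "w") as f:
        f.write("\n".join(map(str, rows)))

def save(rows: list, path: str) -> None:
    """Write directly if the path is empty or absent; otherwise compute
    in a temporary directory, flush the path, and move the updated
    result into place."""
    if os.path.isdir(path) and os.listdir(path):
        tmp = tempfile.mkdtemp()
        _write(rows, tmp)       # compute in a scratch location
        shutil.rmtree(path)     # flush the existing metrics
        shutil.move(tmp, path)  # move updated metrics into place
    else:
        os.makedirs(path, exist_ok=True)
        _write(rows, path)
```

Writing to a scratch directory first means the existing metrics are only removed once the updated result is fully materialized.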
Function that unifies the discrete and continuous metrics dataframes, then saves the result as parquet
: dataframe that contains all the discrete metrics
: dataframe that contains all the continuous metrics
: name of the domain
: schema of the initial data
: time corresponding to the ingestion
: stage (unit / global)
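A pandas sketch of the unify-and-tag step described above (the original unions Spark DataFrames and writes parquet; the function name and the `domain`/`schema`/`timestamp`/`stage` column names are assumptions):

```python
import pandas as pd

def unify_and_save(discrete: pd.DataFrame, continuous: pd.DataFrame,
                   domain: str, schema: str, ingestion_time: str,
                   stage: str) -> pd.DataFrame:
    """Union the discrete and continuous metrics, tag every row with
    the domain, schema, ingestion time and stage, and return the
    result ready to be written."""
    unified = pd.concat([discrete, continuous], ignore_index=True, sort=False)
    unified["domain"] = domain
    unified["schema"] = schema
    unified["timestamp"] = ingestion_time
    unified["stage"] = stage
    # the real job then writes the result, e.g. unified.to_parquet(save_path)
    return unified
```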