Construct an RDD[Point3D] from any data source registered in Spark.
For more information about available official connectors:
https://spark-packages.org/?q=tags%3A%22Data%20Sources%22
That currently includes: CSV, JSON, TXT, FITS, ROOT, HDF5, Avro, Parquet...
// Here is an example with a CSV file containing
// 3 spherical coordinates columns labeled Z_COSMO,RA,Dec.

// Filename
val fn = "path/to/file.csv"
// Spark datasource
val format = "csv"
// Options to pass to the DataFrameReader - optional
val options = Map("header" -> "true")
// Load the data as RDD[Point3D]
val rdd = new Point3DRDD(spark, fn, "Z_COSMO,RA,Dec", true, format, options)
: (SparkSession) The Spark session.
: (String) File name where the data is stored.
: (String) Comma-separated names of (x, y, z) columns. Example: "Z_COSMO,RA,Dec".
: (Boolean) If true, it assumes that the coordinates of the Point3D are (r, theta, phi). Otherwise, it assumes cartesian coordinates (x, y, z).
: (String) The name of the data source as registered in Spark. For example: "csv", "json", "parquet", ...
: (Map[String, String]) Options to pass to the DataFrameReader. Default is no options.
(RDD[Point3D])
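The same constructor works with any other registered format. Below is a minimal sketch, assuming a Parquet file containing the same three spherical coordinate columns; the path and column names are purely illustrative.

// A Parquet file is self-describing, so no reader options are needed here.
val fnParquet = "path/to/file.parquet"
// Load the data as RDD[Point3D], using the "parquet" data source.
val rddFromParquet = new Point3DRDD(
  spark, fnParquet, "Z_COSMO,RA,Dec", true, "parquet", Map.empty[String, String])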
Point3DRDDFromV2 version suitable for py4j.
Note that pyspark works with Python wrappers around the *Java* version
of Spark objects, not around the *Scala* version of Spark objects.
Therefore, on the Scala side we call the method
Point3DRDDFromV2PythonHelper, a modified version of Point3DRDDFromV2
whose options argument is a java.util.HashMap, so that it connects
smoothly to a dictionary on the Python side.
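As a rough illustration only (not the library's actual code), such a helper essentially converts the incoming java.util.HashMap into an immutable Scala Map before delegating; the signature below is an assumption, and Point3D / Point3DRDDFromV2 are the library entry points named above.

import scala.collection.JavaConverters._
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.SparkSession

// Hypothetical sketch of a py4j-friendly wrapper: convert the Java HashMap
// handed over by py4j (built from a Python dict) into a Scala Map, then
// delegate to the regular Scala entry point.
def Point3DRDDFromV2PythonHelper(
    spark: SparkSession, fn: String, colnames: String,
    isSpherical: Boolean, format: String,
    options: java.util.HashMap[String, String]): RDD[Point3D] = {
  Point3DRDDFromV2(spark, fn, colnames, isSpherical, format, options.asScala.toMap)
}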
Construct an RDD[ShellEnvelope] from any data source registered in Spark.
For more information about available official connectors:
https://spark-packages.org/?q=tags%3A%22Data%20Sources%22
That currently includes: CSV, JSON, TXT, FITS, ROOT, HDF5, Avro, Parquet...
// Here is an example with a CSV file containing
// 3 cartesian coordinates + 1 radius columns labeled x,y,z,radius.

// Filename
val fn = "path/to/file.csv"
// Spark datasource
val format = "csv"
// Options to pass to the DataFrameReader - optional
val options = Map("header" -> "true")
// Load the data as RDD[ShellEnvelope]
// (the columns are cartesian, so the spherical flag is set to false)
val rdd = new SphereRDD(spark, fn, "x,y,z,radius", false, format, options)
: (SparkSession) The Spark session.
: (String) File name where the data is stored. Extension must be explicitly written (.csv, .json, or .txt).
: (String) Comma-separated names of (x, y, z, r) columns to read. Example: "Z_COSMO,RA,Dec,Radius".
: (Boolean) If true, it assumes that the coordinates of the center of the ShellEnvelope are (r, theta, phi). Otherwise, it assumes cartesian coordinates (x, y, z). Default is false.
: (String) The name of the data source as registered in Spark. For example: "csv", "json", "parquet", ...
: (Map[String, String]) Options to pass to the DataFrameReader. Default is no options.
(RDD[ShellEnvelope])
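As another sketch, here is how the same loader might read sphere centers from a FITS file. This assumes the spark-fits connector is available on the classpath; the "fits" format name and the "hdu" option belong to that connector and are stated here as assumptions, and the path and column names are illustrative.

// Hedged example: loading cartesian centers + radius from a FITS table.
// The "fits" short name and the "hdu" option are assumed from the
// spark-fits connector; adapt them to the connector you actually use.
val fnFits = "path/to/file.fits"
val fitsOptions = Map("hdu" -> "1")
// Load the data as RDD[ShellEnvelope] (cartesian centers, so false)
val rddFromFits = new SphereRDD(spark, fnFits, "x,y,z,radius", false, "fits", fitsOptions)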
SphereRDDFromV2 version suitable for py4j.
Note that pyspark works with Python wrappers around the *Java* version
of Spark objects, not around the *Scala* version of Spark objects.
Therefore, on the Scala side we call the method
SphereRDDFromV2PythonHelper, a modified version of SphereRDDFromV2
whose options argument is a java.util.HashMap, so that it connects
smoothly to a dictionary on the Python side.
Put here routines to load data for a specific data format. Currently available: all Spark DataSource V2 compatible formats, i.e. CSV, JSON, TXT, Avro, Parquet, FITS, HDF5, ROOT (<= 6.11), ...
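These loaders presumably sit on top of Spark's standard DataFrameReader, which is what makes any registered data source usable. A minimal, generic sketch of that pattern is shown below; the format string and options are placeholders, not values from the library.

import org.apache.spark.sql.{DataFrame, SparkSession}

// Generic DataFrameReader pattern behind DataSource-compatible loading:
// any registered format is read with the same three calls.
def loadAsDataFrame(
    spark: SparkSession, fn: String, format: String,
    options: Map[String, String]): DataFrame = {
  spark.read
    .format(format)   // e.g. "csv", "json", "parquet", ...
    .options(options) // connector-specific options; may be empty
    .load(fn)
}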