This is slightly different from Scala's this.type. this.type is the unique singleton type of an object, which is not compatible with other instances of the same type, so returning anything other than this is not really possible without lying to the compiler via explicit casts. Here SelfType is used to return a copy of the object: a different instance of the same type.
Maps each row into an object of a different type using the provided function, taking column value(s) as argument(s). Can be used to convert each row to a tuple or a case class object:
sc.cassandraTable("ks", "table")
  .select("column1")
  .as((s: String) => s)          // yields CassandraRDD[String]

sc.cassandraTable("ks", "table")
  .select("column1", "column2")
  .as((_: String, _: Long))      // yields CassandraRDD[(String, Long)]

case class MyRow(key: String, value: Long)
sc.cassandraTable("ks", "table")
  .select("column1", "column2")
  .as(MyRow)                     // yields CassandraRDD[MyRow]
This method will create the RowWriter required before the RDD is serialized. This is called during getPartitions.
Adds a CQL ORDER BY clause to the query.
It can be applied only when there are clustering columns and a primary key predicate is pushed down in where.
It is useful when the default direction of ordering rows within a single Cassandra partition
needs to be changed.
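As a sketch, assuming a hypothetical table ks.events with partition key key and clustering column time; withDescOrder is the connector's order-reversing modifier, but verify it against your connector version:

```scala
// Hypothetical schema:
//   CREATE TABLE ks.events (key text, time timestamp, value double,
//                           PRIMARY KEY (key, time))
sc.cassandraTable("ks", "events")
  .where("key = ?", "sensor-1") // primary key predicate pushed down
  .withDescOrder                // newest rows first within the partition
```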
When computing a CassandraPartitionKeyRDD, the data is selected via single CQL statements from the specified C* keyspace and table. This will be performed on whatever data is available in the previous RDD in the chain.
Allows this RDD to be copied while changing some of its properties.
Uses the data from the RDD to join with a Cassandra table without retrieving the entire table.
Any RDD that can be used with saveToCassandra can be used with joinWithCassandra, as can any RDD that specifies only the partition key of a Cassandra table. This method executes single-partition requests against the Cassandra table and accepts the functional modifiers that a normal com.datastax.spark.connector.rdd.CassandraTableScanRDD takes.
By default this method uses only the partition key for joining, but any combination of columns acceptable to C* can be used in the join. Specify columns with the joinColumns parameter or the on() method.
Example With Prior Repartitioning:
val source = sc.parallelize(keys).map(x => new KVRow(x))
val repart = source.repartitionByCassandraReplica(keyspace, tableName, 10)
val someCass = repart.joinWithCassandraTable(keyspace, tableName)
Example Joining on Clustering Columns:
val source = sc.parallelize(keys).map(x => (x, x * 100))
val someCass = source.joinWithCassandraTable(keyspace, wideTable).on(SomeColumns("key", "group"))
Keys every row in the RDD with the IP addresses of all the Cassandra nodes which contain a replica of the data specified by that row. The calling RDD must have rows that can be converted into the partition key of the given Cassandra table.
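A hedged sketch, assuming a keyspace ks and a table kv whose partition key matches the rows of an existing RDD rdd; the exact return type may vary across connector versions:

```scala
// Each element is keyed by the set of replica addresses holding its data.
val keyed = rdd.keyByCassandraReplica("ks", "kv")
// e.g. RDD[(Set[java.net.InetAddress], RowType)]
```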
Adds the limit clause to the CQL SELECT statement. The limit will be applied for each created Spark partition. In other words, unless the data is fetched from a single Cassandra partition, the number of results is unpredictable.
The main purpose of passing a limit clause is to fetch the top n rows from a single Cassandra partition, when the table is designed so that it uses clustering keys and a partition key predicate is passed to the where clause.
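A sketch of this top-n pattern; the table and column names are assumptions:

```scala
// Hypothetical schema: PRIMARY KEY (user_id, ts) with ts clustered descending.
// Restricting the query to one Cassandra partition makes limit(10) a true top 10.
sc.cassandraTable("ks", "user_events")
  .where("user_id = ?", "u-42") // single-partition predicate pushed down
  .limit(10)                    // at most 10 rows, taken in clustering order
```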
Filters currently selected set of columns with a new set of columns
Repartitions the data (via a shuffle) based upon the replication of the given keyspaceName and tableName.
Calling this method before using joinWithCassandraTable will ensure that requests will be coordinator-local. partitionsPerHost controls the number of Spark partitions that will be created in this repartitioning event.
The calling RDD must have rows that can be converted into the partition key of the given Cassandra Table.
RowReaderFactory and ClassTag should be provided from implicit parameters in the constructor of the class implementing this trait
CassandraTableScanRDD
Saves the data from the RDD to a new table with a definition taken from the ColumnMapper for this class.
the keyspace in which to create a new table
name of the table to create; the table must not exist
Selects the columns to save data to. Uses only the unique column names, and you must select at least all primary key columns. All other fields are discarded. Non-selected property/column names are left unchanged. This parameter does not affect table creation.
additional configuration object allowing to set consistency level, batch size, etc.
optional, implicit connector to Cassandra
factory for obtaining the row writer to be used to extract column values
from items of the RDD
a column mapper determining the definition of the table
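A minimal sketch; the keyspace, table name, and case class are assumptions:

```scala
import com.datastax.spark.connector._

case class WordCount(word: String, count: Long)

val rdd = sc.parallelize(Seq(WordCount("foo", 20), WordCount("bar", 1)))
// Derives the table definition from the ColumnMapper for WordCount,
// creates ks.words, then writes the rows.
rdd.saveAsCassandraTable("ks", "words")
```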
Saves the data from the RDD to a new table defined by the given TableDef.
First it creates a new table with all columns from the TableDef
and then it saves RDD content in the same way as saveToCassandra.
The table must not exist prior to this call.
table definition used to create a new table
Selects the columns to save data to. Uses only the unique column names, and you must select at least all primary key columns. All other fields are discarded. Non-selected property/column names are left unchanged. This parameter does not affect table creation.
additional configuration object allowing to set consistency level, batch size, etc.
optional, implicit connector to Cassandra
factory for obtaining the row writer to be used to extract column values
from items of the RDD
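A hedged sketch building a TableDef by hand; the names, types, and exact TableDef constructor signature are assumptions that may differ across connector versions:

```scala
import com.datastax.spark.connector._
import com.datastax.spark.connector.cql.{ColumnDef, PartitionKeyColumn, RegularColumn, TableDef}
import com.datastax.spark.connector.types.{IntType, TextType}

// Hypothetical target: words(word text PRIMARY KEY, count int)
val table = TableDef(
  "ks", "words",
  partitionKey      = Seq(ColumnDef("word", PartitionKeyColumn, TextType)),
  clusteringColumns = Seq.empty,
  regularColumns    = Seq(ColumnDef("count", RegularColumn, IntType)))

sc.parallelize(Seq(("foo", 20), ("bar", 1)))
  .saveAsCassandraTableEx(table, SomeColumns("word", "count"))
```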
Saves the data from the RDD to a Cassandra table. Uses the specified column names.
the name of the Keyspace to use
the name of the Table to use
additional configuration object allowing to set consistency level, batch size, etc.
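A minimal sketch, assuming a table ks.kv with columns key text and value int:

```scala
import com.datastax.spark.connector._

sc.parallelize(Seq(("cat", 30), ("fox", 40)))
  .saveToCassandra("ks", "kv", SomeColumns("key", "value"))
```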
Narrows down the selected set of columns.
Use this for better performance when you don't need all the columns in the result RDD. When called multiple times, it selects a subset of the already selected columns, so once a column has been removed by a previous select call, it is not possible to add it back.
The selected columns are NamedColumnRef instances. This type allows specifying columns for straightforward retrieval as well as reading the TTL or write time of regular columns. Implicit conversions included in the com.datastax.spark.connector package make it possible to provide just column names (which is also backward compatible) and optionally add a .ttl or .writeTime suffix in order to create an appropriate NamedColumnRef instance.
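A sketch of the suffix selectors; the table and column names are assumptions:

```scala
import com.datastax.spark.connector._

sc.cassandraTable("ks", "kv")
  .select("key", "value", "value".ttl, "value".writeTime)
// each row then carries the value column plus its TTL and write time
```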
Returns the names of columns to be selected from the table.
Applies a function to each item, and groups consecutive items having the same value together.
Unlike groupBy, items from the same group must already be next to each other in the original collection. Works locally on each partition, so items from different partitions will never be placed in the same group.
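The per-partition grouping semantics can be illustrated in plain Scala; this is only a local analogue, not the connector's implementation:

```scala
// Groups consecutive elements mapping to the same key, the way spanBy
// groups rows within a single Spark partition.
def spanLocally[T, K](items: Seq[T])(f: T => K): List[(K, List[T])] =
  items.foldRight(List.empty[(K, List[T])]) {
    case (item, (k, group) :: rest) if f(item) == k => (k, item :: group) :: rest
    case (item, acc)                                => (f(item), List(item)) :: acc
  }

spanLocally(Seq(1, 1, 2, 2, 1))(identity)
// → List((1, List(1, 1)), (2, List(2, 2)), (1, List(1)))
```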
Groups items with the same key, assuming the items with the same key are next to each other in the collection. It does not perform a shuffle, therefore it is much faster than using the much more universal Spark RDD groupByKey. For this method to be useful with Cassandra tables, the key must represent a prefix of the primary key, containing at least the partition key of the Cassandra table.
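A hedged sketch, assuming a table whose primary key starts with (key, group) so the String key is a valid primary key prefix:

```scala
import com.datastax.spark.connector._

sc.cassandraTable("ks", "events")
  .select("key", "group", "value")
  .as((k: String, g: Int, v: Double) => (k, (g, v)))
  .spanByKey
// groups per key without a shuffle, e.g. RDD[(String, Seq[(Int, Double)])]
```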
Checks for the existence of the keyspace, table, and columns, and whether the number of selected columns corresponds to the number of columns expected by the target type constructor. If successful, does nothing; otherwise throws an appropriate IOException or AssertionError.
Adds CQL WHERE predicate(s) to the query.
Useful for leveraging secondary indexes in Cassandra.
Implicitly adds an ALLOW FILTERING clause to the WHERE clause; beware, however, that some predicates may be rejected by Cassandra, particularly when they filter on an unindexed, non-clustering column.
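A brief sketch; the table and predicate are assumptions:

```scala
sc.cassandraTable("ks", "users")
  .where("name = ?", "Anna") // secondary-index or clustering predicate pushed down
```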
Returns a copy of this Cassandra RDD with the specified connector.
Allows setting a custom read configuration, e.g. consistency level or fetch size.
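A sketch; the ReadConf parameter names follow the connector's API but may differ across versions:

```scala
import com.datastax.driver.core.ConsistencyLevel
import com.datastax.spark.connector.rdd.ReadConf

sc.cassandraTable("ks", "kv")
  .withReadConf(ReadConf(fetchSizeInRows = 500, consistencyLevel = ConsistencyLevel.ONE))
```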
(cassandraJoinRDD: RDDFunctions[(Left, Right)]).sparkContext
(Since version 1.0.0) use mapPartitionsWithIndex and filter
(Since version 1.0.0) use mapPartitionsWithIndex and flatMap
(Since version 1.0.0) use mapPartitionsWithIndex and foreach
(Since version 1.2.0) use TaskContext.get
(Since version 0.7.0) use mapPartitionsWithIndex
(Since version 1.0.0) use mapPartitionsWithIndex
(Since version 1.0.0) use collect
An RDD that will do a selecting join between the left RDD and the specified Cassandra table. This will perform individual selects to retrieve the rows from Cassandra and will take advantage of RDDs that have been partitioned with the com.datastax.spark.connector.rdd.partitioner.ReplicaPartitioner.