org.apache.spark.rdd

Type Members

class AsyncRDDActions[T] extends Serializable with Logging

A set of asynchronous RDD actions available through an implicit conversion.
class CoGroupedRDD[K] extends RDD[(K, Seq[Seq[_]])]

An RDD that cogroups its parents.
class CoalescedRDD[T] extends RDD[T]

Represents a coalesced RDD that has fewer partitions than its parent RDD. This class uses the PartitionCoalescer class to find a good partitioning of the parent RDD, so that each new partition has roughly the same number of parent partitions and the preferred location of each new partition overlaps with as many preferred locations of its parent partitions as possible.
case class CoalescedRDDPartition(index: Int, rdd: org.apache.spark.rdd.RDD[_], parentsIndices: Array[Int], preferredLocation: String) extends Partition with Product with Serializable

Class that captures a coalesced RDD by essentially keeping track of parent partitions.
class DoubleRDDFunctions extends Logging with Serializable

Extra functions available on RDDs of Doubles through an implicit conversion.
class EmptyRDD[T] extends RDD[T]

An RDD that is empty, i.e. has no element in it.
class HadoopRDD[K, V] extends RDD[(K, V)] with Logging

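An RDD that provides core functionality for reading data stored in Hadoop (e.g., files in HDFS, sources in HBase, or S3), using the older MapReduce API (org.apache.hadoop.mapred).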
class JdbcRDD[T] extends RDD[T] with Logging

An RDD that executes an SQL query on a JDBC connection and reads results.
class NewHadoopRDD[K, V] extends RDD[(K, V)] with SparkHadoopMapReduceUtil with Logging
class OrderedRDDFunctions[K, V, P <: Product2[K, V]] extends Logging with Serializable

Extra functions available on RDDs of (key, value) pairs where the key is sortable through an implicit conversion.
class PairRDDFunctions[K, V] extends Logging with SparkHadoopMapReduceUtil with Serializable

Extra functions available on RDDs of (key, value) pairs through an implicit conversion.
class PartitionPruningRDD[T] extends RDD[T]

An RDD used to prune RDD partitions so we can avoid launching tasks on all partitions.
class PartitionPruningRDDPartition extends Partition
class PipedRDD[T] extends RDD[String]

An RDD that pipes the contents of each parent partition through an external command (printing them one per line) and returns the output as a collection of strings.
class PruneDependency[T] extends NarrowDependency[T]

Represents a dependency between the PartitionPruningRDD and its parent.
abstract class RDD[T] extends Serializable with Logging

A Resilient Distributed Dataset (RDD), the basic abstraction in Spark.
class SampledRDD[T] extends RDD[T]
class SequenceFileRDDFunctions[K, V] extends Logging with Serializable

Extra functions available on RDDs of (key, value) pairs to create a Hadoop SequenceFile, through an implicit conversion.
class ShuffledRDD[K, V, P <: Product2[K, V]] extends RDD[P]

The resulting RDD from a shuffle (e.g. repartitioning of data).
class UnionRDD[T] extends RDD[T]
abstract class ZippedPartitionsBaseRDD[V] extends RDD[V]
class ZippedPartitionsRDD2[A, B, V] extends ZippedPartitionsBaseRDD[V]
class ZippedPartitionsRDD3[A, B, C, V] extends ZippedPartitionsBaseRDD[V]
class ZippedPartitionsRDD4[A, B, C, D, V] extends ZippedPartitionsBaseRDD[V]
class ZippedRDD[T, U] extends RDD[(T, U)]

Value Members

object JdbcRDD extends Serializable
object PartitionPruningRDD extends Serializable
object PipedRDD extends Serializable

rdd

package rdd

Type Members

class AsyncRDDActions[T] extends Serializable with Logging

class CoGroupedRDD[K] extends RDD[(K, Seq[Seq[_]])]

class CoalescedRDD[T] extends RDD[T]

case class CoalescedRDDPartition(index: Int, rdd: org.apache.spark.rdd.RDD[_], parentsIndices: Array[Int], preferredLocation: String) extends Partition with Product with Serializable

class DoubleRDDFunctions extends Logging with Serializable

class EmptyRDD[T] extends RDD[T]

class HadoopRDD[K, V] extends RDD[(K, V)] with Logging

class JdbcRDD[T] extends RDD[T] with Logging

class NewHadoopRDD[K, V] extends RDD[(K, V)] with SparkHadoopMapReduceUtil with Logging

class OrderedRDDFunctions[K, V, P <: Product2[K, V]] extends Logging with Serializable

class PairRDDFunctions[K, V] extends Logging with SparkHadoopMapReduceUtil with Serializable

class PartitionPruningRDD[T] extends RDD[T]

class PartitionPruningRDDPartition extends Partition

class PipedRDD[T] extends RDD[String]

class PruneDependency[T] extends NarrowDependency[T]

abstract class RDD[T] extends Serializable with Logging

class SampledRDD[T] extends RDD[T]

class SequenceFileRDDFunctions[K, V] extends Logging with Serializable

class ShuffledRDD[K, V, P <: Product2[K, V]] extends RDD[P]

class UnionRDD[T] extends RDD[T]

abstract class ZippedPartitionsBaseRDD[V] extends RDD[V]

class ZippedPartitionsRDD2[A, B, V] extends ZippedPartitionsBaseRDD[V]

class ZippedPartitionsRDD3[A, B, C, V] extends ZippedPartitionsBaseRDD[V]

class ZippedPartitionsRDD4[A, B, C, D, V] extends ZippedPartitionsBaseRDD[V]

class ZippedRDD[T, U] extends RDD[(T, U)]

Value Members

object JdbcRDD extends Serializable

object PartitionPruningRDD extends Serializable

object PipedRDD extends Serializable