public class RandomRDDs
extends Object
Generator methods for creating RDDs comprised of i.i.d. samples from some distribution.

| Constructor and Description | 
|---|
| RandomRDDs() | 
| Modifier and Type | Method and Description | 
|---|---|
| static JavaDoubleRDD | exponentialJavaRDD(JavaSparkContext jsc,
                  double mean,
                  long size)RandomRDDs.exponentialJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | exponentialJavaRDD(JavaSparkContext jsc,
                  double mean,
                  long size,
                  int numPartitions)RandomRDDs.exponentialJavaRDDwith the default seed. | 
| static JavaDoubleRDD | exponentialJavaRDD(JavaSparkContext jsc,
                  double mean,
                  long size,
                  int numPartitions,
                  long seed)Java-friendly version of  RandomRDDs.exponentialRDD. | 
| static JavaRDD<Vector> | exponentialJavaVectorRDD(JavaSparkContext jsc,
                        double mean,
                        long numRows,
                        int numCols)RandomRDDs.exponentialJavaVectorRDDwith the default number of partitions
 and the default seed. | 
| static JavaRDD<Vector> | exponentialJavaVectorRDD(JavaSparkContext jsc,
                        double mean,
                        long numRows,
                        int numCols,
                        int numPartitions)RandomRDDs.exponentialJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | exponentialJavaVectorRDD(JavaSparkContext jsc,
                        double mean,
                        long numRows,
                        int numCols,
                        int numPartitions,
                        long seed)Java-friendly version of  RandomRDDs.exponentialVectorRDD. | 
| static RDD<Object> | exponentialRDD(SparkContext sc,
              double mean,
              long size,
              int numPartitions,
              long seed)Generates an RDD comprised of  i.i.d.samples from the exponential distribution with
 the input mean. | 
| static RDD<Vector> | exponentialVectorRDD(SparkContext sc,
                    double mean,
                    long numRows,
                    int numCols,
                    int numPartitions,
                    long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples drawn from the
 exponential distribution with the input mean. | 
| static JavaDoubleRDD | gammaJavaRDD(JavaSparkContext jsc,
            double shape,
            double scale,
            long size)RandomRDDs.gammaJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | gammaJavaRDD(JavaSparkContext jsc,
            double shape,
            double scale,
            long size,
            int numPartitions)RandomRDDs.gammaJavaRDDwith the default seed. | 
| static JavaDoubleRDD | gammaJavaRDD(JavaSparkContext jsc,
            double shape,
            double scale,
            long size,
            int numPartitions,
            long seed)Java-friendly version of  RandomRDDs.gammaRDD. | 
| static JavaRDD<Vector> | gammaJavaVectorRDD(JavaSparkContext jsc,
                  double shape,
                  double scale,
                  long numRows,
                  int numCols)RandomRDDs.gammaJavaVectorRDDwith the default number of partitions and the default seed. | 
| static JavaRDD<Vector> | gammaJavaVectorRDD(JavaSparkContext jsc,
                  double shape,
                  double scale,
                  long numRows,
                  int numCols,
                  int numPartitions)RandomRDDs.gammaJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | gammaJavaVectorRDD(JavaSparkContext jsc,
                  double shape,
                  double scale,
                  long numRows,
                  int numCols,
                  int numPartitions,
                  long seed)Java-friendly version of  RandomRDDs.gammaVectorRDD. | 
| static RDD<Object> | gammaRDD(SparkContext sc,
        double shape,
        double scale,
        long size,
        int numPartitions,
        long seed)Generates an RDD comprised of  i.i.d.samples from the gamma distribution with the input
  shape and scale. | 
| static RDD<Vector> | gammaVectorRDD(SparkContext sc,
              double shape,
              double scale,
              long numRows,
              int numCols,
              int numPartitions,
              long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples drawn from the
 gamma distribution with the input shape and scale. | 
| static JavaDoubleRDD | logNormalJavaRDD(JavaSparkContext jsc,
                double mean,
                double std,
                long size)RandomRDDs.logNormalJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | logNormalJavaRDD(JavaSparkContext jsc,
                double mean,
                double std,
                long size,
                int numPartitions)RandomRDDs.logNormalJavaRDDwith the default seed. | 
| static JavaDoubleRDD | logNormalJavaRDD(JavaSparkContext jsc,
                double mean,
                double std,
                long size,
                int numPartitions,
                long seed)Java-friendly version of  RandomRDDs.logNormalRDD. | 
| static JavaRDD<Vector> | logNormalJavaVectorRDD(JavaSparkContext jsc,
                      double mean,
                      double std,
                      long numRows,
                      int numCols)RandomRDDs.logNormalJavaVectorRDDwith the default number of partitions and
 the default seed. | 
| static JavaRDD<Vector> | logNormalJavaVectorRDD(JavaSparkContext jsc,
                      double mean,
                      double std,
                      long numRows,
                      int numCols,
                      int numPartitions)RandomRDDs.logNormalJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | logNormalJavaVectorRDD(JavaSparkContext jsc,
                      double mean,
                      double std,
                      long numRows,
                      int numCols,
                      int numPartitions,
                      long seed)Java-friendly version of  RandomRDDs.logNormalVectorRDD. | 
| static RDD<Object> | logNormalRDD(SparkContext sc,
            double mean,
            double std,
            long size,
            int numPartitions,
            long seed)Generates an RDD comprised of  i.i.d.samples from the log normal distribution with the input
  mean and standard deviation | 
| static RDD<Vector> | logNormalVectorRDD(SparkContext sc,
                  double mean,
                  double std,
                  long numRows,
                  int numCols,
                  int numPartitions,
                  long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples drawn from a
 log normal distribution. | 
| static JavaDoubleRDD | normalJavaRDD(JavaSparkContext jsc,
             long size)RandomRDDs.normalJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | normalJavaRDD(JavaSparkContext jsc,
             long size,
             int numPartitions)RandomRDDs.normalJavaRDDwith the default seed. | 
| static JavaDoubleRDD | normalJavaRDD(JavaSparkContext jsc,
             long size,
             int numPartitions,
             long seed)Java-friendly version of  RandomRDDs.normalRDD. | 
| static JavaRDD<Vector> | normalJavaVectorRDD(JavaSparkContext jsc,
                   long numRows,
                   int numCols)RandomRDDs.normalJavaVectorRDDwith the default number of partitions and the default seed. | 
| static JavaRDD<Vector> | normalJavaVectorRDD(JavaSparkContext jsc,
                   long numRows,
                   int numCols,
                   int numPartitions)RandomRDDs.normalJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | normalJavaVectorRDD(JavaSparkContext jsc,
                   long numRows,
                   int numCols,
                   int numPartitions,
                   long seed)Java-friendly version of  RandomRDDs.normalVectorRDD. | 
| static RDD<Object> | normalRDD(SparkContext sc,
         long size,
         int numPartitions,
         long seed)Generates an RDD comprised of  i.i.d.samples from the standard normal distribution. | 
| static RDD<Vector> | normalVectorRDD(SparkContext sc,
               long numRows,
               int numCols,
               int numPartitions,
               long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples drawn from the
 standard normal distribution. | 
| static JavaDoubleRDD | poissonJavaRDD(JavaSparkContext jsc,
              double mean,
              long size)RandomRDDs.poissonJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | poissonJavaRDD(JavaSparkContext jsc,
              double mean,
              long size,
              int numPartitions)RandomRDDs.poissonJavaRDDwith the default seed. | 
| static JavaDoubleRDD | poissonJavaRDD(JavaSparkContext jsc,
              double mean,
              long size,
              int numPartitions,
              long seed)Java-friendly version of  RandomRDDs.poissonRDD. | 
| static JavaRDD<Vector> | poissonJavaVectorRDD(JavaSparkContext jsc,
                    double mean,
                    long numRows,
                    int numCols)RandomRDDs.poissonJavaVectorRDDwith the default number of partitions and the default seed. | 
| static JavaRDD<Vector> | poissonJavaVectorRDD(JavaSparkContext jsc,
                    double mean,
                    long numRows,
                    int numCols,
                    int numPartitions)RandomRDDs.poissonJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | poissonJavaVectorRDD(JavaSparkContext jsc,
                    double mean,
                    long numRows,
                    int numCols,
                    int numPartitions,
                    long seed)Java-friendly version of  RandomRDDs.poissonVectorRDD. | 
| static RDD<Object> | poissonRDD(SparkContext sc,
          double mean,
          long size,
          int numPartitions,
          long seed)Generates an RDD comprised of  i.i.d.samples from the Poisson distribution with the input
 mean. | 
| static RDD<Vector> | poissonVectorRDD(SparkContext sc,
                double mean,
                long numRows,
                int numCols,
                int numPartitions,
                long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples drawn from the
 Poisson distribution with the input mean. | 
| static <T> JavaRDD<T> | randomJavaRDD(JavaSparkContext jsc,
             RandomDataGenerator<T> generator,
             long size)RandomRDDs.randomJavaRDDwith the default seed & numPartitions | 
| static <T> JavaRDD<T> | randomJavaRDD(JavaSparkContext jsc,
             RandomDataGenerator<T> generator,
             long size,
             int numPartitions)RandomRDDs.randomJavaRDDwith the default seed. | 
| static <T> JavaRDD<T> | randomJavaRDD(JavaSparkContext jsc,
             RandomDataGenerator<T> generator,
             long size,
             int numPartitions,
             long seed)Generates an RDD comprised of  i.i.d.samples produced by the input RandomDataGenerator. | 
| static JavaRDD<Vector> | randomJavaVectorRDD(JavaSparkContext jsc,
                   RandomDataGenerator<Object> generator,
                   long numRows,
                   int numCols)RandomRDDs.randomJavaVectorRDDwith the default number of partitions and the default seed. | 
| static JavaRDD<Vector> | randomJavaVectorRDD(JavaSparkContext jsc,
                   RandomDataGenerator<Object> generator,
                   long numRows,
                   int numCols,
                   int numPartitions) RandomRDDs.randomJavaVectorRDD with the default seed. | 
| static JavaRDD<Vector> | randomJavaVectorRDD(JavaSparkContext jsc,
                   RandomDataGenerator<Object> generator,
                   long numRows,
                   int numCols,
                   int numPartitions,
                   long seed)Java-friendly version of  RandomRDDs.randomVectorRDD. | 
| static <T> RDD<T> | randomRDD(SparkContext sc,
         RandomDataGenerator<T> generator,
         long size,
         int numPartitions,
         long seed,
         scala.reflect.ClassTag<T> evidence$1)Generates an RDD comprised of  i.i.d.samples produced by the input RandomDataGenerator. | 
| static RDD<Vector> | randomVectorRDD(SparkContext sc,
               RandomDataGenerator<Object> generator,
               long numRows,
               int numCols,
               int numPartitions,
               long seed)Generates an RDD[Vector] with vectors containing  i.i.d.samples produced by the
 input RandomDataGenerator. | 
| static JavaDoubleRDD | uniformJavaRDD(JavaSparkContext jsc,
              long size)RandomRDDs.uniformJavaRDDwith the default number of partitions and the default seed. | 
| static JavaDoubleRDD | uniformJavaRDD(JavaSparkContext jsc,
              long size,
              int numPartitions)RandomRDDs.uniformJavaRDDwith the default seed. | 
| static JavaDoubleRDD | uniformJavaRDD(JavaSparkContext jsc,
              long size,
              int numPartitions,
              long seed)Java-friendly version of  RandomRDDs.uniformRDD. | 
| static JavaRDD<Vector> | uniformJavaVectorRDD(JavaSparkContext jsc,
                    long numRows,
                    int numCols)RandomRDDs.uniformJavaVectorRDDwith the default number of partitions and the default seed. | 
| static JavaRDD<Vector> | uniformJavaVectorRDD(JavaSparkContext jsc,
                    long numRows,
                    int numCols,
                    int numPartitions)RandomRDDs.uniformJavaVectorRDDwith the default seed. | 
| static JavaRDD<Vector> | uniformJavaVectorRDD(JavaSparkContext jsc,
                    long numRows,
                    int numCols,
                    int numPartitions,
                    long seed)Java-friendly version of  RandomRDDs.uniformVectorRDD. | 
| static RDD<Object> | uniformRDD(SparkContext sc,
          long size,
          int numPartitions,
          long seed)Generates an RDD comprised of i.i.d. samples from the uniform distribution U(0.0, 1.0). | 
| static RDD<Vector> | uniformVectorRDD(SparkContext sc,
                long numRows,
                int numCols,
                int numPartitions,
                long seed)Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 uniform distribution on U(0.0, 1.0). | 
public static RDD<Object> uniformRDD(SparkContext sc, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the uniform distribution U(0.0, 1.0).
 
 To transform the distribution in the generated RDD from U(0.0, 1.0) to U(a, b), use
 RandomRDDs.uniformRDD(sc, n, p, seed).map(v => a + (b - a) * v).
 
sc - SparkContext used to create the RDD.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ U(0.0, 1.0).public static JavaDoubleRDD uniformJavaRDD(JavaSparkContext jsc, long size, int numPartitions, long seed)
RandomRDDs.uniformRDD.jsc - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD uniformJavaRDD(JavaSparkContext jsc, long size, int numPartitions)
RandomRDDs.uniformJavaRDD with the default seed.jsc - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD uniformJavaRDD(JavaSparkContext jsc, long size)
RandomRDDs.uniformJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)size - (undocumented)public static RDD<Object> normalRDD(SparkContext sc, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the standard normal distribution.
 
 To transform the distribution in the generated RDD from standard normal to some other normal
 N(mean, sigma^2), use RandomRDDs.normalRDD(sc, n, p, seed).map(v => mean + sigma * v).
 
sc - SparkContext used to create the RDD.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ N(0.0, 1.0).public static JavaDoubleRDD normalJavaRDD(JavaSparkContext jsc, long size, int numPartitions, long seed)
RandomRDDs.normalRDD.jsc - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD normalJavaRDD(JavaSparkContext jsc, long size, int numPartitions)
RandomRDDs.normalJavaRDD with the default seed.jsc - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD normalJavaRDD(JavaSparkContext jsc, long size)
RandomRDDs.normalJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)size - (undocumented)public static RDD<Object> poissonRDD(SparkContext sc, double mean, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the Poisson distribution with the input
 mean.
 sc - SparkContext used to create the RDD.mean - Mean, or lambda, for the Poisson distribution.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Pois(mean).public static JavaDoubleRDD poissonJavaRDD(JavaSparkContext jsc, double mean, long size, int numPartitions, long seed)
RandomRDDs.poissonRDD.jsc - (undocumented)mean - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD poissonJavaRDD(JavaSparkContext jsc, double mean, long size, int numPartitions)
RandomRDDs.poissonJavaRDD with the default seed.jsc - (undocumented)mean - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD poissonJavaRDD(JavaSparkContext jsc, double mean, long size)
RandomRDDs.poissonJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)mean - (undocumented)size - (undocumented)public static RDD<Object> exponentialRDD(SparkContext sc, double mean, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the exponential distribution with
 the input mean.
 sc - SparkContext used to create the RDD.mean - Mean, or 1 / lambda, for the exponential distribution.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Exp(mean).public static JavaDoubleRDD exponentialJavaRDD(JavaSparkContext jsc, double mean, long size, int numPartitions, long seed)
RandomRDDs.exponentialRDD.jsc - (undocumented)mean - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD exponentialJavaRDD(JavaSparkContext jsc, double mean, long size, int numPartitions)
RandomRDDs.exponentialJavaRDD with the default seed.jsc - (undocumented)mean - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD exponentialJavaRDD(JavaSparkContext jsc, double mean, long size)
RandomRDDs.exponentialJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)mean - (undocumented)size - (undocumented)public static RDD<Object> gammaRDD(SparkContext sc, double shape, double scale, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the gamma distribution with the input
  shape and scale.
 sc - SparkContext used to create the RDD.shape - shape parameter (greater than 0) for the gamma distribution.scale - scale parameter (greater than 0) for the gamma distribution.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Gamma(shape, scale).public static JavaDoubleRDD gammaJavaRDD(JavaSparkContext jsc, double shape, double scale, long size, int numPartitions, long seed)
RandomRDDs.gammaRDD.jsc - (undocumented)shape - (undocumented)scale - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD gammaJavaRDD(JavaSparkContext jsc, double shape, double scale, long size, int numPartitions)
RandomRDDs.gammaJavaRDD with the default seed.jsc - (undocumented)shape - (undocumented)scale - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD gammaJavaRDD(JavaSparkContext jsc, double shape, double scale, long size)
RandomRDDs.gammaJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)shape - (undocumented)scale - (undocumented)size - (undocumented)public static RDD<Object> logNormalRDD(SparkContext sc, double mean, double std, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples from the log normal distribution with the input
  mean and standard deviation.
 sc - SparkContext used to create the RDD.mean - mean for the log normal distribution.std - standard deviation for the log normal distribution.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples from the log normal distribution.public static JavaDoubleRDD logNormalJavaRDD(JavaSparkContext jsc, double mean, double std, long size, int numPartitions, long seed)
RandomRDDs.logNormalRDD.jsc - (undocumented)mean - (undocumented)std - (undocumented)size - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaDoubleRDD logNormalJavaRDD(JavaSparkContext jsc, double mean, double std, long size, int numPartitions)
RandomRDDs.logNormalJavaRDD with the default seed.jsc - (undocumented)mean - (undocumented)std - (undocumented)size - (undocumented)numPartitions - (undocumented)public static JavaDoubleRDD logNormalJavaRDD(JavaSparkContext jsc, double mean, double std, long size)
RandomRDDs.logNormalJavaRDD with the default number of partitions and the default seed.jsc - (undocumented)mean - (undocumented)std - (undocumented)size - (undocumented)public static <T> RDD<T> randomRDD(SparkContext sc, RandomDataGenerator<T> generator, long size, int numPartitions, long seed, scala.reflect.ClassTag<T> evidence$1)
Generates an RDD comprised of i.i.d. samples produced by the input RandomDataGenerator.
 sc - SparkContext used to create the RDD.generator - RandomDataGenerator used to populate the RDD.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).evidence$1 - (undocumented)i.i.d. samples produced by generator.public static <T> JavaRDD<T> randomJavaRDD(JavaSparkContext jsc, RandomDataGenerator<T> generator, long size, int numPartitions, long seed)
Generates an RDD comprised of i.i.d. samples produced by the input RandomDataGenerator.
 jsc - JavaSparkContext used to create the RDD.generator - RandomDataGenerator used to populate the RDD.size - Size of the RDD.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples produced by generator.public static <T> JavaRDD<T> randomJavaRDD(JavaSparkContext jsc, RandomDataGenerator<T> generator, long size, int numPartitions)
RandomRDDs.randomJavaRDD with the default seed.jsc - (undocumented)generator - (undocumented)size - (undocumented)numPartitions - (undocumented)public static <T> JavaRDD<T> randomJavaRDD(JavaSparkContext jsc, RandomDataGenerator<T> generator, long size)
RandomRDDs.randomJavaRDD with the default seed & numPartitionsjsc - (undocumented)generator - (undocumented)size - (undocumented)public static RDD<Vector> uniformVectorRDD(SparkContext sc, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 uniform distribution on U(0.0, 1.0).
 sc - SparkContext used to create the RDD.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD.seed - Seed for the RNG that generates the seed for the generator in each partition.i.i.d. samples ~ U(0.0, 1.0).public static JavaRDD<Vector> uniformJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.uniformVectorRDD.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> uniformJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols, int numPartitions)
RandomRDDs.uniformJavaVectorRDD with the default seed.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> uniformJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols)
RandomRDDs.uniformJavaVectorRDD with the default number of partitions and the default seed.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> normalVectorRDD(SparkContext sc, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 standard normal distribution.
 sc - SparkContext used to create the RDD.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ N(0.0, 1.0).public static JavaRDD<Vector> normalJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.normalVectorRDD.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> normalJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols, int numPartitions)
RandomRDDs.normalJavaVectorRDD with the default seed.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> normalJavaVectorRDD(JavaSparkContext jsc, long numRows, int numCols)
RandomRDDs.normalJavaVectorRDD with the default number of partitions and the default seed.jsc - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> logNormalVectorRDD(SparkContext sc, double mean, double std, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from a
 log normal distribution.
 sc - SparkContext used to create the RDD.mean - Mean of the log normal distribution.std - Standard deviation of the log normal distribution.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples.public static JavaRDD<Vector> logNormalJavaVectorRDD(JavaSparkContext jsc, double mean, double std, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.logNormalVectorRDD.jsc - (undocumented)mean - (undocumented)std - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> logNormalJavaVectorRDD(JavaSparkContext jsc, double mean, double std, long numRows, int numCols, int numPartitions)
RandomRDDs.logNormalJavaVectorRDD with the default seed.jsc - (undocumented)mean - (undocumented)std - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> logNormalJavaVectorRDD(JavaSparkContext jsc, double mean, double std, long numRows, int numCols)
RandomRDDs.logNormalJavaVectorRDD with the default number of partitions and
 the default seed.jsc - (undocumented)mean - (undocumented)std - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> poissonVectorRDD(SparkContext sc, double mean, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 Poisson distribution with the input mean.
 sc - SparkContext used to create the RDD.mean - Mean, or lambda, for the Poisson distribution.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Pois(mean).public static JavaRDD<Vector> poissonJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.poissonVectorRDD.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> poissonJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols, int numPartitions)
RandomRDDs.poissonJavaVectorRDD with the default seed.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> poissonJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols)
RandomRDDs.poissonJavaVectorRDD with the default number of partitions and the default seed.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> exponentialVectorRDD(SparkContext sc, double mean, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 exponential distribution with the input mean.
 sc - SparkContext used to create the RDD.mean - Mean, or 1 / lambda, for the Exponential distribution.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Exp(mean).public static JavaRDD<Vector> exponentialJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.exponentialVectorRDD.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> exponentialJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols, int numPartitions)
RandomRDDs.exponentialJavaVectorRDD with the default seed.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> exponentialJavaVectorRDD(JavaSparkContext jsc, double mean, long numRows, int numCols)
RandomRDDs.exponentialJavaVectorRDD with the default number of partitions
 and the default seed.jsc - (undocumented)mean - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> gammaVectorRDD(SparkContext sc, double shape, double scale, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples drawn from the
 gamma distribution with the input shape and scale.
 sc - SparkContext used to create the RDD.shape - shape parameter (greater than 0) for the gamma distribution.scale - scale parameter (greater than 0) for the gamma distribution.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples ~ Gamma(shape, scale).public static JavaRDD<Vector> gammaJavaVectorRDD(JavaSparkContext jsc, double shape, double scale, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.gammaVectorRDD.jsc - (undocumented)shape - (undocumented)scale - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> gammaJavaVectorRDD(JavaSparkContext jsc, double shape, double scale, long numRows, int numCols, int numPartitions)
RandomRDDs.gammaJavaVectorRDD with the default seed.jsc - (undocumented)shape - (undocumented)scale - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> gammaJavaVectorRDD(JavaSparkContext jsc, double shape, double scale, long numRows, int numCols)
RandomRDDs.gammaJavaVectorRDD with the default number of partitions and the default seed.jsc - (undocumented)shape - (undocumented)scale - (undocumented)numRows - (undocumented)numCols - (undocumented)public static RDD<Vector> randomVectorRDD(SparkContext sc, RandomDataGenerator<Object> generator, long numRows, int numCols, int numPartitions, long seed)
Generates an RDD[Vector] with vectors containing i.i.d. samples produced by the
 input RandomDataGenerator.
 sc - SparkContext used to create the RDD.generator - RandomDataGenerator used to populate the RDD.numRows - Number of Vectors in the RDD.numCols - Number of elements in each Vector.numPartitions - Number of partitions in the RDD (default: sc.defaultParallelism).seed - Random seed (default: a random long integer).i.i.d. samples produced by generator.public static JavaRDD<Vector> randomJavaVectorRDD(JavaSparkContext jsc, RandomDataGenerator<Object> generator, long numRows, int numCols, int numPartitions, long seed)
RandomRDDs.randomVectorRDD.jsc - (undocumented)generator - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)seed - (undocumented)public static JavaRDD<Vector> randomJavaVectorRDD(JavaSparkContext jsc, RandomDataGenerator<Object> generator, long numRows, int numCols, int numPartitions)
RandomRDDs.randomJavaVectorRDD with the default seed.jsc - (undocumented)generator - (undocumented)numRows - (undocumented)numCols - (undocumented)numPartitions - (undocumented)public static JavaRDD<Vector> randomJavaVectorRDD(JavaSparkContext jsc, RandomDataGenerator<Object> generator, long numRows, int numCols)
RandomRDDs.randomJavaVectorRDD with the default number of partitions and the default seed.jsc - (undocumented)generator - (undocumented)numRows - (undocumented)numCols - (undocumented)