/**
 * Exercises the fluent DataFrameWriter API end to end with an explicit
 * SaveMode.ErrorIfExists, writing through the test data source.
 */
@Test
public void testSaveModeAPI() {
  spark
      .range(10)
      .write()
      .format("org.apache.spark.sql.test")
      .mode(SaveMode.ErrorIfExists)
      .save();
}
/**
 * Smoke test for the writer builder chain: format + mode + save must
 * compose without error against the in-memory test source.
 */
@Test
public void testSaveModeAPI() {
  spark
      .range(10)
      .write()
      .format("org.apache.spark.sql.test")
      .mode(SaveMode.ErrorIfExists)
      .save();
}
/**
 * Verifies that a write with SaveMode.ErrorIfExists can be issued via the
 * Java fluent API against the test-only data source.
 */
@Test
public void testSaveModeAPI() {
  spark
      .range(10)
      .write()
      .format("org.apache.spark.sql.test")
      .mode(SaveMode.ErrorIfExists)
      .save();
}
/**
 * Registers the MyDoubleAvg UDAF by class name and checks it over a
 * temp view of the values 1..9 (inclusive).
 */
@SuppressWarnings("unchecked")
@Test
public void udf1Test() {
  spark.range(1, 10).toDF("value").createOrReplaceTempView("df");
  spark.udf().registerJavaUDAF("myDoubleAvg", MyDoubleAvg.class.getName());
  // avg(1..9) is 5.0; MyDoubleAvg offsets the plain average, yielding 105.0.
  Row row = spark.sql("SELECT myDoubleAvg(value) as my_avg from df").head();
  Assert.assertEquals(105.0, row.getDouble(0), 1.0e-6);
}
/**
 * Checks that a Java UDAF registered via registerJavaUDAF(className) is
 * callable from SQL and aggregates correctly over a temp view.
 */
@SuppressWarnings("unchecked")
@Test
public void udf1Test() {
  spark.range(1, 10).toDF("value").createOrReplaceTempView("df");
  spark.udf().registerJavaUDAF("myDoubleAvg", MyDoubleAvg.class.getName());
  // Expected 105.0: MyDoubleAvg shifts avg(1..9) == 5.0 by a fixed offset.
  Row aggregated = spark.sql("SELECT myDoubleAvg(value) as my_avg from df").head();
  Assert.assertEquals(105.0, aggregated.getDouble(0), 1.0e-6);
}
@SuppressWarnings("unchecked") @Test public void udf4Test() { spark.udf().register("inc", (Long i) -> i + 1, DataTypes.LongType); spark.range(10).toDF("x").createOrReplaceTempView("tmp"); // This tests when Java UDFs are required to be the semantically same (See SPARK-9435). List<Row> results = spark.sql("SELECT inc(x) FROM tmp GROUP BY inc(x)").collectAsList(); Assert.assertEquals(10, results.size()); long sum = 0; for (Row result : results) { sum += result.getLong(0); } Assert.assertEquals(55, sum); }
@SuppressWarnings("unchecked") @Test public void udf4Test() { spark.udf().register("inc", (Long i) -> i + 1, DataTypes.LongType); spark.range(10).toDF("x").createOrReplaceTempView("tmp"); // This tests when Java UDFs are required to be the semantically same (See SPARK-9435). List<Row> results = spark.sql("SELECT inc(x) FROM tmp GROUP BY inc(x)").collectAsList(); Assert.assertEquals(10, results.size()); long sum = 0; for (Row result : results) { sum += result.getLong(0); } Assert.assertEquals(55, sum); }
@SuppressWarnings("unchecked") @Test public void udf4Test() { spark.udf().register("inc", (Long i) -> i + 1, DataTypes.LongType); spark.range(10).toDF("x").createOrReplaceTempView("tmp"); // This tests when Java UDFs are required to be the semantically same (See SPARK-9435). List<Row> results = spark.sql("SELECT inc(x) FROM tmp GROUP BY inc(x)").collectAsList(); Assert.assertEquals(10, results.size()); long sum = 0; for (Row result : results) { sum += result.getLong(0); } Assert.assertEquals(55, sum); } }
/**
 * Generates FIX message strings across {@code tasks} partitions and wraps
 * them in a single-column ("fix") string DataFrame.
 */
@Override
public Dataset<Row> read() throws Exception {
  // Fan out one long per task, then expand each into its batch of messages.
  JavaRDD<Row> messages = Contexts.getSparkSession()
      .range(tasks)
      .javaRDD()
      .repartition(tasks)
      .flatMap(new GenerateFIXMessages(ordersPerTask));
  StructType schema = DataTypes.createStructType(
      Lists.newArrayList(DataTypes.createStructField("fix", DataTypes.StringType, false)));
  return Contexts.getSparkSession().createDataFrame(messages, schema);
}
// Configure a batch source step whose data is the longs 5..7 mapped into
// single-column ("value") rows via LongToRowFunction.
BatchStep sourceStep = new BatchStep("source_step");
sourceStep.configure(sourceStepConfig);
Dataset<Row> sourceDF = Contexts.getSparkSession()
    .range(5, 8)
    .map(
        new LongToRowFunction(),
        RowEncoder.apply(DataTypes.createStructType(Lists.newArrayList(
            DataTypes.createStructField("value", DataTypes.LongType, false)))));
sourceStep.setData(sourceDF);
/**
 * Produces {@code numPartitions * 10} rows spread over {@code numPartitions}
 * partitions, each carrying nullable "value" and "modulo" long columns
 * (populated by LongToRowFunction).
 */
@Override
public Dataset<Row> read() throws Exception {
  return Contexts.getSparkSession()
      .range(numPartitions * 10)
      .repartition(numPartitions)
      .map(
          new LongToRowFunction(),
          RowEncoder.apply(DataTypes.createStructType(Lists.newArrayList(
              DataTypes.createStructField("value", DataTypes.LongType, true),
              DataTypes.createStructField("modulo", DataTypes.LongType, true)))));
}
/**
 * Builds a small pair RDD of {@code numPartitions} rows, each keyed by
 * itself, spread across {@code numPartitions} partitions.
 */
private JavaPairRDD<Row, Row> getDummyRDD(int numPartitions) {
  return Contexts.getSparkSession()
      .range(numPartitions)
      .javaRDD()
      .map(new LongToRowFunction())
      // Key each row by itself so downstream code sees (row, row) pairs.
      .keyBy(new ItselfFunction<Row>())
      .repartition(numPartitions);
}