Advertisement
lorenzo_gatto

Untitled

Apr 26th, 2015
273
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Java 1.11 KB | None | 0 0
  1. import java.io.*;
  2. import org.apache.spark.SparkConf;
  3. import org.apache.spark.SparkContext;
  4. import org.apache.spark.api.java.JavaSparkContext;
  5. import org.apache.spark.api.java.*;
  6. import org.apache.spark.api.java.function.*;
  7. import org.apache.spark.sql.hive.HiveContext;
  8. import org.apache.spark.sql.SchemaRDD;
  9. import org.apache.spark.sql.api.java.Row;
  10. import java.util.Arrays;
  11. import scala.Tuple2;
  12.  
  13. public class SQL {
  14.  
  15.     public static void main(String[] args) {
  16.         String inputFile = "/home/lorenzo/Desktop/testtweets.json";
  17.         //String outputFile = "/words.txt";
  18.         SparkConf conf = new SparkConf().setAppName("Simple Application");
  19.         SparkContext sc = new SparkContext(conf);
  20.         HiveContext hiveCtx = new HiveContext(sc);
  21.         /*SchemaRDD input = hiveCtx.jsonFile(inputFile);
  22.         input.printSchema();
  23.         input.registerTempTable("tweets");
  24.         SchemaRDD topTweets = hiveCtx.sql("EXPLAIN SELECT text, retweetCount FROM tweets ORDER BY retweetCount LIMIT 10");
  25.         JavaRDD<String> topTweetText = topTweets.toJavaRDD().map((row) -> {
  26.             return row.getString(0);});
  27.         System.out.println("ciao" + topTweetText.collect());*/
  28.     }
  29. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement