Advertisement
Guest User

Untitled

a guest
Apr 28th, 2017
71
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.13 KB | None | 0 0
  1. package com.example;
  2.  
  3. import org.apache.spark.SparkContext;
  4. import org.apache.spark.api.java.JavaRDD;
  5. import org.apache.spark.api.java.function.Function;
  6. import org.apache.spark.sql.Dataset;
  7. import org.apache.spark.sql.Row;
  8. import org.apache.spark.sql.RowFactory;
  9. import org.apache.spark.sql.SparkSession;
  10. import org.apache.spark.sql.types.*;
  11.  
  12. public class Main {
  13.  
  14. public static void main(String[] args) {
  15.  
  16. SparkSession spark = SparkSession.builder().master("local[*]").appName("Word2Vec").getOrCreate();
  17. SparkContext sc = spark.sparkContext();
  18. sc.setLogLevel("WARN");
  19. JavaRDD<String> lines = sc.textFile("input.txt", 10).toJavaRDD();
  20. JavaRDD<Row> rows = lines.map(new Function<String, Row>(){
  21. public Row call(String line){
  22. return RowFactory.create(new String[][] {line.split(" ")});
  23. }
  24. });
  25.  
  26. StructType schema = new StructType(new StructField[] {
  27. new StructField("text", new ArrayType(DataTypes.StringType, true), false, Metadata.empty())
  28. });
  29. Dataset<Row> input = spark.createDataFrame(rows, schema);
  30. input.show(3);
  31. }
  32. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement