Advertisement
Guest User

Untitled

a guest
Jun 22nd, 2017
59
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.38 KB | None | 0 0
  import org.apache.spark.graphx._
  import org.apache.spark.rdd.RDD
  import org.apache.spark.sql._
  import org.apache.spark.sql.types._
  import org.graphframes._
  //import collection.mutable.HashMap

  // Spark-shell / notebook script: builds a friendship graph from the `users`
  // table and prints the connected component of every vertex.
  // Relies on a `sqlContext` (and its implicits, needed for `.toDF`) being
  // provided by the hosting shell.

  // Vertex DataFrame: GraphFrame requires the vertex key column to be named "id".
  val utenti = sqlContext.sql("SELECT user_id as id,name FROM users")
  utenti.show()

  // Raw (user_id, friends) pairs; `friends` is handled below through its string
  // rendering, e.g. "['a', 'b']" -- NOTE(review): confirm the column's real type.
  val friends = sqlContext.sql("SELECT user_id,friends FROM users")

  // Strip quotes, brackets and whitespace from the rendered friend list, then
  // split on commas. Empty tokens are dropped: an empty list ("[]") would
  // otherwise split into Array("") and create an edge to an empty-string id.
  val friends_arr = friends.map { row =>
    val cleaned = row.get(1).toString.replaceAll("""['"\[\]\s]""", "")
    (row.get(0).toString, cleaned.split(",").filter(_.nonEmpty))
  }
  friends.printSchema()

  // One (user, friend) pair per friendship.
  val relationships = friends_arr.flatMap { case (userId, friendIds) =>
    friendIds.map(friendId => (userId, friendId))
  }

  // Edge DataFrame: GraphFrame requires the columns "src" and "dst".
  val relazioni = relationships.toDF("src", "dst")

  // Create a GraphFrame and convert it to a GraphX graph for the algorithm below.
  val gf = GraphFrame(utenti, relazioni)

  val gx: Graph[Row, Row] = gf.toGraphX
  gx.cache()

  // (vertexId, componentId) pairs. The ids are GraphX Long vertex ids --
  // NOTE(review): presumably not the original string user_ids; confirm the
  // mapping against the GraphFrames documentation before joining back to users.
  val cc = gx.connectedComponents().vertices

  // `cc` is only a Scala value; it has to be registered as a temp table before
  // SQL can refer to it by name (the original query failed with "table not found").
  val ccDF = cc.map { case (vertexId, component) => (vertexId, component) }
    .toDF("id", "component")
  ccDF.registerTempTable("cc")

  val prova = sqlContext.sql("SELECT * FROM cc")
  prova.show()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement