Guest User

Untitled

a guest
Oct 19th, 2017
395
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.92 KB | None | 0 0
  1. restultSet=testingData.map(lambda p: (p.label, linearModel.predict(p.features))).collect()
  2.  
  3. [(2.0, array([ 2.09078012])), (2.0, array([ 2.09078012])), (2.0, array([ 2.09078012])), (1.0, array([ 2.09078012])), (2.0, array([ 2.09078012])), (1.0, array([ 2.09078012]))]
  4.  
  5. restultSet.toDF()
  6.  
  7. import numpy as np
  8. from pyspark.ml.linalg import Vectors
  9.  
  10. # your data as an RDD (i.e. before 'collect')
  11. dd = sc.parallelize([(2.0, np.array([ 2.09078012])), (2.0, np.array([ 2.09078012])), (2.0, np.array([ 2.09078012])), (1.0, np.array([ 2.09078012])), (2.0, np.array([ 2.09078012])), (1.0, np.array([ 2.09078012]))])
  12. dd.take(1)
  13. # [(2.0, array([ 2.09078012]))]
  14.  
  15. df = dd.map(lambda x: (x[0], Vectors.dense(x[1]))).toDF()
  16. df.show()
  17. # +---+------------+
  18. # | _1| _2|
  19. # +---+------------+
  20. # |2.0|[2.09078012]|
  21. # |2.0|[2.09078012]|
  22. # |2.0|[2.09078012]|
  23. # |1.0|[2.09078012]|
  24. # |2.0|[2.09078012]|
  25. # |1.0|[2.09078012]|
  26. # +---+------------+
Add Comment
Please, Sign In to add comment