Advertisement
Guest User

Untitled

a guest
Dec 31st, 2018
166
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 4.19 KB | None | 0 0
  1. 18/12/18 05:16:49 WARN TaskSetManager: Lost task 183.3 in stage 13.0 (TID 62450, ip-172-31-16-247.us-west-2.compute.internal, executor 214): org.apache.spark.api.python.PythonException: Traceback (most recent call last):
  2. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/worker.py", line 229, in main
  3. process()
  4. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/worker.py", line 224, in process
  5. serializer.dump_stream(func(split_index, iterator), outfile)
  6. File "/usr/lib/spark/python/pyspark/rdd.py", line 2438, in pipeline_func
  7. File "/usr/lib/spark/python/pyspark/rdd.py", line 2438, in pipeline_func
  8. File "/usr/lib/spark/python/pyspark/rdd.py", line 2438, in pipeline_func
  9. File "/usr/lib/spark/python/pyspark/rdd.py", line 2438, in pipeline_func
  10. File "/usr/lib/spark/python/pyspark/rdd.py", line 362, in func
  11. File "/usr/lib/spark/python/pyspark/rdd.py", line 1865, in _mergeCombiners
  12. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/shuffle.py", line 287, in mergeCombiners
  13. self._spill()
  14. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/shuffle.py", line 315, in _spill
  15. self.serializer.dump_stream([(k, v)], streams[h])
  16. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/serializers.py", line 376, in dump_stream
  17. bytes = self.serializer.dumps(vs)
  18. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/serializers.py", line 627, in dumps
  19. return zlib.compress(self.serializer.dumps(obj), 1)
  20. File "/mnt1/yarn/usercache/hadoop/appcache/application_1545091694164_0001/container_1545091694164_0001_01_000367/pyspark.zip/pyspark/serializers.py", line 555, in dumps
  21. return pickle.dumps(obj, protocol)
  22. SystemError: error return without exception set
  23.  
  24. at org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)
  25. at org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)
  26. at org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)
  27. at org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)
  28. at org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)
  29. at scala.collection.Iterator$class.foreach(Iterator.scala:893)
  30. at org.apache.spark.InterruptibleIterator.foreach(InterruptibleIterator.scala:28)
  31. at scala.collection.generic.Growable$class.$plus$plus$eq(Growable.scala:59)
  32. at scala.collection.mutable.ArrayBuffer.$plus$plus$eq(ArrayBuffer.scala:104)
  33. at scala.collection.mutable.ArrayBuffer.$plus$plus$eq(ArrayBuffer.scala:48)
  34. at scala.collection.TraversableOnce$class.to(TraversableOnce.scala:310)
  35. at org.apache.spark.InterruptibleIterator.to(InterruptibleIterator.scala:28)
  36. at scala.collection.TraversableOnce$class.toBuffer(TraversableOnce.scala:302)
  37. at org.apache.spark.InterruptibleIterator.toBuffer(InterruptibleIterator.scala:28)
  38. at scala.collection.TraversableOnce$class.toArray(TraversableOnce.scala:289)
  39. at org.apache.spark.InterruptibleIterator.toArray(InterruptibleIterator.scala:28)
  40. at org.apache.spark.rdd.RDD$$anonfun$collect$1$$anonfun$12.apply(RDD.scala:939)
  41. at org.apache.spark.rdd.RDD$$anonfun$collect$1$$anonfun$12.apply(RDD.scala:939)
  42. at org.apache.spark.SparkContext$$anonfun$runJob$5.apply(SparkContext.scala:2067)
  43. at org.apache.spark.SparkContext$$anonfun$runJob$5.apply(SparkContext.scala:2067)
  44. at org.apache.spark.scheduler.ResultTask.runTask(ResultTask.scala:87)
  45. at org.apache.spark.scheduler.Task.run(Task.scala:109)
  46. at org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)
  47. at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
  48. at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
  49. at java.lang.Thread.run(Thread.java:748)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement