Guest User

Untitled

a guest
Jan 22nd, 2019
76
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 7.94 KB | None | 0 0
  1. # Copyright (c) Jupyter Development Team.
  2. # Distributed under the terms of the Modified BSD License
  3. ARG BASE_CONTAINER=jupyter/scipy-notebook
  4. FROM $BASE_CONTAINER
  5.  
  6. LABEL maintainer="Jupyter Project <jupyter@googlegroups.com>"
  7. # Become root for the system-level installation steps that follow.
  8. USER root
  9.  
  10. # Spark dependencies. Superseded Spark releases are served from archive.apache.org, not www.apache.org/dist.
  11. ENV SPARK_VERSION=2.3.2
  12. ENV SPARK_HADOOP_PROFILE=2.7
  13. ENV SPARK_SRC_URL=https://archive.apache.org/dist/spark/spark-${SPARK_VERSION}/spark-${SPARK_VERSION}-bin-hadoop${SPARK_HADOOP_PROFILE}.tgz
  14. ENV SPARK_HOME=/opt/spark
  15. ENV PATH=$PATH:$SPARK_HOME/bin
  16.  
  17. # Java 8 (used to launch Spark) plus PostgreSQL; apt lists are removed in the same layer.
  18. RUN apt-get update && \
  19.     apt-get install -y openjdk-8-jdk-headless postgresql && \
  20.     rm -rf /var/lib/apt/lists/*
  21. ENV JAVA_HOME=/usr/lib/jvm/java-8-openjdk-amd64/
  22.  
  23. ENV PATH=$PATH:$JAVA_HOME/bin
  24.  
  25.  
  26. # Download, unpack, and install Spark in a single layer so the tarball is
  27. # deleted before the layer is committed and never adds to the image size.
  28. RUN wget ${SPARK_SRC_URL} && \
  29.     tar -xzf spark-${SPARK_VERSION}-bin-hadoop${SPARK_HADOOP_PROFILE}.tgz && \
  30.     mv spark-${SPARK_VERSION}-bin-hadoop${SPARK_HADOOP_PROFILE} ${SPARK_HOME} && \
  31.     rm -f spark-${SPARK_VERSION}-bin-hadoop${SPARK_HADOOP_PROFILE}.tgz
  32.  
  33.  
  34.  
  35.  
  36.  
  37.  
  38. USER $NB_UID
  39. # PostgreSQL JDBC driver, fetched and moved into Spark's jars directory in one layer.
  40. ENV POST_URL=https://jdbc.postgresql.org/download/postgresql-42.2.5.jar
  41. RUN wget ${POST_URL} && mv postgresql-42.2.5.jar $SPARK_HOME/jars
  42. # Install pyarrow and pyspark; -y on every conda install keeps the build non-interactive.
  43. RUN conda install --quiet -y 'pyarrow' && \
  44.     conda install --quiet -y pyspark==2.3.2 && \
  45.     conda clean -tipsy && \
  46.     fix-permissions $CONDA_DIR && \
  47.     fix-permissions /home/$NB_USER
  48.  
  49. WORKDIR $SPARK_HOME
  50.  
  51. # Spark standalone cluster (master + worker) with a Jupyter notebook driver.
  52. # Written in the Compose version 2 format: all services join one project
  53. # network where every service name resolves through DNS. The legacy
  54. # version-less layout provides no such lookup, which is why executors died
  55. # with "java.net.UnknownHostException: notebook".
  56. version: '2'
  57.  
  58. services:
  59.   # Spark standalone master.
  60.   master:
  61.     image: my_notebook
  62.     command: bin/spark-class org.apache.spark.deploy.master.Master -h master
  63.     hostname: master
  64.     environment:
  65.       MASTER: spark://master:7077
  66.       SPARK_CONF_DIR: /conf
  67.       # Redacted placeholder; substitute a real address before use.
  68.       SPARK_PUBLIC_DNS: 192.168.XXX.XXX
  69.     expose: [7001, 7002, 7003, 7004, 7005, 7077, 6066]
  70.     ports:
  71.       - '4040:4040'
  72.       - '6066:6066'
  73.       - '7077:7077'
  74.       - '8080:8080'
  75.     volumes:
  76.       - ./conf/master:/conf
  77.       - ./data:/tmp/data
  78.  
  79.   # Spark worker; reaches the master by service name rather than through a
  80.   # hard-coded IP address.
  81.   worker:
  82.     image: my_notebook
  83.     command: bin/spark-class org.apache.spark.deploy.worker.Worker spark://master:7077
  84.     hostname: worker
  85.     # Start-order hint only; Compose does not wait for the master to be ready.
  86.     depends_on:
  87.       - master
  88.     environment:
  89.       SPARK_CONF_DIR: /conf
  90.       SPARK_WORKER_CORES: '4'
  91.       SPARK_WORKER_MEMORY: 4g
  92.       SPARK_WORKER_PORT: '8881'
  93.       SPARK_WORKER_WEBUI_PORT: '8081'
  94.       SPARK_BLOCKMGR_PORT: '5003'
  95.       SPARK_PUBLIC_DNS: localhost
  96.     expose: [7012, 7013, 7014, 7015, 8881, 5001, 5003]
  97.     ports:
  98.       - '8081:8081'
  99.     volumes:
  100.       - ./conf/worker:/conf
  101.       - ./data:/tmp/data
  102.  
  103.   # Jupyter notebook server hosting the Spark driver; executors connect back
  104.   # to it under the hostname "notebook".
  105.   notebook:
  106.     image: my_notebook
  107.     command: jupyter notebook
  108.     hostname: notebook
  109.     # Start-order hint only; Compose does not wait for the master to be ready.
  110.     depends_on:
  111.       - master
  112.     environment:
  113.       SPARK_PUBLIC_DNS: 192.168.1.129
  114.     expose: [7012, 7013, 7014, 7015, 8881, 8888]
  115.     ports:
  116.       - '8888:8888'
  117.  
  118. Spark Executor Command: "/usr/lib/jvm/java-8-openjdk-amd64//bin/java" "-cp" "/conf/:/opt/spark/jars/*" "-Xmx1024M" "-Dspark.driver.port=35147" "org.apache.spark.executor.CoarseGrainedExecutorBackend" "--driver-url" "spark://CoarseGrainedScheduler@notebook:35147" "--executor-id" "31" "--hostname" "172.17.0.3" "--cores" "2" "--app-id" "app-20190101134023-0001" "--worker-url" "spark://Worker@172.17.0.3:8881"
  119. ========================================
  120.  
  121. Exception in thread "main" java.lang.reflect.UndeclaredThrowableException
  122. at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1713)
  123. at org.apache.spark.deploy.SparkHadoopUtil.runAsSparkUser(SparkHadoopUtil.scala:63)
  124. at org.apache.spark.executor.CoarseGrainedExecutorBackend$.run(CoarseGrainedExecutorBackend.scala:188)
  125. at org.apache.spark.executor.CoarseGrainedExecutorBackend$.main(CoarseGrainedExecutorBackend.scala:293)
  126. at org.apache.spark.executor.CoarseGrainedExecutorBackend.main(CoarseGrainedExecutorBackend.scala)
  127. Caused by: org.apache.spark.SparkException: Exception thrown in awaitResult:
  128. at org.apache.spark.util.ThreadUtils$.awaitResult(ThreadUtils.scala:205)
  129. at org.apache.spark.rpc.RpcTimeout.awaitResult(RpcTimeout.scala:75)
  130. at org.apache.spark.rpc.RpcEnv.setupEndpointRefByURI(RpcEnv.scala:101)
  131. at org.apache.spark.executor.CoarseGrainedExecutorBackend$$anonfun$run$1.apply$mcV$sp(CoarseGrainedExecutorBackend.scala:201)
  132. at org.apache.spark.deploy.SparkHadoopUtil$$anon$2.run(SparkHadoopUtil.scala:64)
  133. at org.apache.spark.deploy.SparkHadoopUtil$$anon$2.run(SparkHadoopUtil.scala:63)
  134. at java.security.AccessController.doPrivileged(Native Method)
  135. at javax.security.auth.Subject.doAs(Subject.java:422)
  136. at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1698)
  137. ... 4 more
  138. Caused by: java.io.IOException: Failed to connect to notebook:35147
  139. at org.apache.spark.network.client.TransportClientFactory.createClient(TransportClientFactory.java:245)
  140. at org.apache.spark.network.client.TransportClientFactory.createClient(TransportClientFactory.java:187)
  141. at org.apache.spark.rpc.netty.NettyRpcEnv.createClient(NettyRpcEnv.scala:198)
  142. at org.apache.spark.rpc.netty.Outbox$$anon$1.call(Outbox.scala:194)
  143. at org.apache.spark.rpc.netty.Outbox$$anon$1.call(Outbox.scala:190)
  144. at java.util.concurrent.FutureTask.run(FutureTask.java:266)
  145. at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1149)
  146. at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:624)
  147. at java.lang.Thread.run(Thread.java:748)
  148. Caused by: java.net.UnknownHostException: notebook
  149. at java.net.InetAddress.getAllByName0(InetAddress.java:1281)
  150. at java.net.InetAddress.getAllByName(InetAddress.java:1193)
  151. at java.net.InetAddress.getAllByName(InetAddress.java:1127)
  152. at java.net.InetAddress.getByName(InetAddress.java:1077)
  153. at io.netty.util.internal.SocketUtils$8.run(SocketUtils.java:146)
  154. at io.netty.util.internal.SocketUtils$8.run(SocketUtils.java:143)
  155. at java.security.AccessController.doPrivileged(Native Method)
  156. at io.netty.util.internal.SocketUtils.addressByName(SocketUtils.java:143)
  157. at io.netty.resolver.DefaultNameResolver.doResolve(DefaultNameResolver.java:43)
  158. at io.netty.resolver.SimpleNameResolver.resolve(SimpleNameResolver.java:63)
  159. at io.netty.resolver.SimpleNameResolver.resolve(SimpleNameResolver.java:55)
  160. at io.netty.resolver.InetSocketAddressResolver.doResolve(InetSocketAddressResolver.java:57)
  161. at io.netty.resolver.InetSocketAddressResolver.doResolve(InetSocketAddressResolver.java:32)
  162. at io.netty.resolver.AbstractAddressResolver.resolve(AbstractAddressResolver.java:108)
  163. at io.netty.bootstrap.Bootstrap.doResolveAndConnect0(Bootstrap.java:208)
  164. at io.netty.bootstrap.Bootstrap.access$000(Bootstrap.java:49)
  165. at io.netty.bootstrap.Bootstrap$1.operationComplete(Bootstrap.java:188)
  166. at io.netty.bootstrap.Bootstrap$1.operationComplete(Bootstrap.java:174)
  167. at io.netty.util.concurrent.DefaultPromise.notifyListener0(DefaultPromise.java:507)
  168. at io.netty.util.concurrent.DefaultPromise.notifyListenersNow(DefaultPromise.java:481)
  169. at io.netty.util.concurrent.DefaultPromise.notifyListeners(DefaultPromise.java:420)
  170. at io.netty.util.concurrent.DefaultPromise.trySuccess(DefaultPromise.java:104)
  171. at io.netty.channel.DefaultChannelPromise.trySuccess(DefaultChannelPromise.java:82)
  172. at io.netty.channel.AbstractChannel$AbstractUnsafe.safeSetSuccess(AbstractChannel.java:978)
  173. at io.netty.channel.AbstractChannel$AbstractUnsafe.register0(AbstractChannel.java:512)
  174. at io.netty.channel.AbstractChannel$AbstractUnsafe.access$200(AbstractChannel.java:423)
  175. at io.netty.channel.AbstractChannel$AbstractUnsafe$1.run(AbstractChannel.java:482)
  176. at io.netty.util.concurrent.AbstractEventExecutor.safeExecute(AbstractEventExecutor.java:163)
  177. at io.netty.util.concurrent.SingleThreadEventExecutor.runAllTasks(SingleThreadEventExecutor.java:403)
  178. at io.netty.channel.nio.NioEventLoop.run(NioEventLoop.java:463)
  179. at io.netty.util.concurrent.SingleThreadEventExecutor$5.run(SingleThreadEventExecutor.java:858)
  180. at io.netty.util.concurrent.DefaultThreadFactory$DefaultRunnableDecorator.run(DefaultThreadFactory.java:138)
  181. ... 1 more
Add Comment
Please, Sign In to add comment