Advertisement
Guest User

Untitled

a guest
Feb 12th, 2016
53
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 3.49 KB | None | 0 0
  1. {
  2. "cells": [
  3. {
  4. "cell_type": "code",
  5. "execution_count": 1,
  6. "metadata": {
  7. "collapsed": false
  8. },
  9. "outputs": [
  10. {
  11. "name": "stdout",
  12. "output_type": "stream",
  13. "text": [
  14. "Populating the interactive namespace from numpy and matplotlib\n"
  15. ]
  16. }
  17. ],
  18. "source": [
  19. "import matplotlib.pyplot as plt\n",
  20. "import pandas as pd\n",
  21. "import numpy as np\n",
  22. "import plotly.plotly as py\n",
  23. "\n",
  24. "%pylab inline"
  25. ]
  26. },
  27. {
  28. "cell_type": "code",
  29. "execution_count": 2,
  30. "metadata": {
  31. "collapsed": false
  32. },
  33. "outputs": [
  34. {
  35. "data": {
  36. "text/plain": [
  37. "16"
  38. ]
  39. },
  40. "execution_count": 2,
  41. "metadata": {},
  42. "output_type": "execute_result"
  43. }
  44. ],
  45. "source": [
  46. "sc.defaultParallelism"
  47. ]
  48. },
  49. {
  50. "cell_type": "code",
  51. "execution_count": 3,
  52. "metadata": {
  53. "collapsed": true
  54. },
  55. "outputs": [],
  56. "source": [
  57. "frame = sqlContext.read.load(\"s3://telemetry-parquet/longitudinal/generation_date=20160208\")"
  58. ]
  59. },
  60. {
  61. "cell_type": "code",
  62. "execution_count": 4,
  63. "metadata": {
  64. "collapsed": false
  65. },
  66. "outputs": [
  67. {
  68. "data": {
  69. "text/plain": [
  70. "3498998"
  71. ]
  72. },
  73. "execution_count": 4,
  74. "metadata": {},
  75. "output_type": "execute_result"
  76. }
  77. ],
  78. "source": [
  79. "# frame.count()"
  80. ]
  81. },
  82. {
  83. "cell_type": "code",
  84. "execution_count": 14,
  85. "metadata": {
  86. "collapsed": false
  87. },
  88. "outputs": [
  89. {
  90. "name": "stdout",
  91. "output_type": "stream",
  92. "text": [
  93. "CPU times: user 44 ms, sys: 32 ms, total: 76 ms\n",
  94. "Wall time: 5min 9s\n"
  95. ]
  96. },
  97. {
  98. "data": {
  99. "text/plain": [
  100. "[Row(addons=[{}, {}])]"
  101. ]
  102. },
  103. "execution_count": 14,
  104. "metadata": {},
  105. "output_type": "execute_result"
  106. }
  107. ],
  108. "source": [
  109. "%time addon_frames = frame.selectExpr(\"last(activeAddons) as addons\").where(\"size(addons) > 0\").take(20)\n",
  110. "addon_frames"
  111. ]
  112. },
  113. {
  114. "cell_type": "code",
  115. "execution_count": 23,
  116. "metadata": {
  117. "collapsed": false
  118. },
  119. "outputs": [
  120. {
  121. "data": {
  122. "text/plain": [
  123. "[Row(addons=[{}, {}])]"
  124. ]
  125. },
  126. "execution_count": 23,
  127. "metadata": {},
  128. "output_type": "execute_result"
  129. }
  130. ],
  131. "source": [
  132. "sample_addons = frame.selectExpr(\"last(activeAddons) as addons\").take(30)\n",
  133. "sample_addons"
  134. ]
  135. },
  136. {
  137. "cell_type": "code",
  138. "execution_count": 25,
  139. "metadata": {
  140. "collapsed": false
  141. },
  142. "outputs": [
  143. {
  144. "data": {
  145. "text/plain": [
  146. "1"
  147. ]
  148. },
  149. "execution_count": 25,
  150. "metadata": {},
  151. "output_type": "execute_result"
  152. }
  153. ],
  154. "source": [
  155. "len(sample_addons)"
  156. ]
  157. },
  158. {
  159. "cell_type": "code",
  160. "execution_count": 13,
  161. "metadata": {
  162. "collapsed": false
  163. },
  164. "outputs": [
  165. {
  166. "data": {
  167. "text/plain": [
  168. "{}"
  169. ]
  170. },
  171. "execution_count": 13,
  172. "metadata": {},
  173. "output_type": "execute_result"
  174. }
  175. ],
  176. "source": [
  177. "addon_frame.addons[0]"
  178. ]
  179. }
  180. ],
  181. "metadata": {
  182. "kernelspec": {
  183. "display_name": "Python 2",
  184. "language": "python",
  185. "name": "python2"
  186. },
  187. "language_info": {
  188. "codemirror_mode": {
  189. "name": "ipython",
  190. "version": 2
  191. },
  192. "file_extension": ".py",
  193. "mimetype": "text/x-python",
  194. "name": "python",
  195. "nbconvert_exporter": "python",
  196. "pygments_lexer": "ipython2",
  197. "version": "2.7.10"
  198. }
  199. },
  200. "nbformat": 4,
  201. "nbformat_minor": 0
  202. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement