Advertisement
Guest User

Untitled

a guest
Oct 23rd, 2014
135
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.71 KB | None | 0 0
  1. import pycuda.driver as cuda
  2. import pycuda.autoinit
  3. from pycuda.compiler import SourceModule
  4. import numpy
  5. a = numpy.random.randn(4,4)
  6. a = a.astype(numpy.float32)
  7. a_gpu = cuda.mem_alloc(a.nbytes)
  8. cuda.memcpy_htod(a_gpu,a)
  9.  
  10. mod = SourceModule("""
  11. __global__ void doublify(float *a)
  12. {
  13. int idx = threadIdx.x + threadIdx.y * 4;
  14. a[idx] *= 2;
  15. }
  16. """)
  17.  
  18. import os
  19. os.system("vcvarsamd64.bat")
  20.  
  21. import pycuda.gpuarray as gpuarray
  22. import pycuda.driver as cuda
  23. import pycuda.autoinit
  24. import numpy
  25. a_gpu = gpuarray.to_gpu(numpy.random.randn(4, 4))
  26. print "a_gpu ="
  27. print a_gpu
  28. a_doubled = (2*a_gpu).get()
  29. print
  30. print "a_doubled ="
  31. print a_doubled
  32.  
  33. COMPILER-BINDIR = C:\Program Files (x86)\Microsoft Visual Studio 10.0\VC\bin\amd64
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement