Advertisement
Guest User

Untitled

a guest
Jul 27th, 2017
63
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.56 KB | None | 0 0
  # Minimal PyCUDA example: multiply two float32 vectors element-wise on the
  # GPU, then print the difference from the same product computed by NumPy.

  # Imported only for its side effect (nothing below references the name);
  # per the PyCUDA documentation it initializes the driver and a context.
  import pycuda.autoinit
  import pycuda.driver as drv
  import numpy

  from pycuda.compiler import SourceModule

  # Number of vector elements. It is also the number of threads in the single
  # block launched below, so it must stay within the device's
  # threads-per-block limit.
  NUM_ELEMENTS = 400

  # The kernel indexes solely by threadIdx.x, so it is only correct for a
  # one-block launch with one thread per element.
  mod = SourceModule("""
  __global__ void multiply_them(float *dest, float *a, float *b)
  {
      const int i = threadIdx.x;
      dest[i] = a[i] * b[i];
  }
  """)

  multiply_them = mod.get_function("multiply_them")

  # float32 matches the kernel's `float *` parameters.
  a = numpy.random.randn(NUM_ELEMENTS).astype(numpy.float32)
  b = numpy.random.randn(NUM_ELEMENTS).astype(numpy.float32)

  dest = numpy.zeros_like(a)

  # drv.In / drv.Out wrap the host arrays as kernel arguments; per the PyCUDA
  # documentation, In arrays are copied to the device before the launch and
  # Out arrays are copied back to the host afterwards.
  multiply_them(
      drv.Out(dest), drv.In(a), drv.In(b),
      block=(NUM_ELEMENTS, 1, 1), grid=(1, 1))

  # Should print all zeros when the GPU result matches NumPy's. The
  # parenthesized form works as a print call on Python 3 and prints the same
  # single value on Python 2.
  print(dest - a * b)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement