Advertisement
Maverick82

PTX file generated by the NVIDIA CUDA 5.0 compiler (NVVM) from a Visual Studio 2010 Pro project

May 16th, 2013
673
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 1.17 KB | None | 0 0
  //
  // Generated by NVIDIA NVVM Compiler
  // Compiler built on Wed Sep 26 00:26:26 2012 (1348590386)
  // Cuda compilation tools, release 5.0, V0.2.1221
  //

  .version 3.1
  // NOTE(review): the `debug` option declares that this module carries DWARF
  // debug information. No debug sections are visible in this excerpt --
  // confirm they exist further down, or drop the option before assembling.
  .target sm_20, debug
  .address_size 64

  .file 1 "C:\\Users\\Mansoor\\Documents\\Visual Studio 2010\\Projects\\Testing_PTX\\x64/Debug/TestingPTX.compute_20.cpp3.i"
  .file 2 "C:/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v5.0/nvvm/ci_include.h"
  .file 3 "C:/Users/Mansoor/Documents/Visual Studio 2010/Projects/Testing_PTX/TestingPTX.cu"

  //-----------------------------------------------------------------------
  // _Z5helloPfS_   (Itanium-mangled; demangles to hello(float*, float*))
  //
  // Copies one 32-bit float per CTA:
  //     param_0[%ctaid.x] = param_1[%ctaid.x]
  //
  // In:    _Z5helloPfS__param_0   64-bit base address written to
  //        _Z5helloPfS__param_1   64-bit base address read from
  // Out:   one f32 stored at param_0 + 4 * %ctaid.x
  // Regs:  %r1        = %ctaid.x
  //        %rd1/%rd2  = param_0 / param_1
  //        %rd3/%rd4  = sign-extended index / byte offset (index * 4)
  //        %rd5/%rd6  = load address / store address
  //        %f1        = value being copied
  //
  // The load and store carry no state-space qualifier, so both use generic
  // addressing. There is no bounds check: every CTA index must be a valid
  // element of both buffers.
  //
  // The func_*/tmp* labels are never branched to inside this kernel;
  // presumably they anchor debug information, so they are kept in place.
  //-----------------------------------------------------------------------
  .visible .entry _Z5helloPfS_(
          .param .u64 _Z5helloPfS__param_0,
          .param .u64 _Z5helloPfS__param_1
  )
  {
          .reg .s32 %r<4>;
          .reg .f32 %f<2>;
          .reg .s64 %rd<7>;

          .loc 3 13 1
  func_begin0:
          .loc 3 13 0

          .loc 3 13 1

          ld.param.u64    %rd1, [_Z5helloPfS__param_0];   // %rd1 = param_0 (store base)
          ld.param.u64    %rd2, [_Z5helloPfS__param_1];   // %rd2 = param_1 (load base)
  func_exec_begin0:
          .loc 3 15 1
  tmp0:
          mov.u32         %r1, %ctaid.x;                  // %r1 = CTA index in x
  tmp1:
          .loc 3 16 1
          // The byte offset is identical for both buffers, so it is computed
          // once and shared by the load and the store.
          cvt.s64.s32     %rd3, %r1;                      // widen index to 64 bits
          shl.b64         %rd4, %rd3, 2;                  // offset = index * 4 (f32 size)
          add.s64         %rd5, %rd2, %rd4;               // %rd5 = param_1 + offset
          ld.f32          %f1, [%rd5];                    // %f1  = *(float *)%rd5
          add.s64         %rd6, %rd1, %rd4;               // %rd6 = param_0 + offset
          st.f32          [%rd6], %f1;                    // *(float *)%rd6 = %f1
  tmp2:
          .loc 3 20 2
          ret;
  tmp3:
  func_end0:
  }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement