Advertisement
Guest User

Untitled

a guest
Sep 10th, 2014
330
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 19.08 KB | None | 0 0
  /*
   * cuobjdump-style SASS listing for one sm_21 kernel. The mangled name below
   * decodes (Itanium C++ ABI) to kernel2(int*, int*, int*, unsigned int).
   *
   * Reading the listing: each thread forms an index from CTAID.X, c[0x0][0x8]
   * and TID.X, exits if that index is >= (c[0x0][0x38] >> 2), loads twelve
   * values through the three 64-bit base addresses held at c[0x0][0x20],
   * c[0x0][0x28] and c[0x0][0x30], runs four independent x = x*m + k chains
   * for 2048 steps each, and stores the four results through the
   * c[0x0][0x20] base.
   *
   * NOTE(review): c[0x0][0x20..0x38] are presumably the four kernel
   * parameters and c[0x0][0x8] is presumably blockDim.x -- confirm against
   * the sm_2x parameter/constant-bank layout.
   */
  1. code for sm_21
  2. Function : _Z7kernel2PiS_S_j
  3. .headerflags @"EF_CUDA_SM21 EF_CUDA_PTX_SM(EF_CUDA_SM21)"
  /* R1 <- c[0x1][0x100]. R1 is not read anywhere else in this listing.
     NOTE(review): presumably the usual stack-pointer setup -- confirm. */
  4. /*0000*/ MOV R1, c[0x1][0x100]; /* 0x2800440400005de4 */
  5. /*0008*/ NOP; /* 0x4000000000001de4 */
  /* R3  = c[0x0][0x38] >> 2 (unsigned shift): the per-thread bound.
     R15 = CTAID.X * c[0x0][0x8] + TID.X: the first index.
     Threads with R15 >= R3 (unsigned compare) exit immediately. */
  6. /*0010*/ MOV R3, c[0x0][0x38]; /* 0x28004000e000dde4 */
  7. /*0018*/ S2R R0, SR_CTAID.X; /* 0x2c00000094001c04 */
  8. /*0020*/ SHR.U32 R3, R3, 0x2; /* 0x5800c0000830dc03 */
  9. /*0028*/ S2R R2, SR_TID.X; /* 0x2c00000084009c04 */
  10. /*0030*/ IMAD R15, R0, c[0x0][0x8], R2; /* 0x200440002003dca3 */
  11. /*0038*/ ISETP.GE.U32.AND P0, PT, R15, R3, PT; /* 0x1b0e00000cf1dc03 */
  12. /*0040*/ @P0 EXIT; /* 0x80000000000001e7 */
  /* R17 = 4 is the per-element byte scale; R7 = R15 + R3 is the second index.
     Each .CC / .X instruction pair below builds one 64-bit address
     (base + index * 4) in an even/odd register pair: the .CC half produces
     the low word and the carry, the .HI.X half consumes the carry.
     Loads are interleaved with the address arithmetic for the next ones. */
  13. /*0048*/ MOV32I R17, 0x4; /* 0x1800000010045de2 */
  14. /*0050*/ IADD R7, R15, R3; /* 0x480000000cf1dc03 */
  15. /*0058*/ IMAD R8.CC, R15, R17, c[0x0][0x20]; /* 0x2023800080f21ca3 */
  16. /*0060*/ IMAD.HI.X R9, R15, R17, c[0x0][0x24]; /* 0x20a2800090f25ce3 */
  17. /*0068*/ IMAD R20.CC, R15, R17, c[0x0][0x28]; /* 0x20238000a0f51ca3 */
  18. /*0070*/ LD.E R0, [R8]; /* 0x8400000000801c85 */
  19. /*0078*/ IMAD.HI.X R21, R15, R17, c[0x0][0x2c]; /* 0x20a28000b0f55ce3 */
  20. /*0080*/ IMAD R2.CC, R15, R17, c[0x0][0x30]; /* 0x20238000c0f09ca3 */
  /* R12 = c[0x0][0x38]. R13 = R12 * 3 feeds the fourth index (see 0x00f0);
     R12 >> 1 added to R15 (into R20 at 0x00d8) is the third index. */
  21. /*0088*/ MOV R12, c[0x0][0x38]; /* 0x28004000e0031de4 */
  22. /*0090*/ IMAD.HI.X R3, R15, R17, c[0x0][0x34]; /* 0x20a28000d0f0dce3 */
  23. /*0098*/ IMUL R13, R12, 0x3; /* 0x5000c0000cc35ca3 */
  24. /*00a0*/ IMAD.U32.U32 R10.CC, R7, R17, c[0x0][0x30]; /* 0x20238000c0729c03 */
  25. /*00a8*/ LD.E R14, [R2]; /* 0x8400000000239c85 */
  26. /*00b0*/ IMAD.U32.U32.HI.X R11, R7, R17, c[0x0][0x34]; /* 0x20a28000d072dc43 */
  27. /*00b8*/ LD.E R16, [R20]; /* 0x8400000001441c85 */
  28. /*00c0*/ IMAD.U32.U32 R4.CC, R7, R17, c[0x0][0x20]; /* 0x2023800080711c03 */
  29. /*00c8*/ SHR.U32 R3, R12, 0x1; /* 0x5800c00004c0dc03 */
  30. /*00d0*/ IMAD.U32.U32.HI.X R5, R7, R17, c[0x0][0x24]; /* 0x20a2800090715c43 */
  31. /*00d8*/ IADD R20, R15, R3; /* 0x480000000cf51c03 */
  32. /*00e0*/ IMAD.U32.U32 R6.CC, R7, R17, c[0x0][0x28]; /* 0x20238000a0719c03 */
  33. /*00e8*/ LD.E R18, [R4]; /* 0x8400000000449c85 */
  /* R13 = high 32 bits of (R13 * c[0x10][0x0]) + R15: the fourth index.
     NOTE(review): the value at c[0x10][0x0] is not visible in this listing;
     if it holds 0x40000000 the result is R15 + (R13 >> 2) -- confirm. */
  34. /*00f0*/ IMAD.U32.U32.HI R13, R13, c[0x10][0x0], R15; /* 0x201e400004d35c43 */
  35. /*00f8*/ LD.E R21, [R10]; /* 0x8400000000a55c85 */
  36. /*0100*/ IMAD.U32.U32.HI.X R7, R7, R17, c[0x0][0x2c]; /* 0x20a28000b071dc43 */
  37. /*0108*/ IMAD.U32.U32 R8.CC, R13, R17, c[0x0][0x28]; /* 0x20238000a0d21c03 */
  38. /*0110*/ LD.E R19, [R6]; /* 0x840000000064dc85 */
  39. /*0118*/ IMAD.U32.U32.HI.X R9, R13, R17, c[0x0][0x2c]; /* 0x20a28000b0d25c43 */
  40. /*0120*/ IMAD.U32.U32 R2.CC, R13, R17, c[0x0][0x20]; /* 0x2023800080d09c03 */
  41. /*0128*/ LD.E R9, [R8]; /* 0x8400000000825c85 */
  42. /*0130*/ IMAD.U32.U32.HI.X R3, R13, R17, c[0x0][0x24]; /* 0x20a2800090d0dc43 */
  43. /*0138*/ IMAD.U32.U32 R4.CC, R20, R17, c[0x0][0x28]; /* 0x20238000a1411c03 */
  44. /*0140*/ IMAD.U32.U32.HI.X R5, R20, R17, c[0x0][0x2c]; /* 0x20a28000b1415c43 */
  45. /*0148*/ LD.E R8, [R2]; /* 0x8400000000221c85 */
  46. /*0150*/ IMAD.U32.U32 R6.CC, R20, R17, c[0x0][0x30]; /* 0x20238000c1419c03 */
  47. /*0158*/ LD.E R5, [R4]; /* 0x8400000000415c85 */
  48. /*0160*/ IMAD.U32.U32.HI.X R7, R20, R17, c[0x0][0x34]; /* 0x20a28000d141dc43 */
  /* R4 = 0xfffff800 (-2048 as a signed 32-bit value) becomes the loop
     counter. The load at 0x0158 that used R4:R5 as its address precedes
     this overwrite. */
  49. /*0168*/ MOV32I R4, 0xfffff800; /* 0x1bffffe000011de2 */
  50. /*0170*/ IMAD.U32.U32 R12.CC, R13, R17, c[0x0][0x30]; /* 0x20238000c0d31c03 */
  51. /*0178*/ LD.E R6, [R6]; /* 0x8400000000619c85 */
  52. /*0180*/ IMAD.U32.U32.HI.X R13, R13, R17, c[0x0][0x34]; /* 0x20a28000d0d35c43 */
  53. /*0188*/ IMAD.U32.U32 R10.CC, R20, R17, c[0x0][0x20]; /* 0x2023800081429c03 */
  54. /*0190*/ LD.E R13, [R12]; /* 0x8400000000c35c85 */
  55. /*0198*/ IMAD.U32.U32.HI.X R11, R20, R17, c[0x0][0x24]; /* 0x20a280009142dc43 */
  56. /*01a0*/ LD.E R17, [R10]; /* 0x8400000000a45c85 */
  /*
   * Loop head (branch target 0x1a8). Four independent multiply-add chains,
   * interleaved one step at a time:
   *   chain 1: R0  = R0  * R16 + R14
   *   chain 2: R7  = R18 * R19 + R21   (then R7  = R7  * R19 + R21)
   *   chain 3: R12 = R17 * R5  + R6    (then R12 = R12 * R5  + R6)
   *   chain 4: R8  = R8  * R9  + R13
   * Chains 2 and 3 start each iteration from R18 / R17, which hold the loaded
   * values on first entry and the previous iteration's results afterwards.
   * One pass through the body applies 32 steps to every chain.
   */
  57. /*01a8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  58. /*01b0*/ IMAD R7, R18, R19, R21; /* 0x202a00004d21dca3 */
  59. /*01b8*/ IMAD R12, R17, R5, R6; /* 0x200c000015131ca3 */
  60. /*01c0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  61. /*01c8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  62. /*01d0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  63. /*01d8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  64. /*01e0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  65. /*01e8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  66. /*01f0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  67. /*01f8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  68. /*0200*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  69. /*0208*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  70. /*0210*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  71. /*0218*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  72. /*0220*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  73. /*0228*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  74. /*0230*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  75. /*0238*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  76. /*0240*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  77. /*0248*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  78. /*0250*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  79. /*0258*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  80. /*0260*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  81. /*0268*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  82. /*0270*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  83. /*0278*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  84. /*0280*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  85. /*0288*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  86. /*0290*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  87. /*0298*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  88. /*02a0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  89. /*02a8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  90. /*02b0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  91. /*02b8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  92. /*02c0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  93. /*02c8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  94. /*02d0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  95. /*02d8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  96. /*02e0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  97. /*02e8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  98. /*02f0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  99. /*02f8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  100. /*0300*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  101. /*0308*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  102. /*0310*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  103. /*0318*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  104. /*0320*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  105. /*0328*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  106. /*0330*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  107. /*0338*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  108. /*0340*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  109. /*0348*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  110. /*0350*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  111. /*0358*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  112. /*0360*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  113. /*0368*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  114. /*0370*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  115. /*0378*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  116. /*0380*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  117. /*0388*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  118. /*0390*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  119. /*0398*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  120. /*03a0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  121. /*03a8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  122. /*03b0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  123. /*03b8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  124. /*03c0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  125. /*03c8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  126. /*03d0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  127. /*03d8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  128. /*03e0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  129. /*03e8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  130. /*03f0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  131. /*03f8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  132. /*0400*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  133. /*0408*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  134. /*0410*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  135. /*0418*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  136. /*0420*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  137. /*0428*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  138. /*0430*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  139. /*0438*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  140. /*0440*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  141. /*0448*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  142. /*0450*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  143. /*0458*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  144. /*0460*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  145. /*0468*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  146. /*0470*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  147. /*0478*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  148. /*0480*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  149. /*0488*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  150. /*0490*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  151. /*0498*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  152. /*04a0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  153. /*04a8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  154. /*04b0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  155. /*04b8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  156. /*04c0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  157. /*04c8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  158. /*04d0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  159. /*04d8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  160. /*04e0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  161. /*04e8*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  162. /*04f0*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  163. /*04f8*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  164. /*0500*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  165. /*0508*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  166. /*0510*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  167. /*0518*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  168. /*0520*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  169. /*0528*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  170. /*0530*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  171. /*0538*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  172. /*0540*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  /* Counter += 0x20 per iteration: starting from -2048 it reaches zero after
     64 iterations, i.e. 64 * 32 = 2048 steps per chain in total. */
  173. /*0548*/ IADD R4, R4, 0x20; /* 0x4800c00080411c03 */
  174. /*0550*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  175. /*0558*/ IMAD R7, R7, R19, R21; /* 0x202a00004c71dca3 */
  176. /*0560*/ IMAD R12, R12, R5, R6; /* 0x200c000014c31ca3 */
  177. /*0568*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  /* P0 = (counter != 0); set here, consumed by the branch at 0x05b8. */
  178. /*0570*/ ISETP.NE.AND P0, PT, R4, RZ, PT; /* 0x1a8e0000fc41dc23 */
  /* Last two steps of the iteration: chains 2 and 3 are written back into
     R18 / R17 so the loop head (and the stores after the loop) read them. */
  179. /*0578*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  180. /*0580*/ IMAD R18, R7, R19, R21; /* 0x202a00004c749ca3 */
  181. /*0588*/ IMAD R17, R12, R5, R6; /* 0x200c000014c45ca3 */
  182. /*0590*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  183. /*0598*/ IMAD R0, R0, R16, R14; /* 0x201c000040001ca3 */
  184. /*05a0*/ IMAD R18, R18, R19, R21; /* 0x202a00004d249ca3 */
  185. /*05a8*/ IMAD R17, R17, R5, R6; /* 0x200c000015145ca3 */
  186. /*05b0*/ IMAD R8, R8, R9, R13; /* 0x201a000024821ca3 */
  187. /*05b8*/ @P0 BRA 0x1a8; /* 0x4003ffefa00001e7 */
  /* Epilogue. The high 32 bits of 0x40000000 * c[0x0][0x38] equal
     c[0x0][0x38] >> 2, so R7 = R15 + (c[0x0][0x38] >> 2) recomputes the
     second index. R4:R5 and R6:R7 are then rebuilt as c[0x0][0x20]-based
     addresses for the first and second index (scale R9 = 4). */
  188. /*05c0*/ MOV32I R4, 0x40000000; /* 0x1900000000011de2 */
  189. /*05c8*/ MOV32I R9, 0x4; /* 0x1800000010025de2 */
  190. /*05d0*/ IMAD.U32.U32.HI R7, R4, c[0x0][0x38], R15; /* 0x201e4000e041dc43 */
  191. /*05d8*/ IMAD R4.CC, R15, R9, c[0x0][0x20]; /* 0x2013800080f11ca3 */
  192. /*05e0*/ IMAD.HI.X R5, R15, R9, c[0x0][0x24]; /* 0x2092800090f15ce3 */
  193. /*05e8*/ IMAD.U32.U32 R6.CC, R7, R9, c[0x0][0x20]; /* 0x2013800080719c03 */
  194. /*05f0*/ IMAD.U32.U32.HI.X R7, R7, R9, c[0x0][0x24]; /* 0x209280009071dc43 */
  /* Store the four chain results through the c[0x0][0x20] base:
     R0 and R18 via the addresses just rebuilt, R17 via R10:R11 (third index,
     still live from 0x0188/0x0198), R8 via R2:R3 (fourth index, still live
     from 0x0120/0x0130). */
  195. /*05f8*/ ST.E [R4], R0; /* 0x9400000000401c85 */
  196. /*0600*/ ST.E [R6], R18; /* 0x9400000000649c85 */
  197. /*0608*/ ST.E [R10], R17; /* 0x9400000000a45c85 */
  198. /*0610*/ ST.E [R2], R8; /* 0x9400000000221c85 */
  199. /*0618*/ EXIT; /* 0x8000000000001de7 */
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement