Advertisement
Guest User

Untitled

a guest
Oct 4th, 2018
220
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 53.99 KB | None | 0 0
  1. (gdb) run teste.py
  2. Starting program: /home/marco/anaconda3/envs/fastai/bin/python teste.py
  3. [Thread debugging using libthread_db enabled]
  4. Using host libthread_db library "/lib/x86_64-linux-gnu/libthread_db.so.1".
  5. 1.0.0.dev20181004
  6. 9.2.148
  7. [New Thread 0x7fffae733700 (LWP 5415)]
  8. True
  9. GeForce GTX 1070
  10.  
  11. Thread 1 "python" received signal SIGILL, Illegal instruction.
  12. 0x00007fffb9057bc3 in at::cuda::detail::initGlobalStreamState() ()
  13. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  14. (gdb) bt
  15. #0 0x00007fffb9057bc3 in at::cuda::detail::initGlobalStreamState() ()
  16. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  17. #1 0x00007ffff7bc5827 in __pthread_once_slow (once_control=0x7fffe0608f68 <at::cuda::detail::init_flag>,
  18. init_routine=0x7fffb72d0a1c <std::__once_proxy()>) at pthread_once.c:116
  19. #2 0x00007fffb905580b in at::cuda::detail::CUDAStream_getCurrentStream(long) ()
  20. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  21. #3 0x00007fffb9054cc9 in at::cuda::getCurrentCUDAStream(long) ()
  22. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  23. #4 0x00007fffb924da57 in CudaCachingAllocator::allocate(unsigned long) const ()
  24. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  25. #5 0x00007fffb9251873 in THCStorage_resize ()
  26. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  27. #6 0x00007fffb9261ead in THCTensor_resizeNd ()
  28. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  29. #7 0x00007fffb9264d42 in THCTensor_setStorageNd ()
  30. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  31. #8 0x00007fffb926f7b4 in THCudaTensor_newWithStorage ()
  32. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  33. #9 0x00007fffb926f919 in THCudaTensor_newWithSize ()
  34. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  35. #10 0x00007fffb911eb7a in at::CUDAFloatType::th_tensor(at::ArrayRef<long>) const ()
  36. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2_gpu.so
  37. #11 0x00007fffe23ffd1f in at::native::tensor(at::Type const&, at::ArrayRef<long>) ()
  38. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  39. #12 0x00007fffe2688df9 in at::TypeDefault::tensor(at::ArrayRef<long>) const [clone .localalias.250] ()
  40. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  41. #13 0x00007fffb75ef9ba in torch::autograd::VariableType::tensor(at::ArrayRef<long>) const ()
  42. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libtorch.so.1
  43. #14 0x00007fffe26cdce1 in at::TypeDefault::copy(at::Tensor const&, bool, at::optional<at::Device>) const ()
  44. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  45. #15 0x00007fffe24851e0 in at::native::to_impl(at::Tensor const&, at::TensorOptions const&, bool) ()
  46. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  47. #16 0x00007fffe2487131 in at::native::to(at::Tensor const&, at::Device, bool) ()
  48. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  49. #17 0x00007fffe2688e93 in at::TypeDefault::to(at::Tensor const&, at::Device, bool) const ()
  50. ---Type <return> to continue, or q <return> to quit---
  51. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libcaffe2.so
  52. #18 0x00007fffb75f7e01 in torch::autograd::VariableType::to(at::Tensor const&, at::Device, bool) const ()
  53. from /home/marco/anaconda3/envs/fastai/lib/python3.7/site-packages/torch/lib/libtorch.so.1
  54. #19 0x00007fffe4e147e5 in at::Tensor::to (non_blocking=false, device=..., this=0x7fffb47b2ac0)
  55. at /opt/conda/conda-bld/pytorch-nightly_1538650032546/work/torch/lib/tmp_install/include/ATen/core/TensorMethods.h:1212
  56. #20 torch::autograd::dispatch_to (non_blocking=false, device=..., self=...)
  57. at torch/csrc/autograd/generated/python_variable_methods.cpp:235
  58. #21 torch::autograd::THPVariable_cuda (self=0x7fffb47b2ab0, args=<optimized out>, kwargs=<optimized out>)
  59. at torch/csrc/autograd/generated/python_variable_methods.cpp:269
  60. #22 0x00005555556b7ea4 in _PyMethodDef_RawFastCallKeywords ()
  61. #23 0x00005555556c0bef in _PyMethodDescr_FastCallKeywords ()
  62. #24 0x000055555572cc68 in _PyEval_EvalFrameDefault ()
  63. #25 0x0000555555666528 in _PyEval_EvalCodeWithName ()
  64. #26 0x00005555556673a4 in PyEval_EvalCodeEx ()
  65. #27 0x00005555556673cc in PyEval_EvalCode ()
  66. #28 0x0000555555781304 in run_mod ()
  67. #29 0x0000555555789611 in PyRun_FileExFlags ()
  68. #30 0x0000555555789804 in PyRun_SimpleFileExFlags ()
  69. #31 0x000055555578b17d in pymain_main.constprop ()
  70. #32 0x000055555578b3f0 in _Py_UnixMain ()
  71. #33 0x00007ffff77e6b97 in __libc_start_main (main=0x555555646e20 <main>, argc=2, argv=0x7fffffffdd38, init=<optimized out>,
  72. fini=<optimized out>, rtld_fini=<optimized out>, stack_end=0x7fffffffdd28) at ../csu/libc-start.c:310
  73. #34 0x0000555555737e32 in _start ()
  74. (gdb) disas
  75. Dump of assembler code for function _ZN2at4cuda6detailL21initGlobalStreamStateEv:
  76. 0x00007fffb9057340 <+0>: push %r15
  77. 0x00007fffb9057342 <+2>: push %r14
  78. 0x00007fffb9057344 <+4>: push %r13
  79. 0x00007fffb9057346 <+6>: push %r12
  80. 0x00007fffb9057348 <+8>: push %rbp
  81. 0x00007fffb9057349 <+9>: push %rbx
  82. 0x00007fffb905734a <+10>: sub $0x18,%rsp
  83. 0x00007fffb905734e <+14>: callq 0x7fffb8e6c500 <_ZN2at4cuda10getNumGPUsEv@plt>
  84. 0x00007fffb9057353 <+19>: mov 0x275b1bfe(%rip),%rbp # 0x7fffe0608f58 <_ZN2at4cuda6detailL15default_streamsE+8>
  85. 0x00007fffb905735a <+26>: mov 0x275b1bef(%rip),%rdx # 0x7fffe0608f50 <_ZN2at4cuda6detailL15default_streamsE>
  86. 0x00007fffb9057361 <+33>: mov %rax,%r8
  87. 0x00007fffb9057364 <+36>: mov %rax,0x261d62a5(%rip) # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  88. 0x00007fffb905736b <+43>: mov %rbp,%rax
  89. 0x00007fffb905736e <+46>: sub %rdx,%rax
  90. 0x00007fffb9057371 <+49>: sar $0x4,%rax
  91. 0x00007fffb9057375 <+53>: cmp %rax,%r8
  92. 0x00007fffb9057378 <+56>: ja 0x7fffb9057977 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1591>
  93. 0x00007fffb905737e <+62>: jb 0x7fffb90578ff <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1471>
  94. 0x00007fffb9057384 <+68>: mov 0x275b1bbd(%rip),%r12 # 0x7fffe0608f48 <_ZN2at4cuda6detailL12device_flagsE+72>
  95. 0x00007fffb905738b <+75>: mov 0x275b1b96(%rip),%rbx # 0x7fffe0608f28 <_ZN2at4cuda6detailL12device_flagsE+40>
  96. 0x00007fffb9057392 <+82>: mov 0x275b1b97(%rip),%rdx # 0x7fffe0608f30 <_ZN2at4cuda6detailL12device_flagsE+48>
  97. 0x00007fffb9057399 <+89>: mov 0x275b1b98(%rip),%r9 # 0x7fffe0608f38 <_ZN2at4cuda6detailL12device_flagsE+56>
  98. 0x00007fffb90573a0 <+96>: mov 0x275b1b79(%rip),%rbp # 0x7fffe0608f20 <_ZN2at4cuda6detailL12device_flagsE+32>
  99. 0x00007fffb90573a7 <+103>: mov 0x275b1b62(%rip),%rdi # 0x7fffe0608f10 <_ZN2at4cuda6detailL12device_flagsE+16>
  100. 0x00007fffb90573ae <+110>: mov %r12,%rax
  101. 0x00007fffb90573b1 <+113>: sub %rbx,%rax
  102. 0x00007fffb90573b4 <+116>: mov %rdx,%rsi
  103. 0x00007fffb90573b7 <+119>: sar $0x3,%rax
  104. 0x00007fffb90573bb <+123>: sub %r9,%rsi
  105. 0x00007fffb90573be <+126>: mov %rbp,%rcx
  106. 0x00007fffb90573c1 <+129>: sub $0x1,%rax
  107. 0x00007fffb90573c5 <+133>: sar $0x2,%rsi
  108. 0x00007fffb90573c9 <+137>: sub %rdi,%rcx
  109. ---Type <return> to continue, or q <return> to quit---
  110. 0x00007fffb90573cc <+140>: shl $0x7,%rax
  111. 0x00007fffb90573d0 <+144>: sar $0x2,%rcx
  112. 0x00007fffb90573d4 <+148>: add %rsi,%rax
  113. 0x00007fffb90573d7 <+151>: add %rcx,%rax
  114. 0x00007fffb90573da <+154>: cmp %r8,%rax
  115. 0x00007fffb90573dd <+157>: jae 0x7fffb9057850 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1296>
  116. 0x00007fffb90573e3 <+163>: mov %r8,%rbx
  117. 0x00007fffb90573e6 <+166>: sub %rax,%rbx
  118. 0x00007fffb90573e9 <+169>: jne 0x7fffb9057b4c <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2060>
  119. 0x00007fffb90573ef <+175>: mov 0x275b1ad2(%rip),%r12 # 0x7fffe0608ec8 <_ZN2at4cuda6detailL21low_priority_countersE+72>
  120. 0x00007fffb90573f6 <+182>: mov 0x275b1aab(%rip),%rbx # 0x7fffe0608ea8 <_ZN2at4cuda6detailL21low_priority_countersE+40>
  121. 0x00007fffb90573fd <+189>: mov 0x275b1aac(%rip),%rdx # 0x7fffe0608eb0 <_ZN2at4cuda6detailL21low_priority_countersE+48>
  122. 0x00007fffb9057404 <+196>: mov 0x275b1aad(%rip),%r9 # 0x7fffe0608eb8 <_ZN2at4cuda6detailL21low_priority_countersE+56>
  123. 0x00007fffb905740b <+203>: mov 0x275b1a8e(%rip),%rbp # 0x7fffe0608ea0 <_ZN2at4cuda6detailL21low_priority_countersE+32>
  124. 0x00007fffb9057412 <+210>: mov 0x275b1a77(%rip),%rdi # 0x7fffe0608e90 <_ZN2at4cuda6detailL21low_priority_countersE+16>
  125. 0x00007fffb9057419 <+217>: mov %r12,%rax
  126. 0x00007fffb905741c <+220>: sub %rbx,%rax
  127. 0x00007fffb905741f <+223>: mov %rdx,%rsi
  128. 0x00007fffb9057422 <+226>: sar $0x3,%rax
  129. 0x00007fffb9057426 <+230>: sub %r9,%rsi
  130. 0x00007fffb9057429 <+233>: mov %rbp,%rcx
  131. 0x00007fffb905742c <+236>: sub $0x1,%rax
  132. 0x00007fffb9057430 <+240>: sar $0x2,%rsi
  133. 0x00007fffb9057434 <+244>: sub %rdi,%rcx
  134. 0x00007fffb9057437 <+247>: shl $0x7,%rax
  135. 0x00007fffb905743b <+251>: sar $0x2,%rcx
  136. 0x00007fffb905743f <+255>: add %rsi,%rax
  137. 0x00007fffb9057442 <+258>: add %rcx,%rax
  138. 0x00007fffb9057445 <+261>: cmp %r8,%rax
  139. ---Type <return> to continue, or q <return> to quit---
  140. 0x00007fffb9057448 <+264>: jae 0x7fffb90577a0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1120>
  141. 0x00007fffb905744e <+270>: mov %r8,%rbx
  142. 0x00007fffb9057451 <+273>: sub %rax,%rbx
  143. 0x00007fffb9057454 <+276>: jne 0x7fffb9057a0b <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1739>
  144. 0x00007fffb905745a <+282>: mov 0x275b19e7(%rip),%r12 # 0x7fffe0608e48 <_ZN2at4cuda6detailL22high_priority_countersE+72>
  145. 0x00007fffb9057461 <+289>: mov 0x275b19c0(%rip),%rbx # 0x7fffe0608e28 <_ZN2at4cuda6detailL22high_priority_countersE+40>
  146. 0x00007fffb9057468 <+296>: mov 0x275b19c1(%rip),%rdx # 0x7fffe0608e30 <_ZN2at4cuda6detailL22high_priority_countersE+48>
  147. 0x00007fffb905746f <+303>: mov 0x275b19c2(%rip),%r9 # 0x7fffe0608e38 <_ZN2at4cuda6detailL22high_priority_countersE+56>
  148. 0x00007fffb9057476 <+310>: mov 0x275b19a3(%rip),%rbp # 0x7fffe0608e20 <_ZN2at4cuda6detailL22high_priority_countersE+32>
  149. 0x00007fffb905747d <+317>: mov 0x275b198c(%rip),%rdi # 0x7fffe0608e10 <_ZN2at4cuda6detailL22high_priority_countersE+16>
  150. 0x00007fffb9057484 <+324>: mov %r12,%rax
  151. 0x00007fffb9057487 <+327>: sub %rbx,%rax
  152. 0x00007fffb905748a <+330>: mov %rdx,%rsi
  153. 0x00007fffb905748d <+333>: sar $0x3,%rax
  154. 0x00007fffb9057491 <+337>: sub %r9,%rsi
  155. 0x00007fffb9057494 <+340>: mov %rbp,%rcx
  156. 0x00007fffb9057497 <+343>: sub $0x1,%rax
  157. 0x00007fffb905749b <+347>: sar $0x2,%rsi
  158. 0x00007fffb905749f <+351>: sub %rdi,%rcx
  159. 0x00007fffb90574a2 <+354>: shl $0x7,%rax
  160. 0x00007fffb90574a6 <+358>: sar $0x2,%rcx
  161. 0x00007fffb90574aa <+362>: add %rsi,%rax
  162. 0x00007fffb90574ad <+365>: add %rcx,%rax
  163. 0x00007fffb90574b0 <+368>: cmp %r8,%rax
  164. 0x00007fffb90574b3 <+371>: jae 0x7fffb90576f0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+944>
  165. 0x00007fffb90574b9 <+377>: mov %r8,%rbx
  166. 0x00007fffb90574bc <+380>: sub %rax,%rbx
  167. 0x00007fffb90574bf <+383>: jne 0x7fffb9057aac <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1900>
  168. 0x00007fffb90574c5 <+389>: mov 0x275b191c(%rip),%r12 # 0x7fffe0608de8 <_ZN2at4cuda6detailL20low_priority_streamsE+8>
  169. ---Type <return> to continue, or q <return> to quit---
  170. 0x00007fffb90574cc <+396>: mov 0x275b190d(%rip),%rdx # 0x7fffe0608de0 <_ZN2at4cuda6detailL20low_priority_streamsE>
  171. 0x00007fffb90574d3 <+403>: mov %r12,%rax
  172. 0x00007fffb90574d6 <+406>: sub %rdx,%rax
  173. 0x00007fffb90574d9 <+409>: sar $0x9,%rax
  174. 0x00007fffb90574dd <+413>: cmp %r8,%rax
  175. 0x00007fffb90574e0 <+416>: jb 0x7fffb9057995 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1621>
  176. 0x00007fffb90574e6 <+422>: jbe 0x7fffb9057545 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+517>
  177. 0x00007fffb90574e8 <+424>: mov %r8,%r13
  178. 0x00007fffb90574eb <+427>: shl $0x9,%r13
  179. 0x00007fffb90574ef <+431>: add %rdx,%r13
  180. 0x00007fffb90574f2 <+434>: cmp %r13,%r12
  181. 0x00007fffb90574f5 <+437>: je 0x7fffb905753e <_ZN2at4cuda6detailL21initGlobalStreamStateEv+510>
  182. 0x00007fffb90574f7 <+439>: mov %r13,%rbp
  183. 0x00007fffb90574fa <+442>: nopw 0x0(%rax,%rax,1)
  184. 0x00007fffb9057500 <+448>: lea 0x200(%rbp),%r14
  185. 0x00007fffb9057507 <+455>: test %rbp,%rbp
  186. 0x00007fffb905750a <+458>: mov %r14,%rbx
  187. 0x00007fffb905750d <+461>: je 0x7fffb9057960 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1568>
  188. 0x00007fffb9057513 <+467>: nopl 0x0(%rax,%rax,1)
  189. 0x00007fffb9057518 <+472>: sub $0x10,%rbx
  190. 0x00007fffb905751c <+476>: mov 0x8(%rbx),%rdi
  191. 0x00007fffb9057520 <+480>: test %rdi,%rdi
  192. 0x00007fffb9057523 <+483>: je 0x7fffb905752a <_ZN2at4cuda6detailL21initGlobalStreamStateEv+490>
  193. 0x00007fffb9057525 <+485>: callq 0x7fffbac47820 <cudaStreamDestroy>
  194. 0x00007fffb905752a <+490>: cmp %rbx,%rbp
  195. 0x00007fffb905752d <+493>: jne 0x7fffb9057518 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+472>
  196. 0x00007fffb905752f <+495>: cmp %r14,%r12
  197. 0x00007fffb9057532 <+498>: mov %r14,%rbp
  198. 0x00007fffb9057535 <+501>: jne 0x7fffb9057500 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+448>
  199. 0x00007fffb9057537 <+503>: mov 0x261d60d2(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  200. 0x00007fffb905753e <+510>: mov %r13,0x275b18a3(%rip) # 0x7fffe0608de8 <_ZN2at4cuda6detailL20low_priority_streamsE+8>
  201. 0x00007fffb9057545 <+517>: mov 0x275b187c(%rip),%r12 # 0x7fffe0608dc8 <_ZN2at4cuda6detailL21high_priority_streamsE+8>
  202. ---Type <return> to continue, or q <return> to quit---
  203. 0x00007fffb905754c <+524>: mov 0x275b186d(%rip),%rdx # 0x7fffe0608dc0 <_ZN2at4cuda6detailL21high_priority_streamsE>
  204. 0x00007fffb9057553 <+531>: mov %r12,%rax
  205. 0x00007fffb9057556 <+534>: sub %rdx,%rax
  206. 0x00007fffb9057559 <+537>: sar $0x9,%rax
  207. 0x00007fffb905755d <+541>: cmp %r8,%rax
  208. 0x00007fffb9057560 <+544>: jb 0x7fffb90579d0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1680>
  209. 0x00007fffb9057566 <+550>: jbe 0x7fffb90575c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+645>
  210. 0x00007fffb9057568 <+552>: mov %r8,%r13
  211. 0x00007fffb905756b <+555>: shl $0x9,%r13
  212. 0x00007fffb905756f <+559>: add %rdx,%r13
  213. 0x00007fffb9057572 <+562>: cmp %r13,%r12
  214. 0x00007fffb9057575 <+565>: je 0x7fffb90575be <_ZN2at4cuda6detailL21initGlobalStreamStateEv+638>
  215. 0x00007fffb9057577 <+567>: mov %r13,%rbp
  216. 0x00007fffb905757a <+570>: nopw 0x0(%rax,%rax,1)
  217. 0x00007fffb9057580 <+576>: lea 0x200(%rbp),%r14
  218. 0x00007fffb9057587 <+583>: test %rbp,%rbp
  219. 0x00007fffb905758a <+586>: mov %r14,%rbx
  220. 0x00007fffb905758d <+589>: je 0x7fffb9057948 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1544>
  221. 0x00007fffb9057593 <+595>: nopl 0x0(%rax,%rax,1)
  222. 0x00007fffb9057598 <+600>: sub $0x10,%rbx
  223. 0x00007fffb905759c <+604>: mov 0x8(%rbx),%rdi
  224. 0x00007fffb90575a0 <+608>: test %rdi,%rdi
  225. 0x00007fffb90575a3 <+611>: je 0x7fffb90575aa <_ZN2at4cuda6detailL21initGlobalStreamStateEv+618>
  226. 0x00007fffb90575a5 <+613>: callq 0x7fffbac47820 <cudaStreamDestroy>
  227. 0x00007fffb90575aa <+618>: cmp %rbx,%rbp
  228. 0x00007fffb90575ad <+621>: jne 0x7fffb9057598 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+600>
  229. 0x00007fffb90575af <+623>: cmp %r14,%r12
  230. 0x00007fffb90575b2 <+626>: mov %r14,%rbp
  231. 0x00007fffb90575b5 <+629>: jne 0x7fffb9057580 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+576>
  232. 0x00007fffb90575b7 <+631>: mov 0x261d6052(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  233. 0x00007fffb90575be <+638>: mov %r13,0x275b1803(%rip) # 0x7fffe0608dc8 <_ZN2at4cuda6detailL21high_priority_streamsE+8>
  234. 0x00007fffb90575c5 <+645>: xor %edi,%edi
  235. ---Type <return> to continue, or q <return> to quit---
  236. 0x00007fffb90575c7 <+647>: xor %edx,%edx
  237. 0x00007fffb90575c9 <+649>: test %r8,%r8
  238. 0x00007fffb90575cc <+652>: jg 0x7fffb905765f <_ZN2at4cuda6detailL21initGlobalStreamStateEv+799>
  239. 0x00007fffb90575d2 <+658>: jmpq 0x7fffb90576d8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+920>
  240. 0x00007fffb90575d7 <+663>: nopw 0x0(%rax,%rax,1)
  241. 0x00007fffb90575e0 <+672>: mov %rcx,%r8
  242. 0x00007fffb90575e3 <+675>: mov (%rsi,%rcx,8),%rcx
  243. 0x00007fffb90575e7 <+679>: shl $0x7,%r8
  244. 0x00007fffb90575eb <+683>: sub %r8,%rax
  245. 0x00007fffb90575ee <+686>: lea (%rcx,%rax,4),%rcx
  246. 0x00007fffb90575f2 <+690>: movl $0x0,(%rcx)
  247. 0x00007fffb90575f8 <+696>: mfence
  248. 0x00007fffb90575fb <+699>: mov 0x275b180e(%rip),%rcx # 0x7fffe0608e10 <_ZN2at4cuda6detailL22high_priority_countersE+16>
  249. 0x00007fffb9057602 <+706>: mov 0x275b181f(%rip),%rsi # 0x7fffe0608e28 <_ZN2at4cuda6detailL22high_priority_countersE+40>
  250. 0x00007fffb9057609 <+713>: mov %rcx,%rax
  251. 0x00007fffb905760c <+716>: sub 0x275b1805(%rip),%rax # 0x7fffe0608e18 <_ZN2at4cuda6detailL22high_priority_countersE+24>
  252. 0x00007fffb9057613 <+723>: add %rdi,%rcx
  253. 0x00007fffb9057616 <+726>: sar $0x2,%rax
  254. 0x00007fffb905761a <+730>: add %rdx,%rax
  255. 0x00007fffb905761d <+733>: cmp $0x7f,%rax
  256. 0x00007fffb9057621 <+737>: jbe 0x7fffb9057645 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+773>
  257. 0x00007fffb9057623 <+739>: mov %rax,%rcx
  258. 0x00007fffb9057626 <+742>: sar $0x7,%rcx
  259. 0x00007fffb905762a <+746>: test %rax,%rax
  260. 0x00007fffb905762d <+749>: jle 0x7fffb90576c0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+896>
  261. 0x00007fffb9057633 <+755>: mov %rcx,%r8
  262. 0x00007fffb9057636 <+758>: mov (%rsi,%rcx,8),%rcx
  263. 0x00007fffb905763a <+762>: shl $0x7,%r8
  264. 0x00007fffb905763e <+766>: sub %r8,%rax
  265. 0x00007fffb9057641 <+769>: lea (%rcx,%rax,4),%rcx
  266. 0x00007fffb9057645 <+773>: movl $0x0,(%rcx)
  267. 0x00007fffb905764b <+779>: add $0x1,%rdx
  268. ---Type <return> to continue, or q <return> to quit---
  269. 0x00007fffb905764f <+783>: add $0x4,%rdi
  270. 0x00007fffb9057653 <+787>: mfence
  271. 0x00007fffb9057656 <+790>: cmp %rdx,0x261d5fb3(%rip) # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  272. 0x00007fffb905765d <+797>: jle 0x7fffb90576d8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+920>
  273. 0x00007fffb905765f <+799>: mov %rdx,%rax
  274. 0x00007fffb9057662 <+802>: mov 0x275b1827(%rip),%rcx # 0x7fffe0608e90 <_ZN2at4cuda6detailL21low_priority_countersE+16>
  275. 0x00007fffb9057669 <+809>: mov 0x275b1838(%rip),%rsi # 0x7fffe0608ea8 <_ZN2at4cuda6detailL21low_priority_countersE+40>
  276. 0x00007fffb9057670 <+816>: shl $0x4,%rax
  277. 0x00007fffb9057674 <+820>: add 0x275b18d5(%rip),%rax # 0x7fffe0608f50 <_ZN2at4cuda6detailL15default_streamsE>
  278. 0x00007fffb905767b <+827>: mov %rdx,(%rax)
  279. 0x00007fffb905767e <+830>: mov %rcx,%rax
  280. 0x00007fffb9057681 <+833>: sub 0x275b1810(%rip),%rax # 0x7fffe0608e98 <_ZN2at4cuda6detailL21low_priority_countersE+24>
  281. 0x00007fffb9057688 <+840>: add %rdi,%rcx
  282. 0x00007fffb905768b <+843>: sar $0x2,%rax
  283. 0x00007fffb905768f <+847>: add %rdx,%rax
  284. 0x00007fffb9057692 <+850>: cmp $0x7f,%rax
  285. 0x00007fffb9057696 <+854>: jbe 0x7fffb90575f2 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+690>
  286. 0x00007fffb905769c <+860>: mov %rax,%rcx
  287. 0x00007fffb905769f <+863>: sar $0x7,%rcx
  288. 0x00007fffb90576a3 <+867>: test %rax,%rax
  289. 0x00007fffb90576a6 <+870>: jg 0x7fffb90575e0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+672>
  290. 0x00007fffb90576ac <+876>: mov %rax,%rcx
  291. 0x00007fffb90576af <+879>: not %rcx
  292. 0x00007fffb90576b2 <+882>: shr $0x7,%rcx
  293. 0x00007fffb90576b6 <+886>: not %rcx
  294. 0x00007fffb90576b9 <+889>: jmpq 0x7fffb90575e0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+672>
  295. 0x00007fffb90576be <+894>: xchg %ax,%ax
  296. 0x00007fffb90576c0 <+896>: mov %rax,%rcx
  297. 0x00007fffb90576c3 <+899>: not %rcx
  298. 0x00007fffb90576c6 <+902>: shr $0x7,%rcx
  299. 0x00007fffb90576ca <+906>: not %rcx
  300. 0x00007fffb90576cd <+909>: jmpq 0x7fffb9057633 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+755>
  301. ---Type <return> to continue, or q <return> to quit---
  302. 0x00007fffb90576d2 <+914>: nopw 0x0(%rax,%rax,1)
  303. 0x00007fffb90576d8 <+920>: add $0x18,%rsp
  304. 0x00007fffb90576dc <+924>: pop %rbx
  305. 0x00007fffb90576dd <+925>: pop %rbp
  306. 0x00007fffb90576de <+926>: pop %r12
  307. 0x00007fffb90576e0 <+928>: pop %r13
  308. 0x00007fffb90576e2 <+930>: pop %r14
  309. 0x00007fffb90576e4 <+932>: pop %r15
  310. 0x00007fffb90576e6 <+934>: retq
  311. 0x00007fffb90576e7 <+935>: nopw 0x0(%rax,%rax,1)
  312. 0x00007fffb90576f0 <+944>: jbe 0x7fffb90574c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+389>
  313. 0x00007fffb90576f6 <+950>: mov 0x275b171b(%rip),%r14 # 0x7fffe0608e18 <_ZN2at4cuda6detailL22high_priority_countersE+24>
  314. 0x00007fffb90576fd <+957>: mov %rdi,%rax
  315. 0x00007fffb9057700 <+960>: lea (%rdi,%r8,4),%r13
  316. 0x00007fffb9057704 <+964>: sub %r14,%rax
  317. 0x00007fffb9057707 <+967>: sar $0x2,%rax
  318. 0x00007fffb905770b <+971>: add %r8,%rax
  319. 0x00007fffb905770e <+974>: cmp $0x7f,%rax
  320. 0x00007fffb9057712 <+978>: jbe 0x7fffb905773d <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1021>
  321. 0x00007fffb9057714 <+980>: mov %rax,%rdx
  322. 0x00007fffb9057717 <+983>: sar $0x7,%rdx
  323. 0x00007fffb905771b <+987>: test %rax,%rax
  324. 0x00007fffb905771e <+990>: jle 0x7fffb9057e6f <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2863>
  325. 0x00007fffb9057724 <+996>: lea (%rbx,%rdx,8),%rbx
  326. 0x00007fffb9057728 <+1000>: shl $0x7,%rdx
  327. 0x00007fffb905772c <+1004>: sub %rdx,%rax
  328. 0x00007fffb905772f <+1007>: mov (%rbx),%r14
  329. 0x00007fffb9057732 <+1010>: lea 0x200(%r14),%rbp
  330. 0x00007fffb9057739 <+1017>: lea (%r14,%rax,4),%r13
  331. 0x00007fffb905773d <+1021>: lea 0x8(%rbx),%r15
  332. 0x00007fffb9057741 <+1025>: add $0x8,%r12
  333. 0x00007fffb9057745 <+1029>: cmp %r15,%r12
  334. 0x00007fffb9057748 <+1032>: jbe 0x7fffb9057768 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1064>
  335. 0x00007fffb905774a <+1034>: nopw 0x0(%rax,%rax,1)
  336. ---Type <return> to continue, or q <return> to quit---
  337. 0x00007fffb9057750 <+1040>: mov (%r15),%rdi
  338. 0x00007fffb9057753 <+1043>: add $0x8,%r15
  339. 0x00007fffb9057757 <+1047>: callq 0x7fffb8e527c0 <_ZdlPv@plt>
  340. 0x00007fffb905775c <+1052>: cmp %r15,%r12
  341. 0x00007fffb905775f <+1055>: ja 0x7fffb9057750 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1040>
  342. 0x00007fffb9057761 <+1057>: mov 0x261d5ea8(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  343. 0x00007fffb9057768 <+1064>: mov %r13,0x8(%rsp)
  344. 0x00007fffb905776d <+1069>: movq 0x8(%rsp),%xmm0
  345. 0x00007fffb9057773 <+1075>: mov %rbp,0x8(%rsp)
  346. 0x00007fffb9057778 <+1080>: pinsrq $0x1,%r14,%xmm0
  347. 0x00007fffb905777f <+1087>: movaps %xmm0,0x275b16aa(%rip) # 0x7fffe0608e30 <_ZN2at4cuda6detailL22high_priority_countersE+48>
  348. 0x00007fffb9057786 <+1094>: movq 0x8(%rsp),%xmm0
  349. 0x00007fffb905778c <+1100>: pinsrq $0x1,%rbx,%xmm0
  350. 0x00007fffb9057793 <+1107>: movaps %xmm0,0x275b16a6(%rip) # 0x7fffe0608e40 <_ZN2at4cuda6detailL22high_priority_countersE+64>
  351. 0x00007fffb905779a <+1114>: jmpq 0x7fffb90574c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+389>
  352. 0x00007fffb905779f <+1119>: nop
  353. 0x00007fffb90577a0 <+1120>: jbe 0x7fffb905745a <_ZN2at4cuda6detailL21initGlobalStreamStateEv+282>
  354. 0x00007fffb90577a6 <+1126>: mov 0x275b16eb(%rip),%r14 # 0x7fffe0608e98 <_ZN2at4cuda6detailL21low_priority_countersE+24>
  355. 0x00007fffb90577ad <+1133>: mov %rdi,%rax
  356. 0x00007fffb90577b0 <+1136>: lea (%rdi,%r8,4),%r13
  357. 0x00007fffb90577b4 <+1140>: sub %r14,%rax
  358. 0x00007fffb90577b7 <+1143>: sar $0x2,%rax
  359. 0x00007fffb90577bb <+1147>: add %r8,%rax
  360. 0x00007fffb90577be <+1150>: cmp $0x7f,%rax
  361. 0x00007fffb90577c2 <+1154>: jbe 0x7fffb90577ed <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1197>
  362. 0x00007fffb90577c4 <+1156>: mov %rax,%rdx
  363. 0x00007fffb90577c7 <+1159>: sar $0x7,%rdx
  364. 0x00007fffb90577cb <+1163>: test %rax,%rax
  365. 0x00007fffb90577ce <+1166>: jle 0x7fffb9057e5d <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2845>
  366. 0x00007fffb90577d4 <+1172>: lea (%rbx,%rdx,8),%rbx
  367. 0x00007fffb90577d8 <+1176>: shl $0x7,%rdx
  368. 0x00007fffb90577dc <+1180>: sub %rdx,%rax
  369. ---Type <return> to continue, or q <return> to quit---
  370. 0x00007fffb90577df <+1183>: mov (%rbx),%r14
  371. 0x00007fffb90577e2 <+1186>: lea 0x200(%r14),%rbp
  372. 0x00007fffb90577e9 <+1193>: lea (%r14,%rax,4),%r13
  373. 0x00007fffb90577ed <+1197>: lea 0x8(%rbx),%r15
  374. 0x00007fffb90577f1 <+1201>: add $0x8,%r12
  375. 0x00007fffb90577f5 <+1205>: cmp %r15,%r12
  376. 0x00007fffb90577f8 <+1208>: jbe 0x7fffb9057818 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1240>
  377. 0x00007fffb90577fa <+1210>: nopw 0x0(%rax,%rax,1)
  378. 0x00007fffb9057800 <+1216>: mov (%r15),%rdi
  379. 0x00007fffb9057803 <+1219>: add $0x8,%r15
  380. 0x00007fffb9057807 <+1223>: callq 0x7fffb8e527c0 <_ZdlPv@plt>
  381. 0x00007fffb905780c <+1228>: cmp %r15,%r12
  382. 0x00007fffb905780f <+1231>: ja 0x7fffb9057800 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1216>
  383. 0x00007fffb9057811 <+1233>: mov 0x261d5df8(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  384. 0x00007fffb9057818 <+1240>: mov %r13,0x8(%rsp)
  385. 0x00007fffb905781d <+1245>: movq 0x8(%rsp),%xmm0
  386. 0x00007fffb9057823 <+1251>: mov %rbp,0x8(%rsp)
  387. 0x00007fffb9057828 <+1256>: pinsrq $0x1,%r14,%xmm0
  388. 0x00007fffb905782f <+1263>: movaps %xmm0,0x275b167a(%rip) # 0x7fffe0608eb0 <_ZN2at4cuda6detailL21low_priority_countersE+48>
  389. 0x00007fffb9057836 <+1270>: movq 0x8(%rsp),%xmm0
  390. 0x00007fffb905783c <+1276>: pinsrq $0x1,%rbx,%xmm0
  391. 0x00007fffb9057843 <+1283>: movaps %xmm0,0x275b1676(%rip) # 0x7fffe0608ec0 <_ZN2at4cuda6detailL21low_priority_countersE+64>
  392. 0x00007fffb905784a <+1290>: jmpq 0x7fffb905745a <_ZN2at4cuda6detailL21initGlobalStreamStateEv+282>
  393. 0x00007fffb905784f <+1295>: nop
  394. 0x00007fffb9057850 <+1296>: jbe 0x7fffb90573ef <_ZN2at4cuda6detailL21initGlobalStreamStateEv+175>
  395. 0x00007fffb9057856 <+1302>: mov 0x275b16bb(%rip),%r14 # 0x7fffe0608f18 <_ZN2at4cuda6detailL12device_flagsE+24>
  396. 0x00007fffb905785d <+1309>: mov %rdi,%rax
  397. 0x00007fffb9057860 <+1312>: lea (%rdi,%r8,4),%r13
  398. 0x00007fffb9057864 <+1316>: sub %r14,%rax
  399. 0x00007fffb9057867 <+1319>: sar $0x2,%rax
  400. 0x00007fffb905786b <+1323>: add %r8,%rax
  401. 0x00007fffb905786e <+1326>: cmp $0x7f,%rax
  402. 0x00007fffb9057872 <+1330>: jbe 0x7fffb905789d <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1373>
  403. ---Type <return> to continue, or q <return> to quit---
  404. 0x00007fffb9057874 <+1332>: mov %rax,%rdx
  405. 0x00007fffb9057877 <+1335>: sar $0x7,%rdx
  406. 0x00007fffb905787b <+1339>: test %rax,%rax
  407. 0x00007fffb905787e <+1342>: jle 0x7fffb9057e4b <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2827>
  408. 0x00007fffb9057884 <+1348>: lea (%rbx,%rdx,8),%rbx
  409. 0x00007fffb9057888 <+1352>: shl $0x7,%rdx
  410. 0x00007fffb905788c <+1356>: sub %rdx,%rax
  411. 0x00007fffb905788f <+1359>: mov (%rbx),%r14
  412. 0x00007fffb9057892 <+1362>: lea 0x200(%r14),%rbp
  413. 0x00007fffb9057899 <+1369>: lea (%r14,%rax,4),%r13
  414. 0x00007fffb905789d <+1373>: lea 0x8(%rbx),%r15
  415. 0x00007fffb90578a1 <+1377>: add $0x8,%r12
  416. 0x00007fffb90578a5 <+1381>: cmp %r15,%r12
  417. 0x00007fffb90578a8 <+1384>: jbe 0x7fffb90578c8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1416>
  418. 0x00007fffb90578aa <+1386>: nopw 0x0(%rax,%rax,1)
  419. 0x00007fffb90578b0 <+1392>: mov (%r15),%rdi
  420. 0x00007fffb90578b3 <+1395>: add $0x8,%r15
  421. 0x00007fffb90578b7 <+1399>: callq 0x7fffb8e527c0 <_ZdlPv@plt>
  422. 0x00007fffb90578bc <+1404>: cmp %r15,%r12
  423. 0x00007fffb90578bf <+1407>: ja 0x7fffb90578b0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1392>
  424. 0x00007fffb90578c1 <+1409>: mov 0x261d5d48(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  425. 0x00007fffb90578c8 <+1416>: mov %r13,0x8(%rsp)
  426. 0x00007fffb90578cd <+1421>: movq 0x8(%rsp),%xmm0
  427. 0x00007fffb90578d3 <+1427>: mov %rbp,0x8(%rsp)
  428. 0x00007fffb90578d8 <+1432>: pinsrq $0x1,%r14,%xmm0
  429. 0x00007fffb90578df <+1439>: movaps %xmm0,0x275b164a(%rip) # 0x7fffe0608f30 <_ZN2at4cuda6detailL12device_flagsE+48>
  430. 0x00007fffb90578e6 <+1446>: movq 0x8(%rsp),%xmm0
  431. 0x00007fffb90578ec <+1452>: pinsrq $0x1,%rbx,%xmm0
  432. 0x00007fffb90578f3 <+1459>: movaps %xmm0,0x275b1646(%rip) # 0x7fffe0608f40 <_ZN2at4cuda6detailL12device_flagsE+64>
  433. 0x00007fffb90578fa <+1466>: jmpq 0x7fffb90573ef <_ZN2at4cuda6detailL21initGlobalStreamStateEv+175>
  434. 0x00007fffb90578ff <+1471>: mov %r8,%r12
  435. 0x00007fffb9057902 <+1474>: shl $0x4,%r12
  436. 0x00007fffb9057906 <+1478>: add %rdx,%r12
  437. ---Type <return> to continue, or q <return> to quit---
  438. 0x00007fffb9057909 <+1481>: cmp %r12,%rbp
  439. 0x00007fffb905790c <+1484>: je 0x7fffb9057936 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1526>
  440. 0x00007fffb905790e <+1486>: mov %r12,%rbx
  441. 0x00007fffb9057911 <+1489>: nopl 0x0(%rax)
  442. 0x00007fffb9057918 <+1496>: mov 0x8(%rbx),%rdi
  443. 0x00007fffb905791c <+1500>: test %rdi,%rdi
  444. 0x00007fffb905791f <+1503>: je 0x7fffb9057926 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1510>
  445. 0x00007fffb9057921 <+1505>: callq 0x7fffbac47820 <cudaStreamDestroy>
  446. 0x00007fffb9057926 <+1510>: add $0x10,%rbx
  447. 0x00007fffb905792a <+1514>: cmp %rbx,%rbp
  448. 0x00007fffb905792d <+1517>: jne 0x7fffb9057918 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1496>
  449. 0x00007fffb905792f <+1519>: mov 0x261d5cda(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  450. 0x00007fffb9057936 <+1526>: mov %r12,0x275b161b(%rip) # 0x7fffe0608f58 <_ZN2at4cuda6detailL15default_streamsE+8>
  451. 0x00007fffb905793d <+1533>: jmpq 0x7fffb9057384 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+68>
  452. 0x00007fffb9057942 <+1538>: nopw 0x0(%rax,%rax,1)
  453. 0x00007fffb9057948 <+1544>: mov $0x200,%r14d
  454. 0x00007fffb905794e <+1550>: cmp %r14,%r12
  455. 0x00007fffb9057951 <+1553>: mov %r14,%rbp
  456. 0x00007fffb9057954 <+1556>: jne 0x7fffb9057580 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+576>
  457. 0x00007fffb905795a <+1562>: jmpq 0x7fffb90575b7 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+631>
  458. 0x00007fffb905795f <+1567>: nop
  459. 0x00007fffb9057960 <+1568>: mov $0x200,%r14d
  460. 0x00007fffb9057966 <+1574>: cmp %r14,%r12
  461. 0x00007fffb9057969 <+1577>: mov %r14,%rbp
  462. 0x00007fffb905796c <+1580>: jne 0x7fffb9057500 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+448>
  463. 0x00007fffb9057972 <+1586>: jmpq 0x7fffb9057537 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+503>
  464. 0x00007fffb9057977 <+1591>: mov %r8,%rsi
  465. 0x00007fffb905797a <+1594>: lea 0x275b15cf(%rip),%rdi # 0x7fffe0608f50 <_ZN2at4cuda6detailL15default_streamsE>
  466. 0x00007fffb9057981 <+1601>: sub %rax,%rsi
  467. 0x00007fffb9057984 <+1604>: callq 0x7fffb8e4dc20 <_ZNSt6vectorI19CUDAStreamInternalsSaIS0_EE17_M_default_appendEm@plt>
  468. 0x00007fffb9057989 <+1609>: mov 0x261d5c80(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  469. 0x00007fffb9057990 <+1616>: jmpq 0x7fffb9057384 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+68>
  470. 0x00007fffb9057995 <+1621>: mov %r8,%rsi
  471. 0x00007fffb9057998 <+1624>: sub %rax,%rsi
  472. ---Type <return> to continue, or q <return> to quit---
  473. 0x00007fffb905799b <+1627>: je 0x7fffb9057545 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+517>
  474. 0x00007fffb90579a1 <+1633>: mov 0x275b1448(%rip),%rax # 0x7fffe0608df0 <_ZN2at4cuda6detailL20low_priority_streamsE+16>
  475. 0x00007fffb90579a8 <+1640>: sub %r12,%rax
  476. 0x00007fffb90579ab <+1643>: sar $0x9,%rax
  477. 0x00007fffb90579af <+1647>: cmp %rax,%rsi
  478. 0x00007fffb90579b2 <+1650>: jbe 0x7fffb9057d80 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2624>
  479. 0x00007fffb90579b8 <+1656>: lea 0x275b1421(%rip),%rdi # 0x7fffe0608de0 <_ZN2at4cuda6detailL20low_priority_streamsE>
  480. 0x00007fffb90579bf <+1663>: callq 0x7fffb9055220 <_ZNSt6vectorISt5arrayI19CUDAStreamInternalsLm32EESaIS2_EE17_M_default_appendEm.part.107>
  481. 0x00007fffb90579c4 <+1668>: mov 0x261d5c45(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  482. 0x00007fffb90579cb <+1675>: jmpq 0x7fffb9057545 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+517>
  483. 0x00007fffb90579d0 <+1680>: mov %r8,%rsi
  484. 0x00007fffb90579d3 <+1683>: sub %rax,%rsi
  485. 0x00007fffb90579d6 <+1686>: je 0x7fffb90575c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+645>
  486. 0x00007fffb90579dc <+1692>: mov 0x275b13ed(%rip),%rax # 0x7fffe0608dd0 <_ZN2at4cuda6detailL21high_priority_streamsE+16>
  487. 0x00007fffb90579e3 <+1699>: sub %r12,%rax
  488. 0x00007fffb90579e6 <+1702>: sar $0x9,%rax
  489. 0x00007fffb90579ea <+1706>: cmp %rax,%rsi
  490. 0x00007fffb90579ed <+1709>: jbe 0x7fffb9057de3 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2723>
  491. 0x00007fffb90579f3 <+1715>: lea 0x275b13c6(%rip),%rdi # 0x7fffe0608dc0 <_ZN2at4cuda6detailL21high_priority_streamsE>
  492. 0x00007fffb90579fa <+1722>: callq 0x7fffb9055220 <_ZNSt6vectorISt5arrayI19CUDAStreamInternalsLm32EESaIS2_EE17_M_default_appendEm.part.107>
  493. 0x00007fffb90579ff <+1727>: mov 0x261d5c0a(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  494. 0x00007fffb9057a06 <+1734>: jmpq 0x7fffb90575c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+645>
  495. 0x00007fffb9057a0b <+1739>: mov 0x275b14ae(%rip),%rcx # 0x7fffe0608ec0 <_ZN2at4cuda6detailL21low_priority_countersE+64>
  496. 0x00007fffb9057a12 <+1746>: mov %rcx,%rax
  497. 0x00007fffb9057a15 <+1749>: sub %rdx,%rax
  498. 0x00007fffb9057a18 <+1752>: sar $0x2,%rax
  499. 0x00007fffb9057a1c <+1756>: sub $0x1,%rax
  500. 0x00007fffb9057a20 <+1760>: cmp %rax,%rbx
  501. ---Type <return> to continue, or q <return> to quit---
  502. 0x00007fffb9057a23 <+1763>: ja 0x7fffb9057cc9 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2441>
  503. 0x00007fffb9057a29 <+1769>: mov %rdx,%rax
  504. 0x00007fffb9057a2c <+1772>: add %rbx,%rsi
  505. 0x00007fffb9057a2f <+1775>: cmp $0x7f,%rsi
  506. 0x00007fffb9057a33 <+1779>: ja 0x7fffb9057c90 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2384>
  507. 0x00007fffb9057a39 <+1785>: mov %rcx,0x8(%rsp)
  508. 0x00007fffb9057a3e <+1790>: lea (%rax,%rbx,4),%rdx
  509. 0x00007fffb9057a42 <+1794>: mov %r12,%rdi
  510. 0x00007fffb9057a45 <+1797>: movq 0x8(%rsp),%xmm1
  511. 0x00007fffb9057a4b <+1803>: lea 0x8(%r12),%rsi
  512. 0x00007fffb9057a50 <+1808>: jmp 0x7fffb9057a70 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1840>
  513. 0x00007fffb9057a52 <+1810>: nopw 0x0(%rax,%rax,1)
  514. 0x00007fffb9057a58 <+1816>: test %rax,%rax
  515. 0x00007fffb9057a5b <+1819>: je 0x7fffb9057a63 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1827>
  516. 0x00007fffb9057a5d <+1821>: movl $0x0,(%rax)
  517. 0x00007fffb9057a63 <+1827>: add $0x4,%rax
  518. 0x00007fffb9057a67 <+1831>: cmp %rax,%rcx
  519. 0x00007fffb9057a6a <+1834>: je 0x7fffb9057be8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2216>
  520. 0x00007fffb9057a70 <+1840>: cmp %rdx,%rax
  521. 0x00007fffb9057a73 <+1843>: jne 0x7fffb9057a58 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1816>
  522. 0x00007fffb9057a75 <+1845>: mov %rax,0x8(%rsp)
  523. 0x00007fffb9057a7a <+1850>: mov 0x261d5b8f(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  524. 0x00007fffb9057a81 <+1857>: movq 0x8(%rsp),%xmm0
  525. 0x00007fffb9057a87 <+1863>: pinsrq $0x1,%r9,%xmm0
  526. 0x00007fffb9057a8e <+1870>: movaps %xmm0,0x275b141b(%rip) # 0x7fffe0608eb0 <_ZN2at4cuda6detailL21low_priority_countersE+48>
  527. 0x00007fffb9057a95 <+1877>: movdqa %xmm1,%xmm0
  528. 0x00007fffb9057a99 <+1881>: pinsrq $0x1,%rdi,%xmm0
  529. 0x00007fffb9057aa0 <+1888>: movaps %xmm0,0x275b1419(%rip) # 0x7fffe0608ec0 <_ZN2at4cuda6detailL21low_priority_countersE+64>
  530. 0x00007fffb9057aa7 <+1895>: jmpq 0x7fffb905745a <_ZN2at4cuda6detailL21initGlobalStreamStateEv+282>
  531. 0x00007fffb9057aac <+1900>: mov 0x275b138d(%rip),%rcx # 0x7fffe0608e40 <_ZN2at4cuda6detailL22high_priority_countersE+64>
  532. 0x00007fffb9057ab3 <+1907>: mov %rcx,%rax
  533. 0x00007fffb9057ab6 <+1910>: sub %rdx,%rax
  534. ---Type <return> to continue, or q <return> to quit---
  535. 0x00007fffb9057ab9 <+1913>: sar $0x2,%rax
  536. 0x00007fffb9057abd <+1917>: sub $0x1,%rax
  537. 0x00007fffb9057ac1 <+1921>: cmp %rax,%rbx
  538. 0x00007fffb9057ac4 <+1924>: ja 0x7fffb9057d43 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2563>
  539. 0x00007fffb9057aca <+1930>: mov %rdx,%rax
  540. 0x00007fffb9057acd <+1933>: add %rbx,%rsi
  541. 0x00007fffb9057ad0 <+1936>: cmp $0x7f,%rsi
  542. 0x00007fffb9057ad4 <+1940>: ja 0x7fffb9057c57 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2327>
  543. 0x00007fffb9057ada <+1946>: mov %rcx,0x8(%rsp)
  544. 0x00007fffb9057adf <+1951>: lea (%rax,%rbx,4),%rdx
  545. 0x00007fffb9057ae3 <+1955>: mov %r12,%rdi
  546. 0x00007fffb9057ae6 <+1958>: movq 0x8(%rsp),%xmm1
  547. 0x00007fffb9057aec <+1964>: lea 0x8(%r12),%rsi
  548. 0x00007fffb9057af1 <+1969>: jmp 0x7fffb9057b10 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2000>
  549. 0x00007fffb9057af3 <+1971>: nopl 0x0(%rax,%rax,1)
  550. 0x00007fffb9057af8 <+1976>: test %rax,%rax
  551. 0x00007fffb9057afb <+1979>: je 0x7fffb9057b03 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1987>
  552. 0x00007fffb9057afd <+1981>: movl $0x0,(%rax)
  553. 0x00007fffb9057b03 <+1987>: add $0x4,%rax
  554. 0x00007fffb9057b07 <+1991>: cmp %rax,%rcx
  555. 0x00007fffb9057b0a <+1994>: je 0x7fffb9057c0b <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2251>
  556. 0x00007fffb9057b10 <+2000>: cmp %rdx,%rax
  557. 0x00007fffb9057b13 <+2003>: jne 0x7fffb9057af8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1976>
  558. 0x00007fffb9057b15 <+2005>: mov %rax,0x8(%rsp)
  559. 0x00007fffb9057b1a <+2010>: mov 0x261d5aef(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  560. 0x00007fffb9057b21 <+2017>: movq 0x8(%rsp),%xmm0
  561. 0x00007fffb9057b27 <+2023>: pinsrq $0x1,%r9,%xmm0
  562. 0x00007fffb9057b2e <+2030>: movaps %xmm0,0x275b12fb(%rip) # 0x7fffe0608e30 <_ZN2at4cuda6detailL22high_priority_countersE+48>
  563. 0x00007fffb9057b35 <+2037>: movdqa %xmm1,%xmm0
  564. 0x00007fffb9057b39 <+2041>: pinsrq $0x1,%rdi,%xmm0
  565. 0x00007fffb9057b40 <+2048>: movaps %xmm0,0x275b12f9(%rip) # 0x7fffe0608e40 <_ZN2at4cuda6detailL22high_priority_countersE+64>
  566. 0x00007fffb9057b47 <+2055>: jmpq 0x7fffb90574c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+389>
  567. 0x00007fffb9057b4c <+2060>: mov 0x275b13ed(%rip),%rcx # 0x7fffe0608f40 <_ZN2at4cuda6detailL12device_flagsE+64>
  568. ---Type <return> to continue, or q <return> to quit---
  569. 0x00007fffb9057b53 <+2067>: mov %rcx,%rax
  570. 0x00007fffb9057b56 <+2070>: sub %rdx,%rax
  571. 0x00007fffb9057b59 <+2073>: sar $0x2,%rax
  572. 0x00007fffb9057b5d <+2077>: sub $0x1,%rax
  573. 0x00007fffb9057b61 <+2081>: cmp %rax,%rbx
  574. 0x00007fffb9057b64 <+2084>: ja 0x7fffb9057d06 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2502>
  575. 0x00007fffb9057b6a <+2090>: mov %rdx,%rax
  576. 0x00007fffb9057b6d <+2093>: add %rbx,%rsi
  577. 0x00007fffb9057b70 <+2096>: cmp $0x7f,%rsi
  578. 0x00007fffb9057b74 <+2100>: ja 0x7fffb9057c1e <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2270>
  579. 0x00007fffb9057b7a <+2106>: mov %rcx,0x8(%rsp)
  580. 0x00007fffb9057b7f <+2111>: lea (%rax,%rbx,4),%rdx
  581. 0x00007fffb9057b83 <+2115>: mov %r12,%rdi
  582. 0x00007fffb9057b86 <+2118>: movq 0x8(%rsp),%xmm1
  583. 0x00007fffb9057b8c <+2124>: lea 0x8(%r12),%rsi
  584. 0x00007fffb9057b91 <+2129>: jmp 0x7fffb9057bac <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2156>
  585. 0x00007fffb9057b93 <+2131>: nopl 0x0(%rax,%rax,1)
  586. 0x00007fffb9057b98 <+2136>: test %rax,%rax
  587. 0x00007fffb9057b9b <+2139>: je 0x7fffb9057ba3 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2147>
  588. 0x00007fffb9057b9d <+2141>: movl $0x0,(%rax)
  589. 0x00007fffb9057ba3 <+2147>: add $0x4,%rax
  590. 0x00007fffb9057ba7 <+2151>: cmp %rax,%rcx
  591. 0x00007fffb9057baa <+2154>: je 0x7fffb9057bfb <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2235>
  592. 0x00007fffb9057bac <+2156>: cmp %rdx,%rax
  593. 0x00007fffb9057baf <+2159>: jne 0x7fffb9057b98 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2136>
  594. 0x00007fffb9057bb1 <+2161>: mov %rax,0x8(%rsp)
  595. 0x00007fffb9057bb6 <+2166>: mov 0x261d5a53(%rip),%r8 # 0x7fffdf22d610 <_ZN2at4cuda6detailL8num_gpusE>
  596. 0x00007fffb9057bbd <+2173>: movq 0x8(%rsp),%xmm0
  597. => 0x00007fffb9057bc3 <+2179>: pinsrq $0x1,%r9,%xmm0
  598. 0x00007fffb9057bca <+2186>: movaps %xmm0,0x275b135f(%rip) # 0x7fffe0608f30 <_ZN2at4cuda6detailL12device_flagsE+48>
  599. 0x00007fffb9057bd1 <+2193>: movdqa %xmm1,%xmm0
  600. 0x00007fffb9057bd5 <+2197>: pinsrq $0x1,%rdi,%xmm0
  601. 0x00007fffb9057bdc <+2204>: movaps %xmm0,0x275b135d(%rip) # 0x7fffe0608f40 <_ZN2at4cuda6detailL12device_flagsE+64>
  602. ---Type <return> to continue, or q <return> to quit---
  603. 0x00007fffb9057be3 <+2211>: jmpq 0x7fffb90573ef <_ZN2at4cuda6detailL21initGlobalStreamStateEv+175>
  604. 0x00007fffb9057be8 <+2216>: mov (%rsi),%rax
  605. 0x00007fffb9057beb <+2219>: add $0x8,%rsi
  606. 0x00007fffb9057bef <+2223>: lea 0x200(%rax),%rcx
  607. 0x00007fffb9057bf6 <+2230>: jmpq 0x7fffb9057a70 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1840>
  608. 0x00007fffb9057bfb <+2235>: mov (%rsi),%rax
  609. 0x00007fffb9057bfe <+2238>: add $0x8,%rsi
  610. 0x00007fffb9057c02 <+2242>: lea 0x200(%rax),%rcx
  611. 0x00007fffb9057c09 <+2249>: jmp 0x7fffb9057bac <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2156>
  612. 0x00007fffb9057c0b <+2251>: mov (%rsi),%rax
  613. 0x00007fffb9057c0e <+2254>: add $0x8,%rsi
  614. 0x00007fffb9057c12 <+2258>: lea 0x200(%rax),%rcx
  615. 0x00007fffb9057c19 <+2265>: jmpq 0x7fffb9057b10 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2000>
  616. 0x00007fffb9057c1e <+2270>: mov %rsi,%rdx
  617. 0x00007fffb9057c21 <+2273>: sar $0x7,%rdx
  618. 0x00007fffb9057c25 <+2277>: test %rsi,%rsi
  619. 0x00007fffb9057c28 <+2280>: jle 0x7fffb9057ea5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2917>
  620. 0x00007fffb9057c2e <+2286>: lea (%r12,%rdx,8),%rdi
  621. 0x00007fffb9057c32 <+2290>: shl $0x7,%rdx
  622. 0x00007fffb9057c36 <+2294>: sub %rdx,%rsi
  623. 0x00007fffb9057c39 <+2297>: mov (%rdi),%r9
  624. 0x00007fffb9057c3c <+2300>: lea 0x200(%r9),%rbx
  625. 0x00007fffb9057c43 <+2307>: lea (%r9,%rsi,4),%rdx
  626. 0x00007fffb9057c47 <+2311>: mov %rbx,0x8(%rsp)
  627. 0x00007fffb9057c4c <+2316>: movq 0x8(%rsp),%xmm1
  628. 0x00007fffb9057c52 <+2322>: jmpq 0x7fffb9057b8c <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2124>
  629. 0x00007fffb9057c57 <+2327>: mov %rsi,%rdx
  630. 0x00007fffb9057c5a <+2330>: sar $0x7,%rdx
  631. 0x00007fffb9057c5e <+2334>: test %rsi,%rsi
  632. 0x00007fffb9057c61 <+2337>: jle 0x7fffb9057e93 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2899>
  633. 0x00007fffb9057c67 <+2343>: lea (%r12,%rdx,8),%rdi
  634. 0x00007fffb9057c6b <+2347>: shl $0x7,%rdx
  635. 0x00007fffb9057c6f <+2351>: sub %rdx,%rsi
  636. 0x00007fffb9057c72 <+2354>: mov (%rdi),%r9
  637. 0x00007fffb9057c75 <+2357>: lea 0x200(%r9),%rbx
  638. ---Type <return> to continue, or q <return> to quit---
  639. 0x00007fffb9057c7c <+2364>: lea (%r9,%rsi,4),%rdx
  640. 0x00007fffb9057c80 <+2368>: mov %rbx,0x8(%rsp)
  641. 0x00007fffb9057c85 <+2373>: movq 0x8(%rsp),%xmm1
  642. 0x00007fffb9057c8b <+2379>: jmpq 0x7fffb9057aec <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1964>
  643. 0x00007fffb9057c90 <+2384>: mov %rsi,%rdx
  644. 0x00007fffb9057c93 <+2387>: sar $0x7,%rdx
  645. 0x00007fffb9057c97 <+2391>: test %rsi,%rsi
  646. 0x00007fffb9057c9a <+2394>: jle 0x7fffb9057e81 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2881>
  647. 0x00007fffb9057ca0 <+2400>: lea (%r12,%rdx,8),%rdi
  648. 0x00007fffb9057ca4 <+2404>: shl $0x7,%rdx
  649. 0x00007fffb9057ca8 <+2408>: sub %rdx,%rsi
  650. 0x00007fffb9057cab <+2411>: mov (%rdi),%r9
  651. 0x00007fffb9057cae <+2414>: lea 0x200(%r9),%rbx
  652. 0x00007fffb9057cb5 <+2421>: lea (%r9,%rsi,4),%rdx
  653. 0x00007fffb9057cb9 <+2425>: mov %rbx,0x8(%rsp)
  654. 0x00007fffb9057cbe <+2430>: movq 0x8(%rsp),%xmm1
  655. 0x00007fffb9057cc4 <+2436>: jmpq 0x7fffb9057a4b <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1803>
  656. 0x00007fffb9057cc9 <+2441>: mov %rbx,%rsi
  657. 0x00007fffb9057ccc <+2444>: lea 0x275b11ad(%rip),%rdi # 0x7fffe0608e80 <_ZN2at4cuda6detailL21low_priority_countersE>
  658. 0x00007fffb9057cd3 <+2451>: sub %rax,%rsi
  659. 0x00007fffb9057cd6 <+2454>: callq 0x7fffb8e57410 <_ZNSt5dequeISt6atomicIjESaIS1_EE23_M_new_elements_at_backEm@plt>
  660. 0x00007fffb9057cdb <+2459>: mov 0x275b11ce(%rip),%rax # 0x7fffe0608eb0 <_ZN2at4cuda6detailL21low_priority_countersE+48>
  661. 0x00007fffb9057ce2 <+2466>: mov 0x275b11cf(%rip),%r9 # 0x7fffe0608eb8 <_ZN2at4cuda6detailL21low_priority_countersE+56>
  662. 0x00007fffb9057ce9 <+2473>: mov 0x275b11d0(%rip),%rcx # 0x7fffe0608ec0 <_ZN2at4cuda6detailL21low_priority_countersE+64>
  663. 0x00007fffb9057cf0 <+2480>: mov 0x275b11d1(%rip),%r12 # 0x7fffe0608ec8 <_ZN2at4cuda6detailL21low_priority_countersE+72>
  664. 0x00007fffb9057cf7 <+2487>: mov %rax,%rsi
  665. 0x00007fffb9057cfa <+2490>: sub %r9,%rsi
  666. 0x00007fffb9057cfd <+2493>: sar $0x2,%rsi
  667. 0x00007fffb9057d01 <+2497>: jmpq 0x7fffb9057a2c <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1772>
  668. 0x00007fffb9057d06 <+2502>: mov %rbx,%rsi
  669. ---Type <return> to continue, or q <return> to quit---
  670. 0x00007fffb9057d09 <+2505>: lea 0x275b11f0(%rip),%rdi # 0x7fffe0608f00 <_ZN2at4cuda6detailL12device_flagsE>
  671. 0x00007fffb9057d10 <+2512>: sub %rax,%rsi
  672. 0x00007fffb9057d13 <+2515>: callq 0x7fffb8e845a0 <_ZNSt5dequeISt9once_flagSaIS0_EE23_M_new_elements_at_backEm@plt>
  673. 0x00007fffb9057d18 <+2520>: mov 0x275b1211(%rip),%rax # 0x7fffe0608f30 <_ZN2at4cuda6detailL12device_flagsE+48>
  674. 0x00007fffb9057d1f <+2527>: mov 0x275b1212(%rip),%r9 # 0x7fffe0608f38 <_ZN2at4cuda6detailL12device_flagsE+56>
  675. 0x00007fffb9057d26 <+2534>: mov 0x275b1213(%rip),%rcx # 0x7fffe0608f40 <_ZN2at4cuda6detailL12device_flagsE+64>
  676. 0x00007fffb9057d2d <+2541>: mov 0x275b1214(%rip),%r12 # 0x7fffe0608f48 <_ZN2at4cuda6detailL12device_flagsE+72>
  677. 0x00007fffb9057d34 <+2548>: mov %rax,%rsi
  678. 0x00007fffb9057d37 <+2551>: sub %r9,%rsi
  679. 0x00007fffb9057d3a <+2554>: sar $0x2,%rsi
  680. 0x00007fffb9057d3e <+2558>: jmpq 0x7fffb9057b6d <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2093>
  681. 0x00007fffb9057d43 <+2563>: mov %rbx,%rsi
  682. 0x00007fffb9057d46 <+2566>: lea 0x275b10b3(%rip),%rdi # 0x7fffe0608e00 <_ZN2at4cuda6detailL22high_priority_countersE>
  683. 0x00007fffb9057d4d <+2573>: sub %rax,%rsi
  684. 0x00007fffb9057d50 <+2576>: callq 0x7fffb8e57410 <_ZNSt5dequeISt6atomicIjESaIS1_EE23_M_new_elements_at_backEm@plt>
  685. 0x00007fffb9057d55 <+2581>: mov 0x275b10d4(%rip),%rax # 0x7fffe0608e30 <_ZN2at4cuda6detailL22high_priority_countersE+48>
  686. 0x00007fffb9057d5c <+2588>: mov 0x275b10d5(%rip),%r9 # 0x7fffe0608e38 <_ZN2at4cuda6detailL22high_priority_countersE+56>
  687. 0x00007fffb9057d63 <+2595>: mov 0x275b10d6(%rip),%rcx # 0x7fffe0608e40 <_ZN2at4cuda6detailL22high_priority_countersE+64>
  688. 0x00007fffb9057d6a <+2602>: mov 0x275b10d7(%rip),%r12 # 0x7fffe0608e48 <_ZN2at4cuda6detailL22high_priority_countersE+72>
  689. 0x00007fffb9057d71 <+2609>: mov %rax,%rsi
  690. 0x00007fffb9057d74 <+2612>: sub %r9,%rsi
  691. 0x00007fffb9057d77 <+2615>: sar $0x2,%rsi
  692. 0x00007fffb9057d7b <+2619>: jmpq 0x7fffb9057acd <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1933>
  693. 0x00007fffb9057d80 <+2624>: mov %rsi,%r9
  694. 0x00007fffb9057d83 <+2627>: mov %r12,%rdx
  695. 0x00007fffb9057d86 <+2630>: xor %eax,%eax
  696. 0x00007fffb9057d88 <+2632>: mov $0x40,%r10d
  697. 0x00007fffb9057d8e <+2638>: xchg %ax,%ax
  698. 0x00007fffb9057d90 <+2640>: test %rdx,%rdx
  699. 0x00007fffb9057d93 <+2643>: je 0x7fffb9057ddc <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2716>
  700. ---Type <return> to continue, or q <return> to quit---
  701. 0x00007fffb9057d95 <+2645>: mov %rdx,%rdi
  702. 0x00007fffb9057d98 <+2648>: mov %r10,%rcx
  703. 0x00007fffb9057d9b <+2651>: rep stos %rax,%es:(%rdi)
  704. 0x00007fffb9057d9e <+2654>: lea 0x200(%rdx),%rdi
  705. 0x00007fffb9057da5 <+2661>: nopl (%rax)
  706. 0x00007fffb9057da8 <+2664>: movq $0xffffffffffffffff,(%rdx)
  707. 0x00007fffb9057daf <+2671>: movq $0x0,0x8(%rdx)
  708. 0x00007fffb9057db7 <+2679>: add $0x10,%rdx
  709. 0x00007fffb9057dbb <+2683>: cmp %rdi,%rdx
  710. 0x00007fffb9057dbe <+2686>: jne 0x7fffb9057da8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2664>
  711. 0x00007fffb9057dc0 <+2688>: sub $0x1,%r9
  712. 0x00007fffb9057dc4 <+2692>: mov %rdi,%rdx
  713. 0x00007fffb9057dc7 <+2695>: jne 0x7fffb9057d90 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2640>
  714. 0x00007fffb9057dc9 <+2697>: shl $0x9,%rsi
  715. 0x00007fffb9057dcd <+2701>: add %rsi,%r12
  716. 0x00007fffb9057dd0 <+2704>: mov %r12,0x275b1011(%rip) # 0x7fffe0608de8 <_ZN2at4cuda6detailL20low_priority_streamsE+8>
  717. 0x00007fffb9057dd7 <+2711>: jmpq 0x7fffb9057545 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+517>
  718. 0x00007fffb9057ddc <+2716>: mov $0x200,%edi
  719. 0x00007fffb9057de1 <+2721>: jmp 0x7fffb9057dc0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2688>
  720. 0x00007fffb9057de3 <+2723>: mov %rsi,%r9
  721. 0x00007fffb9057de6 <+2726>: mov %r12,%rdx
  722. 0x00007fffb9057de9 <+2729>: xor %eax,%eax
  723. 0x00007fffb9057deb <+2731>: mov $0x40,%r10d
  724. 0x00007fffb9057df1 <+2737>: nopl 0x0(%rax)
  725. 0x00007fffb9057df8 <+2744>: test %rdx,%rdx
  726. 0x00007fffb9057dfb <+2747>: je 0x7fffb9057e44 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2820>
  727. 0x00007fffb9057dfd <+2749>: mov %rdx,%rdi
  728. 0x00007fffb9057e00 <+2752>: mov %r10,%rcx
  729. 0x00007fffb9057e03 <+2755>: rep stos %rax,%es:(%rdi)
  730. 0x00007fffb9057e06 <+2758>: lea 0x200(%rdx),%rdi
  731. 0x00007fffb9057e0d <+2765>: nopl (%rax)
  732. 0x00007fffb9057e10 <+2768>: movq $0xffffffffffffffff,(%rdx)
  733. 0x00007fffb9057e17 <+2775>: movq $0x0,0x8(%rdx)
  734. 0x00007fffb9057e1f <+2783>: add $0x10,%rdx
  735. ---Type <return> to continue, or q <return> to quit---
  736. 0x00007fffb9057e23 <+2787>: cmp %rdi,%rdx
  737. 0x00007fffb9057e26 <+2790>: jne 0x7fffb9057e10 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2768>
  738. 0x00007fffb9057e28 <+2792>: sub $0x1,%r9
  739. 0x00007fffb9057e2c <+2796>: mov %rdi,%rdx
  740. 0x00007fffb9057e2f <+2799>: jne 0x7fffb9057df8 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2744>
  741. 0x00007fffb9057e31 <+2801>: shl $0x9,%rsi
  742. 0x00007fffb9057e35 <+2805>: add %rsi,%r12
  743. 0x00007fffb9057e38 <+2808>: mov %r12,0x275b0f89(%rip) # 0x7fffe0608dc8 <_ZN2at4cuda6detailL21high_priority_streamsE+8>
  744. 0x00007fffb9057e3f <+2815>: jmpq 0x7fffb90575c5 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+645>
  745. 0x00007fffb9057e44 <+2820>: mov $0x200,%edi
  746. 0x00007fffb9057e49 <+2825>: jmp 0x7fffb9057e28 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2792>
  747. 0x00007fffb9057e4b <+2827>: mov %rax,%rdx
  748. 0x00007fffb9057e4e <+2830>: not %rdx
  749. 0x00007fffb9057e51 <+2833>: shr $0x7,%rdx
  750. 0x00007fffb9057e55 <+2837>: not %rdx
  751. 0x00007fffb9057e58 <+2840>: jmpq 0x7fffb9057884 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1348>
  752. 0x00007fffb9057e5d <+2845>: mov %rax,%rdx
  753. 0x00007fffb9057e60 <+2848>: not %rdx
  754. 0x00007fffb9057e63 <+2851>: shr $0x7,%rdx
  755. 0x00007fffb9057e67 <+2855>: not %rdx
  756. 0x00007fffb9057e6a <+2858>: jmpq 0x7fffb90577d4 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+1172>
  757. 0x00007fffb9057e6f <+2863>: mov %rax,%rdx
  758. 0x00007fffb9057e72 <+2866>: not %rdx
  759. 0x00007fffb9057e75 <+2869>: shr $0x7,%rdx
  760. 0x00007fffb9057e79 <+2873>: not %rdx
  761. 0x00007fffb9057e7c <+2876>: jmpq 0x7fffb9057724 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+996>
  762. 0x00007fffb9057e81 <+2881>: mov %rsi,%rdx
  763. 0x00007fffb9057e84 <+2884>: not %rdx
  764. 0x00007fffb9057e87 <+2887>: shr $0x7,%rdx
  765. 0x00007fffb9057e8b <+2891>: not %rdx
  766. 0x00007fffb9057e8e <+2894>: jmpq 0x7fffb9057ca0 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2400>
  767. 0x00007fffb9057e93 <+2899>: mov %rsi,%rdx
  768. 0x00007fffb9057e96 <+2902>: not %rdx
  769. 0x00007fffb9057e99 <+2905>: shr $0x7,%rdx
  770. ---Type <return> to continue, or q <return> to quit---
  771. 0x00007fffb9057e9d <+2909>: not %rdx
  772. 0x00007fffb9057ea0 <+2912>: jmpq 0x7fffb9057c67 <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2343>
  773. 0x00007fffb9057ea5 <+2917>: mov %rsi,%rdx
  774. 0x00007fffb9057ea8 <+2920>: not %rdx
  775. 0x00007fffb9057eab <+2923>: shr $0x7,%rdx
  776. 0x00007fffb9057eaf <+2927>: not %rdx
  777. 0x00007fffb9057eb2 <+2930>: jmpq 0x7fffb9057c2e <_ZN2at4cuda6detailL21initGlobalStreamStateEv+2286>
  778. End of assembler dump.
  779. (gdb)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement