Advertisement
Guest User

dmtcp_launch

a guest
Nov 17th, 2014
316
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 137.86 KB | None | 0 0
  1. [slurm@slurm-master ~]$ dmtcp_launch --rm srun -n 2 mpiLoop 50
  2. [6365] TRACE at dmtcp_launch.cpp:419 in main; REASON='dmtcp_launch starting new program:'
  3. argv[0] = srun
  4. [6365] TRACE at dmtcp_launch.cpp:433 in main; REASON='setting DMTCP_CHECKPOINT_DIR'
  5. ckptDir = /home/slurm
  6. [6365] TRACE at coordinatorapi.cpp:586 in connectToCoordOnStartup; REASON='sending coordinator handshake'
  7. UniquePid::ThisProcess() = 6db90f3d5a9dd200-6365-546a1de8
  8. [6365] TRACE at coordinatorapi.cpp:593 in connectToCoordOnStartup; REASON='Got virtual pid from coordinator'
  9. hello_remote.virtualPid = 40000
  10. [6365] TRACE at shareddata.cpp:189 in initialize; REASON='Shared area mapped'
  11. sharedDataHeader = 0x7f3eccb11000
  12. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  13. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  14. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  15. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  16. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  17. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  18. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  19. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  20. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  21. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  22. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  23. [6365] TRACE at jfilesystem.cpp:273 in FindHelperUtility; REASON='JALIB_UTILITY_DIR was set: using it'
  24. [6365] TRACE at dmtcp_launch.cpp:707 in setLDPreloadLibs; REASON='getting value of LD_PRELOAD'
  25. getenv("LD_PRELOAD") = /usr/local/bin/../lib/dmtcp/libdmtcp_batch-queue.so:/usr/local/bin/../lib/dmtcp/libdmtcp_alloc.so:/usr/local/bin
  26. /../lib/dmtcp/libdmtcp_dl.so:/usr/local/bin/../lib/dmtcp/libdmtcp_ipc.so:/usr/local/bin/../lib/dmtcp/libdmtcp.so:/usr/local/bin/../lib/dmtcp
  27. /libdmtcp_pid.so:
  28. preloadLibs = /usr/local/bin/../lib/dmtcp/libdmtcp_batch-queue.so:/usr/local/bin/../lib/dmtcp/libdmtcp_alloc.so:/usr/local/bin/../lib/d
  29. mtcp/libdmtcp_dl.so:/usr/local/bin/../lib/dmtcp/libdmtcp_ipc.so:/usr/local/bin/../lib/dmtcp/libdmtcp.so:/usr/local/bin/../lib/dmtcp/libdmtcp
  30. _pid.so:
  31. preloadLibs32 = libdmtcp_batch-queue.so:libdmtcp_alloc.so:libdmtcp_dl.so:libdmtcp_ipc.so:libdmtcp.so:libdmtcp_pid.so:
  32. [40000] TRACE at dmtcpworker.cpp:233 in prepareLogAndProcessdDataFromSerialFile; REASON='Root of processes tree'
  33. [40000] TRACE at dmtcpworker.cpp:278 in DmtcpWorker; REASON='libdmtcp.so: Running '
  34. jalib::Filesystem::GetProgramName() = srun
  35. getenv ("LD_PRELOAD") = /usr/local/bin/../lib/dmtcp/libdmtcp_batch-queue.so:/usr/local/bin/../lib/dmtcp/libdmtcp_alloc.so:/usr/local/bi
  36. n/../lib/dmtcp/libdmtcp_dl.so:/usr/local/bin/../lib/dmtcp/libdmtcp_ipc.so:/usr/local/bin/../lib/dmtcp/libdmtcp.so:/usr/local/bin/../lib/dmtc
  37. p/libdmtcp_pid.so:
  38. [40000] TRACE at dmtcpworker.cpp:96 in restoreUserLDPRELOAD; REASON='LD_PRELOAD'
  39. preload =
  40. userPreload = [40000] TRACE at coordinatorapi.cpp:164 in init; REASON='Informing coordinator of new process'
  41. UniquePid::ThisProcess() = 6db90f3d5a9dd200-40000-546a1de8
  42. [40000] TRACE at processinfo.cpp:174 in growStack; REASON='Original stack area'
  43. (void*)area.addr = 0x7fffe5c45000
  44. area.size = 86016
  45. [40000] TRACE at processinfo.cpp:196 in growStack; REASON='New stack size'
  46. (void*)area.addr = 0x7fffe526a000
  47. area.size = 10420224
  48. [40000] TRACE at shareddata.cpp:189 in initialize; REASON='Shared area mapped'
  49. sharedDataHeader = 0x7fa89e561000
  50. [40000] TRACE at fileconnlist.cpp:250 in scanForPreExisting; REASON='scanning pre-existing device'
  51. fd = 0
  52. device = /dev/pts/1
  53. [40000] TRACE at fileconnection.cpp:252 in PtyConnection; REASON='creating CTTY connection'
  54. _ptsName = /dev/pts/1
  55. _virtPtsName = /dev/pts/v0
  56. [40000] TRACE at fileconnlist.cpp:250 in scanForPreExisting; REASON='scanning pre-existing device'
  57. fd = 1
  58. device = /dev/pts/1
  59. [40000] TRACE at fileconnlist.cpp:250 in scanForPreExisting; REASON='scanning pre-existing device'
  60. fd = 2
  61. device = /dev/pts/1
  62. [40000] TRACE at socketconnlist.cpp:150 in scanForPreExisting; REASON='scanning pre-existing device'
  63. fd = 0
  64. device = /dev/pts/1
  65. [40000] TRACE at socketconnlist.cpp:150 in scanForPreExisting; REASON='scanning pre-existing device'
  66. fd = 1
  67. device = /dev/pts/1
  68. [40000] TRACE at socketconnlist.cpp:150 in scanForPreExisting; REASON='scanning pre-existing device'
  69. fd = 2
  70. device = /dev/pts/1
  71. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  72. th->tid = 6365
  73. th->virtual_tid = 40000
  74. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  75. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  76. tid = 6368
  77. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  78. virtualTid = 40002
  79. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  80. th->tid = 6368
  81. th->virtual_tid = 40002
  82. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  83. gettid() = 40002
  84. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  85. ret = 3
  86. domain = 2
  87. type = 1
  88. protocol = 6
  89. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  90. id() = 6db90f3d5a9dd200-40000-546a1de8(99005)
  91. domain = 2
  92. type = 1
  93. protocol = 6
  94. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  95. ret = 0
  96. sockfd = 3
  97. optname = 2
  98. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  99. sockfd = 3
  100. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99005)
  101. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  102. sockfd = 3
  103. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99005)
  104. backlog = 4096
  105. [40000] TRACE at threadlist.cpp:318 in checkpointhread; REASON='after sigsetjmp/getcontext'
  106. curThread->tid = 6368
  107. curThread->virtual_tid = 40002
  108. curThread->saved_sp = 0x7fa89e55d790
  109. [40000] TRACE at threadlist.cpp:334 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  110. [40000] TRACE at dmtcpworker.cpp:468 in waitForStage1Suspend; REASON='running'
  111. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SUSPEND message'
  112. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  113. ret = 4
  114. domain = 2
  115. type = 1
  116. protocol = 6
  117. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  118. id() = 6db90f3d5a9dd200-40000-546a1de8(99006)
  119. domain = 2
  120. type = 1
  121. protocol = 6
  122. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  123. ret = 0
  124. sockfd = 4
  125. optname = 2
  126. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  127. sockfd = 4
  128. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99006)
  129. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  130. sockfd = 4
  131. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99006)
  132. backlog = 1024
  133. [40000] TRACE at miscwrappers.cpp:120 in pipe; REASON='promoting pipe() to socketpair()'
  134. [40000] TRACE at socketwrappers.cpp:271 in socketpair; REASON='socketpair()'
  135. sv[0] = 5
  136. sv[1] = 6
  137. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  138. id() = 6db90f3d5a9dd200-40000-546a1de8(99007)
  139. domain = 1
  140. type = 1
  141. protocol = 0
  142. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  143. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  144. tid = 6369
  145. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  146. virtualTid = 40004
  147. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  148. th->tid = 6369
  149. th->virtual_tid = 40004
  150. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  151. gettid() = 40004
  152. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  153. ret = 7
  154. domain = 2
  155. type = 1
  156. protocol = 6
  157. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  158. id() = 6db90f3d5a9dd200-40000-546a1de8(99009)
  159. domain = 2
  160. type = 1
  161. protocol = 6
  162. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  163. ret = 0
  164. sockfd = 7
  165. optname = 2
  166. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  167. sockfd = 7
  168. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99009)
  169. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  170. sockfd = 7
  171. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99009)
  172. backlog = 4096
  173. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  174. ret = 8
  175. domain = 2
  176. type = 1
  177. protocol = 6
  178. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  179. id() = 6db90f3d5a9dd200-40000-546a1de8(99011)
  180. domain = 2
  181. type = 1
  182. protocol = 6
  183. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  184. sockfd = 8
  185. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99011)
  186. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  187. ret = 9
  188. domain = 1
  189. type = 1
  190. protocol = 0
  191. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  192. id() = 6db90f3d5a9dd200-40000-546a1de8(99012)
  193. domain = 1
  194. type = 1
  195. protocol = 0
  196. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  197. sockfd = 9
  198. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99012)
  199. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  200. ret = 9
  201. domain = 1
  202. type = 1
  203. protocol = 0
  204. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  205. id() = 6db90f3d5a9dd200-40000-546a1de8(99013)
  206. domain = 1
  207. type = 1
  208. protocol = 0
  209. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  210. sockfd = 9
  211. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99013)
  212. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  213. ret = 7
  214. domain = 2
  215. type = 1
  216. protocol = 6
  217. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  218. id() = 6db90f3d5a9dd200-40000-546a1de8(99015)
  219. domain = 2
  220. type = 1
  221. protocol = 6
  222. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  223. sockfd = 7
  224. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99015)
  225. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  226. ret = 8
  227. domain = 1
  228. type = 1
  229. protocol = 0
  230. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  231. id() = 6db90f3d5a9dd200-40000-546a1de8(99016)
  232. domain = 1
  233. type = 1
  234. protocol = 0
  235. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  236. sockfd = 8
  237. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99016)
  238. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  239. ret = 8
  240. domain = 1
  241. type = 1
  242. protocol = 0
  243. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  244. id() = 6db90f3d5a9dd200-40000-546a1de8(99017)
  245. domain = 1
  246. type = 1
  247. protocol = 0
  248. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  249. sockfd = 8
  250. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99017)
  251. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  252. ret = 7
  253. domain = 2
  254. type = 1
  255. protocol = 6
  256. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  257. id() = 6db90f3d5a9dd200-40000-546a1de8(99020)
  258. domain = 2
  259. type = 1
  260. protocol = 6
  261. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  262. ret = 0
  263. sockfd = 7
  264. optname = 2
  265. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  266. sockfd = 7
  267. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99020)
  268. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  269. sockfd = 7
  270. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99020)
  271. backlog = 1024
  272. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  273. ret = 8
  274. domain = 2
  275. type = 1
  276. protocol = 6
  277. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  278. id() = 6db90f3d5a9dd200-40000-546a1de8(99022)
  279. domain = 2
  280. type = 1
  281. protocol = 6
  282. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  283. sockfd = 8
  284. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99022)
  285. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  286. ret = 9
  287. domain = 1
  288. type = 1
  289. protocol = 0
  290. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  291. id() = 6db90f3d5a9dd200-40000-546a1de8(99023)
  292. domain = 1
  293. type = 1
  294. protocol = 0
  295. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  296. sockfd = 9
  297. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99023)
  298. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  299. ret = 9
  300. domain = 1
  301. type = 1
  302. protocol = 0
  303. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  304. id() = 6db90f3d5a9dd200-40000-546a1de8(99024)
  305. domain = 1
  306. type = 1
  307. protocol = 0
  308. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  309. sockfd = 9
  310. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99024)
  311. [40000] TRACE at miscwrappers.cpp:120 in pipe; REASON='promoting pipe() to socketpair()'
  312. [40000] TRACE at socketwrappers.cpp:271 in socketpair; REASON='socketpair()'
  313. sv[0] = 8
  314. sv[1] = 9
  315. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  316. id() = 6db90f3d5a9dd200-40000-546a1de8(99027)
  317. domain = 1
  318. type = 1
  319. protocol = 0
  320. [40000] TRACE at coordinatorapi.cpp:623 in createNewConnectionBeforeFork; REASON='Got virtual pid from coordinator'
  321. hello_remote.virtualPid = 41000
  322. [40000] TRACE at processinfo.cpp:357 in insertChild; REASON='Creating new virtualPid -> realPid mapping.'
  323. pid = 41000
  324. uniquePid = 6db90f3d5a9dd200-41000-546a1de8
  325. [40000] TRACE at execwrappers.cpp:205 in fork; REASON='fork()ed [PARENT] done'
  326. child = 6db90f3d5a9dd200-41000-546a1de8
  327. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  328. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  329. tid = 6374
  330. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  331. ret = 8
  332. domain = 2
  333. type = 1
  334. protocol = 6
  335. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  336. id() = 6db90f3d5a9dd200-40000-546a1de8(99029)
  337. domain = 2
  338. type = 1
  339. protocol = 6
  340. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  341. ret = 0
  342. sockfd = 8
  343. optname = 2
  344. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  345. sockfd = 8
  346. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99029)
  347. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  348. sockfd = 8
  349. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99029)
  350. backlog = 1024
  351. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  352. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  353. tid = 6375
  354. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  355. virtualTid = 40006
  356. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  357. th->tid = 6374
  358. th->virtual_tid = 40006
  359. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  360. gettid() = 40006
  361. [41000] TRACE at virtualidtable.h:182 in printMaps; REASON='Virtual To Real Mappings:'
  362. _idMapTable.size() = 5
  363. out.str() = Pid Maps
  364. Virtual -> Real
  365. 4213 -> 4213
  366. 40000 -> 6365
  367. 40002 -> 6368
  368. 40004 -> 6369
  369. 41000 -> 6373
  370.  
  371. [41000] TRACE at virtualidtable.h:182 in printMaps; REASON='Virtual To Real Mappings:'
  372. _idMapTable.size() = 5
  373. out.str() = Pid Maps
  374. Virtual -> Real
  375. 4213 -> 4213
  376. 40000 -> 6365
  377. 40002 -> 6368
  378. 40004 -> 6369
  379. 41000 -> 6373
  380.  
  381. [41000] TRACE at uniquepid.cpp:199 in resetOnFork; REASON='Explicitly setting process UniquePid'
  382. newId = 6db90f3d5a9dd200-41000-546a1de8
  383. [41000] TRACE at execwrappers.cpp:157 in pthread_atfork_child; REASON='fork()ed [CHILD]'
  384. child = 6db90f3d5a9dd200-41000-546a1de8
  385. parent = 6db90f3d5a9dd200-40000-546a1de8
  386. [41000] TRACE at coordinatorapi.cpp:186 in resetOnFork; REASON='Informing coordinator of new process'
  387. UniquePid::ThisProcess() = 6db90f3d5a9dd200-41000-546a1de8
  388. [41000] TRACE at virtualidtable.h:182 in printMaps; REASON='Virtual To Real Mappings:'
  389. _idMapTable.size() = 5
  390. out.str() = Pid Maps
  391. Virtual -> Real
  392. 4213 -> 4213
  393. 40000 -> 6365
  394. 40002 -> 6368
  395. 40004 -> 6369
  396. 41000 -> 6373
  397.  
  398. [41000] TRACE at virtualidtable.h:182 in printMaps; REASON='Virtual To Real Mappings:'
  399. _idMapTable.size() = 5
  400. out.str() = Pid Maps
  401. Virtual -> Real
  402. 4213 -> 4213
  403. 40000 -> 6365
  404. 40002 -> 6368
  405. 40004 -> 6369
  406. 41000 -> 6373
  407.  
  408. [41000] TRACE at dmtcpworker.cpp:349 in cleanupWorker; REASON='disconnecting from dmtcp coordinator'
  409. [41000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  410. thread->tid = 6369
  411. [41000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  412. thread->tid = 6368
  413. [41000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  414. thread->tid = 6365
  415. [41000] TRACE at execwrappers.cpp:199 in fork; REASON='fork() done [CHILD]'
  416. child = 6db90f3d5a9dd200-41000-546a1de8
  417. parent = 6db90f3d5a9dd200-40000-546a1de8
  418. [41000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  419. th->tid = 6373
  420. th->virtual_tid = 41000
  421. [41000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  422. [41000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  423. tid = 6376
  424. [40000] TRACE at miscwrappers.cpp:120 in pipe; REASON='promoting pipe() to socketpair()'
  425. [40000] TRACE at socketwrappers.cpp:271 in socketpair; REASON='socketpair()'
  426. sv[0] = 10
  427. sv[1] = 11
  428. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  429. id() = 6db90f3d5a9dd200-40000-546a1de8(99030)
  430. domain = 1
  431. type = 1
  432. protocol = 0
  433. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  434. ret = 12
  435. domain = 2
  436. type = 1
  437. protocol = 6
  438. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  439. id() = 6db90f3d5a9dd200-40000-546a1de8(99032)
  440. domain = 2
  441. type = 1
  442. protocol = 6
  443. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  444. ret = 0
  445. sockfd = 12
  446. optname = 2
  447. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  448. sockfd = 12
  449. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99032)
  450. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  451. sockfd = 12
  452. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99032)
  453. backlog = 1024
  454. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  455. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  456. tid = 6377
  457. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  458. virtualTid = 40008
  459. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  460. th->tid = 6375
  461. th->virtual_tid = 40008
  462. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  463. gettid() = 40008
  464. [40000] TRACE at miscwrappers.cpp:120 in pipe; REASON='promoting pipe() to socketpair()'
  465. [40000] TRACE at socketwrappers.cpp:271 in socketpair; REASON='socketpair()'
  466. sv[0] = 13
  467. sv[1] = 14
  468. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  469. id() = 6db90f3d5a9dd200-40000-546a1de8(99033)
  470. domain = 1
  471. type = 1
  472. protocol = 0
  473. [40000] TRACE at miscwrappers.cpp:120 in pipe; REASON='promoting pipe() to socketpair()'
  474. [40000] TRACE at socketwrappers.cpp:271 in socketpair; REASON='socketpair()'
  475. sv[0] = 15
  476. sv[1] = 16
  477. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  478. id() = 6db90f3d5a9dd200-40000-546a1de8(99036)
  479. domain = 1
  480. type = 1
  481. protocol = 0
  482. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  483. ret = 17
  484. domain = 2
  485. type = 1
  486. protocol = 6
  487. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  488. id() = 6db90f3d5a9dd200-40000-546a1de8(99038)
  489. domain = 2
  490. type = 1
  491. protocol = 6
  492. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  493. ret = 0
  494. sockfd = 17
  495. optname = 2
  496. [40000] TRACE at socketwrappers.cpp:141 in bind; REASON='bind'
  497. sockfd = 17
  498. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99038)
  499. [40000] TRACE at socketwrappers.cpp:159 in listen; REASON='listen'
  500. sockfd = 17
  501. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99038)
  502. backlog = 1024
  503. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  504. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  505. tid = 6378
  506. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  507. virtualTid = 40010
  508. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  509. th->tid = 6377
  510. th->virtual_tid = 40010
  511. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  512. gettid() = 40010
  513. [41000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  514. virtualTid = 41002
  515. [41000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  516. th->tid = 6376
  517. th->virtual_tid = 41002
  518. [41000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  519. gettid() = 41002
  520. [41000] TRACE at threadlist.cpp:318 in checkpointhread; REASON='after sigsetjmp/getcontext'
  521. curThread->tid = 6376
  522. curThread->virtual_tid = 41002
  523. curThread->saved_sp = 0x7fa89e55d790
  524. [41000] TRACE at threadlist.cpp:334 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  525. [41000] TRACE at dmtcpworker.cpp:468 in waitForStage1Suspend; REASON='running'
  526. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SUSPEND message'
  527. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  528. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  529. tid = 6379
  530. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  531. virtualTid = 40012
  532. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  533. th->tid = 6378
  534. th->virtual_tid = 40012
  535. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  536. gettid() = 40012
  537. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  538. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  539. tid = 6380
  540. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  541. virtualTid = 40014
  542. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  543. th->tid = 6379
  544. th->virtual_tid = 40014
  545. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  546. gettid() = 40014
  547. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  548. ret = 18
  549. domain = 2
  550. type = 1
  551. protocol = 6
  552. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  553. id() = 6db90f3d5a9dd200-40000-546a1de8(99040)
  554. domain = 2
  555. type = 1
  556. protocol = 6
  557. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  558. virtualTid = 40016
  559. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  560. th->tid = 6380
  561. th->virtual_tid = 40016
  562. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  563. sockfd = 18
  564. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99040)
  565. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  566. ret = 19
  567. domain = 1
  568. type = 1
  569. protocol = 0
  570. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  571. id() = 6db90f3d5a9dd200-40000-546a1de8(99041)
  572. domain = 1
  573. type = 1
  574. protocol = 0
  575. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  576. sockfd = 19
  577. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99041)
  578. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  579. gettid() = 40016
  580. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  581. ret = 19
  582. domain = 2
  583. type = 1
  584. protocol = 6
  585. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  586. id() = 6db90f3d5a9dd200-40000-546a1de8(99043)
  587. domain = 2
  588. type = 1
  589. protocol = 6
  590. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  591. sockfd = 19
  592. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99043)
  593. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  594. ret = 20
  595. domain = 1
  596. type = 1
  597. protocol = 0
  598. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  599. id() = 6db90f3d5a9dd200-40000-546a1de8(99044)
  600. domain = 1
  601. type = 1
  602. protocol = 0
  603. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  604. sockfd = 20
  605. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99044)
  606. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  607. ret = 20
  608. domain = 1
  609. type = 1
  610. protocol = 0
  611. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  612. id() = 6db90f3d5a9dd200-40000-546a1de8(99045)
  613. domain = 1
  614. type = 1
  615. protocol = 0
  616. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  617. sockfd = 20
  618. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99045)
  619. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  620. virtualTid = 0
  621. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  622. sockfd = 17
  623. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99046)
  624. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  625. ret = 0
  626. sockfd = 18
  627. optname = 18
  628. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  629. sockfd = 12
  630. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99047)
  631. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  632. ret = 21
  633. domain = 1
  634. type = 1
  635. protocol = 0
  636. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  637. id() = 6db90f3d5a9dd200-40000-546a1de8(99048)
  638. domain = 1
  639. type = 1
  640. protocol = 0
  641. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  642. sockfd = 21
  643. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99048)
  644. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  645. sockfd = 8
  646. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99049)
  647. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  648. ret = 20
  649. domain = 1
  650. type = 1
  651. protocol = 0
  652. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  653. id() = 6db90f3d5a9dd200-40000-546a1de8(99050)
  654. domain = 1
  655. type = 1
  656. protocol = 0
  657. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  658. sockfd = 20
  659. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99050)
  660. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  661. virtualTid = 0
  662. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  663. sockfd = 17
  664. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99051)
  665. [40000] TRACE at socketwrappers.cpp:237 in setsockopt; REASON='setsockopt'
  666. ret = 0
  667. sockfd = 19
  668. optname = 18
  669. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  670. sockfd = 12
  671. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99052)
  672. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  673. ret = 21
  674. domain = 1
  675. type = 1
  676. protocol = 0
  677. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  678. id() = 6db90f3d5a9dd200-40000-546a1de8(99053)
  679. domain = 1
  680. type = 1
  681. protocol = 0
  682. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  683. sockfd = 21
  684. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99053)
  685. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  686. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  687. tid = 6381
  688. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  689. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  690. tid = 6382
  691. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  692. virtualTid = 40018
  693. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  694. th->tid = 6381
  695. th->virtual_tid = 40018
  696. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  697. thread->tid = 6380
  698. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  699. thread->tid = 6380
  700. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  701. thread->tid = 6379
  702. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  703. thread->tid = 6379
  704. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  705. gettid() = 40018
  706. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  707. ret = 20
  708. domain = 2
  709. type = 1
  710. protocol = 6
  711. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  712. id() = 6db90f3d5a9dd200-40000-546a1de8(99054)
  713. domain = 2
  714. type = 1
  715. protocol = 6
  716. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  717. virtualTid = 40020
  718. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  719. th->tid = 6382
  720. th->virtual_tid = 40020
  721. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  722. gettid() = 40020
  723. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  724. ret = 21
  725. domain = 2
  726. type = 1
  727. protocol = 6
  728. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  729. sockfd = 20
  730. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99054)
  731. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  732. ret = 22
  733. domain = 1
  734. type = 1
  735. protocol = 0
  736. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  737. id() = 6db90f3d5a9dd200-40000-546a1de8(99056)
  738. domain = 1
  739. type = 1
  740. protocol = 0
  741. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  742. sockfd = 22
  743. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99056)
  744. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  745. id() = 6db90f3d5a9dd200-40000-546a1de8(99055)
  746. domain = 2
  747. type = 1
  748. protocol = 6
  749. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  750. sockfd = 21
  751. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99055)
  752. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  753. ret = 22
  754. domain = 1
  755. type = 1
  756. protocol = 0
  757. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  758. id() = 6db90f3d5a9dd200-40000-546a1de8(99057)
  759. domain = 1
  760. type = 1
  761. protocol = 0
  762. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  763. sockfd = 22
  764. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99057)
  765. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  766. ret = 22
  767. domain = 1
  768. type = 1
  769. protocol = 0
  770. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  771. id() = 6db90f3d5a9dd200-40000-546a1de8(99058)
  772. domain = 1
  773. type = 1
  774. protocol = 0
  775. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  776. sockfd = 22
  777. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99058)
  778. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  779. virtualTid = 19
  780. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  781. sockfd = 8
  782. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99059)
  783. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  784. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  785. tid = 6383
  786. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  787. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  788. tid = 6384
  789. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  790. virtualTid = 40022
  791. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  792. th->tid = 6383
  793. th->virtual_tid = 40022
  794. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  795. thread->tid = 6381
  796. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  797. thread->tid = 6381
  798. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  799. gettid() = 40022
  800. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  801. ret = 22
  802. domain = 2
  803. type = 1
  804. protocol = 6
  805. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  806. id() = 6db90f3d5a9dd200-40000-546a1de8(99060)
  807. domain = 2
  808. type = 1
  809. protocol = 6
  810. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  811. virtualTid = 40024
  812. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  813. th->tid = 6384
  814. th->virtual_tid = 40024
  815. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  816. gettid() = 40024
  817. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  818. sockfd = 22
  819. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99060)
  820. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  821. ret = 23
  822. domain = 1
  823. type = 1
  824. protocol = 0
  825. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  826. id() = 6db90f3d5a9dd200-40000-546a1de8(99061)
  827. domain = 1
  828. type = 1
  829. protocol = 0
  830. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  831. ret = 24
  832. domain = 1
  833. type = 1
  834. protocol = 0
  835. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  836. id() = 6db90f3d5a9dd200-40000-546a1de8(99062)
  837. domain = 1
  838. type = 1
  839. protocol = 0
  840. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  841. sockfd = 24
  842. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99062)
  843. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  844. virtualTid = 0
  845. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  846. sockfd = 23
  847. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99061)
  848. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  849. ret = 21
  850. domain = 2
  851. type = 1
  852. protocol = 6
  853. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  854. id() = 6db90f3d5a9dd200-40000-546a1de8(99063)
  855. domain = 2
  856. type = 1
  857. protocol = 6
  858. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  859. sockfd = 21
  860. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99063)
  861. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  862. ret = 23
  863. domain = 1
  864. type = 1
  865. protocol = 0
  866. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  867. id() = 6db90f3d5a9dd200-40000-546a1de8(99064)
  868. domain = 1
  869. type = 1
  870. protocol = 0
  871. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  872. sockfd = 23
  873. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99064)
  874. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  875. ret = 23
  876. domain = 1
  877. type = 1
  878. protocol = 0
  879. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  880. id() = 6db90f3d5a9dd200-40000-546a1de8(99065)
  881. domain = 1
  882. type = 1
  883. protocol = 0
  884. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  885. sockfd = 23
  886. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99065)
  887. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  888. virtualTid = 20
  889. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  890. ret = 22
  891. domain = 1
  892. type = 1
  893. protocol = 0
  894. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  895. id() = 6db90f3d5a9dd200-40000-546a1de8(99066)
  896. domain = 1
  897. type = 1
  898. protocol = 0
  899. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  900. sockfd = 22
  901. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99066)
  902. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  903. virtualTid = 0
  904. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  905. sockfd = 8
  906. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99067)
  907. [40000] TRACE at socketwrappers.cpp:184 in process_accept; REASON='accepted incoming connection'
  908. sockfd = 8
  909. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99068)
  910. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  911. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  912. tid = 6385
  913. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  914. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  915. tid = 6386
  916. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  917. virtualTid = 40026
  918. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  919. th->tid = 6385
  920. th->virtual_tid = 40026
  921. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  922. thread->tid = 6384
  923. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  924. thread->tid = 6384
  925. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  926. thread->tid = 6383
  927. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  928. thread->tid = 6383
  929. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  930. thread->tid = 6382
  931. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  932. thread->tid = 6382
  933. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  934. gettid() = 40026
  935. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  936. ret = 21
  937. domain = 2
  938. type = 1
  939. protocol = 6
  940. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  941. id() = 6db90f3d5a9dd200-40000-546a1de8(99069)
  942. domain = 2
  943. type = 1
  944. protocol = 6
  945. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  946. virtualTid = 40028
  947. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  948. th->tid = 6386
  949. th->virtual_tid = 40028
  950. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  951. gettid() = 40028
  952. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  953. ret = 22
  954. domain = 2
  955. type = 1
  956. protocol = 6
  957. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  958. id() = 6db90f3d5a9dd200-40000-546a1de8(99070)
  959. domain = 2
  960. type = 1
  961. protocol = 6
  962. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  963. sockfd = 21
  964. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99069)
  965. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  966. ret = 23
  967. domain = 1
  968. type = 1
  969. protocol = 0
  970. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  971. id() = 6db90f3d5a9dd200-40000-546a1de8(99071)
  972. domain = 1
  973. type = 1
  974. protocol = 0
  975. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  976. sockfd = 23
  977. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99071)
  978. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  979. sockfd = 22
  980. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99070)
  981. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  982. ret = 23
  983. domain = 1
  984. type = 1
  985. protocol = 0
  986. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  987. id() = 6db90f3d5a9dd200-40000-546a1de8(99072)
  988. domain = 1
  989. type = 1
  990. protocol = 0
  991. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  992. sockfd = 23
  993. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99072)
  994. Process 0 of 2 is on slurm-compute1
  995. iteration 0 on process 0
  996. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  997. ret = 23
  998. domain = 1
  999. type = 1
  1000. protocol = 0
  1001. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  1002. id() = 6db90f3d5a9dd200-40000-546a1de8(99073)
  1003. domain = 1
  1004. type = 1
  1005. protocol = 0
  1006. Process 1 of 2 is on slurm-compute2
  1007. iteration 0 on process 1
  1008. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  1009. sockfd = 23
  1010. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99073)
  1011. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  1012. virtualTid = 20
  1013. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  1014. ret = 21
  1015. domain = 1
  1016. type = 1
  1017. protocol = 0
  1018. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  1019. id() = 6db90f3d5a9dd200-40000-546a1de8(99074)
  1020. domain = 1
  1021. type = 1
  1022. protocol = 0
  1023. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  1024. sockfd = 21
  1025. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99074)
  1026. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  1027. virtualTid = 0
  1028. iteration 1 on process 0
  1029. iteration 1 on process 1
  1030. iteration 2 on process 1
  1031. iteration 2 on process 0
  1032. iteration 3 on process 1
  1033. iteration 3 on process 0
  1034. iteration 4 on process 1
  1035. iteration 4 on process 0
  1036. iteration 5 on process 1
  1037. iteration 5 on process 0
  1038. [40000] TRACE at dmtcpworker.cpp:474 in waitForStage1Suspend; REASON='got SUSPEND message, preparing to acquire all ThreadSync locks'
  1039. [40000] TRACE at threadsync.cpp:133 in acquireLocks; REASON='waiting for dmtcp_lock(): to get synchronized with _runCoordinatorCmd if we use
  1040. DMTCP API'
  1041. [40000] TRACE at threadsync.cpp:136 in acquireLocks; REASON='Waiting for lock(&theCkptCanStart)'
  1042. [40000] TRACE at threadsync.cpp:139 in acquireLocks; REASON='Waiting for libdlLock'
  1043. [40000] TRACE at threadsync.cpp:142 in acquireLocks; REASON='Waiting for threads creation lock'
  1044. [40000] TRACE at threadsync.cpp:147 in acquireLocks; REASON='Waiting for other threads to exit DMTCP-Wrappers'
  1045. [40000] TRACE at threadsync.cpp:152 in acquireLocks; REASON='Waiting for newly created threads to finish initialization'
  1046. _uninitializedThreadCount = 0
  1047. [40000] TRACE at threadsync.cpp:157 in acquireLocks; REASON='Done acquiring all locks'
  1048. [40000] TRACE at dmtcpworker.cpp:477 in waitForStage1Suspend; REASON='Starting checkpoint, suspending...'
  1049. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  1050. thread->tid = 6386
  1051. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  1052. thread->tid = 6385
  1053. [41000] TRACE at dmtcpworker.cpp:474 in waitForStage1Suspend; REASON='got SUSPEND message, preparing to acquire all ThreadSync locks'
  1054. [41000] TRACE at threadsync.cpp:133 in acquireLocks; REASON='waiting for dmtcp_lock(): to get synchronized with _runCoordinatorCmd if we use
  1055. DMTCP API'
  1056. [41000] TRACE at threadsync.cpp:136 in acquireLocks; REASON='Waiting for lock(&theCkptCanStart)'
  1057. [41000] TRACE at threadsync.cpp:139 in acquireLocks; REASON='Waiting for libdlLock'
  1058. [41000] TRACE at threadsync.cpp:142 in acquireLocks; REASON='Waiting for threads creation lock'
  1059. [41000] TRACE at threadsync.cpp:147 in acquireLocks; REASON='Waiting for other threads to exit DMTCP-Wrappers'
  1060. [41000] TRACE at threadsync.cpp:152 in acquireLocks; REASON='Waiting for newly created threads to finish initialization'
  1061. _uninitializedThreadCount = 0
  1062. [41000] TRACE at threadsync.cpp:157 in acquireLocks; REASON='Done acquiring all locks'
  1063. [41000] TRACE at dmtcpworker.cpp:477 in waitForStage1Suspend; REASON='Starting checkpoint, suspending...'
  1064. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1065. curThread->tid = 6377
  1066. curThread->virtual_tid = 40010
  1067. curThread->saved_sp = 0x7fa89c429580
  1068. __builtin_return_address(0) = 0x7fa8a00ee710
  1069. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1070. prgName.str = DMTCP:srun
  1071. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1072. curThread->tid = 6377
  1073. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1074. curThread->tid = 6375
  1075. curThread->virtual_tid = 40008
  1076. curThread->saved_sp = 0x7fa89ce2a540
  1077. __builtin_return_address(0) = 0x7fa8a00ee710
  1078. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1079. prgName.str = DMTCP:srun
  1080. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1081. curThread->tid = 6375
  1082. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1083. curThread->tid = 6374
  1084. curThread->virtual_tid = 40006
  1085. curThread->saved_sp = 0x7fa89cf2b300
  1086. __builtin_return_address(0) = 0x7fa8a00ee710
  1087. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1088. prgName.str = DMTCP:srun
  1089. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1090. curThread->tid = 6374
  1091. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1092. curThread->tid = 6369
  1093. curThread->virtual_tid = 40004
  1094. curThread->saved_sp = 0x7fa8a151f540
  1095. __builtin_return_address(0) = 0x7fa8a00ee710
  1096. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1097. prgName.str = DMTCP:srun
  1098. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1099. curThread->tid = 6369
  1100. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1101. curThread->tid = 6365
  1102. curThread->virtual_tid = 40000
  1103. curThread->saved_sp = 0x7fffe5c57000
  1104. __builtin_return_address(0) = 0x7fa8a00ee710
  1105. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1106. prgName.str = DMTCP:srun
  1107. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1108. curThread->tid = 6365
  1109. [41000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1110. curThread->tid = 6373
  1111. curThread->virtual_tid = 41000
  1112. curThread->saved_sp = 0x7fffe5c57080
  1113. __builtin_return_address(0) = 0x7fa8a00ee710
  1114. [41000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1115. prgName.str = DMTCP:srun
  1116. [41000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1117. curThread->tid = 6373
  1118. [41000] TRACE at threadlist.cpp:443 in suspendThreads; REASON='everything suspended'
  1119. numUserThreads = 1
  1120. [41000] TRACE at siginfo.cpp:110 in saveSigHandlers; REASON='saving signal handlers'
  1121. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1122. sig = 18
  1123. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1124. sig = 15
  1125. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1126. sig = 14
  1127. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1128. sig = 13
  1129. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1130. sig = 12
  1131. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1132. sig = 10
  1133. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1134. sig = 3
  1135. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1136. sig = 2
  1137. [41000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1138. sig = 1
  1139. [41000] TRACE at threadlist.cpp:347 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  1140. [41000] TRACE at dmtcpworker.cpp:483 in waitForStage2Checkpoint; REASON='suspended'
  1141. [41000] TRACE at threadsync.cpp:164 in releaseLocks; REASON='Releasing ThreadSync locks'
  1142. [41000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1143. prgName.str = DMTCP:srun
  1144. [40000] TRACE at threadlist.cpp:502 in stopthisthread; REASON='Thread after sigsetjmp/getcontext'
  1145. curThread->tid = 6378
  1146. curThread->virtual_tid = 40012
  1147. curThread->saved_sp = 0x7fa89c3284c0
  1148. __builtin_return_address(0) = 0x7fa8a00ee710
  1149. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1150. prgName.str = DMTCP:srun
  1151. [40000] TRACE at threadlist.cpp:530 in stopthisthread; REASON='User thread suspended'
  1152. curThread->tid = 6378
  1153. [40000] TRACE at threadlist.cpp:443 in suspendThreads; REASON='everything suspended'
  1154. numUserThreads = 6
  1155. [40000] TRACE at siginfo.cpp:110 in saveSigHandlers; REASON='saving signal handlers'
  1156. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1157. sig = 21
  1158. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1159. sig = 18
  1160. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1161. sig = 15
  1162. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1163. sig = 14
  1164. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1165. sig = 13
  1166. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1167. sig = 12
  1168. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1169. sig = 10
  1170. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1171. sig = 3
  1172. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1173. sig = 2
  1174. [40000] TRACE at siginfo.cpp:119 in saveSigHandlers; REASON='saving signal handler (non-default) for'
  1175. sig = 1
  1176. [40000] TRACE at threadlist.cpp:347 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  1177. [40000] TRACE at dmtcpworker.cpp:483 in waitForStage2Checkpoint; REASON='suspended'
  1178. [40000] TRACE at threadsync.cpp:164 in releaseLocks; REASON='Releasing ThreadSync locks'
  1179. [40000] TRACE at procname.cpp:64 in prctlGetProcessName; REASON='prctl(PR_GET_NAME, ...) succeeded'
  1180. prgName.str = DMTCP:srun
  1181. [40000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1182. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-40000-546a1de8
  1183. o.str() =
  1184. 0,1,2 6db90f3d5a9dd200-40000-546a1de8(99000) :/dev/pts/1
  1185.  
  1186. [40000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1187. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-40000-546a1de8
  1188. o.str() =
  1189. 3 6db90f3d5a9dd200-40000-546a1de8(99005) <TCP Socket>
  1190. 4 6db90f3d5a9dd200-40000-546a1de8(99006) <TCP Socket>
  1191. 5 6db90f3d5a9dd200-40000-546a1de8(99007) <TCP Socket>
  1192. 6 6db90f3d5a9dd200-40000-546a1de8(99008) <TCP Socket>
  1193. 7 6db90f3d5a9dd200-40000-546a1de8(99020) <TCP Socket>
  1194. 9 6db90f3d5a9dd200-40000-546a1de8(99028) <TCP Socket>
  1195. 8 6db90f3d5a9dd200-40000-546a1de8(99029) <TCP Socket>
  1196. 10 6db90f3d5a9dd200-40000-546a1de8(99030) <TCP Socket>
  1197. 11 6db90f3d5a9dd200-40000-546a1de8(99031) <TCP Socket>
  1198. 12 6db90f3d5a9dd200-40000-546a1de8(99032) <TCP Socket>
  1199. 13 6db90f3d5a9dd200-40000-546a1de8(99033) <TCP Socket>
  1200. 14 6db90f3d5a9dd200-40000-546a1de8(99034) <TCP Socket>
  1201. 15 6db90f3d5a9dd200-40000-546a1de8(99036) <TCP Socket>
  1202. 16 6db90f3d5a9dd200-40000-546a1de8(99037) <TCP Socket>
  1203. 17 6db90f3d5a9dd200-40000-546a1de8(99038) <TCP Socket>
  1204. 18 6db90f3d5a9dd200-40000-546a1de8(99046) <TCP Socket>
  1205. 19 6db90f3d5a9dd200-40000-546a1de8(99051) <TCP Socket>
  1206.  
  1207. [40000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1208. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-40000-546a1de8
  1209. o.str() =
  1210.  
  1211. [41000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1212. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-41000-546a1de8
  1213. o.str() =
  1214. 0,1,2 6db90f3d5a9dd200-40000-546a1de8(99000) :/dev/pts/1
  1215.  
  1216. [41000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1217. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-41000-546a1de8
  1218. o.str() =
  1219. 3 6db90f3d5a9dd200-40000-546a1de8(99005) <TCP Socket>
  1220. 4 6db90f3d5a9dd200-40000-546a1de8(99006) <TCP Socket>
  1221. 5 6db90f3d5a9dd200-40000-546a1de8(99007) <TCP Socket>
  1222. 6 6db90f3d5a9dd200-40000-546a1de8(99008) <TCP Socket>
  1223. 7 6db90f3d5a9dd200-40000-546a1de8(99020) <TCP Socket>
  1224. 8 6db90f3d5a9dd200-40000-546a1de8(99027) <TCP Socket>
  1225.  
  1226. [41000] TRACE at connectionlist.cpp:244 in list; REASON='ConnectionList'
  1227. (dmtcp_get_uniquepid_str ? dmtcp_get_uniquepid_str() : __null) = 6db90f3d5a9dd200-41000-546a1de8
  1228. o.str() =
  1229.  
  1230. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for FD_LEADER_ELECTION message'
  1231. [41000] TRACE at dmtcpworker.cpp:449 in waitForCoordinatorMsg; REASON='Computation information'
  1232. msg.compGroup = 6db90f3d5a9dd200-40000-546a1de8
  1233. msg.numPeers = 2
  1234. [41000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1235. [41000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1236. [41000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1237. [41000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1238. [41000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1239. [41000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1240. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for FD_LEADER_ELECTION message'
  1241. [40000] TRACE at dmtcpworker.cpp:449 in waitForCoordinatorMsg; REASON='Computation information'
  1242. msg.compGroup = 6db90f3d5a9dd200-40000-546a1de8
  1243. msg.numPeers = 2
  1244. [40000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1245. [40000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1246. [40000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1247. [40000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1248. [40000] TRACE at connectionlist.cpp:88 in eventHook; REASON='locking...'
  1249. [40000] TRACE at connectionlist.cpp:90 in eventHook; REASON='locked'
  1250. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for DRAIN message'
  1251. [41000] TRACE at pidwrappers.cpp:156 in tcgetpgrp; REASON='tcgetpgrp return value'
  1252. fd = 9
  1253. retval = 40000
  1254. [41000] TRACE at processinfo.cpp:481 in refresh; REASON='CHECK GROUP PID'
  1255. _gid = 40000
  1256. _fgid = 40000
  1257. _ppid = 40000
  1258. _pid = 41000
  1259. [41000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1260. [41000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1261. [41000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1262. [41000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1263. _hasLock = 1
  1264. _fds[0] = 8
  1265. _id = 6db90f3d5a9dd200-40000-546a1de8(99027)
  1266. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1267. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for DRAIN message'
  1268. [40000] TRACE at pidwrappers.cpp:156 in tcgetpgrp; REASON='tcgetpgrp return value'
  1269. fd = 20
  1270. retval = 40000
  1271. [40000] TRACE at processinfo.cpp:481 in refresh; REASON='CHECK GROUP PID'
  1272. _gid = 40000
  1273. _fgid = 40000
  1274. _ppid = 4213
  1275. _pid = 40000
  1276. [40000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1277. [40000] TRACE at pidwrappers.cpp:156 in tcgetpgrp; REASON='tcgetpgrp return value'
  1278. fd = 0
  1279. retval = 40000
  1280. [40000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1281. [40000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1282. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1283. _hasLock = 1
  1284. _fds[0] = 5
  1285. _id = 6db90f3d5a9dd200-40000-546a1de8(99007)
  1286. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1287. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1288. _hasLock = 1
  1289. _fds[0] = 6
  1290. _id = 6db90f3d5a9dd200-40000-546a1de8(99008)
  1291. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99007)
  1292. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1293. _hasLock = 1
  1294. _fds[0] = 9
  1295. _id = 6db90f3d5a9dd200-40000-546a1de8(99028)
  1296. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99027)
  1297. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1298. _hasLock = 1
  1299. _fds[0] = 10
  1300. _id = 6db90f3d5a9dd200-40000-546a1de8(99030)
  1301. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1302. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1303. _hasLock = 1
  1304. _fds[0] = 11
  1305. _id = 6db90f3d5a9dd200-40000-546a1de8(99031)
  1306. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99030)
  1307. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1308. _hasLock = 1
  1309. _fds[0] = 13
  1310. _id = 6db90f3d5a9dd200-40000-546a1de8(99033)
  1311. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1312. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1313. _hasLock = 1
  1314. _fds[0] = 14
  1315. _id = 6db90f3d5a9dd200-40000-546a1de8(99034)
  1316. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99033)
  1317. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1318. _hasLock = 1
  1319. _fds[0] = 15
  1320. _id = 6db90f3d5a9dd200-40000-546a1de8(99036)
  1321. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1322. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1323. _hasLock = 1
  1324. _fds[0] = 16
  1325. _id = 6db90f3d5a9dd200-40000-546a1de8(99037)
  1326. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99036)
  1327. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1328. _hasLock = 1
  1329. _fds[0] = 18
  1330. _id = 6db90f3d5a9dd200-40000-546a1de8(99046)
  1331. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1332. [40000] TRACE at socketconnection.cpp:366 in drain; REASON='Will drain socket'
  1333. _hasLock = 1
  1334. _fds[0] = 19
  1335. _id = 6db90f3d5a9dd200-40000-546a1de8(99051)
  1336. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(-1)
  1337. [41000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1338. _dataSockets[i]->socket().sockfd() = 8
  1339. buffer.size() = 0
  1340. (_dataSockets.size()) = 1
  1341. [41000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1342. [41000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1343. [41000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1344. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for CHECKPOINT message'
  1345. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1346. _dataSockets[i]->socket().sockfd() = 5
  1347. buffer.size() = 0
  1348. (_dataSockets.size()) = 11
  1349. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1350. _dataSockets[i]->socket().sockfd() = 6
  1351. buffer.size() = 0
  1352. (_dataSockets.size()) = 11
  1353. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1354. _dataSockets[i]->socket().sockfd() = 9
  1355. buffer.size() = 0
  1356. (_dataSockets.size()) = 11
  1357. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1358. _dataSockets[i]->socket().sockfd() = 10
  1359. buffer.size() = 0
  1360. (_dataSockets.size()) = 11
  1361. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1362. _dataSockets[i]->socket().sockfd() = 11
  1363. buffer.size() = 0
  1364. (_dataSockets.size()) = 11
  1365. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1366. _dataSockets[i]->socket().sockfd() = 13
  1367. buffer.size() = 0
  1368. (_dataSockets.size()) = 11
  1369. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1370. _dataSockets[i]->socket().sockfd() = 14
  1371. buffer.size() = 0
  1372. (_dataSockets.size()) = 11
  1373. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1374. _dataSockets[i]->socket().sockfd() = 15
  1375. buffer.size() = 0
  1376. (_dataSockets.size()) = 11
  1377. [40000] TRACE at kernelbufferdrainer.cpp:105 in onTimeoutInterval; REASON='buffer drain complete'
  1378. _dataSockets[i]->socket().sockfd() = 16
  1379. buffer.size() = 0
  1380. (_dataSockets.size()) = 11
  1381. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1382. _dataSockets[i]->socket().sockfd() = 19
  1383. buffer.size() = 195
  1384. WARN_INTERVAL_SEC = 10
  1385. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1386. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1387. _dataSockets[i]->socket().sockfd() = 18
  1388. buffer.size() = 195
  1389. WARN_INTERVAL_SEC = 10
  1390. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1391. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1392. _dataSockets[i]->socket().sockfd() = 19
  1393. buffer.size() = 302
  1394. WARN_INTERVAL_SEC = 10
  1395. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1396. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1397. _dataSockets[i]->socket().sockfd() = 18
  1398. buffer.size() = 302
  1399. WARN_INTERVAL_SEC = 10
  1400. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1401. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1402. _dataSockets[i]->socket().sockfd() = 19
  1403. buffer.size() = 446
  1404. WARN_INTERVAL_SEC = 10
  1405. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1406. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1407. _dataSockets[i]->socket().sockfd() = 18
  1408. buffer.size() = 446
  1409. WARN_INTERVAL_SEC = 10
  1410. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1411. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1412. _dataSockets[i]->socket().sockfd() = 19
  1413. buffer.size() = 554
  1414. WARN_INTERVAL_SEC = 10
  1415. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1416. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1417. _dataSockets[i]->socket().sockfd() = 18
  1418. buffer.size() = 554
  1419. WARN_INTERVAL_SEC = 10
  1420. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1421. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1422. _dataSockets[i]->socket().sockfd() = 19
  1423. buffer.size() = 698
  1424. WARN_INTERVAL_SEC = 10
  1425. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1426. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1427. _dataSockets[i]->socket().sockfd() = 18
  1428. buffer.size() = 698
  1429. WARN_INTERVAL_SEC = 10
  1430. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1431. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1432. _dataSockets[i]->socket().sockfd() = 19
  1433. buffer.size() = 806
  1434. WARN_INTERVAL_SEC = 10
  1435. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1436. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1437. _dataSockets[i]->socket().sockfd() = 18
  1438. buffer.size() = 806
  1439. WARN_INTERVAL_SEC = 10
  1440. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1441. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1442. _dataSockets[i]->socket().sockfd() = 19
  1443. buffer.size() = 914
  1444. WARN_INTERVAL_SEC = 10
  1445. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1446. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1447. _dataSockets[i]->socket().sockfd() = 18
  1448. buffer.size() = 914
  1449. WARN_INTERVAL_SEC = 10
  1450. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1451. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1452. _dataSockets[i]->socket().sockfd() = 19
  1453. buffer.size() = 1058
  1454. WARN_INTERVAL_SEC = 10
  1455. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1456. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1457. _dataSockets[i]->socket().sockfd() = 18
  1458. buffer.size() = 1058
  1459. WARN_INTERVAL_SEC = 10
  1460. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1461. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1462. _dataSockets[i]->socket().sockfd() = 19
  1463. buffer.size() = 1166
  1464. WARN_INTERVAL_SEC = 10
  1465. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1466. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1467. _dataSockets[i]->socket().sockfd() = 18
  1468. buffer.size() = 1166
  1469. WARN_INTERVAL_SEC = 10
  1470. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1471. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1472. _dataSockets[i]->socket().sockfd() = 19
  1473. buffer.size() = 1310
  1474. WARN_INTERVAL_SEC = 10
  1475. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1476. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1477. _dataSockets[i]->socket().sockfd() = 18
  1478. buffer.size() = 1310
  1479. WARN_INTERVAL_SEC = 10
  1480. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1481. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1482. _dataSockets[i]->socket().sockfd() = 19
  1483. buffer.size() = 1418
  1484. WARN_INTERVAL_SEC = 10
  1485. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1486. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1487. _dataSockets[i]->socket().sockfd() = 18
  1488. buffer.size() = 1418
  1489. WARN_INTERVAL_SEC = 10
  1490. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1491. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1492. _dataSockets[i]->socket().sockfd() = 19
  1493. buffer.size() = 1526
  1494. WARN_INTERVAL_SEC = 10
  1495. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1496. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1497. _dataSockets[i]->socket().sockfd() = 18
  1498. buffer.size() = 1526
  1499. WARN_INTERVAL_SEC = 10
  1500. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1501. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1502. _dataSockets[i]->socket().sockfd() = 19
  1503. buffer.size() = 1670
  1504. WARN_INTERVAL_SEC = 10
  1505. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1506. [40000] WARNING at kernelbufferdrainer.cpp:124 in onTimeoutInterval; REASON='JWARNING(false) failed'
  1507. _dataSockets[i]->socket().sockfd() = 18
  1508. buffer.size() = 1670
  1509. WARN_INTERVAL_SEC = 10
  1510. Message: Still draining socket... perhaps remote host is not running under DMTCP?
  1511. [40000] TRACE at jsocket.cpp:735 in monitorSockets; REASON='accepting new connection'
  1512. i = 4
  1513. sk.sockfd() = 20
  1514. _listenSockets[i].sockfd() = 12
  1515. (strerror((*__errno_location ()))) = Success
  1516. [40000] WARNING at kernelbufferdrainer.cpp:61 in onConnect; REASON='JWARNING(false) failed'
  1517. sock.sockfd() = 20
  1518. Message: we don't yet support checkpointing non-accepted connections... restore will likely fail.. closing connection
  1519. [40000] TRACE at jsocket.cpp:735 in monitorSockets; REASON='accepting new connection'
  1520. i = 4
  1521. sk.sockfd() = 20
  1522. _listenSockets[i].sockfd() = 12
  1523. (strerror((*__errno_location ()))) = Success
  1524. [40000] WARNING at kernelbufferdrainer.cpp:61 in onConnect; REASON='JWARNING(false) failed'
  1525. sock.sockfd() = 20
  1526. Message: we don't yet support checkpointing non-accepted connections... restore will likely fail.. closing connection
  1527. [40000] TRACE at kernelbufferdrainer.cpp:84 in onDisconnect; REASON='found disconnected socket... marking it dead'
  1528. fd = 19
  1529. _reverseLookup[fd] = 6db90f3d5a9dd200-40000-546a1de8(99051)
  1530. (strerror((*__errno_location ()))) = Success
  1531. [40000] TRACE at kernelbufferdrainer.cpp:84 in onDisconnect; REASON='found disconnected socket... marking it dead'
  1532. fd = 18
  1533. _reverseLookup[fd] = 6db90f3d5a9dd200-40000-546a1de8(99046)
  1534. (strerror((*__errno_location ()))) = Success
  1535. [40000] TRACE at socketconnlist.cpp:58 in drain; REASON='recreating disconnected socket'
  1536. id = 6db90f3d5a9dd200-40000-546a1de8(99046)
  1537. [40000] TRACE at socketconnection.cpp:335 in onError; REASON='Error.'
  1538. id() = 6db90f3d5a9dd200-40000-546a1de8(99046)
  1539. [40000] TRACE at socketconnection.cpp:337 in onError; REASON='Creating dead socket.'
  1540. _fds[0] = 18
  1541. _fds.size() = 1
  1542. [40000] TRACE at socketconnlist.cpp:58 in drain; REASON='recreating disconnected socket'
  1543. id = 6db90f3d5a9dd200-40000-546a1de8(99051)
  1544. [40000] TRACE at socketconnection.cpp:335 in onError; REASON='Error.'
  1545. id() = 6db90f3d5a9dd200-40000-546a1de8(99051)
  1546. [40000] TRACE at socketconnection.cpp:337 in onError; REASON='Creating dead socket.'
  1547. _fds[0] = 19
  1548. _fds.size() = 1
  1549. [40000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1550. [40000] TRACE at connectionlist.cpp:94 in eventHook; REASON='draining...'
  1551. [40000] TRACE at connectionlist.cpp:96 in eventHook; REASON='drained'
  1552. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for CHECKPOINT message'
  1553. [41000] TRACE at dmtcpworker.cpp:508 in waitForStage2Checkpoint; REASON='got checkpoint message'
  1554. [41000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1555. [41000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1556. [41000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1557. [41000] TRACE at socketconnlist.cpp:71 in preCkpt; REASON='beginning handshakes'
  1558. [41000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1559. id() = 6db90f3d5a9dd200-40000-546a1de8(99027)
  1560. _fds[0] = 8
  1561. [40000] TRACE at dmtcpworker.cpp:508 in waitForStage2Checkpoint; REASON='got checkpoint message'
  1562. [40000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1563. [40000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1564. [40000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1565. [40000] TRACE at socketconnlist.cpp:71 in preCkpt; REASON='beginning handshakes'
  1566. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1567. id() = 6db90f3d5a9dd200-40000-546a1de8(99007)
  1568. _fds[0] = 5
  1569. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1570. id() = 6db90f3d5a9dd200-40000-546a1de8(99008)
  1571. _fds[0] = 6
  1572. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1573. id() = 6db90f3d5a9dd200-40000-546a1de8(99028)
  1574. _fds[0] = 9
  1575. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1576. id() = 6db90f3d5a9dd200-40000-546a1de8(99030)
  1577. _fds[0] = 10
  1578. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1579. id() = 6db90f3d5a9dd200-40000-546a1de8(99031)
  1580. _fds[0] = 11
  1581. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1582. id() = 6db90f3d5a9dd200-40000-546a1de8(99033)
  1583. _fds[0] = 13
  1584. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1585. id() = 6db90f3d5a9dd200-40000-546a1de8(99034)
  1586. _fds[0] = 14
  1587. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1588. id() = 6db90f3d5a9dd200-40000-546a1de8(99036)
  1589. _fds[0] = 15
  1590. [40000] TRACE at socketconnection.cpp:389 in doSendHandshakes; REASON='Sending handshake ...'
  1591. id() = 6db90f3d5a9dd200-40000-546a1de8(99037)
  1592. _fds[0] = 16
  1593. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1594. id() = 6db90f3d5a9dd200-40000-546a1de8(99007)
  1595. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99008)
  1596. _fds[0] = 5
  1597. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1598. id() = 6db90f3d5a9dd200-40000-546a1de8(99008)
  1599. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99007)
  1600. _fds[0] = 6
  1601. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1602. id() = 6db90f3d5a9dd200-40000-546a1de8(99028)
  1603. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99027)
  1604. _fds[0] = 9
  1605. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1606. id() = 6db90f3d5a9dd200-40000-546a1de8(99030)
  1607. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99031)
  1608. _fds[0] = 10
  1609. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1610. id() = 6db90f3d5a9dd200-40000-546a1de8(99031)
  1611. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99030)
  1612. _fds[0] = 11
  1613. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1614. id() = 6db90f3d5a9dd200-40000-546a1de8(99033)
  1615. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99034)
  1616. _fds[0] = 13
  1617. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1618. id() = 6db90f3d5a9dd200-40000-546a1de8(99034)
  1619. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99033)
  1620. _fds[0] = 14
  1621. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1622. id() = 6db90f3d5a9dd200-40000-546a1de8(99036)
  1623. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99037)
  1624. _fds[0] = 15
  1625. [40000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1626. id() = 6db90f3d5a9dd200-40000-546a1de8(99037)
  1627. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99036)
  1628. _fds[0] = 16
  1629. [40000] TRACE at socketconnlist.cpp:89 in preCkpt; REASON='handshaking done'
  1630. [40000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1631. [40000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1632. [40000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1633. [40000] TRACE at ckptserializer.cpp:545 in writeCkptImage; REASON='Thread performing checkpoint.'
  1634. gettid() = 40002
  1635. [40000] TRACE at ckptserializer.cpp:210 in open_ckpt_to_write_gz; REASON='open_ckpt_to_write_gz
  1636. '
  1637. [40000] TRACE at processinfo.cpp:511 in serialize; REASON='Serialized process information'
  1638. _sid = 1564
  1639. _ppid = 4213
  1640. _gid = 40000
  1641. _fgid = 40000
  1642. _procname = srun
  1643. _hostname = slurm-master
  1644. _launchCWD = /home/slurm
  1645. _ckptCWD = /home/slurm
  1646. _upid = 6db90f3d5a9dd200-40000-546a1de8
  1647. _uppid = 0-0-0
  1648. _compGroup = 6db90f3d5a9dd200-40000-546a1de8
  1649. _numPeers = 2
  1650. _noCoordinator = 0
  1651. _argvSize = 21
  1652. _envSize = 2884
  1653. _elfType = 1
  1654. [41000] TRACE at socketconnection.cpp:404 in doRecvHandshakes; REASON='Received handshake.'
  1655. id() = 6db90f3d5a9dd200-40000-546a1de8(99027)
  1656. _remotePeerId = 6db90f3d5a9dd200-40000-546a1de8(99028)
  1657. _fds[0] = 8
  1658. [41000] TRACE at socketconnlist.cpp:89 in preCkpt; REASON='handshaking done'
  1659. [41000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1660. [41000] TRACE at connectionlist.cpp:100 in eventHook; REASON='preCKpt...'
  1661. [41000] TRACE at connectionlist.cpp:102 in eventHook; REASON='done preCkpt'
  1662. [41000] TRACE at ckptserializer.cpp:545 in writeCkptImage; REASON='Thread performing checkpoint.'
  1663. gettid() = 41002
  1664. [41000] TRACE at ckptserializer.cpp:210 in open_ckpt_to_write_gz; REASON='open_ckpt_to_write_gz
  1665. '
  1666. [41000] TRACE at processinfo.cpp:511 in serialize; REASON='Serialized process information'
  1667. _sid = 1564
  1668. _ppid = 40000
  1669. _gid = 40000
  1670. _fgid = 40000
  1671. _procname = srun
  1672. _hostname = slurm-master
  1673. _launchCWD = /home/slurm
  1674. _ckptCWD = /home/slurm
  1675. _upid = 6db90f3d5a9dd200-41000-546a1de8
  1676. _uppid = 6db90f3d5a9dd200-40000-546a1de8
  1677. _compGroup = 6db90f3d5a9dd200-40000-546a1de8
  1678. _numPeers = 2
  1679. _noCoordinator = 0
  1680. _argvSize = 21
  1681. _envSize = 2884
  1682. _elfType = 1
  1683. [41000] TRACE at processinfo.cpp:522 in serialize; REASON='Serializing ChildPid Table'
  1684. _childTable.size() = 0
  1685. o.filename() =
  1686. [41000] TRACE at ckptserializer.cpp:571 in writeCkptImage; REASON='MTCP is about to write checkpoint image.'
  1687. ckptFilename = /home/slurm/ckpt_srun_6db90f3d5a9dd200-41000-546a1de8.dmtcp
  1688. [41000] TRACE at writeckpt.cpp:70 in mtcp_writememoryareas; REASON='Performing checkpoint.'
  1689. [40000] TRACE at processinfo.cpp:519 in serialize; REASON='This process is Root of Process Tree'
  1690. [40000] TRACE at processinfo.cpp:522 in serialize; REASON='Serializing ChildPid Table'
  1691. _childTable.size() = 1
  1692. o.filename() =
  1693. [40000] TRACE at ckptserializer.cpp:571 in writeCkptImage; REASON='MTCP is about to write checkpoint image.'
  1694. ckptFilename = /home/slurm/ckpt_srun_6db90f3d5a9dd200-40000-546a1de8.dmtcp
  1695. [40000] TRACE at writeckpt.cpp:70 in mtcp_writememoryareas; REASON='Performing checkpoint.'
  1696. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1697. addr = 0x400000
  1698. area->size = 1318912
  1699. area->name = /usr/local/bin/srun
  1700. area->offset = 0
  1701. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1702. addr = 0x400000
  1703. area->size = 1318912
  1704. area->name = /usr/local/bin/srun
  1705. area->offset = 0
  1706. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1707. addr = 0x742000
  1708. area->size = 24576
  1709. area->name = /usr/local/bin/srun
  1710. area->offset = 1318912
  1711. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1712. addr = 0x742000
  1713. area->size = 24576
  1714. area->name = /usr/local/bin/srun
  1715. area->offset = 1318912
  1716. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1717. addr = 0x748000
  1718. area->size = 20480
  1719. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1720. addr = 0x748000
  1721. area->size = 20480
  1722. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1723. addr = 0x1e88000
  1724. area->size = 745472
  1725. area->name = [heap]
  1726. area->offset = 0
  1727. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1728. addr = 0x1e88000
  1729. area->size = 4116480
  1730. area->name = [heap]
  1731. area->offset = 0
  1732. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1733. addr = 0x7fa898000000
  1734. area->size = 135168
  1735. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1736. addr = 0x7fa898021000
  1737. area->size = 66973696
  1738. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1739. addr = 0x7fa89cf2e000
  1740. area->size = 32768
  1741. area->name = /usr/lib64/libmunge.so.2.0.0
  1742. area->offset = 0
  1743. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1744. addr = 0x7fa89d136000
  1745. area->size = 4096
  1746. area->name = /usr/lib64/libmunge.so.2.0.0
  1747. area->offset = 32768
  1748. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1749. addr = 0x7fa89d137000
  1750. area->size = 12288
  1751. area->name = /usr/local/lib/slurm/auth_munge.so
  1752. area->offset = 0
  1753. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1754. addr = 0x7fa89d339000
  1755. area->size = 4096
  1756. area->name = /usr/local/lib/slurm/auth_munge.so
  1757. area->offset = 8192
  1758. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1759. addr = 0x7fa89d33a000
  1760. area->size = 77824
  1761. area->name = /usr/local/lib/slurm/mpi_pmi2.so
  1762. area->offset = 0
  1763. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1764. addr = 0x7fa89d54c000
  1765. area->size = 8192
  1766. area->name = /usr/local/lib/slurm/mpi_pmi2.so
  1767. area->offset = 73728
  1768. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1769. addr = 0x7fa89d54e000
  1770. area->size = 20480
  1771. area->name = /usr/local/lib/slurm/launch_slurm.so
  1772. area->offset = 0
  1773. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1774. addr = 0x7fa89d752000
  1775. area->size = 4096
  1776. area->name = /usr/local/lib/slurm/launch_slurm.so
  1777. area->offset = 16384
  1778. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1779. addr = 0x7fa89d753000
  1780. area->size = 8192
  1781. area->name = /usr/local/lib/slurm/switch_none.so
  1782. area->offset = 0
  1783. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1784. addr = 0x7fa89d954000
  1785. area->size = 4096
  1786. area->name = /usr/local/lib/slurm/switch_none.so
  1787. area->offset = 4096
  1788. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1789. addr = 0x7fa89d955000
  1790. area->size = 45056
  1791. area->name = /usr/local/lib/slurm/select_linear.so
  1792. area->offset = 0
  1793. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1794. addr = 0x7fa89db5f000
  1795. area->size = 4096
  1796. area->name = /usr/local/lib/slurm/select_linear.so
  1797. area->offset = 40960
  1798. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1799. addr = 0x7fa89db60000
  1800. area->size = 4096
  1801. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1802. addr = 0x7fa89db61000
  1803. area->size = 10485760
  1804. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1805. addr = 0x7fa87c000000
  1806. area->size = 135168
  1807. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1808. addr = 0x7fa89e793000
  1809. area->size = 4096
  1810. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1811. addr = 0x7fa89f194000
  1812. area->size = 4096
  1813. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1814. addr = 0x7fa89f195000
  1815. area->size = 49152
  1816. area->name = /lib64/libnss_files-2.12.so
  1817. area->offset = 0
  1818. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1819. addr = 0x7fa87c021000
  1820. area->size = 66973696
  1821. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1822. addr = 0x7fa89f3a1000
  1823. area->size = 4096
  1824. area->name = /lib64/libnss_files-2.12.so
  1825. area->offset = 49152
  1826. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1827. addr = 0x7fa89f3a2000
  1828. area->size = 4096
  1829. area->name = /lib64/libnss_files-2.12.so
  1830. area->offset = 53248
  1831. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1832. addr = 0x7fa89f3a3000
  1833. area->size = 28672
  1834. area->name = /lib64/librt-2.12.so
  1835. area->offset = 0
  1836. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1837. addr = 0x7fa89f5a9000
  1838. area->size = 4096
  1839. area->name = /lib64/librt-2.12.so
  1840. area->offset = 24576
  1841. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1842. addr = 0x7fa89f5aa000
  1843. area->size = 4096
  1844. area->name = /lib64/librt-2.12.so
  1845. area->offset = 28672
  1846. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1847. addr = 0x7fa89f5ab000
  1848. area->size = 90112
  1849. area->name = /lib64/libgcc_s-4.4.7-20120601.so.1
  1850. area->offset = 0
  1851. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1852. addr = 0x7fa89f7c0000
  1853. area->size = 4096
  1854. area->name = /lib64/libgcc_s-4.4.7-20120601.so.1
  1855. area->offset = 86016
  1856. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1857. addr = 0x7fa89f7c1000
  1858. area->size = 536576
  1859. area->name = /lib64/libm-2.12.so
  1860. area->offset = 0
  1861. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1862. addr = 0x7fa880000000
  1863. area->size = 135168
  1864. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1865. addr = 0x7fa880021000
  1866. area->size = 66973696
  1867. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1868. addr = 0x7fa89fa43000
  1869. area->size = 4096
  1870. area->name = /lib64/libm-2.12.so
  1871. area->offset = 532480
  1872. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1873. addr = 0x7fa89fa44000
  1874. area->size = 4096
  1875. area->name = /lib64/libm-2.12.so
  1876. area->offset = 536576
  1877. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1878. addr = 0x7fa89fa45000
  1879. area->size = 950272
  1880. area->name = /usr/lib64/libstdc++.so.6.0.13
  1881. area->offset = 0
  1882. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1883. addr = 0x7fa887eff000
  1884. area->size = 4096
  1885. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1886. addr = 0x7fa887f00000
  1887. area->size = 1048576
  1888. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1889. addr = 0x7fa888000000
  1890. area->size = 135168
  1891. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1892. addr = 0x7fa888021000
  1893. area->size = 66973696
  1894. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1895. addr = 0x7fa89fd2d000
  1896. area->size = 28672
  1897. area->name = /usr/lib64/libstdc++.so.6.0.13
  1898. area->offset = 950272
  1899. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1900. addr = 0x7fa89fd34000
  1901. area->size = 8192
  1902. area->name = /usr/lib64/libstdc++.so.6.0.13
  1903. area->offset = 978944
  1904. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1905. addr = 0x7fa89fd36000
  1906. area->size = 86016
  1907. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1908. addr = 0x7fa89fd4b000
  1909. area->size = 1613824
  1910. area->name = /lib64/libc-2.12.so
  1911. area->offset = 0
  1912. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1913. addr = 0x7fa88c000000
  1914. area->size = 3149824
  1915. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1916. addr = 0x7fa88c301000
  1917. area->size = 63959040
  1918. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1919. addr = 0x7fa890000000
  1920. area->size = 3149824
  1921. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1922. addr = 0x7fa890301000
  1923. area->size = 63959040
  1924. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1925. addr = 0x7fa894000000
  1926. area->size = 135168
  1927. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1928. addr = 0x7fa894021000
  1929. area->size = 66973696
  1930. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1931. addr = 0x7fa8a00d5000
  1932. area->size = 16384
  1933. area->name = /lib64/libc-2.12.so
  1934. area->offset = 1613824
  1935. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1936. addr = 0x7fa8a00d9000
  1937. area->size = 4096
  1938. area->name = /lib64/libc-2.12.so
  1939. area->offset = 1630208
  1940. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1941. addr = 0x7fa8a00da000
  1942. area->size = 20480
  1943. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1944. addr = 0x7fa8a00df000
  1945. area->size = 94208
  1946. area->name = /lib64/libpthread-2.12.so
  1947. area->offset = 0
  1948. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1949. addr = 0x7fa8a02f6000
  1950. area->size = 4096
  1951. area->name = /lib64/libpthread-2.12.so
  1952. area->offset = 94208
  1953. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1954. addr = 0x7fa8a02f7000
  1955. area->size = 4096
  1956. area->name = /lib64/libpthread-2.12.so
  1957. area->offset = 98304
  1958. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1959. addr = 0x7fa8a02f8000
  1960. area->size = 16384
  1961. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1962. addr = 0x7fa8a02fc000
  1963. area->size = 8192
  1964. area->name = /lib64/libdl-2.12.so
  1965. area->offset = 0
  1966. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1967. addr = 0x7fa8a04fe000
  1968. area->size = 4096
  1969. area->name = /lib64/libdl-2.12.so
  1970. area->offset = 8192
  1971. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1972. addr = 0x7fa8a04ff000
  1973. area->size = 4096
  1974. area->name = /lib64/libdl-2.12.so
  1975. area->offset = 12288
  1976. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1977. addr = 0x7fa8a0500000
  1978. area->size = 155648
  1979. area->name = /usr/local/lib/dmtcp/libdmtcp_pid.so
  1980. area->offset = 0
  1981. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1982. addr = 0x7fa8a0725000
  1983. area->size = 8192
  1984. area->name = /usr/local/lib/dmtcp/libdmtcp_pid.so
  1985. area->offset = 151552
  1986. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1987. addr = 0x7fa8a0727000
  1988. area->size = 823296
  1989. area->name = /usr/local/lib/dmtcp/libdmtcp.so
  1990. area->offset = 0
  1991. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1992. addr = 0x7fa898000000
  1993. area->size = 135168
  1994. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  1995. addr = 0x7fa898021000
  1996. area->size = 66973696
  1997. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  1998. addr = 0x7fa8a09ef000
  1999. area->size = 20480
  2000. area->name = /usr/local/lib/dmtcp/libdmtcp.so
  2001. area->offset = 819200
  2002. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2003. addr = 0x7fa8a09f4000
  2004. area->size = 20480
  2005. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2006. addr = 0x7fa8a09f9000
  2007. area->size = 1105920
  2008. area->name = /usr/local/lib/dmtcp/libdmtcp_ipc.so
  2009. area->offset = 0
  2010. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2011. addr = 0x7fa89c028000
  2012. area->size = 4096
  2013. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2014. addr = 0x7fa89c029000
  2015. area->size = 1048576
  2016. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2017. addr = 0x7fa89c129000
  2018. area->size = 4096
  2019. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2020. addr = 0x7fa89c12a000
  2021. area->size = 1048576
  2022. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2023. addr = 0x7fa89c22a000
  2024. area->size = 4096
  2025. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2026. addr = 0x7fa89c22b000
  2027. area->size = 1048576
  2028. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2029. addr = 0x7fa89c32b000
  2030. area->size = 4096
  2031. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2032. addr = 0x7fa89c32c000
  2033. area->size = 1048576
  2034. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2035. addr = 0x7fa8a0d07000
  2036. area->size = 28672
  2037. area->name = /usr/local/lib/dmtcp/libdmtcp_ipc.so
  2038. area->offset = 1105920
  2039. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2040. addr = 0x7fa8a0d0e000
  2041. area->size = 4096
  2042. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2043. addr = 0x7fa8a0d0f000
  2044. area->size = 4096
  2045. area->name = /usr/local/lib/dmtcp/libdmtcp_dl.so
  2046. area->offset = 0
  2047. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2048. addr = 0x7fa8a0f0f000
  2049. area->size = 4096
  2050. area->name = /usr/local/lib/dmtcp/libdmtcp_dl.so
  2051. area->offset = 0
  2052. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2053. addr = 0x7fa8a0f10000
  2054. area->size = 4096
  2055. area->name = /usr/local/lib/dmtcp/libdmtcp_alloc.so
  2056. area->offset = 0
  2057. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2058. addr = 0x7fa8a1111000
  2059. area->size = 4096
  2060. area->name = /usr/local/lib/dmtcp/libdmtcp_alloc.so
  2061. area->offset = 4096
  2062. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2063. addr = 0x7fa8a1112000
  2064. area->size = 77824
  2065. area->name = /usr/local/lib/dmtcp/libdmtcp_batch-queue.so
  2066. area->offset = 0
  2067. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2068. addr = 0x7fa89c42c000
  2069. area->size = 4096
  2070. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2071. addr = 0x7fa89c42d000
  2072. area->size = 10485760
  2073. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2074. addr = 0x7fa8a1325000
  2075. area->size = 4096
  2076. area->name = /usr/local/lib/dmtcp/libdmtcp_batch-queue.so
  2077. area->offset = 77824
  2078. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2079. addr = 0x7fa8a1326000
  2080. area->size = 131072
  2081. area->name = /lib64/ld-2.12.so
  2082. area->offset = 0
  2083. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2084. addr = 0x7fa8a1421000
  2085. area->size = 4096
  2086. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2087. addr = 0x7fa8a1422000
  2088. area->size = 1159168
  2089. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2090. addr = 0x7fa89ce2d000
  2091. area->size = 4096
  2092. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2093. addr = 0x7fa89ce2e000
  2094. area->size = 1048576
  2095. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2096. addr = 0x7fa89cf2e000
  2097. area->size = 32768
  2098. area->name = /usr/lib64/libmunge.so.2.0.0
  2099. area->offset = 0
  2100. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2101. addr = 0x7fa89d136000
  2102. area->size = 4096
  2103. area->name = /usr/lib64/libmunge.so.2.0.0
  2104. area->offset = 32768
  2105. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2106. addr = 0x7fa89d137000
  2107. area->size = 12288
  2108. area->name = /usr/local/lib/slurm/auth_munge.so
  2109. area->offset = 0
  2110. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2111. addr = 0x7fa89d339000
  2112. area->size = 4096
  2113. area->name = /usr/local/lib/slurm/auth_munge.so
  2114. area->offset = 8192
  2115. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2116. addr = 0x7fa89d33a000
  2117. area->size = 77824
  2118. area->name = /usr/local/lib/slurm/mpi_pmi2.so
  2119. area->offset = 0
  2120. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2121. addr = 0x7fa8a153e000
  2122. area->size = 28672
  2123. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2124. addr = 0x7fa89d54c000
  2125. area->size = 8192
  2126. area->name = /usr/local/lib/slurm/mpi_pmi2.so
  2127. area->offset = 73728
  2128. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2129. addr = 0x7fa8a1545000
  2130. area->size = 4096
  2131. area->name = /lib64/ld-2.12.so
  2132. area->offset = 126976
  2133. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2134. addr = 0x7fa8a1546000
  2135. area->size = 4096
  2136. area->name = /lib64/ld-2.12.so
  2137. area->offset = 131072
  2138. [41000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2139. addr = 0x7fa8a1547000
  2140. area->size = 4096
  2141. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2142. addr = 0x7fffe526a000
  2143. area->size = 10420224
  2144. area->name = [stack]
  2145. area->offset = 0
  2146. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2147. addr = 0x7fa89d54e000
  2148. area->size = 20480
  2149. area->name = /usr/local/lib/slurm/launch_slurm.so
  2150. area->offset = 0
  2151. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2152. addr = 0x7fa89d752000
  2153. area->size = 4096
  2154. area->name = /usr/local/lib/slurm/launch_slurm.so
  2155. area->offset = 16384
  2156. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2157. addr = 0x7fa89d753000
  2158. area->size = 8192
  2159. area->name = /usr/local/lib/slurm/switch_none.so
  2160. area->offset = 0
  2161. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2162. addr = 0x7fa89d954000
  2163. area->size = 4096
  2164. area->name = /usr/local/lib/slurm/switch_none.so
  2165. area->offset = 4096
  2166. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2167. addr = 0x7fa89d955000
  2168. area->size = 45056
  2169. area->name = /usr/local/lib/slurm/select_linear.so
  2170. area->offset = 0
  2171. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2172. addr = 0x7fa89db5f000
  2173. area->size = 4096
  2174. area->name = /usr/local/lib/slurm/select_linear.so
  2175. area->offset = 40960
  2176. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2177. addr = 0x7fa89db60000
  2178. area->size = 4096
  2179. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2180. addr = 0x7fa89db61000
  2181. area->size = 10485760
  2182. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2183. addr = 0x7fa89e793000
  2184. area->size = 4096
  2185. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2186. addr = 0x7fa89f194000
  2187. area->size = 4096
  2188. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2189. addr = 0x7fa89f195000
  2190. area->size = 49152
  2191. area->name = /lib64/libnss_files-2.12.so
  2192. area->offset = 0
  2193. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2194. addr = 0x7fa89f3a1000
  2195. area->size = 4096
  2196. area->name = /lib64/libnss_files-2.12.so
  2197. area->offset = 49152
  2198. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2199. addr = 0x7fa89f3a2000
  2200. area->size = 4096
  2201. area->name = /lib64/libnss_files-2.12.so
  2202. area->offset = 53248
  2203. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2204. addr = 0x7fa89f3a3000
  2205. area->size = 28672
  2206. area->name = /lib64/librt-2.12.so
  2207. area->offset = 0
  2208. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2209. addr = 0x7fa89f5a9000
  2210. area->size = 4096
  2211. area->name = /lib64/librt-2.12.so
  2212. area->offset = 24576
  2213. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2214. addr = 0x7fa89f5aa000
  2215. area->size = 4096
  2216. area->name = /lib64/librt-2.12.so
  2217. area->offset = 28672
  2218. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2219. addr = 0x7fa89f5ab000
  2220. area->size = 90112
  2221. area->name = /lib64/libgcc_s-4.4.7-20120601.so.1
  2222. area->offset = 0
  2223. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2224. addr = 0x7fa89f7c0000
  2225. area->size = 4096
  2226. area->name = /lib64/libgcc_s-4.4.7-20120601.so.1
  2227. area->offset = 86016
  2228. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2229. addr = 0x7fa89f7c1000
  2230. area->size = 536576
  2231. area->name = /lib64/libm-2.12.so
  2232. area->offset = 0
  2233. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2234. addr = 0x7fa89fa43000
  2235. area->size = 4096
  2236. area->name = /lib64/libm-2.12.so
  2237. area->offset = 532480
  2238. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2239. addr = 0x7fa89fa44000
  2240. area->size = 4096
  2241. area->name = /lib64/libm-2.12.so
  2242. area->offset = 536576
  2243. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2244. addr = 0x7fa89fa45000
  2245. area->size = 950272
  2246. area->name = /usr/lib64/libstdc++.so.6.0.13
  2247. area->offset = 0
  2248. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2249. addr = 0x7fa89fd2d000
  2250. area->size = 28672
  2251. area->name = /usr/lib64/libstdc++.so.6.0.13
  2252. area->offset = 950272
  2253. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2254. addr = 0x7fa89fd34000
  2255. area->size = 8192
  2256. area->name = /usr/lib64/libstdc++.so.6.0.13
  2257. area->offset = 978944
  2258. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2259. addr = 0x7fa89fd36000
  2260. area->size = 86016
  2261. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2262. addr = 0x7fa89fd4b000
  2263. area->size = 1613824
  2264. area->name = /lib64/libc-2.12.so
  2265. area->offset = 0
  2266. [41000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2267. addr = 0x7fffe5ca5000
  2268. area->size = 4096
  2269. area->name = [vdso]
  2270. area->offset = 0
  2271. [41000] TRACE at shareddata.cpp:189 in initialize; REASON='Shared area mapped'
  2272. sharedDataHeader = 0x7fa89e561000
  2273. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2274. addr = 0x7fa8a00d5000
  2275. area->size = 16384
  2276. area->name = /lib64/libc-2.12.so
  2277. area->offset = 1613824
  2278. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2279. addr = 0x7fa8a00d9000
  2280. area->size = 4096
  2281. area->name = /lib64/libc-2.12.so
  2282. area->offset = 1630208
  2283. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2284. addr = 0x7fa8a00da000
  2285. area->size = 20480
  2286. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2287. addr = 0x7fa8a00df000
  2288. area->size = 94208
  2289. area->name = /lib64/libpthread-2.12.so
  2290. area->offset = 0
  2291. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2292. addr = 0x7fa8a02f6000
  2293. area->size = 4096
  2294. area->name = /lib64/libpthread-2.12.so
  2295. area->offset = 94208
  2296. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2297. addr = 0x7fa8a02f7000
  2298. area->size = 4096
  2299. area->name = /lib64/libpthread-2.12.so
  2300. area->offset = 98304
  2301. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2302. addr = 0x7fa8a02f8000
  2303. area->size = 16384
  2304. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2305. addr = 0x7fa8a02fc000
  2306. area->size = 8192
  2307. area->name = /lib64/libdl-2.12.so
  2308. area->offset = 0
  2309. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2310. addr = 0x7fa8a04fe000
  2311. area->size = 4096
  2312. area->name = /lib64/libdl-2.12.so
  2313. area->offset = 8192
  2314. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2315. addr = 0x7fa8a04ff000
  2316. area->size = 4096
  2317. area->name = /lib64/libdl-2.12.so
  2318. area->offset = 12288
  2319. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2320. addr = 0x7fa8a0500000
  2321. area->size = 155648
  2322. area->name = /usr/local/lib/dmtcp/libdmtcp_pid.so
  2323. area->offset = 0
  2324. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2325. addr = 0x7fa8a0725000
  2326. area->size = 8192
  2327. area->name = /usr/local/lib/dmtcp/libdmtcp_pid.so
  2328. area->offset = 151552
  2329. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2330. addr = 0x7fa8a0727000
  2331. area->size = 823296
  2332. area->name = /usr/local/lib/dmtcp/libdmtcp.so
  2333. area->offset = 0
  2334. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2335. addr = 0x7fa8a09ef000
  2336. area->size = 20480
  2337. area->name = /usr/local/lib/dmtcp/libdmtcp.so
  2338. area->offset = 819200
  2339. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2340. addr = 0x7fa8a09f4000
  2341. area->size = 20480
  2342. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2343. addr = 0x7fa8a09f9000
  2344. area->size = 1105920
  2345. area->name = /usr/local/lib/dmtcp/libdmtcp_ipc.so
  2346. area->offset = 0
  2347. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2348. addr = 0x7fa8a0d07000
  2349. area->size = 28672
  2350. area->name = /usr/local/lib/dmtcp/libdmtcp_ipc.so
  2351. area->offset = 1105920
  2352. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2353. addr = 0x7fa8a0d0e000
  2354. area->size = 4096
  2355. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2356. addr = 0x7fa8a0d0f000
  2357. area->size = 4096
  2358. area->name = /usr/local/lib/dmtcp/libdmtcp_dl.so
  2359. area->offset = 0
  2360. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2361. addr = 0x7fa8a0f0f000
  2362. area->size = 4096
  2363. area->name = /usr/local/lib/dmtcp/libdmtcp_dl.so
  2364. area->offset = 0
  2365. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2366. addr = 0x7fa8a0f10000
  2367. area->size = 4096
  2368. area->name = /usr/local/lib/dmtcp/libdmtcp_alloc.so
  2369. area->offset = 0
  2370. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2371. addr = 0x7fa8a1111000
  2372. area->size = 4096
  2373. area->name = /usr/local/lib/dmtcp/libdmtcp_alloc.so
  2374. area->offset = 4096
  2375. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2376. addr = 0x7fa8a1112000
  2377. area->size = 77824
  2378. area->name = /usr/local/lib/dmtcp/libdmtcp_batch-queue.so
  2379. area->offset = 0
  2380. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2381. addr = 0x7fa8a1325000
  2382. area->size = 4096
  2383. area->name = /usr/local/lib/dmtcp/libdmtcp_batch-queue.so
  2384. area->offset = 77824
  2385. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2386. addr = 0x7fa8a1326000
  2387. area->size = 131072
  2388. area->name = /lib64/ld-2.12.so
  2389. area->offset = 0
  2390. [41000] TRACE at ckptserializer.cpp:599 in writeCkptImage; REASON='checkpoint complete'
  2391. [41000] TRACE at threadlist.cpp:357 in checkpointhread; REASON='before callbackPostCheckpoint(0, NULL)'
  2392. [41000] TRACE at coordinatorapi.cpp:672 in sendCkptFilename; REASON='recording filenames'
  2393. ckptFilename = /home/slurm/ckpt_srun_6db90f3d5a9dd200-41000-546a1de8.dmtcp
  2394. hostname = slurm-master
  2395. [41000] TRACE at dmtcpworker.cpp:519 in waitForStage3Refill; REASON='checkpointed'
  2396. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for REGISTER_NAME_SERVICE_DATA message'
  2397. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2398. addr = 0x7fa8a1421000
  2399. area->size = 4096
  2400. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2401. addr = 0x7fa8a1422000
  2402. area->size = 1159168
  2403. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2404. addr = 0x7fa8a153e000
  2405. area->size = 28672
  2406. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2407. addr = 0x7fa8a1545000
  2408. area->size = 4096
  2409. area->name = /lib64/ld-2.12.so
  2410. area->offset = 126976
  2411. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2412. addr = 0x7fa8a1546000
  2413. area->size = 4096
  2414. area->name = /lib64/ld-2.12.so
  2415. area->offset = 131072
  2416. [40000] TRACE at writeckpt.cpp:425 in writememoryarea; REASON='save anonymous'
  2417. addr = 0x7fa8a1547000
  2418. area->size = 4096
  2419. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2420. addr = 0x7fffe526a000
  2421. area->size = 10420224
  2422. area->name = [stack]
  2423. area->offset = 0
  2424. [40000] TRACE at writeckpt.cpp:427 in writememoryarea; REASON='save anonymous'
  2425. addr = 0x7fffe5ca5000
  2426. area->size = 4096
  2427. area->name = [vdso]
  2428. area->offset = 0
  2429. [40000] TRACE at shareddata.cpp:189 in initialize; REASON='Shared area mapped'
  2430. sharedDataHeader = 0x7fa89e561000
  2431. [40000] TRACE at ckptserializer.cpp:599 in writeCkptImage; REASON='checkpoint complete'
  2432. [40000] TRACE at threadlist.cpp:357 in checkpointhread; REASON='before callbackPostCheckpoint(0, NULL)'
  2433. [40000] TRACE at coordinatorapi.cpp:672 in sendCkptFilename; REASON='recording filenames'
  2434. ckptFilename = /home/slurm/ckpt_srun_6db90f3d5a9dd200-40000-546a1de8.dmtcp
  2435. hostname = slurm-master
  2436. [40000] TRACE at dmtcpworker.cpp:519 in waitForStage3Refill; REASON='checkpointed'
  2437. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for REGISTER_NAME_SERVICE_DATA message'
  2438. [41000] TRACE at dmtcpworker.cpp:528 in waitForStage3Refill; REASON='Key Value Pairs registered with the coordinator'
  2439. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SEND_QUERIES message'
  2440. [40000] TRACE at dmtcpworker.cpp:528 in waitForStage3Refill; REASON='Key Value Pairs registered with the coordinator'
  2441. [41000] TRACE at dmtcpworker.cpp:533 in waitForStage3Refill; REASON='Queries sent to the coordinator'
  2442. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for REFILL message'
  2443. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SEND_QUERIES message'
  2444. [40000] TRACE at dmtcpworker.cpp:533 in waitForStage3Refill; REASON='Queries sent to the coordinator'
  2445. [41000] TRACE at kernelbufferdrainer.cpp:167 in refillAllSockets; REASON='refilling socket buffers'
  2446. _drainedData.size() = 1
  2447. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for REFILL message'
  2448. [40000] TRACE at kernelbufferdrainer.cpp:167 in refillAllSockets; REASON='refilling socket buffers'
  2449. _drainedData.size() = 9
  2450. [41000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2451. size = 0
  2452. [41000] TRACE at kernelbufferdrainer.cpp:210 in refillAllSockets; REASON='buffers refilled'
  2453. [41000] TRACE at dmtcpworker.cpp:545 in waitForStage4Resume; REASON='refilled'
  2454. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for RESUME message'
  2455. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2456. size = 0
  2457. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2458. size = 0
  2459. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2460. size = 0
  2461. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2462. size = 0
  2463. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2464. size = 0
  2465. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2466. size = 0
  2467. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2468. size = 0
  2469. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2470. size = 0
  2471. [40000] TRACE at kernelbufferdrainer.cpp:199 in refillAllSockets; REASON='repeating buffer back to peer'
  2472. size = 0
  2473. [40000] TRACE at kernelbufferdrainer.cpp:210 in refillAllSockets; REASON='buffers refilled'
  2474. [40000] TRACE at dmtcpworker.cpp:545 in waitForStage4Resume; REASON='refilled'
  2475. [41000] TRACE at dmtcpworker.cpp:548 in waitForStage4Resume; REASON='got resume message'
  2476. [41000] TRACE at threadlist.cpp:361 in checkpointhread; REASON='resuming everything'
  2477. [41000] TRACE at threadlist.cpp:363 in checkpointhread; REASON='everything resumed'
  2478. [41000] TRACE at threadlist.cpp:334 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  2479. [41000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2480. curThread->tid = 6373
  2481. [41000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2482. curThread->tid = 6373
  2483. __builtin_return_address(0) = 0x7fa8a00ee710
  2484. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for RESUME message'
  2485. [40000] TRACE at dmtcpworker.cpp:548 in waitForStage4Resume; REASON='got resume message'
  2486. [40000] TRACE at threadlist.cpp:361 in checkpointhread; REASON='resuming everything'
  2487. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2488. curThread->tid = 6377
  2489. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2490. curThread->tid = 6377
  2491. __builtin_return_address(0) = 0x7fa8a00ee710
  2492. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2493. curThread->tid = 6375
  2494. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2495. curThread->tid = 6375
  2496. __builtin_return_address(0) = 0x7fa8a00ee710
  2497. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2498. curThread->tid = 6374
  2499. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2500. curThread->tid = 6374
  2501. __builtin_return_address(0) = 0x7fa8a00ee710
  2502. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2503. curThread->tid = 6369
  2504. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2505. curThread->tid = 6369
  2506. __builtin_return_address(0) = 0x7fa8a00ee710
  2507. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2508. curThread->tid = 6365
  2509. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2510. curThread->tid = 6365
  2511. __builtin_return_address(0) = 0x7fa8a00ee710
  2512. [40000] TRACE at threadlist.cpp:532 in stopthisthread; REASON='User thread resuming'
  2513. curThread->tid = 6378
  2514. [40000] TRACE at threadlist.cpp:543 in stopthisthread; REASON='User thread returning to user code'
  2515. curThread->tid = 6378
  2516. __builtin_return_address(0) = 0x7fa8a00ee710
  2517. slurmstepd-slurm-compute1: Message length of 2071343164 exceeds maximum of 1024
  2518. iteration 6 on process 0
  2519. slurmstepd-slurm-compute2: Message length of 2071343164 exceeds maximum of 1024
  2520. iteration 6 on process 1
  2521. iteration 7 on process 0
  2522. iteration 7 on process 1
  2523. iteration 8 on process 0
  2524. iteration 8 on process 1
  2525. iteration 9 on process 0
  2526. iteration 9 on process 1
  2527. iteration 10 on process 0
  2528. iteration 10 on process 1
  2529. iteration 11 on process 0
  2530. iteration 11 on process 1
  2531. iteration 12 on process 0
  2532. iteration 12 on process 1
  2533. iteration 13 on process 0
  2534. iteration 13 on process 1
  2535. iteration 14 on process 0
  2536. iteration 14 on process 1
  2537. iteration 15 on process 0
  2538. iteration 15 on process 1
  2539. iteration 16 on process 0
  2540. iteration 16 on process 1
  2541. iteration 17 on process 0
  2542. iteration 17 on process 1
  2543. iteration 18 on process 0
  2544. iteration 18 on process 1
  2545. iteration 19 on process 0
  2546. iteration 19 on process 1
  2547. iteration 20 on process 0
  2548. iteration 20 on process 1
  2549. iteration 21 on process 0
  2550. iteration 21 on process 1
  2551. iteration 22 on process 0
  2552. iteration 22 on process 1
  2553. iteration 23 on process 0
  2554. iteration 23 on process 1
  2555. iteration 24 on process 0
  2556. iteration 24 on process 1
  2557. iteration 25 on process 0
  2558. iteration 25 on process 1
  2559. iteration 26 on process 0
  2560. iteration 26 on process 1
  2561. iteration 27 on process 0
  2562. iteration 27 on process 1
  2563. iteration 28 on process 0
  2564. iteration 28 on process 1
  2565. iteration 29 on process 0
  2566. slurmstepd-slurm-compute1: Failed to send MESSAGE_TASK_EXIT: Transport endpoint is not connected
  2567. iteration 29 on process 1
  2568. slurmstepd-slurm-compute2: Failed to send MESSAGE_TASK_EXIT: Transport endpoint is not connected
  2569. iteration 30 on process 0
  2570. iteration 30 on process 1
  2571. iteration 31 on process 0
  2572. iteration 31 on process 1
  2573. iteration 32 on process 0
  2574. iteration 32 on process 1
  2575. iteration 33 on process 0
  2576. iteration 33 on process 1
  2577. iteration 34 on process 0
  2578. iteration 34 on process 1
  2579. iteration 35 on process 0
  2580. iteration 35 on process 1
  2581. iteration 36 on process 0
  2582. iteration 36 on process 1
  2583. iteration 37 on process 0
  2584. iteration 37 on process 1
  2585. iteration 38 on process 0
  2586. iteration 38 on process 1
  2587. iteration 39 on process 0
  2588. iteration 39 on process 1
  2589. iteration 40 on process 0
  2590. iteration 40 on process 1
  2591. iteration 41 on process 0
  2592. iteration 41 on process 1
  2593. iteration 42 on process 0
  2594. iteration 42 on process 1
  2595. iteration 43 on process 0
  2596. iteration 43 on process 1
  2597. iteration 44 on process 0
  2598. iteration 44 on process 1
  2599. iteration 45 on process 0
  2600. iteration 45 on process 1
  2601. iteration 46 on process 0
  2602. iteration 46 on process 1
  2603. iteration 47 on process 0
  2604. iteration 47 on process 1
  2605. iteration 48 on process 0
  2606. iteration 48 on process 1
  2607. iteration 49 on process 0
  2608. iteration 49 on process 1
  2609. Goodbye world from process 0 of 2
  2610. Goodbye world from process 1 of 2
  2611. [40000] TRACE at threadlist.cpp:363 in checkpointhread; REASON='everything resumed'
  2612. [40000] TRACE at threadlist.cpp:334 in checkpointhread; REASON='before callbackSleepBetweenCheckpoint(0)'
  2613. [40000] TRACE at dmtcpworker.cpp:468 in waitForStage1Suspend; REASON='running'
  2614. [40000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SUSPEND message'
  2615. [41000] TRACE at dmtcpworker.cpp:468 in waitForStage1Suspend; REASON='running'
  2616. [41000] TRACE at dmtcpworker.cpp:428 in waitForCoordinatorMsg; REASON='waiting for SUSPEND message'
  2617. ^Csrun: interrupt (one more within 1 sec to abort)
  2618. srun: tasks 0-1: running
  2619. ^Csrun: sending Ctrl-C to job 107.0
  2620. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  2621. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  2622. tid = 6403
  2623. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  2624. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  2625. tid = 6404
  2626. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  2627. virtualTid = 40030
  2628. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  2629. th->tid = 6403
  2630. th->virtual_tid = 40030
  2631. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  2632. gettid() = 40030
  2633. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2634. ret = 18
  2635. domain = 2
  2636. type = 1
  2637. protocol = 6
  2638. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2639. id() = 6db90f3d5a9dd200-40000-546a1de8(99075)
  2640. domain = 2
  2641. type = 1
  2642. protocol = 6
  2643. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  2644. virtualTid = 40032
  2645. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  2646. th->tid = 6404
  2647. th->virtual_tid = 40032
  2648. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  2649. gettid() = 40032
  2650. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2651. ret = 19
  2652. domain = 2
  2653. type = 1
  2654. protocol = 6
  2655. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2656. id() = 6db90f3d5a9dd200-40000-546a1de8(99076)
  2657. domain = 2
  2658. type = 1
  2659. protocol = 6
  2660. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2661. sockfd = 18
  2662. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99075)
  2663. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2664. ret = 20
  2665. domain = 1
  2666. type = 1
  2667. protocol = 0
  2668. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2669. id() = 6db90f3d5a9dd200-40000-546a1de8(99077)
  2670. domain = 1
  2671. type = 1
  2672. protocol = 0
  2673. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2674. sockfd = 20
  2675. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99077)
  2676. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2677. sockfd = 19
  2678. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99076)
  2679. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2680. ret = 20
  2681. domain = 1
  2682. type = 1
  2683. protocol = 0
  2684. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2685. id() = 6db90f3d5a9dd200-40000-546a1de8(99078)
  2686. domain = 1
  2687. type = 1
  2688. protocol = 0
  2689. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2690. sockfd = 20
  2691. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99078)
  2692. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2693. ret = 20
  2694. domain = 1
  2695. type = 1
  2696. protocol = 0
  2697. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2698. id() = 6db90f3d5a9dd200-40000-546a1de8(99079)
  2699. domain = 1
  2700. type = 1
  2701. protocol = 0
  2702. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2703. sockfd = 20
  2704. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99079)
  2705. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2706. virtualTid = 1635198781
  2707. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2708. ret = 18
  2709. domain = 1
  2710. type = 1
  2711. protocol = 0
  2712. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2713. id() = 6db90f3d5a9dd200-40000-546a1de8(99080)
  2714. domain = 1
  2715. type = 1
  2716. protocol = 0
  2717. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2718. sockfd = 18
  2719. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99080)
  2720. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2721. ret = 18
  2722. domain = 2
  2723. type = 1
  2724. protocol = 6
  2725. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2726. id() = 6db90f3d5a9dd200-40000-546a1de8(99082)
  2727. domain = 2
  2728. type = 1
  2729. protocol = 6
  2730. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2731. sockfd = 18
  2732. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99082)
  2733. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2734. ret = 19
  2735. domain = 1
  2736. type = 1
  2737. protocol = 0
  2738. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2739. id() = 6db90f3d5a9dd200-40000-546a1de8(99083)
  2740. domain = 1
  2741. type = 1
  2742. protocol = 0
  2743. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2744. sockfd = 19
  2745. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99083)
  2746. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2747. virtualTid = 0
  2748. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2749. ret = 19
  2750. domain = 1
  2751. type = 1
  2752. protocol = 0
  2753. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2754. id() = 6db90f3d5a9dd200-40000-546a1de8(99084)
  2755. domain = 1
  2756. type = 1
  2757. protocol = 0
  2758. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2759. sockfd = 19
  2760. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99084)
  2761. srun: Job step aborted: Waiting up to 2 seconds for job step to finish.
  2762. ^Csrun: interrupt (one more within 1 sec to abort)
  2763. srun: tasks 0-1: running
  2764. ^Csrun: sending Ctrl-C to job 107.0
  2765. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  2766. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  2767. tid = 6406
  2768. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  2769. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  2770. tid = 6407
  2771. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  2772. virtualTid = 40034
  2773. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  2774. th->tid = 6406
  2775. th->virtual_tid = 40034
  2776. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  2777. thread->tid = 6404
  2778. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  2779. thread->tid = 6404
  2780. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  2781. thread->tid = 6403
  2782. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  2783. thread->tid = 6403
  2784. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  2785. gettid() = 40034
  2786. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2787. ret = 18
  2788. domain = 2
  2789. type = 1
  2790. protocol = 6
  2791. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2792. id() = 6db90f3d5a9dd200-40000-546a1de8(99085)
  2793. domain = 2
  2794. type = 1
  2795. protocol = 6
  2796. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  2797. virtualTid = 40036
  2798. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  2799. th->tid = 6407
  2800. th->virtual_tid = 40036
  2801. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  2802. gettid() = 40036
  2803. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2804. ret = 19
  2805. domain = 2
  2806. type = 1
  2807. protocol = 6
  2808. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2809. id() = 6db90f3d5a9dd200-40000-546a1de8(99086)
  2810. domain = 2
  2811. type = 1
  2812. protocol = 6
  2813. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2814. sockfd = 18
  2815. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99085)
  2816. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2817. ret = 20
  2818. domain = 1
  2819. type = 1
  2820. protocol = 0
  2821. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2822. id() = 6db90f3d5a9dd200-40000-546a1de8(99087)
  2823. domain = 1
  2824. type = 1
  2825. protocol = 0
  2826. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2827. sockfd = 20
  2828. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99087)
  2829. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2830. sockfd = 19
  2831. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99086)
  2832. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2833. ret = 20
  2834. domain = 1
  2835. type = 1
  2836. protocol = 0
  2837. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2838. id() = 6db90f3d5a9dd200-40000-546a1de8(99088)
  2839. domain = 1
  2840. type = 1
  2841. protocol = 0
  2842. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2843. sockfd = 20
  2844. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99088)
  2845. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2846. ret = 20
  2847. domain = 1
  2848. type = 1
  2849. protocol = 0
  2850. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2851. id() = 6db90f3d5a9dd200-40000-546a1de8(99089)
  2852. domain = 1
  2853. type = 1
  2854. protocol = 0
  2855. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2856. sockfd = 20
  2857. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99089)
  2858. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2859. virtualTid = 40030
  2860. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2861. ret = 18
  2862. domain = 1
  2863. type = 1
  2864. protocol = 0
  2865. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2866. id() = 6db90f3d5a9dd200-40000-546a1de8(99090)
  2867. domain = 1
  2868. type = 1
  2869. protocol = 0
  2870. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2871. sockfd = 18
  2872. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99090)
  2873. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2874. virtualTid = 0
  2875. ^Csrun: forcing job termination
  2876. ^Csrun: job abort in progress
  2877. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2878. ret = 18
  2879. domain = 2
  2880. type = 1
  2881. protocol = 6
  2882. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2883. id() = 6db90f3d5a9dd200-40000-546a1de8(99092)
  2884. domain = 2
  2885. type = 1
  2886. protocol = 6
  2887. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2888. sockfd = 18
  2889. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99092)
  2890. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2891. ret = 19
  2892. domain = 1
  2893. type = 1
  2894. protocol = 0
  2895. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2896. id() = 6db90f3d5a9dd200-40000-546a1de8(99093)
  2897. domain = 1
  2898. type = 1
  2899. protocol = 0
  2900. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2901. sockfd = 19
  2902. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99093)
  2903. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2904. ret = 19
  2905. domain = 1
  2906. type = 1
  2907. protocol = 0
  2908. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2909. id() = 6db90f3d5a9dd200-40000-546a1de8(99094)
  2910. domain = 1
  2911. type = 1
  2912. protocol = 0
  2913. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2914. sockfd = 19
  2915. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99094)
  2916. ^C^C^C^C^C^C^C^C^C^C^C^C^C^Csrun: error: Timed out waiting for job step to complete
  2917. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2918. ret = 18
  2919. domain = 2
  2920. type = 1
  2921. protocol = 6
  2922. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2923. id() = 6db90f3d5a9dd200-40000-546a1de8(99096)
  2924. domain = 2
  2925. type = 1
  2926. protocol = 6
  2927. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2928. sockfd = 18
  2929. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99096)
  2930. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2931. ret = 19
  2932. domain = 1
  2933. type = 1
  2934. protocol = 0
  2935. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2936. id() = 6db90f3d5a9dd200-40000-546a1de8(99097)
  2937. domain = 1
  2938. type = 1
  2939. protocol = 0
  2940. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2941. sockfd = 19
  2942. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99097)
  2943. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2944. ret = 19
  2945. domain = 1
  2946. type = 1
  2947. protocol = 0
  2948. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2949. id() = 6db90f3d5a9dd200-40000-546a1de8(99098)
  2950. domain = 1
  2951. type = 1
  2952. protocol = 0
  2953. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2954. sockfd = 19
  2955. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99098)
  2956. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2957. virtualTid = 0
  2958. [40000] TRACE at pid_miscwrappers.cpp:158 in __clone; REASON='Calling libc:__clone'
  2959. [40000] TRACE at pid_miscwrappers.cpp:167 in __clone; REASON='New thread created'
  2960. tid = 6410
  2961. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2962. virtualTid = 0
  2963. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  2964. virtualTid = 0
  2965. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2966. ret = 0
  2967. domain = 2
  2968. type = 1
  2969. protocol = 6
  2970. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2971. id() = 6db90f3d5a9dd200-40000-546a1de8(99100)
  2972. domain = 2
  2973. type = 1
  2974. protocol = 6
  2975. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2976. sockfd = 0
  2977. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99100)
  2978. [40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  2979. ret = 4
  2980. domain = 1
  2981. type = 1
  2982. protocol = 0
  2983. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  2984. id() = 6db90f3d5a9dd200-40000-546a1de8(99101)
  2985. domain = 1
  2986. type = 1
  2987. protocol = 0
  2988. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  2989. sockfd = 4
  2990. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99101)
  2991. [40000] TRACE at pid_miscwrappers.cpp:118 in clone_start; REASON='Calling user function'
  2992. virtualTid = 40038
  2993. [40000] TRACE at threadlist.cpp:223 in updateTid; REASON='starting thread'
  2994. th->tid = 6410
  2995. th->virtual_tid = 40038
  2996. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  2997. thread->tid = 6407
  2998. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  2999. thread->tid = 6407
  3000. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  3001. thread->tid = 6406
  3002. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  3003. thread->tid = 6406
  3004. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  3005. thread->tid = 6378
  3006. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  3007. thread->tid = 6378
  3008. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  3009. thread->tid = 6377
  3010. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  3011. thread->tid = 6377
  3012. [40000] TRACE at threadlist.cpp:762 in addToActiveList; REASON='Killing zombie thread'
  3013. thread->tid = 6369
  3014. [40000] TRACE at threadlist.cpp:795 in threadIsDead; REASON='Putting thread on freelist'
  3015. thread->tid = 6369
  3016. [40000] TRACE at threadwrappers.cpp:66 in clone_start; REASON='Calling user function'
  3017. gettid() = 40038
  3018. ^Csrun: interrupt (abort already in progress)
  3019. srun: tasks 0-1: running
  3020. ^Csrun: job abort in progress
  3021. ^C[40000] TRACE at socketwrappers.cpp:59 in socket; REASON='socket created'
  3022. ret = 4
  3023. domain = 1
  3024. type = 1
  3025. protocol = 0
  3026. [40000] TRACE at socketconnection.cpp:195 in TcpConnection; REASON='Creating TcpConnection.'
  3027. id() = 6db90f3d5a9dd200-40000-546a1de8(99102)
  3028. domain = 1
  3029. type = 1
  3030. protocol = 0
  3031. [40000] TRACE at socketwrappers.cpp:121 in connect; REASON='connected'
  3032. sockfd = 4
  3033. con->id() = 6db90f3d5a9dd200-40000-546a1de8(99102)
  3034. [41000] TRACE at coordinatorapi.cpp:57 in dmtcp_CoordinatorAPI_EventHook; REASON='exit() in progress, disconnecting from dmtcp coordinator'
  3035. [41000] TRACE at threadlist.cpp:236 in killCkpthread; REASON='Kill checkpinthread'
  3036. ckptThread->tid = 6376
  3037. [40000] TRACE at threadwrappers.cpp:148 in pthread_start; REASON='Thread returned'
  3038. virtualTid = 8
  3039. [41000] TRACE at dmtcpworker.cpp:349 in cleanupWorker; REASON='disconnecting from dmtcp coordinator'
  3040. [40000] TRACE at dmtcpworker.cpp:349 in cleanupWorker; REASON='disconnecting from dmtcp coordinator'
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement