Advertisement
lamiastella

nan loss

Oct 16th, 2020 (edited)
175
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 2.22 MB | None | 0 0
  1. 1
  2.  
  3. network = Network()
  4.  
  5. 2
  6.  
  7. network.cuda()
  8.  
  9. 3
  10.  
  11.  
  12. 4
  13.  
  14. criterion = nn.MSELoss()
  15.  
  16. 5
  17.  
  18. optimizer = optim.Adam(network.parameters(), lr=0.0001)
  19.  
  20. 6
  21.  
  22.  
  23. 7
  24.  
  25. loss_min = np.inf
  26.  
  27. 8
  28.  
  29. num_epochs = 10
  30.  
  31. 9
  32.  
  33.  
  34. 10
  35.  
  36. start_time = time.time()
  37.  
  38. 11
  39.  
  40. for epoch in range(1,num_epochs+1):
  41.  
  42. 12
  43.  
  44.  
  45.  
  46. 13
  47.  
  48. loss_train = 0
  49.  
  50. 14
  51.  
  52. loss_test = 0
  53.  
  54. 15
  55.  
  56. running_loss = 0
  57.  
  58. 16
  59.  
  60.  
  61.  
  62. 17
  63.  
  64.  
  65.  
  66. 18
  67.  
  68. network.train()
  69.  
  70. 19
  71.  
  72. print('size of train loader is: ', len(train_loader))
  73.  
  74. 20
  75.  
  76.  
  77. 21
  78.  
  79. for step in range(1, len(train_loader)+1):
  80.  
  81. 22
  82.  
  83.  
  84. 23
  85.  
  86.  
  87.  
  88. 24
  89.  
  90. batch = next(iter(train_loader))
  91.  
  92. 25
  93.  
  94. images, landmarks = batch['image'], batch['landmarks']
  95.  
  96. 26
  97.  
  98. print(images.shape)
  99.  
  100. 27
  101.  
  102.  
  103.  
  104. 28
  105.  
  106. images = images.unsqueeze_(1)
  107.  
  108. 29
  109.  
  110.  
  111. 30
  112.  
  113. images = torch.cat((images,images,images),1)
  114.  
  115. 31
  116.  
  117. images = images.cuda()
  118.  
  119. 32
  120.  
  121.  
  122.  
  123. 33
  124.  
  125. landmarks = landmarks.view(landmarks.size(0),-1).cuda()
  126.  
  127. 34
  128.  
  129. norm_image = transforms.Normalize(0.3812, 0.1123)
  130.  
  131. 35
  132.  
  133. for image in images:
  134.  
  135. 36
  136.  
  137. image = image.float()
  138.  
  139. 37
  140.  
  141. ##image = to_tensor(image) #TypeError: pic should be PIL Image or ndarray. Got <class 'torch.Tensor'>
  142.  
  143. 38
  144.  
  145. image = norm_image(image)
  146.  
  147. 39
  148.  
  149.  
  150.  
  151. 40
  152.  
  153. ###removing landmarks normalize because of the following error
  154.  
  155. 41
  156.  
  157. ###ValueError: Expected tensor to be a tensor image of size (C, H, W). Got tensor.size() = torch.Size([8, 8])
  158.  
  159. 42
  160.  
  161.  
  162.  
  163. 43
  164.  
  165.  
  166.  
  167. 44
  168.  
  169. for i in range(8):
  170.  
  171. 45
  172.  
  173. if(i%2==0):
  174.  
  175. 46
  176.  
  177. landmarks[:,i] = landmarks[:,i]/800
  178.  
  179. 47
  180.  
  181. else:
  182.  
  183. 48
  184.  
  185. landmarks[:,i] = landmarks[:,i]/600
  186.  
  187. 49
  188.  
  189.  
  190.  
  191. 50
  192.  
  193. print(landmarks.shape)
  194.  
  195. 51
  196.  
  197. print(landmarks)
  198.  
  199. 52
  200.  
  201.  
  202.  
  203. 53
  204.  
  205.  
  206.  
  207. 54
  208.  
  209.  
  210. 55
  211.  
  212.  
  213.  
  214. 56
  215.  
  216. ##norm_landmarks = transforms.Normalize(0.4949, 0.2165)
  217.  
  218. 57
  219.  
  220. landmarks [landmarks != landmarks] = 0
  221.  
  222. 58
  223.  
  224. landmarks = landmarks.unsqueeze_(0)
  225.  
  226. 59
  227.  
  228. landmarks = norm_landmarks(landmarks)
  229.  
  230. 60
  231.  
  232.  
  233.  
  234. 61
  235.  
  236. predictions = network(images)
  237.  
  238. 62
  239.  
  240.  
  241.  
  242. 63
  243.  
  244. # clear all the gradients before calculating them
  245.  
  246. 64
  247.  
  248. optimizer.zero_grad()
  249.  
  250. 65
  251.  
  252.  
  253.  
  254. 66
  255.  
  256. print('predictions are: ', predictions.float())
  257.  
  258. 67
  259.  
  260. print('landmarks are: ', landmarks.float())
  261.  
  262. 68
  263.  
  264. # find the loss for the current step
  265.  
  266. 69
  267.  
  268. loss_train_step = criterion(predictions.float(), landmarks.float())
  269.  
  270. 70
  271.  
  272.  
  273.  
  274. 71
  275.  
  276.  
  277.  
  278. 72
  279.  
  280. loss_train_step = loss_train_step.to(torch.float32)
  281.  
  282. 73
  283.  
  284. print("loss_train_step before backward: ", loss_train_step)
  285.  
  286. 74
  287.  
  288.  
  289.  
  290. 75
  291.  
  292. # calculate the gradients
  293.  
  294. 76
  295.  
  296. loss_train_step.backward()
  297.  
  298. 77
  299.  
  300.  
  301.  
  302. 78
  303.  
  304. # update the parameters
  305.  
  306. 79
  307.  
  308. optimizer.step()
  309.  
  310. 80
  311.  
  312.  
  313.  
  314. 81
  315.  
  316. print("loss_train_step after backward: ", loss_train_step)
  317.  
  318. 82
  319.  
  320.  
  321. 83
  322.  
  323.  
  324.  
  325. 84
  326.  
  327. loss_train += loss_train_step.item()
  328.  
  329. 85
  330.  
  331.  
  332.  
  333. 86
  334.  
  335. print("loss_train: ", loss_train)
  336.  
  337. 87
  338.  
  339. running_loss = loss_train/step
  340.  
  341. 88
  342.  
  343. print('step: ', step)
  344.  
  345. 89
  346.  
  347. print('running loss: ', running_loss)
  348.  
  349. 90
  350.  
  351.  
  352.  
  353. 91
  354.  
  355. print_overwrite(step, len(train_loader), running_loss, 'train')
  356.  
  357. 92
  358.  
  359.  
  360.  
  361. 93
  362.  
  363. network.eval()
  364.  
  365. 94
  366.  
  367. with torch.no_grad():
  368.  
  369. 95
  370.  
  371.  
  372.  
  373. 96
  374.  
  375. for step in range(1,len(test_loader)+1):
  376.  
  377. 97
  378.  
  379.  
  380.  
  381. 98
  382.  
  383. batch = next(iter(train_loader))
  384.  
  385. 99
  386.  
  387. images, landmarks = batch['image'], batch['landmarks']
  388.  
  389. 100
  390.  
  391. images = images.cuda()
  392.  
  393. 101
  394.  
  395. landmarks = landmarks.view(landmarks.size(0),-1).cuda()
  396.  
  397. 102
  398.  
  399. ##[8, 600, 800] --> [8,3,600,800]
  400.  
  401. 103
  402.  
  403. images = images.unsqueeze(1)
  404.  
  405. 104
  406.  
  407. images = torch.cat((images, images, images), 1)
  408.  
  409. 105
  410.  
  411. predictions = network(images)
  412.  
  413. 106
  414.  
  415.  
  416. 107
  417.  
  418. # find the loss for the current step
  419.  
  420. 108
  421.  
  422. loss_test_step = criterion(predictions, landmarks)
  423.  
  424. 109
  425.  
  426.  
  427. 110
  428.  
  429. loss_test += loss_test_step.item()
  430.  
  431. 111
  432.  
  433. running_loss = loss_test/step
  434.  
  435. 112
  436.  
  437.  
  438. 113
  439.  
  440. print_overwrite(step, len(test_loader), running_loss, 'Validation')
  441.  
  442. 114
  443.  
  444.  
  445.  
  446. 115
  447.  
  448. loss_train /= len(train_loader)
  449.  
  450. 116
  451.  
  452. loss_test /= len(test_loader)
  453.  
  454. 117
  455.  
  456.  
  457.  
  458. 118
  459.  
  460. print('\n--------------------------------------------------')
  461.  
  462. 119
  463.  
  464. print('Epoch: {} Train Loss: {:.4f} Valid Loss: {:.4f}'.format(epoch, loss_train, loss_test))
  465.  
  466. 120
  467.  
  468. print('--------------------------------------------------')
  469.  
  470. 121
  471.  
  472.  
  473.  
  474. 122
  475.  
  476. if loss_test < loss_min:
  477.  
  478. 123
  479.  
  480. loss_min = loss_test
  481.  
  482. 124
  483.  
  484. torch.save(network.state_dict(), '../moth_landmarks.pth')
  485.  
  486. 125
  487.  
  488. print("\nMinimum Valid Loss of {:.4f} at epoch {}/{}".format(loss_min, epoch, num_epochs))
  489.  
  490. 126
  491.  
  492. print('Model Saved\n')
  493.  
  494. 127
  495.  
  496.  
  497.  
  498. 128
  499.  
  500. print('Training Complete')
  501.  
  502. 129
  503.  
  504. print("Total Elapsed Time : {} s".format(time.time()-start_time))
  505.  
  506. size of train loader is: 90
  507. torch.Size([8, 600, 800])
  508. torch.Size([8, 8])
  509. tensor([[0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  510. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  511. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  512. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  513. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  514. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  515. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  516. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165]],
  517. device='cuda:0', dtype=torch.float64)
  518. predictions are: tensor([[-0.1423, -0.1056, -0.3138, 0.4684, -0.1054, -0.5563, -0.0186, 0.1072],
  519. [-0.1047, -0.1028, -0.2962, 0.4469, -0.1573, -0.5332, -0.0197, 0.1038],
  520. [-0.1244, -0.0833, -0.2863, 0.4311, -0.1496, -0.4844, -0.0656, 0.0925],
  521. [-0.1570, -0.1024, -0.2959, 0.4236, -0.1198, -0.4870, -0.0458, 0.1049],
  522. [-0.1260, -0.1189, -0.3429, 0.4834, -0.1040, -0.5703, 0.0156, 0.0999],
  523. [-0.1380, -0.0681, -0.3151, 0.4013, -0.1561, -0.5097, -0.0721, 0.0928],
  524. [-0.1592, -0.1133, -0.2992, 0.4642, -0.1194, -0.5710, -0.0054, 0.0882],
  525. [-0.1140, -0.0634, -0.3053, 0.4357, -0.1321, -0.5395, -0.0382, 0.0839]],
  526. device='cuda:0', grad_fn=<AddmmBackward>)
  527. landmarks are: tensor([[[ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  528. 0.2083],
  529. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  530. 0.0802],
  531. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  532. -0.0168],
  533. [-2.2859, -2.2859, 0.7222, -1.4930, -0.3921, -1.3698, 0.1404,
  534. 0.1343],
  535. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  536. 0.1020],
  537. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  538. 0.1698],
  539. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  540. 0.2356],
  541. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  542. 0.1000]]], device='cuda:0')
  543. loss_train_step before backward: tensor(1.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  544. loss_train_step after backward: tensor(1.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  545. loss_train: 1.0104049444198608
  546. step: 1
  547. running loss: 1.0104049444198608
  548. Train Steps: 1/90 Loss: 1.0104 torch.Size([8, 600, 800])
  549. torch.Size([8, 8])
  550. tensor([[0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  551. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  552. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  553. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  554. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  555. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  556. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  557. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617]],
  558. device='cuda:0', dtype=torch.float64)
  559. predictions are: tensor([[-0.0659, -0.2580, 0.0962, 0.1213, -0.2025, -0.6994, 0.0772, 0.1072],
  560. [-0.0033, -0.2372, 0.0826, 0.1461, -0.1880, -0.6930, 0.0741, 0.1244],
  561. [-0.0202, -0.2130, 0.0678, 0.1583, -0.1568, -0.6912, 0.0771, 0.1296],
  562. [ 0.0287, -0.2443, 0.0870, 0.1132, -0.1829, -0.6959, 0.0773, 0.1000],
  563. [-0.0197, -0.2014, 0.0873, 0.1103, -0.1730, -0.6639, 0.0322, 0.1340],
  564. [-0.0283, -0.2539, 0.0533, 0.1278, -0.1841, -0.6857, 0.0922, 0.1333],
  565. [ 0.0008, -0.2950, 0.0865, 0.1903, -0.2152, -0.7125, 0.1525, 0.1757],
  566. [ 0.0252, -0.2935, 0.0619, 0.1467, -0.1725, -0.6754, 0.0774, 0.1400]],
  567. device='cuda:0', grad_fn=<AddmmBackward>)
  568. landmarks are: tensor([[[ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  569. 0.3692],
  570. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  571. 0.1322],
  572. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  573. 0.5401],
  574. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  575. 0.2142],
  576. [ 0.5432, -0.4224, 1.3284, -0.8540, -0.6866, -0.0226, 0.4077,
  577. 0.3177],
  578. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  579. 0.2699],
  580. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  581. 0.1082],
  582. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  583. 0.3084]]], device='cuda:0')
  584. loss_train_step before backward: tensor(0.5292, device='cuda:0', grad_fn=<MseLossBackward>)
  585. loss_train_step after backward: tensor(0.5292, device='cuda:0', grad_fn=<MseLossBackward>)
  586. loss_train: 1.539566159248352
  587. step: 2
  588. running loss: 0.769783079624176
  589. Train Steps: 2/90 Loss: 0.7698 torch.Size([8, 600, 800])
  590. torch.Size([8, 8])
  591. tensor([[0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  592. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  593. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  594. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  595. [0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  596. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  597. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  598. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585]],
  599. device='cuda:0', dtype=torch.float64)
  600. predictions are: tensor([[ 0.1696, -0.3065, 0.4627, -0.0944, -0.2657, -0.7406, 0.1930, 0.1774],
  601. [ 0.1604, -0.3258, 0.4616, -0.0499, -0.2615, -0.7130, 0.2208, 0.1799],
  602. [ 0.1484, -0.3291, 0.4707, -0.0997, -0.2455, -0.7404, 0.1867, 0.1688],
  603. [ 0.1728, -0.3067, 0.4303, -0.0530, -0.2103, -0.7886, 0.2801, 0.1768],
  604. [ 0.1909, -0.2937, 0.4370, -0.1293, -0.2625, -0.7441, 0.1705, 0.1318],
  605. [ 0.1561, -0.3214, 0.4482, -0.0593, -0.2596, -0.7309, 0.2042, 0.2013],
  606. [ 0.1806, -0.3209, 0.4534, -0.0854, -0.2666, -0.7370, 0.2352, 0.1802],
  607. [ 0.1912, -0.2630, 0.4746, -0.0326, -0.2686, -0.7027, 0.2144, 0.1895]],
  608. device='cuda:0', grad_fn=<AddmmBackward>)
  609. landmarks are: tensor([[[ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  610. 0.3050],
  611. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  612. 0.0764],
  613. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  614. 0.2391],
  615. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  616. 0.1020],
  617. [ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  618. 0.2699],
  619. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  620. 0.2634],
  621. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  622. -0.0220],
  623. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  624. 0.2936]]], device='cuda:0')
  625. loss_train_step before backward: tensor(0.3366, device='cuda:0', grad_fn=<MseLossBackward>)
  626. loss_train_step after backward: tensor(0.3366, device='cuda:0', grad_fn=<MseLossBackward>)
  627. loss_train: 1.8762048482894897
  628. step: 3
  629. running loss: 0.6254016160964966
  630. Train Steps: 3/90 Loss: 0.6254 torch.Size([8, 600, 800])
  631. torch.Size([8, 8])
  632. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  633. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  634. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  635. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  636. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  637. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  638. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  639. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222]],
  640. device='cuda:0', dtype=torch.float64)
  641. predictions are: tensor([[ 0.3182, -0.3804, 0.7228, -0.2070, -0.2713, -0.7219, 0.3276, 0.2051],
  642. [ 0.3052, -0.3400, 0.7528, -0.3017, -0.3315, -0.7304, 0.2778, 0.2039],
  643. [ 0.3572, -0.3411, 0.7817, -0.2362, -0.2603, -0.7317, 0.3130, 0.1719],
  644. [ 0.3135, -0.3787, 0.8097, -0.2249, -0.3170, -0.6919, 0.3421, 0.2800],
  645. [ 0.3222, -0.3184, 0.7258, -0.2893, -0.2752, -0.7587, 0.2927, 0.1911],
  646. [ 0.3452, -0.3446, 0.7560, -0.2866, -0.3250, -0.7399, 0.3119, 0.1912],
  647. [ 0.3920, -0.3923, 0.8089, -0.1643, -0.3038, -0.6605, 0.3647, 0.2397],
  648. [ 0.2950, -0.3404, 0.7301, -0.2619, -0.2894, -0.7364, 0.2727, 0.1653]],
  649. device='cuda:0', grad_fn=<AddmmBackward>)
  650. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  651. 0.0562],
  652. [ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  653. 0.1710],
  654. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  655. 0.3315],
  656. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  657. 0.1715],
  658. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  659. -0.0368],
  660. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  661. 0.1544],
  662. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  663. 0.3700],
  664. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  665. 0.5882]]], device='cuda:0')
  666. loss_train_step before backward: tensor(0.1705, device='cuda:0', grad_fn=<MseLossBackward>)
  667. loss_train_step after backward: tensor(0.1705, device='cuda:0', grad_fn=<MseLossBackward>)
  668. loss_train: 2.046713799238205
  669. step: 4
  670. running loss: 0.5116784498095512
  671.  
  672. Train Steps: 4/90 Loss: 0.5117 torch.Size([8, 600, 800])
  673. torch.Size([8, 8])
  674. tensor([[0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  675. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  676. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  677. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  678. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  679. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  680. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  681. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609]],
  682. device='cuda:0', dtype=torch.float64)
  683. predictions are: tensor([[ 0.4885, -0.4018, 1.0979, -0.3366, -0.3702, -0.6909, 0.3982, 0.2501],
  684. [ 0.4422, -0.3510, 1.0551, -0.4015, -0.3460, -0.7835, 0.3912, 0.2216],
  685. [ 0.4735, -0.3952, 1.0856, -0.3061, -0.3689, -0.6766, 0.3673, 0.2366],
  686. [ 0.4811, -0.3667, 1.0538, -0.3488, -0.3313, -0.6762, 0.3805, 0.2586],
  687. [ 0.4752, -0.3900, 1.0767, -0.3471, -0.3499, -0.7226, 0.3713, 0.2491],
  688. [ 0.4760, -0.4058, 1.0386, -0.4084, -0.3484, -0.8394, 0.4057, 0.2369],
  689. [ 0.4448, -0.3698, 1.0587, -0.4265, -0.3316, -0.8082, 0.3901, 0.2314],
  690. [ 0.4433, -0.3462, 1.0494, -0.4267, -0.3098, -0.7908, 0.3494, 0.1983]],
  691. device='cuda:0', grad_fn=<AddmmBackward>)
  692. landmarks are: tensor([[[ 6.3554e-01, -4.0805e-01, 1.6113e+00, 1.8522e-01, -4.7298e-01,
  693. 1.4673e-01, 9.9965e-01, 3.9055e-01],
  694. [-2.2859e+00, -2.2859e+00, 1.8423e+00, -9.6952e-01, -1.3233e-01,
  695. -8.4634e-01, 1.1349e+00, 2.6764e-01],
  696. [ 6.1184e-01, -3.9831e-01, 1.5824e+00, 3.4688e-01, -4.2679e-01,
  697. -6.8822e-02, 3.4688e-01, 5.3934e-01],
  698. [ 5.7079e-01, -4.0747e-01, 1.7961e+00, -2.3048e-01, -4.2102e-01,
  699. -9.9615e-02, 1.2187e-01, 8.9251e-02],
  700. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  701. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  702. [ 6.1264e-01, -4.0570e-01, 1.4439e+00, -1.3159e+00, -1.1501e-01,
  703. -1.5777e+00, 5.5366e-01, -5.2974e-02],
  704. [ 6.2072e-01, -3.9360e-01, 1.7788e+00, -1.1235e+00, 1.4480e-01,
  705. -1.0850e+00, 1.1459e+00, 1.9818e-01],
  706. [-2.2859e+00, -2.2859e+00, 1.8249e+00, -8.0015e-01, 4.0878e-02,
  707. -1.2543e+00, 8.0590e-01, 3.0505e-01]]], device='cuda:0')
  708. loss_train_step before backward: tensor(0.5289, device='cuda:0', grad_fn=<MseLossBackward>)
  709. loss_train_step after backward: tensor(0.5289, device='cuda:0', grad_fn=<MseLossBackward>)
  710. loss_train: 2.5755676329135895
  711. step: 5
  712. running loss: 0.5151135265827179
  713. Train Steps: 5/90 Loss: 0.5151 torch.Size([8, 600, 800])
  714. torch.Size([8, 8])
  715. tensor([[0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  716. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  717. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  718. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  719. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  720. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  721. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  722. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717]],
  723. device='cuda:0', dtype=torch.float64)
  724. predictions are: tensor([[ 0.5403, -0.4755, 1.3845, -0.3674, -0.3488, -0.6346, 0.4944, 0.2667],
  725. [ 0.4828, -0.5086, 1.3642, -0.3836, -0.3648, -0.6673, 0.4748, 0.2593],
  726. [ 0.4669, -0.4383, 1.3275, -0.4923, -0.3288, -0.8227, 0.5028, 0.2269],
  727. [ 0.4408, -0.4837, 1.3020, -0.5519, -0.3340, -0.8562, 0.4644, 0.2288],
  728. [ 0.4844, -0.4597, 1.3352, -0.3919, -0.3426, -0.6659, 0.4823, 0.2951],
  729. [ 0.5130, -0.4774, 1.3368, -0.4231, -0.3680, -0.7182, 0.4799, 0.2842],
  730. [ 0.4028, -0.4552, 1.2646, -0.5310, -0.3368, -0.8135, 0.4102, 0.2107],
  731. [ 0.4311, -0.4643, 1.2980, -0.5692, -0.2955, -0.8370, 0.4452, 0.2128]],
  732. device='cuda:0', grad_fn=<AddmmBackward>)
  733. landmarks are: tensor([[[ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  734. 0.3700],
  735. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  736. 0.0711],
  737. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  738. 0.2356],
  739. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  740. 0.1917],
  741. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  742. 0.0985],
  743. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  744. 0.2589],
  745. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  746. 0.4543],
  747. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  748. 0.3546]]], device='cuda:0')
  749. loss_train_step before backward: tensor(0.2597, device='cuda:0', grad_fn=<MseLossBackward>)
  750. loss_train_step after backward: tensor(0.2597, device='cuda:0', grad_fn=<MseLossBackward>)
  751. loss_train: 2.8352708220481873
  752. step: 6
  753. running loss: 0.4725451370080312
  754. Train Steps: 6/90 Loss: 0.4725 torch.Size([8, 600, 800])
  755. torch.Size([8, 8])
  756. tensor([[0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  757. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  758. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  759. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  760. [0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  761. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  762. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  763. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837]],
  764. device='cuda:0', dtype=torch.float64)
  765. predictions are: tensor([[ 0.4695, -0.5488, 1.5943, -0.4788, -0.3550, -0.6922, 0.5460, 0.2842],
  766. [ 0.4509, -0.5320, 1.5898, -0.3879, -0.3391, -0.6629, 0.5457, 0.2746],
  767. [ 0.4613, -0.5351, 1.5649, -0.4374, -0.3564, -0.6521, 0.5522, 0.2870],
  768. [ 0.3650, -0.5891, 1.4587, -0.6514, -0.3122, -0.8934, 0.5336, 0.2440],
  769. [ 0.4334, -0.5463, 1.5269, -0.4893, -0.3581, -0.7008, 0.5142, 0.2635],
  770. [ 0.3762, -0.5329, 1.4488, -0.6472, -0.3316, -0.8446, 0.5024, 0.2438],
  771. [ 0.4500, -0.5802, 1.5537, -0.4733, -0.2985, -0.6812, 0.5522, 0.2756],
  772. [ 0.3715, -0.5650, 1.4511, -0.6158, -0.3295, -0.7749, 0.4584, 0.2101]],
  773. device='cuda:0', grad_fn=<AddmmBackward>)
  774. landmarks are: tensor([[[ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  775. 0.0774],
  776. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  777. 0.0111],
  778. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  779. 0.1159],
  780. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  781. 0.0438],
  782. [ 0.5911, -0.4080, 1.6460, 0.3546, -0.2074, 0.0467, 0.4970,
  783. 0.1852],
  784. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  785. 0.0862],
  786. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  787. 0.2930],
  788. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  789. 0.4103]]], device='cuda:0')
  790. loss_train_step before backward: tensor(0.1155, device='cuda:0', grad_fn=<MseLossBackward>)
  791. loss_train_step after backward: tensor(0.1155, device='cuda:0', grad_fn=<MseLossBackward>)
  792. loss_train: 2.950811892747879
  793. step: 7
  794. running loss: 0.4215445561068399
  795. Train Steps: 7/90 Loss: 0.4215 torch.Size([8, 600, 800])
  796. torch.Size([8, 8])
  797. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  798. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  799. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  800. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950],
  801. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  802. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  803. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  804. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390]],
  805. device='cuda:0', dtype=torch.float64)
  806. predictions are: tensor([[ 0.3134, -0.6794, 1.6194, -0.7281, -0.3209, -0.8706, 0.5486, 0.2226],
  807. [ 0.3383, -0.6451, 1.6516, -0.6063, -0.3142, -0.8186, 0.5737, 0.2116],
  808. [ 0.2937, -0.6742, 1.6026, -0.7307, -0.3141, -0.8592, 0.5482, 0.2223],
  809. [ 0.4637, -0.6103, 1.7207, -0.4602, -0.3870, -0.5815, 0.5783, 0.2602],
  810. [ 0.4362, -0.6387, 1.6842, -0.5264, -0.3400, -0.6412, 0.5542, 0.2823],
  811. [ 0.5325, -0.5639, 1.7223, -0.4289, -0.3985, -0.5341, 0.5724, 0.2672],
  812. [ 0.4656, -0.5311, 1.6839, -0.4444, -0.3957, -0.5205, 0.5554, 0.2717],
  813. [ 0.4447, -0.5605, 1.6902, -0.5166, -0.4024, -0.6472, 0.5584, 0.2629]],
  814. device='cuda:0', grad_fn=<AddmmBackward>)
  815. landmarks are: tensor([[[ 5.7997e-01, -4.3118e-01, 1.5709e+00, -1.0311e+00, -4.4411e-01,
  816. -1.1081e+00, 3.8730e-01, 8.5142e-02],
  817. [-2.2859e+00, -2.2859e+00, 1.8192e+00, -8.5404e-01, 1.4480e-01,
  818. -9.8491e-01, 1.0143e+00, 4.8673e-01],
  819. [ 6.1742e-01, -3.9842e-01, 1.5975e+00, -9.9214e-01, -3.6328e-01,
  820. -9.9261e-01, 8.2047e-01, 2.0505e-01],
  821. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  822. 5.4350e-02, 4.9700e-01, 4.6189e-04],
  823. [ 6.1083e-01, -4.0082e-01, 1.9088e+00, -2.5294e-02, -5.7691e-01,
  824. -3.0747e-01, 7.9054e-01, 1.4989e-01],
  825. [ 6.5201e-01, -4.0564e-01, 1.9173e+00, -7.6520e-02, -5.5958e-01,
  826. -4.5373e-01, 7.9493e-01, 1.7680e-01],
  827. [ 5.6143e-01, -4.0323e-01, 1.7961e+00, -3.8445e-01, -5.7113e-01,
  828. 2.7760e-01, 5.9515e-01, 1.8522e-01],
  829. [ 6.5036e-01, -3.9360e-01, 1.8885e+00, -4.9222e-01, -3.4018e-01,
  830. -9.2333e-01, 8.0224e-01, 2.0352e-01]]], device='cuda:0')
  831. loss_train_step before backward: tensor(0.2142, device='cuda:0', grad_fn=<MseLossBackward>)
  832. loss_train_step after backward: tensor(0.2142, device='cuda:0', grad_fn=<MseLossBackward>)
  833. loss_train: 3.1650566458702087
  834. step: 8
  835. running loss: 0.3956320807337761
  836.  
  837. Train Steps: 8/90 Loss: 0.3956 torch.Size([8, 600, 800])
  838. torch.Size([8, 8])
  839. tensor([[0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  840. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  841. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  842. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  843. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  844. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  845. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  846. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217]],
  847. device='cuda:0', dtype=torch.float64)
  848. predictions are: tensor([[ 0.3986, -0.6094, 1.7731, -0.5675, -0.4028, -0.6541, 0.6191, 0.1876],
  849. [ 0.5058, -0.5929, 1.8639, -0.3546, -0.4482, -0.4050, 0.6035, 0.2369],
  850. [ 0.3617, -0.6422, 1.7939, -0.5044, -0.3761, -0.5660, 0.5857, 0.2077],
  851. [ 0.2151, -0.7175, 1.6810, -0.7442, -0.3176, -0.7890, 0.5508, 0.1978],
  852. [ 0.4400, -0.6495, 1.8597, -0.4622, -0.3749, -0.5228, 0.6240, 0.2258],
  853. [ 0.2712, -0.7017, 1.7019, -0.7678, -0.3379, -0.8403, 0.5856, 0.1985],
  854. [ 0.3907, -0.6001, 1.8238, -0.4108, -0.4309, -0.5027, 0.5874, 0.2351],
  855. [ 0.3679, -0.6428, 1.7431, -0.5741, -0.3706, -0.6884, 0.6126, 0.1843]],
  856. device='cuda:0', grad_fn=<AddmmBackward>)
  857. landmarks are: tensor([[[ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  858. 0.1214],
  859. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  860. 0.1608],
  861. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  862. 0.2853],
  863. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  864. 0.4008],
  865. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  866. -0.0099],
  867. [ 0.5999, -0.4236, 1.2880, -1.4083, -0.0630, -1.6393, 0.4584,
  868. -0.0208],
  869. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  870. 0.2545],
  871. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  872. 0.5855]]], device='cuda:0')
  873. loss_train_step before backward: tensor(0.1039, device='cuda:0', grad_fn=<MseLossBackward>)
  874. loss_train_step after backward: tensor(0.1039, device='cuda:0', grad_fn=<MseLossBackward>)
  875. loss_train: 3.268991008400917
  876. step: 9
  877. running loss: 0.36322122315565747
  878. Train Steps: 9/90 Loss: 0.3632 torch.Size([8, 600, 800])
  879. torch.Size([8, 8])
  880. tensor([[0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  881. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  882. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  883. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  884. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  885. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  886. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  887. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116]],
  888. device='cuda:0', dtype=torch.float64)
  889. predictions are: tensor([[ 0.4023, -0.5970, 1.8370, -0.4402, -0.3702, -0.4494, 0.5963, 0.2152],
  890. [ 0.2735, -0.7746, 1.8249, -0.7597, -0.3093, -0.8099, 0.6603, 0.1850],
  891. [ 0.3854, -0.6540, 1.8492, -0.5377, -0.3915, -0.5254, 0.5822, 0.1906],
  892. [ 0.3886, -0.5986, 1.8082, -0.5924, -0.3838, -0.5982, 0.6233, 0.1837],
  893. [ 0.3802, -0.6962, 1.8287, -0.5726, -0.3557, -0.6003, 0.5991, 0.2111],
  894. [ 0.4066, -0.6400, 1.8792, -0.4734, -0.3624, -0.4860, 0.6284, 0.1999],
  895. [ 0.4266, -0.5321, 1.8191, -0.5020, -0.4016, -0.4485, 0.5741, 0.2038],
  896. [ 0.3916, -0.6078, 1.8294, -0.5132, -0.4115, -0.4810, 0.5802, 0.2019]],
  897. device='cuda:0', grad_fn=<AddmmBackward>)
  898. landmarks are: tensor([[[ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  899. 0.0412],
  900. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  901. 0.1082],
  902. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  903. 0.2237],
  904. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  905. -0.0220],
  906. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  907. 0.0919],
  908. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  909. 0.1979],
  910. [ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  911. 0.1159],
  912. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  913. 0.0772]]], device='cuda:0')
  914. loss_train_step before backward: tensor(0.0941, device='cuda:0', grad_fn=<MseLossBackward>)
  915. loss_train_step after backward: tensor(0.0941, device='cuda:0', grad_fn=<MseLossBackward>)
  916. loss_train: 3.3630512952804565
  917. step: 10
  918. running loss: 0.33630512952804564
  919. Train Steps: 10/90 Loss: 0.3363 torch.Size([8, 600, 800])
  920. torch.Size([8, 8])
  921. tensor([[0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  922. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  923. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  924. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  925. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  926. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  927. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  928. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006]],
  929. device='cuda:0', dtype=torch.float64)
  930. predictions are: tensor([[ 0.4281, -0.6018, 1.9033, -0.4220, -0.3854, -0.3424, 0.6084, 0.1981],
  931. [ 0.4875, -0.5669, 1.9027, -0.3804, -0.4182, -0.3505, 0.6296, 0.1911],
  932. [ 0.3455, -0.6332, 1.7253, -0.7356, -0.3643, -0.6066, 0.5329, 0.1503],
  933. [ 0.3817, -0.6205, 1.8508, -0.5359, -0.3424, -0.4687, 0.5927, 0.1690],
  934. [ 0.4571, -0.5370, 1.8616, -0.5107, -0.3985, -0.4145, 0.6011, 0.1742],
  935. [ 0.5165, -0.5026, 1.9352, -0.3225, -0.4410, -0.2379, 0.6228, 0.1941],
  936. [ 0.2141, -0.7852, 1.7427, -0.8960, -0.2852, -0.8919, 0.6142, 0.1452],
  937. [ 0.5665, -0.5681, 1.9401, -0.3287, -0.4210, -0.2708, 0.6404, 0.1673]],
  938. device='cuda:0', grad_fn=<AddmmBackward>)
  939. landmarks are: tensor([[[ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  940. 0.0622],
  941. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  942. 0.3007],
  943. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  944. 0.4103],
  945. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  946. 0.2853],
  947. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  948. 0.2365],
  949. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  950. 0.1715],
  951. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  952. 0.0051],
  953. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  954. 0.0261]]], device='cuda:0')
  955. loss_train_step before backward: tensor(0.0903, device='cuda:0', grad_fn=<MseLossBackward>)
  956. loss_train_step after backward: tensor(0.0903, device='cuda:0', grad_fn=<MseLossBackward>)
  957. loss_train: 3.453396238386631
  958. step: 11
  959. running loss: 0.3139451125806028
  960. Train Steps: 11/90 Loss: 0.3139 torch.Size([8, 600, 800])
  961. torch.Size([8, 8])
  962. tensor([[0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  963. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175],
  964. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  965. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  966. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  967. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  968. [0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  969. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350]],
  970. device='cuda:0', dtype=torch.float64)
  971. predictions are: tensor([[ 0.3583, -0.6343, 1.7170, -0.7579, -0.3092, -0.6544, 0.5731, 0.1568],
  972. [ 0.3602, -0.6007, 1.7199, -0.7404, -0.3476, -0.6163, 0.5342, 0.1324],
  973. [ 0.5714, -0.4951, 1.9335, -0.2031, -0.4453, -0.1089, 0.6063, 0.1638],
  974. [ 0.6233, -0.4319, 1.9334, -0.2226, -0.4486, -0.0354, 0.5995, 0.1807],
  975. [ 0.4814, -0.5525, 1.8654, -0.3785, -0.4045, -0.2285, 0.5742, 0.1675],
  976. [ 0.4247, -0.6203, 1.7907, -0.5895, -0.3542, -0.4821, 0.5728, 0.1632],
  977. [ 0.4121, -0.5504, 1.7687, -0.6334, -0.3926, -0.4873, 0.5501, 0.1550],
  978. [ 0.5594, -0.5201, 1.9404, -0.2369, -0.3908, -0.1411, 0.6089, 0.1694]],
  979. device='cuda:0', grad_fn=<AddmmBackward>)
  980. landmarks are: tensor([[[ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  981. 0.2442],
  982. [ 0.5465, -0.4214, 0.9300, -1.2620, -0.3921, -1.3852, 0.2062,
  983. 0.1043],
  984. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  985. -0.1385],
  986. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  987. 0.0985],
  988. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  989. 0.2138],
  990. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  991. 0.4470],
  992. [ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  993. 0.3808],
  994. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  995. 0.1854]]], device='cuda:0')
  996. loss_train_step before backward: tensor(0.1143, device='cuda:0', grad_fn=<MseLossBackward>)
  997. loss_train_step after backward: tensor(0.1143, device='cuda:0', grad_fn=<MseLossBackward>)
  998. loss_train: 3.5676762238144875
  999. step: 12
  1000. running loss: 0.29730635198454064
  1001.  
  1002. Train Steps: 12/90 Loss: 0.2973 torch.Size([8, 600, 800])
  1003. torch.Size([8, 8])
  1004. tensor([[0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  1005. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  1006. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  1007. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090],
  1008. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  1009. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  1010. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  1011. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967]],
  1012. device='cuda:0', dtype=torch.float64)
  1013. predictions are: tensor([[ 0.5343, -0.4726, 1.7997, -0.3158, -0.3930, -0.2037, 0.5199, 0.1621],
  1014. [ 0.5070, -0.4471, 1.7056, -0.5312, -0.4011, -0.3798, 0.4930, 0.1416],
  1015. [ 0.5230, -0.4723, 1.8404, -0.3098, -0.4120, -0.1843, 0.5487, 0.1675],
  1016. [ 0.5441, -0.4712, 1.8092, -0.4498, -0.4106, -0.3381, 0.5668, 0.1592],
  1017. [ 0.5783, -0.4525, 1.8416, -0.2854, -0.3991, -0.1710, 0.5524, 0.1664],
  1018. [ 0.4761, -0.5077, 1.7601, -0.4455, -0.3867, -0.3223, 0.5207, 0.1484],
  1019. [ 0.4512, -0.5921, 1.7266, -0.6192, -0.3187, -0.5162, 0.4994, 0.1540],
  1020. [ 0.5362, -0.4790, 1.8213, -0.3137, -0.4172, -0.1955, 0.5498, 0.1414]],
  1021. device='cuda:0', grad_fn=<AddmmBackward>)
  1022. landmarks are: tensor([[[ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  1023. 0.3238],
  1024. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  1025. 0.1159],
  1026. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  1027. 0.3238],
  1028. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  1029. 0.0652],
  1030. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  1031. 0.2091],
  1032. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  1033. 0.2997],
  1034. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  1035. 0.5624],
  1036. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  1037. 0.0082]]], device='cuda:0')
  1038. loss_train_step before backward: tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward>)
  1039. loss_train_step after backward: tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward>)
  1040. loss_train: 3.626456379890442
  1041. step: 13
  1042. running loss: 0.2789581830684955
  1043. Train Steps: 13/90 Loss: 0.2790 torch.Size([8, 600, 800])
  1044. torch.Size([8, 8])
  1045. tensor([[0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  1046. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  1047. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  1048. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  1049. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  1050. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  1051. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  1052. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402]],
  1053. device='cuda:0', dtype=torch.float64)
  1054. predictions are: tensor([[ 0.3386, -0.5945, 1.4882, -0.8442, -0.2679, -0.8243, 0.4488, 0.1746],
  1055. [ 0.6488, -0.4722, 1.7840, -0.1984, -0.4139, -0.1456, 0.5088, 0.2118],
  1056. [ 0.6712, -0.3812, 1.7589, -0.1449, -0.4616, -0.0147, 0.4819, 0.1966],
  1057. [ 0.5852, -0.3525, 1.7167, -0.2342, -0.4497, -0.0917, 0.4490, 0.1965],
  1058. [ 0.6722, -0.3628, 1.7972, -0.1442, -0.4551, -0.0454, 0.5214, 0.2173],
  1059. [ 0.6903, -0.3728, 1.7680, -0.1855, -0.4479, -0.0402, 0.4770, 0.2045],
  1060. [ 0.4033, -0.5384, 1.5374, -0.7993, -0.3055, -0.7459, 0.4317, 0.1558],
  1061. [ 0.5944, -0.3282, 1.7185, -0.2286, -0.4429, -0.0724, 0.4695, 0.1935]],
  1062. device='cuda:0', grad_fn=<AddmmBackward>)
  1063. landmarks are: tensor([[[ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  1064. 0.2043],
  1065. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  1066. 0.1390],
  1067. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  1068. 0.5239],
  1069. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  1070. 0.3478],
  1071. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  1072. 0.3546],
  1073. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  1074. 0.3161],
  1075. [ 0.5798, -0.4156, 1.3977, -1.0388, -0.4672, -1.1004, 0.3469,
  1076. 0.1082],
  1077. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  1078. 0.2093]]], device='cuda:0')
  1079. loss_train_step before backward: tensor(0.0389, device='cuda:0', grad_fn=<MseLossBackward>)
  1080. loss_train_step after backward: tensor(0.0389, device='cuda:0', grad_fn=<MseLossBackward>)
  1081. loss_train: 3.6653256751596928
  1082. step: 14
  1083. running loss: 0.2618089767971209
  1084. Train Steps: 14/90 Loss: 0.2618 torch.Size([8, 600, 800])
  1085. torch.Size([8, 8])
  1086. tensor([[0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  1087. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  1088. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  1089. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  1090. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  1091. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  1092. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  1093. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901]],
  1094. device='cuda:0', dtype=torch.float64)
  1095. predictions are: tensor([[ 0.6552, -0.3837, 1.7376, -0.1305, -0.4385, -0.1260, 0.4828, 0.2422],
  1096. [ 0.5077, -0.4758, 1.5026, -0.5479, -0.3470, -0.5731, 0.4024, 0.2062],
  1097. [ 0.6341, -0.3702, 1.6776, -0.1107, -0.4211, -0.0452, 0.4231, 0.2498],
  1098. [ 0.6070, -0.3405, 1.5338, -0.4015, -0.4672, -0.2579, 0.4081, 0.2168],
  1099. [ 0.8312, -0.2328, 1.8114, 0.1777, -0.5426, 0.2986, 0.4698, 0.2533],
  1100. [ 0.7075, -0.2959, 1.7456, 0.0659, -0.5056, 0.1518, 0.4310, 0.2443],
  1101. [ 0.4628, -0.4883, 1.4341, -0.7040, -0.3237, -0.7027, 0.4005, 0.2153],
  1102. [ 0.4701, -0.4907, 1.4618, -0.6527, -0.3600, -0.6216, 0.3729, 0.2062]],
  1103. device='cuda:0', grad_fn=<AddmmBackward>)
  1104. landmarks are: tensor([[[ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  1105. 0.4386],
  1106. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  1107. 0.1494],
  1108. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  1109. 0.2853],
  1110. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  1111. 0.2699],
  1112. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  1113. 0.1005],
  1114. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  1115. 0.1982],
  1116. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  1117. 0.2032],
  1118. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  1119. -0.0220]]], device='cuda:0')
  1120. loss_train_step before backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  1121. loss_train_step after backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  1122. loss_train: 3.729193616658449
  1123. step: 15
  1124. running loss: 0.24861290777722994
  1125. Train Steps: 15/90 Loss: 0.2486 torch.Size([8, 600, 800])
  1126. torch.Size([8, 8])
  1127. tensor([[0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  1128. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  1129. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  1130. [0.6277, 0.4083, 0.8350, 0.2717, 0.4562, 0.1800, 0.5918, 0.4878],
  1131. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  1132. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  1133. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  1134. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136]],
  1135. device='cuda:0', dtype=torch.float64)
  1136. predictions are: tensor([[ 0.8263, -0.1902, 1.7374, 0.2545, -0.5898, 0.3922, 0.4587, 0.2920],
  1137. [ 0.8305, -0.2324, 1.7869, 0.3114, -0.5759, 0.3759, 0.4640, 0.2764],
  1138. [ 0.5266, -0.4159, 1.3851, -0.5850, -0.3763, -0.5650, 0.3748, 0.2421],
  1139. [ 0.4363, -0.4686, 1.3255, -0.7476, -0.3138, -0.7884, 0.3587, 0.2176],
  1140. [ 0.7096, -0.3306, 1.6011, -0.1989, -0.4514, -0.1596, 0.4091, 0.2694],
  1141. [ 0.5078, -0.4304, 1.3690, -0.6331, -0.3530, -0.6531, 0.3775, 0.2460],
  1142. [ 0.5176, -0.3927, 1.3475, -0.6248, -0.3892, -0.6089, 0.3561, 0.2448],
  1143. [ 0.6879, -0.3213, 1.6219, -0.0797, -0.4829, -0.0799, 0.4250, 0.2820]],
  1144. device='cuda:0', grad_fn=<AddmmBackward>)
  1145. landmarks are: tensor([[[ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  1146. 0.2545],
  1147. [ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  1148. 0.1447],
  1149. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  1150. 0.3007],
  1151. [ 0.6132, -0.4002, 1.5709, -1.0311, -0.1785, -1.4545, 0.4474,
  1152. -0.0328],
  1153. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  1154. 0.3315],
  1155. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  1156. 0.2549],
  1157. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  1158. 0.1343],
  1159. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  1160. 0.0862]]], device='cuda:0')
  1161. loss_train_step before backward: tensor(0.2667, device='cuda:0', grad_fn=<MseLossBackward>)
  1162. loss_train_step after backward: tensor(0.2667, device='cuda:0', grad_fn=<MseLossBackward>)
  1163. loss_train: 3.9958606250584126
  1164. step: 16
  1165. running loss: 0.24974128906615078
  1166.  
  1167. Train Steps: 16/90 Loss: 0.2497 torch.Size([8, 600, 800])
  1168. torch.Size([8, 8])
  1169. tensor([[0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  1170. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  1171. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  1172. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  1173. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  1174. [0.6161, 0.4099, 0.8738, 0.4383, 0.3788, 0.5483, 0.5605, 0.5019],
  1175. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  1176. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683]],
  1177. device='cuda:0', dtype=torch.float64)
  1178. predictions are: tensor([[ 0.5092, -0.4276, 1.2993, -0.6912, -0.3900, -0.7287, 0.3428, 0.2390],
  1179. [ 0.4638, -0.5024, 1.3391, -0.7674, -0.3217, -0.9413, 0.3813, 0.2378],
  1180. [ 0.7581, -0.2839, 1.6582, 0.2064, -0.5467, 0.2310, 0.4485, 0.2857],
  1181. [ 0.6093, -0.3809, 1.5054, -0.2810, -0.4603, -0.3393, 0.3837, 0.2761],
  1182. [ 0.7945, -0.2427, 1.6784, 0.1989, -0.5599, 0.2828, 0.4505, 0.2914],
  1183. [ 0.6689, -0.2769, 1.5637, 0.0263, -0.5515, 0.1618, 0.3862, 0.2881],
  1184. [ 0.5313, -0.4060, 1.3328, -0.6785, -0.4032, -0.7108, 0.3818, 0.2442],
  1185. [ 0.5118, -0.4049, 1.3256, -0.6318, -0.4154, -0.6396, 0.3457, 0.2628]],
  1186. device='cuda:0', grad_fn=<AddmmBackward>)
  1187. landmarks are: tensor([[[ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  1188. 0.2906],
  1189. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  1190. -0.0209],
  1191. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  1192. 0.4624],
  1193. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  1194. 0.0862],
  1195. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  1196. 0.0985],
  1197. [ 0.5597, -0.3928, 1.7499, -0.2613, -0.5365, 0.2468, 0.3028,
  1198. 0.0321],
  1199. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  1200. 0.2083],
  1201. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  1202. 0.3392]]], device='cuda:0')
  1203. loss_train_step before backward: tensor(0.0752, device='cuda:0', grad_fn=<MseLossBackward>)
  1204. loss_train_step after backward: tensor(0.0752, device='cuda:0', grad_fn=<MseLossBackward>)
  1205. loss_train: 4.071053955703974
  1206. step: 17
  1207. running loss: 0.23947376210023374
  1208. Train Steps: 17/90 Loss: 0.2395 torch.Size([8, 600, 800])
  1209. torch.Size([8, 8])
  1210. tensor([[0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  1211. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  1212. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  1213. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  1214. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  1215. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  1216. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  1217. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600]],
  1218. device='cuda:0', dtype=torch.float64)
  1219. predictions are: tensor([[ 0.6578, -0.3683, 1.5521, -0.1059, -0.4751, -0.2149, 0.4410, 0.2723],
  1220. [ 0.5114, -0.4456, 1.2885, -0.7996, -0.3856, -0.9587, 0.4281, 0.2349],
  1221. [ 0.5884, -0.3397, 1.3325, -0.5015, -0.4970, -0.4707, 0.4000, 0.2406],
  1222. [ 0.6309, -0.3858, 1.5195, -0.1167, -0.5022, -0.1658, 0.3629, 0.2780],
  1223. [ 0.5000, -0.4365, 1.3342, -0.7227, -0.3862, -0.8498, 0.3772, 0.2283],
  1224. [ 0.5706, -0.3431, 1.3098, -0.5633, -0.5075, -0.5184, 0.3733, 0.2563],
  1225. [ 0.5632, -0.3163, 1.3676, -0.3814, -0.5250, -0.3097, 0.3615, 0.2432],
  1226. [ 0.5914, -0.3618, 1.5231, -0.0976, -0.4550, -0.1584, 0.4225, 0.2744]],
  1227. device='cuda:0', grad_fn=<AddmmBackward>)
  1228. landmarks are: tensor([[[ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  1229. 0.1544],
  1230. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  1231. -0.0530],
  1232. [ 0.5477, -0.4413, 1.3688, -0.8771, -0.6115, -0.8771, 0.4104,
  1233. 0.0467],
  1234. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  1235. 0.2409],
  1236. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  1237. 0.1005],
  1238. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  1239. 0.0622],
  1240. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  1241. 0.2386],
  1242. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  1243. 0.3007]]], device='cuda:0')
  1244. loss_train_step before backward: tensor(0.0491, device='cuda:0', grad_fn=<MseLossBackward>)
  1245. loss_train_step after backward: tensor(0.0491, device='cuda:0', grad_fn=<MseLossBackward>)
  1246. loss_train: 4.120140295475721
  1247. step: 18
  1248. running loss: 0.22889668308198452
  1249. Train Steps: 18/90 Loss: 0.2289 torch.Size([8, 600, 800])
  1250. torch.Size([8, 8])
  1251. tensor([[0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  1252. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  1253. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  1254. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  1255. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  1256. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  1257. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  1258. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550]],
  1259. device='cuda:0', dtype=torch.float64)
  1260. predictions are: tensor([[ 0.6256, -0.3496, 1.5313, -0.1727, -0.4812, -0.2339, 0.4121, 0.2335],
  1261. [ 0.5802, -0.3599, 1.4961, -0.1003, -0.4505, -0.1714, 0.3991, 0.2416],
  1262. [ 0.6846, -0.3257, 1.6299, 0.1926, -0.5661, 0.1919, 0.4176, 0.2676],
  1263. [ 0.4458, -0.4585, 1.2494, -0.8908, -0.3609, -1.0730, 0.3473, 0.1982],
  1264. [ 0.4966, -0.3877, 1.1893, -0.8811, -0.4293, -0.9376, 0.3631, 0.2087],
  1265. [ 0.6634, -0.3550, 1.5272, -0.1704, -0.4972, -0.2177, 0.3968, 0.2328],
  1266. [ 0.4826, -0.3862, 1.2012, -0.8707, -0.4220, -0.9600, 0.3600, 0.1954],
  1267. [ 0.4057, -0.4449, 1.1502, -0.9486, -0.3773, -1.0787, 0.3214, 0.1925]],
  1268. device='cuda:0', grad_fn=<AddmmBackward>)
  1269. landmarks are: tensor([[[ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  1270. 0.3161],
  1271. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  1272. 0.1082],
  1273. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  1274. 0.1082],
  1275. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  1276. 0.0021],
  1277. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  1278. 0.0802],
  1279. [ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  1280. 0.5239],
  1281. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  1282. 0.3007],
  1283. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  1284. 0.2776]]], device='cuda:0')
  1285. loss_train_step before backward: tensor(0.0405, device='cuda:0', grad_fn=<MseLossBackward>)
  1286. loss_train_step after backward: tensor(0.0405, device='cuda:0', grad_fn=<MseLossBackward>)
  1287. loss_train: 4.160642504692078
  1288. step: 19
  1289. running loss: 0.21898118445747777
  1290. Train Steps: 19/90 Loss: 0.2190 torch.Size([8, 600, 800])
  1291. torch.Size([8, 8])
  1292. tensor([[0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  1293. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  1294. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  1295. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  1296. [0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  1297. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  1298. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  1299. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383]],
  1300. device='cuda:0', dtype=torch.float64)
  1301. predictions are: tensor([[ 0.4995, -0.4501, 1.2798, -0.9045, -0.3884, -1.1201, 0.3507, 0.1686],
  1302. [ 0.5374, -0.3718, 1.3481, -0.4737, -0.4760, -0.4540, 0.3643, 0.2129],
  1303. [ 0.5177, -0.4185, 1.3734, -0.5420, -0.4201, -0.6426, 0.3885, 0.1762],
  1304. [ 0.5296, -0.4432, 1.3546, -0.6588, -0.4503, -0.7486, 0.3094, 0.1954],
  1305. [ 0.5990, -0.3650, 1.4727, -0.2500, -0.4999, -0.2574, 0.3996, 0.2076],
  1306. [ 0.5845, -0.3787, 1.4616, -0.2690, -0.4853, -0.3027, 0.3903, 0.1992],
  1307. [ 0.5524, -0.3988, 1.3570, -0.6329, -0.4578, -0.6935, 0.3651, 0.1924],
  1308. [ 0.4944, -0.4201, 1.3606, -0.5418, -0.4362, -0.6470, 0.3477, 0.1965]],
  1309. device='cuda:0', grad_fn=<AddmmBackward>)
  1310. landmarks are: tensor([[[ 5.2355e-01, -4.2731e-01, 1.7499e+00, -4.3064e-01, -5.8268e-01,
  1311. -4.6143e-01, 1.6505e-01, 8.6245e-02],
  1312. [ 5.5456e-01, -4.6205e-01, 1.7788e+00, -4.2294e-01, -5.1917e-01,
  1313. -2.2633e-02, 4.2771e-01, 2.4681e-01],
  1314. [ 5.9988e-01, -3.5304e-01, 1.6402e+00, 3.7768e-01, -2.2471e-01,
  1315. -1.8430e-01, 3.0647e-01, 4.4696e-01],
  1316. [ 5.5525e-01, -3.9923e-01, 1.7557e+00, -2.6898e-01, -4.9030e-01,
  1317. -2.6898e-01, 5.4227e-02, 4.1446e-01],
  1318. [ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  1319. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  1320. [ 5.9082e-01, -4.3664e-01, 1.7557e+00, 1.3903e-01, -5.1917e-01,
  1321. 1.3133e-01, 6.5289e-01, 2.3557e-02],
  1322. [ 5.3839e-01, -4.3610e-01, 1.7961e+00, -4.9992e-01, -5.4804e-01,
  1323. -1.1501e-01, 3.9307e-01, 2.7760e-01],
  1324. [ 5.6637e-01, -4.3212e-01, 1.8249e+00, -2.0739e-01, -2.6513e-01,
  1325. 4.1617e-01, 5.6628e-01, 2.0062e-01]]], device='cuda:0')
  1326. loss_train_step before backward: tensor(0.0984, device='cuda:0', grad_fn=<MseLossBackward>)
  1327. loss_train_step after backward: tensor(0.0984, device='cuda:0', grad_fn=<MseLossBackward>)
  1328. loss_train: 4.259060598909855
  1329. step: 20
  1330. running loss: 0.21295302994549276
  1331.  
  1332. Train Steps: 20/90 Loss: 0.2130 torch.Size([8, 600, 800])
  1333. torch.Size([8, 8])
  1334. tensor([[0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  1335. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  1336. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  1337. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  1338. [0.6339, 0.4102, 0.8588, 0.3133, 0.4425, 0.2117, 0.6417, 0.5089],
  1339. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  1340. [0.6289, 0.4024, 0.9088, 0.4567, 0.3937, 0.5633, 0.7058, 0.5609],
  1341. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683]],
  1342. device='cuda:0', dtype=torch.float64)
  1343. predictions are: tensor([[ 0.4723, -0.4247, 1.1850, -0.9063, -0.4518, -0.8865, 0.2939, 0.1639],
  1344. [ 0.5025, -0.3635, 1.3192, -0.5956, -0.5070, -0.4938, 0.3355, 0.1808],
  1345. [ 0.4405, -0.4470, 1.2356, -1.0312, -0.3698, -1.2157, 0.3035, 0.1463],
  1346. [ 0.3921, -0.5284, 1.1823, -1.2778, -0.2926, -1.5964, 0.2982, 0.1206],
  1347. [ 0.5190, -0.3989, 1.3849, -0.7171, -0.4370, -0.7962, 0.4063, 0.1556],
  1348. [ 0.6043, -0.3868, 1.5303, -0.0823, -0.4990, -0.1121, 0.3608, 0.1888],
  1349. [ 0.6078, -0.3671, 1.6489, 0.1029, -0.5688, 0.1931, 0.3999, 0.2117],
  1350. [ 0.5852, -0.4089, 1.5890, -0.1718, -0.4224, -0.2408, 0.3769, 0.1869]],
  1351. device='cuda:0', grad_fn=<AddmmBackward>)
  1352. landmarks are: tensor([[[ 5.3591e-01, -4.1932e-01, 9.3580e-01, -8.2325e-01, -6.6351e-01,
  1353. -7.2317e-01, 9.4325e-02, 1.7099e-01],
  1354. [ 5.7633e-01, -4.1470e-01, 1.3226e+00, -1.0619e+00, -6.6351e-01,
  1355. -4.1524e-01, 5.3741e-01, 2.5450e-01],
  1356. [ 5.9151e-01, -3.6821e-01, 1.2187e+00, -1.2313e+00, -4.3256e-01,
  1357. -9.5412e-01, 5.7783e-01, 3.7768e-01],
  1358. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  1359. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  1360. [ 6.4212e-01, -3.9120e-01, 1.6806e+00, -8.3865e-01, -2.4203e-01,
  1361. -1.3082e+00, 6.7795e-01, 6.4585e-02],
  1362. [ 6.2361e-01, -4.3441e-01, 1.6171e+00, 1.8522e-01, -3.4018e-01,
  1363. 2.3557e-02, 6.4711e-01, 6.9746e-02],
  1364. [ 6.1907e-01, -4.2731e-01, 1.9115e+00, -1.7660e-01, -4.6721e-01,
  1365. 3.1609e-01, 9.7406e-01, 3.0505e-01],
  1366. [ 5.3585e-01, -4.3703e-01, 1.7095e+00, -3.0331e-02, -8.0370e-02,
  1367. -3.8029e-02, 1.0439e-01, 3.3918e-01]]], device='cuda:0')
  1368. loss_train_step before backward: tensor(0.0438, device='cuda:0', grad_fn=<MseLossBackward>)
  1369. loss_train_step after backward: tensor(0.0438, device='cuda:0', grad_fn=<MseLossBackward>)
  1370. loss_train: 4.30288702994585
  1371. step: 21
  1372. running loss: 0.20489938237837382
  1373. Train Steps: 21/90 Loss: 0.2049 torch.Size([8, 600, 800])
  1374. torch.Size([8, 8])
  1375. tensor([[0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  1376. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  1377. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  1378. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  1379. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  1380. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  1381. [0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  1382. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869]],
  1383. device='cuda:0', dtype=torch.float64)
  1384. predictions are: tensor([[ 0.4667, -0.4029, 1.2225, -0.9475, -0.4710, -0.9117, 0.3017, 0.1536],
  1385. [ 0.4264, -0.4826, 1.3187, -1.0577, -0.3452, -1.2749, 0.3562, 0.1209],
  1386. [ 0.5903, -0.3429, 1.5855, -0.0366, -0.5336, 0.1025, 0.4147, 0.1930],
  1387. [ 0.5301, -0.4158, 1.5460, -0.2706, -0.4314, -0.2919, 0.3681, 0.1735],
  1388. [ 0.5612, -0.3537, 1.6040, 0.0042, -0.5038, 0.1165, 0.3997, 0.1812],
  1389. [ 0.5596, -0.3945, 1.5997, -0.1237, -0.4685, -0.0593, 0.3873, 0.1867],
  1390. [ 0.4114, -0.4599, 1.1883, -1.2378, -0.3738, -1.3679, 0.2803, 0.1201],
  1391. [ 0.4364, -0.4916, 1.2448, -1.2068, -0.3356, -1.4575, 0.3233, 0.1142]],
  1392. device='cuda:0', grad_fn=<AddmmBackward>)
  1393. landmarks are: tensor([[[ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  1394. 0.2391],
  1395. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  1396. 0.2944],
  1397. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  1398. 0.1608],
  1399. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  1400. 0.3806],
  1401. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  1402. 0.3777],
  1403. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  1404. 0.2699],
  1405. [ 0.5707, -0.4189, 1.2707, -1.2467, -0.4095, -1.3082, 0.3758,
  1406. 0.0928],
  1407. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  1408. -0.0369]]], device='cuda:0')
  1409. loss_train_step before backward: tensor(0.0400, device='cuda:0', grad_fn=<MseLossBackward>)
  1410. loss_train_step after backward: tensor(0.0400, device='cuda:0', grad_fn=<MseLossBackward>)
  1411. loss_train: 4.342839952558279
  1412. step: 22
  1413. running loss: 0.19740181602537632
  1414. Train Steps: 22/90 Loss: 0.1974 torch.Size([8, 600, 800])
  1415. torch.Size([8, 8])
  1416. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  1417. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  1418. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  1419. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  1420. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200],
  1421. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  1422. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  1423. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200]],
  1424. device='cuda:0', dtype=torch.float64)
  1425. predictions are: tensor([[ 0.5874, -0.3813, 1.6545, -0.0507, -0.4417, 0.0812, 0.4304, 0.1834],
  1426. [ 0.3994, -0.4998, 1.2229, -1.3992, -0.2548, -1.6338, 0.2909, 0.1109],
  1427. [ 0.4773, -0.3984, 1.3342, -0.7806, -0.4434, -0.6878, 0.3460, 0.1358],
  1428. [ 0.5034, -0.4020, 1.5718, -0.4009, -0.3795, -0.3917, 0.4109, 0.1579],
  1429. [ 0.4831, -0.4854, 1.3986, -1.1440, -0.2725, -1.4507, 0.3654, 0.1005],
  1430. [ 0.6052, -0.4153, 1.6555, -0.1839, -0.4558, -0.1716, 0.4230, 0.1649],
  1431. [ 0.6080, -0.3871, 1.6687, -0.1327, -0.4663, -0.0808, 0.4349, 0.1612],
  1432. [ 0.5008, -0.3815, 1.3538, -0.8037, -0.4405, -0.6999, 0.3763, 0.1449]],
  1433. device='cuda:0', grad_fn=<AddmmBackward>)
  1434. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  1435. 0.5239],
  1436. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  1437. 0.2853],
  1438. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  1439. 0.2386],
  1440. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  1441. 0.2431],
  1442. [ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  1443. 0.1159],
  1444. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  1445. 0.0697],
  1446. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  1447. 0.3007],
  1448. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  1449. 0.1159]]], device='cuda:0')
  1450. loss_train_step before backward: tensor(0.0464, device='cuda:0', grad_fn=<MseLossBackward>)
  1451. loss_train_step after backward: tensor(0.0464, device='cuda:0', grad_fn=<MseLossBackward>)
  1452. loss_train: 4.389246199280024
  1453. step: 23
  1454. running loss: 0.1908367912730445
  1455. Train Steps: 23/90 Loss: 0.1908 torch.Size([8, 600, 800])
  1456. torch.Size([8, 8])
  1457. tensor([[0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  1458. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  1459. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  1460. [0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366],
  1461. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  1462. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495],
  1463. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  1464. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550]],
  1465. device='cuda:0', dtype=torch.float64)
  1466. predictions are: tensor([[ 0.6133, -0.3910, 1.8013, 0.1958, -0.3964, 0.3140, 0.4751, 0.2048],
  1467. [ 0.4495, -0.4382, 1.2529, -1.0922, -0.3345, -1.1163, 0.2963, 0.1465],
  1468. [ 0.4924, -0.4259, 1.3304, -1.0964, -0.2980, -1.2180, 0.3399, 0.1222],
  1469. [ 0.5933, -0.4085, 1.6925, -0.3447, -0.3869, -0.4754, 0.4793, 0.1284],
  1470. [ 0.5779, -0.3745, 1.5604, -0.4256, -0.4401, -0.2684, 0.4439, 0.1614],
  1471. [ 0.4712, -0.4171, 1.3140, -0.8936, -0.4123, -0.7876, 0.3292, 0.1524],
  1472. [ 0.4787, -0.4535, 1.4525, -0.9943, -0.2762, -1.1924, 0.3752, 0.1188],
  1473. [ 0.5423, -0.4336, 1.6983, -0.3355, -0.3292, -0.3300, 0.4789, 0.1588]],
  1474. device='cuda:0', grad_fn=<AddmmBackward>)
  1475. landmarks are: tensor([[[ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  1476. 0.1661],
  1477. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  1478. 0.3931],
  1479. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  1480. 0.2442],
  1481. [ 0.6273, -0.4249, 1.7095, 0.1159, -0.5480, -0.4306, 1.0910,
  1482. 0.1928],
  1483. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  1484. 0.0021],
  1485. [ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  1486. 0.2522],
  1487. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  1488. 0.1931],
  1489. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  1490. 0.2776]]], device='cuda:0')
  1491. loss_train_step before backward: tensor(0.0366, device='cuda:0', grad_fn=<MseLossBackward>)
  1492. loss_train_step after backward: tensor(0.0366, device='cuda:0', grad_fn=<MseLossBackward>)
  1493. loss_train: 4.425804238766432
  1494. step: 24
  1495. running loss: 0.18440850994860133
  1496.  
  1497. Train Steps: 24/90 Loss: 0.1844 torch.Size([8, 600, 800])
  1498. torch.Size([8, 8])
  1499. tensor([[0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  1500. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  1501. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  1502. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  1503. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  1504. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  1505. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  1506. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967]],
  1507. device='cuda:0', dtype=torch.float64)
  1508. predictions are: tensor([[ 0.5954, -0.4218, 1.5997, -0.6919, -0.3504, -0.7712, 0.4362, 0.1723],
  1509. [ 0.5064, -0.3984, 1.6899, -0.0856, -0.4166, 0.1454, 0.4647, 0.2048],
  1510. [ 0.5156, -0.4074, 1.3041, -1.1373, -0.3325, -1.1563, 0.3512, 0.1370],
  1511. [ 0.5488, -0.4500, 1.6568, -0.8152, -0.2328, -1.0531, 0.4730, 0.1296],
  1512. [ 0.5115, -0.4477, 1.4305, -1.0701, -0.2929, -1.2223, 0.3507, 0.1469],
  1513. [ 0.5264, -0.4210, 1.3500, -1.0950, -0.3389, -1.1687, 0.3748, 0.1390],
  1514. [ 0.5776, -0.4009, 1.8139, 0.1687, -0.4191, 0.2928, 0.5090, 0.2054],
  1515. [ 0.5844, -0.3730, 1.7113, -0.0934, -0.4380, 0.1155, 0.4841, 0.1837]],
  1516. device='cuda:0', grad_fn=<AddmmBackward>)
  1517. landmarks are: tensor([[[ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  1518. 0.2776],
  1519. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  1520. 0.0772],
  1521. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  1522. 0.0712],
  1523. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  1524. 0.3050],
  1525. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  1526. -0.0220],
  1527. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  1528. 0.3007],
  1529. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  1530. 0.3007],
  1531. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  1532. 0.0081]]], device='cuda:0')
  1533. loss_train_step before backward: tensor(0.0310, device='cuda:0', grad_fn=<MseLossBackward>)
  1534. loss_train_step after backward: tensor(0.0310, device='cuda:0', grad_fn=<MseLossBackward>)
  1535. loss_train: 4.456804607063532
  1536. step: 25
  1537. running loss: 0.17827218428254127
  1538. Train Steps: 25/90 Loss: 0.1783 torch.Size([8, 600, 800])
  1539. torch.Size([8, 8])
  1540. tensor([[ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  1541. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  1542. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  1543. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  1544. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  1545. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  1546. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  1547. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600]],
  1548. device='cuda:0', dtype=torch.float64)
  1549. predictions are: tensor([[ 0.5044, -0.4351, 1.3826, -1.0189, -0.3350, -1.0562, 0.3842, 0.1582],
  1550. [ 0.5649, -0.4414, 1.5426, -0.8654, -0.3159, -0.9570, 0.4214, 0.1911],
  1551. [ 0.5411, -0.4083, 1.3608, -1.0084, -0.3764, -1.0115, 0.3643, 0.1792],
  1552. [ 0.5614, -0.4106, 1.7066, -0.1109, -0.4423, 0.2117, 0.5177, 0.2240],
  1553. [ 0.6142, -0.4105, 1.7577, -0.4887, -0.3124, -0.6148, 0.5242, 0.1637],
  1554. [ 0.5997, -0.4014, 1.5340, -0.7335, -0.3835, -0.6683, 0.4661, 0.1797],
  1555. [ 0.4949, -0.4439, 1.4315, -1.0887, -0.2691, -1.1977, 0.3793, 0.1786],
  1556. [ 0.6371, -0.4062, 1.9366, 0.3314, -0.4247, 0.4813, 0.5960, 0.2351]],
  1557. device='cuda:0', grad_fn=<AddmmBackward>)
  1558. landmarks are: tensor([[[-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  1559. 0.2183],
  1560. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  1561. 0.2853],
  1562. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  1563. 0.2747],
  1564. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  1565. 0.2083],
  1566. [ 0.6116, -0.3898, 1.8654, -0.1997, -0.4788, -1.1081, 0.4367,
  1567. -0.0637],
  1568. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  1569. 0.2043],
  1570. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  1571. 0.2853],
  1572. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  1573. 0.3007]]], device='cuda:0')
  1574. loss_train_step before backward: tensor(0.2222, device='cuda:0', grad_fn=<MseLossBackward>)
  1575. loss_train_step after backward: tensor(0.2222, device='cuda:0', grad_fn=<MseLossBackward>)
  1576. loss_train: 4.679033596068621
  1577. step: 26
  1578. running loss: 0.17996283061802387
  1579. Train Steps: 26/90 Loss: 0.1800 torch.Size([8, 600, 800])
  1580. torch.Size([8, 8])
  1581. tensor([[0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  1582. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  1583. [0.6199, 0.4065, 0.7598, 0.2385, 0.4317, 0.1981, 0.5933, 0.5221],
  1584. [0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  1585. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  1586. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  1587. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  1588. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166]],
  1589. device='cuda:0', dtype=torch.float64)
  1590. predictions are: tensor([[ 0.5752, -0.4557, 1.7538, -0.0873, -0.4162, 0.0275, 0.5230, 0.2209],
  1591. [ 0.5054, -0.4485, 1.6481, -0.3998, -0.3812, -0.2287, 0.4958, 0.1973],
  1592. [ 0.5210, -0.4305, 1.3226, -1.2333, -0.3546, -1.2685, 0.3925, 0.1713],
  1593. [ 0.4906, -0.4524, 1.2683, -1.1478, -0.3965, -1.0973, 0.3616, 0.2053],
  1594. [ 0.5731, -0.4653, 1.7510, -0.3070, -0.4253, -0.3510, 0.5229, 0.1982],
  1595. [ 0.5210, -0.4544, 1.4968, -0.9434, -0.3615, -1.0090, 0.4108, 0.1978],
  1596. [ 0.5749, -0.4515, 1.7346, -0.6102, -0.3249, -0.7786, 0.5225, 0.1889],
  1597. [ 0.5185, -0.4411, 1.7667, -0.0767, -0.4038, 0.1146, 0.5136, 0.2516]],
  1598. device='cuda:0', grad_fn=<AddmmBackward>)
  1599. landmarks are: tensor([[[ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  1600. -0.1331],
  1601. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  1602. 0.0231],
  1603. [ 0.5774, -0.4082, 1.2235, -1.1844, -0.2919, -1.3709, 0.4544,
  1604. 0.1256],
  1605. [ 0.5049, -0.4428, 0.8692, -0.9581, -0.6693, -0.8386, 0.0897,
  1606. 0.2589],
  1607. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  1608. 0.1982],
  1609. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  1610. 0.2237],
  1611. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  1612. 0.0081],
  1613. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  1614. 0.1004]]], device='cuda:0')
  1615. loss_train_step before backward: tensor(0.0442, device='cuda:0', grad_fn=<MseLossBackward>)
  1616. loss_train_step after backward: tensor(0.0442, device='cuda:0', grad_fn=<MseLossBackward>)
  1617. loss_train: 4.7232260555028915
  1618. step: 27
  1619. running loss: 0.17493429835195895
  1620. Train Steps: 27/90 Loss: 0.1749 torch.Size([8, 600, 800])
  1621. torch.Size([8, 8])
  1622. tensor([[0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  1623. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  1624. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  1625. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  1626. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  1627. [0.6163, 0.4006, 0.8788, 0.4683, 0.3663, 0.4883, 0.5887, 0.5017],
  1628. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  1629. [0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103]],
  1630. device='cuda:0', dtype=torch.float64)
  1631. predictions are: tensor([[ 0.5405, -0.4394, 1.4507, -0.9549, -0.4286, -0.9721, 0.4815, 0.1903],
  1632. [ 0.4607, -0.4560, 1.2716, -0.9976, -0.4577, -0.8585, 0.3750, 0.2287],
  1633. [ 0.4619, -0.4713, 1.5905, -0.4083, -0.3709, -0.4039, 0.4716, 0.2178],
  1634. [ 0.4783, -0.4746, 1.6230, -0.4580, -0.3821, -0.4283, 0.4770, 0.2247],
  1635. [ 0.5517, -0.4558, 1.6601, -0.6311, -0.3759, -0.8260, 0.4948, 0.2009],
  1636. [ 0.4894, -0.4661, 1.5988, -0.3804, -0.4628, -0.1826, 0.4667, 0.2203],
  1637. [ 0.5504, -0.4706, 1.7239, -0.2985, -0.4422, -0.2883, 0.5128, 0.1965],
  1638. [ 0.5535, -0.4622, 1.7266, -0.4120, -0.4370, -0.4260, 0.4954, 0.2181]],
  1639. device='cuda:0', grad_fn=<AddmmBackward>)
  1640. landmarks are: tensor([[[ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  1641. -0.0957],
  1642. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  1643. 0.3546],
  1644. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  1645. 0.4547],
  1646. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  1647. 0.1146],
  1648. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  1649. 0.1661],
  1650. [ 0.5609, -0.4354, 1.7730, -0.1227, -0.5942, -0.0303, 0.4335,
  1651. 0.0313],
  1652. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  1653. 0.1854],
  1654. [ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  1655. 0.0712]]], device='cuda:0')
  1656. loss_train_step before backward: tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward>)
  1657. loss_train_step after backward: tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward>)
  1658. loss_train: 4.779460072517395
  1659. step: 28
  1660. running loss: 0.17069500258990697
  1661.  
  1662. Train Steps: 28/90 Loss: 0.1707 torch.Size([8, 600, 800])
  1663. torch.Size([8, 8])
  1664. tensor([[0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  1665. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  1666. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  1667. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  1668. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  1669. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  1670. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  1671. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482]],
  1672. device='cuda:0', dtype=torch.float64)
  1673. predictions are: tensor([[ 0.4621, -0.4910, 1.5000, -0.4019, -0.4888, -0.2934, 0.4030, 0.2112],
  1674. [ 0.4917, -0.4781, 1.5036, -0.9912, -0.3765, -1.2404, 0.4376, 0.1793],
  1675. [ 0.4635, -0.4929, 1.6376, -0.2115, -0.4377, -0.1783, 0.4493, 0.2203],
  1676. [ 0.4968, -0.4848, 1.6916, -0.1059, -0.5143, 0.0720, 0.5134, 0.2184],
  1677. [ 0.5540, -0.4735, 1.7266, -0.2006, -0.5030, -0.1378, 0.4941, 0.2128],
  1678. [ 0.5009, -0.4610, 1.3333, -1.0000, -0.4870, -1.0072, 0.4258, 0.1925],
  1679. [ 0.5170, -0.4835, 1.7170, -0.1887, -0.4760, -0.2195, 0.4769, 0.1899],
  1680. [ 0.4410, -0.5048, 1.4669, -1.0029, -0.3608, -1.2285, 0.4652, 0.1677]],
  1681. device='cuda:0', grad_fn=<AddmmBackward>)
  1682. landmarks are: tensor([[[ 0.6289, -0.4393, 1.3977, 0.3777, -0.5134, -0.0457, 1.0984,
  1683. 0.1821],
  1684. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  1685. -0.0209],
  1686. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  1687. 0.2634],
  1688. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  1689. 0.1929],
  1690. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  1691. 0.1159],
  1692. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  1693. -0.0220],
  1694. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  1695. -0.0370],
  1696. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  1697. 0.2463]]], device='cuda:0')
  1698. loss_train_step before backward: tensor(0.2187, device='cuda:0', grad_fn=<MseLossBackward>)
  1699. loss_train_step after backward: tensor(0.2187, device='cuda:0', grad_fn=<MseLossBackward>)
  1700. loss_train: 4.998158469796181
  1701. step: 29
  1702. running loss: 0.17235029206193728
  1703. Train Steps: 29/90 Loss: 0.1724 torch.Size([8, 600, 800])
  1704. torch.Size([8, 8])
  1705. tensor([[0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  1706. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  1707. [0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  1708. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  1709. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  1710. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  1711. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633],
  1712. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822]],
  1713. device='cuda:0', dtype=torch.float64)
  1714. predictions are: tensor([[ 0.4439, -0.4882, 1.6552, -0.1041, -0.5164, -0.0036, 0.4752, 0.1893],
  1715. [ 0.4620, -0.4752, 1.6635, -0.2930, -0.4908, -0.3561, 0.4884, 0.1639],
  1716. [ 0.4005, -0.5161, 1.5989, -0.2423, -0.4633, -0.2455, 0.4451, 0.1616],
  1717. [ 0.4913, -0.5129, 1.6991, -0.2184, -0.4814, -0.2698, 0.4712, 0.1792],
  1718. [ 0.4668, -0.4844, 1.6592, -0.1376, -0.4977, -0.1037, 0.4597, 0.1926],
  1719. [ 0.3816, -0.5161, 1.4410, -0.9878, -0.3631, -1.2132, 0.4439, 0.1703],
  1720. [ 0.4210, -0.4985, 1.4144, -1.0300, -0.4295, -1.1849, 0.4380, 0.1659],
  1721. [ 0.4693, -0.5386, 1.6060, -0.4653, -0.4800, -0.5654, 0.4283, 0.1936]],
  1722. device='cuda:0', grad_fn=<AddmmBackward>)
  1723. landmarks are: tensor([[[ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  1724. 0.3315],
  1725. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  1726. -0.0102],
  1727. [ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  1728. -0.0911],
  1729. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  1730. 0.0313],
  1731. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  1732. 0.3007],
  1733. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  1734. 0.2944],
  1735. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  1736. 0.3157],
  1737. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  1738. 0.4032]]], device='cuda:0')
  1739. loss_train_step before backward: tensor(0.0521, device='cuda:0', grad_fn=<MseLossBackward>)
  1740. loss_train_step after backward: tensor(0.0521, device='cuda:0', grad_fn=<MseLossBackward>)
  1741. loss_train: 5.050214387476444
  1742. step: 30
  1743. running loss: 0.16834047958254814
  1744. Train Steps: 30/90 Loss: 0.1683 torch.Size([8, 600, 800])
  1745. torch.Size([8, 8])
  1746. tensor([[0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  1747. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  1748. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  1749. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  1750. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  1751. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  1752. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  1753. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726]],
  1754. device='cuda:0', dtype=torch.float64)
  1755. predictions are: tensor([[ 0.4256, -0.5307, 1.4230, -0.6611, -0.4992, -0.7421, 0.4294, 0.1491],
  1756. [ 0.4814, -0.4975, 1.7566, -0.1036, -0.4995, -0.1922, 0.5431, 0.1585],
  1757. [ 0.4664, -0.5085, 1.9594, 0.3104, -0.4150, 0.1499, 0.5579, 0.1315],
  1758. [ 0.4296, -0.5129, 1.9311, 0.3247, -0.4423, 0.3089, 0.5455, 0.1614],
  1759. [ 0.3443, -0.5417, 1.3398, -0.8960, -0.4093, -1.0721, 0.3534, 0.1745],
  1760. [ 0.4356, -0.5197, 1.4351, -0.7563, -0.4948, -0.8742, 0.4220, 0.1475],
  1761. [ 0.3822, -0.5374, 1.4107, -0.7609, -0.4680, -0.9120, 0.3871, 0.1718],
  1762. [ 0.4443, -0.4906, 1.4567, -0.7145, -0.4900, -0.8297, 0.4329, 0.1366]],
  1763. device='cuda:0', grad_fn=<AddmmBackward>)
  1764. landmarks are: tensor([[[ 5.7296e-01, -4.5619e-01, 1.2195e+00, -1.2440e+00, -5.4966e-01,
  1765. -7.7109e-01, 5.7045e-01, 1.7788e-01],
  1766. [ 6.0710e-01, -4.1186e-01, 1.7788e+00, -5.1532e-01, -6.0000e-01,
  1767. -5.6921e-01, 6.5857e-01, -6.7050e-02],
  1768. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  1769. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  1770. [ 5.6637e-01, -4.3212e-01, 1.8249e+00, -2.0739e-01, -2.6513e-01,
  1771. 4.1617e-01, 5.6628e-01, 2.0062e-01],
  1772. [ 5.8620e-01, -3.5296e-01, 1.1032e+00, -1.0619e+00, -1.4965e-01,
  1773. -1.3852e+00, 3.4111e-01, 3.9307e-01],
  1774. [ 5.2194e-01, -4.5504e-01, 1.1415e+00, -9.1962e-01, -6.4042e-01,
  1775. -9.3872e-01, 1.8562e-01, 1.4106e-02],
  1776. [ 5.6028e-01, -3.7637e-01, 8.0878e-01, -1.1466e+00, -4.5566e-01,
  1777. -1.1158e+00, 3.6420e-01, 2.3911e-01],
  1778. [ 4.9971e-01, -4.4465e-01, 1.1610e+00, -9.7721e-01, -6.0577e-01,
  1779. -1.0311e+00, 1.4038e-01, -1.0312e-01]]], device='cuda:0')
  1780. loss_train_step before backward: tensor(0.0491, device='cuda:0', grad_fn=<MseLossBackward>)
  1781. loss_train_step after backward: tensor(0.0491, device='cuda:0', grad_fn=<MseLossBackward>)
  1782. loss_train: 5.099356964230537
  1783. step: 31
  1784. running loss: 0.16449538594292057
  1785. Train Steps: 31/90 Loss: 0.1645 torch.Size([8, 600, 800])
  1786. torch.Size([8, 8])
  1787. tensor([[0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  1788. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  1789. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  1790. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  1791. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  1792. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  1793. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  1794. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482]],
  1795. device='cuda:0', dtype=torch.float64)
  1796. predictions are: tensor([[ 0.4981, -0.5002, 1.8641, 0.2520, -0.4876, 0.1037, 0.5152, 0.1010],
  1797. [ 0.4992, -0.4909, 1.9148, 0.4428, -0.4518, 0.3332, 0.5102, 0.1114],
  1798. [ 0.5246, -0.4915, 1.7953, -0.2241, -0.4603, -0.4731, 0.5106, 0.1482],
  1799. [ 0.3892, -0.4989, 1.4743, -0.3986, -0.5017, -0.3789, 0.4380, 0.1431],
  1800. [ 0.3725, -0.5422, 1.3167, -0.9795, -0.4368, -1.2552, 0.3796, 0.1484],
  1801. [ 0.3573, -0.5144, 1.2350, -0.8814, -0.4860, -0.9428, 0.3407, 0.1568],
  1802. [ 0.3831, -0.4949, 1.4455, -0.4288, -0.5095, -0.3071, 0.3988, 0.1604],
  1803. [ 0.2896, -0.5915, 1.6280, -0.6673, -0.2973, -1.0396, 0.5594, 0.1253]],
  1804. device='cuda:0', grad_fn=<AddmmBackward>)
  1805. landmarks are: tensor([[[ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  1806. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  1807. [ 5.7829e-01, -4.3634e-01, 1.7724e+00, 4.3211e-02, -5.1531e-01,
  1808. 8.7136e-02, 4.8401e-01, 6.6263e-02],
  1809. [ 5.7685e-01, -3.8568e-01, 1.5305e+00, -7.6936e-01, -6.4619e-01,
  1810. -6.3079e-01, 3.9885e-01, 3.3149e-01],
  1811. [ 5.4440e-01, -3.8522e-01, 1.3786e+00, -5.4087e-01, -6.9238e-01,
  1812. -4.2294e-01, 1.7915e-01, 2.3412e-01],
  1813. [ 5.1085e-01, -4.3164e-01, 1.1436e+00, -1.3467e+00, -3.8637e-01,
  1814. -1.4160e+00, 1.2393e-01, -5.8033e-02],
  1815. [ 5.4099e-01, -4.3210e-01, 8.8383e-01, -9.8491e-01, -5.7691e-01,
  1816. -1.0003e+00, 2.6028e-01, 3.3149e-01],
  1817. [ 5.4319e-01, -4.2240e-01, 1.3284e+00, -8.5404e-01, -6.8661e-01,
  1818. -2.2633e-02, 4.0770e-01, 3.1769e-01],
  1819. [-2.2859e+00, -2.2859e+00, 1.6517e+00, -1.2620e+00, 2.1409e-01,
  1820. -1.1928e+00, 1.1166e+00, 2.4627e-01]]], device='cuda:0')
  1821. loss_train_step before backward: tensor(0.1953, device='cuda:0', grad_fn=<MseLossBackward>)
  1822. loss_train_step after backward: tensor(0.1953, device='cuda:0', grad_fn=<MseLossBackward>)
  1823. loss_train: 5.294639840722084
  1824. step: 32
  1825. running loss: 0.16545749502256513
  1826.  
  1827. Train Steps: 32/90 Loss: 0.1655 torch.Size([8, 600, 800])
  1828. torch.Size([8, 8])
  1829. tensor([[0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  1830. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  1831. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  1832. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  1833. [0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771],
  1834. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  1835. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  1836. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650]],
  1837. device='cuda:0', dtype=torch.float64)
  1838. predictions are: tensor([[ 0.3085, -0.5768, 1.4610, -0.7784, -0.3601, -1.1018, 0.4599, 0.1369],
  1839. [ 0.4371, -0.5274, 1.7047, -0.0446, -0.4892, -0.1888, 0.5027, 0.0903],
  1840. [ 0.4908, -0.4720, 1.7375, -0.0467, -0.5059, -0.2004, 0.4971, 0.1306],
  1841. [ 0.3127, -0.5506, 1.1132, -1.1260, -0.4676, -1.1954, 0.3508, 0.1386],
  1842. [ 0.4899, -0.4851, 1.8631, 0.2737, -0.4897, 0.2595, 0.5035, 0.1027],
  1843. [ 0.2675, -0.5867, 1.1643, -1.0927, -0.4417, -1.2381, 0.3678, 0.1496],
  1844. [ 0.3908, -0.5745, 1.7423, -0.0200, -0.3634, -0.2191, 0.4888, 0.1441],
  1845. [ 0.3999, -0.5149, 1.7153, 0.0344, -0.4431, 0.0088, 0.4822, 0.1426]],
  1846. device='cuda:0', grad_fn=<AddmmBackward>)
  1847. landmarks are: tensor([[[ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  1848. 0.2622],
  1849. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  1850. 0.1544],
  1851. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  1852. 0.2468],
  1853. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  1854. 0.3852],
  1855. [ 0.6072, -0.4247, 1.8711, -0.0842, -0.5307, 0.1005, 0.6771,
  1856. -0.0821],
  1857. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  1858. 0.3238],
  1859. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  1860. 0.2026],
  1861. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  1862. 0.3238]]], device='cuda:0')
  1863. loss_train_step before backward: tensor(0.1797, device='cuda:0', grad_fn=<MseLossBackward>)
  1864. loss_train_step after backward: tensor(0.1797, device='cuda:0', grad_fn=<MseLossBackward>)
  1865. loss_train: 5.4743141531944275
  1866. step: 33
  1867. running loss: 0.1658883076725584
  1868. Train Steps: 33/90 Loss: 0.1659 torch.Size([8, 600, 800])
  1869. torch.Size([8, 8])
  1870. tensor([[0.6277, 0.4013, 0.8888, 0.4767, 0.3600, 0.3567, 0.6148, 0.4672],
  1871. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  1872. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  1873. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  1874. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  1875. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  1876. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  1877. [0.6300, 0.4102, 0.9088, 0.4433, 0.4088, 0.3067, 0.6820, 0.5540]],
  1878. device='cuda:0', dtype=torch.float64)
  1879. predictions are: tensor([[ 0.4537, -0.5209, 1.6994, -0.1240, -0.4797, -0.3147, 0.4962, 0.1137],
  1880. [ 0.2515, -0.5921, 1.1194, -1.0232, -0.4625, -1.1073, 0.3233, 0.1711],
  1881. [ 0.4298, -0.5692, 1.8640, 0.1525, -0.3792, -0.1307, 0.4597, 0.1279],
  1882. [ 0.3892, -0.5137, 1.5070, -0.3672, -0.4984, -0.3483, 0.4242, 0.1417],
  1883. [ 0.3929, -0.5408, 1.5922, -0.0295, -0.4774, -0.1083, 0.4134, 0.1505],
  1884. [ 0.3016, -0.5772, 1.1988, -0.8329, -0.4858, -0.8551, 0.3505, 0.1630],
  1885. [ 0.4089, -0.5140, 1.5588, -0.3554, -0.5156, -0.3883, 0.4443, 0.1207],
  1886. [ 0.2977, -0.6028, 1.8114, -0.2007, -0.3145, -0.6246, 0.5291, 0.1498]],
  1887. device='cuda:0', grad_fn=<AddmmBackward>)
  1888. landmarks are: tensor([[[ 0.6132, -0.4324, 1.8192, -0.0842, -0.6231, -0.6385, 0.5537,
  1889. -0.1278],
  1890. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  1891. 0.3315],
  1892. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  1893. -0.0220],
  1894. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  1895. 0.2930],
  1896. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  1897. 0.3478],
  1898. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  1899. 0.3694],
  1900. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  1901. 0.0236],
  1902. [ 0.6240, -0.3912, 1.9115, -0.2382, -0.3979, -0.8694, 0.8644,
  1903. 0.2730]]], device='cuda:0')
  1904. loss_train_step before backward: tensor(0.0368, device='cuda:0', grad_fn=<MseLossBackward>)
  1905. loss_train_step after backward: tensor(0.0368, device='cuda:0', grad_fn=<MseLossBackward>)
  1906. loss_train: 5.511073064059019
  1907. step: 34
  1908. running loss: 0.16209038423702998
  1909. Train Steps: 34/90 Loss: 0.1621 torch.Size([8, 600, 800])
  1910. torch.Size([8, 8])
  1911. tensor([[0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  1912. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  1913. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  1914. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  1915. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  1916. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  1917. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  1918. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050]],
  1919. device='cuda:0', dtype=torch.float64)
  1920. predictions are: tensor([[ 0.3724, -0.5650, 1.5811, -0.3080, -0.4808, -0.4925, 0.4385, 0.1313],
  1921. [ 0.2653, -0.6318, 1.3712, -0.6937, -0.3957, -0.8542, 0.4976, 0.1337],
  1922. [ 0.1592, -0.6391, 1.2529, -0.8141, -0.3916, -0.9404, 0.3738, 0.2095],
  1923. [ 0.1828, -0.6339, 1.3143, -0.7811, -0.3769, -1.0112, 0.4253, 0.1762],
  1924. [ 0.4055, -0.5633, 1.4417, -0.5345, -0.5245, -0.6789, 0.4411, 0.1603],
  1925. [ 0.2255, -0.6256, 1.2832, -0.7301, -0.4409, -0.8754, 0.3790, 0.1613],
  1926. [ 0.5063, -0.4833, 1.8031, 0.4133, -0.4401, 0.4369, 0.4695, 0.1416],
  1927. [ 0.5404, -0.4651, 1.7917, 0.4030, -0.4918, 0.3713, 0.4484, 0.1168]],
  1928. device='cuda:0', grad_fn=<AddmmBackward>)
  1929. landmarks are: tensor([[[ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  1930. 0.2083],
  1931. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  1932. 0.1020],
  1933. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  1934. 0.2853],
  1935. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  1936. 0.2237],
  1937. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  1938. 0.0620],
  1939. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  1940. 0.3315],
  1941. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  1942. 0.1082],
  1943. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  1944. 0.0467]]], device='cuda:0')
  1945. loss_train_step before backward: tensor(0.2046, device='cuda:0', grad_fn=<MseLossBackward>)
  1946. loss_train_step after backward: tensor(0.2046, device='cuda:0', grad_fn=<MseLossBackward>)
  1947. loss_train: 5.71563608571887
  1948. step: 35
  1949. running loss: 0.16330388816339628
  1950. Train Steps: 35/90 Loss: 0.1633 torch.Size([8, 600, 800])
  1951. torch.Size([8, 8])
  1952. tensor([[0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  1953. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  1954. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  1955. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  1956. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  1957. [0.6314, 0.4107, 0.8750, 0.5100, 0.3788, 0.4900, 0.7121, 0.5864],
  1958. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  1959. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117]],
  1960. device='cuda:0', dtype=torch.float64)
  1961. predictions are: tensor([[ 0.1656, -0.6813, 1.2116, -0.9808, -0.3851, -1.2191, 0.4084, 0.2121],
  1962. [ 0.5132, -0.4670, 1.8552, 0.3621, -0.4981, 0.4013, 0.4923, 0.1279],
  1963. [ 0.2068, -0.6265, 1.0946, -0.9656, -0.4810, -1.0109, 0.3559, 0.1965],
  1964. [ 0.4097, -0.5306, 1.4900, -0.4212, -0.4880, -0.4898, 0.4622, 0.1524],
  1965. [ 0.1992, -0.6792, 1.3864, -0.7662, -0.3886, -1.0255, 0.4300, 0.2195],
  1966. [ 0.5568, -0.4758, 1.8857, 0.3602, -0.4827, 0.2015, 0.5142, 0.1116],
  1967. [ 0.2005, -0.6281, 1.0860, -1.0023, -0.4493, -1.0749, 0.3525, 0.2077],
  1968. [ 0.5050, -0.4917, 1.7101, 0.1303, -0.4779, 0.0353, 0.4208, 0.1442]],
  1969. device='cuda:0', grad_fn=<AddmmBackward>)
  1970. landmarks are: tensor([[[ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  1971. 0.2058],
  1972. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  1973. 0.1082],
  1974. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  1975. 0.2699],
  1976. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  1977. 0.1005],
  1978. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  1979. 0.2853],
  1980. [ 0.6306, -0.3888, 1.7557, 0.0697, -0.5365, -0.0226, 1.0033,
  1981. 0.4226],
  1982. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  1983. 0.2476],
  1984. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  1985. 0.0774]]], device='cuda:0')
  1986. loss_train_step before backward: tensor(0.0442, device='cuda:0', grad_fn=<MseLossBackward>)
  1987. loss_train_step after backward: tensor(0.0442, device='cuda:0', grad_fn=<MseLossBackward>)
  1988. loss_train: 5.759868372231722
  1989. step: 36
  1990. running loss: 0.1599963436731034
  1991.  
  1992. Train Steps: 36/90 Loss: 0.1600 torch.Size([8, 600, 800])
  1993. torch.Size([8, 8])
  1994. tensor([[0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  1995. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  1996. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  1997. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  1998. [0.6203, 0.4078, 0.8800, 0.5083, 0.3900, 0.5000, 0.6100, 0.5583],
  1999. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  2000. [0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  2001. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100]],
  2002. device='cuda:0', dtype=torch.float64)
  2003. predictions are: tensor([[ 0.0306, -0.7482, 1.1684, -1.1746, -0.3463, -1.4168, 0.4507, 0.2861],
  2004. [ 0.4355, -0.4647, 1.4831, -0.1241, -0.5088, -0.0437, 0.4310, 0.1761],
  2005. [ 0.5143, -0.4910, 1.6547, -0.1234, -0.5125, -0.2014, 0.4634, 0.1301],
  2006. [ 0.2105, -0.5922, 1.0609, -0.9738, -0.4900, -0.8628, 0.3837, 0.2377],
  2007. [ 0.5715, -0.4519, 1.6900, 0.0187, -0.5369, -0.0197, 0.4772, 0.1420],
  2008. [ 0.4221, -0.5485, 1.5904, -0.2299, -0.4761, -0.3609, 0.4290, 0.1838],
  2009. [ 0.0825, -0.7490, 1.3565, -1.0026, -0.3237, -1.2647, 0.5705, 0.2463],
  2010. [ 0.5655, -0.4344, 1.5807, 0.0510, -0.5576, 0.0759, 0.3991, 0.1501]],
  2011. device='cuda:0', grad_fn=<AddmmBackward>)
  2012. landmarks are: tensor([[[ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  2013. 0.2549],
  2014. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  2015. 0.3425],
  2016. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  2017. 0.1525],
  2018. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  2019. 0.3469],
  2020. [ 0.5794, -0.4023, 1.7788, 0.0620, -0.4845, 0.0236, 0.5316,
  2021. 0.2930],
  2022. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  2023. 0.0893],
  2024. [ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  2025. 0.3157],
  2026. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  2027. 0.5316]]], device='cuda:0')
  2028. loss_train_step before backward: tensor(0.0460, device='cuda:0', grad_fn=<MseLossBackward>)
  2029. loss_train_step after backward: tensor(0.0460, device='cuda:0', grad_fn=<MseLossBackward>)
  2030. loss_train: 5.805826131254435
  2031. step: 37
  2032. running loss: 0.15691421976363337
  2033. Train Steps: 37/90 Loss: 0.1569 torch.Size([8, 600, 800])
  2034. torch.Size([8, 8])
  2035. tensor([[0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  2036. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  2037. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  2038. [0.6131, 0.4037, 0.6907, 0.2819, 0.3688, 0.2700, 0.5217, 0.5680],
  2039. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  2040. [0.6262, 0.4085, 0.8438, 0.3150, 0.4025, 0.2633, 0.6339, 0.4810],
  2041. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883],
  2042. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317]],
  2043. device='cuda:0', dtype=torch.float64)
  2044. predictions are: tensor([[ 0.3484, -0.5611, 1.1903, -0.8528, -0.5253, -0.8242, 0.4086, 0.2321],
  2045. [ 0.5839, -0.4033, 1.4489, -0.3269, -0.5890, -0.0762, 0.4293, 0.1951],
  2046. [ 0.6881, -0.3780, 1.8892, 0.4334, -0.4735, 0.3656, 0.5026, 0.1625],
  2047. [ 0.3486, -0.5398, 1.1285, -0.8707, -0.5217, -0.8116, 0.3905, 0.2235],
  2048. [ 0.1830, -0.6934, 1.5746, -0.6413, -0.2942, -0.8391, 0.6271, 0.2453],
  2049. [ 0.4457, -0.5310, 1.4380, -0.6530, -0.4888, -0.6945, 0.5348, 0.1828],
  2050. [ 0.3547, -0.5630, 1.3450, -0.6403, -0.4638, -0.7016, 0.4201, 0.2484],
  2051. [ 0.1226, -0.6902, 1.2788, -0.9352, -0.3668, -1.0977, 0.4852, 0.2776]],
  2052. device='cuda:0', grad_fn=<AddmmBackward>)
  2053. landmarks are: tensor([[[ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  2054. 0.2391],
  2055. [ 0.5432, -0.4224, 1.3284, -0.8540, -0.6866, -0.0226, 0.4077,
  2056. 0.3177],
  2057. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  2058. 0.0851],
  2059. [ 0.5459, -0.4215, 0.9043, -0.9838, -0.5827, -1.0388, 0.1236,
  2060. 0.3378],
  2061. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  2062. 0.2142],
  2063. [ 0.6064, -0.3990, 1.6113, -0.8309, -0.4268, -1.0696, 0.6421,
  2064. -0.0640],
  2065. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  2066. 0.4316],
  2067. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  2068. 0.1698]]], device='cuda:0')
  2069. loss_train_step before backward: tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward>)
  2070. loss_train_step after backward: tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward>)
  2071. loss_train: 5.863999526947737
  2072. step: 38
  2073. running loss: 0.15431577702494045
  2074. Train Steps: 38/90 Loss: 0.1543 torch.Size([8, 600, 800])
  2075. torch.Size([8, 8])
  2076. tensor([[0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  2077. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  2078. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  2079. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  2080. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  2081. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  2082. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  2083. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702]],
  2084. device='cuda:0', dtype=torch.float64)
  2085. predictions are: tensor([[ 0.6287, -0.4028, 1.6203, -0.1966, -0.4968, -0.2871, 0.5465, 0.1927],
  2086. [ 0.5755, -0.4245, 1.5422, -0.3178, -0.4948, -0.3611, 0.5096, 0.1966],
  2087. [ 0.5557, -0.4868, 1.7148, -0.1531, -0.4118, -0.2448, 0.5633, 0.2358],
  2088. [ 0.2434, -0.6120, 1.1403, -1.0868, -0.4222, -1.0653, 0.4561, 0.3103],
  2089. [ 0.2002, -0.6206, 0.9828, -1.2643, -0.4166, -1.2470, 0.4367, 0.3031],
  2090. [ 0.0895, -0.6730, 1.1629, -1.1852, -0.3008, -1.2543, 0.5230, 0.3339],
  2091. [ 0.6912, -0.3737, 1.6513, -0.1489, -0.5177, -0.0689, 0.4943, 0.1897],
  2092. [ 0.5583, -0.4039, 1.4031, -0.2909, -0.5239, -0.1276, 0.4636, 0.2189]],
  2093. device='cuda:0', grad_fn=<AddmmBackward>)
  2094. landmarks are: tensor([[[ 0.5379, -0.4358, 1.7326, 0.1852, -0.6058, -0.5461, 0.0684,
  2095. -0.0310],
  2096. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  2097. 0.2058],
  2098. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  2099. 0.2676],
  2100. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  2101. 0.2853],
  2102. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  2103. 0.2058],
  2104. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  2105. 0.2083],
  2106. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  2107. 0.1159],
  2108. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  2109. 0.3478]]], device='cuda:0')
  2110. loss_train_step before backward: tensor(0.0508, device='cuda:0', grad_fn=<MseLossBackward>)
  2111. loss_train_step after backward: tensor(0.0508, device='cuda:0', grad_fn=<MseLossBackward>)
  2112. loss_train: 5.914830353111029
  2113. step: 39
  2114. running loss: 0.15166231674643663
  2115. Train Steps: 39/90 Loss: 0.1517 torch.Size([8, 600, 800])
  2116. torch.Size([8, 8])
  2117. tensor([[0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  2118. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  2119. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  2120. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  2121. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  2122. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  2123. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  2124. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400]],
  2125. device='cuda:0', dtype=torch.float64)
  2126. predictions are: tensor([[ 0.6486, -0.3410, 1.5774, -0.2222, -0.4965, -0.0596, 0.5604, 0.2172],
  2127. [ 0.6847, -0.3742, 1.5988, -0.2892, -0.5014, -0.3354, 0.5350, 0.2231],
  2128. [ 0.6656, -0.3219, 1.4963, -0.2681, -0.5249, -0.1370, 0.4741, 0.2231],
  2129. [ 0.5834, -0.4588, 1.4839, -0.5551, -0.5066, -0.6224, 0.4980, 0.2645],
  2130. [ 0.6183, -0.3602, 1.5010, -0.4473, -0.4864, -0.3845, 0.5184, 0.2457],
  2131. [ 0.1681, -0.6630, 1.1836, -1.3643, -0.2738, -1.4343, 0.6444, 0.3350],
  2132. [ 0.5656, -0.3962, 1.4756, -0.3737, -0.4396, -0.3481, 0.4812, 0.2817],
  2133. [ 0.1295, -0.6485, 1.0784, -1.3811, -0.3357, -1.4434, 0.5232, 0.3749]],
  2134. device='cuda:0', grad_fn=<AddmmBackward>)
  2135. landmarks are: tensor([[[ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  2136. 0.1554],
  2137. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  2138. 0.0313],
  2139. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  2140. 0.5239],
  2141. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  2142. 0.4032],
  2143. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  2144. 0.1439],
  2145. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  2146. 0.2944],
  2147. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  2148. 0.2634],
  2149. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  2150. 0.2083]]], device='cuda:0')
  2151. loss_train_step before backward: tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward>)
  2152. loss_train_step after backward: tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward>)
  2153. loss_train: 5.975822579115629
  2154. step: 40
  2155. running loss: 0.14939556447789074
  2156.  
  2157. Train Steps: 40/90 Loss: 0.1494 torch.Size([8, 600, 800])
  2158. torch.Size([8, 8])
  2159. tensor([[0.6205, 0.4081, 0.8950, 0.4017, 0.3788, 0.4700, 0.5963, 0.5667],
  2160. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  2161. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  2162. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  2163. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  2164. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  2165. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  2166. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749]],
  2167. device='cuda:0', dtype=torch.float64)
  2168. predictions are: tensor([[ 0.7940, -0.2830, 1.7891, -0.1529, -0.4726, -0.1025, 0.5921, 0.2275],
  2169. [ 0.7956, -0.3095, 1.8062, 0.0619, -0.4303, 0.0046, 0.5869, 0.1973],
  2170. [ 0.4080, -0.4914, 1.0629, -1.2522, -0.4499, -1.1842, 0.4631, 0.3219],
  2171. [ 0.8304, -0.2782, 1.7126, -0.1263, -0.4942, -0.1525, 0.5709, 0.2095],
  2172. [ 0.6740, -0.3268, 1.7111, -0.1091, -0.3630, -0.1135, 0.5836, 0.2540],
  2173. [ 0.2240, -0.6083, 1.1813, -1.3228, -0.2818, -1.4002, 0.5638, 0.3649],
  2174. [ 0.2937, -0.5621, 1.0164, -1.4729, -0.3887, -1.4923, 0.4779, 0.3411],
  2175. [ 0.5184, -0.4149, 1.1081, -1.0105, -0.5213, -0.8176, 0.4427, 0.3183]],
  2176. device='cuda:0', grad_fn=<AddmmBackward>)
  2177. landmarks are: tensor([[[ 0.5799, -0.4012, 1.8480, -0.4306, -0.5365, -0.1150, 0.4681,
  2178. 0.3315],
  2179. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  2180. -0.0168],
  2181. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  2182. 0.2699],
  2183. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  2184. 0.0325],
  2185. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  2186. 0.1146],
  2187. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  2188. 0.1698],
  2189. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  2190. 0.1253],
  2191. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  2192. 0.3694]]], device='cuda:0')
  2193. loss_train_step before backward: tensor(0.0260, device='cuda:0', grad_fn=<MseLossBackward>)
  2194. loss_train_step after backward: tensor(0.0260, device='cuda:0', grad_fn=<MseLossBackward>)
  2195. loss_train: 6.001800514757633
  2196. step: 41
  2197. running loss: 0.14638537840872276
  2198. Train Steps: 41/90 Loss: 0.1464 torch.Size([8, 600, 800])
  2199. torch.Size([8, 8])
  2200. tensor([[0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  2201. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  2202. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  2203. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  2204. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  2205. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  2206. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  2207. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833]],
  2208. device='cuda:0', dtype=torch.float64)
  2209. predictions are: tensor([[ 0.4199, -0.4943, 1.0790, -1.4109, -0.3797, -1.4113, 0.5004, 0.3263],
  2210. [ 0.7100, -0.3301, 1.7054, -0.2859, -0.3876, -0.3165, 0.5298, 0.2141],
  2211. [ 0.6441, -0.3112, 1.6181, -0.4765, -0.3953, -0.5129, 0.5334, 0.2616],
  2212. [ 0.4550, -0.4527, 1.3070, -1.0951, -0.3657, -1.0771, 0.5272, 0.3358],
  2213. [ 0.7904, -0.2419, 1.7333, -0.0269, -0.4500, -0.0779, 0.5352, 0.2389],
  2214. [ 0.7278, -0.3011, 1.6891, -0.2632, -0.4183, -0.2551, 0.5382, 0.2533],
  2215. [ 0.3967, -0.4765, 0.9523, -1.4774, -0.4310, -1.3825, 0.4442, 0.3253],
  2216. [ 0.7859, -0.2656, 1.7115, -0.2033, -0.4576, -0.1586, 0.5810, 0.1942]],
  2217. device='cuda:0', grad_fn=<AddmmBackward>)
  2218. landmarks are: tensor([[[ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  2219. 0.0774],
  2220. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  2221. -0.0220],
  2222. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  2223. 0.1852],
  2224. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  2225. 0.3469],
  2226. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  2227. 0.3084],
  2228. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  2229. 0.2930],
  2230. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  2231. 0.2576],
  2232. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  2233. -0.0534]]], device='cuda:0')
  2234. loss_train_step before backward: tensor(0.0263, device='cuda:0', grad_fn=<MseLossBackward>)
  2235. loss_train_step after backward: tensor(0.0263, device='cuda:0', grad_fn=<MseLossBackward>)
  2236. loss_train: 6.028124667704105
  2237. step: 42
  2238. running loss: 0.1435267778024787
  2239. Train Steps: 42/90 Loss: 0.1435 torch.Size([8, 600, 800])
  2240. torch.Size([8, 8])
  2241. tensor([[0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  2242. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  2243. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  2244. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  2245. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  2246. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  2247. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  2248. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950]],
  2249. device='cuda:0', dtype=torch.float64)
  2250. predictions are: tensor([[ 0.6704, -0.3256, 1.6446, -0.3800, -0.3220, -0.4287, 0.5034, 0.2098],
  2251. [ 0.7600, -0.2821, 1.6958, -0.3735, -0.4332, -0.5067, 0.5104, 0.2388],
  2252. [ 0.4023, -0.5221, 1.4291, -1.2232, -0.2208, -1.2984, 0.6148, 0.2990],
  2253. [ 0.4486, -0.4718, 1.0584, -1.5126, -0.3953, -1.4553, 0.4707, 0.3244],
  2254. [ 0.7212, -0.2695, 1.4876, -0.3751, -0.4994, -0.2967, 0.4663, 0.2486],
  2255. [ 0.7195, -0.2523, 1.4674, -0.6101, -0.5033, -0.4567, 0.4606, 0.2342],
  2256. [ 0.7293, -0.2780, 1.6936, -0.2997, -0.3912, -0.3453, 0.5069, 0.1911],
  2257. [ 0.7337, -0.2971, 1.6755, -0.2719, -0.3963, -0.3425, 0.4923, 0.2010]],
  2258. device='cuda:0', grad_fn=<AddmmBackward>)
  2259. landmarks are: tensor([[[ 5.3279e-01, -4.3610e-01, 1.7268e+00, 6.9746e-02, -6.3048e-02,
  2260. 2.0831e-01, 2.1029e-01, 5.3181e-02],
  2261. [ 6.0964e-01, -4.0462e-01, 1.8249e+00, -7.2363e-03, -6.1155e-01,
  2262. -3.5366e-01, 6.1824e-01, 9.2841e-02],
  2263. [-2.2859e+00, -2.2859e+00, 1.8249e+00, -8.0015e-01, 4.0878e-02,
  2264. -1.2543e+00, 8.0590e-01, 3.0505e-01],
  2265. [ 5.8614e-01, -3.9292e-01, 1.0570e+00, -1.4314e+00, -3.2864e-01,
  2266. -1.1235e+00, 6.1824e-01, 1.8522e-01],
  2267. [ 6.4542e-01, -3.9842e-01, 1.3804e+00, 2.5450e-01, -4.5566e-01,
  2268. -3.8029e-02, 1.1057e+00, 3.4780e-01],
  2269. [ 5.2748e-01, -4.3957e-01, 1.5543e+00, -2.8408e-01, -5.3649e-01,
  2270. -1.8430e-01, 1.2208e-01, 3.2654e-01],
  2271. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  2272. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  2273. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  2274. 5.4350e-02, 4.9700e-01, 4.6189e-04]]], device='cuda:0')
  2275. loss_train_step before backward: tensor(0.2217, device='cuda:0', grad_fn=<MseLossBackward>)
  2276. loss_train_step after backward: tensor(0.2217, device='cuda:0', grad_fn=<MseLossBackward>)
  2277. loss_train: 6.249815843999386
  2278. step: 43
  2279. running loss: 0.14534455451161363
  2280. Train Steps: 43/90 Loss: 0.1453 torch.Size([8, 600, 800])
  2281. torch.Size([8, 8])
  2282. tensor([[0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  2283. [0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  2284. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  2285. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  2286. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  2287. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  2288. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  2289. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967]],
  2290. device='cuda:0', dtype=torch.float64)
  2291. predictions are: tensor([[ 0.7581, -0.3525, 1.8243, -0.3983, -0.3701, -0.6395, 0.5296, 0.1889],
  2292. [ 0.8480, -0.2333, 1.9051, -0.0124, -0.4633, -0.0062, 0.5412, 0.1463],
  2293. [ 0.8636, -0.2277, 1.8561, -0.0840, -0.4672, -0.1841, 0.4694, 0.1467],
  2294. [ 0.4291, -0.4614, 1.0137, -1.4131, -0.4086, -1.3380, 0.3718, 0.2872],
  2295. [ 0.6720, -0.2897, 1.6456, -0.1900, -0.3317, -0.2876, 0.4857, 0.1960],
  2296. [ 0.3500, -0.5126, 0.9928, -1.5114, -0.3518, -1.4417, 0.4003, 0.3029],
  2297. [ 0.3663, -0.4884, 1.2399, -1.2750, -0.2920, -1.2833, 0.4599, 0.3037],
  2298. [ 0.7835, -0.2698, 1.8654, 0.0564, -0.3705, 0.0656, 0.5092, 0.1624]],
  2299. device='cuda:0', grad_fn=<AddmmBackward>)
  2300. landmarks are: tensor([[[ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  2301. 0.1005],
  2302. [ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  2303. 0.5085],
  2304. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  2305. 0.1159],
  2306. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  2307. 0.4019],
  2308. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  2309. 0.2997],
  2310. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  2311. 0.2930],
  2312. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  2313. 0.3007],
  2314. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  2315. 0.4701]]], device='cuda:0')
  2316. loss_train_step before backward: tensor(0.5159, device='cuda:0', grad_fn=<MseLossBackward>)
  2317. loss_train_step after backward: tensor(0.5159, device='cuda:0', grad_fn=<MseLossBackward>)
  2318.  
  2319. loss_train: 6.765694998204708
  2320. step: 44
  2321. running loss: 0.15376579541374336
  2322. Train Steps: 44/90 Loss: 0.1538 torch.Size([8, 600, 800])
  2323. torch.Size([8, 8])
  2324. tensor([[0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  2325. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  2326. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  2327. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  2328. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  2329. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  2330. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  2331. [0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637]],
  2332. device='cuda:0', dtype=torch.float64)
  2333. predictions are: tensor([[ 0.5681, -0.3922, 1.6770, -0.3190, -0.3526, -0.5051, 0.4730, 0.1606],
  2334. [ 0.6769, -0.3203, 1.6853, -0.1504, -0.4270, -0.2334, 0.4160, 0.1653],
  2335. [ 0.4975, -0.4291, 1.5476, -0.6745, -0.3673, -0.7478, 0.4353, 0.2326],
  2336. [ 0.7256, -0.3172, 1.7803, -0.0423, -0.4017, -0.0852, 0.4411, 0.1329],
  2337. [ 0.7370, -0.3005, 1.8452, -0.0926, -0.4353, -0.1475, 0.4734, 0.1246],
  2338. [ 0.3213, -0.5524, 1.2729, -1.2532, -0.2965, -1.3091, 0.4605, 0.2714],
  2339. [ 0.2930, -0.5338, 1.3079, -1.0069, -0.2362, -0.9552, 0.4142, 0.2860],
  2340. [ 0.5536, -0.4193, 1.4912, -0.7955, -0.4314, -0.8450, 0.4179, 0.2130]],
  2341. device='cuda:0', grad_fn=<AddmmBackward>)
  2342. landmarks are: tensor([[[ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  2343. 0.3692],
  2344. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  2345. 0.2391],
  2346. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  2347. 0.3238],
  2348. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  2349. 0.0711],
  2350. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  2351. 0.1775],
  2352. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  2353. 0.2032],
  2354. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  2355. 0.5882],
  2356. [ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  2357. 0.3177]]], device='cuda:0')
  2358. loss_train_step before backward: tensor(0.0398, device='cuda:0', grad_fn=<MseLossBackward>)
  2359. loss_train_step after backward: tensor(0.0398, device='cuda:0', grad_fn=<MseLossBackward>)
  2360. loss_train: 6.80553362518549
  2361. step: 45
  2362. running loss: 0.15123408055967755
  2363. Train Steps: 45/90 Loss: 0.1512 torch.Size([8, 600, 800])
  2364. torch.Size([8, 8])
  2365. tensor([[0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  2366. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  2367. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  2368. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  2369. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  2370. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  2371. [0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533],
  2372. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646]],
  2373. device='cuda:0', dtype=torch.float64)
  2374. predictions are: tensor([[ 0.3271, -0.5318, 1.5833, -0.6055, -0.2818, -0.7147, 0.4776, 0.2189],
  2375. [ 0.6006, -0.3905, 1.7411, -0.1581, -0.3956, -0.1973, 0.4302, 0.1447],
  2376. [ 0.3604, -0.5165, 1.4272, -0.8646, -0.3821, -0.9327, 0.3752, 0.2403],
  2377. [ 0.1835, -0.6378, 1.4985, -1.1170, -0.1787, -1.2397, 0.5342, 0.2482],
  2378. [ 0.6568, -0.3744, 1.8330, -0.0872, -0.4559, -0.2435, 0.4343, 0.1183],
  2379. [ 0.5622, -0.3841, 1.6823, -0.1538, -0.3768, -0.2230, 0.3884, 0.1781],
  2380. [ 0.6354, -0.3549, 1.7240, -0.0143, -0.4266, -0.0859, 0.4077, 0.1498],
  2381. [ 0.3661, -0.5067, 1.3478, -0.9482, -0.4265, -0.9791, 0.3621, 0.2470]],
  2382. device='cuda:0', grad_fn=<AddmmBackward>)
  2383. landmarks are: tensor([[[ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  2384. 0.5822],
  2385. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  2386. 0.3546],
  2387. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  2388. 0.3928],
  2389. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  2390. 0.0051],
  2391. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  2392. 0.1854],
  2393. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  2394. 0.0851],
  2395. [ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  2396. 0.2699],
  2397. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  2398. 0.3220]]], device='cuda:0')
  2399. loss_train_step before backward: tensor(0.0359, device='cuda:0', grad_fn=<MseLossBackward>)
  2400. loss_train_step after backward: tensor(0.0359, device='cuda:0', grad_fn=<MseLossBackward>)
  2401. loss_train: 6.841406472027302
  2402. step: 46
  2403. running loss: 0.14872622765276744
  2404. Train Steps: 46/90 Loss: 0.1487 torch.Size([8, 600, 800])
  2405. torch.Size([8, 8])
  2406. tensor([[0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  2407. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  2408. [0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637],
  2409. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  2410. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  2411. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  2412. [0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  2413. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748]],
  2414. device='cuda:0', dtype=torch.float64)
  2415. predictions are: tensor([[ 0.3840, -0.5315, 1.8182, -0.2895, -0.2842, -0.6059, 0.4778, 0.1746],
  2416. [ 0.5873, -0.3852, 1.7610, 0.0130, -0.4095, -0.0445, 0.3412, 0.1994],
  2417. [ 0.4079, -0.5127, 1.5575, -0.6584, -0.4286, -0.7907, 0.3493, 0.2210],
  2418. [ 0.1248, -0.6520, 1.2992, -1.0770, -0.2927, -1.1115, 0.3463, 0.2811],
  2419. [ 0.5570, -0.4181, 1.8028, -0.0158, -0.3737, -0.1759, 0.3713, 0.1611],
  2420. [ 0.3128, -0.5459, 1.2268, -0.9812, -0.4740, -0.9341, 0.2947, 0.2475],
  2421. [ 0.6236, -0.3824, 1.7676, 0.0590, -0.4433, -0.0679, 0.3503, 0.1704],
  2422. [ 0.3081, -0.5636, 1.7776, -0.4745, -0.2314, -0.7536, 0.5243, 0.2039]],
  2423. device='cuda:0', grad_fn=<AddmmBackward>)
  2424. landmarks are: tensor([[[ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  2425. 0.3692],
  2426. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  2427. 0.3084],
  2428. [ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  2429. 0.3177],
  2430. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  2431. 0.3777],
  2432. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  2433. 0.1854],
  2434. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  2435. 0.0442],
  2436. [ 0.6010, -0.4321, 1.6517, 0.2160, -0.4210, 0.0774, 0.6356,
  2437. 0.0313],
  2438. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  2439. 0.3692]]], device='cuda:0')
  2440. loss_train_step before backward: tensor(0.1665, device='cuda:0', grad_fn=<MseLossBackward>)
  2441. loss_train_step after backward: tensor(0.1665, device='cuda:0', grad_fn=<MseLossBackward>)
  2442. loss_train: 7.0079174265265465
  2443. step: 47
  2444. running loss: 0.1491046260963095
  2445. Train Steps: 47/90 Loss: 0.1491 torch.Size([8, 600, 800])
  2446. torch.Size([8, 8])
  2447. tensor([[ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  2448. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  2449. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  2450. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  2451. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  2452. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  2453. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  2454. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217]],
  2455. device='cuda:0', dtype=torch.float64)
  2456. predictions are: tensor([[ 0.0535, -0.7069, 1.2344, -0.9993, -0.3315, -1.0784, 0.2902, 0.2823],
  2457. [ 0.2657, -0.5997, 1.6602, -0.5471, -0.2962, -0.7206, 0.4205, 0.2333],
  2458. [ 0.3856, -0.5336, 1.8462, -0.1078, -0.3412, -0.3655, 0.4130, 0.2259],
  2459. [ 0.3312, -0.5656, 1.4524, -0.7236, -0.4373, -0.8358, 0.3779, 0.2153],
  2460. [-0.0348, -0.7601, 1.2570, -1.0044, -0.2545, -1.0930, 0.3087, 0.3088],
  2461. [ 0.5419, -0.4685, 2.0130, 0.1167, -0.3741, -0.3086, 0.4475, 0.1471],
  2462. [ 0.8008, -0.2977, 1.9959, 0.6074, -0.5156, 0.4412, 0.3769, 0.1513],
  2463. [ 0.2861, -0.5947, 1.3415, -0.6672, -0.4133, -0.7388, 0.2971, 0.2424]],
  2464. device='cuda:0', grad_fn=<AddmmBackward>)
  2465. landmarks are: tensor([[[-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  2466. 0.3084],
  2467. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  2468. 0.3392],
  2469. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  2470. 0.3928],
  2471. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  2472. 0.2043],
  2473. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  2474. 0.3238],
  2475. [ 0.6116, -0.3898, 1.8654, -0.1997, -0.4788, -1.1081, 0.4367,
  2476. -0.0637],
  2477. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  2478. 0.1715],
  2479. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  2480. 0.5855]]], device='cuda:0')
  2481. loss_train_step before backward: tensor(0.3112, device='cuda:0', grad_fn=<MseLossBackward>)
  2482.  
  2483. loss_train_step after backward: tensor(0.3112, device='cuda:0', grad_fn=<MseLossBackward>)
  2484. loss_train: 7.319082103669643
  2485. step: 48
  2486. running loss: 0.15248087715978423
  2487. Train Steps: 48/90 Loss: 0.1525 torch.Size([8, 600, 800])
  2488. torch.Size([8, 8])
  2489. tensor([[0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  2490. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  2491. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  2492. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  2493. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  2494. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  2495. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  2496. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250]],
  2497. device='cuda:0', dtype=torch.float64)
  2498. predictions are: tensor([[ 0.2065, -0.6275, 1.5711, -0.3425, -0.3605, -0.5036, 0.3276, 0.2431],
  2499. [ 0.3137, -0.5515, 1.6447, -0.2573, -0.4272, -0.3420, 0.3673, 0.2457],
  2500. [ 0.3199, -0.6279, 1.8709, -0.2268, -0.3714, -0.7510, 0.4436, 0.2008],
  2501. [ 0.3236, -0.5680, 1.6676, -0.1668, -0.4192, -0.4400, 0.3268, 0.2124],
  2502. [ 0.1441, -0.6837, 1.2961, -0.8674, -0.4645, -0.9738, 0.2507, 0.2833],
  2503. [ 0.4580, -0.5463, 1.8016, -0.0027, -0.4537, -0.3965, 0.3903, 0.1912],
  2504. [ 0.2008, -0.6386, 1.6768, -0.3726, -0.3226, -0.5094, 0.3750, 0.2283],
  2505. [ 0.3267, -0.5803, 1.8235, -0.1224, -0.3388, -0.3754, 0.4049, 0.2350]],
  2506. device='cuda:0', grad_fn=<AddmmBackward>)
  2507. landmarks are: tensor([[[ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  2508. 0.1530],
  2509. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  2510. 0.1004],
  2511. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  2512. -0.0957],
  2513. [ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  2514. 0.1447],
  2515. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  2516. 0.3198],
  2517. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  2518. 0.0291],
  2519. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  2520. 0.2699],
  2521. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  2522. 0.1390]]], device='cuda:0')
  2523. loss_train_step before backward: tensor(0.0701, device='cuda:0', grad_fn=<MseLossBackward>)
  2524. loss_train_step after backward: tensor(0.0701, device='cuda:0', grad_fn=<MseLossBackward>)
  2525. loss_train: 7.389189012348652
  2526. step: 49
  2527. running loss: 0.1507997757622174
  2528. Train Steps: 49/90 Loss: 0.1508 torch.Size([8, 600, 800])
  2529. torch.Size([8, 8])
  2530. tensor([[0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  2531. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  2532. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  2533. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  2534. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  2535. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  2536. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  2537. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200]],
  2538. device='cuda:0', dtype=torch.float64)
  2539. predictions are: tensor([[ 0.5294, -0.4750, 1.7715, 0.1190, -0.5351, -0.1170, 0.4085, 0.2083],
  2540. [-0.0845, -0.8747, 1.6868, -0.7018, -0.2010, -1.1213, 0.4768, 0.2605],
  2541. [ 0.0189, -0.7988, 1.2685, -0.9018, -0.4537, -1.1003, 0.2813, 0.2620],
  2542. [ 0.4374, -0.4821, 1.6311, -0.0043, -0.5430, -0.1109, 0.3076, 0.2101],
  2543. [ 0.3483, -0.5449, 1.8120, 0.2408, -0.3022, 0.0264, 0.3682, 0.2554],
  2544. [ 0.4092, -0.5825, 1.6334, -0.1759, -0.5376, -0.3951, 0.3223, 0.2299],
  2545. [ 0.3080, -0.5890, 1.4904, -0.3696, -0.5447, -0.5251, 0.2846, 0.2454],
  2546. [-0.0895, -0.8739, 1.7312, -0.6509, -0.1901, -1.0867, 0.4873, 0.2669]],
  2547. device='cuda:0', grad_fn=<AddmmBackward>)
  2548. landmarks are: tensor([[[ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  2549. -0.0670],
  2550. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  2551. 0.1467],
  2552. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  2553. -0.0108],
  2554. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  2555. 0.0081],
  2556. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  2557. 0.2083],
  2558. [ 0.5783, -0.4216, 1.6847, -0.5078, -0.6732, -0.5377, 0.4752,
  2559. 0.0839],
  2560. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  2561. 0.0021],
  2562. [ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  2563. 0.1159]]], device='cuda:0')
  2564. loss_train_step before backward: tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward>)
  2565. loss_train_step after backward: tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward>)
  2566. loss_train: 7.446262441575527
  2567. step: 50
  2568. running loss: 0.14892524883151054
  2569. Train Steps: 50/90 Loss: 0.1489 torch.Size([8, 600, 800])
  2570. torch.Size([8, 8])
  2571. tensor([[0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  2572. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  2573. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  2574. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  2575. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  2576. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  2577. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  2578. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136]],
  2579. device='cuda:0', dtype=torch.float64)
  2580. predictions are: tensor([[-0.1917, -0.8912, 1.1326, -1.0317, -0.4090, -1.2113, 0.2342, 0.2647],
  2581. [ 0.1447, -0.7247, 1.6322, -0.4428, -0.4324, -0.7945, 0.3599, 0.2245],
  2582. [ 0.3594, -0.6005, 1.9348, -0.0460, -0.4138, -0.4227, 0.5189, 0.1961],
  2583. [ 0.1087, -0.7685, 1.8399, -0.3096, -0.2694, -0.7375, 0.5243, 0.2236],
  2584. [-0.2596, -0.9368, 1.3766, -0.8925, -0.2801, -1.1774, 0.3548, 0.2806],
  2585. [ 0.7107, -0.3776, 1.8623, 0.5153, -0.5687, 0.2528, 0.3826, 0.1827],
  2586. [ 0.5197, -0.4508, 1.6900, 0.1712, -0.5216, 0.0608, 0.3766, 0.1881],
  2587. [ 0.3376, -0.5243, 1.4465, -0.2484, -0.5582, -0.1278, 0.3285, 0.2552]],
  2588. device='cuda:0', grad_fn=<AddmmBackward>)
  2589. landmarks are: tensor([[[ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  2590. 0.2699],
  2591. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  2592. 0.1005],
  2593. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  2594. 0.1544],
  2595. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  2596. 0.1082],
  2597. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  2598. 0.1698],
  2599. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  2600. 0.1608],
  2601. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  2602. 0.1608],
  2603. [ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  2604. 0.0862]]], device='cuda:0')
  2605. loss_train_step before backward: tensor(0.0788, device='cuda:0', grad_fn=<MseLossBackward>)
  2606. loss_train_step after backward: tensor(0.0788, device='cuda:0', grad_fn=<MseLossBackward>)
  2607. loss_train: 7.525062687695026
  2608. step: 51
  2609. running loss: 0.14755024877833386
  2610. Train Steps: 51/90 Loss: 0.1476 torch.Size([8, 600, 800])
  2611. torch.Size([8, 8])
  2612. tensor([[0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  2613. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  2614. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  2615. [0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637],
  2616. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  2617. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  2618. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  2619. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817]],
  2620. device='cuda:0', dtype=torch.float64)
  2621. predictions are: tensor([[ 0.3924, -0.5213, 1.6944, 0.0514, -0.4727, -0.0790, 0.4196, 0.1729],
  2622. [ 0.0863, -0.7315, 1.6527, -0.4401, -0.4479, -0.7708, 0.4044, 0.2342],
  2623. [ 0.5413, -0.4434, 1.6979, 0.2409, -0.5767, 0.0799, 0.3926, 0.2002],
  2624. [ 0.1163, -0.7415, 1.5643, -0.5669, -0.5108, -0.8526, 0.3755, 0.2119],
  2625. [ 0.3633, -0.6097, 1.8357, -0.0659, -0.4941, -0.4124, 0.4238, 0.1571],
  2626. [-0.2876, -0.9784, 1.4261, -0.9724, -0.2718, -1.3018, 0.4072, 0.2629],
  2627. [ 0.2977, -0.5920, 1.6902, -0.0351, -0.3639, -0.1044, 0.4685, 0.2399],
  2628. [ 0.3709, -0.5620, 1.5785, -0.3152, -0.6058, -0.4485, 0.4069, 0.1557]],
  2629. device='cuda:0', grad_fn=<AddmmBackward>)
  2630. landmarks are: tensor([[[ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  2631. 0.0390],
  2632. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  2633. 0.3238],
  2634. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  2635. 0.5316],
  2636. [ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  2637. 0.3177],
  2638. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  2639. 0.0774],
  2640. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  2641. 0.2549],
  2642. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  2643. 0.4316],
  2644. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  2645. -0.0611]]], device='cuda:0')
  2646. loss_train_step before backward: tensor(0.0449, device='cuda:0', grad_fn=<MseLossBackward>)
  2647.  
  2648. loss_train_step after backward: tensor(0.0449, device='cuda:0', grad_fn=<MseLossBackward>)
  2649. loss_train: 7.569976683706045
  2650. step: 52
  2651. running loss: 0.14557647468665472
  2652. Train Steps: 52/90 Loss: 0.1456 torch.Size([8, 600, 800])
  2653. torch.Size([8, 8])
  2654. tensor([[0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  2655. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  2656. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  2657. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  2658. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  2659. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  2660. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  2661. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533]],
  2662. device='cuda:0', dtype=torch.float64)
  2663. predictions are: tensor([[ 0.0673, -0.7542, 1.7669, -0.3813, -0.2630, -0.6866, 0.5843, 0.1976],
  2664. [ 0.8705, -0.3015, 2.0107, 0.5344, -0.6006, 0.4336, 0.6015, 0.1237],
  2665. [-0.2974, -0.9372, 1.2530, -0.8868, -0.3178, -1.0227, 0.3237, 0.2703],
  2666. [ 0.3326, -0.5938, 1.5830, -0.2542, -0.5651, -0.4246, 0.3844, 0.1999],
  2667. [ 0.6440, -0.4098, 1.8351, 0.1432, -0.6327, -0.0068, 0.4699, 0.1745],
  2668. [ 0.0210, -0.7968, 1.5529, -0.6347, -0.3618, -0.9225, 0.4992, 0.1978],
  2669. [ 0.2055, -0.6765, 1.3400, -0.6754, -0.5636, -0.7407, 0.3770, 0.1858],
  2670. [ 0.1917, -0.6800, 1.3017, -0.6446, -0.5512, -0.7384, 0.3369, 0.1998]],
  2671. device='cuda:0', grad_fn=<AddmmBackward>)
  2672. landmarks are: tensor([[[ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  2673. 0.1501],
  2674. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  2675. 0.0774],
  2676. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  2677. 0.3238],
  2678. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  2679. 0.3220],
  2680. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  2681. 0.4348],
  2682. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  2683. 0.1467],
  2684. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  2685. -0.0108],
  2686. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  2687. 0.2699]]], device='cuda:0')
  2688. loss_train_step before backward: tensor(0.1982, device='cuda:0', grad_fn=<MseLossBackward>)
  2689. loss_train_step after backward: tensor(0.1982, device='cuda:0', grad_fn=<MseLossBackward>)
  2690. loss_train: 7.7682068310678005
  2691. step: 53
  2692. running loss: 0.14656994020882644
  2693. Train Steps: 53/90 Loss: 0.1466 torch.Size([8, 600, 800])
  2694. torch.Size([8, 8])
  2695. tensor([[0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  2696. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  2697. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  2698. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  2699. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  2700. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  2701. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  2702. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117]],
  2703. device='cuda:0', dtype=torch.float64)
  2704. predictions are: tensor([[-0.2143, -0.9404, 1.4668, -1.0647, -0.3230, -1.3438, 0.4597, 0.2239],
  2705. [-0.2777, -0.9847, 1.5412, -1.0364, -0.2318, -1.3185, 0.5605, 0.2012],
  2706. [ 0.6630, -0.3745, 1.6541, 0.1284, -0.6696, 0.0945, 0.4320, 0.1933],
  2707. [ 0.3220, -0.5820, 1.6807, -0.1678, -0.4297, -0.2776, 0.4604, 0.1703],
  2708. [ 0.7033, -0.3861, 1.6634, 0.0126, -0.7016, -0.1221, 0.5019, 0.1436],
  2709. [ 0.5057, -0.4786, 1.6570, -0.0877, -0.5653, -0.0970, 0.4212, 0.2048],
  2710. [ 0.2947, -0.5987, 1.6497, -0.2465, -0.4861, -0.4751, 0.4378, 0.1929],
  2711. [ 0.5106, -0.4723, 1.6720, -0.1766, -0.6225, -0.1774, 0.5021, 0.1598]],
  2712. device='cuda:0', grad_fn=<AddmmBackward>)
  2713. landmarks are: tensor([[[ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  2714. 0.2083],
  2715. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  2716. 0.3371],
  2717. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  2718. 0.5316],
  2719. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  2720. 0.0532],
  2721. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  2722. -0.1278],
  2723. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  2724. 0.3084],
  2725. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  2726. 0.5762],
  2727. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  2728. 0.0774]]], device='cuda:0')
  2729. loss_train_step before backward: tensor(0.1455, device='cuda:0', grad_fn=<MseLossBackward>)
  2730. loss_train_step after backward: tensor(0.1455, device='cuda:0', grad_fn=<MseLossBackward>)
  2731. loss_train: 7.913748513907194
  2732. step: 54
  2733. running loss: 0.14655089840568877
  2734. Train Steps: 54/90 Loss: 0.1466 torch.Size([8, 600, 800])
  2735. torch.Size([8, 8])
  2736. tensor([[0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  2737. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  2738. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  2739. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  2740. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  2741. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  2742. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  2743. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350]],
  2744. device='cuda:0', dtype=torch.float64)
  2745. predictions are: tensor([[ 0.5348, -0.4461, 1.6849, -0.0344, -0.5152, 0.0100, 0.5367, 0.1942],
  2746. [-0.2356, -0.9501, 1.0968, -1.2913, -0.4973, -1.4036, 0.2616, 0.2211],
  2747. [ 0.3467, -0.5774, 1.6509, -0.2637, -0.4446, -0.3173, 0.4580, 0.2147],
  2748. [ 0.2504, -0.6009, 1.6104, -0.3901, -0.4216, -0.3745, 0.5047, 0.1924],
  2749. [ 0.2240, -0.6485, 1.7115, -0.4295, -0.3777, -0.5357, 0.5990, 0.1783],
  2750. [ 0.5265, -0.4631, 1.7272, -0.2212, -0.6034, -0.4052, 0.5230, 0.1763],
  2751. [ 0.4698, -0.5562, 1.8330, -0.1877, -0.5408, -0.6042, 0.5758, 0.1269],
  2752. [ 0.5352, -0.5074, 1.7070, -0.1354, -0.5545, -0.2338, 0.4854, 0.1544]],
  2753. device='cuda:0', grad_fn=<AddmmBackward>)
  2754. landmarks are: tensor([[[ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  2755. 0.1661],
  2756. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  2757. 0.3469],
  2758. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  2759. 0.3007],
  2760. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  2761. 0.2853],
  2762. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  2763. 0.2776],
  2764. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  2765. 0.3777],
  2766. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  2767. 0.0081],
  2768. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  2769. 0.1854]]], device='cuda:0')
  2770. loss_train_step before backward: tensor(0.1391, device='cuda:0', grad_fn=<MseLossBackward>)
  2771. loss_train_step after backward: tensor(0.1391, device='cuda:0', grad_fn=<MseLossBackward>)
  2772. loss_train: 8.052847858518362
  2773. step: 55
  2774. running loss: 0.14641541560942475
  2775. Train Steps: 55/90 Loss: 0.1464 torch.Size([8, 600, 800])
  2776. torch.Size([8, 8])
  2777. tensor([[0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  2778. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  2779. [0.6087, 0.3951, 0.8387, 0.5833, 0.4188, 0.4933, 0.5146, 0.4830],
  2780. [0.6182, 0.3930, 0.8841, 0.3892, 0.3556, 0.4967, 0.6222, 0.5279],
  2781. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  2782. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  2783. [0.6260, 0.4120, 0.8013, 0.2350, 0.4888, 0.1533, 0.6281, 0.4895],
  2784. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917]],
  2785. device='cuda:0', dtype=torch.float64)
  2786. predictions are: tensor([[ 0.5108, -0.4988, 1.8392, -0.1524, -0.4782, -0.4393, 0.6054, 0.1707],
  2787. [-0.1989, -0.8882, 1.1078, -1.1526, -0.4256, -1.1660, 0.2669, 0.2613],
  2788. [ 0.6571, -0.3982, 1.7409, 0.0728, -0.5547, -0.0445, 0.5122, 0.1667],
  2789. [ 0.5398, -0.4333, 1.5151, -0.3352, -0.6108, -0.1219, 0.4888, 0.1776],
  2790. [ 0.8204, -0.2803, 1.7220, 0.1719, -0.6168, 0.2006, 0.5326, 0.1883],
  2791. [-0.0578, -0.8517, 1.5819, -0.9280, -0.2828, -1.1182, 0.6220, 0.1895],
  2792. [-0.1826, -0.9124, 1.3633, -1.1262, -0.3392, -1.3109, 0.4546, 0.1922],
  2793. [ 0.6652, -0.3629, 1.7669, 0.1831, -0.4866, 0.0789, 0.5693, 0.1919]],
  2794. device='cuda:0', grad_fn=<AddmmBackward>)
  2795. landmarks are: tensor([[[ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  2796. 0.1661],
  2797. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  2798. 0.3931],
  2799. [ 0.5258, -0.4610, 1.5882, 0.4085, -0.3517, -0.0072, 0.0910,
  2800. -0.0550],
  2801. [ 0.5697, -0.4706, 1.7976, -0.4884, -0.6433, 0.0081, 0.5878,
  2802. 0.1525],
  2803. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  2804. 0.3161],
  2805. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  2806. 0.2944],
  2807. [ 0.6053, -0.3830, 1.4150, -1.2005, -0.0284, -1.5777, 0.6154,
  2808. -0.0250],
  2809. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  2810. 0.4470]]], device='cuda:0')
  2811. loss_train_step before backward: tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward>)
  2812. loss_train_step after backward: tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward>)
  2813. loss_train: 8.11908669397235
  2814. step: 56
  2815. running loss: 0.14498369096379196
  2816.  
  2817. Train Steps: 56/90 Loss: 0.1450 torch.Size([8, 600, 800])
  2818. torch.Size([8, 8])
  2819. tensor([[0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  2820. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  2821. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  2822. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  2823. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  2824. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  2825. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  2826. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123]],
  2827. device='cuda:0', dtype=torch.float64)
  2828. predictions are: tensor([[ 0.4652, -0.4927, 1.4310, -0.5926, -0.5860, -0.4583, 0.4855, 0.1917],
  2829. [ 0.0168, -0.8016, 1.7405, -0.7322, -0.1639, -0.9592, 0.7691, 0.1852],
  2830. [ 0.9244, -0.2048, 1.9678, 0.4568, -0.4284, 0.4085, 0.6313, 0.1853],
  2831. [ 0.0860, -0.7330, 1.3060, -0.8993, -0.4453, -0.9782, 0.3544, 0.1966],
  2832. [ 0.0321, -0.7831, 1.3198, -0.9540, -0.4452, -1.0702, 0.3742, 0.1955],
  2833. [-0.0107, -0.7694, 1.3218, -0.8850, -0.4071, -0.9168, 0.3962, 0.2506],
  2834. [ 1.1011, -0.1720, 2.0850, 0.4680, -0.5672, 0.4022, 0.6618, 0.1479],
  2835. [ 0.2294, -0.6558, 1.3344, -0.7895, -0.5082, -0.8425, 0.4000, 0.1940]],
  2836. device='cuda:0', grad_fn=<AddmmBackward>)
  2837. landmarks are: tensor([[[ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  2838. 0.2237],
  2839. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  2840. 0.3050],
  2841. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  2842. 0.2431],
  2843. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  2844. 0.2906],
  2845. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  2846. -0.0580],
  2847. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  2848. 0.2622],
  2849. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  2850. 0.1525],
  2851. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  2852. 0.0802]]], device='cuda:0')
  2853. loss_train_step before backward: tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward>)
  2854. loss_train_step after backward: tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward>)
  2855. loss_train: 8.212458346039057
  2856. step: 57
  2857. running loss: 0.14407821659717643
  2858. Train Steps: 57/90 Loss: 0.1441 torch.Size([8, 600, 800])
  2859. torch.Size([8, 8])
  2860. tensor([[0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  2861. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  2862. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  2863. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  2864. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  2865. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  2866. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  2867. [ nan, nan, 0.8850, 0.2817, 0.5112, 0.2183, 0.7184, 0.5436]],
  2868. device='cuda:0', dtype=torch.float64)
  2869. predictions are: tensor([[ 0.1649, -0.7242, 1.5017, -0.9635, -0.3496, -1.1003, 0.5266, 0.1752],
  2870. [ 0.5651, -0.4185, 1.4566, -0.3872, -0.5721, -0.2852, 0.4112, 0.2345],
  2871. [ 0.9952, -0.1645, 1.9069, 0.4831, -0.4560, 0.3968, 0.5863, 0.1960],
  2872. [ 0.6640, -0.3472, 1.5984, -0.2779, -0.5041, -0.0886, 0.5670, 0.2048],
  2873. [ 0.1283, -0.7124, 1.3394, -0.9232, -0.3711, -1.0119, 0.4405, 0.2160],
  2874. [ 0.1406, -0.7053, 1.3067, -0.9091, -0.4227, -0.9925, 0.3371, 0.2296],
  2875. [ 0.6080, -0.4196, 1.5368, -0.4087, -0.5550, -0.3284, 0.4938, 0.1815],
  2876. [ 0.0596, -0.7789, 1.7898, -0.7913, -0.1113, -1.0448, 0.7324, 0.1776]],
  2877. device='cuda:0', grad_fn=<AddmmBackward>)
  2878. landmarks are: tensor([[[ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  2879. -0.0583],
  2880. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  2881. 0.4036],
  2882. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  2883. 0.1698],
  2884. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  2885. 0.1554],
  2886. [ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  2887. 0.1852],
  2888. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  2889. 0.3392],
  2890. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  2891. 0.2006],
  2892. [-2.2859, -2.2859, 1.8018, -0.9849, 0.0755, -1.2774, 1.0326,
  2893. 0.2249]]], device='cuda:0')
  2894. loss_train_step before backward: tensor(0.1737, device='cuda:0', grad_fn=<MseLossBackward>)
  2895. loss_train_step after backward: tensor(0.1737, device='cuda:0', grad_fn=<MseLossBackward>)
  2896. loss_train: 8.38615109398961
  2897. step: 58
  2898. running loss: 0.14458881196533813
  2899. Train Steps: 58/90 Loss: 0.1446 torch.Size([8, 600, 800])
  2900. torch.Size([8, 8])
  2901. tensor([[0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  2902. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  2903. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  2904. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  2905. [0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  2906. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  2907. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  2908. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742]],
  2909. device='cuda:0', dtype=torch.float64)
  2910. predictions are: tensor([[ 0.7843, -0.2825, 1.5981, -0.0211, -0.4891, -0.0875, 0.5092, 0.2230],
  2911. [ 0.2781, -0.6108, 1.5591, -0.6938, -0.3728, -0.8706, 0.4629, 0.2388],
  2912. [ 0.5331, -0.3995, 1.5068, -0.4493, -0.4661, -0.2366, 0.5199, 0.2029],
  2913. [ 0.6395, -0.3974, 1.7493, -0.2473, -0.3899, -0.2536, 0.5395, 0.1864],
  2914. [ 0.3610, -0.5704, 1.4294, -0.7834, -0.4042, -0.8035, 0.5313, 0.1834],
  2915. [ 0.3174, -0.6453, 1.6677, -0.7387, -0.2951, -0.9430, 0.5775, 0.1927],
  2916. [ 0.4922, -0.4571, 1.6685, -0.2111, -0.2608, -0.2328, 0.5452, 0.2422],
  2917. [ 0.2434, -0.6341, 1.4036, -0.9700, -0.3803, -1.0104, 0.5442, 0.1745]],
  2918. device='cuda:0', grad_fn=<AddmmBackward>)
  2919. landmarks are: tensor([[[ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  2920. 0.4778],
  2921. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  2922. 0.3238],
  2923. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  2924. 0.0985],
  2925. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  2926. 0.1775],
  2927. [ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  2928. 0.0539],
  2929. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  2930. 0.2442],
  2931. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  2932. 0.1146],
  2933. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  2934. -0.0957]]], device='cuda:0')
  2935. loss_train_step before backward: tensor(0.0448, device='cuda:0', grad_fn=<MseLossBackward>)
  2936. loss_train_step after backward: tensor(0.0448, device='cuda:0', grad_fn=<MseLossBackward>)
  2937. loss_train: 8.43092280998826
  2938. step: 59
  2939. running loss: 0.14289699677946205
  2940. Train Steps: 59/90 Loss: 0.1429 torch.Size([8, 600, 800])
  2941. torch.Size([8, 8])
  2942. tensor([[0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  2943. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  2944. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  2945. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  2946. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  2947. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  2948. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  2949. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006]],
  2950. device='cuda:0', dtype=torch.float64)
  2951. predictions are: tensor([[ 0.2818, -0.5519, 1.1398, -0.9494, -0.4569, -0.8034, 0.3754, 0.2358],
  2952. [ 0.2219, -0.6087, 1.2525, -1.0545, -0.3426, -0.9762, 0.4758, 0.1897],
  2953. [ 0.3792, -0.5581, 1.6016, -0.6791, -0.3140, -0.8254, 0.5364, 0.1975],
  2954. [ 0.9969, -0.1383, 1.8140, 0.2493, -0.3933, 0.2813, 0.6364, 0.1949],
  2955. [ 0.0079, -0.7529, 1.2589, -1.0732, -0.2950, -1.1134, 0.4069, 0.2175],
  2956. [ 0.4674, -0.4826, 1.6665, -0.6039, -0.3580, -0.7430, 0.5824, 0.1887],
  2957. [-0.0475, -0.7370, 1.3782, -0.9749, -0.1228, -1.0500, 0.4923, 0.2548],
  2958. [ 1.1495, -0.1309, 1.9559, 0.3334, -0.4791, 0.2528, 0.6781, 0.1574]],
  2959. device='cuda:0', grad_fn=<AddmmBackward>)
  2960. landmarks are: tensor([[[ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  2961. 0.3315],
  2962. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  2963. 0.1852],
  2964. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  2965. 0.1494],
  2966. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  2967. 0.1698],
  2968. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  2969. 0.2853],
  2970. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  2971. 0.2083],
  2972. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  2973. 0.4008],
  2974. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  2975. 0.0261]]], device='cuda:0')
  2976. loss_train_step before backward: tensor(0.1616, device='cuda:0', grad_fn=<MseLossBackward>)
  2977. loss_train_step after backward: tensor(0.1616, device='cuda:0', grad_fn=<MseLossBackward>)
  2978. loss_train: 8.592534977942705
  2979. step: 60
  2980. running loss: 0.14320891629904509
  2981.  
  2982. Train Steps: 60/90 Loss: 0.1432 torch.Size([8, 600, 800])
  2983. torch.Size([8, 8])
  2984. tensor([[0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  2985. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  2986. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  2987. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  2988. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  2989. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  2990. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  2991. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833]],
  2992. device='cuda:0', dtype=torch.float64)
  2993. predictions are: tensor([[ 0.2086, -0.6300, 1.3176, -1.0979, -0.3326, -1.1253, 0.5210, 0.1824],
  2994. [ 0.1186, -0.6808, 1.6586, -0.8910, -0.1042, -1.1124, 0.6969, 0.1947],
  2995. [ 0.0176, -0.7576, 1.3594, -1.1991, -0.1722, -1.2693, 0.6071, 0.1854],
  2996. [-0.0947, -0.7664, 1.0023, -1.2901, -0.3211, -1.2261, 0.3050, 0.2503],
  2997. [ 0.9525, -0.1494, 1.7418, 0.1433, -0.4784, 0.0591, 0.4824, 0.2212],
  2998. [ 0.8451, -0.1980, 1.6479, 0.0220, -0.4704, 0.0241, 0.4932, 0.2086],
  2999. [ 0.8089, -0.3003, 1.8164, -0.1682, -0.4304, -0.2600, 0.5217, 0.2167],
  3000. [ 0.7858, -0.2762, 1.6638, -0.1935, -0.4581, -0.1493, 0.5384, 0.1817]],
  3001. device='cuda:0', grad_fn=<AddmmBackward>)
  3002. landmarks are: tensor([[[ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  3003. 0.0953],
  3004. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  3005. 0.2676],
  3006. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  3007. 0.1821],
  3008. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  3009. 0.5702],
  3010. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  3011. 0.3007],
  3012. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  3013. -0.1061],
  3014. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  3015. 0.1390],
  3016. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  3017. -0.0534]]], device='cuda:0')
  3018. loss_train_step before backward: tensor(0.1915, device='cuda:0', grad_fn=<MseLossBackward>)
  3019. loss_train_step after backward: tensor(0.1915, device='cuda:0', grad_fn=<MseLossBackward>)
  3020. loss_train: 8.784059438854456
  3021. step: 61
  3022. running loss: 0.1440009744074501
  3023. Train Steps: 61/90 Loss: 0.1440 torch.Size([8, 600, 800])
  3024. torch.Size([8, 8])
  3025. tensor([[0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  3026. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  3027. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  3028. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  3029. [0.6239, 0.4206, 0.8750, 0.5400, 0.3688, 0.4850, 0.5737, 0.5700],
  3030. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  3031. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  3032. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390]],
  3033. device='cuda:0', dtype=torch.float64)
  3034. predictions are: tensor([[ 0.4254, -0.5102, 1.6345, -0.7446, -0.3703, -0.9065, 0.4836, 0.1739],
  3035. [ 0.3287, -0.5379, 1.2386, -0.9834, -0.4621, -0.9095, 0.4226, 0.2145],
  3036. [-0.0653, -0.8610, 1.5051, -1.2168, -0.0975, -1.5968, 0.5487, 0.2045],
  3037. [ 0.6743, -0.3409, 1.6672, -0.1588, -0.3592, -0.2565, 0.5132, 0.1833],
  3038. [ 0.8930, -0.2093, 1.7921, 0.0180, -0.4376, -0.1262, 0.5343, 0.2037],
  3039. [ 0.2680, -0.5955, 1.4384, -0.9249, -0.3006, -1.0350, 0.5602, 0.1513],
  3040. [ 0.6325, -0.3450, 1.5545, -0.3512, -0.4066, -0.2343, 0.5168, 0.2220],
  3041. [ 0.6448, -0.3246, 1.5906, -0.2330, -0.3459, -0.0971, 0.5405, 0.2321]],
  3042. device='cuda:0', grad_fn=<AddmmBackward>)
  3043. landmarks are: tensor([[[ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  3044. 0.0802],
  3045. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  3046. 0.1159],
  3047. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  3048. -0.0368],
  3049. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  3050. 0.0851],
  3051. [ 0.5960, -0.3430, 1.7557, 0.2083, -0.5827, -0.0457, 0.3642,
  3052. 0.3469],
  3053. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  3054. 0.1821],
  3055. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  3056. 0.1449],
  3057. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  3058. 0.2035]]], device='cuda:0')
  3059. loss_train_step before backward: tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward>)
  3060. loss_train_step after backward: tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward>)
  3061. loss_train: 8.848596323281527
  3062. step: 62
  3063. running loss: 0.14271929553679882
  3064. Train Steps: 62/90 Loss: 0.1427 torch.Size([8, 600, 800])
  3065. torch.Size([8, 8])
  3066. tensor([[0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  3067. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  3068. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  3069. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  3070. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  3071. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  3072. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  3073. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064]],
  3074. device='cuda:0', dtype=torch.float64)
  3075. predictions are: tensor([[ 6.0193e-01, -3.5355e-01, 1.4660e+00, -3.8460e-01, -4.2701e-01,
  3076. -3.7003e-01, 4.9220e-01, 2.1553e-01],
  3077. [ 6.1210e-01, -3.9221e-01, 1.6649e+00, -4.7105e-01, -4.3883e-01,
  3078. -6.3568e-01, 4.8713e-01, 1.8266e-01],
  3079. [-1.6378e-01, -8.3230e-01, 1.1472e+00, -1.3570e+00, -2.2156e-01,
  3080. -1.4473e+00, 4.2822e-01, 2.1547e-01],
  3081. [ 7.4028e-01, -3.1413e-01, 1.8390e+00, -2.3177e-01, -4.3150e-01,
  3082. -3.5873e-01, 6.1900e-01, 1.3988e-01],
  3083. [ 3.8143e-01, -5.2839e-01, 1.5582e+00, -8.0401e-01, -3.4977e-01,
  3084. -9.7758e-01, 5.2392e-01, 1.7169e-01],
  3085. [ 7.3339e-01, -3.0600e-01, 1.7870e+00, -5.2512e-02, -3.5248e-01,
  3086. -1.5096e-01, 5.9570e-01, 1.4974e-01],
  3087. [ 1.3114e-03, -7.5873e-01, 1.0977e+00, -1.2836e+00, -3.4830e-01,
  3088. -1.3368e+00, 3.7091e-01, 2.0337e-01],
  3089. [ 4.9602e-01, -4.2798e-01, 1.7384e+00, -2.2984e-01, -1.6082e-01,
  3090. -3.1048e-01, 6.1138e-01, 1.8955e-01]], device='cuda:0',
  3091. grad_fn=<AddmmBackward>)
  3092. landmarks are: tensor([[[ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  3093. 0.5071],
  3094. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  3095. 0.2116],
  3096. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  3097. 0.1343],
  3098. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  3099. 0.0467],
  3100. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  3101. 0.1005],
  3102. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  3103. 0.0159],
  3104. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  3105. 0.2071],
  3106. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  3107. 0.0532]]], device='cuda:0')
  3108. loss_train_step before backward: tensor(0.0488, device='cuda:0', grad_fn=<MseLossBackward>)
  3109. loss_train_step after backward: tensor(0.0488, device='cuda:0', grad_fn=<MseLossBackward>)
  3110. loss_train: 8.897438570857048
  3111. step: 63
  3112. running loss: 0.1412291836643976
  3113. Train Steps: 63/90 Loss: 0.1412 torch.Size([8, 600, 800])
  3114. torch.Size([8, 8])
  3115. tensor([[0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  3116. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  3117. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  3118. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  3119. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  3120. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  3121. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  3122. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400]],
  3123. device='cuda:0', dtype=torch.float64)
  3124. predictions are: tensor([[ 0.6887, -0.2958, 1.7633, -0.0927, -0.3535, -0.0904, 0.5729, 0.1684],
  3125. [-0.0433, -0.7717, 1.3271, -1.0488, -0.1998, -1.1762, 0.4160, 0.2186],
  3126. [ 0.9128, -0.2367, 1.9098, 0.0604, -0.4814, -0.3571, 0.5593, 0.1122],
  3127. [ 0.2893, -0.6126, 1.7348, -0.7418, -0.1768, -1.0713, 0.6419, 0.1588],
  3128. [ 0.4247, -0.5085, 1.3427, -0.8894, -0.4398, -0.8603, 0.4474, 0.1686],
  3129. [ 0.3004, -0.5806, 1.2293, -0.9643, -0.3975, -1.0585, 0.3702, 0.1898],
  3130. [ 0.3562, -0.5280, 1.3323, -0.9654, -0.3721, -1.0282, 0.4855, 0.1664],
  3131. [ 0.7345, -0.2874, 1.6705, -0.2287, -0.4608, -0.1024, 0.5201, 0.1640]],
  3132. device='cuda:0', grad_fn=<AddmmBackward>)
  3133. landmarks are: tensor([[[ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  3134. 0.2545],
  3135. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  3136. 0.3007],
  3137. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  3138. -0.0049],
  3139. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  3140. -0.0263],
  3141. [ 0.5477, -0.4413, 1.3688, -0.8771, -0.6115, -0.8771, 0.4104,
  3142. 0.0467],
  3143. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  3144. 0.2930],
  3145. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  3146. 0.1929],
  3147. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  3148. 0.2083]]], device='cuda:0')
  3149. loss_train_step before backward: tensor(0.1364, device='cuda:0', grad_fn=<MseLossBackward>)
  3150. loss_train_step after backward: tensor(0.1364, device='cuda:0', grad_fn=<MseLossBackward>)
  3151. loss_train: 9.033822163939476
  3152. step: 64
  3153. running loss: 0.1411534713115543
  3154.  
  3155. Train Steps: 64/90 Loss: 0.1412 torch.Size([8, 600, 800])
  3156. torch.Size([8, 8])
  3157. tensor([[0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  3158. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  3159. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  3160. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  3161. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  3162. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  3163. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  3164. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433]],
  3165. device='cuda:0', dtype=torch.float64)
  3166. predictions are: tensor([[ 0.6446, -0.3956, 1.6840, -0.4547, -0.5014, -0.7255, 0.4978, 0.1312],
  3167. [ 0.0775, -0.7255, 1.5045, -1.0049, -0.1928, -1.3421, 0.4969, 0.1804],
  3168. [ 0.5250, -0.3771, 1.4217, -0.5524, -0.4841, -0.3258, 0.4748, 0.1695],
  3169. [ 0.2667, -0.6293, 1.7410, -0.6791, -0.1763, -1.1061, 0.6038, 0.1466],
  3170. [ 0.8183, -0.2901, 1.7640, -0.0631, -0.5073, -0.2813, 0.4108, 0.1293],
  3171. [-0.0212, -0.7648, 1.1398, -1.1932, -0.3444, -1.3294, 0.3225, 0.1775],
  3172. [ 0.6146, -0.3061, 1.4930, -0.4160, -0.4981, -0.2606, 0.4851, 0.1693],
  3173. [ 0.5536, -0.3818, 1.6883, -0.1470, -0.2797, -0.1758, 0.5672, 0.1822]],
  3174. device='cuda:0', grad_fn=<AddmmBackward>)
  3175. landmarks are: tensor([[[ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  3176. -0.0310],
  3177. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  3178. -0.0368],
  3179. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  3180. 0.2083],
  3181. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  3182. 0.0171],
  3183. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  3184. 0.1159],
  3185. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  3186. 0.2183],
  3187. [ 0.6010, -0.3896, 1.7326, -0.5692, -0.6289, 0.0082, 0.5028,
  3188. 0.1005],
  3189. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  3190. 0.2237]]], device='cuda:0')
  3191. loss_train_step before backward: tensor(0.1453, device='cuda:0', grad_fn=<MseLossBackward>)
  3192. loss_train_step after backward: tensor(0.1453, device='cuda:0', grad_fn=<MseLossBackward>)
  3193. loss_train: 9.179143756628036
  3194. step: 65
  3195. running loss: 0.14121759625581595
  3196. Train Steps: 65/90 Loss: 0.1412 torch.Size([8, 600, 800])
  3197. torch.Size([8, 8])
  3198. tensor([[0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  3199. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  3200. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  3201. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  3202. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  3203. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  3204. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  3205. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517]],
  3206. device='cuda:0', dtype=torch.float64)
  3207. predictions are: tensor([[ 0.6267, -0.3419, 1.6333, -0.1439, -0.4652, -0.1813, 0.4128, 0.1475],
  3208. [ 0.4693, -0.4492, 1.6629, -0.2391, -0.3128, -0.3149, 0.4396, 0.1641],
  3209. [ 0.0783, -0.7178, 1.6822, -0.9112, -0.1434, -1.2153, 0.5995, 0.1530],
  3210. [ 0.6831, -0.3662, 1.6256, -0.3334, -0.5366, -0.4167, 0.4806, 0.1187],
  3211. [ 0.7415, -0.2970, 1.6891, -0.0164, -0.5241, -0.1477, 0.4616, 0.1052],
  3212. [ 0.2370, -0.6096, 1.6264, -0.7659, -0.3008, -1.0667, 0.4651, 0.1323],
  3213. [ 0.0431, -0.7028, 1.2359, -1.1322, -0.4204, -1.2392, 0.3013, 0.1724],
  3214. [ 0.4519, -0.4859, 1.5367, -0.7710, -0.4870, -0.8818, 0.4508, 0.1412]],
  3215. device='cuda:0', grad_fn=<AddmmBackward>)
  3216. landmarks are: tensor([[[ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  3217. 0.1176],
  3218. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  3219. 0.4171],
  3220. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  3221. 0.1554],
  3222. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  3223. 0.1768],
  3224. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  3225. -0.1331],
  3226. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  3227. 0.1929],
  3228. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  3229. 0.2699],
  3230. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  3231. 0.2622]]], device='cuda:0')
  3232. loss_train_step before backward: tensor(0.1668, device='cuda:0', grad_fn=<MseLossBackward>)
  3233. loss_train_step after backward: tensor(0.1668, device='cuda:0', grad_fn=<MseLossBackward>)
  3234. loss_train: 9.345949053764343
  3235. step: 66
  3236. running loss: 0.14160528869339914
  3237. Train Steps: 66/90 Loss: 0.1416 torch.Size([8, 600, 800])
  3238. torch.Size([8, 8])
  3239. tensor([[0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  3240. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  3241. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  3242. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  3243. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  3244. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  3245. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  3246. [0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323]],
  3247. device='cuda:0', dtype=torch.float64)
  3248. predictions are: tensor([[ 0.7712, -0.2923, 1.8211, -0.0302, -0.6109, -0.2295, 0.3809, 0.1126],
  3249. [ 0.7003, -0.3199, 1.8258, -0.0810, -0.5108, -0.0843, 0.5129, 0.1062],
  3250. [ 0.1465, -0.6928, 1.1311, -1.1692, -0.4661, -1.2716, 0.2790, 0.1480],
  3251. [ 0.6411, -0.3872, 1.7449, -0.0299, -0.4848, -0.1530, 0.3797, 0.1211],
  3252. [-0.1579, -0.8550, 1.6510, -1.0446, -0.0177, -1.3773, 0.6750, 0.1100],
  3253. [ 0.3622, -0.5523, 1.4921, -0.6718, -0.5310, -0.9092, 0.2859, 0.1646],
  3254. [ 0.6469, -0.3301, 1.7399, -0.1981, -0.4915, -0.0087, 0.5131, 0.1263],
  3255. [ 0.0991, -0.7330, 1.4066, -1.1085, -0.3121, -1.4014, 0.4390, 0.1324]],
  3256. device='cuda:0', grad_fn=<AddmmBackward>)
  3257. landmarks are: tensor([[[ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  3258. 0.3084],
  3259. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  3260. 0.2237],
  3261. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  3262. 0.2576],
  3263. [ 0.5767, -0.4396, 1.6782, 0.1905, -0.3844, 0.0308, 0.4588,
  3264. 0.0855],
  3265. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  3266. 0.3799],
  3267. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  3268. 0.4374],
  3269. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  3270. 0.1005],
  3271. [ 0.6158, -0.4225, 1.3307, -1.3253, -0.1924, -1.3252, 0.6721,
  3272. 0.1727]]], device='cuda:0')
  3273. loss_train_step before backward: tensor(0.1310, device='cuda:0', grad_fn=<MseLossBackward>)
  3274. loss_train_step after backward: tensor(0.1310, device='cuda:0', grad_fn=<MseLossBackward>)
  3275. loss_train: 9.476928368210793
  3276. step: 67
  3277. running loss: 0.14144669206284766
  3278. Train Steps: 67/90 Loss: 0.1414 torch.Size([8, 600, 800])
  3279. torch.Size([8, 8])
  3280. tensor([[0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  3281. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  3282. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  3283. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  3284. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  3285. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  3286. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  3287. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124]],
  3288. device='cuda:0', dtype=torch.float64)
  3289. predictions are: tensor([[ 0.7303, -0.2955, 1.7954, 0.1157, -0.5662, 0.0109, 0.4479, 0.1301],
  3290. [ 0.6625, -0.3700, 1.7461, -0.0592, -0.5969, -0.2779, 0.3915, 0.0902],
  3291. [ 0.3183, -0.5735, 1.6481, -0.6196, -0.5000, -0.7327, 0.3463, 0.1323],
  3292. [-0.0706, -0.8395, 1.4050, -1.1966, -0.2504, -1.4328, 0.4267, 0.1387],
  3293. [ 0.3940, -0.4962, 1.7431, -0.1674, -0.3207, -0.1481, 0.4893, 0.1618],
  3294. [ 0.3869, -0.5238, 1.6733, -0.3139, -0.4044, -0.6556, 0.4237, 0.1367],
  3295. [ 0.5155, -0.4132, 1.5255, -0.5827, -0.6067, -0.5232, 0.4523, 0.1157],
  3296. [-0.1190, -0.8626, 1.4404, -1.1726, -0.2574, -1.4463, 0.4442, 0.1302]],
  3297. device='cuda:0', grad_fn=<AddmmBackward>)
  3298. landmarks are: tensor([[[ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  3299. 0.3315],
  3300. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  3301. 0.0851],
  3302. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  3303. 0.1929],
  3304. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  3305. 0.1850],
  3306. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  3307. 0.0622],
  3308. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  3309. 0.5762],
  3310. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  3311. 0.5491],
  3312. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  3313. 0.0807]]], device='cuda:0')
  3314. loss_train_step before backward: tensor(0.0537, device='cuda:0', grad_fn=<MseLossBackward>)
  3315.  
  3316. loss_train_step after backward: tensor(0.0537, device='cuda:0', grad_fn=<MseLossBackward>)
  3317. loss_train: 9.530608255416155
  3318. step: 68
  3319. running loss: 0.14015600375611992
  3320. Train Steps: 68/90 Loss: 0.1402 torch.Size([8, 600, 800])
  3321. torch.Size([8, 8])
  3322. tensor([[0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103],
  3323. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  3324. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  3325. [0.6266, 0.4101, 0.8350, 0.2333, 0.3950, 0.2950, 0.6264, 0.4921],
  3326. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  3327. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  3328. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  3329. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483]],
  3330. device='cuda:0', dtype=torch.float64)
  3331. predictions are: tensor([[ 0.4384, -0.5000, 1.7996, -0.2838, -0.5043, -0.3255, 0.3941, 0.1576],
  3332. [ 0.7036, -0.3673, 1.8411, 0.1240, -0.5864, -0.0798, 0.4007, 0.1136],
  3333. [ 0.4413, -0.5175, 1.5479, -0.5979, -0.5562, -0.5699, 0.4458, 0.1313],
  3334. [-0.0993, -0.8470, 1.5847, -1.0225, -0.2267, -1.3204, 0.4917, 0.1482],
  3335. [ 0.3940, -0.5685, 1.9010, -0.2202, -0.3972, -0.7088, 0.4700, 0.1093],
  3336. [ 0.0720, -0.7794, 1.3627, -0.9925, -0.3594, -1.2348, 0.3514, 0.1815],
  3337. [ 0.4026, -0.5244, 1.4602, -0.7272, -0.5536, -0.7108, 0.4587, 0.1436],
  3338. [ 0.4534, -0.4552, 1.6432, -0.2746, -0.5154, -0.1603, 0.4155, 0.1531]],
  3339. device='cuda:0', grad_fn=<AddmmBackward>)
  3340. landmarks are: tensor([[[ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  3341. 0.0712],
  3342. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  3343. 0.0111],
  3344. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  3345. 0.1080],
  3346. [ 0.6081, -0.3918, 1.5709, -1.2082, -0.4614, -0.9233, 0.6072,
  3347. -0.0129],
  3348. [ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  3349. 0.1982],
  3350. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  3351. 0.2622],
  3352. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  3353. 0.1608],
  3354. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  3355. 0.2468]]], device='cuda:0')
  3356. loss_train_step before backward: tensor(0.0482, device='cuda:0', grad_fn=<MseLossBackward>)
  3357. loss_train_step after backward: tensor(0.0482, device='cuda:0', grad_fn=<MseLossBackward>)
  3358. loss_train: 9.57880049943924
  3359. step: 69
  3360. running loss: 0.13882319564404694
  3361. Train Steps: 69/90 Loss: 0.1388 torch.Size([8, 600, 800])
  3362. torch.Size([8, 8])
  3363. tensor([[0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  3364. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  3365. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  3366. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  3367. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  3368. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  3369. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  3370. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097]],
  3371. device='cuda:0', dtype=torch.float64)
  3372. predictions are: tensor([[ 0.5717, -0.4289, 1.9086, 0.0682, -0.4359, 0.2100, 0.5311, 0.1928],
  3373. [ 0.1212, -0.7306, 1.5996, -0.9908, -0.2890, -1.1521, 0.6839, 0.1284],
  3374. [-0.2105, -0.8776, 1.3527, -1.0402, -0.3279, -1.1361, 0.3717, 0.2074],
  3375. [ 0.6163, -0.3671, 1.7900, -0.0668, -0.6327, -0.2917, 0.4187, 0.1631],
  3376. [-0.0168, -0.8197, 1.1640, -1.2255, -0.4815, -1.3067, 0.3112, 0.1773],
  3377. [ 0.3989, -0.5297, 1.7450, -0.3858, -0.5510, -0.6769, 0.3761, 0.1441],
  3378. [ 0.6817, -0.3759, 1.8699, -0.0261, -0.6450, -0.3888, 0.4625, 0.0988],
  3379. [ 0.3942, -0.5177, 1.7776, -0.0976, -0.3729, -0.1446, 0.4075, 0.1746]],
  3380. device='cuda:0', grad_fn=<AddmmBackward>)
  3381. landmarks are: tensor([[[ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  3382. 0.4701],
  3383. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  3384. 0.1020],
  3385. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  3386. 0.3007],
  3387. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  3388. 0.3161],
  3389. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  3390. 0.1013],
  3391. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  3392. 0.2699],
  3393. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  3394. -0.0049],
  3395. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  3396. 0.0682]]], device='cuda:0')
  3397. loss_train_step before backward: tensor(0.1287, device='cuda:0', grad_fn=<MseLossBackward>)
  3398. loss_train_step after backward: tensor(0.1287, device='cuda:0', grad_fn=<MseLossBackward>)
  3399. loss_train: 9.707480400800705
  3400. step: 70
  3401. running loss: 0.13867829144001007
  3402. Train Steps: 70/90 Loss: 0.1387 torch.Size([8, 600, 800])
  3403. torch.Size([8, 8])
  3404. tensor([[0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  3405. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  3406. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  3407. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  3408. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  3409. [0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  3410. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  3411. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417]],
  3412. device='cuda:0', dtype=torch.float64)
  3413. predictions are: tensor([[ 0.1662, -0.6768, 1.4210, -0.7968, -0.5248, -0.9291, 0.3372, 0.1923],
  3414. [ 0.4368, -0.4664, 1.9125, 0.0626, -0.3291, 0.1259, 0.5564, 0.1895],
  3415. [ 0.7224, -0.3700, 1.8125, -0.1950, -0.6755, -0.3210, 0.5398, 0.1174],
  3416. [-0.0464, -0.7945, 1.4098, -0.9435, -0.4752, -1.0650, 0.3346, 0.1966],
  3417. [ 0.1214, -0.7137, 1.4418, -0.9443, -0.4571, -1.1249, 0.4019, 0.1869],
  3418. [ 0.6116, -0.4209, 1.9821, 0.2965, -0.4020, 0.2547, 0.5225, 0.2192],
  3419. [ 0.4644, -0.5158, 1.5609, -0.7510, -0.5658, -0.8439, 0.5432, 0.1503],
  3420. [ 0.0048, -0.7716, 1.5697, -0.8414, -0.3493, -1.0282, 0.4463, 0.1949]],
  3421. device='cuda:0', grad_fn=<AddmmBackward>)
  3422. landmarks are: tensor([[[ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  3423. 0.3546],
  3424. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  3425. 0.2853],
  3426. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  3427. 0.1005],
  3428. [-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  3429. 0.1253],
  3430. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  3431. 0.1855],
  3432. [ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  3433. 0.1236],
  3434. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  3435. 0.1929],
  3436. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  3437. 0.2160]]], device='cuda:0')
  3438. loss_train_step before backward: tensor(0.1591, device='cuda:0', grad_fn=<MseLossBackward>)
  3439. loss_train_step after backward: tensor(0.1591, device='cuda:0', grad_fn=<MseLossBackward>)
  3440. loss_train: 9.866620302200317
  3441. step: 71
  3442. running loss: 0.13896648312958193
  3443. Train Steps: 71/90 Loss: 0.1390 torch.Size([8, 600, 800])
  3444. torch.Size([8, 8])
  3445. tensor([[0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  3446. [0.6272, 0.4045, 0.8538, 0.5900, 0.3750, 0.4417, 0.5989, 0.4649],
  3447. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  3448. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  3449. [0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  3450. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  3451. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  3452. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083]],
  3453. device='cuda:0', dtype=torch.float64)
  3454. predictions are: tensor([[ 0.4457, -0.4978, 1.7293, -0.5260, -0.5322, -0.3158, 0.6324, 0.1981],
  3455. [ 0.6052, -0.4613, 1.9613, 0.0222, -0.5985, -0.3985, 0.4678, 0.1336],
  3456. [ 0.5346, -0.4371, 1.9981, 0.1041, -0.4223, 0.2140, 0.6126, 0.2160],
  3457. [-0.1207, -0.8934, 1.2949, -1.2738, -0.4610, -1.4685, 0.3517, 0.1985],
  3458. [ 0.1044, -0.7318, 1.3309, -1.0767, -0.4852, -1.1226, 0.3573, 0.2500],
  3459. [ 0.3721, -0.5522, 1.9450, 0.0344, -0.3227, -0.1119, 0.4806, 0.2193],
  3460. [ 0.1638, -0.7299, 1.3604, -1.0877, -0.5575, -1.2349, 0.3445, 0.1811],
  3461. [ 0.5890, -0.4262, 1.8733, 0.0180, -0.5640, -0.0120, 0.4816, 0.2140]],
  3462. device='cuda:0', grad_fn=<AddmmBackward>)
  3463. landmarks are: tensor([[[ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  3464. 0.1554],
  3465. [ 0.6109, -0.4177, 1.6575, 0.4393, -0.5538, -0.2459, 0.4805,
  3466. -0.1385],
  3467. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  3468. 0.1554],
  3469. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  3470. 0.2006],
  3471. [ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  3472. 0.3808],
  3473. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  3474. 0.4171],
  3475. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  3476. 0.0802],
  3477. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  3478. 0.5239]]], device='cuda:0')
  3479. loss_train_step before backward: tensor(0.1390, device='cuda:0', grad_fn=<MseLossBackward>)
  3480.  
  3481. loss_train_step after backward: tensor(0.1390, device='cuda:0', grad_fn=<MseLossBackward>)
  3482. loss_train: 10.005621805787086
  3483. step: 72
  3484. running loss: 0.13896696952482065
  3485. Train Steps: 72/90 Loss: 0.1390 torch.Size([8, 600, 800])
  3486. torch.Size([8, 8])
  3487. tensor([[0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  3488. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  3489. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  3490. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  3491. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  3492. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  3493. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  3494. [0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954]],
  3495. device='cuda:0', dtype=torch.float64)
  3496. predictions are: tensor([[ 0.0624, -0.7368, 1.4473, -0.9337, -0.3668, -1.0164, 0.4630, 0.2204],
  3497. [ 0.5218, -0.4831, 1.9114, -0.0674, -0.5392, -0.3152, 0.4470, 0.1608],
  3498. [-0.0386, -0.7876, 1.6309, -0.7558, -0.2925, -0.8943, 0.5597, 0.2360],
  3499. [ 0.2419, -0.6400, 1.4512, -0.9229, -0.4733, -0.8848, 0.5008, 0.2013],
  3500. [ 0.2882, -0.6012, 1.3015, -0.7879, -0.6360, -0.6736, 0.3322, 0.2447],
  3501. [ 0.7135, -0.3395, 1.9640, 0.4515, -0.5205, 0.2684, 0.5442, 0.2294],
  3502. [-0.0281, -0.8188, 1.2931, -1.1416, -0.4590, -1.2413, 0.3957, 0.2089],
  3503. [ 0.6038, -0.4154, 1.8860, 0.0039, -0.5550, 0.0999, 0.5708, 0.1776]],
  3504. device='cuda:0', grad_fn=<AddmmBackward>)
  3505. landmarks are: tensor([[[ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  3506. 0.2442],
  3507. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  3508. 0.2203],
  3509. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  3510. 0.1879],
  3511. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  3512. 0.1852],
  3513. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  3514. 0.3315],
  3515. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  3516. 0.4624],
  3517. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  3518. 0.1253],
  3519. [ 0.5227, -0.4615, 1.6575, -0.1304, -0.5076, -0.0149, 0.1815,
  3520. 0.0021]]], device='cuda:0')
  3521. loss_train_step before backward: tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward>)
  3522. loss_train_step after backward: tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward>)
  3523. loss_train: 10.070557050406933
  3524. step: 73
  3525. running loss: 0.1379528363069443
  3526. Train Steps: 73/90 Loss: 0.1380 torch.Size([8, 600, 800])
  3527. torch.Size([8, 8])
  3528. tensor([[0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  3529. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  3530. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  3531. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  3532. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  3533. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  3534. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  3535. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077]],
  3536. device='cuda:0', dtype=torch.float64)
  3537. predictions are: tensor([[ 0.3564, -0.5746, 1.4583, -0.8204, -0.5787, -0.8137, 0.4769, 0.2382],
  3538. [ 0.7135, -0.3818, 1.8126, 0.1473, -0.6671, -0.2749, 0.4425, 0.1993],
  3539. [ 0.2154, -0.6045, 1.7846, -0.2033, -0.2362, -0.1025, 0.5369, 0.2716],
  3540. [ 0.5455, -0.4859, 1.8217, -0.0442, -0.5644, -0.1549, 0.3641, 0.2224],
  3541. [ 0.5563, -0.4529, 1.7759, -0.2288, -0.5570, -0.2708, 0.5477, 0.1839],
  3542. [-0.3794, -1.0313, 1.6012, -1.1200, -0.0692, -1.3016, 0.7081, 0.2265],
  3543. [ 0.2850, -0.6013, 1.3278, -0.8779, -0.5838, -0.7285, 0.4025, 0.2657],
  3544. [ 0.3451, -0.5976, 1.4313, -0.8132, -0.6137, -0.7096, 0.3903, 0.2457]],
  3545. device='cuda:0', grad_fn=<AddmmBackward>)
  3546. landmarks are: tensor([[[ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  3547. 0.3087],
  3548. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  3549. 0.1982],
  3550. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  3551. 0.2853],
  3552. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  3553. 0.1159],
  3554. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  3555. 0.1715],
  3556. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  3557. 0.3104],
  3558. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  3559. 0.3546],
  3560. [ 0.5270, -0.4336, 1.3342, -0.6770, -0.6520, -0.5384, 0.2370,
  3561. 0.0592]]], device='cuda:0')
  3562. loss_train_step before backward: tensor(0.1023, device='cuda:0', grad_fn=<MseLossBackward>)
  3563. loss_train_step after backward: tensor(0.1023, device='cuda:0', grad_fn=<MseLossBackward>)
  3564. loss_train: 10.172822825610638
  3565. step: 74
  3566. running loss: 0.13747057872446808
  3567. Train Steps: 74/90 Loss: 0.1375 torch.Size([8, 600, 800])
  3568. torch.Size([8, 8])
  3569. tensor([[0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  3570. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  3571. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  3572. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  3573. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  3574. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  3575. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  3576. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633]],
  3577. device='cuda:0', dtype=torch.float64)
  3578. predictions are: tensor([[ 0.4214, -0.5060, 1.3804, -0.6720, -0.6546, -0.6298, 0.3875, 0.2875],
  3579. [ 0.4671, -0.4624, 1.8166, 0.0909, -0.3127, 0.1770, 0.5518, 0.2869],
  3580. [ 0.2761, -0.6391, 1.3203, -1.0693, -0.5863, -1.1693, 0.4733, 0.1975],
  3581. [ 0.5017, -0.4808, 1.8436, -0.1449, -0.5294, -0.1855, 0.4829, 0.2564],
  3582. [ 0.7856, -0.3420, 1.7747, -0.2400, -0.6585, -0.3377, 0.6026, 0.1817],
  3583. [-0.2893, -0.9720, 1.1546, -1.2933, -0.3962, -1.4782, 0.3583, 0.2215],
  3584. [-0.2827, -0.9134, 1.4449, -0.9290, -0.2064, -1.0815, 0.4354, 0.2955],
  3585. [ 0.6116, -0.4134, 1.9124, 0.2665, -0.3739, 0.3431, 0.5887, 0.2829]],
  3586. device='cuda:0', grad_fn=<AddmmBackward>)
  3587. landmarks are: tensor([[[ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  3588. 0.4036],
  3589. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  3590. 0.0412],
  3591. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  3592. -0.0108],
  3593. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  3594. 0.3161],
  3595. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  3596. -0.0099],
  3597. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  3598. 0.1073],
  3599. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  3600. 0.4008],
  3601. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  3602. 0.3157]]], device='cuda:0')
  3603. loss_train_step before backward: tensor(0.1267, device='cuda:0', grad_fn=<MseLossBackward>)
  3604. loss_train_step after backward: tensor(0.1267, device='cuda:0', grad_fn=<MseLossBackward>)
  3605. loss_train: 10.29955194145441
  3606. step: 75
  3607. running loss: 0.13732735921939215
  3608. Train Steps: 75/90 Loss: 0.1373 torch.Size([8, 600, 800])
  3609. torch.Size([8, 8])
  3610. tensor([[0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  3611. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  3612. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  3613. [0.6200, 0.4070, 0.8938, 0.4183, 0.3538, 0.4567, 0.6175, 0.5400],
  3614. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  3615. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  3616. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  3617. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320]],
  3618. device='cuda:0', dtype=torch.float64)
  3619. predictions are: tensor([[ 0.3176, -0.5450, 1.4536, -0.6316, -0.4627, -0.1740, 0.5203, 0.3189],
  3620. [ 0.2611, -0.6328, 1.6570, -0.4461, -0.4967, -0.8020, 0.4033, 0.2421],
  3621. [-0.3042, -0.9527, 1.2764, -1.1099, -0.2248, -1.2061, 0.4493, 0.3028],
  3622. [ 0.6198, -0.4280, 1.7268, -0.3493, -0.5287, -0.2621, 0.6554, 0.2258],
  3623. [ 0.6195, -0.3894, 1.6452, 0.0312, -0.5016, -0.0553, 0.5120, 0.2784],
  3624. [-0.1235, -0.8596, 1.2788, -0.9454, -0.4956, -1.0478, 0.2828, 0.2828],
  3625. [ 0.5220, -0.4900, 1.7215, -0.1318, -0.5259, -0.2601, 0.3993, 0.2380],
  3626. [ 0.5877, -0.4383, 1.7150, -0.3114, -0.5164, -0.3794, 0.6195, 0.1953]],
  3627. device='cuda:0', grad_fn=<AddmmBackward>)
  3628. landmarks are: tensor([[[ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  3629. 0.0862],
  3630. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  3631. 0.2699],
  3632. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  3633. 0.3854],
  3634. [ 0.5778, -0.4061, 1.8423, -0.3537, -0.6520, -0.1766, 0.5663,
  3635. 0.2083],
  3636. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  3637. 0.3745],
  3638. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  3639. 0.2837],
  3640. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  3641. 0.1159],
  3642. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  3643. 0.1715]]], device='cuda:0')
  3644. loss_train_step before backward: tensor(0.1469, device='cuda:0', grad_fn=<MseLossBackward>)
  3645. loss_train_step after backward: tensor(0.1469, device='cuda:0', grad_fn=<MseLossBackward>)
  3646. loss_train: 10.446426160633564
  3647. step: 76
  3648. running loss: 0.13745297579781005
  3649.  
  3650. Train Steps: 76/90 Loss: 0.1375 torch.Size([8, 600, 800])
  3651. torch.Size([8, 8])
  3652. tensor([[0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  3653. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  3654. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  3655. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  3656. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  3657. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  3658. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  3659. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204]],
  3660. device='cuda:0', dtype=torch.float64)
  3661. predictions are: tensor([[ 0.1982, -0.6836, 1.6525, -0.2713, -0.2641, -0.4663, 0.4898, 0.2545],
  3662. [-0.2407, -0.9340, 1.4422, -1.1110, -0.3239, -1.3324, 0.5128, 0.2232],
  3663. [ 0.3009, -0.5716, 1.6889, -0.2674, -0.4470, -0.1971, 0.4458, 0.2760],
  3664. [ 0.6223, -0.3788, 1.5415, -0.1216, -0.5765, -0.2211, 0.5047, 0.2707],
  3665. [-0.1364, -0.8355, 1.0600, -1.1444, -0.5423, -1.2415, 0.2674, 0.2796],
  3666. [ 0.4898, -0.4481, 1.5487, -0.4247, -0.4844, -0.1815, 0.5657, 0.2896],
  3667. [ 0.5429, -0.4586, 1.7326, -0.2233, -0.4238, 0.0051, 0.6718, 0.2817],
  3668. [ 0.5129, -0.4504, 1.5689, -0.1454, -0.5120, -0.1783, 0.4519, 0.2615]],
  3669. device='cuda:0', grad_fn=<AddmmBackward>)
  3670. landmarks are: tensor([[[ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  3671. 0.2026],
  3672. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  3673. 0.0851],
  3674. [ 0.5711, -0.3788, 1.8249, -0.1766, -0.4672, 0.2160, 0.3625,
  3675. 0.0742],
  3676. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  3677. 0.3745],
  3678. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  3679. 0.3931],
  3680. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  3681. 0.2622],
  3682. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  3683. 0.1082],
  3684. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  3685. 0.1176]]], device='cuda:0')
  3686. loss_train_step before backward: tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward>)
  3687. loss_train_step after backward: tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward>)
  3688. loss_train: 10.51586477458477
  3689. step: 77
  3690. running loss: 0.1365696723972048
  3691. Train Steps: 77/90 Loss: 0.1366 torch.Size([8, 600, 800])
  3692. torch.Size([8, 8])
  3693. tensor([[0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  3694. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  3695. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  3696. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  3697. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  3698. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  3699. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  3700. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297]],
  3701. device='cuda:0', dtype=torch.float64)
  3702. predictions are: tensor([[ 0.4612, -0.5073, 1.4651, -0.8233, -0.5214, -0.6658, 0.6923, 0.2148],
  3703. [ 0.5246, -0.4641, 1.5652, -0.0813, -0.4644, -0.0231, 0.4570, 0.2592],
  3704. [ 0.3270, -0.5956, 1.6400, -0.3893, -0.4486, -0.6250, 0.4818, 0.2420],
  3705. [ 0.6205, -0.3809, 1.6541, -0.1866, -0.4975, -0.0112, 0.6581, 0.2468],
  3706. [ 0.2243, -0.6179, 1.4108, -0.6065, -0.5477, -0.5506, 0.3383, 0.3082],
  3707. [ 0.5293, -0.4360, 1.5617, -0.0832, -0.4276, 0.0412, 0.4615, 0.2706],
  3708. [-0.2347, -0.8771, 1.2084, -1.0134, -0.3904, -1.1015, 0.3591, 0.2437],
  3709. [-0.0426, -0.7577, 1.6079, -0.4859, -0.2439, -0.7029, 0.5177, 0.2462]],
  3710. device='cuda:0', grad_fn=<AddmmBackward>)
  3711. landmarks are: tensor([[[ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  3712. 0.1080],
  3713. [ 0.5767, -0.4396, 1.6782, 0.1905, -0.3844, 0.0308, 0.4588,
  3714. 0.0855],
  3715. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  3716. 0.1005],
  3717. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  3718. 0.1929],
  3719. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  3720. 0.3392],
  3721. [ 0.5784, -0.4088, 1.7268, 0.0467, -0.3344, 0.0697, 0.5490,
  3722. 0.2545],
  3723. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  3724. 0.0111],
  3725. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  3726. 0.1608]]], device='cuda:0')
  3727. loss_train_step before backward: tensor(0.0475, device='cuda:0', grad_fn=<MseLossBackward>)
  3728. loss_train_step after backward: tensor(0.0475, device='cuda:0', grad_fn=<MseLossBackward>)
  3729. loss_train: 10.563358839601278
  3730. step: 78
  3731. running loss: 0.13542767743078563
  3732. Train Steps: 78/90 Loss: 0.1354 torch.Size([8, 600, 800])
  3733. torch.Size([8, 8])
  3734. tensor([[0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  3735. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  3736. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  3737. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  3738. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  3739. [0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471],
  3740. [ nan, nan, 0.7412, 0.2200, 0.4450, 0.1517, 0.5312, 0.4983],
  3741. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350]],
  3742. device='cuda:0', dtype=torch.float64)
  3743. predictions are: tensor([[ 0.6535, -0.3603, 1.6467, 0.0109, -0.3417, 0.1054, 0.5565, 0.2526],
  3744. [-0.1297, -0.7888, 1.1310, -0.9446, -0.5002, -0.8548, 0.2892, 0.2735],
  3745. [ 0.7948, -0.2646, 1.6848, 0.0678, -0.6741, -0.2577, 0.5078, 0.1569],
  3746. [ 0.2547, -0.5520, 1.5519, -0.3196, -0.3354, -0.4262, 0.5298, 0.2917],
  3747. [ 0.6743, -0.3393, 1.6766, 0.0688, -0.3600, 0.1798, 0.5958, 0.2401],
  3748. [ 0.3992, -0.5258, 1.8062, -0.2436, -0.3569, -0.1706, 0.6703, 0.2025],
  3749. [-0.3108, -0.9624, 1.0015, -1.3031, -0.3757, -1.3097, 0.3483, 0.2303],
  3750. [ 0.0091, -0.7416, 1.2802, -0.9353, -0.3341, -0.8951, 0.4326, 0.2514]],
  3751. device='cuda:0', grad_fn=<AddmmBackward>)
  3752. landmarks are: tensor([[[ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  3753. 0.4239],
  3754. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  3755. 0.2699],
  3756. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  3757. -0.0957],
  3758. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  3759. 0.5822],
  3760. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  3761. 0.2364],
  3762. [ 0.6454, -0.3623, 1.9346, -0.4460, -0.4961, -0.2921, 1.1642,
  3763. 0.2409],
  3764. [-2.2859, -2.2859, 1.1379, -1.2697, -0.2305, -1.5854, 0.1679,
  3765. 0.0159],
  3766. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  3767. 0.1850]]], device='cuda:0')
  3768. loss_train_step before backward: tensor(0.2474, device='cuda:0', grad_fn=<MseLossBackward>)
  3769. loss_train_step after backward: tensor(0.2474, device='cuda:0', grad_fn=<MseLossBackward>)
  3770. loss_train: 10.810774769634008
  3771. step: 79
  3772. running loss: 0.13684525024853175
  3773. Train Steps: 79/90 Loss: 0.1368 torch.Size([8, 600, 800])
  3774. torch.Size([8, 8])
  3775. tensor([[0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  3776. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  3777. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  3778. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  3779. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  3780. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  3781. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  3782. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391]],
  3783. device='cuda:0', dtype=torch.float64)
  3784. predictions are: tensor([[ 0.5802, -0.3822, 1.6703, -0.0592, -0.3859, 0.1253, 0.4767, 0.2593],
  3785. [-0.0557, -0.7866, 1.2931, -0.9026, -0.4576, -1.0742, 0.3170, 0.2135],
  3786. [ 0.4856, -0.4461, 1.7900, -0.0398, -0.3855, -0.2339, 0.5998, 0.1871],
  3787. [ 0.5420, -0.3848, 1.5297, -0.1514, -0.4714, -0.0996, 0.5090, 0.2390],
  3788. [-0.4367, -1.0202, 1.1679, -1.1038, -0.3655, -1.1330, 0.2830, 0.2454],
  3789. [ 0.5202, -0.4176, 1.7353, -0.0741, -0.3475, 0.0032, 0.5747, 0.1865],
  3790. [ 0.5335, -0.4008, 1.6311, 0.0209, -0.3461, 0.0446, 0.4941, 0.2434],
  3791. [ 0.3662, -0.5787, 1.3590, -1.0290, -0.4626, -1.0988, 0.6388, 0.1773]],
  3792. device='cuda:0', grad_fn=<AddmmBackward>)
  3793. landmarks are: tensor([[[ 5.6374e-01, -4.1432e-01, 1.7519e+00, -7.8656e-02, -3.0554e-01,
  3794. -1.4935e-02, 3.7575e-01, 3.0839e-01],
  3795. [ 5.7985e-01, -4.1555e-01, 1.3977e+00, -1.0388e+00, -4.6721e-01,
  3796. -1.1004e+00, 3.4688e-01, 1.0824e-01],
  3797. [ 6.4542e-01, -3.7194e-01, 1.9115e+00, -1.3041e-01, -5.0762e-01,
  3798. -2.8437e-01, 1.0033e+00, 4.3864e-01],
  3799. [ 6.2895e-01, -4.3453e-01, 1.3794e+00, 3.6792e-01, -4.8453e-01,
  3800. 3.8953e-02, 9.2654e-01, 1.9283e-01],
  3801. [-2.2859e+00, -2.2859e+00, 1.2820e+00, -1.0801e+00, -5.8845e-01,
  3802. -1.0234e+00, 2.1409e-01, 1.0054e-01],
  3803. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  3804. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  3805. [ 5.7864e-01, -4.1409e-01, 1.7037e+00, 1.5443e-01, -1.8624e-01,
  3806. 7.3556e-02, 4.3926e-01, 8.5142e-02],
  3807. [ 5.7846e-01, -4.2587e-01, 1.4228e+00, -1.0261e+00, -4.1903e-01,
  3808. -1.2189e+00, 4.7633e-01, 2.0428e-01]]], device='cuda:0')
  3809. loss_train_step before backward: tensor(0.1085, device='cuda:0', grad_fn=<MseLossBackward>)
  3810. loss_train_step after backward: tensor(0.1085, device='cuda:0', grad_fn=<MseLossBackward>)
  3811. loss_train: 10.91929730400443
  3812. step: 80
  3813. running loss: 0.1364912163000554
  3814.  
  3815. Train Steps: 80/90 Loss: 0.1365 torch.Size([8, 600, 800])
  3816. torch.Size([8, 8])
  3817. tensor([[0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  3818. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  3819. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  3820. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  3821. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  3822. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  3823. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  3824. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329]],
  3825. device='cuda:0', dtype=torch.float64)
  3826. predictions are: tensor([[ 0.6595, -0.3411, 1.7133, -0.1565, -0.4309, 0.0339, 0.6960, 0.1918],
  3827. [-0.1699, -0.8419, 1.3545, -0.8984, -0.3419, -1.0833, 0.3931, 0.2011],
  3828. [ 0.3309, -0.5462, 1.7022, -0.0703, -0.1565, -0.1186, 0.5422, 0.2256],
  3829. [ 0.6394, -0.3299, 1.6054, -0.1054, -0.4234, 0.0326, 0.5868, 0.2038],
  3830. [-0.1806, -0.9008, 1.0618, -1.1263, -0.4600, -1.2427, 0.2815, 0.1938],
  3831. [ 0.5022, -0.4241, 1.6264, 0.0332, -0.2760, -0.0482, 0.5249, 0.2056],
  3832. [ 0.4720, -0.4786, 1.7559, -0.1731, -0.4580, -0.1977, 0.5077, 0.1997],
  3833. [ 0.3408, -0.5362, 1.4742, -0.6118, -0.5730, -0.7129, 0.3912, 0.1708]],
  3834. device='cuda:0', grad_fn=<AddmmBackward>)
  3835. landmarks are: tensor([[[ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  3836. 0.1929],
  3837. [ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  3838. 0.2134],
  3839. [ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  3840. 0.1544],
  3841. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  3842. 0.1715],
  3843. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  3844. 0.1890],
  3845. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  3846. 0.2138],
  3847. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  3848. 0.1390],
  3849. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  3850. 0.1753]]], device='cuda:0')
  3851. loss_train_step before backward: tensor(0.0473, device='cuda:0', grad_fn=<MseLossBackward>)
  3852. loss_train_step after backward: tensor(0.0473, device='cuda:0', grad_fn=<MseLossBackward>)
  3853. loss_train: 10.966615419834852
  3854. step: 81
  3855. running loss: 0.13539031382512162
  3856. Train Steps: 81/90 Loss: 0.1354 torch.Size([8, 600, 800])
  3857. torch.Size([8, 8])
  3858. tensor([[0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  3859. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  3860. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  3861. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  3862. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  3863. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  3864. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  3865. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567]],
  3866. device='cuda:0', dtype=torch.float64)
  3867. predictions are: tensor([[ 0.6577, -0.3297, 1.6868, 0.0782, -0.3042, 0.1605, 0.5671, 0.2163],
  3868. [ 0.6820, -0.3201, 1.8332, 0.0495, -0.4130, -0.1604, 0.6454, 0.1406],
  3869. [ 0.6271, -0.3454, 1.7065, 0.1052, -0.2852, 0.2045, 0.5946, 0.2010],
  3870. [ 0.4953, -0.4632, 1.7364, 0.0277, -0.2168, -0.0399, 0.5300, 0.1936],
  3871. [ 0.1193, -0.6399, 1.4553, -0.7747, -0.3613, -0.8269, 0.5000, 0.1925],
  3872. [ 0.4106, -0.5026, 1.6519, -0.4772, -0.4520, -0.6562, 0.5282, 0.1420],
  3873. [-0.2983, -0.9217, 1.1456, -0.9940, -0.4474, -1.0575, 0.2386, 0.2039],
  3874. [-0.3803, -0.9827, 1.1318, -1.0392, -0.4033, -1.1177, 0.2494, 0.1996]],
  3875. device='cuda:0', grad_fn=<AddmmBackward>)
  3876. landmarks are: tensor([[[ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  3877. 0.0942],
  3878. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  3879. 0.4386],
  3880. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  3881. 0.0764],
  3882. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  3883. 0.2026],
  3884. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  3885. 0.3392],
  3886. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  3887. 0.2442],
  3888. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  3889. 0.3161],
  3890. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  3891. 0.2853]]], device='cuda:0')
  3892. loss_train_step before backward: tensor(0.1947, device='cuda:0', grad_fn=<MseLossBackward>)
  3893. loss_train_step after backward: tensor(0.1947, device='cuda:0', grad_fn=<MseLossBackward>)
  3894. loss_train: 11.161314766854048
  3895. step: 82
  3896. running loss: 0.1361135947177323
  3897. Train Steps: 82/90 Loss: 0.1361 torch.Size([8, 600, 800])
  3898. torch.Size([8, 8])
  3899. tensor([[0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  3900. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  3901. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  3902. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  3903. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  3904. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  3905. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  3906. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167]],
  3907. device='cuda:0', dtype=torch.float64)
  3908. predictions are: tensor([[ 1.0737, -0.0740, 1.8738, 0.5913, -0.4413, 0.5408, 0.5651, 0.1580],
  3909. [-0.5130, -1.0604, 1.2191, -0.9690, -0.2829, -1.0806, 0.2641, 0.2092],
  3910. [-0.1248, -0.8598, 1.8897, -0.6127, 0.0917, -0.7495, 0.8417, 0.1448],
  3911. [ 0.8726, -0.2283, 1.9341, 0.3120, -0.4677, 0.1949, 0.5191, 0.1281],
  3912. [ 0.4474, -0.4906, 1.3738, -0.7276, -0.4931, -0.7259, 0.4807, 0.1319],
  3913. [ 0.5036, -0.4894, 1.3357, -0.5319, -0.4911, -0.5718, 0.4147, 0.2147],
  3914. [ 0.4899, -0.4758, 1.3907, -0.6307, -0.4970, -0.6554, 0.4247, 0.1343],
  3915. [-0.4548, -1.0278, 1.3212, -0.8165, -0.3190, -0.8877, 0.2281, 0.1962]],
  3916. device='cuda:0', grad_fn=<AddmmBackward>)
  3917. landmarks are: tensor([[[ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  3918. 0.1447],
  3919. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  3920. 0.1373],
  3921. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  3922. 0.2142],
  3923. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  3924. 0.0467],
  3925. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  3926. -0.0108],
  3927. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  3928. 0.3700],
  3929. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  3930. -0.1031],
  3931. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  3932. 0.1005]]], device='cuda:0')
  3933. loss_train_step before backward: tensor(0.2300, device='cuda:0', grad_fn=<MseLossBackward>)
  3934. loss_train_step after backward: tensor(0.2300, device='cuda:0', grad_fn=<MseLossBackward>)
  3935. loss_train: 11.391309630125761
  3936. step: 83
  3937. running loss: 0.1372446943388646
  3938. Train Steps: 83/90 Loss: 0.1372 torch.Size([8, 600, 800])
  3939. torch.Size([8, 8])
  3940. tensor([[0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  3941. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  3942. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  3943. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  3944. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  3945. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  3946. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  3947. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495]],
  3948. device='cuda:0', dtype=torch.float64)
  3949. predictions are: tensor([[-0.0929, -0.8711, 1.2389, -1.0993, -0.3887, -1.2384, 0.4037, 0.1447],
  3950. [ 0.3426, -0.5333, 1.5412, -0.1081, -0.3541, -0.0805, 0.4267, 0.2252],
  3951. [ 0.4016, -0.5626, 1.8441, -0.3404, -0.4835, -0.6410, 0.5482, 0.0721],
  3952. [-0.2117, -0.9704, 1.2032, -1.0936, -0.4017, -1.2933, 0.2922, 0.1594],
  3953. [ 0.5968, -0.3992, 1.6112, -0.5510, -0.5232, -0.4294, 0.6442, 0.1186],
  3954. [ 0.2000, -0.6920, 1.8410, -0.2265, -0.3198, -0.3455, 0.4740, 0.1843],
  3955. [ 0.3778, -0.5193, 1.7693, 0.1073, -0.1769, 0.0373, 0.4870, 0.1666],
  3956. [ 0.5991, -0.3642, 1.7881, 0.2127, -0.2926, 0.1899, 0.5110, 0.1492]],
  3957. device='cuda:0', grad_fn=<AddmmBackward>)
  3958. landmarks are: tensor([[[ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  3959. 0.3267],
  3960. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  3961. 0.3585],
  3962. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  3963. 0.0620],
  3964. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  3965. 0.3808],
  3966. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  3967. 0.2365],
  3968. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  3969. 0.3238],
  3970. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  3971. 0.0851],
  3972. [ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  3973. 0.2522]]], device='cuda:0')
  3974. loss_train_step before backward: tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward>)
  3975. loss_train_step after backward: tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward>)
  3976. loss_train: 11.450813557952642
  3977. step: 84
  3978. running loss: 0.13631920902324574
  3979.  
  3980. Train Steps: 84/90 Loss: 0.1363 torch.Size([8, 600, 800])
  3981. torch.Size([8, 8])
  3982. tensor([[0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  3983. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  3984. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  3985. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  3986. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  3987. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  3988. [ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  3989. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778]],
  3990. device='cuda:0', dtype=torch.float64)
  3991. predictions are: tensor([[ 1.0472, -0.1337, 1.8173, 0.4242, -0.5189, 0.1716, 0.5610, 0.1083],
  3992. [ 0.8067, -0.3118, 1.8637, 0.3343, -0.3867, 0.3309, 0.5161, 0.1508],
  3993. [ 0.3921, -0.5289, 1.6973, -0.0309, -0.4470, -0.0295, 0.2790, 0.2103],
  3994. [ 0.4866, -0.4627, 1.3325, -0.6769, -0.5362, -0.4760, 0.4466, 0.1793],
  3995. [ 0.3842, -0.5916, 1.5074, -0.8420, -0.4493, -0.9451, 0.6339, 0.0836],
  3996. [-0.4744, -1.0623, 1.4592, -0.7937, -0.2200, -0.9876, 0.3152, 0.1966],
  3997. [-0.6824, -1.2032, 1.6402, -0.9928, 0.0528, -1.1821, 0.6461, 0.1668],
  3998. [-0.1324, -0.9212, 1.2158, -0.9944, -0.4907, -1.1888, 0.2543, 0.1415]],
  3999. device='cuda:0', grad_fn=<AddmmBackward>)
  4000. landmarks are: tensor([[[ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  4001. 0.2075],
  4002. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  4003. 0.3777],
  4004. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  4005. 0.2409],
  4006. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  4007. 0.3546],
  4008. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  4009. -0.0220],
  4010. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  4011. 0.2083],
  4012. [-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  4013. 0.3638],
  4014. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  4015. -0.0791]]], device='cuda:0')
  4016. loss_train_step before backward: tensor(0.1343, device='cuda:0', grad_fn=<MseLossBackward>)
  4017. loss_train_step after backward: tensor(0.1343, device='cuda:0', grad_fn=<MseLossBackward>)
  4018. loss_train: 11.58513193950057
  4019. step: 85
  4020. running loss: 0.1362956698764773
  4021. Train Steps: 85/90 Loss: 0.1363 torch.Size([8, 600, 800])
  4022. torch.Size([8, 8])
  4023. tensor([[0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  4024. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  4025. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  4026. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  4027. [0.6300, 0.4102, 0.9088, 0.4433, 0.4088, 0.3067, 0.6820, 0.5540],
  4028. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  4029. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  4030. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656]],
  4031. device='cuda:0', dtype=torch.float64)
  4032. predictions are: tensor([[-6.5229e-02, -8.8510e-01, 1.2439e+00, -9.6002e-01, -4.1075e-01,
  4033. -1.1328e+00, 2.9228e-01, 1.5930e-01],
  4034. [ 5.0083e-01, -4.7344e-01, 1.8331e+00, 1.2776e-01, -1.5367e-01,
  4035. 1.6144e-01, 5.3884e-01, 1.9881e-01],
  4036. [-5.0049e-01, -1.1383e+00, 1.0559e+00, -1.1379e+00, -4.0530e-01,
  4037. -1.2439e+00, 2.0949e-01, 1.9963e-01],
  4038. [ 8.3195e-01, -2.8182e-01, 1.5013e+00, -5.1990e-01, -6.1314e-01,
  4039. -2.9477e-01, 6.0160e-01, 1.3491e-01],
  4040. [ 3.4898e-01, -5.4086e-01, 1.8459e+00, -2.4536e-02, -3.6836e-01,
  4041. -4.6690e-01, 5.0389e-01, 1.1189e-01],
  4042. [-2.3398e-01, -9.3486e-01, 1.8301e+00, -6.1287e-01, -1.3023e-01,
  4043. -8.4830e-01, 6.8406e-01, 1.4688e-01],
  4044. [-2.9074e-01, -9.9740e-01, 1.3294e+00, -8.7116e-01, -3.7710e-01,
  4045. -1.1082e+00, 3.2404e-01, 1.8692e-01],
  4046. [ 9.3682e-01, -1.8088e-01, 1.6402e+00, 1.7329e-03, -5.3351e-01,
  4047. 1.7422e-01, 5.1208e-01, 1.9848e-01]], device='cuda:0',
  4048. grad_fn=<AddmmBackward>)
  4049. landmarks are: tensor([[[ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  4050. 0.1545],
  4051. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  4052. 0.2853],
  4053. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  4054. 0.3700],
  4055. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  4056. 0.1576],
  4057. [ 0.6240, -0.3912, 1.9115, -0.2382, -0.3979, -0.8694, 0.8644,
  4058. 0.2730],
  4059. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  4060. 0.2676],
  4061. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  4062. 0.2083],
  4063. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  4064. 0.3267]]], device='cuda:0')
  4065. loss_train_step before backward: tensor(0.1866, device='cuda:0', grad_fn=<MseLossBackward>)
  4066. loss_train_step after backward: tensor(0.1866, device='cuda:0', grad_fn=<MseLossBackward>)
  4067. loss_train: 11.77172925695777
  4068. step: 86
  4069. running loss: 0.1368805727553229
  4070. Train Steps: 86/90 Loss: 0.1369 torch.Size([8, 600, 800])
  4071. torch.Size([8, 8])
  4072. tensor([[0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  4073. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  4074. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583],
  4075. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  4076. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  4077. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  4078. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  4079. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350]],
  4080. device='cuda:0', dtype=torch.float64)
  4081. predictions are: tensor([[ 4.4188e-01, -5.1116e-01, 1.7300e+00, -2.0806e-01, -3.4683e-01,
  4082. -4.7736e-02, 4.7247e-01, 2.4311e-01],
  4083. [ 7.5987e-01, -3.2086e-01, 1.5680e+00, -9.0686e-04, -4.7657e-01,
  4084. -1.4873e-01, 4.9563e-01, 2.3884e-01],
  4085. [-9.0501e-01, -1.4015e+00, 1.0909e+00, -1.4329e+00, -3.3467e-01,
  4086. -1.6594e+00, 2.6124e-01, 1.6862e-01],
  4087. [ 6.2424e-01, -4.0011e-01, 1.6721e+00, -4.6716e-02, -2.9070e-01,
  4088. 3.5843e-02, 5.2984e-01, 2.0643e-01],
  4089. [ 2.5168e-01, -6.7213e-01, 1.5804e+00, -4.8583e-01, -5.6401e-01,
  4090. -7.9968e-01, 3.3252e-01, 1.5927e-01],
  4091. [ 7.6404e-01, -3.3559e-01, 1.7661e+00, -1.6401e-01, -4.4549e-01,
  4092. -1.6386e-01, 6.5402e-01, 1.4741e-01],
  4093. [ 3.2009e-01, -6.1624e-01, 1.7472e+00, -2.7111e-01, -2.9466e-01,
  4094. -3.7289e-01, 5.0791e-01, 1.5344e-01],
  4095. [-7.9375e-01, -1.3188e+00, 1.3903e+00, -1.2725e+00, -2.4440e-01,
  4096. -1.5361e+00, 3.7710e-01, 1.7771e-01]], device='cuda:0',
  4097. grad_fn=<AddmmBackward>)
  4098. landmarks are: tensor([[[ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  4099. 0.3161],
  4100. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  4101. 0.5401],
  4102. [-2.2859, -2.2859, 0.9922, -1.2021, -0.3229, -1.4314, 0.1044,
  4103. 0.2930],
  4104. [ 0.5450, -0.4706, 1.7643, 0.0722, -0.3708, 0.3200, 0.4854,
  4105. 0.0612],
  4106. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  4107. 0.4032],
  4108. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  4109. 0.0774],
  4110. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  4111. -0.0099],
  4112. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  4113. 0.1852]]], device='cuda:0')
  4114. loss_train_step before backward: tensor(0.1162, device='cuda:0', grad_fn=<MseLossBackward>)
  4115. loss_train_step after backward: tensor(0.1162, device='cuda:0', grad_fn=<MseLossBackward>)
  4116. loss_train: 11.88794718310237
  4117. step: 87
  4118. running loss: 0.13664307107014217
  4119. Train Steps: 87/90 Loss: 0.1366 torch.Size([8, 600, 800])
  4120. torch.Size([8, 8])
  4121. tensor([[0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  4122. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  4123. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  4124. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240],
  4125. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  4126. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  4127. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  4128. [0.6296, 0.4045, 0.9138, 0.4100, 0.4232, 0.4242, 0.7422, 0.5297]],
  4129. device='cuda:0', dtype=torch.float64)
  4130. predictions are: tensor([[-0.4403, -1.1100, 1.3071, -1.0556, -0.4015, -1.3357, 0.2999, 0.1572],
  4131. [-0.4792, -1.1614, 1.2105, -1.1959, -0.3678, -1.4565, 0.3273, 0.1607],
  4132. [ 0.5990, -0.3910, 1.5966, -0.3210, -0.4170, 0.0495, 0.5252, 0.2310],
  4133. [-0.2928, -1.0263, 1.6465, -0.8846, -0.2008, -1.1616, 0.5395, 0.1867],
  4134. [ 0.7680, -0.3232, 1.6906, 0.2699, -0.4037, 0.1270, 0.4906, 0.2611],
  4135. [ 0.1373, -0.7692, 1.2821, -0.8456, -0.4277, -0.9613, 0.3662, 0.2293],
  4136. [ 0.2150, -0.6974, 1.6454, -0.4520, -0.5265, -0.5073, 0.3394, 0.2385],
  4137. [ 0.9976, -0.1960, 1.7188, -0.2152, -0.4970, -0.1576, 0.6804, 0.1570]],
  4138. device='cuda:0', grad_fn=<AddmmBackward>)
  4139. landmarks are: tensor([[[ 0.5707, -0.4189, 1.2707, -1.2467, -0.4095, -1.3082, 0.3758,
  4140. 0.0928],
  4141. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  4142. 0.1253],
  4143. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  4144. 0.3148],
  4145. [ 0.6088, -0.4015, 1.6113, -1.0696, -0.0861, -1.4545, 0.6051,
  4146. 0.1343],
  4147. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  4148. 0.5401],
  4149. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  4150. 0.5855],
  4151. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  4152. 0.3392],
  4153. [ 0.6224, -0.4177, 1.9346, -0.3921, -0.3314, -0.3264, 1.1422,
  4154. 0.1608]]], device='cuda:0')
  4155. loss_train_step before backward: tensor(0.1034, device='cuda:0', grad_fn=<MseLossBackward>)
  4156. loss_train_step after backward: tensor(0.1034, device='cuda:0', grad_fn=<MseLossBackward>)
  4157. loss_train: 11.991319220513105
  4158. step: 88
  4159. running loss: 0.13626499114219437
  4160.  
  4161. Train Steps: 88/90 Loss: 0.1363 torch.Size([8, 600, 800])
  4162. torch.Size([8, 8])
  4163. tensor([[0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133],
  4164. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  4165. [0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954],
  4166. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  4167. [0.6182, 0.3930, 0.8841, 0.3892, 0.3556, 0.4967, 0.6222, 0.5279],
  4168. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  4169. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  4170. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378]],
  4171. device='cuda:0', dtype=torch.float64)
  4172. predictions are: tensor([[ 0.4388, -0.5066, 1.5570, -0.0962, -0.3215, -0.0344, 0.4251, 0.2929],
  4173. [ 0.4409, -0.5333, 1.5423, -0.5185, -0.5618, -0.4258, 0.3752, 0.2538],
  4174. [ 0.4461, -0.5290, 1.4972, -0.4042, -0.4689, -0.3502, 0.4340, 0.2296],
  4175. [ 0.1839, -0.7194, 1.4752, -0.6965, -0.6311, -0.9276, 0.2914, 0.2059],
  4176. [ 0.3816, -0.5760, 1.4603, -0.5821, -0.4492, -0.2598, 0.5169, 0.2633],
  4177. [ 0.4607, -0.5290, 1.5899, -0.0559, -0.5009, -0.4150, 0.3185, 0.2172],
  4178. [-0.2723, -1.0297, 1.5811, -0.9711, -0.3396, -1.3682, 0.4855, 0.1946],
  4179. [-0.1325, -0.9935, 1.5606, -1.2217, -0.1039, -1.4336, 0.7863, 0.1774]],
  4180. device='cuda:0', grad_fn=<AddmmBackward>)
  4181. landmarks are: tensor([[[ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  4182. 0.0852],
  4183. [ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  4184. 0.5239],
  4185. [ 0.5227, -0.4615, 1.6575, -0.1304, -0.5076, -0.0149, 0.1815,
  4186. 0.0021],
  4187. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  4188. 0.0851],
  4189. [ 0.5697, -0.4706, 1.7976, -0.4884, -0.6433, 0.0081, 0.5878,
  4190. 0.1525],
  4191. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  4192. -0.0370],
  4193. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  4194. -0.0263],
  4195. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  4196. 0.1982]]], device='cuda:0')
  4197. loss_train_step before backward: tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward>)
  4198. loss_train_step after backward: tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward>)
  4199. loss_train: 12.061648171395063
  4200. step: 89
  4201. running loss: 0.1355241367572479
  4202. Train Steps: 89/90 Loss: 0.1355 torch.Size([8, 600, 800])
  4203. torch.Size([8, 8])
  4204. tensor([[0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  4205. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  4206. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  4207. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  4208. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  4209. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  4210. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  4211. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927]],
  4212. device='cuda:0', dtype=torch.float64)
  4213. predictions are: tensor([[ 0.6735, -0.3933, 1.4704, -0.5424, -0.5828, -0.4557, 0.4849, 0.2398],
  4214. [ 0.2983, -0.6639, 1.7263, -0.3416, -0.2465, -0.5271, 0.5216, 0.2376],
  4215. [-0.2158, -0.9857, 1.3755, -1.1546, -0.3586, -1.3447, 0.3959, 0.2534],
  4216. [ 0.5483, -0.4424, 1.4602, -0.5501, -0.4750, -0.1833, 0.5094, 0.3046],
  4217. [ 0.3909, -0.5643, 1.7396, -0.2520, -0.2310, -0.3395, 0.5488, 0.2893],
  4218. [-0.4585, -1.1134, 1.1996, -1.0510, -0.5404, -1.2248, 0.1798, 0.2508],
  4219. [ 0.7076, -0.4017, 1.5375, -0.7291, -0.5402, -0.9808, 0.5706, 0.1742],
  4220. [ 0.3275, -0.6220, 1.6696, -0.2631, -0.3304, -0.3368, 0.3925, 0.2430]],
  4221. device='cuda:0', grad_fn=<AddmmBackward>)
  4222. landmarks are: tensor([[[ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  4223. 0.3559],
  4224. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  4225. -0.0039],
  4226. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  4227. 0.2776],
  4228. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  4229. 0.2545],
  4230. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  4231. 0.2853],
  4232. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  4233. 0.2837],
  4234. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  4235. -0.0957],
  4236. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  4237. -0.0099]]], device='cuda:0')
  4238. loss_train_step before backward: tensor(0.1250, device='cuda:0', grad_fn=<MseLossBackward>)
  4239. loss_train_step after backward: tensor(0.1250, device='cuda:0', grad_fn=<MseLossBackward>)
  4240. loss_train: 12.186646927148104
  4241. step: 90
  4242. running loss: 0.13540718807942337
  4243. Valid Steps: 10/10 Loss: nan 7.3225
  4244. --------------------------------------------------
  4245. Epoch: 1 Train Loss: 0.1354 Valid Loss: nan
  4246. --------------------------------------------------
  4247. size of train loader is: 90
  4248. torch.Size([8, 600, 800])
  4249. torch.Size([8, 8])
  4250. tensor([[0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373],
  4251. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  4252. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  4253. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  4254. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  4255. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  4256. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  4257. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540]],
  4258. device='cuda:0', dtype=torch.float64)
  4259. predictions are: tensor([[ 7.1007e-01, -3.5610e-01, 1.6399e+00, 6.3848e-02, -5.3525e-01,
  4260. -1.6645e-01, 3.9725e-01, 2.2814e-01],
  4261. [ 5.5852e-02, -7.9860e-01, 1.1793e+00, -1.0058e+00, -5.5704e-01,
  4262. -1.0473e+00, 2.7695e-01, 2.8426e-01],
  4263. [ 3.4867e-01, -5.3798e-01, 1.6127e+00, -2.1721e-01, -3.6062e-01,
  4264. -9.5872e-02, 3.0168e-01, 2.9245e-01],
  4265. [ 1.2011e-01, -7.8341e-01, 1.5370e+00, -1.1360e+00, -2.5911e-01,
  4266. -1.2756e+00, 6.6877e-01, 1.9165e-01],
  4267. [ 2.9767e-01, -6.7336e-01, 1.2427e+00, -1.1123e+00, -5.4911e-01,
  4268. -1.2077e+00, 3.5533e-01, 1.8474e-01],
  4269. [ 2.9968e-01, -6.2822e-01, 1.5641e+00, -6.2807e-01, -5.8927e-01,
  4270. -5.5374e-01, 3.0163e-01, 2.9457e-01],
  4271. [ 5.1429e-01, -4.5790e-01, 1.7073e+00, 6.4440e-03, -3.9337e-01,
  4272. 4.3100e-04, 3.4778e-01, 2.6891e-01],
  4273. [ 2.0770e-01, -7.3136e-01, 1.6545e+00, -9.7071e-01, -1.7980e-01,
  4274. -1.0599e+00, 7.4962e-01, 2.0022e-01]], device='cuda:0',
  4275. grad_fn=<AddmmBackward>)
  4276. landmarks are: tensor([[[ 0.5680, -0.4562, 1.5697, 0.4947, -0.4904, -0.1503, 0.3536,
  4277. 0.1956],
  4278. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  4279. 0.2391],
  4280. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  4281. 0.4032],
  4282. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  4283. 0.1020],
  4284. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  4285. 0.0213],
  4286. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  4287. 0.3392],
  4288. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  4289. 0.0467],
  4290. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  4291. 0.2730]]], device='cuda:0')
  4292. loss_train_step before backward: tensor(0.0426, device='cuda:0', grad_fn=<MseLossBackward>)
  4293. loss_train_step after backward: tensor(0.0426, device='cuda:0', grad_fn=<MseLossBackward>)
  4294. loss_train: 0.04259268939495087
  4295. step: 1
  4296. running loss: 0.04259268939495087
  4297. Train Steps: 1/90 Loss: 0.0426 torch.Size([8, 600, 800])
  4298. torch.Size([8, 8])
  4299. tensor([[0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  4300. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  4301. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  4302. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  4303. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  4304. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  4305. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  4306. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650]],
  4307. device='cuda:0', dtype=torch.float64)
  4308. predictions are: tensor([[ 0.4878, -0.4826, 1.4859, -0.7712, -0.6467, -0.7535, 0.3544, 0.2405],
  4309. [ 0.6440, -0.4132, 1.7307, -0.1418, -0.2576, -0.2243, 0.4596, 0.2307],
  4310. [ 0.8317, -0.2595, 1.6605, -0.2190, -0.5446, -0.2266, 0.4281, 0.2645],
  4311. [-0.1442, -0.9106, 1.3206, -1.2534, -0.4152, -1.3048, 0.3776, 0.2055],
  4312. [ 0.4407, -0.5200, 1.7622, -0.3675, -0.3601, -0.1808, 0.4552, 0.2645],
  4313. [ 0.8585, -0.2477, 1.6806, -0.0893, -0.4960, -0.5336, 0.4715, 0.2489],
  4314. [ 0.4703, -0.4759, 1.6254, -0.3660, -0.3193, -0.2449, 0.3914, 0.2745],
  4315. [-0.6149, -1.2198, 1.1038, -1.5154, -0.3264, -1.5851, 0.3474, 0.1998]],
  4316. device='cuda:0', grad_fn=<AddmmBackward>)
  4317. landmarks are: tensor([[[ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  4318. 0.4348],
  4319. [ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  4320. 0.0261],
  4321. [ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  4322. 0.2657],
  4323. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  4324. 0.3700],
  4325. [ 0.5711, -0.3788, 1.8249, -0.1766, -0.4672, 0.2160, 0.3625,
  4326. 0.0742],
  4327. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  4328. 0.5612],
  4329. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  4330. 0.4032],
  4331. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  4332. 0.3238]]], device='cuda:0')
  4333. loss_train_step before backward: tensor(0.1098, device='cuda:0', grad_fn=<MseLossBackward>)
  4334. loss_train_step after backward: tensor(0.1098, device='cuda:0', grad_fn=<MseLossBackward>)
  4335. loss_train: 0.15242556482553482
  4336. step: 2
  4337. running loss: 0.07621278241276741
  4338.  
  4339. Train Steps: 2/90 Loss: 0.0762 torch.Size([8, 600, 800])
  4340. torch.Size([8, 8])
  4341. tensor([[0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  4342. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  4343. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  4344. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  4345. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  4346. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  4347. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  4348. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993]],
  4349. device='cuda:0', dtype=torch.float64)
  4350. predictions are: tensor([[ 0.2055, -0.6563, 1.3950, -0.9640, -0.4633, -0.9175, 0.3805, 0.2383],
  4351. [ 0.4255, -0.4887, 1.5916, -0.6542, -0.4395, -0.7613, 0.4005, 0.2200],
  4352. [ 0.5741, -0.4211, 1.5171, -0.2034, -0.3918, -0.0850, 0.3576, 0.2748],
  4353. [ 0.2696, -0.5973, 1.3929, -0.9257, -0.4207, -0.9935, 0.3744, 0.2466],
  4354. [ 0.5596, -0.4324, 1.7364, -0.3859, -0.4203, -0.5341, 0.4266, 0.2516],
  4355. [ 0.6552, -0.3283, 1.7068, -0.2231, -0.4293, -0.4643, 0.4657, 0.2142],
  4356. [ 0.3758, -0.5187, 1.6616, -0.1487, -0.2192, 0.0357, 0.3985, 0.2725],
  4357. [ 0.1727, -0.7338, 1.0763, -1.1915, -0.5032, -1.1693, 0.2439, 0.2383]],
  4358. device='cuda:0', grad_fn=<AddmmBackward>)
  4359. landmarks are: tensor([[[ 5.6966e-01, -4.4416e-01, 1.3529e+00, -9.5152e-01, -5.7742e-01,
  4360. -7.8011e-01, 5.2533e-01, 1.9310e-01],
  4361. [ 5.7841e-01, -4.0062e-01, 1.7911e+00, -5.7008e-01, -5.1916e-01,
  4362. -1.0331e+00, 4.1374e-01, 2.1391e-01],
  4363. [ 6.2895e-01, -4.3934e-01, 1.3977e+00, 3.7768e-01, -5.1339e-01,
  4364. -4.5727e-02, 1.0984e+00, 1.8214e-01],
  4365. [ 5.7131e-01, -4.3212e-01, 1.4975e+00, -8.1340e-01, -3.0942e-01,
  4366. -1.3345e+00, 3.7786e-01, 2.1339e-01],
  4367. [ 6.0935e-01, -3.9469e-01, 1.8885e+00, -2.9977e-01, -5.7691e-01,
  4368. -6.7698e-01, 6.0670e-01, 1.0054e-01],
  4369. [ 6.5201e-01, -3.6231e-01, 1.8885e+00, 3.1255e-02, -5.5381e-01,
  4370. -5.3841e-01, 6.9257e-01, 1.6611e-01],
  4371. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  4372. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  4373. [ 5.3837e-01, -4.3934e-01, 9.7621e-01, -1.1851e+00, -4.2102e-01,
  4374. -1.3852e+00, 1.7122e-01, 2.0118e-02]]], device='cuda:0')
  4375. loss_train_step before backward: tensor(0.0365, device='cuda:0', grad_fn=<MseLossBackward>)
  4376. loss_train_step after backward: tensor(0.0365, device='cuda:0', grad_fn=<MseLossBackward>)
  4377. loss_train: 0.1889284811913967
  4378. step: 3
  4379. running loss: 0.06297616039713223
  4380. Train Steps: 3/90 Loss: 0.0630 torch.Size([8, 600, 800])
  4381. torch.Size([8, 8])
  4382. tensor([[0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  4383. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  4384. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  4385. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  4386. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  4387. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378],
  4388. [0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  4389. [0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385]],
  4390. device='cuda:0', dtype=torch.float64)
  4391. predictions are: tensor([[ 0.9354, -0.1689, 1.7982, -0.0957, -0.5106, -0.0445, 0.4831, 0.2091],
  4392. [ 0.2110, -0.6863, 1.2094, -1.0299, -0.4531, -1.1977, 0.2558, 0.2339],
  4393. [ 0.4777, -0.5063, 1.2934, -0.9708, -0.5087, -0.9821, 0.3245, 0.2426],
  4394. [ 0.2455, -0.6200, 1.3273, -0.9011, -0.4809, -0.9806, 0.2810, 0.2534],
  4395. [ 0.4969, -0.4011, 1.6330, -0.3698, -0.3892, -0.0085, 0.3747, 0.2756],
  4396. [ 0.8093, -0.2633, 1.9032, 0.2491, -0.2979, 0.3559, 0.4084, 0.2968],
  4397. [ 0.1955, -0.6490, 1.4015, -0.7826, -0.4914, -0.8720, 0.2076, 0.2256],
  4398. [ 0.4164, -0.5204, 1.6887, -0.7912, -0.2706, -1.0754, 0.5404, 0.1997]],
  4399. device='cuda:0', grad_fn=<AddmmBackward>)
  4400. landmarks are: tensor([[[ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  4401. -0.0670],
  4402. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  4403. 0.3007],
  4404. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  4405. 0.2699],
  4406. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  4407. 0.3546],
  4408. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  4409. 0.3148],
  4410. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  4411. 0.1982],
  4412. [ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  4413. 0.2138],
  4414. [ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  4415. 0.2012]]], device='cuda:0')
  4416. loss_train_step before backward: tensor(0.0430, device='cuda:0', grad_fn=<MseLossBackward>)
  4417. loss_train_step after backward: tensor(0.0430, device='cuda:0', grad_fn=<MseLossBackward>)
  4418. loss_train: 0.23190448060631752
  4419. step: 4
  4420. running loss: 0.05797612015157938
  4421. Train Steps: 4/90 Loss: 0.0580 torch.Size([8, 600, 800])
  4422. torch.Size([8, 8])
  4423. tensor([[0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  4424. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  4425. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  4426. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  4427. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  4428. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  4429. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  4430. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131]],
  4431. device='cuda:0', dtype=torch.float64)
  4432. predictions are: tensor([[ 0.7001, -0.2766, 1.6908, -0.1484, -0.3457, -0.0808, 0.4303, 0.2640],
  4433. [ 0.4341, -0.5333, 1.4638, -0.8986, -0.4397, -1.1506, 0.3810, 0.2546],
  4434. [ 0.4200, -0.4447, 1.4699, -0.5509, -0.4799, -0.3041, 0.3056, 0.2709],
  4435. [ 0.5279, -0.4039, 1.6207, -0.2760, -0.3859, -0.1375, 0.2687, 0.2574],
  4436. [ 0.6383, -0.3270, 1.5034, -0.3866, -0.5343, -0.3790, 0.2957, 0.2652],
  4437. [ 0.2794, -0.6039, 1.6532, -1.1591, -0.1907, -1.4350, 0.7113, 0.1612],
  4438. [ 0.4900, -0.4513, 1.6026, -0.0751, -0.3859, -0.1690, 0.2521, 0.2527],
  4439. [ 0.6725, -0.3149, 1.4706, -0.6186, -0.5776, -0.5253, 0.3481, 0.2127]],
  4440. device='cuda:0', grad_fn=<AddmmBackward>)
  4441. landmarks are: tensor([[[ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  4442. 0.1929],
  4443. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  4444. 0.5701],
  4445. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  4446. 0.3148],
  4447. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  4448. 0.2699],
  4449. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  4450. 0.3267],
  4451. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  4452. 0.2944],
  4453. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  4454. 0.1627],
  4455. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  4456. 0.0840]]], device='cuda:0')
  4457. loss_train_step before backward: tensor(0.0299, device='cuda:0', grad_fn=<MseLossBackward>)
  4458. loss_train_step after backward: tensor(0.0299, device='cuda:0', grad_fn=<MseLossBackward>)
  4459. loss_train: 0.26177416928112507
  4460. step: 5
  4461. running loss: 0.05235483385622501
  4462. Train Steps: 5/90 Loss: 0.0524 torch.Size([8, 600, 800])
  4463. torch.Size([8, 8])
  4464. tensor([[0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771],
  4465. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  4466. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  4467. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  4468. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  4469. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  4470. [0.6092, 0.4001, 0.8638, 0.4867, 0.4288, 0.5367, 0.5484, 0.5064],
  4471. [0.6152, 0.4131, 0.6863, 0.2567, 0.3625, 0.3300, 0.5765, 0.5305]],
  4472. device='cuda:0', dtype=torch.float64)
  4473. predictions are: tensor([[ 0.5591, -0.3862, 1.8141, -0.1409, -0.3558, -0.0230, 0.4684, 0.1989],
  4474. [ 0.7180, -0.3285, 1.7612, 0.0262, -0.4315, -0.1326, 0.3433, 0.2333],
  4475. [ 0.6214, -0.3498, 1.5698, -0.8629, -0.4971, -1.0170, 0.4340, 0.2186],
  4476. [ 0.7594, -0.2548, 1.7353, 0.0515, -0.2798, -0.1146, 0.3592, 0.2564],
  4477. [ 0.7539, -0.2979, 1.6140, -0.6767, -0.5285, -0.6289, 0.5362, 0.1763],
  4478. [-0.0267, -0.8053, 1.0535, -1.2585, -0.4485, -1.2836, 0.2414, 0.2479],
  4479. [ 0.6017, -0.3277, 1.7198, -0.1452, -0.3064, -0.0624, 0.3880, 0.2317],
  4480. [ 0.4863, -0.4454, 1.1515, -1.0345, -0.5895, -0.9306, 0.2529, 0.2732]],
  4481. device='cuda:0', grad_fn=<AddmmBackward>)
  4482. landmarks are: tensor([[[ 0.6072, -0.4247, 1.8711, -0.0842, -0.5307, 0.1005, 0.6771,
  4483. -0.0821],
  4484. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  4485. 0.0697],
  4486. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  4487. 0.1698],
  4488. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  4489. 0.2364],
  4490. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  4491. -0.0670],
  4492. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  4493. 0.4019],
  4494. [ 0.5278, -0.4377, 1.7037, -0.0380, -0.3055, 0.1929, 0.2473,
  4495. 0.0532],
  4496. [ 0.5557, -0.3779, 0.8838, -1.1004, -0.6115, -0.7617, 0.3769,
  4497. 0.1644]]], device='cuda:0')
  4498. loss_train_step before backward: tensor(0.1336, device='cuda:0', grad_fn=<MseLossBackward>)
  4499. loss_train_step after backward: tensor(0.1336, device='cuda:0', grad_fn=<MseLossBackward>)
  4500. loss_train: 0.39533588476479053
  4501. step: 6
  4502. running loss: 0.06588931412746508
  4503.  
  4504. Train Steps: 6/90 Loss: 0.0659 torch.Size([8, 600, 800])
  4505. torch.Size([8, 8])
  4506. tensor([[0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  4507. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  4508. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  4509. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  4510. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  4511. [0.6289, 0.4081, 0.8720, 0.3487, 0.3900, 0.3183, 0.6703, 0.5376],
  4512. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  4513. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700]],
  4514. device='cuda:0', dtype=torch.float64)
  4515. predictions are: tensor([[ 0.5827, -0.4379, 1.4441, -1.1022, -0.3418, -1.2180, 0.5851, 0.1748],
  4516. [ 0.6353, -0.2988, 1.7405, 0.2265, -0.2744, 0.2779, 0.4264, 0.2445],
  4517. [ 0.6568, -0.3217, 1.5801, -0.5005, -0.5412, -0.4082, 0.3244, 0.2201],
  4518. [ 0.4810, -0.4567, 1.2555, -0.9256, -0.5145, -0.7963, 0.3975, 0.2130],
  4519. [ 0.6530, -0.3305, 1.5795, -0.3256, -0.5694, -0.2815, 0.2549, 0.2598],
  4520. [ 0.6139, -0.3530, 1.6029, -0.5732, -0.3805, -0.8116, 0.4547, 0.2125],
  4521. [ 0.3853, -0.4860, 1.6758, -0.1242, -0.3653, -0.0897, 0.4411, 0.2086],
  4522. [ 0.5693, -0.3776, 1.4477, -0.5859, -0.5408, -0.5223, 0.3565, 0.1967]],
  4523. device='cuda:0', grad_fn=<AddmmBackward>)
  4524. landmarks are: tensor([[[ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  4525. -0.0583],
  4526. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  4527. 0.3371],
  4528. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  4529. 0.0802],
  4530. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  4531. 0.2545],
  4532. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  4533. 0.3238],
  4534. [ 0.6191, -0.4008, 1.7420, -0.6753, -0.4845, -0.8156, 0.8101,
  4535. 0.1974],
  4536. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  4537. 0.0774],
  4538. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  4539. -0.1151]]], device='cuda:0')
  4540. loss_train_step before backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  4541. loss_train_step after backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  4542. loss_train: 0.4160845186561346
  4543. step: 7
  4544. running loss: 0.05944064552230494
  4545. Train Steps: 7/90 Loss: 0.0594 torch.Size([8, 600, 800])
  4546. torch.Size([8, 8])
  4547. tensor([[0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  4548. [0.6239, 0.4206, 0.8750, 0.5400, 0.3688, 0.4850, 0.5737, 0.5700],
  4549. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  4550. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  4551. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  4552. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  4553. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  4554. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272]],
  4555. device='cuda:0', dtype=torch.float64)
  4556. predictions are: tensor([[ 0.7021, -0.3496, 1.2926, -1.1388, -0.4333, -1.1794, 0.4480, 0.1941],
  4557. [ 0.9963, -0.1069, 1.7337, 0.1366, -0.6265, -0.0216, 0.4571, 0.1893],
  4558. [ 0.4696, -0.4188, 1.6972, -0.1467, -0.3254, 0.0139, 0.5288, 0.1844],
  4559. [ 0.4513, -0.4183, 1.4989, -0.2108, -0.4803, -0.1647, 0.3797, 0.1903],
  4560. [ 0.6194, -0.3489, 1.4720, -0.8228, -0.5840, -0.7738, 0.4798, 0.2157],
  4561. [ 0.3232, -0.5147, 1.6214, -0.3481, -0.2429, -0.1752, 0.4896, 0.2023],
  4562. [ 0.4407, -0.4461, 1.6146, -0.1038, -0.3282, -0.0575, 0.4005, 0.1977],
  4563. [ 0.4908, -0.4550, 1.4114, -0.8419, -0.5530, -0.9475, 0.3662, 0.1874]],
  4564. device='cuda:0', grad_fn=<AddmmBackward>)
  4565. landmarks are: tensor([[[ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  4566. 0.1850],
  4567. [ 0.5960, -0.3430, 1.7557, 0.2083, -0.5827, -0.0457, 0.3642,
  4568. 0.3469],
  4569. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  4570. 0.1661],
  4571. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  4572. 0.1768],
  4573. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  4574. 0.5624],
  4575. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  4576. 0.3007],
  4577. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  4578. 0.0764],
  4579. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  4580. 0.1494]]], device='cuda:0')
  4581. loss_train_step before backward: tensor(0.0386, device='cuda:0', grad_fn=<MseLossBackward>)
  4582. loss_train_step after backward: tensor(0.0386, device='cuda:0', grad_fn=<MseLossBackward>)
  4583. loss_train: 0.4546631034463644
  4584. step: 8
  4585. running loss: 0.05683288793079555
  4586. Train Steps: 8/90 Loss: 0.0568 torch.Size([8, 600, 800])
  4587. torch.Size([8, 8])
  4588. tensor([[0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  4589. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  4590. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  4591. [0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  4592. [0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  4593. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  4594. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  4595. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500]],
  4596. device='cuda:0', dtype=torch.float64)
  4597. predictions are: tensor([[ 0.2553, -0.5819, 1.1939, -0.8524, -0.5313, -0.6417, 0.3589, 0.1984],
  4598. [ 0.7735, -0.2880, 1.4316, -0.4455, -0.6361, -0.5807, 0.2920, 0.2505],
  4599. [ 0.8888, -0.1807, 1.8123, 0.0572, -0.5599, 0.0372, 0.5111, 0.1406],
  4600. [ 0.5415, -0.4451, 1.6313, -0.9964, -0.1940, -1.0505, 0.8056, 0.1340],
  4601. [ 0.7210, -0.2990, 1.6302, -0.2831, -0.5936, -0.3882, 0.4315, 0.1563],
  4602. [ 0.4772, -0.4362, 1.7029, 0.0759, -0.3797, 0.1898, 0.4535, 0.1590],
  4603. [ 0.4588, -0.4792, 1.2327, -0.9956, -0.4738, -0.8281, 0.4887, 0.1862],
  4604. [ 0.5360, -0.3870, 1.7055, -0.0526, -0.3721, 0.0659, 0.5101, 0.1510]],
  4605. device='cuda:0', grad_fn=<AddmmBackward>)
  4606. landmarks are: tensor([[[ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  4607. 0.3694],
  4608. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  4609. 0.4470],
  4610. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  4611. 0.2516],
  4612. [ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  4613. 0.3157],
  4614. [ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  4615. 0.2464],
  4616. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  4617. -0.0881],
  4618. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  4619. 0.1621],
  4620. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  4621. 0.2545]]], device='cuda:0')
  4622. loss_train_step before backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  4623. loss_train_step after backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  4624. loss_train: 0.4777647405862808
  4625. step: 9
  4626. running loss: 0.05308497117625342
  4627. Train Steps: 9/90 Loss: 0.0531 torch.Size([8, 600, 800])
  4628. torch.Size([8, 8])
  4629. tensor([[0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  4630. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  4631. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  4632. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  4633. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  4634. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  4635. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  4636. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617]],
  4637. device='cuda:0', dtype=torch.float64)
  4638. predictions are: tensor([[ 0.3739, -0.5290, 1.7073, -0.4004, -0.4418, -0.0480, 0.6693, 0.1278],
  4639. [ 0.5947, -0.3743, 1.6106, -0.0960, -0.4672, -0.2712, 0.5061, 0.1534],
  4640. [ 0.6945, -0.3319, 1.6409, 0.2558, -0.4384, 0.1308, 0.4694, 0.1777],
  4641. [ 0.9772, -0.1057, 1.5562, -0.1561, -0.7040, -0.3083, 0.3698, 0.1888],
  4642. [ 0.6909, -0.3311, 1.8099, -0.0290, -0.5085, 0.1348, 0.5433, 0.1238],
  4643. [ 0.5375, -0.4298, 1.6000, -1.0680, -0.1836, -0.9936, 0.8623, 0.1370],
  4644. [ 0.7472, -0.2899, 1.4580, -0.5038, -0.6770, -0.3817, 0.3422, 0.2079],
  4645. [-0.0050, -0.7495, 1.0129, -1.3194, -0.4006, -1.1948, 0.3865, 0.2216]],
  4646. device='cuda:0', grad_fn=<AddmmBackward>)
  4647. landmarks are: tensor([[[ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  4648. 0.2083],
  4649. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  4650. 0.3692],
  4651. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  4652. 0.5239],
  4653. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  4654. 0.4393],
  4655. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  4656. -0.0490],
  4657. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  4658. 0.2944],
  4659. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  4660. 0.2567],
  4661. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  4662. 0.3084]]], device='cuda:0')
  4663. loss_train_step before backward: tensor(0.1472, device='cuda:0', grad_fn=<MseLossBackward>)
  4664. loss_train_step after backward: tensor(0.1472, device='cuda:0', grad_fn=<MseLossBackward>)
  4665. loss_train: 0.6249740868806839
  4666. step: 10
  4667. running loss: 0.06249740868806839
  4668.  
  4669. Train Steps: 10/90 Loss: 0.0625 torch.Size([8, 600, 800])
  4670. torch.Size([8, 8])
  4671. tensor([[0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  4672. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  4673. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  4674. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  4675. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  4676. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  4677. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  4678. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100]],
  4679. device='cuda:0', dtype=torch.float64)
  4680. predictions are: tensor([[ 0.5993, -0.4172, 1.2918, -0.8599, -0.4895, -0.8689, 0.4674, 0.2569],
  4681. [ 0.6262, -0.3522, 1.7937, 0.2198, -0.4215, 0.3747, 0.6560, 0.1763],
  4682. [ 0.8618, -0.2339, 1.5645, -0.7135, -0.6392, -0.8297, 0.5180, 0.1674],
  4683. [ 0.5942, -0.3806, 1.8856, 0.2418, -0.3690, 0.4265, 0.7306, 0.1557],
  4684. [-0.1523, -0.8777, 1.0009, -1.3971, -0.3676, -1.3578, 0.4247, 0.2480],
  4685. [ 0.6371, -0.3410, 1.8052, 0.0200, -0.3949, 0.2762, 0.6559, 0.1790],
  4686. [ 0.6024, -0.4038, 1.3672, -1.0748, -0.5515, -1.0605, 0.6216, 0.1504],
  4687. [ 0.6503, -0.3460, 1.6743, 0.2830, -0.5657, 0.1409, 0.4786, 0.1767]],
  4688. device='cuda:0', grad_fn=<AddmmBackward>)
  4689. landmarks are: tensor([[[ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  4690. 0.6084],
  4691. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  4692. 0.3371],
  4693. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  4694. 0.1000],
  4695. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  4696. 0.3157],
  4697. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  4698. 0.3623],
  4699. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  4700. 0.0928],
  4701. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  4702. 0.2043],
  4703. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  4704. 0.5316]]], device='cuda:0')
  4705. loss_train_step before backward: tensor(0.1232, device='cuda:0', grad_fn=<MseLossBackward>)
  4706. loss_train_step after backward: tensor(0.1232, device='cuda:0', grad_fn=<MseLossBackward>)
  4707. loss_train: 0.7481739446520805
  4708. step: 11
  4709. running loss: 0.06801581315018913
  4710. Train Steps: 11/90 Loss: 0.0680 torch.Size([8, 600, 800])
  4711. torch.Size([8, 8])
  4712. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  4713. [0.6272, 0.4045, 0.8538, 0.5900, 0.3750, 0.4417, 0.5989, 0.4649],
  4714. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  4715. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  4716. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  4717. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  4718. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  4719. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077]],
  4720. device='cuda:0', dtype=torch.float64)
  4721. predictions are: tensor([[ 0.6062, -0.3971, 1.4841, -0.8442, -0.4335, -0.7972, 0.6544, 0.2369],
  4722. [ 0.7315, -0.3394, 1.7088, 0.1553, -0.5659, -0.1784, 0.6413, 0.1370],
  4723. [ 0.6299, -0.3791, 1.5284, -0.3892, -0.6555, -0.3467, 0.4660, 0.2540],
  4724. [ 0.4641, -0.4911, 1.8043, -0.0249, -0.2395, -0.0491, 0.7281, 0.1559],
  4725. [ 0.4449, -0.4664, 1.5657, -0.5493, -0.5251, -0.2868, 0.7594, 0.1848],
  4726. [ 0.3801, -0.5408, 1.7443, 0.1158, -0.3322, 0.1869, 0.5623, 0.2204],
  4727. [ 0.4160, -0.5228, 1.1209, -1.0819, -0.5001, -1.0193, 0.5185, 0.2376],
  4728. [ 0.4419, -0.5029, 1.3971, -0.7442, -0.5796, -0.5155, 0.5558, 0.1858]],
  4729. device='cuda:0', grad_fn=<AddmmBackward>)
  4730. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  4731. 0.2699],
  4732. [ 0.6109, -0.4177, 1.6575, 0.4393, -0.5538, -0.2459, 0.4805,
  4733. -0.1385],
  4734. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  4735. 0.4348],
  4736. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  4737. -0.0039],
  4738. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  4739. 0.2391],
  4740. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  4741. 0.3057],
  4742. [ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  4743. 0.3267],
  4744. [ 0.5270, -0.4336, 1.3342, -0.6770, -0.6520, -0.5384, 0.2370,
  4745. 0.0592]]], device='cuda:0')
  4746. loss_train_step before backward: tensor(0.0295, device='cuda:0', grad_fn=<MseLossBackward>)
  4747. loss_train_step after backward: tensor(0.0295, device='cuda:0', grad_fn=<MseLossBackward>)
  4748. loss_train: 0.7777050696313381
  4749. step: 12
  4750. running loss: 0.06480875580261151
  4751. Train Steps: 12/90 Loss: 0.0648 torch.Size([8, 600, 800])
  4752. torch.Size([8, 8])
  4753. tensor([[0.6184, 0.4079, 0.8350, 0.3700, 0.3675, 0.2883, 0.5312, 0.5783],
  4754. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  4755. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  4756. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  4757. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  4758. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  4759. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  4760. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436]],
  4761. device='cuda:0', dtype=torch.float64)
  4762. predictions are: tensor([[ 0.4202, -0.5173, 1.3836, -0.6753, -0.5700, -0.7469, 0.4485, 0.2560],
  4763. [ 0.4411, -0.5239, 1.6127, -0.2479, -0.5575, -0.2546, 0.5313, 0.2155],
  4764. [ 0.3881, -0.5298, 1.6339, -0.9055, -0.2468, -0.8263, 0.8806, 0.2196],
  4765. [ 0.4624, -0.4736, 1.6928, -0.2386, -0.2085, -0.0825, 0.7356, 0.2267],
  4766. [ 0.3695, -0.5581, 1.3107, -0.6324, -0.6252, -0.6646, 0.4025, 0.3258],
  4767. [ 0.6355, -0.4044, 1.6213, -0.0035, -0.5570, -0.2023, 0.6437, 0.1830],
  4768. [ 0.4304, -0.5043, 1.4906, -0.5608, -0.6256, -0.4607, 0.4872, 0.2247],
  4769. [ 0.6903, -0.3622, 1.7952, 0.1668, -0.4360, 0.3059, 0.8035, 0.2034]],
  4770. device='cuda:0', grad_fn=<AddmmBackward>)
  4771. landmarks are: tensor([[[ 0.5704, -0.4019, 1.5709, -0.5769, -0.5885, -0.9541, 0.1679,
  4772. 0.3854],
  4773. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  4774. 0.0774],
  4775. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  4776. 0.3050],
  4777. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  4778. 0.2776],
  4779. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  4780. 0.4374],
  4781. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  4782. 0.2075],
  4783. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  4784. 0.0862],
  4785. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  4786. 0.2249]]], device='cuda:0')
  4787. loss_train_step before backward: tensor(0.0215, device='cuda:0', grad_fn=<MseLossBackward>)
  4788. loss_train_step after backward: tensor(0.0215, device='cuda:0', grad_fn=<MseLossBackward>)
  4789. loss_train: 0.7992481663823128
  4790. step: 13
  4791. running loss: 0.06148062818325483
  4792. Train Steps: 13/90 Loss: 0.0615 torch.Size([8, 600, 800])
  4793. torch.Size([8, 8])
  4794. tensor([[0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  4795. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  4796. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  4797. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  4798. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  4799. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  4800. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  4801. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578]],
  4802. device='cuda:0', dtype=torch.float64)
  4803. predictions are: tensor([[-0.0145, -0.7906, 1.1196, -1.0009, -0.4156, -0.9101, 0.4786, 0.3279],
  4804. [-0.1917, -0.9380, 1.0036, -1.1857, -0.4182, -1.1089, 0.4359, 0.3034],
  4805. [ 0.9721, -0.1997, 1.9877, 0.5234, -0.4360, 0.5324, 0.7571, 0.1728],
  4806. [ 0.9694, -0.2090, 2.0023, 0.2408, -0.5046, 0.1142, 0.8536, 0.1759],
  4807. [ 0.9472, -0.1856, 1.9436, -0.1935, -0.5401, -0.2110, 0.8041, 0.1836],
  4808. [ 0.3610, -0.5303, 1.3561, -0.7856, -0.5148, -0.7644, 0.4557, 0.2544],
  4809. [ 0.7199, -0.3162, 1.7110, -0.1089, -0.3733, -0.3602, 0.6635, 0.2948],
  4810. [-0.4062, -1.0408, 1.1087, -1.0144, -0.4563, -0.8119, 0.3634, 0.2917]],
  4811. device='cuda:0', grad_fn=<AddmmBackward>)
  4812. landmarks are: tensor([[[ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  4813. 0.2622],
  4814. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  4815. 0.3700],
  4816. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  4817. 0.3777],
  4818. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  4819. 0.4386],
  4820. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  4821. 0.1544],
  4822. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  4823. 0.0111],
  4824. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  4825. 0.5822],
  4826. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  4827. 0.2905]]], device='cuda:0')
  4828. loss_train_step before backward: tensor(0.1652, device='cuda:0', grad_fn=<MseLossBackward>)
  4829.  
  4830. loss_train_step after backward: tensor(0.1652, device='cuda:0', grad_fn=<MseLossBackward>)
  4831. loss_train: 0.964469201862812
  4832. step: 14
  4833. running loss: 0.06889065727591515
  4834. Train Steps: 14/90 Loss: 0.0689 torch.Size([8, 600, 800])
  4835. torch.Size([8, 8])
  4836. tensor([[0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  4837. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  4838. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  4839. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  4840. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  4841. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  4842. [0.6239, 0.4206, 0.8750, 0.5400, 0.3688, 0.4850, 0.5737, 0.5700],
  4843. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676]],
  4844. device='cuda:0', dtype=torch.float64)
  4845. predictions are: tensor([[ 0.7869, -0.3033, 1.7974, -0.1969, -0.6868, -0.0957, 0.6042, 0.2605],
  4846. [ 0.8107, -0.2904, 1.8674, 0.4519, -0.6166, 0.1297, 0.6507, 0.2021],
  4847. [-0.2218, -0.9150, 1.0375, -1.0969, -0.4347, -1.0455, 0.3649, 0.3677],
  4848. [ 0.2698, -0.6191, 1.7095, -1.0067, -0.0719, -0.8716, 0.9475, 0.2549],
  4849. [-0.1655, -0.9113, 1.0007, -1.1529, -0.5338, -1.2172, 0.2648, 0.3071],
  4850. [ 0.0616, -0.7328, 1.1565, -1.1089, -0.3360, -1.1049, 0.4130, 0.3369],
  4851. [ 1.0715, -0.1211, 1.9333, 0.5056, -0.6645, 0.2440, 0.6736, 0.2401],
  4852. [ 0.6491, -0.3910, 1.8553, 0.1901, -0.3428, 0.2149, 0.6684, 0.2235]],
  4853. device='cuda:0', grad_fn=<AddmmBackward>)
  4854. landmarks are: tensor([[[ 5.7742e-01, -3.8684e-01, 1.6286e+00, -5.6921e-01, -6.4619e-01,
  4855. -2.7667e-01, 5.1432e-01, 5.2394e-01],
  4856. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  4857. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  4858. [ 5.7131e-01, -3.6712e-01, 8.6651e-01, -1.0696e+00, -3.6905e-01,
  4859. -1.2236e+00, 3.5266e-01, 2.6220e-01],
  4860. [ 6.2401e-01, -3.7675e-01, 1.6575e+00, -1.2851e+00, 2.9492e-01,
  4861. -1.2467e+00, 1.1276e+00, 2.1421e-01],
  4862. [ 5.1085e-01, -4.3164e-01, 1.1436e+00, -1.3467e+00, -3.8637e-01,
  4863. -1.4160e+00, 1.2393e-01, -5.8033e-02],
  4864. [ 5.9850e-01, -3.9207e-01, 1.2995e+00, -1.0927e+00, 6.2356e-03,
  4865. -1.5854e+00, 4.2771e-01, 2.1601e-01],
  4866. [ 5.9601e-01, -3.4305e-01, 1.7557e+00, 2.0831e-01, -5.8268e-01,
  4867. -4.5727e-02, 3.6420e-01, 3.4688e-01],
  4868. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  4869. 4.6189e-04, 2.9049e-01, 3.3573e-01]]], device='cuda:0')
  4870. loss_train_step before backward: tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward>)
  4871. loss_train_step after backward: tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward>)
  4872. loss_train: 1.038370206952095
  4873. step: 15
  4874. running loss: 0.069224680463473
  4875. Train Steps: 15/90 Loss: 0.0692 torch.Size([8, 600, 800])
  4876. torch.Size([8, 8])
  4877. tensor([[0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  4878. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  4879. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  4880. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  4881. [0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  4882. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  4883. [0.6272, 0.4045, 0.8538, 0.5900, 0.3750, 0.4417, 0.5989, 0.4649],
  4884. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552]],
  4885. device='cuda:0', dtype=torch.float64)
  4886. predictions are: tensor([[ 0.7944, -0.3463, 1.9906, 0.2476, -0.5201, 0.2336, 0.7704, 0.1918],
  4887. [ 0.0689, -0.7012, 1.3575, -0.7715, -0.3078, -0.7171, 0.4185, 0.3937],
  4888. [ 0.3230, -0.5789, 1.3084, -0.9413, -0.4369, -1.0296, 0.4259, 0.3471],
  4889. [ 0.5474, -0.4719, 1.2206, -0.8174, -0.4809, -0.9417, 0.4338, 0.3615],
  4890. [ 0.1219, -0.7330, 1.1250, -0.9224, -0.6118, -0.8752, 0.3285, 0.3161],
  4891. [ 0.5981, -0.4339, 1.8751, 0.1986, -0.4184, 0.1858, 0.5192, 0.2195],
  4892. [ 0.8358, -0.2984, 1.8211, 0.3606, -0.6419, -0.1551, 0.5716, 0.2108],
  4893. [-0.1780, -0.8768, 1.5876, -1.0652, -0.0232, -0.9913, 0.8239, 0.2795]],
  4894. device='cuda:0', grad_fn=<AddmmBackward>)
  4895. landmarks are: tensor([[[ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  4896. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  4897. [ 5.9636e-01, -3.3795e-01, 1.4785e+00, -8.3865e-01, -2.4203e-01,
  4898. -1.0619e+00, 3.2379e-01, 4.0077e-01],
  4899. [ 5.7962e-01, -4.3256e-01, 1.4439e+00, -1.1774e+00, -2.9400e-01,
  4900. -1.3390e+00, 3.9307e-01, 9.2841e-02],
  4901. [ 5.6871e-01, -4.0878e-01, 1.0397e+00, -1.1466e+00, -3.1132e-01,
  4902. -1.1928e+00, 4.6813e-01, 5.8553e-01],
  4903. [ 5.0491e-01, -4.4280e-01, 8.6919e-01, -9.5814e-01, -6.6928e-01,
  4904. -8.3865e-01, 8.9698e-02, 2.5891e-01],
  4905. [ 5.2494e-01, -4.4734e-01, 1.7326e+00, -9.1917e-02, -2.0162e-01,
  4906. 1.5443e-01, 1.7328e-01, 4.1158e-02],
  4907. [ 6.1085e-01, -4.1771e-01, 1.6575e+00, 4.3926e-01, -5.5381e-01,
  4908. -2.4588e-01, 4.8055e-01, -1.3847e-01],
  4909. [-2.2859e+00, -2.2859e+00, 1.7557e+00, -1.1466e+00, 8.7067e-02,
  4910. -1.0773e+00, 1.1239e+00, 2.7833e-01]]], device='cuda:0')
  4911. loss_train_step before backward: tensor(0.1397, device='cuda:0', grad_fn=<MseLossBackward>)
  4912. loss_train_step after backward: tensor(0.1397, device='cuda:0', grad_fn=<MseLossBackward>)
  4913. loss_train: 1.1780213713645935
  4914. step: 16
  4915. running loss: 0.0736263357102871
  4916. Train Steps: 16/90 Loss: 0.0736 torch.Size([8, 600, 800])
  4917. torch.Size([8, 8])
  4918. tensor([[0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  4919. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  4920. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  4921. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  4922. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  4923. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  4924. [0.6184, 0.4079, 0.8350, 0.3700, 0.3675, 0.2883, 0.5312, 0.5783],
  4925. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550]],
  4926. device='cuda:0', dtype=torch.float64)
  4927. predictions are: tensor([[ 0.3631, -0.5394, 1.4618, -0.3937, -0.5298, -0.5855, 0.3389, 0.2794],
  4928. [ 0.4413, -0.5507, 1.2269, -0.7110, -0.4430, -0.9009, 0.4244, 0.2799],
  4929. [-0.3335, -0.9625, 1.3309, -0.7680, -0.2863, -0.7579, 0.4095, 0.3167],
  4930. [ 0.4255, -0.4960, 1.6453, -0.6700, -0.1697, -0.6607, 0.6740, 0.2752],
  4931. [-0.3251, -0.9842, 1.0067, -0.9940, -0.3619, -1.0681, 0.3570, 0.3390],
  4932. [ 0.5777, -0.4170, 1.6715, -0.5359, -0.3518, -0.6406, 0.6042, 0.2708],
  4933. [ 0.6887, -0.3486, 1.7259, -0.0297, -0.5322, -0.4222, 0.4260, 0.2669],
  4934. [ 0.8123, -0.2894, 1.7652, -0.2682, -0.5185, -0.1183, 0.7801, 0.2465]],
  4935. device='cuda:0', grad_fn=<AddmmBackward>)
  4936. landmarks are: tensor([[[ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  4937. 0.2138],
  4938. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  4939. 0.2576],
  4940. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  4941. 0.3007],
  4942. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  4943. -0.0369],
  4944. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  4945. 0.4543],
  4946. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  4947. 0.0851],
  4948. [ 0.5704, -0.4019, 1.5709, -0.5769, -0.5885, -0.9541, 0.1679,
  4949. 0.3854],
  4950. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  4951. 0.2776]]], device='cuda:0')
  4952. loss_train_step before backward: tensor(0.2478, device='cuda:0', grad_fn=<MseLossBackward>)
  4953. loss_train_step after backward: tensor(0.2478, device='cuda:0', grad_fn=<MseLossBackward>)
  4954. loss_train: 1.425776869058609
  4955. step: 17
  4956. running loss: 0.08386922759168289
  4957. Train Steps: 17/90 Loss: 0.0839 torch.Size([8, 600, 800])
  4958. torch.Size([8, 8])
  4959. tensor([[0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  4960. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  4961. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  4962. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  4963. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  4964. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  4965. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  4966. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583]],
  4967. device='cuda:0', dtype=torch.float64)
  4968. predictions are: tensor([[ 0.7392, -0.3159, 1.9126, 0.2965, -0.2309, 0.2665, 0.6292, 0.2335],
  4969. [ 0.6183, -0.4341, 1.8354, -0.2402, -0.4850, -0.2214, 0.6888, 0.2186],
  4970. [ 0.7088, -0.3281, 1.7322, -0.1589, -0.4614, -0.2889, 0.5233, 0.2228],
  4971. [ 0.3687, -0.5831, 1.6318, -0.3442, -0.5248, -0.8639, 0.3086, 0.3081],
  4972. [ 0.6640, -0.3452, 1.5032, -0.5834, -0.5535, -0.6198, 0.4556, 0.2848],
  4973. [-0.3263, -0.9667, 1.2706, -1.0857, -0.2673, -1.1992, 0.3529, 0.3348],
  4974. [ 0.3817, -0.5648, 1.2980, -0.9832, -0.4549, -1.1130, 0.4572, 0.2740],
  4975. [-0.7312, -1.2464, 1.0082, -1.2988, -0.2090, -1.4575, 0.2481, 0.3142]],
  4976. device='cuda:0', grad_fn=<AddmmBackward>)
  4977. landmarks are: tensor([[[ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  4978. 0.0412],
  4979. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  4980. 0.2083],
  4981. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  4982. 0.3265],
  4983. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  4984. 0.2116],
  4985. [ 0.5444, -0.3852, 1.3786, -0.5409, -0.6924, -0.4229, 0.1791,
  4986. 0.2341],
  4987. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  4988. 0.3315],
  4989. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  4990. 0.1779],
  4991. [-2.2859, -2.2859, 0.9922, -1.2021, -0.3229, -1.4314, 0.1044,
  4992. 0.2930]]], device='cuda:0')
  4993. loss_train_step before backward: tensor(0.1672, device='cuda:0', grad_fn=<MseLossBackward>)
  4994. loss_train_step after backward: tensor(0.1672, device='cuda:0', grad_fn=<MseLossBackward>)
  4995. loss_train: 1.5929645597934723
  4996. step: 18
  4997. running loss: 0.08849803109963734
  4998.  
  4999. Train Steps: 18/90 Loss: 0.0885 torch.Size([8, 600, 800])
  5000. torch.Size([8, 8])
  5001. tensor([[0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  5002. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  5003. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  5004. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  5005. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  5006. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  5007. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  5008. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350]],
  5009. device='cuda:0', dtype=torch.float64)
  5010. predictions are: tensor([[ 0.7018, -0.3557, 1.7540, -0.1224, -0.4276, -0.0423, 0.5841, 0.2146],
  5011. [ 0.2970, -0.6503, 1.6967, -0.1300, -0.4445, -0.3633, 0.4110, 0.2402],
  5012. [ 0.0251, -0.7716, 1.1079, -1.0232, -0.4226, -1.2824, 0.2213, 0.3022],
  5013. [ 0.3834, -0.5366, 1.4415, -0.5750, -0.4902, -0.5628, 0.3763, 0.2302],
  5014. [-0.1063, -0.8539, 1.1570, -1.0314, -0.4734, -1.0130, 0.2999, 0.2568],
  5015. [ 0.0538, -0.7577, 1.6569, -0.3731, -0.4748, -0.4974, 0.3697, 0.2801],
  5016. [ 0.3470, -0.5624, 1.7853, -0.5192, -0.2951, -0.8880, 0.6386, 0.2389],
  5017. [ 0.1852, -0.6856, 1.3280, -1.0545, -0.2309, -1.3210, 0.3448, 0.3081]],
  5018. device='cuda:0', grad_fn=<AddmmBackward>)
  5019. landmarks are: tensor([[[ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  5020. -0.0322],
  5021. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  5022. 0.2314],
  5023. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  5024. 0.2853],
  5025. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  5026. 0.1552],
  5027. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  5028. 0.0442],
  5029. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  5030. 0.1929],
  5031. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  5032. 0.2890],
  5033. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  5034. 0.1850]]], device='cuda:0')
  5035. loss_train_step before backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  5036. loss_train_step after backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  5037. loss_train: 1.6457261517643929
  5038. step: 19
  5039. running loss: 0.08661716588233646
  5040. Train Steps: 19/90 Loss: 0.0866 torch.Size([8, 600, 800])
  5041. torch.Size([8, 8])
  5042. tensor([[0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  5043. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  5044. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  5045. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  5046. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  5047. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  5048. [0.6317, 0.4038, 0.8287, 0.5900, 0.3800, 0.4717, 0.6295, 0.4986],
  5049. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433]],
  5050. device='cuda:0', dtype=torch.float64)
  5051. predictions are: tensor([[ 0.7591, -0.3409, 1.7338, -0.0023, -0.5642, -0.2221, 0.4435, 0.2436],
  5052. [ 0.3795, -0.5712, 1.7574, -0.1573, -0.3790, -0.1880, 0.3507, 0.2420],
  5053. [-0.8353, -1.2972, 1.2454, -1.2587, -0.2312, -1.3055, 0.2796, 0.2779],
  5054. [-0.5438, -1.1473, 1.0012, -1.3929, -0.3499, -1.5850, 0.1994, 0.2789],
  5055. [ 0.5224, -0.4489, 1.7406, -0.0551, -0.3338, -0.1273, 0.4229, 0.1991],
  5056. [-0.5449, -1.1069, 1.2491, -1.3066, -0.2089, -1.4304, 0.3174, 0.2808],
  5057. [ 0.9422, -0.2005, 1.7710, 0.0972, -0.6246, -0.3440, 0.4153, 0.1871],
  5058. [ 0.5999, -0.4022, 1.3268, -1.1283, -0.6029, -0.9938, 0.4009, 0.2491]],
  5059. device='cuda:0', grad_fn=<AddmmBackward>)
  5060. landmarks are: tensor([[[ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  5061. 0.3161],
  5062. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  5063. 0.3057],
  5064. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  5065. 0.3007],
  5066. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  5067. 0.2699],
  5068. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  5069. 0.2386],
  5070. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  5071. 0.1698],
  5072. [ 0.6320, -0.4206, 1.5420, 0.4393, -0.5307, -0.1073, 0.6216,
  5073. 0.0171],
  5074. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  5075. 0.2237]]], device='cuda:0')
  5076. loss_train_step before backward: tensor(0.1236, device='cuda:0', grad_fn=<MseLossBackward>)
  5077. loss_train_step after backward: tensor(0.1236, device='cuda:0', grad_fn=<MseLossBackward>)
  5078. loss_train: 1.7693058922886848
  5079. step: 20
  5080. running loss: 0.08846529461443424
  5081. Train Steps: 20/90 Loss: 0.0885 torch.Size([8, 600, 800])
  5082. torch.Size([8, 8])
  5083. tensor([[0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  5084. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  5085. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  5086. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  5087. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  5088. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  5089. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  5090. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837]],
  5091. device='cuda:0', dtype=torch.float64)
  5092. predictions are: tensor([[ 0.1886, -0.6836, 1.5729, -0.2674, -0.2233, -0.4119, 0.3165, 0.2492],
  5093. [ 0.4372, -0.5134, 1.6379, -0.3847, -0.5800, -0.9076, 0.2784, 0.1690],
  5094. [-0.0067, -0.8098, 1.6752, -0.9982, -0.3071, -1.3077, 0.4903, 0.2232],
  5095. [ 0.3528, -0.5931, 1.6171, -0.1919, -0.5364, -0.4231, 0.2934, 0.1907],
  5096. [ 0.3657, -0.5674, 1.6048, -0.6359, -0.4923, -0.3539, 0.4614, 0.1826],
  5097. [ 0.1345, -0.6927, 1.1944, -1.0451, -0.4435, -0.9648, 0.2830, 0.3123],
  5098. [ 0.3865, -0.5515, 1.5863, -0.5621, -0.4879, -0.5619, 0.4382, 0.1526],
  5099. [-0.4958, -1.1116, 0.9192, -1.2360, -0.4738, -1.2510, 0.0091, 0.3017]],
  5100. device='cuda:0', grad_fn=<AddmmBackward>)
  5101. landmarks are: tensor([[[ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  5102. 0.4239],
  5103. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  5104. -0.0049],
  5105. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  5106. 0.1544],
  5107. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  5108. 0.0851],
  5109. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  5110. 0.0985],
  5111. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  5112. 0.3469],
  5113. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  5114. 0.1715],
  5115. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  5116. 0.4103]]], device='cuda:0')
  5117. loss_train_step before backward: tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward>)
  5118. loss_train_step after backward: tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward>)
  5119. loss_train: 1.8627125546336174
  5120. step: 21
  5121. running loss: 0.08870059783969607
  5122. Train Steps: 21/90 Loss: 0.0887 torch.Size([8, 600, 800])
  5123. torch.Size([8, 8])
  5124. tensor([[0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  5125. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  5126. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  5127. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  5128. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  5129. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  5130. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  5131. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297]],
  5132. device='cuda:0', dtype=torch.float64)
  5133. predictions are: tensor([[ 0.8606, -0.2453, 1.3886, -0.9505, -0.4922, -1.0851, 0.4113, 0.2025],
  5134. [-0.9464, -1.3543, 1.1559, -1.1529, -0.4029, -1.2134, 0.1268, 0.2243],
  5135. [ 0.1395, -0.6876, 1.0224, -0.8792, -0.6390, -0.9361, -0.0147, 0.2747],
  5136. [ 0.2228, -0.6074, 1.3296, -0.9617, -0.5155, -1.1569, 0.2396, 0.2520],
  5137. [ 0.0331, -0.7152, 1.2906, -0.9207, -0.5002, -1.0947, 0.1238, 0.2317],
  5138. [ 0.5004, -0.4776, 1.7450, 0.0990, -0.4102, 0.1276, 0.3315, 0.1553],
  5139. [-0.5480, -1.0970, 1.6360, -1.0426, 0.0103, -1.0901, 0.6953, 0.2123],
  5140. [ 0.7488, -0.3436, 1.7506, 0.0133, -0.5513, 0.1343, 0.4193, 0.1387]],
  5141. device='cuda:0', grad_fn=<AddmmBackward>)
  5142. landmarks are: tensor([[[ 6.1413e-01, -4.1527e-01, 1.4208e+00, -1.2697e+00, -2.9400e-01,
  5143. -1.0234e+00, 8.6439e-01, 1.7146e-01],
  5144. [-2.2859e+00, -2.2859e+00, 1.2360e+00, -1.1620e+00, -5.7113e-01,
  5145. -9.6182e-01, 1.3215e-01, 1.2532e-01],
  5146. [ 5.6293e-01, -3.8707e-01, 7.2426e-01, -9.5814e-01, -5.8268e-01,
  5147. -9.8491e-01, 1.2881e-01, 4.1034e-01],
  5148. [ 5.6966e-01, -4.4656e-01, 1.1973e+00, -1.1871e+00, -4.5712e-01,
  5149. -9.9653e-01, 5.2186e-01, 2.0324e-01],
  5150. [ 5.6951e-01, -3.9269e-01, 1.3226e+00, -9.0023e-01, -4.6721e-01,
  5151. -1.1928e+00, 1.7367e-01, 3.6998e-01],
  5152. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  5153. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  5154. [-2.2859e+00, -2.2859e+00, 1.8018e+00, -9.0023e-01, 1.9099e-01,
  5155. -1.2467e+00, 1.1057e+00, 3.7986e-01],
  5156. [ 6.2566e-01, -4.2731e-01, 1.8365e+00, -6.8822e-02, -4.6721e-01,
  5157. -6.1124e-02, 1.1715e+00, 1.6077e-01]]], device='cuda:0')
  5158. loss_train_step before backward: tensor(0.1541, device='cuda:0', grad_fn=<MseLossBackward>)
  5159.  
  5160. loss_train_step after backward: tensor(0.1541, device='cuda:0', grad_fn=<MseLossBackward>)
  5161. loss_train: 2.016780845820904
  5162. step: 22
  5163. running loss: 0.0916718566282229
  5164. Train Steps: 22/90 Loss: 0.0917 torch.Size([8, 600, 800])
  5165. torch.Size([8, 8])
  5166. tensor([[0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  5167. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  5168. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  5169. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  5170. [0.6200, 0.4070, 0.8938, 0.4183, 0.3538, 0.4567, 0.6175, 0.5400],
  5171. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  5172. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  5173. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084]],
  5174. device='cuda:0', dtype=torch.float64)
  5175. predictions are: tensor([[-0.0417, -0.8324, 1.5706, -0.6496, -0.5061, -0.7902, 0.3200, 0.1959],
  5176. [ 0.6402, -0.3714, 1.5161, -0.6605, -0.4793, -0.3589, 0.4657, 0.1758],
  5177. [ 0.0140, -0.7716, 1.4618, -0.3929, -0.4085, -0.4324, 0.2697, 0.1847],
  5178. [-0.0728, -0.8222, 1.4052, -0.7861, -0.5726, -1.2827, 0.1695, 0.2282],
  5179. [ 0.6133, -0.3940, 1.4564, -0.7158, -0.5758, -0.6346, 0.4125, 0.1667],
  5180. [-0.1707, -0.8710, 1.3833, -0.9728, -0.5769, -1.0311, 0.2213, 0.2043],
  5181. [ 0.1520, -0.6904, 1.5596, -0.5260, -0.2024, -0.6276, 0.3844, 0.1957],
  5182. [ 0.0610, -0.7315, 1.5109, -0.3846, -0.2611, -0.3896, 0.2713, 0.2347]],
  5183. device='cuda:0', grad_fn=<AddmmBackward>)
  5184. landmarks are: tensor([[[ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  5185. 0.1390],
  5186. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  5187. 0.1005],
  5188. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  5189. -0.0881],
  5190. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  5191. 0.2699],
  5192. [ 0.5778, -0.4061, 1.8423, -0.3537, -0.6520, -0.1766, 0.5663,
  5193. 0.2083],
  5194. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  5195. 0.0802],
  5196. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  5197. 0.2853],
  5198. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  5199. 0.0622]]], device='cuda:0')
  5200. loss_train_step before backward: tensor(0.1489, device='cuda:0', grad_fn=<MseLossBackward>)
  5201. loss_train_step after backward: tensor(0.1489, device='cuda:0', grad_fn=<MseLossBackward>)
  5202. loss_train: 2.1656840667128563
  5203. step: 23
  5204. running loss: 0.09416017681360245
  5205. Train Steps: 23/90 Loss: 0.0942 torch.Size([8, 600, 800])
  5206. torch.Size([8, 8])
  5207. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  5208. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  5209. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  5210. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  5211. [0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  5212. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  5213. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  5214. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220]],
  5215. device='cuda:0', dtype=torch.float64)
  5216. predictions are: tensor([[ 0.0037, -0.7422, 1.3922, -1.1547, -0.4432, -1.1044, 0.3581, 0.2139],
  5217. [ 0.3885, -0.5133, 1.5515, -0.7567, -0.6069, -0.8293, 0.3334, 0.1393],
  5218. [ 0.2714, -0.6226, 1.5515, -0.2874, -0.5171, -0.2793, 0.2606, 0.1226],
  5219. [-0.1505, -0.8803, 1.5943, -0.8312, -0.3734, -1.0537, 0.4488, 0.1856],
  5220. [ 0.5403, -0.4329, 1.4621, -0.1111, -0.4986, -0.3244, 0.2106, 0.2074],
  5221. [ 0.0936, -0.6823, 1.5448, -0.2891, -0.5000, -0.3389, 0.3101, 0.2221],
  5222. [ 0.5081, -0.4559, 1.6541, -0.3323, -0.2829, 0.0522, 0.4847, 0.1648],
  5223. [-0.2603, -0.9413, 0.9716, -1.3636, -0.4094, -1.4996, 0.1687, 0.2274]],
  5224. device='cuda:0', grad_fn=<AddmmBackward>)
  5225. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  5226. 0.2699],
  5227. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  5228. 0.0620],
  5229. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  5230. 0.1854],
  5231. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  5232. -0.0049],
  5233. [ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  5234. 0.3238],
  5235. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  5236. 0.3623],
  5237. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  5238. 0.0928],
  5239. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  5240. 0.1253]]], device='cuda:0')
  5241. loss_train_step before backward: tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward>)
  5242. loss_train_step after backward: tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward>)
  5243. loss_train: 2.2315543591976166
  5244. step: 24
  5245. running loss: 0.09298143163323402
  5246. Train Steps: 24/90 Loss: 0.0930 torch.Size([8, 600, 800])
  5247. torch.Size([8, 8])
  5248. tensor([[0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  5249. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  5250. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  5251. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  5252. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  5253. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  5254. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  5255. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320]],
  5256. device='cuda:0', dtype=torch.float64)
  5257. predictions are: tensor([[ 0.2694, -0.6120, 1.6079, -0.1341, -0.3535, -0.1856, 0.2777, 0.1239],
  5258. [-0.1129, -0.8312, 1.4104, -1.0356, -0.4240, -1.0812, 0.3827, 0.2333],
  5259. [ 0.3946, -0.4807, 1.1978, -0.9625, -0.5292, -0.8474, 0.3154, 0.2285],
  5260. [ 0.2245, -0.6238, 1.6883, -0.4121, -0.5650, -0.2460, 0.3334, 0.1264],
  5261. [-0.0742, -0.8103, 1.6389, -0.7168, -0.5823, -0.6310, 0.3868, 0.1623],
  5262. [ 0.3275, -0.5708, 1.5419, -0.0796, -0.3344, -0.2834, 0.2763, 0.1428],
  5263. [ 0.3363, -0.5500, 1.5343, -0.2309, -0.3338, -0.3383, 0.3287, 0.1582],
  5264. [ 0.4521, -0.4659, 1.3048, -1.2154, -0.4436, -1.2450, 0.4739, 0.1569]],
  5265. device='cuda:0', grad_fn=<AddmmBackward>)
  5266. landmarks are: tensor([[[ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  5267. 0.0261],
  5268. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  5269. 0.5701],
  5270. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  5271. 0.3469],
  5272. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  5273. 0.1775],
  5274. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  5275. 0.3315],
  5276. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  5277. 0.2138],
  5278. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  5279. 0.4239],
  5280. [ 0.6141, -0.4153, 1.4208, -1.2697, -0.2940, -1.0234, 0.8644,
  5281. 0.1715]]], device='cuda:0')
  5282. loss_train_step before backward: tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward>)
  5283. loss_train_step after backward: tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward>)
  5284. loss_train: 2.2920665852725506
  5285. step: 25
  5286. running loss: 0.09168266341090202
  5287. Train Steps: 25/90 Loss: 0.0917 torch.Size([8, 600, 800])
  5288. torch.Size([8, 8])
  5289. tensor([[0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  5290. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  5291. [0.6182, 0.3998, 0.8793, 0.4191, 0.3552, 0.4285, 0.6038, 0.5312],
  5292. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  5293. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  5294. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  5295. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  5296. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378]],
  5297. device='cuda:0', dtype=torch.float64)
  5298. predictions are: tensor([[ 0.5360, -0.4152, 1.2727, -0.8990, -0.4217, -0.8114, 0.3388, 0.2447],
  5299. [ 0.7213, -0.2711, 1.7282, -0.4758, -0.5359, -0.0893, 0.5664, 0.0697],
  5300. [ 0.5419, -0.4243, 1.8018, -0.3781, -0.5639, -0.1564, 0.3643, 0.1712],
  5301. [-0.1072, -0.8073, 1.2532, -1.0415, -0.3916, -1.0363, 0.3168, 0.2298],
  5302. [ 0.1826, -0.6807, 1.8562, -0.0210, -0.1675, -0.0548, 0.4331, 0.1280],
  5303. [-0.2581, -0.9261, 1.1611, -1.1396, -0.3878, -1.1883, 0.2695, 0.2118],
  5304. [-0.1382, -0.8743, 1.2336, -1.0734, -0.4734, -1.1985, 0.2244, 0.1587],
  5305. [ 0.9495, -0.1562, 1.7437, 0.2298, -0.6145, -0.1484, 0.3448, 0.1113]],
  5306. device='cuda:0', grad_fn=<AddmmBackward>)
  5307. landmarks are: tensor([[[ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  5308. 0.5401],
  5309. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  5310. -0.0099],
  5311. [ 0.5697, -0.4393, 1.7754, -0.3503, -0.6453, -0.3067, 0.5028,
  5312. 0.1677],
  5313. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  5314. 0.2622],
  5315. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  5316. 0.2026],
  5317. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  5318. 0.3469],
  5319. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  5320. -0.0580],
  5321. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  5322. 0.1982]]], device='cuda:0')
  5323. loss_train_step before backward: tensor(0.1472, device='cuda:0', grad_fn=<MseLossBackward>)
  5324.  
  5325. loss_train_step after backward: tensor(0.1472, device='cuda:0', grad_fn=<MseLossBackward>)
  5326. loss_train: 2.439281862229109
  5327. step: 26
  5328. running loss: 0.09381853316265804
  5329. Train Steps: 26/90 Loss: 0.0938 torch.Size([8, 600, 800])
  5330. torch.Size([8, 8])
  5331. tensor([[0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  5332. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  5333. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  5334. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  5335. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  5336. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  5337. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  5338. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913]],
  5339. device='cuda:0', dtype=torch.float64)
  5340. predictions are: tensor([[ 0.7377, -0.2847, 1.2891, -0.9831, -0.6037, -0.6774, 0.3743, 0.1758],
  5341. [ 0.7532, -0.3084, 1.7839, -0.0081, -0.2489, 0.1553, 0.4885, 0.1983],
  5342. [ 0.0920, -0.6706, 1.3227, -0.8929, -0.4635, -0.9294, 0.2370, 0.2070],
  5343. [ 0.4035, -0.5192, 1.7010, 0.0193, -0.2705, 0.0588, 0.4027, 0.1585],
  5344. [ 0.3594, -0.5149, 1.6956, 0.1053, -0.4258, -0.2073, 0.3934, 0.1345],
  5345. [ 0.7228, -0.2703, 1.5759, -0.6418, -0.6070, -0.4731, 0.3995, 0.1768],
  5346. [ 0.1192, -0.6348, 1.3703, -0.8587, -0.4873, -0.9933, 0.2480, 0.1672],
  5347. [-0.3907, -0.9933, 1.3532, -1.0529, -0.2807, -1.1499, 0.4252, 0.2074]],
  5348. device='cuda:0', grad_fn=<AddmmBackward>)
  5349. landmarks are: tensor([[[ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  5350. 0.0412],
  5351. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  5352. 0.2237],
  5353. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  5354. 0.3700],
  5355. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  5356. 0.4171],
  5357. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  5358. 0.3692],
  5359. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  5360. 0.2622],
  5361. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  5362. 0.0111],
  5363. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  5364. -0.0168]]], device='cuda:0')
  5365. loss_train_step before backward: tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward>)
  5366. loss_train_step after backward: tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward>)
  5367. loss_train: 2.498351190239191
  5368. step: 27
  5369. running loss: 0.09253152556441448
  5370. Train Steps: 27/90 Loss: 0.0925 torch.Size([8, 600, 800])
  5371. torch.Size([8, 8])
  5372. tensor([[0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  5373. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  5374. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  5375. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200],
  5376. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  5377. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  5378. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  5379. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563]],
  5380. device='cuda:0', dtype=torch.float64)
  5381. predictions are: tensor([[ 0.7374, -0.2478, 1.5541, -0.5682, -0.4088, -0.1455, 0.5582, 0.1738],
  5382. [ 0.8026, -0.1954, 1.4651, -0.5861, -0.5108, -0.2191, 0.4381, 0.1958],
  5383. [-0.3435, -0.9865, 1.1572, -0.7504, -0.3741, -0.8815, 0.1974, 0.2048],
  5384. [ 0.4001, -0.5106, 1.9784, -0.5306, -0.1866, -0.6455, 0.7068, 0.1653],
  5385. [ 0.8539, -0.2140, 1.7453, -0.1278, -0.4997, -0.1058, 0.3985, 0.1125],
  5386. [ 0.6154, -0.3897, 1.2614, -0.7802, -0.4414, -0.8929, 0.3122, 0.2156],
  5387. [ 0.7323, -0.2899, 1.3559, -0.6403, -0.4691, -0.8427, 0.2395, 0.2310],
  5388. [-0.4492, -1.0322, 1.4731, -0.4906, -0.4800, -0.5407, 0.1952, 0.1919]],
  5389. device='cuda:0', grad_fn=<AddmmBackward>)
  5390. landmarks are: tensor([[[ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  5391. 0.1390],
  5392. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  5393. 0.2545],
  5394. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  5395. 0.4019],
  5396. [ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  5397. 0.1159],
  5398. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  5399. -0.1151],
  5400. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  5401. 0.2576],
  5402. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  5403. 0.3392],
  5404. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  5405. 0.2837]]], device='cuda:0')
  5406. loss_train_step before backward: tensor(0.2237, device='cuda:0', grad_fn=<MseLossBackward>)
  5407. loss_train_step after backward: tensor(0.2237, device='cuda:0', grad_fn=<MseLossBackward>)
  5408. loss_train: 2.722070474177599
  5409. step: 28
  5410. running loss: 0.09721680264919996
  5411. Train Steps: 28/90 Loss: 0.0972 torch.Size([8, 600, 800])
  5412. torch.Size([8, 8])
  5413. tensor([[0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  5414. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  5415. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  5416. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  5417. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  5418. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  5419. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  5420. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773]],
  5421. device='cuda:0', dtype=torch.float64)
  5422. predictions are: tensor([[ 0.7305, -0.3132, 1.8139, 0.0944, -0.3673, 0.3312, 0.4564, 0.1943],
  5423. [ 0.4552, -0.4721, 1.6356, -0.4081, -0.5364, -0.3788, 0.2233, 0.1668],
  5424. [ 0.5072, -0.4483, 1.6649, 0.2623, -0.4183, 0.0033, 0.3367, 0.1549],
  5425. [-0.0679, -0.8478, 1.5491, -1.2164, -0.0420, -1.1702, 0.8427, 0.1657],
  5426. [ 0.4734, -0.4277, 1.4086, -0.7942, -0.5250, -0.4327, 0.4632, 0.2055],
  5427. [ 0.7182, -0.3058, 1.7048, -0.6412, -0.4689, -0.8560, 0.4083, 0.2025],
  5428. [ 0.4958, -0.4098, 1.5977, -0.2361, -0.4395, -0.1448, 0.4607, 0.1308],
  5429. [ 0.3944, -0.5354, 1.0374, -1.0903, -0.5026, -1.1602, 0.1620, 0.2851]],
  5430. device='cuda:0', grad_fn=<AddmmBackward>)
  5431. landmarks are: tensor([[[ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  5432. 0.1236],
  5433. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  5434. 0.0862],
  5435. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  5436. 0.1159],
  5437. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  5438. 0.1982],
  5439. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  5440. 0.2006],
  5441. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  5442. 0.2139],
  5443. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  5444. 0.1715],
  5445. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  5446. 0.3808]]], device='cuda:0')
  5447. loss_train_step before backward: tensor(0.0290, device='cuda:0', grad_fn=<MseLossBackward>)
  5448. loss_train_step after backward: tensor(0.0290, device='cuda:0', grad_fn=<MseLossBackward>)
  5449. loss_train: 2.751073746010661
  5450. step: 29
  5451. running loss: 0.09486461193140211
  5452. Train Steps: 29/90 Loss: 0.0949 torch.Size([8, 600, 800])
  5453. torch.Size([8, 8])
  5454. tensor([[0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  5455. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  5456. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  5457. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  5458. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  5459. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  5460. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  5461. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567]],
  5462. device='cuda:0', dtype=torch.float64)
  5463. predictions are: tensor([[ 0.6250, -0.4144, 1.6957, 0.1613, -0.4815, 0.1147, 0.3846, 0.1633],
  5464. [ 1.0344, -0.0511, 1.5689, 0.0435, -0.5933, -0.2652, 0.2690, 0.2165],
  5465. [ 0.4900, -0.4944, 1.4873, -1.2496, -0.2852, -1.3362, 0.6333, 0.2112],
  5466. [ 0.2213, -0.5748, 1.6522, -0.3171, -0.2605, 0.1559, 0.4833, 0.1932],
  5467. [ 0.6316, -0.3629, 1.5085, -0.9237, -0.4612, -1.0227, 0.4347, 0.2365],
  5468. [ 0.4009, -0.5173, 1.6601, 0.0104, -0.4300, 0.1274, 0.4248, 0.1939],
  5469. [ 0.6442, -0.3294, 1.5468, -0.6170, -0.3791, -0.6776, 0.6063, 0.1621],
  5470. [-0.3326, -0.9680, 1.2587, -1.1487, -0.3353, -1.1027, 0.3654, 0.2544]],
  5471. device='cuda:0', grad_fn=<AddmmBackward>)
  5472. landmarks are: tensor([[[ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  5473. 0.0697],
  5474. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  5475. 0.3392],
  5476. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  5477. -0.0369],
  5478. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  5479. 0.2936],
  5480. [ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  5481. 0.2622],
  5482. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  5483. 0.5239],
  5484. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  5485. 0.2035],
  5486. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  5487. 0.2853]]], device='cuda:0')
  5488. loss_train_step before backward: tensor(0.0458, device='cuda:0', grad_fn=<MseLossBackward>)
  5489. loss_train_step after backward: tensor(0.0458, device='cuda:0', grad_fn=<MseLossBackward>)
  5490. loss_train: 2.796903731301427
  5491. step: 30
  5492. running loss: 0.09323012437671423
  5493.  
  5494. Train Steps: 30/90 Loss: 0.0932 torch.Size([8, 600, 800])
  5495. torch.Size([8, 8])
  5496. tensor([[0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  5497. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  5498. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  5499. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  5500. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  5501. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  5502. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  5503. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567]],
  5504. device='cuda:0', dtype=torch.float64)
  5505. predictions are: tensor([[ 0.2950, -0.5529, 1.5650, -0.1983, -0.3732, -0.0056, 0.4572, 0.2051],
  5506. [ 0.6665, -0.3533, 1.6722, 0.3198, -0.4098, 0.0561, 0.4334, 0.2532],
  5507. [ 0.3297, -0.5676, 1.8212, -0.9010, -0.2561, -1.0195, 0.8730, 0.1724],
  5508. [ 0.9322, -0.1943, 1.7126, -0.6697, -0.4805, -0.9836, 0.5364, 0.2048],
  5509. [ 0.6783, -0.3507, 1.2963, -1.0498, -0.5918, -0.8010, 0.4516, 0.2145],
  5510. [ 0.4780, -0.4556, 1.7030, -0.1402, -0.4341, -0.1432, 0.4271, 0.2051],
  5511. [ 0.1772, -0.6843, 1.0516, -1.1705, -0.5276, -1.2873, 0.2467, 0.2395],
  5512. [ 0.4062, -0.5089, 1.7335, -0.1380, -0.1525, -0.0088, 0.4933, 0.1989]],
  5513. device='cuda:0', grad_fn=<AddmmBackward>)
  5514. landmarks are: tensor([[[ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  5515. 0.2296],
  5516. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  5517. 0.3007],
  5518. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  5519. 0.3050],
  5520. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  5521. 0.2139],
  5522. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  5523. 0.0412],
  5524. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  5525. 0.1439],
  5526. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  5527. 0.1890],
  5528. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  5529. 0.2853]]], device='cuda:0')
  5530. loss_train_step before backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  5531. loss_train_step after backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  5532. loss_train: 2.8161120787262917
  5533. step: 31
  5534. running loss: 0.09084232512020296
  5535. Train Steps: 31/90 Loss: 0.0908 torch.Size([8, 600, 800])
  5536. torch.Size([8, 8])
  5537. tensor([[0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  5538. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  5539. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  5540. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  5541. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  5542. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  5543. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  5544. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250]],
  5545. device='cuda:0', dtype=torch.float64)
  5546. predictions are: tensor([[ 0.3344, -0.5869, 1.6304, -0.2963, -0.3374, -0.3541, 0.4984, 0.2313],
  5547. [ 0.6908, -0.3503, 1.6515, -0.0700, -0.4126, -0.3634, 0.4649, 0.2478],
  5548. [ 0.7039, -0.3515, 1.7289, -0.5859, -0.5596, -1.0050, 0.6109, 0.1697],
  5549. [ 0.4358, -0.5206, 1.6912, -0.1203, -0.3773, -0.2881, 0.4537, 0.1943],
  5550. [ 0.6527, -0.3829, 1.6514, -0.3966, -0.3452, -0.1804, 0.4861, 0.2402],
  5551. [ 0.2703, -0.5918, 1.6975, -0.4348, -0.2091, -0.3389, 0.6179, 0.2223],
  5552. [ 0.6149, -0.3941, 1.2463, -1.3619, -0.5945, -1.1821, 0.4503, 0.2203],
  5553. [ 0.6631, -0.3669, 1.7404, -0.3028, -0.3693, -0.3110, 0.5155, 0.2463]],
  5554. device='cuda:0', grad_fn=<AddmmBackward>)
  5555. landmarks are: tensor([[[ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  5556. 0.1627],
  5557. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  5558. 0.3007],
  5559. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  5560. 0.1005],
  5561. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  5562. 0.0711],
  5563. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  5564. 0.2314],
  5565. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  5566. 0.2006],
  5567. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  5568. 0.0412],
  5569. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  5570. 0.1390]]], device='cuda:0')
  5571. loss_train_step before backward: tensor(0.0467, device='cuda:0', grad_fn=<MseLossBackward>)
  5572. loss_train_step after backward: tensor(0.0467, device='cuda:0', grad_fn=<MseLossBackward>)
  5573. loss_train: 2.8628441616892815
  5574. step: 32
  5575. running loss: 0.08946388005279005
  5576. Train Steps: 32/90 Loss: 0.0895 torch.Size([8, 600, 800])
  5577. torch.Size([8, 8])
  5578. tensor([[0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  5579. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  5580. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  5581. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  5582. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  5583. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  5584. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991],
  5585. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400]],
  5586. device='cuda:0', dtype=torch.float64)
  5587. predictions are: tensor([[ 0.3982, -0.5270, 1.6897, 0.0661, -0.4512, -0.1298, 0.4194, 0.2139],
  5588. [ 0.4820, -0.4519, 1.0651, -1.1793, -0.3780, -1.2608, 0.3199, 0.3024],
  5589. [ 0.7377, -0.2993, 1.5560, 0.0784, -0.4592, -0.0693, 0.3546, 0.2839],
  5590. [ 0.3434, -0.5464, 1.7874, -0.2388, -0.3171, -0.1256, 0.5441, 0.1799],
  5591. [ 0.4071, -0.4964, 1.8216, -0.1906, -0.4884, 0.0066, 0.5674, 0.1910],
  5592. [ 0.8802, -0.2046, 1.6890, 0.0257, -0.5662, -0.2507, 0.3828, 0.1599],
  5593. [ 0.1629, -0.7121, 1.8712, -0.8241, -0.1683, -0.9695, 0.9181, 0.1917],
  5594. [ 0.9275, -0.1944, 1.2945, -1.3044, -0.3726, -1.3874, 0.5662, 0.2288]],
  5595. device='cuda:0', grad_fn=<AddmmBackward>)
  5596. landmarks are: tensor([[[ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  5597. 0.1313],
  5598. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  5599. 0.3931],
  5600. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  5601. 0.5239],
  5602. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  5603. 0.0051],
  5604. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  5605. 0.2302],
  5606. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  5607. -0.0102],
  5608. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  5609. 0.4814],
  5610. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  5611. 0.2083]]], device='cuda:0')
  5612. loss_train_step before backward: tensor(0.0337, device='cuda:0', grad_fn=<MseLossBackward>)
  5613. loss_train_step after backward: tensor(0.0337, device='cuda:0', grad_fn=<MseLossBackward>)
  5614. loss_train: 2.8965813778340816
  5615. step: 33
  5616. running loss: 0.08777519326769945
  5617. Train Steps: 33/90 Loss: 0.0878 torch.Size([8, 600, 800])
  5618. torch.Size([8, 8])
  5619. tensor([[0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  5620. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  5621. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  5622. [0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  5623. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  5624. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  5625. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  5626. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367]],
  5627. device='cuda:0', dtype=torch.float64)
  5628. predictions are: tensor([[ 7.4253e-01, -3.1317e-01, 1.4131e+00, -8.4927e-01, -4.4791e-01,
  5629. -8.2762e-01, 5.7978e-01, 2.1282e-01],
  5630. [ 4.5485e-01, -4.8451e-01, 1.7093e+00, 3.4834e-01, -4.3732e-01,
  5631. -1.3684e-02, 3.7540e-01, 2.9459e-01],
  5632. [ 3.7311e-01, -5.3037e-01, 1.1646e+00, -8.6670e-01, -5.0887e-01,
  5633. -7.3844e-01, 2.4022e-01, 2.4823e-01],
  5634. [ 7.2810e-01, -3.0743e-01, 1.7642e+00, -2.3315e-01, -4.7777e-01,
  5635. -3.8799e-01, 5.0412e-01, 2.1321e-01],
  5636. [ 2.1975e-01, -6.6211e-01, 1.9491e+00, -2.8295e-01, -1.4412e-01,
  5637. -5.3107e-01, 8.4005e-01, 2.2348e-01],
  5638. [ 3.7371e-01, -5.1912e-01, 1.7898e+00, -9.8038e-04, -4.0995e-01,
  5639. 1.5966e-01, 5.4400e-01, 1.4020e-01],
  5640. [ 8.9009e-01, -2.2979e-01, 1.2286e+00, -9.8838e-01, -5.1678e-01,
  5641. -9.6966e-01, 4.1535e-01, 2.4532e-01],
  5642. [ 8.0319e-01, -2.6611e-01, 1.7041e+00, -7.1392e-01, -3.1660e-01,
  5643. -9.2966e-01, 6.5947e-01, 2.2535e-01]], device='cuda:0',
  5644. grad_fn=<AddmmBackward>)
  5645. landmarks are: tensor([[[ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  5646. 0.1080],
  5647. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  5648. 0.3084],
  5649. [ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  5650. 0.1710],
  5651. [ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  5652. 0.2464],
  5653. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  5654. 0.4600],
  5655. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  5656. -0.0670],
  5657. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  5658. 0.0562],
  5659. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  5660. 0.1931]]], device='cuda:0')
  5661. loss_train_step before backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  5662. loss_train_step after backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  5663. loss_train: 2.92330539226532
  5664. step: 34
  5665. running loss: 0.0859795703607447
  5666.  
  5667. Train Steps: 34/90 Loss: 0.0860 torch.Size([8, 600, 800])
  5668. torch.Size([8, 8])
  5669. tensor([[0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  5670. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  5671. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  5672. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  5673. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  5674. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  5675. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  5676. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390]],
  5677. device='cuda:0', dtype=torch.float64)
  5678. predictions are: tensor([[ 0.8903, -0.2314, 1.6684, -0.4563, -0.6001, -0.5134, 0.4911, 0.2531],
  5679. [ 0.6476, -0.3743, 1.3517, -1.0156, -0.4161, -1.1527, 0.6536, 0.2023],
  5680. [ 0.3698, -0.5161, 1.6889, 0.1680, -0.3293, 0.1163, 0.4273, 0.2552],
  5681. [ 0.4036, -0.4773, 1.3534, -0.6551, -0.5117, -0.5085, 0.4268, 0.2266],
  5682. [ 0.5026, -0.4508, 1.7764, 0.0095, -0.2172, 0.1691, 0.5443, 0.2641],
  5683. [ 0.8662, -0.2546, 1.6973, -0.5305, -0.3797, -1.0850, 0.5950, 0.2191],
  5684. [ 0.7662, -0.2932, 1.5427, -0.9673, -0.3746, -1.1312, 0.6072, 0.1884],
  5685. [ 0.2559, -0.5938, 1.7963, 0.2113, -0.3554, 0.0888, 0.5212, 0.1696]],
  5686. device='cuda:0', grad_fn=<AddmmBackward>)
  5687. landmarks are: tensor([[[ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  5688. 0.3392],
  5689. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  5690. 0.1195],
  5691. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  5692. 0.3777],
  5693. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  5694. 0.3417],
  5695. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  5696. 0.4316],
  5697. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  5698. -0.0529],
  5699. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  5700. 0.0851],
  5701. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  5702. 0.2035]]], device='cuda:0')
  5703. loss_train_step before backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  5704. loss_train_step after backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  5705. loss_train: 2.944044752046466
  5706. step: 35
  5707. running loss: 0.08411556434418474
  5708. Train Steps: 35/90 Loss: 0.0841 torch.Size([8, 600, 800])
  5709. torch.Size([8, 8])
  5710. tensor([[ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  5711. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  5712. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  5713. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  5714. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  5715. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  5716. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  5717. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693]],
  5718. device='cuda:0', dtype=torch.float64)
  5719. predictions are: tensor([[ 0.1132, -0.7020, 1.3995, -0.7614, -0.5315, -0.8818, 0.3390, 0.2145],
  5720. [ 0.6932, -0.3358, 1.7980, -0.1423, -0.4874, -0.1082, 0.4483, 0.2249],
  5721. [ 1.0330, -0.1652, 1.8622, 0.3639, -0.4635, 0.0057, 0.5467, 0.1839],
  5722. [-0.3976, -1.0464, 1.0914, -1.1965, -0.3316, -1.3292, 0.3589, 0.2467],
  5723. [ 0.4669, -0.4691, 1.8673, 0.1160, -0.2885, 0.2232, 0.6384, 0.2342],
  5724. [ 0.8902, -0.2152, 1.3809, -1.1008, -0.2806, -1.3165, 0.6639, 0.2483],
  5725. [ 1.1518, -0.0532, 1.6962, -0.6029, -0.5221, -0.6022, 0.6503, 0.2845],
  5726. [ 0.8269, -0.2339, 1.7614, 0.1012, -0.4519, -0.0218, 0.5402, 0.1910]],
  5727. device='cuda:0', grad_fn=<AddmmBackward>)
  5728. landmarks are: tensor([[[-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  5729. 0.1133],
  5730. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  5731. 0.0893],
  5732. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  5733. -0.0049],
  5734. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  5735. 0.1073],
  5736. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  5737. 0.1322],
  5738. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  5739. 0.2083],
  5740. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  5741. 0.5624],
  5742. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  5743. -0.1181]]], device='cuda:0')
  5744. loss_train_step before backward: tensor(0.2440, device='cuda:0', grad_fn=<MseLossBackward>)
  5745. loss_train_step after backward: tensor(0.2440, device='cuda:0', grad_fn=<MseLossBackward>)
  5746. loss_train: 3.1880801748484373
  5747. step: 36
  5748. running loss: 0.08855778263467881
  5749. Train Steps: 36/90 Loss: 0.0886 torch.Size([8, 600, 800])
  5750. torch.Size([8, 8])
  5751. tensor([[0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  5752. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  5753. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  5754. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  5755. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  5756. [0.6275, 0.4157, 0.8337, 0.5800, 0.3763, 0.4200, 0.5547, 0.6125],
  5757. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  5758. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901]],
  5759. device='cuda:0', dtype=torch.float64)
  5760. predictions are: tensor([[ 0.6768, -0.3240, 1.6868, -1.0501, -0.2776, -1.1492, 0.7312, 0.1656],
  5761. [ 0.6052, -0.3957, 1.7534, -0.1127, -0.5399, -0.3517, 0.5323, 0.1732],
  5762. [ 0.3163, -0.5653, 1.7590, -0.0033, -0.3279, 0.0508, 0.4693, 0.2262],
  5763. [ 0.7730, -0.3122, 1.8314, -0.1909, -0.5424, -0.1122, 0.4518, 0.2226],
  5764. [ 0.7522, -0.3238, 1.3224, -1.1095, -0.3794, -1.1402, 0.5556, 0.2368],
  5765. [ 0.8689, -0.2526, 1.6390, 0.1715, -0.4881, -0.2192, 0.3752, 0.2783],
  5766. [ 0.3152, -0.6392, 1.7184, 0.0382, -0.4561, -0.1316, 0.4029, 0.2143],
  5767. [ 0.4995, -0.4912, 1.5503, -0.8207, -0.5154, -0.7694, 0.6317, 0.1574]],
  5768. device='cuda:0', grad_fn=<AddmmBackward>)
  5769. landmarks are: tensor([[[ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  5770. 0.1467],
  5771. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  5772. 0.1082],
  5773. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  5774. 0.1322],
  5775. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  5776. 0.1775],
  5777. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  5778. 0.3315],
  5779. [ 0.6124, -0.3658, 1.5651, 0.3931, -0.5480, -0.3460, 0.2761,
  5780. 0.5431],
  5781. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  5782. 0.3777],
  5783. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  5784. -0.0220]]], device='cuda:0')
  5785. loss_train_step before backward: tensor(0.0140, device='cuda:0', grad_fn=<MseLossBackward>)
  5786. loss_train_step after backward: tensor(0.0140, device='cuda:0', grad_fn=<MseLossBackward>)
  5787. loss_train: 3.2020612247288227
  5788. step: 37
  5789. running loss: 0.08654219526294116
  5790. Train Steps: 37/90 Loss: 0.0865 torch.Size([8, 600, 800])
  5791. torch.Size([8, 8])
  5792. tensor([[0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  5793. [0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  5794. [0.6216, 0.4100, 0.7350, 0.2067, 0.4325, 0.2050, 0.5950, 0.5333],
  5795. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  5796. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  5797. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  5798. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  5799. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426]],
  5800. device='cuda:0', dtype=torch.float64)
  5801. predictions are: tensor([[ 0.5374, -0.4509, 1.7941, 0.2094, -0.3937, 0.1123, 0.4918, 0.2022],
  5802. [ 0.6597, -0.3745, 1.7606, 0.0741, -0.4634, 0.1028, 0.4925, 0.2353],
  5803. [ 0.3929, -0.5305, 1.1526, -1.1111, -0.3497, -1.3115, 0.4014, 0.2133],
  5804. [ 0.3941, -0.5861, 1.9533, 0.0592, -0.3937, -0.2195, 0.7192, 0.2054],
  5805. [ 0.7141, -0.3497, 1.5147, -0.8251, -0.4656, -0.9256, 0.4631, 0.2019],
  5806. [ 0.7035, -0.3585, 1.7677, -0.3576, -0.5942, -0.2835, 0.4756, 0.1937],
  5807. [ 0.6302, -0.3811, 1.2863, -0.9902, -0.5425, -0.8486, 0.4420, 0.1782],
  5808. [ 0.4674, -0.5172, 1.7270, -0.2313, -0.5116, -0.5873, 0.4607, 0.1997]],
  5809. device='cuda:0', grad_fn=<AddmmBackward>)
  5810. landmarks are: tensor([[[ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  5811. 0.1627],
  5812. [ 0.5763, -0.3963, 1.7788, -0.0765, -0.6520, -0.0842, 0.4624,
  5813. 0.2776],
  5814. [ 0.5853, -0.3920, 1.1090, -1.3313, -0.2882, -1.3390, 0.4624,
  5815. 0.1775],
  5816. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  5817. 0.4386],
  5818. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  5819. 0.1931],
  5820. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  5821. 0.0802],
  5822. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  5823. 0.0622],
  5824. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  5825. 0.2203]]], device='cuda:0')
  5826. loss_train_step before backward: tensor(0.0173, device='cuda:0', grad_fn=<MseLossBackward>)
  5827. loss_train_step after backward: tensor(0.0173, device='cuda:0', grad_fn=<MseLossBackward>)
  5828. loss_train: 3.2193711400032043
  5829. step: 38
  5830. running loss: 0.08472029315797906
  5831.  
  5832. Train Steps: 38/90 Loss: 0.0847 torch.Size([8, 600, 800])
  5833. torch.Size([8, 8])
  5834. tensor([[0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  5835. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  5836. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  5837. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  5838. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  5839. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  5840. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  5841. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267]],
  5842. device='cuda:0', dtype=torch.float64)
  5843. predictions are: tensor([[ 0.3966, -0.5936, 1.8039, 0.2802, -0.5525, -0.2142, 0.4026, 0.1941],
  5844. [ 0.7885, -0.2987, 1.7053, -0.3514, -0.5758, -0.1134, 0.5165, 0.1591],
  5845. [ 0.6118, -0.3937, 1.6096, -0.7545, -0.3470, -1.0085, 0.4864, 0.1848],
  5846. [ 0.2276, -0.6336, 1.0980, -0.9782, -0.5359, -0.9213, 0.2522, 0.2356],
  5847. [ 0.6053, -0.4369, 1.8010, 0.2543, -0.5330, 0.1212, 0.4244, 0.2200],
  5848. [ 0.6160, -0.4273, 1.6637, -0.5837, -0.6304, -0.6150, 0.4379, 0.2124],
  5849. [ 0.6644, -0.3704, 1.7846, -0.1783, -0.4724, 0.0512, 0.6495, 0.2111],
  5850. [ 0.3931, -0.5582, 1.4735, -1.0682, -0.2781, -1.2448, 0.7007, 0.1874]],
  5851. device='cuda:0', grad_fn=<AddmmBackward>)
  5852. landmarks are: tensor([[[ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  5853. -0.0370],
  5854. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  5855. 0.0840],
  5856. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  5857. -0.0368],
  5858. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  5859. 0.2476],
  5860. [ 0.5767, -0.4396, 1.6782, 0.1905, -0.3844, 0.0308, 0.4588,
  5861. 0.0855],
  5862. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  5863. 0.3315],
  5864. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  5865. 0.2249],
  5866. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  5867. 0.1467]]], device='cuda:0')
  5868. loss_train_step before backward: tensor(0.0228, device='cuda:0', grad_fn=<MseLossBackward>)
  5869. loss_train_step after backward: tensor(0.0228, device='cuda:0', grad_fn=<MseLossBackward>)
  5870. loss_train: 3.242176616564393
  5871. step: 39
  5872. running loss: 0.08313273375806136
  5873. Train Steps: 39/90 Loss: 0.0831 torch.Size([8, 600, 800])
  5874. torch.Size([8, 8])
  5875. tensor([[0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  5876. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  5877. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  5878. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  5879. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  5880. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  5881. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  5882. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334]],
  5883. device='cuda:0', dtype=torch.float64)
  5884. predictions are: tensor([[ 3.5106e-01, -6.2456e-01, 1.8187e+00, -1.4204e-01, -7.0050e-01,
  5885. -4.5938e-01, 4.0855e-01, 1.4211e-01],
  5886. [ 3.8717e-01, -5.6815e-01, 1.1987e+00, -1.1633e+00, -4.1027e-01,
  5887. -1.3726e+00, 3.9880e-01, 2.0288e-01],
  5888. [ 5.8238e-01, -4.1615e-01, 1.8140e+00, -5.7646e-02, -3.4776e-01,
  5889. -5.9229e-03, 4.6542e-01, 2.3383e-01],
  5890. [ 1.1506e-01, -7.4752e-01, 1.2902e+00, -1.1127e+00, -3.6575e-01,
  5891. -1.3568e+00, 4.9368e-01, 2.0120e-01],
  5892. [ 9.3898e-01, -1.8494e-01, 1.8908e+00, 1.1370e-03, -5.2647e-01,
  5893. 2.3662e-01, 5.5223e-01, 1.8537e-01],
  5894. [ 7.6586e-01, -3.0031e-01, 1.8964e+00, 9.3340e-02, -4.1862e-01,
  5895. 3.0666e-01, 5.2751e-01, 2.0029e-01],
  5896. [ 6.4795e-01, -4.0853e-01, 1.7987e+00, -6.2643e-03, -6.3486e-01,
  5897. -1.4099e-01, 4.4951e-01, 1.5382e-01],
  5898. [ 4.4453e-01, -5.2647e-01, 1.3447e+00, -1.0519e+00, -6.0382e-01,
  5899. -9.8575e-01, 5.0882e-01, 1.7739e-01]], device='cuda:0',
  5900. grad_fn=<AddmmBackward>)
  5901. landmarks are: tensor([[[ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  5902. 0.0467],
  5903. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  5904. 0.2006],
  5905. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  5906. 0.3007],
  5907. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  5908. 0.2083],
  5909. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  5910. 0.0851],
  5911. [ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  5912. 0.1929],
  5913. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  5914. 0.0727],
  5915. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  5916. 0.1779]]], device='cuda:0')
  5917. loss_train_step before backward: tensor(0.0254, device='cuda:0', grad_fn=<MseLossBackward>)
  5918. loss_train_step after backward: tensor(0.0254, device='cuda:0', grad_fn=<MseLossBackward>)
  5919. loss_train: 3.2675318624824286
  5920. step: 40
  5921. running loss: 0.08168829656206071
  5922. Train Steps: 40/90 Loss: 0.0817 torch.Size([8, 600, 800])
  5923. torch.Size([8, 8])
  5924. tensor([[0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  5925. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  5926. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  5927. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  5928. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  5929. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  5930. [0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  5931. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351]],
  5932. device='cuda:0', dtype=torch.float64)
  5933. predictions are: tensor([[ 0.4367, -0.5225, 1.2960, -1.1648, -0.3793, -1.1430, 0.5874, 0.1746],
  5934. [ 0.1962, -0.6501, 1.1282, -1.0401, -0.5617, -0.9396, 0.2712, 0.2072],
  5935. [ 0.6875, -0.3992, 1.8857, 0.2476, -0.6058, -0.0681, 0.4812, 0.1275],
  5936. [ 0.7143, -0.3665, 1.8605, 0.0773, -0.5132, 0.1704, 0.4499, 0.2356],
  5937. [ 0.6062, -0.4491, 1.9378, 0.2578, -0.6167, -0.0194, 0.5542, 0.1477],
  5938. [ 0.5631, -0.4239, 1.6553, -0.6901, -0.5287, -0.7452, 0.4552, 0.1585],
  5939. [ 0.6069, -0.3986, 1.7356, -0.1607, -0.5416, 0.0315, 0.4627, 0.1705],
  5940. [ 0.2619, -0.6570, 1.2979, -1.1250, -0.3744, -1.2685, 0.4204, 0.1447]],
  5941. device='cuda:0', grad_fn=<AddmmBackward>)
  5942. landmarks are: tensor([[[ 5.8614e-01, -3.9292e-01, 1.0570e+00, -1.4314e+00, -3.2864e-01,
  5943. -1.1235e+00, 6.1824e-01, 1.8522e-01],
  5944. [ 5.4099e-01, -4.3210e-01, 8.8383e-01, -9.8491e-01, -5.7691e-01,
  5945. -1.0003e+00, 2.6028e-01, 3.3149e-01],
  5946. [ 6.3949e-01, -4.2132e-01, 1.7037e+00, 3.6228e-01, -4.3256e-01,
  5947. -1.0731e-01, 6.5602e-01, -4.8817e-03],
  5948. [ 5.5393e-01, -4.0308e-01, 1.7168e+00, -5.9398e-02, -3.7483e-01,
  5949. 5.4350e-02, 1.3903e-01, 3.7768e-01],
  5950. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  5951. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  5952. [ 5.8932e-01, -3.8468e-01, 1.7152e+00, -6.6159e-01, -5.9423e-01,
  5953. -7.9246e-01, 4.1039e-01, 1.6982e-01],
  5954. [ 5.4440e-01, -3.8460e-01, 1.6171e+00, -1.6890e-01, -5.8845e-01,
  5955. -3.8029e-02, 1.7915e-01, 2.2961e-01],
  5956. [ 5.6637e-01, -4.3212e-01, 1.2862e+00, -1.0003e+00, -2.1894e-01,
  5957. -1.4608e+00, 3.8827e-01, 1.8549e-01]]], device='cuda:0')
  5958. loss_train_step before backward: tensor(0.0188, device='cuda:0', grad_fn=<MseLossBackward>)
  5959. loss_train_step after backward: tensor(0.0188, device='cuda:0', grad_fn=<MseLossBackward>)
  5960. loss_train: 3.2863815408200026
  5961. step: 41
  5962. running loss: 0.08015564733707323
  5963. Train Steps: 41/90 Loss: 0.0802 torch.Size([8, 600, 800])
  5964. torch.Size([8, 8])
  5965. tensor([[0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  5966. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  5967. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  5968. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  5969. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  5970. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  5971. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  5972. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038]],
  5973. device='cuda:0', dtype=torch.float64)
  5974. predictions are: tensor([[ 0.6545, -0.3618, 1.5680, -0.6445, -0.5170, -0.7510, 0.4842, 0.1577],
  5975. [ 0.4752, -0.4913, 1.6541, -0.3822, -0.6434, -0.4164, 0.4551, 0.2095],
  5976. [ 0.3454, -0.5692, 1.5968, -0.1963, -0.6108, -0.2757, 0.2590, 0.1625],
  5977. [-0.3859, -1.0327, 1.4048, -1.1683, -0.1083, -1.1432, 0.6973, 0.1848],
  5978. [ 0.7585, -0.2932, 1.6858, -0.1326, -0.3363, 0.0059, 0.4644, 0.1856],
  5979. [ 0.8664, -0.2708, 1.8608, -0.0368, -0.6589, -0.0560, 0.5618, 0.1448],
  5980. [ 0.7278, -0.3654, 1.6793, 0.0226, -0.5101, -0.1967, 0.3999, 0.1454],
  5981. [ 0.5154, -0.4584, 1.2732, -1.0080, -0.6305, -0.8144, 0.3943, 0.1073]],
  5982. device='cuda:0', grad_fn=<AddmmBackward>)
  5983. landmarks are: tensor([[[ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  5984. 0.3315],
  5985. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  5986. 0.1929],
  5987. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  5988. 0.0893],
  5989. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  5990. 0.3104],
  5991. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  5992. 0.3007],
  5993. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  5994. 0.1313],
  5995. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  5996. 0.1854],
  5997. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  5998. 0.0412]]], device='cuda:0')
  5999. loss_train_step before backward: tensor(0.1001, device='cuda:0', grad_fn=<MseLossBackward>)
  6000. loss_train_step after backward: tensor(0.1001, device='cuda:0', grad_fn=<MseLossBackward>)
  6001. loss_train: 3.386511316522956
  6002. step: 42
  6003. running loss: 0.08063122182197514
  6004.  
  6005. Train Steps: 42/90 Loss: 0.0806 torch.Size([8, 600, 800])
  6006. torch.Size([8, 8])
  6007. tensor([[0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  6008. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  6009. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  6010. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  6011. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  6012. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  6013. [ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  6014. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367]],
  6015. device='cuda:0', dtype=torch.float64)
  6016. predictions are: tensor([[ 0.3529, -0.5591, 1.5007, -0.3760, -0.6113, -0.3282, 0.2479, 0.2410],
  6017. [ 0.8080, -0.2771, 1.6025, -0.3582, -0.6192, -0.1207, 0.3971, 0.0940],
  6018. [ 0.5119, -0.4641, 1.4563, -0.7292, -0.5492, -0.8653, 0.3301, 0.0829],
  6019. [ 0.2396, -0.6196, 1.5460, -0.4810, -0.4276, -0.7962, 0.3526, 0.1782],
  6020. [ 0.9781, -0.1953, 1.7784, 0.0812, -0.5292, 0.1354, 0.6026, 0.1393],
  6021. [ 0.7572, -0.3118, 1.6693, -0.2089, -0.5883, -0.2834, 0.4285, 0.1437],
  6022. [-0.4364, -1.0733, 1.4616, -1.2481, -0.0045, -1.1192, 0.8184, 0.1947],
  6023. [ 0.5306, -0.4469, 1.6497, -0.4279, -0.6176, -0.3333, 0.4536, 0.1986]],
  6024. device='cuda:0', grad_fn=<AddmmBackward>)
  6025. landmarks are: tensor([[[ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  6026. 0.4145],
  6027. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  6028. 0.0502],
  6029. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  6030. 0.1005],
  6031. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  6032. 0.1929],
  6033. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  6034. 0.3905],
  6035. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  6036. 0.2314],
  6037. [-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  6038. 0.3638],
  6039. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  6040. 0.1929]]], device='cuda:0')
  6041. loss_train_step before backward: tensor(0.1016, device='cuda:0', grad_fn=<MseLossBackward>)
  6042. loss_train_step after backward: tensor(0.1016, device='cuda:0', grad_fn=<MseLossBackward>)
  6043. loss_train: 3.488085037097335
  6044. step: 43
  6045. running loss: 0.08111825667668221
  6046. Train Steps: 43/90 Loss: 0.0811 torch.Size([8, 600, 800])
  6047. torch.Size([8, 8])
  6048. tensor([[0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  6049. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  6050. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  6051. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  6052. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  6053. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  6054. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  6055. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667]],
  6056. device='cuda:0', dtype=torch.float64)
  6057. predictions are: tensor([[ 0.5349, -0.4455, 1.7570, -0.2074, -0.5198, -0.4080, 0.4787, 0.1820],
  6058. [ 0.8963, -0.2477, 1.9448, -0.1026, -0.4083, 0.2798, 0.6832, 0.1334],
  6059. [ 0.3211, -0.5580, 1.6122, -0.2500, -0.5693, -0.4049, 0.2903, 0.1702],
  6060. [ 0.3067, -0.5936, 1.0340, -1.2498, -0.3961, -1.2777, 0.3361, 0.1416],
  6061. [ 0.9243, -0.1990, 1.6087, -0.5908, -0.5360, -0.4200, 0.5517, 0.1284],
  6062. [ 0.6387, -0.3762, 1.7011, 0.0358, -0.4203, 0.0398, 0.3977, 0.1838],
  6063. [-0.7036, -1.2559, 1.3289, -0.8699, -0.4771, -0.9723, 0.2688, 0.1476],
  6064. [ 0.5620, -0.4357, 1.7383, -0.5753, -0.5294, -0.5052, 0.5535, 0.1751]],
  6065. device='cuda:0', grad_fn=<AddmmBackward>)
  6066. landmarks are: tensor([[[ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  6067. 0.1499],
  6068. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  6069. 0.1082],
  6070. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  6071. 0.2468],
  6072. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  6073. 0.2576],
  6074. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  6075. 0.2930],
  6076. [ 0.5784, -0.4088, 1.7268, 0.0467, -0.3344, 0.0697, 0.5490,
  6077. 0.2545],
  6078. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  6079. 0.0893],
  6080. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  6081. 0.3315]]], device='cuda:0')
  6082. loss_train_step before backward: tensor(0.0732, device='cuda:0', grad_fn=<MseLossBackward>)
  6083. loss_train_step after backward: tensor(0.0732, device='cuda:0', grad_fn=<MseLossBackward>)
  6084. loss_train: 3.561272194609046
  6085. step: 44
  6086. running loss: 0.08093800442293286
  6087. Train Steps: 44/90 Loss: 0.0809 torch.Size([8, 600, 800])
  6088. torch.Size([8, 8])
  6089. tensor([[0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  6090. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  6091. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  6092. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  6093. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  6094. [0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  6095. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  6096. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575]],
  6097. device='cuda:0', dtype=torch.float64)
  6098. predictions are: tensor([[ 0.5818, -0.3966, 1.3973, -0.8580, -0.6440, -0.5126, 0.4475, 0.1186],
  6099. [ 0.4153, -0.4874, 1.2256, -0.7259, -0.5466, -0.6686, 0.3026, 0.2101],
  6100. [ 0.7514, -0.3059, 1.7006, 0.0987, -0.3783, 0.1060, 0.2963, 0.1680],
  6101. [-0.2648, -0.9652, 1.7160, -0.6842, -0.1627, -0.8070, 0.7399, 0.2166],
  6102. [ 0.5834, -0.4091, 1.7065, -0.0113, -0.5106, 0.1586, 0.4210, 0.1692],
  6103. [ 0.2055, -0.6349, 1.4568, -0.9875, -0.3721, -1.0002, 0.5307, 0.1490],
  6104. [ 0.5841, -0.4346, 1.6850, -0.2511, -0.6876, -0.1978, 0.3221, 0.1884],
  6105. [ 0.0765, -0.7286, 1.7289, -0.5439, -0.2815, -0.7442, 0.6015, 0.1698]],
  6106. device='cuda:0', grad_fn=<AddmmBackward>)
  6107. landmarks are: tensor([[[ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  6108. 0.1159],
  6109. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  6110. 0.3469],
  6111. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  6112. 0.0532],
  6113. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  6114. 0.3478],
  6115. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  6116. 0.1322],
  6117. [ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  6118. 0.1621],
  6119. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  6120. 0.2930],
  6121. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  6122. 0.2890]]], device='cuda:0')
  6123. loss_train_step before backward: tensor(0.2405, device='cuda:0', grad_fn=<MseLossBackward>)
  6124. loss_train_step after backward: tensor(0.2405, device='cuda:0', grad_fn=<MseLossBackward>)
  6125. loss_train: 3.8017283137887716
  6126. step: 45
  6127. running loss: 0.08448285141752826
  6128. Train Steps: 45/90 Loss: 0.0845 torch.Size([8, 600, 800])
  6129. torch.Size([8, 8])
  6130. tensor([[0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  6131. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  6132. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  6133. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  6134. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  6135. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  6136. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  6137. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892]],
  6138. device='cuda:0', dtype=torch.float64)
  6139. predictions are: tensor([[ 0.2672, -0.5984, 1.5340, -0.0941, -0.3328, -0.1551, 0.3480, 0.2435],
  6140. [ 0.4768, -0.4793, 1.7141, -0.1435, -0.5566, -0.1459, 0.5068, 0.1785],
  6141. [ 0.1151, -0.7118, 1.6953, -0.8581, -0.3410, -0.9446, 0.6515, 0.1427],
  6142. [ 0.2253, -0.6507, 1.7210, -0.3347, -0.5786, -0.4340, 0.3847, 0.1178],
  6143. [ 0.5995, -0.4095, 1.6505, -0.4597, -0.5058, -0.2441, 0.3787, 0.1836],
  6144. [ 0.4865, -0.4288, 1.3854, -0.7569, -0.5593, -0.5213, 0.3683, 0.1623],
  6145. [ 0.2983, -0.6022, 1.6223, 0.0036, -0.2758, -0.0715, 0.3743, 0.2261],
  6146. [-0.1031, -0.8570, 1.6374, -0.9917, -0.2689, -1.0909, 0.6932, 0.1572]],
  6147. device='cuda:0', grad_fn=<AddmmBackward>)
  6148. landmarks are: tensor([[[ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  6149. 0.3084],
  6150. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  6151. 0.0851],
  6152. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  6153. 0.1544],
  6154. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  6155. 0.0774],
  6156. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  6157. 0.3087],
  6158. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  6159. 0.2206],
  6160. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  6161. 0.2138],
  6162. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  6163. -0.0263]]], device='cuda:0')
  6164. loss_train_step before backward: tensor(0.0429, device='cuda:0', grad_fn=<MseLossBackward>)
  6165. loss_train_step after backward: tensor(0.0429, device='cuda:0', grad_fn=<MseLossBackward>)
  6166. loss_train: 3.8446308206766844
  6167. step: 46
  6168. running loss: 0.08357893088427575
  6169.  
  6170. Train Steps: 46/90 Loss: 0.0836 torch.Size([8, 600, 800])
  6171. torch.Size([8, 8])
  6172. tensor([[0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  6173. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  6174. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  6175. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  6176. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  6177. [ nan, nan, 0.7412, 0.2200, 0.4450, 0.1517, 0.5312, 0.4983],
  6178. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  6179. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220]],
  6180. device='cuda:0', dtype=torch.float64)
  6181. predictions are: tensor([[ 5.1204e-01, -4.0808e-01, 2.0241e+00, -6.4815e-04, -3.0531e-01,
  6182. -2.6063e-01, 6.0652e-01, 2.0491e-01],
  6183. [ 7.8274e-01, -2.8036e-01, 1.8523e+00, -4.5895e-01, -4.4856e-01,
  6184. 9.5163e-03, 7.9724e-01, 1.7100e-01],
  6185. [ 1.6438e-02, -7.3354e-01, 1.6209e+00, -8.2435e-01, -2.8295e-01,
  6186. -8.0990e-01, 6.1467e-01, 1.8458e-01],
  6187. [ 1.1100e+00, -7.7610e-02, 1.8684e+00, -1.1496e-01, -5.9891e-01,
  6188. 1.6606e-01, 4.7673e-01, 1.2712e-01],
  6189. [ 7.8423e-01, -2.5731e-01, 1.6101e+00, -3.6818e-01, -6.1474e-01,
  6190. -1.4655e-01, 3.7293e-01, 1.9924e-01],
  6191. [-1.0913e+00, -1.4849e+00, 1.1627e+00, -9.4262e-01, -2.5918e-01,
  6192. -1.1330e+00, 3.0192e-01, 2.3340e-01],
  6193. [-3.3309e-01, -9.9671e-01, 1.1426e+00, -8.3217e-01, -3.9860e-01,
  6194. -1.0915e+00, 2.8002e-01, 2.2096e-01],
  6195. [-2.7431e-01, -9.2364e-01, 1.1610e+00, -8.5328e-01, -3.1564e-01,
  6196. -1.1378e+00, 2.8685e-01, 2.2268e-01]], device='cuda:0',
  6197. grad_fn=<AddmmBackward>)
  6198. landmarks are: tensor([[[ 6.5365e-01, -3.6231e-01, 1.9115e+00, -2.6898e-01, -4.0370e-01,
  6199. -8.3095e-01, 6.9257e-01, 1.6077e-01],
  6200. [ 6.1577e-01, -4.2490e-01, 1.8654e+00, -9.0023e-01, -3.2286e-01,
  6201. -3.5366e-01, 9.6675e-01, 2.8902e-01],
  6202. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  6203. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  6204. [ 5.5813e-01, -4.5860e-01, 1.5586e+00, -3.7466e-01, -6.7920e-01,
  6205. -2.3907e-01, 4.4552e-01, 8.4044e-02],
  6206. [ 5.3274e-01, -4.3811e-01, 1.2880e+00, -6.3079e-01, -6.8661e-01,
  6207. -5.3072e-01, 2.6581e-01, 3.4174e-01],
  6208. [-2.2859e+00, -2.2859e+00, 1.1379e+00, -1.2697e+00, -2.3048e-01,
  6209. -1.5854e+00, 1.6790e-01, 1.5858e-02],
  6210. [ 5.5912e-01, -3.9900e-01, 9.0115e-01, -1.2313e+00, -3.9792e-01,
  6211. -1.3852e+00, 8.0445e-02, 2.0706e-01],
  6212. [ 5.5664e-01, -4.1601e-01, 9.9353e-01, -1.3313e+00, -2.8245e-01,
  6213. -1.5161e+00, 2.1441e-01, 1.2532e-01]]], device='cuda:0')
  6214. loss_train_step before backward: tensor(0.1320, device='cuda:0', grad_fn=<MseLossBackward>)
  6215. loss_train_step after backward: tensor(0.1320, device='cuda:0', grad_fn=<MseLossBackward>)
  6216. loss_train: 3.9766319822520018
  6217. step: 47
  6218. running loss: 0.08460919111174472
  6219. Train Steps: 47/90 Loss: 0.0846 torch.Size([8, 600, 800])
  6220. torch.Size([8, 8])
  6221. tensor([[0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  6222. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  6223. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  6224. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  6225. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578],
  6226. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  6227. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  6228. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800]],
  6229. device='cuda:0', dtype=torch.float64)
  6230. predictions are: tensor([[ 0.6122, -0.3670, 1.3447, -0.9112, -0.3654, -1.0974, 0.4136, 0.1788],
  6231. [-0.8619, -1.2983, 1.1162, -0.8752, -0.3778, -1.0457, 0.2680, 0.2437],
  6232. [ 0.9006, -0.2098, 2.0488, 0.0939, -0.2921, 0.4136, 0.6445, 0.1981],
  6233. [ 0.8501, -0.2358, 1.9843, 0.0972, -0.2533, 0.0895, 0.5619, 0.2259],
  6234. [-1.4110, -1.6712, 1.2796, -0.7929, -0.3579, -0.9350, 0.3379, 0.2312],
  6235. [ 0.4885, -0.4263, 1.3314, -1.0387, -0.2906, -1.1694, 0.4948, 0.2056],
  6236. [ 0.9188, -0.1726, 2.0675, -0.0769, -0.5989, 0.1320, 0.6938, 0.0644],
  6237. [-0.4029, -0.9729, 1.3120, -0.6700, -0.4773, -0.8498, 0.2555, 0.2297]],
  6238. device='cuda:0', grad_fn=<AddmmBackward>)
  6239. landmarks are: tensor([[[ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  6240. 0.1449],
  6241. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  6242. 0.4019],
  6243. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  6244. 0.2237],
  6245. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  6246. 0.3087],
  6247. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  6248. 0.2905],
  6249. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  6250. 0.2006],
  6251. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  6252. -0.0670],
  6253. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  6254. 0.3931]]], device='cuda:0')
  6255. loss_train_step before backward: tensor(0.1134, device='cuda:0', grad_fn=<MseLossBackward>)
  6256. loss_train_step after backward: tensor(0.1134, device='cuda:0', grad_fn=<MseLossBackward>)
  6257. loss_train: 4.090075312182307
  6258. step: 48
  6259. running loss: 0.0852099023371314
  6260. Train Steps: 48/90 Loss: 0.0852 torch.Size([8, 600, 800])
  6261. torch.Size([8, 8])
  6262. tensor([[0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  6263. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  6264. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  6265. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  6266. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  6267. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  6268. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  6269. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760]],
  6270. device='cuda:0', dtype=torch.float64)
  6271. predictions are: tensor([[-0.0881, -0.8622, 1.7180, -0.3380, -0.1900, -0.3595, 0.5118, 0.1946],
  6272. [ 0.3039, -0.5632, 1.6433, -0.7080, -0.5210, -0.6785, 0.4957, 0.2307],
  6273. [ 0.1802, -0.7043, 1.6741, -0.2930, -0.1235, -0.5044, 0.3889, 0.2316],
  6274. [-0.6809, -1.1939, 1.2687, -1.0639, -0.3153, -1.4568, 0.3238, 0.1441],
  6275. [ 0.3311, -0.5428, 1.7258, -0.2202, -0.2688, -0.0183, 0.4605, 0.2348],
  6276. [ 0.1304, -0.6649, 1.6293, -0.6603, -0.5442, -0.5658, 0.5650, 0.1014],
  6277. [ 0.3655, -0.5611, 1.7344, -0.1714, -0.4312, -0.2769, 0.4720, 0.1755],
  6278. [ 0.4916, -0.4244, 1.5928, -0.1345, -0.4315, -0.3216, 0.4903, 0.2304]],
  6279. device='cuda:0', grad_fn=<AddmmBackward>)
  6280. landmarks are: tensor([[[ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  6281. 0.2622],
  6282. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  6283. 0.1929],
  6284. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  6285. 0.0532],
  6286. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  6287. 0.0111],
  6288. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  6289. 0.0412],
  6290. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  6291. -0.0099],
  6292. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  6293. 0.0663],
  6294. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  6295. 0.3745]]], device='cuda:0')
  6296. loss_train_step before backward: tensor(0.0986, device='cuda:0', grad_fn=<MseLossBackward>)
  6297. loss_train_step after backward: tensor(0.0986, device='cuda:0', grad_fn=<MseLossBackward>)
  6298. loss_train: 4.188635913655162
  6299. step: 49
  6300. running loss: 0.08548236558479923
  6301. Train Steps: 49/90 Loss: 0.0855 torch.Size([8, 600, 800])
  6302. torch.Size([8, 8])
  6303. tensor([[0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  6304. [0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378],
  6305. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  6306. [0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  6307. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  6308. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  6309. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  6310. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071]],
  6311. device='cuda:0', dtype=torch.float64)
  6312. predictions are: tensor([[ 0.3454, -0.4971, 1.4509, -0.5696, -0.5079, -0.5487, 0.3331, 0.1901],
  6313. [ 0.3420, -0.5645, 1.7734, 0.0995, -0.4219, -0.2674, 0.3567, 0.2133],
  6314. [ 0.2438, -0.6110, 1.4486, -0.8155, -0.3154, -1.0944, 0.4986, 0.2272],
  6315. [-0.4310, -1.0179, 1.4841, -0.7465, -0.4986, -0.4605, 0.4811, 0.1436],
  6316. [ 0.0408, -0.7762, 1.8346, -0.0525, -0.3941, -0.1446, 0.5553, 0.1564],
  6317. [-0.1729, -0.8700, 1.3802, -0.9201, -0.1231, -1.1452, 0.4031, 0.2139],
  6318. [ 0.3208, -0.5864, 1.8330, -0.0026, -0.1255, 0.0109, 0.5079, 0.2647],
  6319. [ 0.1492, -0.6696, 1.2125, -1.0467, -0.4508, -1.1560, 0.3488, 0.1378]],
  6320. device='cuda:0', grad_fn=<AddmmBackward>)
  6321. landmarks are: tensor([[[ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  6322. 0.2206],
  6323. [ 0.5435, -0.4045, 1.7557, 0.0851, -0.5307, -0.2844, 0.0172,
  6324. 0.1980],
  6325. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  6326. 0.3777],
  6327. [ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  6328. 0.0351],
  6329. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  6330. -0.0534],
  6331. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  6332. 0.2083],
  6333. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  6334. 0.0592],
  6335. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  6336. 0.0562]]], device='cuda:0')
  6337. loss_train_step before backward: tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward>)
  6338.  
  6339. loss_train_step after backward: tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward>)
  6340. loss_train: 4.257585039362311
  6341. step: 50
  6342. running loss: 0.08515170078724622
  6343. Train Steps: 50/90 Loss: 0.0852 torch.Size([8, 600, 800])
  6344. torch.Size([8, 8])
  6345. tensor([[ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  6346. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  6347. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  6348. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  6349. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  6350. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  6351. [0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373],
  6352. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397]],
  6353. device='cuda:0', dtype=torch.float64)
  6354. predictions are: tensor([[-1.4041, -1.6769, 1.1390, -0.9196, -0.2693, -1.1782, 0.2023, 0.2169],
  6355. [ 0.6574, -0.3363, 1.7427, 0.2147, -0.4140, 0.0338, 0.3964, 0.2300],
  6356. [ 0.1212, -0.6699, 1.4240, -1.0007, -0.3117, -1.0039, 0.5159, 0.1357],
  6357. [ 0.3221, -0.5317, 1.4546, -0.9382, -0.4403, -0.4426, 0.5357, 0.1844],
  6358. [ 0.6383, -0.3453, 1.7350, -0.3782, -0.4291, -0.7050, 0.3973, 0.1939],
  6359. [ 0.6196, -0.4027, 1.9948, -0.1199, -0.3932, 0.0846, 0.6095, 0.1669],
  6360. [ 0.4998, -0.4693, 1.7146, 0.2622, -0.3820, -0.1580, 0.3382, 0.1745],
  6361. [-0.3319, -0.9927, 1.0219, -1.1324, -0.3122, -1.3981, 0.2109, 0.1964]],
  6362. device='cuda:0', grad_fn=<AddmmBackward>)
  6363. landmarks are: tensor([[[-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  6364. 0.2183],
  6365. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  6366. 0.5316],
  6367. [ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  6368. 0.1214],
  6369. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  6370. 0.1390],
  6371. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  6372. 0.2699],
  6373. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  6374. 0.1313],
  6375. [ 0.5680, -0.4562, 1.5697, 0.4947, -0.4904, -0.1503, 0.3536,
  6376. 0.1956],
  6377. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  6378. 0.2071]]], device='cuda:0')
  6379. loss_train_step before backward: tensor(0.0524, device='cuda:0', grad_fn=<MseLossBackward>)
  6380. loss_train_step after backward: tensor(0.0524, device='cuda:0', grad_fn=<MseLossBackward>)
  6381. loss_train: 4.309938298538327
  6382. step: 51
  6383. running loss: 0.08450859408898681
  6384. Train Steps: 51/90 Loss: 0.0845 torch.Size([8, 600, 800])
  6385. torch.Size([8, 8])
  6386. tensor([[0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  6387. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  6388. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  6389. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  6390. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367],
  6391. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  6392. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  6393. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412]],
  6394. device='cuda:0', dtype=torch.float64)
  6395. predictions are: tensor([[ 0.1343, -0.6719, 1.1848, -0.9330, -0.2622, -1.1929, 0.2911, 0.1972],
  6396. [ 0.1454, -0.6445, 1.3932, -0.7919, -0.4341, -0.7242, 0.3274, 0.2350],
  6397. [ 0.6946, -0.3061, 1.8101, 0.3960, -0.4587, 0.0493, 0.4624, 0.1293],
  6398. [ 0.3389, -0.5140, 1.4280, -0.7080, -0.5626, -0.5696, 0.3538, 0.1557],
  6399. [ 0.1701, -0.6353, 1.6288, -0.7426, -0.2407, -0.7913, 0.5828, 0.1906],
  6400. [ 0.6218, -0.3358, 1.3809, -0.8998, -0.4000, -0.9331, 0.4869, 0.1414],
  6401. [-1.3165, -1.6054, 1.0127, -1.0492, -0.3465, -1.1461, 0.2269, 0.2403],
  6402. [ 0.4412, -0.4863, 1.7145, 0.4136, -0.2517, 0.1877, 0.3192, 0.2372]],
  6403. device='cuda:0', grad_fn=<AddmmBackward>)
  6404. landmarks are: tensor([[[ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  6405. 0.1005],
  6406. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  6407. 0.2853],
  6408. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  6409. -0.0049],
  6410. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  6411. 0.0942],
  6412. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  6413. 0.1929],
  6414. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  6415. 0.1929],
  6416. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  6417. 0.2930],
  6418. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  6419. 0.2138]]], device='cuda:0')
  6420. loss_train_step before backward: tensor(0.0551, device='cuda:0', grad_fn=<MseLossBackward>)
  6421. loss_train_step after backward: tensor(0.0551, device='cuda:0', grad_fn=<MseLossBackward>)
  6422. loss_train: 4.365078965201974
  6423. step: 52
  6424. running loss: 0.08394382625388411
  6425. Train Steps: 52/90 Loss: 0.0839 torch.Size([8, 600, 800])
  6426. torch.Size([8, 8])
  6427. tensor([[0.6152, 0.4131, 0.6863, 0.2567, 0.3625, 0.3300, 0.5765, 0.5305],
  6428. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  6429. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  6430. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  6431. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  6432. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  6433. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  6434. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378]],
  6435. device='cuda:0', dtype=torch.float64)
  6436. predictions are: tensor([[ 0.7222, -0.2672, 0.9825, -1.1078, -0.5705, -0.9164, 0.1739, 0.2092],
  6437. [ 0.0665, -0.7308, 1.5910, -0.8096, -0.2316, -1.0253, 0.5274, 0.2099],
  6438. [ 0.3037, -0.5983, 1.5746, -0.1910, -0.2327, -0.1118, 0.2617, 0.2293],
  6439. [-1.2385, -1.5823, 0.9541, -1.2474, -0.2575, -1.4829, 0.2528, 0.2454],
  6440. [ 0.3653, -0.5106, 1.7113, -0.0647, -0.3102, 0.2423, 0.4094, 0.1881],
  6441. [ 0.4853, -0.4565, 1.5947, 0.0082, -0.4378, -0.0843, 0.3777, 0.1922],
  6442. [ 0.8494, -0.2006, 1.7019, -0.1805, -0.6135, -0.5201, 0.4251, 0.0953],
  6443. [ 0.1864, -0.6458, 1.7229, -0.2324, -0.4180, -0.7384, 0.4583, 0.1592]],
  6444. device='cuda:0', grad_fn=<AddmmBackward>)
  6445. landmarks are: tensor([[[ 0.5557, -0.3779, 0.8838, -1.1004, -0.6115, -0.7617, 0.3769,
  6446. 0.1644],
  6447. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  6448. 0.1554],
  6449. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  6450. 0.3806],
  6451. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  6452. 0.3623],
  6453. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  6454. 0.0412],
  6455. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  6456. 0.0697],
  6457. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  6458. 0.1005],
  6459. [ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  6460. 0.1982]]], device='cuda:0')
  6461. loss_train_step before backward: tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward>)
  6462. loss_train_step after backward: tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward>)
  6463. loss_train: 4.425908403471112
  6464. step: 53
  6465. running loss: 0.08350770572587005
  6466. Train Steps: 53/90 Loss: 0.0835 torch.Size([8, 600, 800])
  6467. torch.Size([8, 8])
  6468. tensor([[0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  6469. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  6470. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  6471. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  6472. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  6473. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  6474. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  6475. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450]],
  6476. device='cuda:0', dtype=torch.float64)
  6477. predictions are: tensor([[ 0.5744, -0.4358, 1.1659, -1.2056, -0.2736, -1.3638, 0.3496, 0.1837],
  6478. [ 0.7267, -0.3071, 1.6715, 0.2827, -0.4446, -0.0200, 0.4095, 0.1985],
  6479. [ 0.3578, -0.5564, 1.3084, -1.0304, -0.2044, -1.2064, 0.3487, 0.2020],
  6480. [ 0.2623, -0.5900, 1.6264, 0.0475, -0.5414, -0.3029, 0.2797, 0.1594],
  6481. [ 0.3787, -0.5423, 1.8219, -0.1248, -0.5105, -0.0737, 0.4833, 0.1497],
  6482. [ 0.3219, -0.5242, 1.3093, -0.7075, -0.5767, -0.5406, 0.2827, 0.1780],
  6483. [-0.7890, -1.2903, 0.9590, -1.2208, -0.3849, -1.4650, 0.2070, 0.1993],
  6484. [ 0.2771, -0.6158, 1.7014, -0.1671, -0.3850, 0.1569, 0.4584, 0.2011]],
  6485. device='cuda:0', grad_fn=<AddmmBackward>)
  6486. landmarks are: tensor([[[ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  6487. 0.1545],
  6488. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  6489. 0.3007],
  6490. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  6491. 0.2083],
  6492. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  6493. 0.3854],
  6494. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  6495. -0.0490],
  6496. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  6497. 0.3198],
  6498. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  6499. 0.3604],
  6500. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  6501. 0.2314]]], device='cuda:0')
  6502. loss_train_step before backward: tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward>)
  6503. loss_train_step after backward: tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward>)
  6504. loss_train: 4.492464052513242
  6505. step: 54
  6506. running loss: 0.08319377875024522
  6507.  
  6508. Train Steps: 54/90 Loss: 0.0832 torch.Size([8, 600, 800])
  6509. torch.Size([8, 8])
  6510. tensor([[0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  6511. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  6512. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  6513. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  6514. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378],
  6515. [ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  6516. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  6517. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750]],
  6518. device='cuda:0', dtype=torch.float64)
  6519. predictions are: tensor([[ 0.9089, -0.1808, 1.2733, -1.0337, -0.5515, -1.1081, 0.3434, 0.1587],
  6520. [ 0.8128, -0.2403, 1.4522, -0.6860, -0.6329, -0.7484, 0.2570, 0.1964],
  6521. [ 1.2244, 0.0209, 1.4750, 0.2158, -0.4895, -0.2091, 0.2452, 0.2366],
  6522. [ 0.7003, -0.3044, 1.5976, -0.0632, -0.4107, 0.0459, 0.3074, 0.2059],
  6523. [ 0.8016, -0.2368, 1.7200, -0.0157, -0.4262, 0.1961, 0.5880, 0.1784],
  6524. [-2.0187, -2.1144, 1.5037, -1.0512, -0.0099, -1.3094, 0.7017, 0.2278],
  6525. [ 0.6363, -0.3475, 1.5620, -0.2526, -0.5205, -0.2222, 0.1970, 0.1762],
  6526. [-0.8353, -1.2941, 0.8914, -1.2110, -0.3824, -1.3947, 0.1707, 0.2402]],
  6527. device='cuda:0', grad_fn=<AddmmBackward>)
  6528. landmarks are: tensor([[[ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  6529. 0.0620],
  6530. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  6531. 0.3315],
  6532. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  6533. 0.4470],
  6534. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  6535. 0.3084],
  6536. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  6537. 0.1982],
  6538. [-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  6539. 0.3638],
  6540. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  6541. 0.0893],
  6542. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  6543. 0.3700]]], device='cuda:0')
  6544. loss_train_step before backward: tensor(0.0768, device='cuda:0', grad_fn=<MseLossBackward>)
  6545. loss_train_step after backward: tensor(0.0768, device='cuda:0', grad_fn=<MseLossBackward>)
  6546. loss_train: 4.569240244105458
  6547. step: 55
  6548. running loss: 0.08307709534737197
  6549. Train Steps: 55/90 Loss: 0.0831 torch.Size([8, 600, 800])
  6550. torch.Size([8, 8])
  6551. tensor([[0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  6552. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  6553. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  6554. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  6555. [0.6262, 0.4085, 0.8438, 0.3150, 0.4025, 0.2633, 0.6339, 0.4810],
  6556. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  6557. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  6558. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672]],
  6559. device='cuda:0', dtype=torch.float64)
  6560. predictions are: tensor([[ 0.4381, -0.5051, 1.6501, -0.5635, -0.4440, -0.7391, 0.4992, 0.2375],
  6561. [ 0.8613, -0.2273, 1.4765, -0.8301, -0.5814, -0.6689, 0.3431, 0.1861],
  6562. [ 0.5253, -0.4384, 1.5418, -0.5003, -0.5351, -0.5880, 0.3159, 0.2336],
  6563. [-1.3941, -1.6921, 0.9840, -1.2563, -0.2956, -1.3670, 0.2403, 0.2752],
  6564. [ 0.2707, -0.6181, 1.3609, -1.0859, -0.4104, -1.0531, 0.4897, 0.1458],
  6565. [ 0.4641, -0.4778, 1.4754, 0.0333, -0.1887, -0.2335, 0.3023, 0.2703],
  6566. [ 0.3964, -0.5099, 1.5877, 0.1125, -0.4331, -0.1267, 0.4035, 0.1513],
  6567. [ 1.0365, -0.1044, 1.5411, -0.0426, -0.5323, -0.1892, 0.3891, 0.1199]],
  6568. device='cuda:0', grad_fn=<AddmmBackward>)
  6569. landmarks are: tensor([[[ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  6570. 0.1005],
  6571. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  6572. 0.1753],
  6573. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  6574. 0.1544],
  6575. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  6576. 0.3084],
  6577. [ 0.6064, -0.3990, 1.6113, -0.8309, -0.4268, -1.0696, 0.6421,
  6578. -0.0640],
  6579. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  6580. 0.4547],
  6581. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  6582. -0.0049],
  6583. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  6584. -0.1278]]], device='cuda:0')
  6585. loss_train_step before backward: tensor(0.0489, device='cuda:0', grad_fn=<MseLossBackward>)
  6586. loss_train_step after backward: tensor(0.0489, device='cuda:0', grad_fn=<MseLossBackward>)
  6587. loss_train: 4.618122825399041
  6588. step: 56
  6589. running loss: 0.08246647902498287
  6590. Train Steps: 56/90 Loss: 0.0825 torch.Size([8, 600, 800])
  6591. torch.Size([8, 8])
  6592. tensor([[0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090],
  6593. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  6594. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  6595. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  6596. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  6597. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  6598. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  6599. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390]],
  6600. device='cuda:0', dtype=torch.float64)
  6601. predictions are: tensor([[ 0.1561, -0.7037, 1.4751, -0.8651, -0.4711, -1.0469, 0.5206, 0.1341],
  6602. [ 0.5377, -0.4234, 1.5176, -0.2102, -0.5475, -0.2934, 0.2895, 0.1455],
  6603. [ 0.2270, -0.6552, 1.1592, -1.1152, -0.4722, -1.0442, 0.3479, 0.2583],
  6604. [ 0.4311, -0.5644, 1.5158, -1.1601, -0.2336, -1.4870, 0.4191, 0.1780],
  6605. [ 0.3855, -0.5671, 1.5510, -0.7643, -0.5894, -0.6581, 0.5060, 0.1097],
  6606. [ 0.1805, -0.6948, 1.5721, 0.1061, -0.2787, -0.1696, 0.3229, 0.2565],
  6607. [ 0.5569, -0.4505, 1.4991, 0.0849, -0.4491, -0.2875, 0.2419, 0.2883],
  6608. [ 0.1861, -0.6641, 1.6742, -0.1751, -0.4272, 0.1524, 0.5527, 0.2295]],
  6609. device='cuda:0', grad_fn=<AddmmBackward>)
  6610. landmarks are: tensor([[[ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  6611. 0.0652],
  6612. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  6613. -0.1181],
  6614. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  6615. 0.5624],
  6616. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  6617. -0.0368],
  6618. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  6619. -0.0670],
  6620. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  6621. 0.2853],
  6622. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  6623. 0.4470],
  6624. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  6625. 0.2035]]], device='cuda:0')
  6626. loss_train_step before backward: tensor(0.0432, device='cuda:0', grad_fn=<MseLossBackward>)
  6627. loss_train_step after backward: tensor(0.0432, device='cuda:0', grad_fn=<MseLossBackward>)
  6628. loss_train: 4.661323884502053
  6629. step: 57
  6630. running loss: 0.08177761200880795
  6631. Train Steps: 57/90 Loss: 0.0818 torch.Size([8, 600, 800])
  6632. torch.Size([8, 8])
  6633. tensor([[0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  6634. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  6635. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  6636. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  6637. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  6638. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  6639. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  6640. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433]],
  6641. device='cuda:0', dtype=torch.float64)
  6642. predictions are: tensor([[ 0.0544, -0.7835, 1.6998, -0.2782, -0.1604, -0.2922, 0.4850, 0.1874],
  6643. [ 0.4879, -0.4952, 1.6149, -0.6312, -0.3887, -1.1637, 0.4164, 0.2082],
  6644. [ 0.2649, -0.6053, 1.6451, -0.2102, -0.5783, -0.1651, 0.4630, 0.1315],
  6645. [ 0.2480, -0.6386, 1.6026, 0.0719, -0.2249, -0.1325, 0.3098, 0.2759],
  6646. [ 0.1634, -0.7327, 1.2079, -1.2229, -0.4614, -1.3717, 0.3322, 0.2116],
  6647. [ 1.0088, -0.1769, 1.6499, -0.2045, -0.4546, -0.9317, 0.4750, 0.1453],
  6648. [ 0.2639, -0.6029, 1.6201, -0.3808, -0.5056, -0.0960, 0.6122, 0.1866],
  6649. [ 0.3316, -0.5745, 1.2158, -1.0627, -0.6265, -0.7776, 0.3601, 0.1813]],
  6650. device='cuda:0', grad_fn=<AddmmBackward>)
  6651. landmarks are: tensor([[[ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  6652. 0.2776],
  6653. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  6654. 0.1929],
  6655. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  6656. 0.0727],
  6657. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  6658. 0.4239],
  6659. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  6660. 0.3007],
  6661. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  6662. 0.0081],
  6663. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  6664. 0.2249],
  6665. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  6666. 0.2237]]], device='cuda:0')
  6667. loss_train_step before backward: tensor(0.0437, device='cuda:0', grad_fn=<MseLossBackward>)
  6668. loss_train_step after backward: tensor(0.0437, device='cuda:0', grad_fn=<MseLossBackward>)
  6669. loss_train: 4.704992236569524
  6670. step: 58
  6671. running loss: 0.08112055580292282
  6672.  
  6673. Train Steps: 58/90 Loss: 0.0811 torch.Size([8, 600, 800])
  6674. torch.Size([8, 8])
  6675. tensor([[0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  6676. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  6677. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  6678. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  6679. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  6680. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  6681. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  6682. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332]],
  6683. device='cuda:0', dtype=torch.float64)
  6684. predictions are: tensor([[ 0.6725, -0.3250, 1.3117, -0.8996, -0.4375, -0.9283, 0.3662, 0.2144],
  6685. [ 0.8203, -0.2586, 1.2539, -0.8671, -0.4885, -0.8802, 0.2916, 0.2076],
  6686. [-0.6151, -1.1069, 1.2332, -0.7149, -0.5765, -0.8060, 0.1702, 0.2368],
  6687. [ 1.7519, 0.3353, 1.6793, 0.2937, -0.6515, -0.0736, 0.3457, 0.1722],
  6688. [ 0.9992, -0.1174, 1.3909, -0.8545, -0.3347, -0.9903, 0.4672, 0.1633],
  6689. [-0.7490, -1.2308, 1.8226, -0.4618, -0.1372, -0.7754, 0.7525, 0.2115],
  6690. [-1.7876, -1.9232, 1.5286, -0.8708, -0.1098, -0.9816, 0.6602, 0.2375],
  6691. [ 1.5744, 0.1914, 1.7823, 0.1854, -0.5948, 0.1148, 0.5642, 0.1143]],
  6692. device='cuda:0', grad_fn=<AddmmBackward>)
  6693. landmarks are: tensor([[[ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  6694. 0.2032],
  6695. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  6696. 0.3007],
  6697. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  6698. 0.2699],
  6699. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  6700. 0.3161],
  6701. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  6702. 0.1917],
  6703. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  6704. 0.3478],
  6705. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  6706. 0.3104],
  6707. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  6708. 0.1768]]], device='cuda:0')
  6709. loss_train_step before backward: tensor(0.2201, device='cuda:0', grad_fn=<MseLossBackward>)
  6710. loss_train_step after backward: tensor(0.2201, device='cuda:0', grad_fn=<MseLossBackward>)
  6711. loss_train: 4.925117092207074
  6712. step: 59
  6713. running loss: 0.08347656088486566
  6714. Train Steps: 59/90 Loss: 0.0835 torch.Size([8, 600, 800])
  6715. torch.Size([8, 8])
  6716. tensor([[0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  6717. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791],
  6718. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  6719. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  6720. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  6721. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  6722. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  6723. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750]],
  6724. device='cuda:0', dtype=torch.float64)
  6725. predictions are: tensor([[ 0.4033, -0.5310, 1.8569, -0.6054, -0.5117, -0.6812, 0.6229, 0.1313],
  6726. [ 0.4407, -0.5129, 1.8577, 0.1828, -0.4270, 0.1355, 0.5361, 0.1932],
  6727. [-0.1968, -0.9619, 1.9427, -0.6664, -0.1138, -1.0862, 0.8384, 0.1491],
  6728. [-0.0191, -0.8111, 1.3862, -1.2234, -0.2565, -1.2246, 0.4617, 0.2555],
  6729. [ 0.8325, -0.2923, 1.7349, 0.3951, -0.4775, -0.0507, 0.5048, 0.1812],
  6730. [ 0.3294, -0.5901, 1.8064, 0.0931, -0.5397, -0.2080, 0.5408, 0.1618],
  6731. [ 0.2896, -0.6054, 1.0851, -0.9982, -0.5647, -0.8826, 0.1846, 0.2427],
  6732. [ 0.8394, -0.2579, 1.1610, -0.9770, -0.4822, -1.0040, 0.3513, 0.2346]],
  6733. device='cuda:0', grad_fn=<AddmmBackward>)
  6734. landmarks are: tensor([[[ 0.6077, -0.3965, 1.8480, -0.6539, -0.6231, -0.4537, 0.6216,
  6735. -0.0220],
  6736. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  6737. -0.0731],
  6738. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  6739. 0.2142],
  6740. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  6741. 0.1852],
  6742. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  6743. -0.1385],
  6744. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  6745. 0.1082],
  6746. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  6747. 0.3315],
  6748. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  6749. 0.3700]]], device='cuda:0')
  6750. loss_train_step before backward: tensor(0.0440, device='cuda:0', grad_fn=<MseLossBackward>)
  6751. loss_train_step after backward: tensor(0.0440, device='cuda:0', grad_fn=<MseLossBackward>)
  6752. loss_train: 4.969099497422576
  6753. step: 60
  6754. running loss: 0.08281832495704293
  6755. Train Steps: 60/90 Loss: 0.0828 torch.Size([8, 600, 800])
  6756. torch.Size([8, 8])
  6757. tensor([[0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  6758. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  6759. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  6760. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  6761. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  6762. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  6763. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  6764. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726]],
  6765. device='cuda:0', dtype=torch.float64)
  6766. predictions are: tensor([[-0.1576, -0.9122, 1.2972, -1.2263, -0.1811, -1.4133, 0.4684, 0.2480],
  6767. [ 0.2890, -0.6472, 1.9153, 0.1004, -0.1274, -0.1649, 0.6380, 0.1997],
  6768. [-0.0181, -0.8165, 1.4741, -1.3042, -0.2795, -1.3269, 0.5811, 0.2282],
  6769. [ 0.4858, -0.4523, 1.6892, -0.2371, -0.5700, -0.3723, 0.6010, 0.1366],
  6770. [ 0.8972, -0.2306, 1.8460, 0.3335, -0.4067, 0.0752, 0.6305, 0.1847],
  6771. [ 0.3262, -0.6062, 1.8215, -0.3808, -0.6322, -0.4538, 0.5082, 0.1785],
  6772. [ 0.2143, -0.6786, 1.8186, 0.2153, -0.5068, -0.2337, 0.4954, 0.1994],
  6773. [ 0.7243, -0.3422, 1.3246, -1.1767, -0.5365, -1.1800, 0.4903, 0.1229]],
  6774. device='cuda:0', grad_fn=<AddmmBackward>)
  6775. landmarks are: tensor([[[ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  6776. 0.3854],
  6777. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  6778. 0.0862],
  6779. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  6780. 0.1852],
  6781. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  6782. 0.2853],
  6783. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  6784. 0.3161],
  6785. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  6786. 0.3238],
  6787. [ 0.5452, -0.4067, 1.7557, 0.0543, -0.4961, -0.3306, 0.1323,
  6788. 0.4306],
  6789. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  6790. -0.1031]]], device='cuda:0')
  6791. loss_train_step before backward: tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward>)
  6792. loss_train_step after backward: tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward>)
  6793. loss_train: 5.025980396196246
  6794. step: 61
  6795. running loss: 0.0823931212491188
  6796. Train Steps: 61/90 Loss: 0.0824 torch.Size([8, 600, 800])
  6797. torch.Size([8, 8])
  6798. tensor([[0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  6799. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  6800. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  6801. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  6802. [0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  6803. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  6804. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  6805. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400]],
  6806. device='cuda:0', dtype=torch.float64)
  6807. predictions are: tensor([[ 0.6747, -0.3336, 1.7131, -0.3043, -0.6373, -0.1198, 0.5301, 0.1279],
  6808. [ 0.3088, -0.5878, 1.4396, -1.0615, -0.3396, -1.2393, 0.4457, 0.2140],
  6809. [ 0.5520, -0.4229, 1.8363, 0.2268, -0.5093, -0.0411, 0.6594, 0.1800],
  6810. [ 0.2341, -0.6258, 1.8258, 0.1728, -0.3747, -0.0613, 0.4904, 0.1651],
  6811. [ 0.6160, -0.3853, 1.7532, 0.3894, -0.3895, -0.0292, 0.4597, 0.1998],
  6812. [-0.1318, -0.8842, 1.0308, -1.2271, -0.5247, -1.3953, 0.2541, 0.2315],
  6813. [-0.7442, -1.3088, 1.8895, -0.8294, -0.0512, -1.0553, 1.0225, 0.2369],
  6814. [ 0.9457, -0.1848, 1.5723, -1.0821, -0.2259, -1.0955, 0.6738, 0.1960]],
  6815. device='cuda:0', grad_fn=<AddmmBackward>)
  6816. landmarks are: tensor([[[ 5.2448e-01, -4.3610e-01, 1.5940e+00, -2.9207e-01, -5.4804e-01,
  6817. -9.1917e-02, 2.4319e-01, 5.0176e-02],
  6818. [ 5.7962e-01, -4.3256e-01, 1.4439e+00, -1.1774e+00, -2.9400e-01,
  6819. -1.3390e+00, 3.9307e-01, 9.2841e-02],
  6820. [ 6.1888e-01, -4.2379e-01, 1.6026e+00, 2.2948e-01, -4.0370e-01,
  6821. 3.1255e-02, 6.2979e-01, 7.7444e-02],
  6822. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  6823. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  6824. [ 5.9107e-01, -4.0805e-01, 1.6460e+00, 3.5458e-01, -2.0739e-01,
  6825. 4.6651e-02, 4.9700e-01, 1.8522e-01],
  6826. [ 5.5912e-01, -3.9900e-01, 9.0115e-01, -1.2313e+00, -3.9792e-01,
  6827. -1.3852e+00, 8.0445e-02, 2.0706e-01],
  6828. [-2.2859e+00, -2.2859e+00, 1.6229e+00, -1.1081e+00, 4.1617e-01,
  6829. -1.3005e+00, 1.0070e+00, 5.1879e-01],
  6830. [ 5.9579e-01, -3.8176e-01, 1.5536e+00, -1.1081e+00, -2.0739e-01,
  6831. -1.3390e+00, 5.6628e-01, 2.0831e-01]]], device='cuda:0')
  6832. loss_train_step before backward: tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward>)
  6833. loss_train_step after backward: tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward>)
  6834. loss_train: 5.112371591851115
  6835. step: 62
  6836. running loss: 0.08245760632017927
  6837.  
  6838. Train Steps: 62/90 Loss: 0.0825 torch.Size([8, 600, 800])
  6839. torch.Size([8, 8])
  6840. tensor([[0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  6841. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  6842. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  6843. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  6844. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  6845. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  6846. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  6847. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285]],
  6848. device='cuda:0', dtype=torch.float64)
  6849. predictions are: tensor([[ 1.0652, -0.0872, 1.6244, 0.1411, -0.5858, -0.4915, 0.3320, 0.1692],
  6850. [ 0.4764, -0.4995, 1.2932, -0.9137, -0.4796, -0.9494, 0.4467, 0.2394],
  6851. [ 0.5212, -0.4979, 1.4810, -0.8740, -0.4198, -0.9972, 0.4141, 0.2848],
  6852. [-0.5558, -1.2075, 1.6232, -1.1434, 0.0361, -1.3837, 0.8139, 0.2174],
  6853. [ 0.6402, -0.3467, 1.4580, -0.7266, -0.6276, -0.4378, 0.4899, 0.1890],
  6854. [ 0.1559, -0.7151, 1.9275, -0.6109, -0.1726, -1.0339, 0.7443, 0.1235],
  6855. [ 0.2836, -0.6025, 1.9319, 0.1667, -0.3236, 0.1527, 0.6902, 0.1907],
  6856. [ 0.1549, -0.6862, 1.9986, 0.2127, -0.4233, 0.2488, 0.7887, 0.1478]],
  6857. device='cuda:0', grad_fn=<AddmmBackward>)
  6858. landmarks are: tensor([[[ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  6859. 0.3392],
  6860. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  6861. 0.5624],
  6862. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  6863. 0.5701],
  6864. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  6865. 0.2944],
  6866. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  6867. 0.2776],
  6868. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  6869. 0.2142],
  6870. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  6871. 0.1661],
  6872. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  6873. 0.1554]]], device='cuda:0')
  6874. loss_train_step before backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  6875. loss_train_step after backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  6876. loss_train: 5.176298273727298
  6877. step: 63
  6878. running loss: 0.08216346466233806
  6879. Train Steps: 63/90 Loss: 0.0822 torch.Size([8, 600, 800])
  6880. torch.Size([8, 8])
  6881. tensor([[0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  6882. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  6883. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  6884. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  6885. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  6886. [0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  6887. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  6888. [0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617]],
  6889. device='cuda:0', dtype=torch.float64)
  6890. predictions are: tensor([[ 1.0356, -0.1234, 1.7094, -0.6482, -0.3317, -0.7847, 0.5696, 0.2211],
  6891. [ 0.3286, -0.6007, 1.2848, -0.8995, -0.3070, -1.1710, 0.4285, 0.2396],
  6892. [-0.8547, -1.3968, 1.9650, -0.7491, 0.1321, -1.1016, 1.1164, 0.2244],
  6893. [ 0.4023, -0.5407, 1.4807, -0.8273, -0.4771, -0.7097, 0.6189, 0.1762],
  6894. [ 0.4463, -0.5124, 1.2960, -0.9030, -0.4845, -0.9337, 0.3351, 0.2077],
  6895. [ 0.2804, -0.6267, 1.8965, 0.6625, -0.3471, 0.0380, 0.4486, 0.2180],
  6896. [ 0.5654, -0.3786, 1.6728, -0.4492, -0.5768, -0.1508, 0.6567, 0.1743],
  6897. [ 0.4768, -0.4687, 1.5823, -0.5242, -0.4902, -0.6029, 0.5122, 0.1763]],
  6898. device='cuda:0', grad_fn=<AddmmBackward>)
  6899. landmarks are: tensor([[[ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  6900. 0.2622],
  6901. [ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  6902. 0.3161],
  6903. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  6904. 0.3050],
  6905. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  6906. 0.1779],
  6907. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  6908. 0.0802],
  6909. [ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  6910. 0.3238],
  6911. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  6912. 0.2776],
  6913. [ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  6914. 0.3087]]], device='cuda:0')
  6915. loss_train_step before backward: tensor(0.0955, device='cuda:0', grad_fn=<MseLossBackward>)
  6916. loss_train_step after backward: tensor(0.0955, device='cuda:0', grad_fn=<MseLossBackward>)
  6917. loss_train: 5.271774662658572
  6918. step: 64
  6919. running loss: 0.08237147910404019
  6920. Train Steps: 64/90 Loss: 0.0824 torch.Size([8, 600, 800])
  6921. torch.Size([8, 8])
  6922. tensor([[0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950],
  6923. [0.6277, 0.4013, 0.8888, 0.4767, 0.3600, 0.3567, 0.6148, 0.4672],
  6924. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  6925. [0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  6926. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  6927. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  6928. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  6929. [0.6064, 0.3953, 0.8738, 0.4417, 0.3663, 0.4683, 0.5511, 0.5416]],
  6930. device='cuda:0', dtype=torch.float64)
  6931. predictions are: tensor([[-0.1920, -0.9985, 1.9063, 0.1103, -0.1318, -0.3085, 0.7094, 0.2498],
  6932. [ 0.7767, -0.3053, 1.7186, -0.3475, -0.4719, -0.7444, 0.6525, 0.1397],
  6933. [ 0.1857, -0.7125, 1.8274, -0.0031, -0.2454, -0.2910, 0.5246, 0.2424],
  6934. [ 0.6512, -0.3863, 1.4643, -0.8827, -0.4335, -1.0586, 0.3989, 0.2542],
  6935. [ 0.4884, -0.4620, 1.2575, -1.1185, -0.4550, -1.0417, 0.4923, 0.2755],
  6936. [ 0.5038, -0.4734, 1.2670, -1.2477, -0.5148, -1.0009, 0.4584, 0.2556],
  6937. [ 0.4376, -0.5049, 1.8492, -0.1855, -0.2348, -0.1066, 0.7327, 0.2066],
  6938. [ 0.5826, -0.4122, 1.8609, -0.2930, -0.4397, -0.3699, 0.7610, 0.1792]],
  6939. device='cuda:0', grad_fn=<AddmmBackward>)
  6940. landmarks are: tensor([[[ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  6941. 5.4350e-02, 4.9700e-01, 4.6189e-04],
  6942. [ 6.1322e-01, -4.3241e-01, 1.8192e+00, -8.4219e-02, -6.2309e-01,
  6943. -6.3849e-01, 5.5366e-01, -1.2778e-01],
  6944. [ 5.4348e-01, -4.5974e-01, 1.6575e+00, 1.5858e-02, -3.2286e-01,
  6945. -1.1501e-01, 1.8767e-01, 1.8544e-01],
  6946. [ 5.5319e-01, -3.8879e-01, 1.4727e+00, -7.4627e-01, -5.5381e-01,
  6947. -1.0465e+00, 2.6467e-02, 2.1383e-01],
  6948. [ 5.1288e-01, -4.3741e-01, 1.2072e+00, -1.0080e+00, -6.5196e-01,
  6949. -8.8483e-01, 2.6787e-01, 2.3353e-01],
  6950. [ 5.0092e-01, -4.3333e-01, 1.1090e+00, -1.1158e+00, -6.9815e-01,
  6951. -7.3087e-01, 2.6170e-01, 6.2199e-02],
  6952. [ 5.6039e-01, -4.6197e-01, 1.7961e+00, -1.9969e-01, -3.2286e-01,
  6953. 1.0824e-01, 4.1039e-01, 2.5450e-01],
  6954. [ 5.1490e-01, -4.6028e-01, 1.7499e+00, -2.4588e-01, -5.9423e-01,
  6955. -1.2271e-01, 2.5964e-01, 2.1549e-01]]], device='cuda:0')
  6956. loss_train_step before backward: tensor(0.0448, device='cuda:0', grad_fn=<MseLossBackward>)
  6957. loss_train_step after backward: tensor(0.0448, device='cuda:0', grad_fn=<MseLossBackward>)
  6958. loss_train: 5.316538447514176
  6959. step: 65
  6960. running loss: 0.08179289919252579
  6961. Train Steps: 65/90 Loss: 0.0818 torch.Size([8, 600, 800])
  6962. torch.Size([8, 8])
  6963. tensor([[0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  6964. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  6965. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  6966. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  6967. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  6968. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  6969. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  6970. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167]],
  6971. device='cuda:0', dtype=torch.float64)
  6972. predictions are: tensor([[ 0.1470, -0.7047, 1.6310, -0.2381, -0.2549, -0.3992, 0.4727, 0.2435],
  6973. [ 0.4058, -0.5714, 1.8483, -0.1800, -0.3816, -0.1532, 0.7788, 0.2107],
  6974. [ 0.4472, -0.5076, 1.6044, -0.1745, -0.2147, -0.2088, 0.4506, 0.2606],
  6975. [ 0.2987, -0.5943, 1.5517, -0.6556, -0.5261, -0.4434, 0.5252, 0.2261],
  6976. [ 0.4258, -0.5116, 1.7422, -0.3681, -0.1858, -0.1330, 0.6773, 0.2530],
  6977. [ 0.9321, -0.1669, 1.5974, -0.3834, -0.4631, -0.9787, 0.4675, 0.2501],
  6978. [ 0.9310, -0.1953, 1.3346, -1.2929, -0.2924, -1.4419, 0.5972, 0.2600],
  6979. [ 0.1639, -0.7135, 1.7702, -0.3880, -0.5578, -0.8406, 0.6680, 0.1920]],
  6980. device='cuda:0', grad_fn=<AddmmBackward>)
  6981. landmarks are: tensor([[[ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  6982. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  6983. [ 6.0468e-01, -4.2094e-01, 1.7557e+00, -3.0331e-02, -4.8453e-01,
  6984. 2.5450e-01, 6.5866e-01, 1.2363e-01],
  6985. [ 5.5484e-01, -4.6823e-01, 1.7309e+00, 9.6578e-02, -1.3942e-01,
  6986. 1.7573e-01, 5.0451e-01, 9.4188e-02],
  6987. [ 5.2448e-01, -4.3610e-01, 1.5940e+00, -2.9207e-01, -5.4804e-01,
  6988. -9.1917e-02, 2.4319e-01, 5.0176e-02],
  6989. [ 5.7067e-01, -4.0169e-01, 1.7961e+00, -1.5350e-01, -5.1501e-02,
  6990. 3.2379e-01, 5.6628e-01, 4.1617e-01],
  6991. [ 5.9007e-01, -4.0000e-01, 1.8423e+00, -6.8822e-02, -5.3072e-01,
  6992. -9.2333e-01, 3.6420e-01, 1.8522e-01],
  6993. [ 6.1577e-01, -3.9601e-01, 1.4092e+00, -1.2774e+00, -2.0739e-01,
  6994. -1.1851e+00, 8.4910e-01, 1.9173e-01],
  6995. [ 6.1640e-01, -3.9561e-01, 1.8249e+00, -1.1501e-01, -6.0000e-01,
  6996. -5.0762e-01, 5.8360e-01, 1.0054e-01]]], device='cuda:0')
  6997. loss_train_step before backward: tensor(0.0462, device='cuda:0', grad_fn=<MseLossBackward>)
  6998. loss_train_step after backward: tensor(0.0462, device='cuda:0', grad_fn=<MseLossBackward>)
  6999. loss_train: 5.362761614844203
  7000. step: 66
  7001. running loss: 0.0812539638612758
  7002.  
  7003. Train Steps: 66/90 Loss: 0.0813 torch.Size([8, 600, 800])
  7004. torch.Size([8, 8])
  7005. tensor([[0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  7006. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  7007. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  7008. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  7009. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  7010. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  7011. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  7012. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320]],
  7013. device='cuda:0', dtype=torch.float64)
  7014. predictions are: tensor([[ 1.1903, 0.0091, 1.5244, -0.6896, -0.3186, -0.7837, 0.4619, 0.2637],
  7015. [-1.1955, -1.5569, 1.2581, -0.9294, -0.3222, -1.0647, 0.3363, 0.3174],
  7016. [ 1.1021, -0.0334, 1.8661, 0.1296, -0.4194, -0.2605, 0.6152, 0.1854],
  7017. [-1.0808, -1.4725, 1.1546, -1.0496, -0.2942, -1.1167, 0.2463, 0.3367],
  7018. [ 1.2006, -0.0122, 1.3387, -0.9424, -0.2428, -0.9820, 0.4809, 0.2814],
  7019. [ 0.8916, -0.2122, 1.2474, -0.9546, -0.4703, -0.7094, 0.5053, 0.2677],
  7020. [ 0.9518, -0.2066, 1.7941, -0.2452, -0.5559, -0.2133, 0.7859, 0.1155],
  7021. [ 0.6461, -0.3687, 1.8293, 0.2481, -0.3678, 0.1926, 0.6810, 0.1674]],
  7022. device='cuda:0', grad_fn=<AddmmBackward>)
  7023. landmarks are: tensor([[[ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  7024. 0.2134],
  7025. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  7026. 0.2183],
  7027. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  7028. 0.1661],
  7029. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  7030. 0.1073],
  7031. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  7032. 0.2442],
  7033. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  7034. 0.2699],
  7035. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  7036. 0.0697],
  7037. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  7038. 0.1715]]], device='cuda:0')
  7039. loss_train_step before backward: tensor(0.1144, device='cuda:0', grad_fn=<MseLossBackward>)
  7040. loss_train_step after backward: tensor(0.1144, device='cuda:0', grad_fn=<MseLossBackward>)
  7041. loss_train: 5.477159423753619
  7042. step: 67
  7043. running loss: 0.08174864811572566
  7044. Train Steps: 67/90 Loss: 0.0817 torch.Size([8, 600, 800])
  7045. torch.Size([8, 8])
  7046. tensor([[0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  7047. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  7048. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  7049. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  7050. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  7051. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  7052. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  7053. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795]],
  7054. device='cuda:0', dtype=torch.float64)
  7055. predictions are: tensor([[ 0.7726, -0.2872, 1.5579, -0.6419, -0.4527, -0.1764, 0.6722, 0.1945],
  7056. [ 0.7038, -0.3455, 1.7372, -0.0100, -0.4515, -0.4409, 0.4419, 0.2044],
  7057. [ 0.3806, -0.5373, 1.5902, -0.6628, -0.4155, -0.2866, 0.7564, 0.1726],
  7058. [ 0.3435, -0.5409, 1.6290, -0.5285, -0.3532, -0.7808, 0.4576, 0.3081],
  7059. [-0.3292, -1.0527, 0.9807, -1.2696, -0.3676, -1.4329, 0.1426, 0.3147],
  7060. [ 0.8057, -0.2529, 1.3971, -1.0243, -0.3280, -1.0554, 0.4332, 0.2968],
  7061. [ 0.4678, -0.4743, 1.6984, 0.0821, -0.4409, -0.3279, 0.4225, 0.2544],
  7062. [ 0.9089, -0.2301, 1.7610, 0.1076, -0.3777, 0.0481, 0.7147, 0.1679]],
  7063. device='cuda:0', grad_fn=<AddmmBackward>)
  7064. landmarks are: tensor([[[ 0.6010, -0.3896, 1.7326, -0.5692, -0.6289, 0.0082, 0.5028,
  7065. 0.1005],
  7066. [ 0.6096, -0.4046, 1.8249, -0.0072, -0.6115, -0.3537, 0.6182,
  7067. 0.0928],
  7068. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  7069. 0.1554],
  7070. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  7071. 0.3928],
  7072. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  7073. 0.2006],
  7074. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  7075. 0.2160],
  7076. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  7077. 0.3623],
  7078. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  7079. 0.3905]]], device='cuda:0')
  7080. loss_train_step before backward: tensor(0.1032, device='cuda:0', grad_fn=<MseLossBackward>)
  7081. loss_train_step after backward: tensor(0.1032, device='cuda:0', grad_fn=<MseLossBackward>)
  7082. loss_train: 5.580386197194457
  7083. step: 68
  7084. running loss: 0.08206450289991848
  7085. Train Steps: 68/90 Loss: 0.0821 torch.Size([8, 600, 800])
  7086. torch.Size([8, 8])
  7087. tensor([[0.6277, 0.4083, 0.8350, 0.2717, 0.4562, 0.1800, 0.5918, 0.4878],
  7088. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  7089. [0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  7090. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  7091. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  7092. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  7093. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  7094. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700]],
  7095. device='cuda:0', dtype=torch.float64)
  7096. predictions are: tensor([[ 0.0113, -0.7472, 1.4550, -0.8894, -0.2580, -0.9753, 0.4123, 0.2772],
  7097. [ 0.4000, -0.5421, 1.2346, -0.7698, -0.5962, -0.8030, 0.3929, 0.2342],
  7098. [ 0.3309, -0.5806, 1.3000, -0.6666, -0.6106, -0.3164, 0.3896, 0.2519],
  7099. [ 0.7557, -0.3389, 1.8301, 0.0937, -0.4879, 0.2119, 0.5420, 0.1904],
  7100. [ 0.4026, -0.5461, 1.5781, -1.0008, -0.0243, -1.1922, 0.8809, 0.2303],
  7101. [ 0.6067, -0.4049, 1.7667, 0.0835, -0.2052, -0.0215, 0.5257, 0.1727],
  7102. [ 0.5976, -0.4035, 1.4973, -0.7421, -0.5810, -0.9208, 0.4500, 0.2530],
  7103. [ 0.6578, -0.3394, 1.3067, -0.5173, -0.5163, -0.6640, 0.3923, 0.2634]],
  7104. device='cuda:0', grad_fn=<AddmmBackward>)
  7105. landmarks are: tensor([[[ 0.6132, -0.4002, 1.5709, -1.0311, -0.1785, -1.4545, 0.4474,
  7106. -0.0328],
  7107. [ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  7108. 0.2335],
  7109. [ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  7110. 0.1193],
  7111. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  7112. 0.3161],
  7113. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  7114. 0.2944],
  7115. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  7116. 0.2776],
  7117. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  7118. 0.1931],
  7119. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  7120. 0.3469]]], device='cuda:0')
  7121. loss_train_step before backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  7122. loss_train_step after backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  7123. loss_train: 5.611077474430203
  7124. step: 69
  7125. running loss: 0.08131996339753918
  7126. Train Steps: 69/90 Loss: 0.0813 torch.Size([8, 600, 800])
  7127. torch.Size([8, 8])
  7128. tensor([[0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  7129. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695],
  7130. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  7131. [0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  7132. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  7133. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  7134. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517],
  7135. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609]],
  7136. device='cuda:0', dtype=torch.float64)
  7137. predictions are: tensor([[ 0.3484, -0.5802, 1.6820, -0.0106, -0.6042, -0.0191, 0.2717, 0.2010],
  7138. [-0.0371, -0.8269, 1.0462, -1.0266, -0.5768, -1.1250, 0.1318, 0.3113],
  7139. [ 0.2505, -0.6367, 1.7123, 0.0646, -0.3241, 0.1082, 0.4883, 0.1706],
  7140. [ 0.7437, -0.2872, 1.5725, -0.9677, -0.3447, -1.0602, 0.6722, 0.2208],
  7141. [ 0.6053, -0.4160, 1.2632, -0.9159, -0.6230, -0.9971, 0.3718, 0.2289],
  7142. [ 0.5458, -0.4351, 1.2529, -0.7791, -0.5063, -0.8925, 0.3689, 0.3058],
  7143. [ 0.9709, -0.1950, 1.7543, 0.1357, -0.3991, 0.3494, 0.5204, 0.2254],
  7144. [ 0.2469, -0.6231, 1.6615, -1.0366, -0.0289, -1.1851, 1.0284, 0.2094]],
  7145. device='cuda:0', grad_fn=<AddmmBackward>)
  7146. landmarks are: tensor([[[ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  7147. 0.0893],
  7148. [ 0.5544, -0.4133, 0.8145, -1.2082, -0.4268, -1.3544, 0.1221,
  7149. 0.3446],
  7150. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  7151. 0.2622],
  7152. [ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  7153. 0.1621],
  7154. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  7155. 0.0772],
  7156. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  7157. 0.3854],
  7158. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  7159. 0.2622],
  7160. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  7161. 0.3050]]], device='cuda:0')
  7162. loss_train_step before backward: tensor(0.0399, device='cuda:0', grad_fn=<MseLossBackward>)
  7163. loss_train_step after backward: tensor(0.0399, device='cuda:0', grad_fn=<MseLossBackward>)
  7164. loss_train: 5.6510243806988
  7165. step: 70
  7166. running loss: 0.08072891972426857
  7167.  
  7168. Train Steps: 70/90 Loss: 0.0807 torch.Size([8, 600, 800])
  7169. torch.Size([8, 8])
  7170. tensor([[0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  7171. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  7172. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  7173. [0.6064, 0.3953, 0.8738, 0.4417, 0.3663, 0.4683, 0.5511, 0.5416],
  7174. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  7175. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  7176. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  7177. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400]],
  7178. device='cuda:0', dtype=torch.float64)
  7179. predictions are: tensor([[ 0.6906, -0.3369, 1.5061, -0.8076, -0.6131, -0.6987, 0.4593, 0.2867],
  7180. [ 1.1220, -0.1122, 1.6284, 0.0842, -0.5748, -0.0547, 0.4497, 0.1736],
  7181. [-1.1066, -1.4997, 1.2091, -1.2279, -0.3574, -1.2843, 0.2825, 0.3239],
  7182. [ 0.8739, -0.2342, 1.6656, -0.2235, -0.6230, -0.1619, 0.4995, 0.1426],
  7183. [ 0.1316, -0.6897, 1.6279, -1.2489, 0.0040, -1.3089, 1.0166, 0.2204],
  7184. [-0.0195, -0.7876, 1.2561, -1.1085, -0.4725, -1.0848, 0.1783, 0.2908],
  7185. [ 1.0028, -0.1599, 1.6230, -0.1222, -0.6060, -0.2397, 0.3403, 0.1853],
  7186. [ 1.0546, -0.1132, 1.6749, -0.0623, -0.2407, 0.1899, 0.5196, 0.2179]],
  7187. device='cuda:0', grad_fn=<AddmmBackward>)
  7188. landmarks are: tensor([[[ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  7189. 0.5624],
  7190. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  7191. 0.0697],
  7192. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  7193. 0.2853],
  7194. [ 0.5149, -0.4603, 1.7499, -0.2459, -0.5942, -0.1227, 0.2596,
  7195. 0.2155],
  7196. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  7197. 0.2142],
  7198. [ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  7199. 0.3237],
  7200. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  7201. 0.2314],
  7202. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  7203. 0.2083]]], device='cuda:0')
  7204. loss_train_step before backward: tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward>)
  7205. loss_train_step after backward: tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward>)
  7206. loss_train: 5.719259122386575
  7207. step: 71
  7208. running loss: 0.08055294538572641
  7209. Train Steps: 71/90 Loss: 0.0806 torch.Size([8, 600, 800])
  7210. torch.Size([8, 8])
  7211. tensor([[0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  7212. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  7213. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  7214. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  7215. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  7216. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  7217. [0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373],
  7218. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991]],
  7219. device='cuda:0', dtype=torch.float64)
  7220. predictions are: tensor([[ 0.3293, -0.5473, 1.5970, -0.7552, -0.4687, -1.1431, 0.3605, 0.2590],
  7221. [ 0.5273, -0.4548, 1.5444, -0.1336, -0.3016, -0.1362, 0.2556, 0.2522],
  7222. [ 0.5754, -0.4633, 1.3858, -1.3929, -0.2541, -1.4203, 0.6970, 0.2267],
  7223. [ 0.3987, -0.5329, 1.1977, -1.1102, -0.6819, -0.5298, 0.3855, 0.2635],
  7224. [ 0.7827, -0.3052, 1.5950, -0.4448, -0.5119, 0.0966, 0.5064, 0.1696],
  7225. [ 0.7617, -0.3088, 1.5791, 0.0172, -0.4719, 0.0445, 0.3501, 0.2548],
  7226. [ 0.5747, -0.4432, 1.4921, -0.0964, -0.5980, -0.3201, 0.3020, 0.2039],
  7227. [-0.0334, -0.8246, 1.8454, -0.9392, -0.1398, -1.1044, 0.9246, 0.2017]],
  7228. device='cuda:0', grad_fn=<AddmmBackward>)
  7229. landmarks are: tensor([[[ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  7230. 0.1929],
  7231. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  7232. 0.2634],
  7233. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  7234. 0.0851],
  7235. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  7236. 0.2545],
  7237. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  7238. -0.0322],
  7239. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  7240. 0.3161],
  7241. [ 0.5680, -0.4562, 1.5697, 0.4947, -0.4904, -0.1503, 0.3536,
  7242. 0.1956],
  7243. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  7244. 0.4814]]], device='cuda:0')
  7245. loss_train_step before backward: tensor(0.0389, device='cuda:0', grad_fn=<MseLossBackward>)
  7246. loss_train_step after backward: tensor(0.0389, device='cuda:0', grad_fn=<MseLossBackward>)
  7247. loss_train: 5.758151488378644
  7248. step: 72
  7249. running loss: 0.07997432622748117
  7250. Train Steps: 72/90 Loss: 0.0800 torch.Size([8, 600, 800])
  7251. torch.Size([8, 8])
  7252. tensor([[0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  7253. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  7254. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  7255. [0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  7256. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  7257. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  7258. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  7259. [0.6152, 0.4131, 0.6863, 0.2567, 0.3625, 0.3300, 0.5765, 0.5305]],
  7260. device='cuda:0', dtype=torch.float64)
  7261. predictions are: tensor([[ 0.7339, -0.3342, 1.6868, -0.8073, -0.5287, -0.6222, 0.6321, 0.2477],
  7262. [ 0.2298, -0.6195, 1.3810, -1.2579, -0.2440, -1.3400, 0.6141, 0.2401],
  7263. [ 0.6787, -0.3341, 1.6653, 0.1779, -0.2311, -0.0670, 0.4532, 0.2377],
  7264. [ 0.1206, -0.7352, 1.1463, -1.0930, -0.5663, -0.8224, 0.2956, 0.2897],
  7265. [ 0.6156, -0.3924, 1.8099, -0.0031, -0.2276, 0.0718, 0.4336, 0.1735],
  7266. [ 0.9364, -0.2195, 1.8013, -0.1140, -0.5267, -0.1311, 0.5028, 0.1453],
  7267. [-0.1940, -0.9203, 1.4506, -1.0456, -0.4763, -1.1710, 0.3304, 0.2000],
  7268. [ 0.4077, -0.5119, 1.1473, -1.1172, -0.5598, -0.7982, 0.3682, 0.2957]],
  7269. device='cuda:0', grad_fn=<AddmmBackward>)
  7270. landmarks are: tensor([[[ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  7271. 0.5624],
  7272. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  7273. 0.2083],
  7274. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  7275. 0.3084],
  7276. [ 0.5049, -0.4428, 0.8692, -0.9581, -0.6693, -0.8386, 0.0897,
  7277. 0.2589],
  7278. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  7279. 0.0682],
  7280. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  7281. 0.2314],
  7282. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  7283. -0.0220],
  7284. [ 0.5557, -0.3779, 0.8838, -1.1004, -0.6115, -0.7617, 0.3769,
  7285. 0.1644]]], device='cuda:0')
  7286. loss_train_step before backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  7287. loss_train_step after backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  7288. loss_train: 5.796630242839456
  7289. step: 73
  7290. running loss: 0.0794058937375268
  7291. Train Steps: 73/90 Loss: 0.0794 torch.Size([8, 600, 800])
  7292. torch.Size([8, 8])
  7293. tensor([[0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  7294. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  7295. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  7296. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633],
  7297. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  7298. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  7299. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  7300. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285]],
  7301. device='cuda:0', dtype=torch.float64)
  7302. predictions are: tensor([[ 0.2847, -0.5792, 1.3632, -0.7519, -0.6296, -0.4213, 0.2320, 0.2479],
  7303. [ 0.9402, -0.1907, 1.7925, -0.0052, -0.3164, 0.1891, 0.5462, 0.1902],
  7304. [-0.1207, -0.9044, 1.0360, -1.2763, -0.4952, -1.2274, 0.1613, 0.3052],
  7305. [ 0.5824, -0.4396, 1.6488, -1.2598, -0.1587, -1.4267, 0.8792, 0.1771],
  7306. [-0.1792, -0.8918, 1.1804, -1.4088, -0.4414, -1.3778, 0.3201, 0.2816],
  7307. [ 0.9521, -0.1891, 1.8129, -0.1594, -0.1669, 0.0568, 0.5431, 0.2250],
  7308. [ 0.5457, -0.4516, 1.6558, 0.1544, -0.5624, -0.3605, 0.2724, 0.1758],
  7309. [ 0.7240, -0.3286, 1.6456, -0.6170, -0.5346, -0.1263, 0.6180, 0.1891]],
  7310. device='cuda:0', grad_fn=<AddmmBackward>)
  7311. landmarks are: tensor([[[ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  7312. 0.2386],
  7313. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  7314. 0.1661],
  7315. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  7316. 0.3852],
  7317. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  7318. 0.3157],
  7319. [ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  7320. 0.3161],
  7321. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  7322. 0.4162],
  7323. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  7324. 0.1544],
  7325. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  7326. 0.1554]]], device='cuda:0')
  7327. loss_train_step before backward: tensor(0.0481, device='cuda:0', grad_fn=<MseLossBackward>)
  7328. loss_train_step after backward: tensor(0.0481, device='cuda:0', grad_fn=<MseLossBackward>)
  7329. loss_train: 5.844778308644891
  7330. step: 74
  7331. running loss: 0.07898349065736339
  7332.  
  7333. Train Steps: 74/90 Loss: 0.0790 torch.Size([8, 600, 800])
  7334. torch.Size([8, 8])
  7335. tensor([[0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  7336. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  7337. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  7338. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  7339. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  7340. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  7341. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  7342. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563]],
  7343. device='cuda:0', dtype=torch.float64)
  7344. predictions are: tensor([[ 0.6634, -0.3417, 1.6444, -0.0885, -0.5261, 0.1245, 0.4036, 0.2044],
  7345. [ 0.0769, -0.6972, 1.6346, -1.2106, 0.0788, -1.1002, 0.9462, 0.1777],
  7346. [ 0.7241, -0.3058, 1.3758, -0.9954, -0.4782, -0.8373, 0.4019, 0.2229],
  7347. [-0.9479, -1.3831, 1.1639, -1.1251, -0.3941, -1.1239, 0.1696, 0.2574],
  7348. [ 0.7407, -0.2983, 1.7178, 0.0877, -0.3567, 0.4966, 0.5218, 0.1839],
  7349. [ 0.7174, -0.3030, 1.2691, -0.8878, -0.4343, -0.9197, 0.4034, 0.2610],
  7350. [ 0.7942, -0.2631, 1.2833, -0.8850, -0.3832, -0.8959, 0.4042, 0.2976],
  7351. [ 0.4527, -0.4678, 1.5730, -0.3388, -0.6123, -0.5245, 0.2143, 0.1994]],
  7352. device='cuda:0', grad_fn=<AddmmBackward>)
  7353. landmarks are: tensor([[[ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  7354. 0.3267],
  7355. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  7356. 0.2730],
  7357. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  7358. 0.2853],
  7359. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  7360. 0.2853],
  7361. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  7362. 0.3047],
  7363. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  7364. 0.3854],
  7365. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  7366. 0.6084],
  7367. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  7368. 0.2837]]], device='cuda:0')
  7369. loss_train_step before backward: tensor(0.0734, device='cuda:0', grad_fn=<MseLossBackward>)
  7370. loss_train_step after backward: tensor(0.0734, device='cuda:0', grad_fn=<MseLossBackward>)
  7371. loss_train: 5.9181370083242655
  7372. step: 75
  7373. running loss: 0.07890849344432355
  7374. Train Steps: 75/90 Loss: 0.0789 torch.Size([8, 600, 800])
  7375. torch.Size([8, 8])
  7376. tensor([[0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  7377. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  7378. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  7379. [0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  7380. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  7381. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  7382. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  7383. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733]],
  7384. device='cuda:0', dtype=torch.float64)
  7385. predictions are: tensor([[ 0.4961, -0.4331, 1.5760, -0.2348, -0.5834, -0.4121, 0.2109, 0.2769],
  7386. [ 0.7604, -0.2908, 1.7494, -0.1816, -0.3328, 0.1616, 0.4631, 0.2463],
  7387. [ 0.6928, -0.3400, 1.6568, -0.1040, -0.4998, -0.2940, 0.4876, 0.1865],
  7388. [ 0.5090, -0.4994, 1.2263, -1.5922, -0.1983, -1.5729, 0.5735, 0.2009],
  7389. [ 0.4650, -0.4823, 1.6588, -0.0199, -0.2635, -0.0374, 0.3917, 0.1881],
  7390. [ 0.7070, -0.3193, 1.6073, -0.4942, -0.5277, -0.3145, 0.2996, 0.2586],
  7391. [ 0.6871, -0.3422, 1.4430, -0.9179, -0.5518, -0.4318, 0.6278, 0.2200],
  7392. [-0.7194, -1.2560, 1.0205, -1.5431, -0.1226, -1.5735, 0.3658, 0.3317]],
  7393. device='cuda:0', grad_fn=<AddmmBackward>)
  7394. landmarks are: tensor([[[ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  7395. 0.4357],
  7396. [ 0.5711, -0.3788, 1.8249, -0.1766, -0.4672, 0.2160, 0.3625,
  7397. 0.0742],
  7398. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  7399. 0.1082],
  7400. [ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  7401. -0.0248],
  7402. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  7403. 0.0159],
  7404. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  7405. 0.3238],
  7406. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  7407. 0.1576],
  7408. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  7409. 0.3623]]], device='cuda:0')
  7410. loss_train_step before backward: tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward>)
  7411. loss_train_step after backward: tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward>)
  7412. loss_train: 5.985258931294084
  7413. step: 76
  7414. running loss: 0.07875340699071162
  7415. Train Steps: 76/90 Loss: 0.0788 torch.Size([8, 600, 800])
  7416. torch.Size([8, 8])
  7417. tensor([[0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  7418. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  7419. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  7420. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  7421. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  7422. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633],
  7423. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  7424. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077]],
  7425. device='cuda:0', dtype=torch.float64)
  7426. predictions are: tensor([[ 0.2429, -0.6192, 1.5609, 0.0381, -0.3987, 0.1600, 0.2758, 0.2319],
  7427. [ 0.6422, -0.3465, 1.4123, -0.8676, -0.6071, -0.7099, 0.3021, 0.2425],
  7428. [ 0.4155, -0.4701, 1.5756, -1.0316, -0.1855, -0.9949, 0.7275, 0.2318],
  7429. [ 0.2456, -0.6119, 1.5407, -0.1703, -0.4710, 0.0538, 0.3149, 0.2587],
  7430. [ 0.4306, -0.5004, 1.4961, -0.8191, -0.3195, -1.1378, 0.4181, 0.2407],
  7431. [ 0.6043, -0.4138, 1.4270, -1.2980, -0.1460, -1.2675, 0.8263, 0.2275],
  7432. [ 0.3764, -0.5286, 1.5590, 0.0285, -0.3335, 0.1087, 0.2864, 0.2451],
  7433. [ 0.3725, -0.5430, 1.1990, -0.9545, -0.6115, -0.5813, 0.2128, 0.2504]],
  7434. device='cuda:0', grad_fn=<AddmmBackward>)
  7435. landmarks are: tensor([[[ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  7436. 0.0663],
  7437. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  7438. 0.1753],
  7439. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  7440. 0.3050],
  7441. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  7442. 0.3469],
  7443. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  7444. -0.0529],
  7445. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  7446. 0.3157],
  7447. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  7448. 0.0711],
  7449. [ 0.5270, -0.4336, 1.3342, -0.6770, -0.6520, -0.5384, 0.2370,
  7450. 0.0592]]], device='cuda:0')
  7451. loss_train_step before backward: tensor(0.0258, device='cuda:0', grad_fn=<MseLossBackward>)
  7452. loss_train_step after backward: tensor(0.0258, device='cuda:0', grad_fn=<MseLossBackward>)
  7453. loss_train: 6.011011159047484
  7454. step: 77
  7455. running loss: 0.07806507998762967
  7456. Train Steps: 77/90 Loss: 0.0781 torch.Size([8, 600, 800])
  7457. torch.Size([8, 8])
  7458. tensor([[0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  7459. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  7460. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  7461. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  7462. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  7463. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  7464. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  7465. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433]],
  7466. device='cuda:0', dtype=torch.float64)
  7467. predictions are: tensor([[ 0.4532, -0.4790, 1.3550, -0.6564, -0.5215, -0.4282, 0.2318, 0.2345],
  7468. [ 0.3515, -0.5440, 1.4068, -1.3205, -0.1814, -1.4695, 0.5088, 0.2038],
  7469. [ 0.1470, -0.6419, 1.4864, -0.0764, -0.4137, -0.0734, 0.2511, 0.2779],
  7470. [ 0.4911, -0.4676, 1.3029, -1.1856, -0.4020, -1.2807, 0.5175, 0.2134],
  7471. [ 0.4871, -0.4626, 1.7018, 0.0512, -0.3980, 0.0687, 0.4746, 0.2630],
  7472. [ 0.3120, -0.5893, 1.3329, -0.9873, -0.5125, -0.4713, 0.4975, 0.2488],
  7473. [ 0.5257, -0.4181, 1.4685, -0.6656, -0.6150, -0.5175, 0.4017, 0.2125],
  7474. [ 0.6028, -0.3793, 1.7381, -0.1580, -0.0723, -0.1443, 0.4997, 0.2906]],
  7475. device='cuda:0', grad_fn=<AddmmBackward>)
  7476. landmarks are: tensor([[[ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  7477. 0.1552],
  7478. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  7479. 0.0807],
  7480. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  7481. 0.1768],
  7482. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  7483. 0.2043],
  7484. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  7485. 0.3905],
  7486. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  7487. 0.1390],
  7488. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  7489. 0.2365],
  7490. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  7491. 0.2237]]], device='cuda:0')
  7492. loss_train_step before backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  7493. loss_train_step after backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  7494. loss_train: 6.053500270470977
  7495. step: 78
  7496. running loss: 0.07760897782655099
  7497.  
  7498. Train Steps: 78/90 Loss: 0.0776 torch.Size([8, 600, 800])
  7499. torch.Size([8, 8])
  7500. tensor([[0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  7501. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  7502. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  7503. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  7504. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  7505. [0.6216, 0.4100, 0.7350, 0.2067, 0.4325, 0.2050, 0.5950, 0.5333],
  7506. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  7507. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676]],
  7508. device='cuda:0', dtype=torch.float64)
  7509. predictions are: tensor([[ 0.4413, -0.4662, 1.6231, -0.0098, -0.5385, -0.2463, 0.3870, 0.2384],
  7510. [-0.1857, -0.8836, 1.1719, -1.4335, -0.3002, -1.3386, 0.4504, 0.2599],
  7511. [ 0.3408, -0.5526, 1.1232, -1.1451, -0.6713, -0.8068, 0.2262, 0.2412],
  7512. [ 0.4423, -0.5052, 1.7007, 0.0671, -0.4582, -0.0958, 0.4439, 0.1918],
  7513. [ 0.5977, -0.3991, 1.6609, -0.2335, -0.4152, -0.0203, 0.4947, 0.2128],
  7514. [ 0.4420, -0.4872, 1.0551, -1.5288, -0.4055, -1.4832, 0.4326, 0.2587],
  7515. [ 0.4850, -0.4208, 1.7230, -0.2698, -0.1252, -0.2177, 0.5447, 0.2066],
  7516. [ 0.7261, -0.3160, 1.7007, -0.2241, -0.2409, -0.1268, 0.4922, 0.2211]],
  7517. device='cuda:0', grad_fn=<AddmmBackward>)
  7518. landmarks are: tensor([[[ 6.1149e-01, -3.7244e-01, 1.7557e+00, 3.4688e-01, -4.4411e-01,
  7519. -1.0731e-01, 4.9122e-01, 2.3911e-01],
  7520. [ 5.8487e-01, -3.8360e-01, 1.2649e+00, -1.2236e+00, -3.4596e-01,
  7521. -1.2313e+00, 4.5081e-01, 1.6982e-01],
  7522. [ 5.3591e-01, -4.1932e-01, 9.3580e-01, -8.2325e-01, -6.6351e-01,
  7523. -7.2317e-01, 9.4325e-02, 1.7099e-01],
  7524. [ 5.7748e-01, -4.6066e-01, 1.6741e+00, 1.9623e-01, -4.0362e-01,
  7525. -1.2115e-01, 4.5876e-01, 1.9786e-01],
  7526. [ 5.6039e-01, -4.6197e-01, 1.7961e+00, -1.9969e-01, -3.2286e-01,
  7527. 1.0824e-01, 4.1039e-01, 2.5450e-01],
  7528. [ 5.8528e-01, -3.9199e-01, 1.1090e+00, -1.3313e+00, -2.8822e-01,
  7529. -1.3390e+00, 4.6236e-01, 1.7752e-01],
  7530. [ 5.3508e-01, -4.3212e-01, 1.7326e+00, -1.3811e-01, 4.6329e-02,
  7531. 1.0491e-01, 4.1617e-01, 2.7760e-01],
  7532. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  7533. 4.6189e-04, 2.9049e-01, 3.3573e-01]]], device='cuda:0')
  7534. loss_train_step before backward: tensor(0.0302, device='cuda:0', grad_fn=<MseLossBackward>)
  7535. loss_train_step after backward: tensor(0.0302, device='cuda:0', grad_fn=<MseLossBackward>)
  7536. loss_train: 6.083718063309789
  7537. step: 79
  7538. running loss: 0.07700908940898467
  7539. Train Steps: 79/90 Loss: 0.0770 torch.Size([8, 600, 800])
  7540. torch.Size([8, 8])
  7541. tensor([[0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  7542. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  7543. [0.6296, 0.4045, 0.9138, 0.4100, 0.4232, 0.4242, 0.7422, 0.5297],
  7544. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  7545. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  7546. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  7547. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  7548. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742]],
  7549. device='cuda:0', dtype=torch.float64)
  7550. predictions are: tensor([[ 0.1627, -0.6941, 0.9786, -1.1865, -0.5091, -0.9566, 0.1641, 0.3193],
  7551. [ 0.4703, -0.4958, 1.7074, 0.0998, -0.4157, -0.0632, 0.4524, 0.1856],
  7552. [ 0.6864, -0.3392, 1.5980, -0.5553, -0.4134, -0.3026, 0.6323, 0.1914],
  7553. [ 0.4189, -0.4609, 1.6604, -0.2478, -0.3532, -0.0982, 0.3636, 0.2113],
  7554. [ 0.6215, -0.3834, 1.6149, -0.8199, -0.2564, -1.1783, 0.5599, 0.1797],
  7555. [ 0.3355, -0.5244, 1.5251, -0.3258, -0.3835, -0.0800, 0.3727, 0.2703],
  7556. [ 0.4983, -0.4797, 1.2142, -1.1775, -0.5485, -0.8428, 0.4820, 0.2132],
  7557. [ 0.3679, -0.5232, 1.6810, -0.1140, -0.4568, -0.6179, 0.4762, 0.1681]],
  7558. device='cuda:0', grad_fn=<AddmmBackward>)
  7559. landmarks are: tensor([[[ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  7560. 0.4103],
  7561. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  7562. 0.0111],
  7563. [ 0.6224, -0.4177, 1.9346, -0.3921, -0.3314, -0.3264, 1.1422,
  7564. 0.1608],
  7565. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  7566. 0.1439],
  7567. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  7568. -0.0529],
  7569. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  7570. 0.3968],
  7571. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  7572. 0.2545],
  7573. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  7574. -0.0957]]], device='cuda:0')
  7575. loss_train_step before backward: tensor(0.0294, device='cuda:0', grad_fn=<MseLossBackward>)
  7576. loss_train_step after backward: tensor(0.0294, device='cuda:0', grad_fn=<MseLossBackward>)
  7577. loss_train: 6.113160545006394
  7578. step: 80
  7579. running loss: 0.07641450681257993
  7580. Train Steps: 80/90 Loss: 0.0764 torch.Size([8, 600, 800])
  7581. torch.Size([8, 8])
  7582. tensor([[0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  7583. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  7584. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  7585. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  7586. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  7587. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  7588. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  7589. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392]],
  7590. device='cuda:0', dtype=torch.float64)
  7591. predictions are: tensor([[ 0.6616, -0.3725, 1.5009, -1.1986, -0.1821, -1.1744, 0.8349, 0.1502],
  7592. [ 0.5140, -0.4440, 1.6731, 0.1572, -0.5335, -0.1048, 0.4126, 0.1451],
  7593. [ 0.2424, -0.6267, 1.0445, -1.1448, -0.6994, -0.8297, 0.1809, 0.2472],
  7594. [ 0.5195, -0.4319, 1.5449, -1.2729, -0.2066, -1.1167, 0.6421, 0.1443],
  7595. [ 0.6524, -0.3687, 1.5164, -0.6111, -0.6951, -0.3538, 0.4975, 0.2012],
  7596. [ 0.4303, -0.4790, 1.5850, 0.0598, -0.2176, -0.2040, 0.3833, 0.2430],
  7597. [ 0.2529, -0.5771, 1.5279, 0.0467, -0.2950, -0.1728, 0.3096, 0.2634],
  7598. [ 0.3993, -0.4989, 1.6358, 0.0904, -0.4416, -0.0155, 0.3070, 0.2172]],
  7599. device='cuda:0', grad_fn=<AddmmBackward>)
  7600. landmarks are: tensor([[[ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  7601. 0.2356],
  7602. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  7603. -0.0049],
  7604. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  7605. 0.3315],
  7606. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  7607. -0.0209],
  7608. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  7609. 0.2930],
  7610. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  7611. 0.2997],
  7612. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  7613. 0.3084],
  7614. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  7615. 0.2048]]], device='cuda:0')
  7616. loss_train_step before backward: tensor(0.0210, device='cuda:0', grad_fn=<MseLossBackward>)
  7617. loss_train_step after backward: tensor(0.0210, device='cuda:0', grad_fn=<MseLossBackward>)
  7618. loss_train: 6.13416051492095
  7619. step: 81
  7620. running loss: 0.07573037672741914
  7621. Train Steps: 81/90 Loss: 0.0757 torch.Size([8, 600, 800])
  7622. torch.Size([8, 8])
  7623. tensor([[ nan, nan, 0.7412, 0.2200, 0.4450, 0.1517, 0.5312, 0.4983],
  7624. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  7625. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  7626. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  7627. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  7628. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  7629. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  7630. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309]],
  7631. device='cuda:0', dtype=torch.float64)
  7632. predictions are: tensor([[-0.8470, -1.3406, 0.9710, -1.2401, -0.3874, -1.3271, 0.1391, 0.1894],
  7633. [ 0.9333, -0.1303, 1.5740, -0.8103, -0.3536, -0.8830, 0.5989, 0.1798],
  7634. [ 0.9719, -0.1713, 1.7116, 0.3834, -0.6196, -0.0734, 0.4194, 0.1456],
  7635. [ 0.8045, -0.2672, 1.7701, -0.0866, -0.4186, 0.3582, 0.5741, 0.2192],
  7636. [ 0.7323, -0.2955, 1.8138, 0.0565, -0.1777, 0.2783, 0.5645, 0.2337],
  7637. [-0.4810, -1.0622, 1.0033, -1.1718, -0.4243, -1.2152, 0.1338, 0.2037],
  7638. [ 0.8303, -0.2347, 1.4033, -0.9560, -0.4656, -0.8805, 0.6346, 0.1497],
  7639. [ 0.6676, -0.2687, 1.7781, 0.0762, -0.3945, -0.3554, 0.4669, 0.1738]],
  7640. device='cuda:0', grad_fn=<AddmmBackward>)
  7641. landmarks are: tensor([[[-2.2859, -2.2859, 1.1379, -1.2697, -0.2305, -1.5854, 0.1679,
  7642. 0.0159],
  7643. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  7644. 0.1931],
  7645. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  7646. -0.1278],
  7647. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  7648. 0.2622],
  7649. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  7650. 0.1082],
  7651. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  7652. 0.1343],
  7653. [ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  7654. 0.1214],
  7655. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  7656. 0.1661]]], device='cuda:0')
  7657. loss_train_step before backward: tensor(0.0915, device='cuda:0', grad_fn=<MseLossBackward>)
  7658. loss_train_step after backward: tensor(0.0915, device='cuda:0', grad_fn=<MseLossBackward>)
  7659. loss_train: 6.2256993018090725
  7660. step: 82
  7661. running loss: 0.07592316221718381
  7662.  
  7663. Train Steps: 82/90 Loss: 0.0759 torch.Size([8, 600, 800])
  7664. torch.Size([8, 8])
  7665. tensor([[0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  7666. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  7667. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  7668. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  7669. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  7670. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  7671. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  7672. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500]],
  7673. device='cuda:0', dtype=torch.float64)
  7674. predictions are: tensor([[-0.4372, -1.0773, 0.9684, -1.1526, -0.4889, -1.4327, 0.1665, 0.1314],
  7675. [ 0.8245, -0.2356, 1.2412, -1.2070, -0.3522, -1.4770, 0.4970, 0.1102],
  7676. [ 0.6625, -0.3387, 1.8488, 0.0791, -0.2400, 0.1239, 0.5469, 0.1703],
  7677. [ 0.6149, -0.3869, 1.8176, 0.0247, -0.3495, -0.1160, 0.5422, 0.1320],
  7678. [ 0.5138, -0.4426, 1.1079, -0.9809, -0.7097, -0.8575, 0.2407, 0.2462],
  7679. [ 0.6288, -0.3711, 1.8621, 0.0934, -0.3120, 0.1545, 0.6857, 0.1629],
  7680. [ 0.4593, -0.4756, 1.8160, 0.1128, -0.2644, 0.2836, 0.5064, 0.1714],
  7681. [ 0.5796, -0.3572, 1.7196, 0.0223, -0.5261, -0.5082, 0.3354, 0.1745]],
  7682. device='cuda:0', grad_fn=<AddmmBackward>)
  7683. landmarks are: tensor([[[ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  7684. 0.1013],
  7685. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  7686. 0.1005],
  7687. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  7688. 0.0622],
  7689. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  7690. 0.3546],
  7691. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  7692. 0.3854],
  7693. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  7694. 0.1661],
  7695. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  7696. 0.0412],
  7697. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  7698. 0.2545]]], device='cuda:0')
  7699. loss_train_step before backward: tensor(0.0369, device='cuda:0', grad_fn=<MseLossBackward>)
  7700. loss_train_step after backward: tensor(0.0369, device='cuda:0', grad_fn=<MseLossBackward>)
  7701. loss_train: 6.262647982686758
  7702. step: 83
  7703. running loss: 0.07545359015285251
  7704. Train Steps: 83/90 Loss: 0.0755 torch.Size([8, 600, 800])
  7705. torch.Size([8, 8])
  7706. tensor([[0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  7707. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  7708. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  7709. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  7710. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  7711. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  7712. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  7713. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083]],
  7714. device='cuda:0', dtype=torch.float64)
  7715. predictions are: tensor([[ 0.5588, -0.4253, 1.3032, -0.8714, -0.5930, -0.6349, 0.4121, 0.1612],
  7716. [ 0.5840, -0.3910, 1.6718, -0.5996, -0.2422, -0.9303, 0.5476, 0.1022],
  7717. [ 0.5503, -0.4172, 1.4038, -0.4003, -0.5918, -0.4394, 0.2558, 0.1828],
  7718. [ 0.0503, -0.7139, 1.2194, -0.9917, -0.2453, -1.0379, 0.3115, 0.1644],
  7719. [ 0.6324, -0.3348, 1.6029, -0.8426, -0.1930, -0.8667, 0.6539, 0.1151],
  7720. [ 0.6758, -0.3652, 1.8777, 0.4324, -0.4339, 0.3469, 0.6145, 0.1447],
  7721. [ 0.5173, -0.4611, 1.6718, 0.3990, -0.4012, 0.1117, 0.4887, 0.2058],
  7722. [ 0.4877, -0.4613, 1.7446, -0.1365, -0.5940, -0.5164, 0.3340, 0.0479]],
  7723. device='cuda:0', grad_fn=<AddmmBackward>)
  7724. landmarks are: tensor([[[ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  7725. 0.2237],
  7726. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  7727. -0.0263],
  7728. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  7729. 0.2206],
  7730. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  7731. 0.1698],
  7732. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  7733. 0.1467],
  7734. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  7735. 0.2196],
  7736. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  7737. 0.3745],
  7738. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  7739. 0.0620]]], device='cuda:0')
  7740. loss_train_step before backward: tensor(0.0327, device='cuda:0', grad_fn=<MseLossBackward>)
  7741. loss_train_step after backward: tensor(0.0327, device='cuda:0', grad_fn=<MseLossBackward>)
  7742. loss_train: 6.2953284196555614
  7743. step: 84
  7744. running loss: 0.0749443859482805
  7745. Train Steps: 84/90 Loss: 0.0749 torch.Size([8, 600, 800])
  7746. torch.Size([8, 8])
  7747. tensor([[0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  7748. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  7749. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  7750. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  7751. [0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915],
  7752. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  7753. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280],
  7754. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883]],
  7755. device='cuda:0', dtype=torch.float64)
  7756. predictions are: tensor([[ 0.5941, -0.4105, 1.7887, 0.0018, -0.3170, 0.2443, 0.5468, 0.1424],
  7757. [ 0.8466, -0.2356, 1.7616, -0.3460, -0.4721, -0.6073, 0.5775, 0.1030],
  7758. [ 0.6348, -0.4047, 1.4215, -1.2086, -0.3035, -1.2415, 0.7195, 0.0656],
  7759. [ 0.6285, -0.3556, 1.6495, 0.1077, -0.5253, -0.5284, 0.3942, 0.1090],
  7760. [ 0.5837, -0.3673, 1.7452, -0.1876, -0.4923, -0.7255, 0.4623, 0.0394],
  7761. [ 0.6060, -0.3984, 1.7194, -0.0774, -0.5157, -0.1249, 0.5227, 0.1249],
  7762. [ 0.3936, -0.5132, 1.6742, 0.0635, -0.1754, 0.0217, 0.4127, 0.1566],
  7763. [-0.0444, -0.7899, 1.1317, -0.8592, -0.4773, -0.8693, 0.1572, 0.2092]],
  7764. device='cuda:0', grad_fn=<AddmmBackward>)
  7765. landmarks are: tensor([[[ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  7766. 0.0652],
  7767. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  7768. 0.1005],
  7769. [ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  7770. -0.0583],
  7771. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  7772. 0.1698],
  7773. [ 0.6148, -0.3918, 1.8942, -0.1920, -0.5423, -0.8002, 0.6414,
  7774. -0.0156],
  7775. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  7776. 0.1779],
  7777. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  7778. 0.1530],
  7779. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  7780. 0.4316]]], device='cuda:0')
  7781. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  7782. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  7783. loss_train: 6.315675836056471
  7784. step: 85
  7785. running loss: 0.0743020686594879
  7786. Train Steps: 85/90 Loss: 0.0743 torch.Size([8, 600, 800])
  7787. torch.Size([8, 8])
  7788. tensor([[0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  7789. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  7790. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  7791. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  7792. [0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  7793. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  7794. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  7795. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456]],
  7796. device='cuda:0', dtype=torch.float64)
  7797. predictions are: tensor([[ 1.0889, -0.0847, 1.4050, -1.0740, -0.3015, -1.3084, 0.4984, 0.0900],
  7798. [ 0.7538, -0.3029, 1.8606, 0.0660, -0.4251, 0.0576, 0.5933, 0.1187],
  7799. [ 0.3395, -0.5567, 1.6117, -0.3520, -0.5353, -0.2820, 0.4529, 0.1650],
  7800. [ 0.7772, -0.2671, 1.8426, 0.1250, -0.5436, -0.4465, 0.5795, 0.0673],
  7801. [ 0.4460, -0.5134, 1.7618, -0.0583, -0.5205, -0.1142, 0.5861, 0.0676],
  7802. [-0.0893, -0.8130, 1.1007, -1.2895, -0.3983, -1.5112, 0.2485, 0.0711],
  7803. [ 0.5626, -0.4279, 1.7289, 0.1548, -0.2305, -0.0760, 0.4865, 0.1444],
  7804. [ 0.4831, -0.4688, 1.6880, 0.0459, -0.3398, -0.0117, 0.4747, 0.1757]],
  7805. device='cuda:0', grad_fn=<AddmmBackward>)
  7806. landmarks are: tensor([[[ 5.7679e-01, -4.0308e-01, 1.3838e+00, -1.1527e+00, -2.1876e-01,
  7807. -1.4216e+00, 4.3790e-01, 1.8502e-01],
  7808. [ 5.9913e-01, -3.8029e-01, 1.8018e+00, -5.3426e-02, -3.4596e-01,
  7809. 1.8522e-01, 5.3741e-01, 1.3903e-01],
  7810. [ 5.2835e-01, -4.4288e-01, 1.5940e+00, -2.8437e-01, -5.8268e-01,
  7811. -1.4580e-01, 2.8226e-01, 3.2671e-01],
  7812. [ 6.5036e-01, -3.6471e-01, 1.7730e+00, 2.9299e-01, -6.0577e-01,
  7813. -2.3818e-01, 7.1085e-01, 1.6077e-01],
  7814. [ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  7815. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  7816. [ 5.6761e-01, -4.1124e-01, 1.1898e+00, -1.2467e+00, -2.9400e-01,
  7817. -1.4622e+00, 2.1029e-01, 1.3434e-01],
  7818. [ 5.4428e-01, -3.8314e-01, 1.7095e+00, 1.6212e-01, -2.0162e-01,
  7819. 1.3903e-01, 1.4368e-01, 2.3637e-01],
  7820. [ 5.4428e-01, -3.8399e-01, 1.7095e+00, 6.2048e-02, -3.9792e-01,
  7821. 1.9292e-01, 1.6218e-01, 2.3412e-01]]], device='cuda:0')
  7822. loss_train_step before backward: tensor(0.0275, device='cuda:0', grad_fn=<MseLossBackward>)
  7823. loss_train_step after backward: tensor(0.0275, device='cuda:0', grad_fn=<MseLossBackward>)
  7824. loss_train: 6.343135943636298
  7825. step: 86
  7826. running loss: 0.07375739469344533
  7827.  
  7828. Train Steps: 86/90 Loss: 0.0738 torch.Size([8, 600, 800])
  7829. torch.Size([8, 8])
  7830. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  7831. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  7832. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  7833. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  7834. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  7835. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  7836. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  7837. [0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533]],
  7838. device='cuda:0', dtype=torch.float64)
  7839. predictions are: tensor([[ 0.3789, -0.5709, 1.7497, -0.0941, -0.4350, -0.0917, 0.5710, 0.1533],
  7840. [ 0.6201, -0.4236, 1.7590, -0.4153, -0.6013, -0.2876, 0.6609, 0.0435],
  7841. [ 0.5135, -0.4883, 1.8328, 0.1927, -0.4158, -0.2144, 0.5694, 0.0815],
  7842. [ 0.7109, -0.2940, 1.6941, -0.1075, -0.5754, -0.5636, 0.3950, 0.1171],
  7843. [ 0.5652, -0.4250, 1.7889, 0.1220, -0.4005, -0.2076, 0.5230, 0.0870],
  7844. [ 0.5411, -0.4651, 1.1210, -1.0702, -0.5344, -1.0046, 0.2457, 0.1836],
  7845. [ 0.5682, -0.4166, 1.6892, -0.0446, -0.2701, -0.6571, 0.4846, 0.1540],
  7846. [ 0.8239, -0.2596, 1.5885, -0.9988, -0.3349, -0.9175, 0.5501, 0.0685]],
  7847. device='cuda:0', grad_fn=<AddmmBackward>)
  7848. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  7849. 0.5239],
  7850. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  7851. -0.0099],
  7852. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  7853. 0.1159],
  7854. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  7855. 0.4393],
  7856. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  7857. 0.2391],
  7858. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  7859. 0.4103],
  7860. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  7861. 0.5762],
  7862. [ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  7863. 0.2699]]], device='cuda:0')
  7864. loss_train_step before backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  7865. loss_train_step after backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  7866. loss_train: 6.368460373952985
  7867. step: 87
  7868. running loss: 0.07320069395348258
  7869. Train Steps: 87/90 Loss: 0.0732 torch.Size([8, 600, 800])
  7870. torch.Size([8, 8])
  7871. tensor([[0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  7872. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  7873. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  7874. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  7875. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  7876. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  7877. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  7878. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882]],
  7879. device='cuda:0', dtype=torch.float64)
  7880. predictions are: tensor([[ 0.3796, -0.5730, 1.8118, 0.0626, -0.1858, 0.1095, 0.5429, 0.1698],
  7881. [ 0.2873, -0.6146, 1.8132, 0.1036, -0.1824, 0.1075, 0.5311, 0.1494],
  7882. [ 0.6287, -0.3633, 1.7577, -0.1201, -0.5401, -0.5168, 0.4512, 0.1066],
  7883. [ 0.7294, -0.3134, 1.3254, -0.9326, -0.5984, -0.9560, 0.4578, 0.1106],
  7884. [ 0.6293, -0.3388, 1.7535, 0.0480, -0.4836, -0.6253, 0.4843, 0.1036],
  7885. [ 0.7504, -0.3159, 1.5468, -0.8603, -0.3524, -0.7077, 0.5296, 0.1618],
  7886. [ 0.6767, -0.3592, 1.1190, -1.0683, -0.5741, -1.1130, 0.3685, 0.1548],
  7887. [ 0.5433, -0.4318, 1.8166, 0.2886, -0.6087, -0.4237, 0.5091, 0.0742]],
  7888. device='cuda:0', grad_fn=<AddmmBackward>)
  7889. landmarks are: tensor([[[ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  7890. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  7891. [ 5.3585e-01, -4.3703e-01, 1.7095e+00, -3.0331e-02, -8.0370e-02,
  7892. -3.8029e-02, 1.0439e-01, 3.3918e-01],
  7893. [ 5.7875e-01, -4.1347e-01, 1.8214e+00, -2.4075e-01, -6.0389e-01,
  7894. -7.8543e-01, 4.1155e-01, 2.2033e-01],
  7895. [ 4.9971e-01, -4.4465e-01, 1.1610e+00, -9.7721e-01, -6.0577e-01,
  7896. -1.0311e+00, 1.4038e-01, -1.0312e-01],
  7897. [ 5.9007e-01, -4.0000e-01, 1.8423e+00, -6.8822e-02, -5.3072e-01,
  7898. -9.2333e-01, 3.6420e-01, 1.8522e-01],
  7899. [ 5.7783e-01, -3.9299e-01, 1.5189e+00, -9.3872e-01, -4.3256e-01,
  7900. -9.1563e-01, 4.8545e-01, 3.3918e-01],
  7901. [ 5.0531e-01, -4.2810e-01, 8.9538e-01, -1.3698e+00, -5.4226e-01,
  7902. -1.1389e+00, 2.4525e-01, 8.6245e-02],
  7903. [ 5.3788e-01, -4.3580e-01, 1.7326e+00, 1.8522e-01, -6.0577e-01,
  7904. -5.4611e-01, 6.8408e-02, -3.0981e-02]]], device='cuda:0')
  7905. loss_train_step before backward: tensor(0.0248, device='cuda:0', grad_fn=<MseLossBackward>)
  7906. loss_train_step after backward: tensor(0.0248, device='cuda:0', grad_fn=<MseLossBackward>)
  7907. loss_train: 6.393300803378224
  7908. step: 88
  7909. running loss: 0.07265114549293437
  7910. Train Steps: 88/90 Loss: 0.0727 torch.Size([8, 600, 800])
  7911. torch.Size([8, 8])
  7912. tensor([[0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  7913. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  7914. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  7915. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  7916. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  7917. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  7918. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  7919. [0.6289, 0.4024, 0.9088, 0.4567, 0.3937, 0.5633, 0.7058, 0.5609]],
  7920. device='cuda:0', dtype=torch.float64)
  7921. predictions are: tensor([[ 0.6858, -0.3454, 1.5921, -0.3030, -0.6412, -0.4857, 0.3554, 0.1860],
  7922. [ 0.6335, -0.4234, 1.8358, 0.0389, -0.5274, 0.0525, 0.6177, 0.1727],
  7923. [ 0.4526, -0.4640, 1.5374, -1.1822, -0.0993, -1.4783, 0.6228, 0.0749],
  7924. [ 0.0231, -0.7600, 1.2551, -0.8862, -0.6108, -1.3019, 0.1301, 0.1329],
  7925. [ 0.7427, -0.3045, 1.7052, -0.2803, -0.4116, -0.1438, 0.4753, 0.1974],
  7926. [ 0.8011, -0.2826, 1.6989, 0.2847, -0.3568, -0.3909, 0.3260, 0.1932],
  7927. [ 0.8804, -0.2614, 1.8125, 0.1778, -0.4982, 0.1325, 0.6062, 0.2211],
  7928. [ 0.7056, -0.3785, 1.8138, -0.0180, -0.5265, 0.0883, 0.6572, 0.2042]],
  7929. device='cuda:0', grad_fn=<AddmmBackward>)
  7930. landmarks are: tensor([[[ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  7931. 0.3265],
  7932. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  7933. 0.1554],
  7934. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  7935. 0.3104],
  7936. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  7937. 0.2699],
  7938. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  7939. 0.2936],
  7940. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  7941. 0.2138],
  7942. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  7943. 0.3157],
  7944. [ 0.6191, -0.4273, 1.9115, -0.1766, -0.4672, 0.3161, 0.9741,
  7945. 0.3050]]], device='cuda:0')
  7946. loss_train_step before backward: tensor(0.3238, device='cuda:0', grad_fn=<MseLossBackward>)
  7947. loss_train_step after backward: tensor(0.3238, device='cuda:0', grad_fn=<MseLossBackward>)
  7948. loss_train: 6.717064084485173
  7949. step: 89
  7950. running loss: 0.07547263016275475
  7951. Train Steps: 89/90 Loss: 0.0755 torch.Size([8, 600, 800])
  7952. torch.Size([8, 8])
  7953. tensor([[0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  7954. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  7955. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  7956. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  7957. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175],
  7958. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  7959. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  7960. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167]],
  7961. device='cuda:0', dtype=torch.float64)
  7962. predictions are: tensor([[ 0.6784, -0.3806, 1.9874, 0.0074, -0.5508, 0.0863, 0.5777, 0.2291],
  7963. [ 0.4791, -0.4740, 1.2944, -0.7627, -0.4662, -0.9881, 0.2634, 0.2488],
  7964. [ 0.7636, -0.3399, 1.8175, -0.1967, -0.4223, 0.0778, 0.7374, 0.2327],
  7965. [ 0.6685, -0.3923, 1.8977, 0.5432, -0.4429, -0.0133, 0.5661, 0.1591],
  7966. [ 0.6327, -0.3888, 1.1758, -0.9603, -0.4457, -1.3570, 0.2291, 0.1677],
  7967. [ 0.5583, -0.4858, 1.8936, 0.0071, -0.5720, 0.0042, 0.5830, 0.1419],
  7968. [-0.0687, -0.8334, 1.0642, -1.0043, -0.3935, -1.2683, 0.1451, 0.2017],
  7969. [ 0.8477, -0.2481, 1.7314, -0.2783, -0.5498, -0.6370, 0.5573, 0.1633]],
  7970. device='cuda:0', grad_fn=<AddmmBackward>)
  7971. landmarks are: tensor([[[ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  7972. 0.3161],
  7973. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  7974. 0.3546],
  7975. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  7976. 0.2249],
  7977. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  7978. -0.0049],
  7979. [ 0.5465, -0.4214, 0.9300, -1.2620, -0.3921, -1.3852, 0.2062,
  7980. 0.1043],
  7981. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  7982. -0.0670],
  7983. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  7984. 0.3604],
  7985. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  7986. 0.1005]]], device='cuda:0')
  7987. loss_train_step before backward: tensor(0.1345, device='cuda:0', grad_fn=<MseLossBackward>)
  7988. loss_train_step after backward: tensor(0.1345, device='cuda:0', grad_fn=<MseLossBackward>)
  7989. loss_train: 6.85155183263123
  7990. step: 90
  7991. running loss: 0.07612835369590255
  7992.  
  7993. Valid Steps: 10/10 Loss: nan 61
  7994. --------------------------------------------------
  7995. Epoch: 2 Train Loss: 0.0761 Valid Loss: nan
  7996. --------------------------------------------------
  7997. size of train loader is: 90
  7998. torch.Size([8, 600, 800])
  7999. torch.Size([8, 8])
  8000. tensor([[0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  8001. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  8002. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  8003. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  8004. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  8005. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  8006. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  8007. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142]],
  8008. device='cuda:0', dtype=torch.float64)
  8009. predictions are: tensor([[ 0.4644, -0.4431, 1.6816, -0.0788, -0.5316, -0.8118, 0.3678, 0.1957],
  8010. [ 0.3627, -0.5644, 1.7695, -0.1866, -0.3259, -0.4964, 0.6251, 0.2581],
  8011. [ 0.7497, -0.3301, 1.4605, -0.7863, -0.7153, -0.5758, 0.6303, 0.2166],
  8012. [ 0.5202, -0.4933, 1.6469, -0.0964, -0.5065, 0.0323, 0.4776, 0.2630],
  8013. [ 0.3867, -0.5193, 1.5639, -0.8843, -0.0533, -0.8858, 0.7233, 0.2240],
  8014. [ 0.3793, -0.5255, 1.4437, -0.7890, -0.4778, -0.8875, 0.3171, 0.1730],
  8015. [ 0.6539, -0.3837, 1.6159, 0.2937, -0.4373, -0.0220, 0.4100, 0.2954],
  8016. [ 0.3520, -0.5612, 1.6328, -0.0203, -0.6282, -0.1089, 0.2260, 0.2060]],
  8017. device='cuda:0', grad_fn=<AddmmBackward>)
  8018. landmarks are: tensor([[[ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  8019. 0.0081],
  8020. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  8021. 0.4600],
  8022. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  8023. 0.2006],
  8024. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  8025. 0.2545],
  8026. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  8027. 0.2142],
  8028. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  8029. 0.0851],
  8030. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  8031. 0.2853],
  8032. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  8033. 0.0893]]], device='cuda:0')
  8034. loss_train_step before backward: tensor(0.0298, device='cuda:0', grad_fn=<MseLossBackward>)
  8035. loss_train_step after backward: tensor(0.0298, device='cuda:0', grad_fn=<MseLossBackward>)
  8036. loss_train: 0.02976425550878048
  8037. step: 1
  8038. running loss: 0.02976425550878048
  8039. Train Steps: 1/90 Loss: 0.0298 torch.Size([8, 600, 800])
  8040. torch.Size([8, 8])
  8041. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  8042. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  8043. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  8044. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  8045. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  8046. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  8047. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  8048. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600]],
  8049. device='cuda:0', dtype=torch.float64)
  8050. predictions are: tensor([[ 0.2171, -0.6386, 1.4917, -0.9178, -0.3628, -0.8859, 0.3591, 0.1758],
  8051. [ 0.4784, -0.4798, 1.6804, 0.0476, -0.5666, -0.5235, 0.3980, 0.2267],
  8052. [ 0.2964, -0.6088, 1.7696, -0.4092, -0.2328, -0.7607, 0.5548, 0.2144],
  8053. [ 0.5832, -0.4517, 1.6893, -0.2107, -0.5384, -0.1259, 0.5803, 0.2860],
  8054. [ 0.6926, -0.3706, 1.8076, 0.1113, -0.5554, -0.0664, 0.6463, 0.2072],
  8055. [ 0.3910, -0.5487, 1.6927, -0.3536, -0.6326, -0.4973, 0.4058, 0.2500],
  8056. [ 0.3494, -0.5530, 1.1658, -0.9490, -0.4045, -0.9441, 0.3029, 0.3491],
  8057. [ 0.7162, -0.3370, 1.7149, 0.1530, -0.5052, -0.0180, 0.5345, 0.3138]],
  8058. device='cuda:0', grad_fn=<AddmmBackward>)
  8059. landmarks are: tensor([[[ 5.7997e-01, -4.3118e-01, 1.5709e+00, -1.0311e+00, -4.4411e-01,
  8060. -1.1081e+00, 3.8730e-01, 8.5142e-02],
  8061. [ 5.9013e-01, -4.1570e-01, 1.7557e+00, 1.9292e-01, -5.4226e-01,
  8062. -5.9230e-01, 3.5843e-01, 1.6982e-01],
  8063. [ 6.2236e-01, -4.3453e-01, 1.9404e+00, -2.9207e-01, -3.1709e-01,
  8064. -8.7714e-01, 1.0655e+00, 2.1421e-01],
  8065. [ 5.7131e-01, -4.1045e-01, 1.7557e+00, 4.6651e-02, -6.5196e-01,
  8066. -2.6898e-01, 3.9885e-01, 5.2394e-01],
  8067. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  8068. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  8069. [ 5.8799e-01, -3.8868e-01, 1.8423e+00, -3.3056e-01, -6.2309e-01,
  8070. -5.2302e-01, 4.0462e-01, 1.5443e-01],
  8071. [ 5.7460e-01, -4.0208e-01, 1.0801e+00, -1.1312e+00, -3.2286e-01,
  8072. -1.1081e+00, 4.8034e-01, 6.0842e-01],
  8073. [ 5.8909e-01, -3.5574e-01, 1.7326e+00, 3.3918e-01, -4.2102e-01,
  8074. -1.2271e-01, 3.2379e-01, 3.0069e-01]]], device='cuda:0')
  8075. loss_train_step before backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  8076. loss_train_step after backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  8077. loss_train: 0.053598225116729736
  8078. step: 2
  8079. running loss: 0.026799112558364868
  8080. Train Steps: 2/90 Loss: 0.0268 torch.Size([8, 600, 800])
  8081. torch.Size([8, 8])
  8082. tensor([[0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  8083. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  8084. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  8085. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  8086. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  8087. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  8088. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  8089. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  8090. device='cuda:0', dtype=torch.float64)
  8091. predictions are: tensor([[ 0.4246, -0.5008, 1.2521, -0.9797, -0.3414, -1.0541, 0.5136, 0.3221],
  8092. [-0.0271, -0.7760, 1.0477, -0.9932, -0.3399, -1.3101, 0.2273, 0.2716],
  8093. [ 0.7331, -0.3530, 1.8778, 0.4137, -0.4636, 0.0050, 0.6195, 0.2694],
  8094. [ 0.5305, -0.4416, 1.7704, -0.2950, -0.6993, -0.4477, 0.4500, 0.2283],
  8095. [ 0.0741, -0.7198, 1.4817, -0.8829, -0.1518, -1.0529, 0.5162, 0.2382],
  8096. [-0.0500, -0.7776, 1.3050, -0.7022, -0.4658, -0.7708, 0.1221, 0.3052],
  8097. [ 0.6535, -0.3872, 2.0202, -0.0684, -0.6126, 0.1059, 0.6727, 0.2721],
  8098. [ 0.8910, -0.2266, 1.7665, 0.1437, -0.5468, 0.1158, 0.6713, 0.2996]],
  8099. device='cuda:0', grad_fn=<AddmmBackward>)
  8100. landmarks are: tensor([[[ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  8101. 0.1852],
  8102. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  8103. 0.1253],
  8104. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  8105. 0.1313],
  8106. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  8107. 0.1753],
  8108. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  8109. -0.0369],
  8110. [ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  8111. 0.3237],
  8112. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  8113. 0.3161],
  8114. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  8115. 0.1768]]], device='cuda:0')
  8116. loss_train_step before backward: tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward>)
  8117. loss_train_step after backward: tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward>)
  8118. loss_train: 0.11081135272979736
  8119. step: 3
  8120. running loss: 0.03693711757659912
  8121. Train Steps: 3/90 Loss: 0.0369 torch.Size([8, 600, 800])
  8122. torch.Size([8, 8])
  8123. tensor([[0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  8124. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700],
  8125. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  8126. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  8127. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  8128. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  8129. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  8130. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795]],
  8131. device='cuda:0', dtype=torch.float64)
  8132. predictions are: tensor([[ 0.3962, -0.5233, 1.6373, -0.6012, -0.6109, -0.6016, 0.4131, 0.2866],
  8133. [ 0.8978, -0.2230, 1.7190, -0.6673, -0.4464, 0.1228, 0.8288, 0.3088],
  8134. [ 0.8697, -0.2394, 1.7297, 0.0657, -0.4729, -0.1425, 0.5340, 0.2836],
  8135. [ 0.4009, -0.5431, 1.8679, -0.2984, -0.4186, -0.5946, 0.6249, 0.2787],
  8136. [ 0.3967, -0.5239, 1.7884, -0.1002, -0.5768, -0.4514, 0.3042, 0.2203],
  8137. [ 0.2635, -0.5390, 1.5640, -0.2989, -0.2955, -0.9008, 0.3495, 0.3293],
  8138. [-0.8458, -1.3516, 0.9245, -1.1352, -0.3281, -1.4677, 0.0543, 0.2653],
  8139. [ 0.8833, -0.2316, 1.8017, -0.0581, -0.4491, -0.0319, 0.8155, 0.3043]],
  8140. device='cuda:0', grad_fn=<AddmmBackward>)
  8141. landmarks are: tensor([[[ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  8142. 0.3392],
  8143. [ 0.5671, -0.3988, 1.7499, -0.4614, -0.5423, 0.3007, 0.5894,
  8144. 0.3469],
  8145. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  8146. 0.1544],
  8147. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  8148. 0.2676],
  8149. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  8150. 0.0774],
  8151. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  8152. 0.5822],
  8153. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  8154. 0.2006],
  8155. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  8156. 0.3905]]], device='cuda:0')
  8157. loss_train_step before backward: tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward>)
  8158. loss_train_step after backward: tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward>)
  8159. loss_train: 0.18106389790773392
  8160. step: 4
  8161. running loss: 0.04526597447693348
  8162.  
  8163. Train Steps: 4/90 Loss: 0.0453 torch.Size([8, 600, 800])
  8164. torch.Size([8, 8])
  8165. tensor([[0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  8166. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  8167. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  8168. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  8169. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  8170. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  8171. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  8172. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799]],
  8173. device='cuda:0', dtype=torch.float64)
  8174. predictions are: tensor([[ 0.4974, -0.4397, 1.3189, -0.9185, -0.3947, -0.9882, 0.4938, 0.2704],
  8175. [-1.2384, -1.5859, 1.0754, -0.9062, -0.3067, -1.0850, 0.0830, 0.2715],
  8176. [ 0.8753, -0.2470, 1.9504, 0.1446, -0.6124, 0.1460, 0.6680, 0.2374],
  8177. [ 0.4194, -0.4939, 1.1516, -0.8221, -0.5055, -0.9677, 0.3401, 0.3332],
  8178. [ 0.2939, -0.5620, 1.6364, -0.6533, -0.2373, -0.7871, 0.6217, 0.2830],
  8179. [ 0.6833, -0.3461, 1.5232, -0.9011, -0.2480, -1.0147, 0.7707, 0.2400],
  8180. [ 0.9637, -0.1672, 2.0570, 0.1913, -0.6407, 0.2832, 0.6602, 0.2757],
  8181. [ 0.3353, -0.5188, 1.7350, -0.2497, -0.4663, -0.4829, 0.4751, 0.3412]],
  8182. device='cuda:0', grad_fn=<AddmmBackward>)
  8183. landmarks are: tensor([[[ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  8184. 0.1852],
  8185. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  8186. 0.1373],
  8187. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  8188. 0.0727],
  8189. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  8190. 0.2930],
  8191. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  8192. 0.2050],
  8193. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  8194. 0.0953],
  8195. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  8196. 0.1775],
  8197. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  8198. 0.3928]]], device='cuda:0')
  8199. loss_train_step before backward: tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward>)
  8200. loss_train_step after backward: tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward>)
  8201. loss_train: 0.24632898718118668
  8202. step: 5
  8203. running loss: 0.04926579743623734
  8204. Train Steps: 5/90 Loss: 0.0493 torch.Size([8, 600, 800])
  8205. torch.Size([8, 8])
  8206. tensor([[0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  8207. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  8208. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  8209. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  8210. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  8211. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  8212. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  8213. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967]],
  8214. device='cuda:0', dtype=torch.float64)
  8215. predictions are: tensor([[-0.0326, -0.7844, 1.3051, -0.8212, -0.3678, -1.0649, 0.3889, 0.3106],
  8216. [ 0.4314, -0.4934, 1.6887, -0.4932, -0.6464, -0.7139, 0.3917, 0.2290],
  8217. [ 0.2542, -0.5932, 1.1377, -0.9746, -0.4692, -1.0381, 0.3510, 0.3077],
  8218. [ 0.7676, -0.3140, 1.8666, 0.5899, -0.4083, 0.2689, 0.5522, 0.3187],
  8219. [ 0.6571, -0.3569, 1.7394, -0.4057, -0.6427, 0.3132, 0.6880, 0.2942],
  8220. [ 0.4241, -0.5237, 1.5921, -1.0009, -0.0236, -1.0447, 0.9168, 0.2845],
  8221. [ 0.3779, -0.5320, 1.3481, -0.8482, -0.5710, -1.0561, 0.4776, 0.2223],
  8222. [-0.1864, -0.8626, 1.5975, -0.7790, -0.1724, -0.9359, 0.5434, 0.2635]],
  8223. device='cuda:0', grad_fn=<AddmmBackward>)
  8224. landmarks are: tensor([[[ 5.9169e-01, -3.8607e-01, 1.0455e+00, -1.3698e+00, -2.8822e-01,
  8225. -1.1928e+00, 6.0670e-01, 2.0831e-01],
  8226. [ 5.4825e-01, -4.2490e-01, 1.5305e+00, -7.3857e-01, -6.1155e-01,
  8227. -8.6944e-01, 3.3533e-01, 1.0054e-01],
  8228. [ 5.7460e-01, -4.1527e-01, 1.0917e+00, -1.1620e+00, -4.0370e-01,
  8229. -1.3082e+00, 3.2339e-01, 3.2671e-01],
  8230. [ 5.6195e-01, -4.3457e-01, 1.6691e+00, 3.3149e-01, -2.5935e-01,
  8231. -7.2363e-03, 2.8915e-01, 2.8530e-01],
  8232. [ 5.4660e-01, -3.8397e-01, 1.5016e+00, -6.0770e-01, -6.4042e-01,
  8233. 2.0831e-01, 3.8714e-01, 8.6245e-02],
  8234. [ 6.2072e-01, -3.9360e-01, 1.7788e+00, -1.1235e+00, 1.4480e-01,
  8235. -1.0850e+00, 1.1459e+00, 1.9818e-01],
  8236. [ 5.6184e-01, -3.8945e-01, 1.2129e+00, -1.4853e+00, -5.1339e-01,
  8237. -1.0619e+00, 3.3778e-01, 7.7228e-02],
  8238. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  8239. -1.5161e+00, 5.8660e-01, 8.0947e-03]]], device='cuda:0')
  8240. loss_train_step before backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  8241. loss_train_step after backward: tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward>)
  8242. loss_train: 0.3102681040763855
  8243. step: 6
  8244. running loss: 0.05171135067939758
  8245. Train Steps: 6/90 Loss: 0.0517 torch.Size([8, 600, 800])
  8246. torch.Size([8, 8])
  8247. tensor([[0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  8248. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  8249. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  8250. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  8251. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  8252. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050],
  8253. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  8254. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456]],
  8255. device='cuda:0', dtype=torch.float64)
  8256. predictions are: tensor([[ 1.0117, -0.1618, 1.9431, 0.1343, -0.5366, -0.3326, 0.7663, 0.1990],
  8257. [-1.0768, -1.5103, 0.9567, -1.3619, -0.3016, -1.6007, 0.2505, 0.2646],
  8258. [ 0.7019, -0.3086, 1.7838, -0.1395, -0.7029, -0.5296, 0.4112, 0.2605],
  8259. [-0.0792, -0.8122, 1.4107, -0.9500, -0.5097, -1.0802, 0.2752, 0.2552],
  8260. [ 0.5814, -0.4038, 1.4747, -1.1459, -0.5425, -0.5329, 0.7750, 0.2706],
  8261. [ 0.6678, -0.3636, 1.8524, -0.0345, -0.2189, -0.0571, 0.5808, 0.2862],
  8262. [ 0.3820, -0.5253, 1.6017, -1.1825, -0.3065, -1.0830, 0.6300, 0.2799],
  8263. [ 0.6951, -0.3400, 1.8050, -0.0378, -0.3050, 0.0485, 0.5817, 0.3112]],
  8264. device='cuda:0', grad_fn=<AddmmBackward>)
  8265. landmarks are: tensor([[[ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  8266. 0.0291],
  8267. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  8268. 0.2699],
  8269. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  8270. 0.4357],
  8271. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  8272. 0.2776],
  8273. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  8274. 0.1390],
  8275. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  8276. 0.0467],
  8277. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  8278. 0.3392],
  8279. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  8280. 0.2341]]], device='cuda:0')
  8281. loss_train_step before backward: tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward>)
  8282. loss_train_step after backward: tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward>)
  8283. loss_train: 0.37389400601387024
  8284. step: 7
  8285. running loss: 0.05341342943055289
  8286. Train Steps: 7/90 Loss: 0.0534 torch.Size([8, 600, 800])
  8287. torch.Size([8, 8])
  8288. tensor([[0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  8289. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  8290. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  8291. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  8292. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  8293. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  8294. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  8295. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413]],
  8296. device='cuda:0', dtype=torch.float64)
  8297. predictions are: tensor([[ 0.0096, -0.7602, 0.9648, -1.2757, -0.4615, -1.1769, 0.3001, 0.3017],
  8298. [ 0.2265, -0.6059, 1.3263, -1.2305, -0.4143, -1.1986, 0.5272, 0.2549],
  8299. [ 0.4254, -0.4732, 1.6860, 0.2153, -0.4557, -0.1081, 0.4277, 0.3285],
  8300. [ 0.9220, -0.1908, 1.9226, -0.0915, -0.6569, -0.3724, 0.5336, 0.1467],
  8301. [ 0.7344, -0.3511, 1.9044, 0.0650, -0.4269, 0.1083, 0.6133, 0.1700],
  8302. [ 0.4440, -0.4838, 1.4899, -0.6572, -0.6243, -0.7794, 0.3746, 0.2894],
  8303. [-0.5248, -1.0886, 1.2168, -1.2470, -0.2981, -1.0941, 0.3924, 0.3101],
  8304. [ 0.3848, -0.5339, 1.8826, -1.0373, 0.0069, -1.0555, 1.0492, 0.1640]],
  8305. device='cuda:0', grad_fn=<AddmmBackward>)
  8306. landmarks are: tensor([[[ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  8307. 0.3852],
  8308. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  8309. 0.2032],
  8310. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  8311. 0.4470],
  8312. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  8313. 0.1824],
  8314. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  8315. -0.0168],
  8316. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  8317. 0.4470],
  8318. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  8319. 0.2853],
  8320. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  8321. 0.2142]]], device='cuda:0')
  8322. loss_train_step before backward: tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward>)
  8323. loss_train_step after backward: tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward>)
  8324. loss_train: 0.43161700665950775
  8325. step: 8
  8326. running loss: 0.05395212583243847
  8327.  
  8328. Train Steps: 8/90 Loss: 0.0540 torch.Size([8, 600, 800])
  8329. torch.Size([8, 8])
  8330. tensor([[0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  8331. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  8332. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  8333. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  8334. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  8335. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  8336. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  8337. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567]],
  8338. device='cuda:0', dtype=torch.float64)
  8339. predictions are: tensor([[ 0.4623, -0.4913, 1.8371, 0.3857, -0.4122, 0.2493, 0.5271, 0.1908],
  8340. [ 0.6949, -0.3453, 1.8927, -0.5485, -0.4945, -0.7875, 0.6493, 0.1366],
  8341. [ 0.2863, -0.5883, 1.2984, -0.9925, -0.5895, -0.7914, 0.3332, 0.1886],
  8342. [-0.0663, -0.7860, 1.2408, -1.1712, -0.1767, -1.2552, 0.4436, 0.2503],
  8343. [ 0.0550, -0.7215, 1.0977, -1.0060, -0.5058, -1.0154, 0.3654, 0.2937],
  8344. [ 0.2194, -0.6018, 1.1889, -0.9221, -0.3864, -0.8253, 0.3989, 0.3544],
  8345. [ 0.7135, -0.3359, 2.0395, -0.5939, -0.1271, -0.8327, 0.9730, 0.1247],
  8346. [ 0.1684, -0.6724, 1.2012, -1.1064, -0.4767, -0.9897, 0.3972, 0.2452]],
  8347. device='cuda:0', grad_fn=<AddmmBackward>)
  8348. landmarks are: tensor([[[ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  8349. 0.2237],
  8350. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  8351. 0.2139],
  8352. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  8353. 0.0141],
  8354. [ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  8355. 0.2160],
  8356. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  8357. 0.2391],
  8358. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  8359. 0.5401],
  8360. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  8361. 0.2142],
  8362. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  8363. 0.2853]]], device='cuda:0')
  8364. loss_train_step before backward: tensor(0.0441, device='cuda:0', grad_fn=<MseLossBackward>)
  8365. loss_train_step after backward: tensor(0.0441, device='cuda:0', grad_fn=<MseLossBackward>)
  8366. loss_train: 0.4756833612918854
  8367. step: 9
  8368. running loss: 0.05285370681020948
  8369. Train Steps: 9/90 Loss: 0.0529 torch.Size([8, 600, 800])
  8370. torch.Size([8, 8])
  8371. tensor([[0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  8372. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  8373. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  8374. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  8375. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  8376. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  8377. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  8378. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702]],
  8379. device='cuda:0', dtype=torch.float64)
  8380. predictions are: tensor([[ 0.2563, -0.6047, 1.2636, -1.1187, -0.5007, -0.8370, 0.3980, 0.2478],
  8381. [ 0.4033, -0.5214, 1.6198, -0.9454, -0.4773, -0.9102, 0.5505, 0.2541],
  8382. [ 0.1984, -0.6554, 1.7125, 0.0773, -0.3777, -0.4354, 0.3894, 0.1948],
  8383. [ 0.6152, -0.3854, 1.7423, -0.4495, -0.5086, -0.2344, 0.5880, 0.1688],
  8384. [ 0.7010, -0.3407, 1.9443, -0.7245, -0.2994, -1.1247, 0.8264, 0.1196],
  8385. [ 0.2452, -0.5995, 1.1966, -1.1032, -0.5102, -0.7389, 0.3625, 0.2906],
  8386. [ 0.0631, -0.7514, 1.0383, -1.2927, -0.3640, -1.4295, 0.3175, 0.2634],
  8387. [ 0.5745, -0.3833, 1.5549, -0.1126, -0.4069, -0.2537, 0.5014, 0.2783]],
  8388. device='cuda:0', grad_fn=<AddmmBackward>)
  8389. landmarks are: tensor([[[ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  8390. 0.2237],
  8391. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  8392. 0.5624],
  8393. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  8394. 0.2391],
  8395. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  8396. 0.0985],
  8397. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  8398. 0.2890],
  8399. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  8400. 0.3546],
  8401. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  8402. 0.2930],
  8403. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  8404. 0.3478]]], device='cuda:0')
  8405. loss_train_step before backward: tensor(0.0468, device='cuda:0', grad_fn=<MseLossBackward>)
  8406. loss_train_step after backward: tensor(0.0468, device='cuda:0', grad_fn=<MseLossBackward>)
  8407. loss_train: 0.5225014016032219
  8408. step: 10
  8409. running loss: 0.05225014016032219
  8410. Train Steps: 10/90 Loss: 0.0523 torch.Size([8, 600, 800])
  8411. torch.Size([8, 8])
  8412. tensor([[0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  8413. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  8414. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  8415. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  8416. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  8417. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  8418. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  8419. [0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773]],
  8420. device='cuda:0', dtype=torch.float64)
  8421. predictions are: tensor([[-0.4314, -1.0916, 0.9281, -1.1852, -0.4754, -1.1881, 0.1755, 0.3128],
  8422. [ 0.6351, -0.3751, 1.7415, 0.0037, -0.3866, -0.0694, 0.4654, 0.1710],
  8423. [ 0.9734, -0.1112, 1.7456, -0.4610, -0.5858, -0.7201, 0.5528, 0.2130],
  8424. [ 0.7597, -0.2628, 1.6129, -0.4537, -0.5275, -0.2665, 0.4179, 0.2051],
  8425. [ 0.7301, -0.2926, 1.8193, -0.0412, -0.3160, 0.2844, 0.7483, 0.2097],
  8426. [-0.0348, -0.7843, 1.0376, -1.5226, -0.3714, -1.4824, 0.4634, 0.2735],
  8427. [ 0.3638, -0.5736, 1.8100, -0.7922, -0.3260, -1.3180, 0.7065, 0.1236],
  8428. [ 0.1663, -0.6514, 1.0272, -1.2652, -0.3324, -1.2683, 0.3238, 0.3170]],
  8429. device='cuda:0', grad_fn=<AddmmBackward>)
  8430. landmarks are: tensor([[[ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  8431. 0.4085],
  8432. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  8433. 0.0711],
  8434. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  8435. 0.3777],
  8436. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  8437. 0.3265],
  8438. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  8439. 0.3157],
  8440. [ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  8441. 0.3161],
  8442. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  8443. -0.0049],
  8444. [ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  8445. 0.3808]]], device='cuda:0')
  8446. loss_train_step before backward: tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward>)
  8447. loss_train_step after backward: tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward>)
  8448. loss_train: 0.5832267887890339
  8449. step: 11
  8450. running loss: 0.05302061716263944
  8451. Train Steps: 11/90 Loss: 0.0530 torch.Size([8, 600, 800])
  8452. torch.Size([8, 8])
  8453. tensor([[0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  8454. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  8455. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  8456. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  8457. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  8458. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  8459. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  8460. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540]],
  8461. device='cuda:0', dtype=torch.float64)
  8462. predictions are: tensor([[ 0.6115, -0.3336, 1.6059, -0.4732, -0.3632, 0.0570, 0.5158, 0.2598],
  8463. [ 0.6079, -0.3892, 1.4494, -0.0570, -0.6873, -0.5817, 0.3053, 0.2103],
  8464. [ 0.7655, -0.2788, 1.4467, -0.8692, -0.6469, -0.6972, 0.4732, 0.1591],
  8465. [ 0.3337, -0.5651, 1.4831, -0.1191, -0.5095, -0.3914, 0.3344, 0.2294],
  8466. [ 0.4696, -0.4529, 1.4901, 0.0385, -0.6042, -0.0918, 0.3001, 0.2966],
  8467. [ 0.6387, -0.3689, 1.6943, -1.0324, -0.1716, -1.3331, 0.7935, 0.1650],
  8468. [ 0.3009, -0.5571, 1.0399, -1.4437, -0.4154, -1.3370, 0.4036, 0.2582],
  8469. [-0.2349, -0.9462, 1.4178, -1.5820, 0.0318, -1.4545, 0.7773, 0.2556]],
  8470. device='cuda:0', grad_fn=<AddmmBackward>)
  8471. landmarks are: tensor([[[ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  8472. 0.2006],
  8473. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  8474. 0.1982],
  8475. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  8476. -0.0670],
  8477. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  8478. 0.1313],
  8479. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  8480. 0.5316],
  8481. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  8482. 0.2142],
  8483. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  8484. 0.1852],
  8485. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  8486. 0.2730]]], device='cuda:0')
  8487. loss_train_step before backward: tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward>)
  8488. loss_train_step after backward: tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward>)
  8489. loss_train: 0.6444090195000172
  8490. step: 12
  8491. running loss: 0.05370075162500143
  8492.  
  8493. Train Steps: 12/90 Loss: 0.0537 torch.Size([8, 600, 800])
  8494. torch.Size([8, 8])
  8495. tensor([[0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533],
  8496. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  8497. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  8498. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  8499. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  8500. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  8501. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  8502. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133]],
  8503. device='cuda:0', dtype=torch.float64)
  8504. predictions are: tensor([[ 0.3441, -0.5397, 1.5219, 0.0440, -0.4011, -0.1755, 0.2975, 0.2755],
  8505. [ 0.1604, -0.6528, 0.9091, -1.3186, -0.5518, -1.0986, 0.2071, 0.3260],
  8506. [ 0.6327, -0.3453, 1.3894, -0.7139, -0.6229, -0.6713, 0.3165, 0.2111],
  8507. [ 0.5513, -0.4404, 1.7052, -0.7359, -0.4866, -1.0530, 0.6075, 0.1834],
  8508. [ 0.4135, -0.5046, 1.4512, -0.8828, -0.2866, -0.9949, 0.6271, 0.1815],
  8509. [ 0.3910, -0.5328, 1.3725, -1.4320, -0.0645, -1.5060, 0.8007, 0.2209],
  8510. [ 0.7513, -0.2595, 1.5456, -0.0458, -0.5058, -0.1437, 0.5182, 0.2074],
  8511. [ 0.5279, -0.4191, 1.5979, -0.1190, -0.4333, -0.1138, 0.4706, 0.2032]],
  8512. device='cuda:0', grad_fn=<AddmmBackward>)
  8513. landmarks are: tensor([[[ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  8514. 0.2699],
  8515. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  8516. 0.2476],
  8517. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  8518. -0.1151],
  8519. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  8520. 0.1390],
  8521. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  8522. 0.1821],
  8523. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  8524. 0.1020],
  8525. [ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  8526. 0.1447],
  8527. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  8528. 0.0851]]], device='cuda:0')
  8529. loss_train_step before backward: tensor(0.0372, device='cuda:0', grad_fn=<MseLossBackward>)
  8530. loss_train_step after backward: tensor(0.0372, device='cuda:0', grad_fn=<MseLossBackward>)
  8531. loss_train: 0.6816200353205204
  8532. step: 13
  8533. running loss: 0.0524323104092708
  8534. Train Steps: 13/90 Loss: 0.0524 torch.Size([8, 600, 800])
  8535. torch.Size([8, 8])
  8536. tensor([[0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  8537. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  8538. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  8539. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  8540. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  8541. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  8542. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  8543. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350]],
  8544. device='cuda:0', dtype=torch.float64)
  8545. predictions are: tensor([[ 0.6906, -0.3250, 1.7244, 0.2441, -0.6534, -0.5400, 0.4928, 0.0983],
  8546. [ 0.7984, -0.2507, 1.3635, -0.5323, -0.6371, -0.7391, 0.3126, 0.2900],
  8547. [ 0.6796, -0.2984, 1.4948, -1.3600, -0.1548, -1.2440, 0.7837, 0.1997],
  8548. [ 0.6440, -0.3274, 1.0033, -1.1558, -0.4957, -1.1206, 0.3775, 0.2980],
  8549. [-0.6363, -1.1912, 0.9427, -1.3059, -0.3338, -1.3175, 0.2988, 0.2964],
  8550. [ 0.5409, -0.4155, 1.6573, 0.1337, -0.2963, 0.1204, 0.4237, 0.1673],
  8551. [ 0.4925, -0.4208, 1.6593, -0.0255, -0.3210, 0.0899, 0.5519, 0.1780],
  8552. [ 0.5728, -0.3631, 1.1779, -1.0559, -0.3516, -1.1277, 0.5243, 0.2186]],
  8553. device='cuda:0', grad_fn=<AddmmBackward>)
  8554. landmarks are: tensor([[[ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  8555. -0.0957],
  8556. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  8557. 0.4470],
  8558. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  8559. -0.0369],
  8560. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  8561. 0.3392],
  8562. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  8563. 0.3084],
  8564. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  8565. 0.0082],
  8566. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  8567. 0.1474],
  8568. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  8569. 0.1852]]], device='cuda:0')
  8570. loss_train_step before backward: tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward>)
  8571. loss_train_step after backward: tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward>)
  8572. loss_train: 0.7540136612951756
  8573. step: 14
  8574. running loss: 0.053858118663941114
  8575. Train Steps: 14/90 Loss: 0.0539 torch.Size([8, 600, 800])
  8576. torch.Size([8, 8])
  8577. tensor([[0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  8578. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  8579. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  8580. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  8581. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  8582. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  8583. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  8584. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402]],
  8585. device='cuda:0', dtype=torch.float64)
  8586. predictions are: tensor([[ 3.8594e-01, -4.9731e-01, 1.3426e+00, -7.9972e-01, -5.6520e-01,
  8587. -5.4576e-01, 5.2629e-01, 1.8728e-01],
  8588. [ 4.3697e-01, -4.5928e-01, 1.3931e+00, -5.5027e-01, -4.7881e-01,
  8589. -1.3916e-01, 3.5979e-01, 2.4473e-01],
  8590. [ 8.3286e-01, -2.0214e-01, 1.5449e+00, -3.9255e-01, -5.2480e-01,
  8591. -7.8448e-01, 4.5361e-01, 2.3245e-01],
  8592. [ 5.0168e-01, -4.3097e-01, 1.3078e+00, -9.1020e-01, -5.8755e-01,
  8593. -6.2334e-01, 5.8320e-01, 1.7699e-01],
  8594. [ 7.1887e-01, -3.1333e-01, 1.5627e+00, -1.1709e+00, -4.1819e-04,
  8595. -1.5454e+00, 8.5491e-01, 2.0092e-01],
  8596. [ 4.4513e-01, -4.4595e-01, 1.5378e+00, -2.1944e-01, -4.1386e-01,
  8597. -3.5445e-01, 3.4656e-01, 1.7412e-01],
  8598. [ 6.1162e-01, -3.6164e-01, 1.5413e+00, -1.8645e-01, -4.5866e-01,
  8599. -7.5103e-01, 3.8984e-01, 2.1871e-01],
  8600. [ 2.9098e-01, -5.9695e-01, 1.4410e+00, 1.1175e-01, -3.4529e-01,
  8601. -4.0318e-01, 3.0012e-01, 1.9724e-01]], device='cuda:0',
  8602. grad_fn=<AddmmBackward>)
  8603. landmarks are: tensor([[[ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  8604. 0.2391],
  8605. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  8606. 0.3148],
  8607. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  8608. 0.3777],
  8609. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  8610. 0.1576],
  8611. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  8612. 0.1501],
  8613. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  8614. 0.1439],
  8615. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  8616. 0.2545],
  8617. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  8618. 0.2091]]], device='cuda:0')
  8619. loss_train_step before backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  8620. loss_train_step after backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  8621. loss_train: 0.7785959504544735
  8622. step: 15
  8623. running loss: 0.0519063966969649
  8624. Train Steps: 15/90 Loss: 0.0519 torch.Size([8, 600, 800])
  8625. torch.Size([8, 8])
  8626. tensor([[0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  8627. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  8628. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  8629. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  8630. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  8631. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  8632. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  8633. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183]],
  8634. device='cuda:0', dtype=torch.float64)
  8635. predictions are: tensor([[ 0.3495, -0.5137, 1.2867, -0.7977, -0.5919, -0.4932, 0.3754, 0.2001],
  8636. [ 0.7947, -0.2719, 1.7608, -0.7762, -0.0301, -1.4611, 0.8805, 0.1307],
  8637. [ 0.0306, -0.7537, 1.0149, -1.0745, -0.5246, -0.9820, 0.2472, 0.2447],
  8638. [ 0.6324, -0.3694, 1.6234, 0.0647, -0.5520, -0.8712, 0.4582, 0.1424],
  8639. [ 0.7833, -0.2346, 1.5707, -0.3463, -0.3770, 0.0528, 0.5279, 0.2255],
  8640. [ 0.7305, -0.2862, 1.5712, 0.0126, -0.2571, 0.0699, 0.4072, 0.2189],
  8641. [ 0.4863, -0.4808, 1.5423, 0.0540, -0.5026, -0.2989, 0.2758, 0.1930],
  8642. [ 0.5454, -0.4141, 1.3707, -0.7669, -0.4660, -0.6807, 0.5137, 0.2013]],
  8643. device='cuda:0', grad_fn=<AddmmBackward>)
  8644. landmarks are: tensor([[[ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  8645. 0.0351],
  8646. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  8647. 0.2142],
  8648. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  8649. 0.0442],
  8650. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  8651. -0.0957],
  8652. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  8653. 0.2622],
  8654. [ 0.5450, -0.4706, 1.7643, 0.0722, -0.3708, 0.3200, 0.4854,
  8655. 0.0612],
  8656. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  8657. 0.0919],
  8658. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  8659. 0.1080]]], device='cuda:0')
  8660. loss_train_step before backward: tensor(0.0321, device='cuda:0', grad_fn=<MseLossBackward>)
  8661. loss_train_step after backward: tensor(0.0321, device='cuda:0', grad_fn=<MseLossBackward>)
  8662. loss_train: 0.8107367865741253
  8663. step: 16
  8664. running loss: 0.05067104916088283
  8665.  
  8666. Train Steps: 16/90 Loss: 0.0507 torch.Size([8, 600, 800])
  8667. torch.Size([8, 8])
  8668. tensor([[0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  8669. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  8670. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  8671. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  8672. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  8673. [0.6087, 0.3951, 0.8387, 0.5833, 0.4188, 0.4933, 0.5146, 0.4830],
  8674. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  8675. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617]],
  8676. device='cuda:0', dtype=torch.float64)
  8677. predictions are: tensor([[ 0.6864, -0.3161, 1.3957, -0.8741, -0.6393, -0.4115, 0.5721, 0.1944],
  8678. [ 0.6869, -0.2809, 1.5808, 0.1829, -0.1508, -0.4284, 0.3990, 0.2674],
  8679. [ 1.0103, -0.1350, 1.8808, -0.1997, -0.6168, -0.1198, 0.6180, 0.0456],
  8680. [ 0.4554, -0.4768, 1.7386, -0.1356, -0.2300, -0.1834, 0.4971, 0.1328],
  8681. [ 0.2051, -0.6472, 1.1485, -1.0484, -0.5905, -0.9150, 0.3315, 0.1749],
  8682. [ 0.6647, -0.3565, 1.6234, 0.2364, -0.4079, -0.3115, 0.3650, 0.1571],
  8683. [ 0.0915, -0.7536, 0.9806, -1.4417, -0.3319, -1.7779, 0.4103, 0.1761],
  8684. [ 0.6232, -0.3394, 1.5547, 0.1898, -0.2631, -0.2693, 0.3681, 0.2310]],
  8685. device='cuda:0', grad_fn=<AddmmBackward>)
  8686. landmarks are: tensor([[[ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  8687. 0.2776],
  8688. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  8689. 0.4547],
  8690. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  8691. -0.0490],
  8692. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  8693. 0.2622],
  8694. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  8695. 0.0442],
  8696. [ 0.5258, -0.4610, 1.5882, 0.4085, -0.3517, -0.0072, 0.0910,
  8697. -0.0550],
  8698. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  8699. 0.1253],
  8700. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  8701. 0.3084]]], device='cuda:0')
  8702. loss_train_step before backward: tensor(0.0270, device='cuda:0', grad_fn=<MseLossBackward>)
  8703. loss_train_step after backward: tensor(0.0270, device='cuda:0', grad_fn=<MseLossBackward>)
  8704. loss_train: 0.8377538155764341
  8705. step: 17
  8706. running loss: 0.04927963621037848
  8707. Train Steps: 17/90 Loss: 0.0493 torch.Size([8, 600, 800])
  8708. torch.Size([8, 8])
  8709. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  8710. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993],
  8711. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  8712. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  8713. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  8714. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  8715. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  8716. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153]],
  8717. device='cuda:0', dtype=torch.float64)
  8718. predictions are: tensor([[ 0.4288, -0.4854, 1.6467, 0.1719, -0.4551, 0.0582, 0.4286, 0.1805],
  8719. [ 0.5306, -0.4610, 0.9986, -1.3014, -0.4066, -1.3574, 0.3123, 0.1790],
  8720. [ 0.7175, -0.2925, 1.6305, -0.1981, -0.5236, -0.6448, 0.4414, 0.1654],
  8721. [ 0.5649, -0.4179, 1.0909, -1.1380, -0.4752, -1.0641, 0.3576, 0.1617],
  8722. [ 0.4000, -0.5173, 1.6446, 0.3024, -0.3259, -0.0621, 0.4557, 0.1149],
  8723. [ 0.5420, -0.4195, 1.7541, 0.0212, -0.4687, -0.2140, 0.5426, 0.1165],
  8724. [ 0.5727, -0.4093, 1.5485, -0.5428, -0.4685, -0.9696, 0.3440, 0.1536],
  8725. [ 0.6472, -0.3293, 1.6709, 0.1153, -0.1787, 0.1713, 0.4548, 0.1555]],
  8726. device='cuda:0', grad_fn=<AddmmBackward>)
  8727. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  8728. 0.5239],
  8729. [ 0.5384, -0.4393, 0.9762, -1.1851, -0.4210, -1.3852, 0.1712,
  8730. 0.0201],
  8731. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  8732. 0.2699],
  8733. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  8734. 0.0802],
  8735. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  8736. 0.1313],
  8737. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  8738. 0.1499],
  8739. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  8740. 0.0021],
  8741. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  8742. 0.0942]]], device='cuda:0')
  8743. loss_train_step before backward: tensor(0.0131, device='cuda:0', grad_fn=<MseLossBackward>)
  8744. loss_train_step after backward: tensor(0.0131, device='cuda:0', grad_fn=<MseLossBackward>)
  8745. loss_train: 0.8508864175528288
  8746. step: 18
  8747. running loss: 0.04727146764182382
  8748. Train Steps: 18/90 Loss: 0.0473 torch.Size([8, 600, 800])
  8749. torch.Size([8, 8])
  8750. tensor([[0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  8751. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  8752. [0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  8753. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  8754. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  8755. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  8756. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  8757. [0.6275, 0.4157, 0.8337, 0.5800, 0.3763, 0.4200, 0.5547, 0.6125]],
  8758. device='cuda:0', dtype=torch.float64)
  8759. predictions are: tensor([[ 0.4882, -0.4754, 1.3462, -1.0380, -0.4194, -1.2863, 0.3462, 0.1151],
  8760. [ 0.6720, -0.3324, 1.6458, -0.4131, -0.3798, -1.0912, 0.4214, 0.1275],
  8761. [ 0.5824, -0.3736, 1.5879, -0.6035, -0.3317, 0.1944, 0.6438, 0.1732],
  8762. [ 0.5314, -0.4397, 1.4854, -0.0471, -0.4339, -0.2989, 0.4611, 0.1603],
  8763. [ 0.3135, -0.5562, 1.6645, 0.0351, -0.2306, 0.0211, 0.3456, 0.1590],
  8764. [ 0.6142, -0.3721, 1.6466, 0.2753, -0.4500, -0.0996, 0.4397, 0.0354],
  8765. [ 0.5489, -0.4391, 1.4079, -0.5499, -0.6380, -0.7958, 0.2248, 0.2013],
  8766. [ 0.6976, -0.3084, 1.5207, 0.3261, -0.4993, -0.1174, 0.3380, 0.2032]],
  8767. device='cuda:0', grad_fn=<AddmmBackward>)
  8768. landmarks are: tensor([[[ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  8769. 0.0111],
  8770. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  8771. 0.1929],
  8772. [ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  8773. 0.2966],
  8774. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  8775. 0.3745],
  8776. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  8777. 0.1146],
  8778. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  8779. -0.0049],
  8780. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  8781. 0.4374],
  8782. [ 0.6124, -0.3658, 1.5651, 0.3931, -0.5480, -0.3460, 0.2761,
  8783. 0.5431]]], device='cuda:0')
  8784. loss_train_step before backward: tensor(0.0252, device='cuda:0', grad_fn=<MseLossBackward>)
  8785. loss_train_step after backward: tensor(0.0252, device='cuda:0', grad_fn=<MseLossBackward>)
  8786. loss_train: 0.8761011473834515
  8787. step: 19
  8788. running loss: 0.046110586704392185
  8789. Train Steps: 19/90 Loss: 0.0461 torch.Size([8, 600, 800])
  8790. torch.Size([8, 8])
  8791. tensor([[0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  8792. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  8793. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  8794. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  8795. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  8796. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  8797. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  8798. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834]],
  8799. device='cuda:0', dtype=torch.float64)
  8800. predictions are: tensor([[ 0.7217, -0.2845, 1.9075, 0.2389, -0.2370, 0.5157, 0.5562, 0.1797],
  8801. [ 0.6534, -0.3390, 1.8560, 0.8615, -0.4630, 0.5337, 0.4289, 0.1413],
  8802. [ 0.4276, -0.5171, 1.1000, -0.8050, -0.5874, -1.0325, 0.1186, 0.1669],
  8803. [ 0.5049, -0.4677, 1.8860, 0.3048, -0.2772, 0.1354, 0.3989, 0.0883],
  8804. [ 0.4303, -0.5046, 1.0362, -0.7526, -0.5927, -0.9086, 0.1313, 0.2303],
  8805. [ 0.2386, -0.6472, 1.1012, -0.9978, -0.3905, -1.3685, 0.2712, 0.1517],
  8806. [ 0.6727, -0.3058, 1.6422, -0.0121, -0.6491, -0.0651, 0.3661, 0.1395],
  8807. [ 0.7852, -0.3123, 1.5772, -0.9977, -0.1710, -1.3506, 0.8036, 0.0506]],
  8808. device='cuda:0', grad_fn=<AddmmBackward>)
  8809. landmarks are: tensor([[[ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  8810. 0.4316],
  8811. [ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  8812. 0.3315],
  8813. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  8814. 0.1890],
  8815. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  8816. 0.0051],
  8817. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  8818. 0.3546],
  8819. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  8820. 0.1253],
  8821. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  8822. 0.2930],
  8823. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  8824. -0.0530]]], device='cuda:0')
  8825. loss_train_step before backward: tensor(0.0413, device='cuda:0', grad_fn=<MseLossBackward>)
  8826.  
  8827. loss_train_step after backward: tensor(0.0413, device='cuda:0', grad_fn=<MseLossBackward>)
  8828. loss_train: 0.9173775799572468
  8829. step: 20
  8830. running loss: 0.045868878997862336
  8831. Train Steps: 20/90 Loss: 0.0459 torch.Size([8, 600, 800])
  8832. torch.Size([8, 8])
  8833. tensor([[0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  8834. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  8835. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  8836. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  8837. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  8838. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  8839. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  8840. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999]],
  8841. device='cuda:0', dtype=torch.float64)
  8842. predictions are: tensor([[ 0.7893, -0.2475, 1.7366, 0.2809, -0.4846, 0.0459, 0.5071, 0.1226],
  8843. [ 0.5180, -0.4447, 1.6718, 0.4874, -0.3442, 0.0526, 0.3643, 0.1179],
  8844. [ 1.0198, -0.1212, 1.6432, -0.3591, -0.6406, -0.6661, 0.2950, 0.1079],
  8845. [ 0.9893, -0.1316, 1.7666, 0.0423, -0.4163, 0.3851, 0.7108, 0.1294],
  8846. [-0.4476, -1.0955, 1.0936, -1.0599, -0.2677, -1.2739, 0.2665, 0.2393],
  8847. [ 1.0255, -0.0901, 1.7566, -0.0326, -0.5185, -0.2372, 0.4457, 0.1847],
  8848. [ 0.7385, -0.2714, 1.6558, 0.0937, -0.4627, 0.0625, 0.1644, 0.1464],
  8849. [-0.2213, -0.9596, 1.1754, -1.1070, -0.3095, -1.3147, 0.2532, 0.1814]],
  8850. device='cuda:0', grad_fn=<AddmmBackward>)
  8851. landmarks are: tensor([[[ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  8852. 0.1779],
  8853. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  8854. 0.1979],
  8855. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  8856. -0.0340],
  8857. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  8858. 0.1715],
  8859. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  8860. 0.3084],
  8861. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  8862. 0.3238],
  8863. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  8864. 0.0893],
  8865. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  8866. 0.0231]]], device='cuda:0')
  8867. loss_train_step before backward: tensor(0.2049, device='cuda:0', grad_fn=<MseLossBackward>)
  8868. loss_train_step after backward: tensor(0.2049, device='cuda:0', grad_fn=<MseLossBackward>)
  8869. loss_train: 1.122323576360941
  8870. step: 21
  8871. running loss: 0.05344397982671147
  8872. Train Steps: 21/90 Loss: 0.0534 torch.Size([8, 600, 800])
  8873. torch.Size([8, 8])
  8874. tensor([[0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  8875. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  8876. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  8877. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  8878. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  8879. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  8880. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  8881. [ nan, nan, 0.7412, 0.2200, 0.4450, 0.1517, 0.5312, 0.4983]],
  8882. device='cuda:0', dtype=torch.float64)
  8883. predictions are: tensor([[ 0.8088, -0.2508, 1.7559, 0.1688, -0.2472, 0.3217, 0.4909, 0.2069],
  8884. [ 0.9829, -0.1435, 1.6416, -0.8073, -0.1479, -1.0794, 0.5959, 0.1515],
  8885. [ 0.8976, -0.1853, 1.6383, -0.2905, -0.5018, 0.1907, 0.5584, 0.1761],
  8886. [ 0.5843, -0.3556, 1.3610, -0.4377, -0.6175, -0.2176, 0.2037, 0.2051],
  8887. [ 0.6115, -0.3894, 1.6423, -0.0639, -0.6122, -0.2054, 0.3690, 0.0912],
  8888. [ 0.8306, -0.2088, 1.6910, 0.3271, -0.6185, -0.2251, 0.2638, 0.2357],
  8889. [ 0.4336, -0.5279, 1.7140, 0.4916, -0.5995, -0.3352, 0.2393, 0.1133],
  8890. [-0.9037, -1.4468, 1.1021, -1.1638, -0.2849, -1.4912, 0.2202, 0.1359]],
  8891. device='cuda:0', grad_fn=<AddmmBackward>)
  8892. landmarks are: tensor([[[ 5.9873e-01, -3.8522e-01, 1.7326e+00, -3.0331e-02, -1.4965e-01,
  8893. 2.6220e-01, 5.3164e-01, 1.2363e-01],
  8894. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  8895. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  8896. [ 6.0098e-01, -3.8961e-01, 1.7326e+00, -5.6921e-01, -6.2887e-01,
  8897. 8.1601e-03, 5.0277e-01, 1.0054e-01],
  8898. [ 5.0762e-01, -4.4426e-01, 1.2337e+00, -5.0235e-01, -6.8083e-01,
  8899. -3.6135e-01, 8.6614e-02, 2.3862e-01],
  8900. [ 5.6692e-01, -4.7937e-01, 1.7499e+00, -3.3826e-01, -6.7506e-01,
  8901. -4.2294e-01, 4.9700e-01, -6.1124e-02],
  8902. [ 5.9024e-01, -3.4927e-01, 1.7961e+00, -7.2363e-03, -5.9423e-01,
  8903. -5.6151e-01, 3.1801e-01, 3.1609e-01],
  8904. [ 5.3788e-01, -4.3580e-01, 1.7326e+00, 1.8522e-01, -6.0577e-01,
  8905. -5.4611e-01, 6.8408e-02, -3.0981e-02],
  8906. [-2.2859e+00, -2.2859e+00, 1.1379e+00, -1.2697e+00, -2.3048e-01,
  8907. -1.5854e+00, 1.6790e-01, 1.5858e-02]]], device='cuda:0')
  8908. loss_train_step before backward: tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward>)
  8909. loss_train_step after backward: tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward>)
  8910. loss_train: 1.1902863197028637
  8911. step: 22
  8912. running loss: 0.05410392362285744
  8913. Train Steps: 22/90 Loss: 0.0541 torch.Size([8, 600, 800])
  8914. torch.Size([8, 8])
  8915. tensor([[0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  8916. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  8917. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  8918. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  8919. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  8920. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  8921. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  8922. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383]],
  8923. device='cuda:0', dtype=torch.float64)
  8924. predictions are: tensor([[ 0.5841, -0.4228, 1.7081, -0.6441, -0.2441, -1.1153, 0.5499, 0.0982],
  8925. [ 0.4278, -0.5337, 1.6374, -0.0478, -0.6051, -0.2112, 0.1915, 0.1604],
  8926. [ 0.6027, -0.4234, 1.2634, -0.8264, -0.6503, -0.8771, 0.4061, 0.1357],
  8927. [ 0.4495, -0.5041, 1.4335, 0.1495, -0.5340, -0.1502, 0.3682, 0.2350],
  8928. [ 0.5330, -0.4750, 1.5403, -0.4251, -0.6036, -0.9126, 0.1916, 0.1295],
  8929. [ 0.4893, -0.4719, 1.7569, 0.1496, -0.3485, 0.2388, 0.4058, 0.1906],
  8930. [ 0.4003, -0.5475, 1.7447, -0.0725, -0.2012, -0.1510, 0.3865, 0.1682],
  8931. [ 0.4466, -0.5168, 1.7576, 0.0200, -0.3755, 0.2759, 0.4909, 0.1671]],
  8932. device='cuda:0', grad_fn=<AddmmBackward>)
  8933. landmarks are: tensor([[[ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  8934. 0.0051],
  8935. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  8936. 0.3087],
  8937. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  8938. 0.1779],
  8939. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  8940. 0.3585],
  8941. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  8942. 0.1494],
  8943. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  8944. 0.0622],
  8945. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  8946. 0.2776],
  8947. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  8948. 0.2006]]], device='cuda:0')
  8949. loss_train_step before backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  8950. loss_train_step after backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  8951. loss_train: 1.2187356799840927
  8952. step: 23
  8953. running loss: 0.05298850782539533
  8954. Train Steps: 23/90 Loss: 0.0530 torch.Size([8, 600, 800])
  8955. torch.Size([8, 8])
  8956. tensor([[0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  8957. [0.6203, 0.4078, 0.8800, 0.5083, 0.3900, 0.5000, 0.6100, 0.5583],
  8958. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  8959. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  8960. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  8961. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  8962. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  8963. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667]],
  8964. device='cuda:0', dtype=torch.float64)
  8965. predictions are: tensor([[ 0.6472, -0.3689, 1.6346, -0.8492, -0.3853, -0.9779, 0.5521, 0.1281],
  8966. [ 0.3331, -0.6111, 1.7036, 0.2330, -0.5683, 0.1859, 0.3486, 0.1685],
  8967. [ 0.6470, -0.3728, 1.4712, -1.0258, -0.3932, -1.1447, 0.4923, 0.0939],
  8968. [ 0.5844, -0.4290, 1.7303, -0.4750, -0.4808, -0.8322, 0.4734, 0.1240],
  8969. [ 0.2903, -0.6353, 1.5557, 0.3560, -0.3045, 0.0172, 0.2414, 0.2126],
  8970. [ 0.2699, -0.6419, 1.6350, 0.2703, -0.4484, 0.1321, 0.2392, 0.1861],
  8971. [ 0.1457, -0.7198, 1.6238, -0.0021, -0.3622, 0.0578, 0.3708, 0.1807],
  8972. [ 0.7875, -0.2717, 1.6199, -0.5207, -0.6258, -0.5832, 0.3459, 0.1732]],
  8973. device='cuda:0', grad_fn=<AddmmBackward>)
  8974. landmarks are: tensor([[[ 6.0837e-01, -4.0762e-01, 1.6806e+00, -9.6182e-01, -2.9977e-01,
  8975. -9.6952e-01, 6.3557e-01, 1.4673e-01],
  8976. [ 5.7939e-01, -4.0231e-01, 1.7788e+00, 6.2048e-02, -4.8453e-01,
  8977. 2.3557e-02, 5.3164e-01, 2.9299e-01],
  8978. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  8979. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  8980. [ 6.0918e-01, -3.9130e-01, 1.8423e+00, -5.9230e-01, -4.2679e-01,
  8981. -9.7721e-01, 6.1247e-01, 1.0824e-01],
  8982. [ 5.6195e-01, -4.3457e-01, 1.6691e+00, 3.3149e-01, -2.5935e-01,
  8983. -7.2363e-03, 2.8915e-01, 2.8530e-01],
  8984. [ 5.4821e-01, -3.8414e-01, 1.7326e+00, 1.0054e-01, -3.5173e-01,
  8985. 6.2048e-02, 9.1240e-02, 2.5215e-01],
  8986. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  8987. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  8988. [ 5.7829e-01, -3.9330e-01, 1.6748e+00, -6.1540e-01, -5.7691e-01,
  8989. -6.4619e-01, 4.7968e-01, 3.3149e-01]]], device='cuda:0')
  8990. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  8991.  
  8992. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  8993. loss_train: 1.2390678264200687
  8994. step: 24
  8995. running loss: 0.051627826100836195
  8996. Train Steps: 24/90 Loss: 0.0516 torch.Size([8, 600, 800])
  8997. torch.Size([8, 8])
  8998. tensor([[0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  8999. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  9000. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  9001. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  9002. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  9003. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  9004. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  9005. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395]],
  9006. device='cuda:0', dtype=torch.float64)
  9007. predictions are: tensor([[ 0.1949, -0.6706, 1.7265, 0.0499, -0.5140, -0.1403, 0.4085, 0.2467],
  9008. [ 0.7997, -0.3032, 1.3810, -1.0131, -0.5489, -0.8264, 0.3527, 0.1973],
  9009. [ 0.3795, -0.5790, 1.7047, -0.0913, -0.1195, -0.1106, 0.3014, 0.1788],
  9010. [ 0.8255, -0.2797, 1.6323, -0.6465, -0.6656, -0.5635, 0.3617, 0.1430],
  9011. [ 0.2209, -0.6711, 1.5705, -0.1209, -0.6546, -0.3792, 0.2130, 0.2171],
  9012. [ 0.3898, -0.5788, 1.8787, -0.3252, -0.2116, -0.8951, 0.6498, 0.0578],
  9013. [ 0.4747, -0.5116, 1.7857, -0.2169, -0.2496, 0.1502, 0.5376, 0.1775],
  9014. [ 0.3268, -0.6048, 1.6250, 0.1335, -0.5727, -0.5164, 0.2695, 0.1240]],
  9015. device='cuda:0', grad_fn=<AddmmBackward>)
  9016. landmarks are: tensor([[[ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  9017. 0.3623],
  9018. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  9019. 0.2853],
  9020. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  9021. 0.0532],
  9022. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  9023. 0.1753],
  9024. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  9025. 0.4357],
  9026. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  9027. 0.2142],
  9028. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  9029. 0.2699],
  9030. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  9031. 0.2058]]], device='cuda:0')
  9032. loss_train_step before backward: tensor(0.0248, device='cuda:0', grad_fn=<MseLossBackward>)
  9033. loss_train_step after backward: tensor(0.0248, device='cuda:0', grad_fn=<MseLossBackward>)
  9034. loss_train: 1.2638748027384281
  9035. step: 25
  9036. running loss: 0.05055499210953712
  9037. Train Steps: 25/90 Loss: 0.0506 torch.Size([8, 600, 800])
  9038. torch.Size([8, 8])
  9039. tensor([[0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  9040. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  9041. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  9042. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  9043. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  9044. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  9045. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  9046. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633]],
  9047. device='cuda:0', dtype=torch.float64)
  9048. predictions are: tensor([[ 0.7765, -0.3130, 1.6100, -0.5837, -0.6955, -0.3657, 0.2162, 0.2099],
  9049. [-1.2546, -1.6816, 1.0257, -1.0399, -0.3609, -1.2230, 0.1650, 0.1903],
  9050. [ 0.6993, -0.4141, 1.8532, 0.5163, -0.5222, 0.1399, 0.4955, 0.1509],
  9051. [ 0.7386, -0.3365, 1.8392, 0.0971, -0.3573, 0.2887, 0.4597, 0.2088],
  9052. [ 0.6512, -0.3750, 1.5533, -0.6460, -0.5720, -0.5968, 0.2478, 0.2290],
  9053. [ 0.5814, -0.4463, 1.8323, 0.1737, -0.6186, -0.1798, 0.2413, 0.1486],
  9054. [ 0.5449, -0.4473, 1.8061, -0.7797, -0.1826, -0.8444, 0.7036, 0.1541],
  9055. [ 0.8164, -0.3197, 1.7249, -0.7490, -0.1492, -1.0003, 0.7974, 0.0999]],
  9056. device='cuda:0', grad_fn=<AddmmBackward>)
  9057. landmarks are: tensor([[[ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  9058. 0.2776],
  9059. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  9060. 0.2699],
  9061. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  9062. 0.0261],
  9063. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  9064. 0.2391],
  9065. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  9066. 0.3392],
  9067. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  9068. 0.1824],
  9069. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  9070. 0.2944],
  9071. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  9072. 0.3157]]], device='cuda:0')
  9073. loss_train_step before backward: tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward>)
  9074. loss_train_step after backward: tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward>)
  9075. loss_train: 1.3201934099197388
  9076. step: 26
  9077. running loss: 0.05077666961229765
  9078. Train Steps: 26/90 Loss: 0.0508 torch.Size([8, 600, 800])
  9079. torch.Size([8, 8])
  9080. tensor([[0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  9081. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  9082. [0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  9083. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  9084. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  9085. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  9086. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  9087. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494]],
  9088. device='cuda:0', dtype=torch.float64)
  9089. predictions are: tensor([[ 0.4843, -0.4923, 1.8988, -0.3992, -0.2177, 0.0468, 0.5391, 0.2222],
  9090. [ 0.4154, -0.5881, 1.2895, -1.1669, -0.4763, -1.3328, 0.2543, 0.1306],
  9091. [ 0.4518, -0.5199, 1.7362, 0.0782, -0.4067, -0.2372, 0.3323, 0.2551],
  9092. [ 0.5852, -0.4918, 1.9120, -0.1694, -0.4795, 0.0024, 0.5392, 0.1263],
  9093. [ 0.6552, -0.4101, 1.8002, 0.1895, -0.3935, -0.2230, 0.4755, 0.2813],
  9094. [ 0.5180, -0.4848, 1.8587, 0.0052, -0.4058, 0.0462, 0.3925, 0.1988],
  9095. [ 0.1950, -0.6670, 1.2533, -1.3154, -0.4737, -1.2690, 0.4056, 0.1900],
  9096. [ 0.2802, -0.6517, 1.8728, -0.1009, -0.4746, -0.4945, 0.5519, 0.1651]],
  9097. device='cuda:0', grad_fn=<AddmmBackward>)
  9098. landmarks are: tensor([[[ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  9099. 0.3007],
  9100. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  9101. 0.0774],
  9102. [ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  9103. 0.3238],
  9104. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  9105. 0.0663],
  9106. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  9107. 0.4624],
  9108. [ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  9109. 0.2522],
  9110. [ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  9111. 0.3161],
  9112. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  9113. 0.2516]]], device='cuda:0')
  9114. loss_train_step before backward: tensor(0.0273, device='cuda:0', grad_fn=<MseLossBackward>)
  9115. loss_train_step after backward: tensor(0.0273, device='cuda:0', grad_fn=<MseLossBackward>)
  9116. loss_train: 1.3474591448903084
  9117. step: 27
  9118. running loss: 0.049905894255196606
  9119. Train Steps: 27/90 Loss: 0.0499 torch.Size([8, 600, 800])
  9120. torch.Size([8, 8])
  9121. tensor([[0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  9122. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  9123. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  9124. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  9125. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  9126. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  9127. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  9128. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600]],
  9129. device='cuda:0', dtype=torch.float64)
  9130. predictions are: tensor([[ 0.4047, -0.5641, 1.8557, -0.3915, -0.3121, 0.0780, 0.5668, 0.2369],
  9131. [ 0.5390, -0.4681, 1.7114, -0.0121, -0.5081, -0.2583, 0.4403, 0.2166],
  9132. [ 0.3382, -0.6112, 1.8243, -0.2912, -0.6956, -0.5718, 0.3748, 0.1359],
  9133. [ 0.1285, -0.7148, 1.7671, -0.9421, -0.1662, -1.1593, 0.6499, 0.1509],
  9134. [ 0.5752, -0.4616, 1.7676, -0.2336, -0.2807, -0.1014, 0.4329, 0.2863],
  9135. [ 0.3819, -0.5542, 1.1212, -1.1021, -0.6073, -1.2107, 0.3160, 0.2424],
  9136. [ 0.5454, -0.4809, 1.7989, -0.1910, -0.1672, -0.2807, 0.4104, 0.2157],
  9137. [ 0.6235, -0.4284, 1.7667, 0.0837, -0.4849, -0.0909, 0.5290, 0.3062]],
  9138. device='cuda:0', grad_fn=<AddmmBackward>)
  9139. landmarks are: tensor([[[ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  9140. 0.2699],
  9141. [ 0.5891, -0.4550, 1.5132, 0.3546, -0.3691, -0.1535, 0.3815,
  9142. 0.1467],
  9143. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  9144. 0.1824],
  9145. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  9146. 0.1501],
  9147. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  9148. 0.4171],
  9149. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  9150. 0.2391],
  9151. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  9152. 0.2026],
  9153. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  9154. 0.3007]]], device='cuda:0')
  9155. loss_train_step before backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  9156. loss_train_step after backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  9157. loss_train: 1.3758654911071062
  9158. step: 28
  9159. running loss: 0.04913805325382522
  9160.  
  9161. Train Steps: 28/90 Loss: 0.0491 torch.Size([8, 600, 800])
  9162. torch.Size([8, 8])
  9163. tensor([[0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  9164. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  9165. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  9166. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  9167. [0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  9168. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  9169. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  9170. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378]],
  9171. device='cuda:0', dtype=torch.float64)
  9172. predictions are: tensor([[ 0.4980, -0.4510, 1.1881, -0.9858, -0.5650, -0.8815, 0.2687, 0.2701],
  9173. [ 0.6081, -0.3681, 1.7448, -0.0104, -0.5931, -0.5104, 0.2804, 0.2786],
  9174. [ 0.8465, -0.2756, 1.5485, -0.9244, -0.5099, -0.8537, 0.6211, 0.1732],
  9175. [-1.4354, -1.7735, 1.1950, -0.9369, -0.3766, -1.0535, 0.1421, 0.2662],
  9176. [ 0.8859, -0.2152, 1.9825, 0.0037, -0.3014, 0.4025, 0.5873, 0.2754],
  9177. [ 0.9285, -0.2262, 1.8356, -0.0805, -0.3351, 0.0737, 0.4443, 0.3068],
  9178. [ 0.5997, -0.4376, 1.7979, 0.2760, -0.4896, -0.1813, 0.4074, 0.2335],
  9179. [ 0.5675, -0.4697, 1.8163, -1.0207, 0.0638, -1.0853, 1.0176, 0.1437]],
  9180. device='cuda:0', grad_fn=<AddmmBackward>)
  9181. landmarks are: tensor([[[ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  9182. 0.2476],
  9183. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  9184. 0.3778],
  9185. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  9186. 0.1080],
  9187. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  9188. 0.4543],
  9189. [ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  9190. 0.0652],
  9191. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  9192. 0.3057],
  9193. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  9194. 0.1544],
  9195. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  9196. 0.1982]]], device='cuda:0')
  9197. loss_train_step before backward: tensor(0.0327, device='cuda:0', grad_fn=<MseLossBackward>)
  9198. loss_train_step after backward: tensor(0.0327, device='cuda:0', grad_fn=<MseLossBackward>)
  9199. loss_train: 1.4085994269698858
  9200. step: 29
  9201. running loss: 0.048572394033444335
  9202. Train Steps: 29/90 Loss: 0.0486 torch.Size([8, 600, 800])
  9203. torch.Size([8, 8])
  9204. tensor([[0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  9205. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  9206. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  9207. [0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  9208. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  9209. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  9210. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  9211. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142]],
  9212. device='cuda:0', dtype=torch.float64)
  9213. predictions are: tensor([[ 0.8314, -0.2732, 1.7540, -0.4890, -0.5828, -0.5468, 0.6514, 0.1730],
  9214. [ 0.6223, -0.3878, 1.9407, -0.0566, -0.0362, 0.2270, 0.7201, 0.3392],
  9215. [-0.0648, -0.8505, 0.9972, -1.0496, -0.3593, -1.3296, 0.2686, 0.3011],
  9216. [ 0.6182, -0.4060, 1.8672, 0.1088, -0.4125, -0.1731, 0.4656, 0.2312],
  9217. [ 0.7090, -0.3358, 1.9056, -0.3081, -0.2719, 0.1284, 0.6481, 0.3014],
  9218. [ 0.5278, -0.4470, 1.1147, -0.9866, -0.5895, -0.8632, 0.3399, 0.3552],
  9219. [-0.2827, -0.9884, 1.6530, -0.4936, -0.3237, -1.1280, 0.2926, 0.1953],
  9220. [ 0.4771, -0.4732, 1.8016, -0.2574, -0.3934, -0.2234, 0.3285, 0.2492]],
  9221. device='cuda:0', grad_fn=<AddmmBackward>)
  9222. landmarks are: tensor([[[ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  9223. -0.0611],
  9224. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  9225. 0.2083],
  9226. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  9227. 0.3808],
  9228. [ 0.5326, -0.4390, 1.7557, 0.0851, -0.5192, -0.0919, 0.3180,
  9229. 0.0620],
  9230. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  9231. 0.3161],
  9232. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  9233. 0.3854],
  9234. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  9235. 0.0021],
  9236. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  9237. 0.0893]]], device='cuda:0')
  9238. loss_train_step before backward: tensor(0.0391, device='cuda:0', grad_fn=<MseLossBackward>)
  9239. loss_train_step after backward: tensor(0.0391, device='cuda:0', grad_fn=<MseLossBackward>)
  9240. loss_train: 1.447685481980443
  9241. step: 30
  9242. running loss: 0.04825618273268143
  9243. Train Steps: 30/90 Loss: 0.0483 torch.Size([8, 600, 800])
  9244. torch.Size([8, 8])
  9245. tensor([[0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  9246. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  9247. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  9248. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  9249. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  9250. [0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366],
  9251. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  9252. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301]],
  9253. device='cuda:0', dtype=torch.float64)
  9254. predictions are: tensor([[ 0.4710, -0.5241, 1.6559, -0.7972, -0.2771, -0.8978, 0.7490, 0.1722],
  9255. [ 0.2822, -0.5709, 1.4792, -0.7684, -0.3218, -1.0572, 0.2195, 0.2607],
  9256. [ 0.3433, -0.5362, 1.0719, -1.1185, -0.5896, -0.8732, 0.2522, 0.3263],
  9257. [ 0.3159, -0.5916, 1.7861, -0.2359, -0.5078, -0.4310, 0.3561, 0.2378],
  9258. [ 0.4398, -0.4827, 1.7726, -0.2350, -0.0829, 0.0155, 0.4125, 0.3373],
  9259. [ 0.3263, -0.5749, 1.7963, -0.0346, -0.3689, -0.5563, 0.4905, 0.1943],
  9260. [ 0.6169, -0.3935, 1.6085, -0.0899, -0.3845, -0.1183, 0.6086, 0.3813],
  9261. [ 0.6808, -0.3486, 1.7518, -0.1970, -0.3165, -0.0122, 0.5884, 0.2809]],
  9262. device='cuda:0', grad_fn=<AddmmBackward>)
  9263. landmarks are: tensor([[[ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  9264. 0.1821],
  9265. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  9266. 0.2261],
  9267. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  9268. 0.3315],
  9269. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  9270. 0.0919],
  9271. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  9272. 0.3007],
  9273. [ 0.6273, -0.4249, 1.7095, 0.1159, -0.5480, -0.4306, 1.0910,
  9274. 0.1928],
  9275. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  9276. 0.3478],
  9277. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  9278. 0.1627]]], device='cuda:0')
  9279. loss_train_step before backward: tensor(0.0302, device='cuda:0', grad_fn=<MseLossBackward>)
  9280. loss_train_step after backward: tensor(0.0302, device='cuda:0', grad_fn=<MseLossBackward>)
  9281. loss_train: 1.477879423648119
  9282. step: 31
  9283. running loss: 0.04767352979510061
  9284. Train Steps: 31/90 Loss: 0.0477 torch.Size([8, 600, 800])
  9285. torch.Size([8, 8])
  9286. tensor([[0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  9287. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  9288. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  9289. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  9290. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  9291. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  9292. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  9293. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413]],
  9294. device='cuda:0', dtype=torch.float64)
  9295. predictions are: tensor([[ 0.5117, -0.4196, 0.9786, -0.9416, -0.6249, -0.8022, 0.2050, 0.3726],
  9296. [ 0.5619, -0.3987, 1.7834, 0.0175, -0.4419, -0.3582, 0.4923, 0.2641],
  9297. [ 0.3236, -0.5390, 1.8023, -0.3149, -0.4430, -0.8161, 0.4877, 0.2087],
  9298. [ 0.4976, -0.4769, 1.7585, 0.0139, -0.1965, 0.0074, 0.3728, 0.2565],
  9299. [ 0.4925, -0.4334, 1.1824, -1.0599, -0.4519, -1.0876, 0.3643, 0.2796],
  9300. [ 0.7676, -0.2882, 1.7267, 0.1517, -0.2220, 0.2903, 0.4297, 0.2950],
  9301. [ 0.3197, -0.5553, 1.3923, -0.9086, -0.5696, -0.3927, 0.5116, 0.3125],
  9302. [-0.0600, -0.8208, 1.8714, -0.7073, 0.0863, -0.9754, 0.9008, 0.1728]],
  9303. device='cuda:0', grad_fn=<AddmmBackward>)
  9304. landmarks are: tensor([[[ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  9305. 0.3854],
  9306. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  9307. 0.1499],
  9308. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  9309. 0.1390],
  9310. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  9311. 0.0051],
  9312. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  9313. 0.3007],
  9314. [ 0.5450, -0.4706, 1.7643, 0.0722, -0.3708, 0.3200, 0.4854,
  9315. 0.0612],
  9316. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  9317. 0.2776],
  9318. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  9319. 0.2142]]], device='cuda:0')
  9320. loss_train_step before backward: tensor(0.0254, device='cuda:0', grad_fn=<MseLossBackward>)
  9321. loss_train_step after backward: tensor(0.0254, device='cuda:0', grad_fn=<MseLossBackward>)
  9322. loss_train: 1.5033203139901161
  9323. step: 32
  9324. running loss: 0.04697875981219113
  9325.  
  9326. Train Steps: 32/90 Loss: 0.0470 torch.Size([8, 600, 800])
  9327. torch.Size([8, 8])
  9328. tensor([[0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  9329. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  9330. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  9331. [0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  9332. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  9333. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  9334. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  9335. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  9336. device='cuda:0', dtype=torch.float64)
  9337. predictions are: tensor([[ 0.6046, -0.4041, 1.3856, -1.1072, -0.3421, -1.0320, 0.7189, 0.1829],
  9338. [ 0.3036, -0.5672, 1.7304, -0.7838, -0.2106, -1.1523, 0.6788, 0.1557],
  9339. [ 0.8693, -0.1994, 1.6628, 0.1078, -0.4714, -0.5727, 0.3917, 0.2545],
  9340. [ 0.4444, -0.4605, 1.5921, -0.3418, -0.3893, -0.0181, 0.3984, 0.3219],
  9341. [-0.8497, -1.3179, 1.3370, -0.8653, -0.4921, -0.9819, 0.1373, 0.2156],
  9342. [ 0.7128, -0.3160, 1.6909, 0.0323, -0.1249, 0.1409, 0.4211, 0.3112],
  9343. [ 0.8694, -0.2089, 1.4843, -0.6585, -0.5412, -0.5137, 0.5688, 0.3325],
  9344. [ 0.6722, -0.3150, 1.5615, -0.0606, -0.3911, -0.0069, 0.5004, 0.3152]],
  9345. device='cuda:0', grad_fn=<AddmmBackward>)
  9346. landmarks are: tensor([[[ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  9347. 0.1214],
  9348. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  9349. -0.0263],
  9350. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  9351. 0.1698],
  9352. [ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  9353. 0.2296],
  9354. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  9355. 0.0893],
  9356. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  9357. 0.0942],
  9358. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  9359. 0.5491],
  9360. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  9361. 0.1768]]], device='cuda:0')
  9362. loss_train_step before backward: tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward>)
  9363. loss_train_step after backward: tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward>)
  9364. loss_train: 1.575185589492321
  9365. step: 33
  9366. running loss: 0.047732896651282455
  9367. Train Steps: 33/90 Loss: 0.0477 torch.Size([8, 600, 800])
  9368. torch.Size([8, 8])
  9369. tensor([[0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  9370. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  9371. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  9372. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  9373. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  9374. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  9375. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  9376. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183]],
  9377. device='cuda:0', dtype=torch.float64)
  9378. predictions are: tensor([[ 0.9045, -0.2045, 1.7665, -0.0190, -0.4189, -0.0906, 0.6821, 0.1926],
  9379. [ 0.6531, -0.3369, 1.7089, -0.5142, -0.4372, -0.1780, 0.5593, 0.1922],
  9380. [ 0.9902, -0.1364, 1.6734, -0.0408, -0.3670, -0.1510, 0.6068, 0.2448],
  9381. [-1.6674, -1.8711, 1.1930, -1.0522, -0.3653, -1.3092, 0.2291, 0.2265],
  9382. [ 0.6062, -0.3637, 1.6419, -0.6272, -0.6213, -0.5816, 0.3713, 0.2625],
  9383. [ 1.0549, -0.0778, 1.6522, 0.2349, -0.3027, -0.0812, 0.4714, 0.3484],
  9384. [ 0.8803, -0.1778, 1.6896, -0.1564, -0.2772, -0.2500, 0.4931, 0.2272],
  9385. [ 0.2314, -0.5895, 0.9697, -1.2898, -0.2493, -1.2955, 0.3786, 0.3206]],
  9386. device='cuda:0', grad_fn=<AddmmBackward>)
  9387. landmarks are: tensor([[[ 5.9082e-01, -4.3664e-01, 1.7557e+00, 1.3903e-01, -5.1917e-01,
  9388. 1.3133e-01, 6.5289e-01, 2.3557e-02],
  9389. [ 5.1680e-01, -4.5558e-01, 1.7095e+00, -2.9207e-01, -4.2102e-01,
  9390. 6.2048e-02, 1.4038e-01, 2.3124e-02],
  9391. [ 6.2361e-01, -4.3441e-01, 1.6171e+00, 1.8522e-01, -3.4018e-01,
  9392. 2.3557e-02, 6.4711e-01, 6.9746e-02],
  9393. [-2.2859e+00, -2.2859e+00, 1.2030e+00, -1.0288e+00, -4.9607e-01,
  9394. -1.1081e+00, 8.1293e-02, 3.1609e-01],
  9395. [ 5.7569e-01, -3.9169e-01, 1.7095e+00, -4.7683e-01, -6.3464e-01,
  9396. -4.2294e-01, 3.9307e-01, 3.2379e-01],
  9397. [ 5.8799e-01, -3.6051e-01, 1.7037e+00, 3.2379e-01, -2.9400e-01,
  9398. -7.6520e-02, 3.1801e-01, 3.1609e-01],
  9399. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  9400. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  9401. [ 6.1010e-01, -3.1524e-01, 1.0166e+00, -7.5396e-01, -2.2633e-02,
  9402. -1.4468e+00, 2.8226e-01, 5.7018e-01]]], device='cuda:0')
  9403. loss_train_step before backward: tensor(0.0464, device='cuda:0', grad_fn=<MseLossBackward>)
  9404. loss_train_step after backward: tensor(0.0464, device='cuda:0', grad_fn=<MseLossBackward>)
  9405. loss_train: 1.6215668469667435
  9406. step: 34
  9407. running loss: 0.047693142557845396
  9408. Train Steps: 34/90 Loss: 0.0477 torch.Size([8, 600, 800])
  9409. torch.Size([8, 8])
  9410. tensor([[0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  9411. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  9412. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  9413. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  9414. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  9415. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  9416. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  9417. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552]],
  9418. device='cuda:0', dtype=torch.float64)
  9419. predictions are: tensor([[ 0.8166, -0.1899, 1.3306, -0.7404, -0.4580, -0.7054, 0.4630, 0.3116],
  9420. [ 1.0022, -0.1160, 1.6696, 0.1123, -0.4108, 0.1231, 0.3683, 0.2487],
  9421. [-1.8722, -1.9516, 1.0990, -0.9600, -0.3088, -1.2137, 0.1891, 0.1847],
  9422. [ 1.2242, 0.0453, 1.6560, 0.5276, -0.4548, 0.1647, 0.3594, 0.2172],
  9423. [ 0.9550, -0.1220, 0.9757, -0.8584, -0.7268, -0.6853, 0.3104, 0.3065],
  9424. [ 0.8092, -0.2271, 1.7159, -0.2274, -0.6485, -0.1693, 0.3869, 0.2246],
  9425. [ 0.9884, -0.1324, 1.6578, -0.7221, -0.1089, -0.8412, 0.9937, 0.1319],
  9426. [-0.7703, -1.1830, 1.6248, -0.8926, 0.0598, -0.9897, 0.8520, 0.1865]],
  9427. device='cuda:0', grad_fn=<AddmmBackward>)
  9428. landmarks are: tensor([[[ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  9429. 0.5701],
  9430. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  9431. 0.3057],
  9432. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  9433. 0.0231],
  9434. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  9435. 0.2048],
  9436. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  9437. 0.3854],
  9438. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  9439. 0.2930],
  9440. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  9441. 0.2730],
  9442. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  9443. 0.2783]]], device='cuda:0')
  9444. loss_train_step before backward: tensor(0.1038, device='cuda:0', grad_fn=<MseLossBackward>)
  9445. loss_train_step after backward: tensor(0.1038, device='cuda:0', grad_fn=<MseLossBackward>)
  9446. loss_train: 1.725327029824257
  9447. step: 35
  9448. running loss: 0.04929505799497877
  9449. Train Steps: 35/90 Loss: 0.0493 torch.Size([8, 600, 800])
  9450. torch.Size([8, 8])
  9451. tensor([[0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  9452. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  9453. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  9454. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  9455. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  9456. [0.6182, 0.3930, 0.8841, 0.3892, 0.3556, 0.4967, 0.6222, 0.5279],
  9457. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  9458. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495]],
  9459. device='cuda:0', dtype=torch.float64)
  9460. predictions are: tensor([[ 1.0376, -0.0549, 1.6175, 0.2950, -0.3642, -0.3018, 0.4173, 0.2902],
  9461. [-1.3129, -1.5726, 1.0380, -1.1441, -0.2995, -1.3562, 0.2976, 0.2221],
  9462. [ 1.0837, -0.0560, 1.7402, 0.1596, -0.3138, 0.0089, 0.4249, 0.1761],
  9463. [ 1.2470, 0.0356, 1.7279, 0.3775, -0.3578, 0.1207, 0.5581, 0.2648],
  9464. [ 0.7240, -0.2872, 1.7171, -0.3920, -0.4311, -0.0944, 0.5612, 0.1505],
  9465. [ 0.7184, -0.3035, 1.6816, -0.6363, -0.5410, -0.1442, 0.8086, 0.2079],
  9466. [-1.6307, -1.8106, 1.2022, -0.9604, -0.3940, -1.2524, 0.2497, 0.2113],
  9467. [ 0.9433, -0.1526, 1.0979, -1.1195, -0.5620, -0.9940, 0.4218, 0.2257]],
  9468. device='cuda:0', grad_fn=<AddmmBackward>)
  9469. landmarks are: tensor([[[ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  9470. 0.3238],
  9471. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  9472. 0.3469],
  9473. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  9474. 0.0467],
  9475. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  9476. 0.3161],
  9477. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  9478. 0.0231],
  9479. [ 0.5697, -0.4706, 1.7976, -0.4884, -0.6433, 0.0081, 0.5878,
  9480. 0.1525],
  9481. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  9482. 0.3161],
  9483. [ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  9484. 0.2522]]], device='cuda:0')
  9485. loss_train_step before backward: tensor(0.1254, device='cuda:0', grad_fn=<MseLossBackward>)
  9486. loss_train_step after backward: tensor(0.1254, device='cuda:0', grad_fn=<MseLossBackward>)
  9487. loss_train: 1.8506858050823212
  9488. step: 36
  9489. running loss: 0.05140793903006448
  9490.  
  9491. Train Steps: 36/90 Loss: 0.0514 torch.Size([8, 600, 800])
  9492. torch.Size([8, 8])
  9493. tensor([[0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  9494. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  9495. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  9496. [0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  9497. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  9498. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  9499. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  9500. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679]],
  9501. device='cuda:0', dtype=torch.float64)
  9502. predictions are: tensor([[ 0.3210, -0.4926, 1.6567, -0.4000, -0.3599, -1.0264, 0.4894, 0.1499],
  9503. [ 0.6571, -0.3596, 1.0842, -1.2060, -0.6313, -1.0385, 0.5151, 0.1963],
  9504. [ 0.5058, -0.4447, 1.5437, 0.0189, -0.4176, -0.1923, 0.2316, 0.1914],
  9505. [ 0.1817, -0.6537, 1.4349, -0.7227, -0.4305, 0.0920, 0.4942, 0.2824],
  9506. [-1.3286, -1.6251, 1.6110, -0.9346, 0.0318, -1.2953, 0.6881, 0.1814],
  9507. [ 0.9706, -0.1940, 1.5802, 0.2639, -0.6015, -0.3286, 0.4616, 0.1453],
  9508. [ 0.5066, -0.4450, 1.4328, -0.3905, -0.5788, -0.2500, 0.2859, 0.2596],
  9509. [ 0.6623, -0.3516, 1.6435, 0.1237, -0.3628, 0.2921, 0.5939, 0.2574]],
  9510. device='cuda:0', grad_fn=<AddmmBackward>)
  9511. landmarks are: tensor([[[ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  9512. 0.1608],
  9513. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  9514. 0.1779],
  9515. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  9516. 0.1854],
  9517. [ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  9518. 0.2966],
  9519. [-2.2859, -2.2859, 1.8249, -0.8002, 0.0409, -1.2543, 0.8059,
  9520. 0.3050],
  9521. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  9522. 0.0291],
  9523. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  9524. 0.3267],
  9525. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  9526. 0.3371]]], device='cuda:0')
  9527. loss_train_step before backward: tensor(0.0419, device='cuda:0', grad_fn=<MseLossBackward>)
  9528. loss_train_step after backward: tensor(0.0419, device='cuda:0', grad_fn=<MseLossBackward>)
  9529. loss_train: 1.8925394713878632
  9530. step: 37
  9531. running loss: 0.051149715442915224
  9532. Train Steps: 37/90 Loss: 0.0511 torch.Size([8, 600, 800])
  9533. torch.Size([8, 8])
  9534. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  9535. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  9536. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  9537. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  9538. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  9539. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  9540. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  9541. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550]],
  9542. device='cuda:0', dtype=torch.float64)
  9543. predictions are: tensor([[ 0.1391, -0.6635, 1.4068, -1.0223, -0.4018, -1.1637, 0.4464, 0.0945],
  9544. [ 0.4628, -0.4339, 1.3757, -0.9598, -0.3049, -1.1301, 0.4751, 0.1769],
  9545. [ 0.4638, -0.5336, 1.4785, -0.6946, -0.6105, -0.6798, 0.6793, 0.1371],
  9546. [ 0.3253, -0.5462, 1.5459, 0.2808, -0.2164, 0.0366, 0.2902, 0.2458],
  9547. [ 0.2621, -0.6162, 1.4384, 0.0273, -0.4463, -0.3500, 0.6303, 0.2597],
  9548. [ 0.2308, -0.6349, 1.5872, -0.2894, -0.2790, 0.2705, 0.4701, 0.2369],
  9549. [ 0.0074, -0.7388, 1.5592, 0.3414, -0.4608, -0.2093, 0.3406, 0.1944],
  9550. [ 0.0809, -0.7228, 1.3165, -0.9145, -0.6861, -0.7330, 0.3129, 0.2097]],
  9551. device='cuda:0', grad_fn=<AddmmBackward>)
  9552. landmarks are: tensor([[[ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  9553. 0.0851],
  9554. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  9555. 0.2043],
  9556. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  9557. -0.0220],
  9558. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  9559. 0.2431],
  9560. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  9561. 0.3745],
  9562. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  9563. 0.2936],
  9564. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  9565. 0.2391],
  9566. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  9567. 0.2776]]], device='cuda:0')
  9568. loss_train_step before backward: tensor(0.0379, device='cuda:0', grad_fn=<MseLossBackward>)
  9569. loss_train_step after backward: tensor(0.0379, device='cuda:0', grad_fn=<MseLossBackward>)
  9570. loss_train: 1.9304494857788086
  9571. step: 38
  9572. running loss: 0.05080130225733707
  9573. Train Steps: 38/90 Loss: 0.0508 torch.Size([8, 600, 800])
  9574. torch.Size([8, 8])
  9575. tensor([[0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  9576. [0.6200, 0.4070, 0.8938, 0.4183, 0.3538, 0.4567, 0.6175, 0.5400],
  9577. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  9578. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  9579. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  9580. [0.6131, 0.4037, 0.6907, 0.2819, 0.3688, 0.2700, 0.5217, 0.5680],
  9581. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  9582. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667]],
  9583. device='cuda:0', dtype=torch.float64)
  9584. predictions are: tensor([[ 0.3057, -0.5980, 1.6707, 0.3744, -0.3315, -0.2668, 0.4939, 0.1397],
  9585. [ 0.3730, -0.5857, 1.6908, -0.3420, -0.5077, -0.1843, 0.5378, 0.1543],
  9586. [ 0.3094, -0.5495, 1.2988, -0.7486, -0.5875, -0.4744, 0.3223, 0.2321],
  9587. [ 0.0189, -0.7939, 1.7198, -0.3256, -0.4821, -0.3460, 0.3194, 0.2208],
  9588. [-0.0583, -0.8413, 1.6697, -0.4644, -0.5157, -0.3376, 0.4319, 0.2579],
  9589. [-0.0959, -0.8424, 0.9313, -1.0887, -0.5208, -1.0755, 0.2619, 0.2573],
  9590. [ 0.4857, -0.5217, 1.4339, -1.0939, -0.3772, -1.2367, 0.7471, 0.0930],
  9591. [ 0.5980, -0.3976, 1.7367, 0.5304, -0.3018, 0.2016, 0.4894, 0.2275]],
  9592. device='cuda:0', grad_fn=<AddmmBackward>)
  9593. landmarks are: tensor([[[ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  9594. -0.1492],
  9595. [ 0.5778, -0.4061, 1.8423, -0.3537, -0.6520, -0.1766, 0.5663,
  9596. 0.2083],
  9597. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  9598. 0.2386],
  9599. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  9600. 0.2930],
  9601. [ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  9602. 0.5239],
  9603. [ 0.5459, -0.4215, 0.9043, -0.9838, -0.5827, -1.0388, 0.1236,
  9604. 0.3378],
  9605. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  9606. -0.0220],
  9607. [ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  9608. 0.3315]]], device='cuda:0')
  9609. loss_train_step before backward: tensor(0.0421, device='cuda:0', grad_fn=<MseLossBackward>)
  9610. loss_train_step after backward: tensor(0.0421, device='cuda:0', grad_fn=<MseLossBackward>)
  9611. loss_train: 1.9725742973387241
  9612. step: 39
  9613. running loss: 0.05057882813689036
  9614. Train Steps: 39/90 Loss: 0.0506 torch.Size([8, 600, 800])
  9615. torch.Size([8, 8])
  9616. tensor([[ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  9617. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  9618. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  9619. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  9620. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  9621. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  9622. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  9623. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250]],
  9624. device='cuda:0', dtype=torch.float64)
  9625. predictions are: tensor([[-1.5030, -1.7617, 1.5962, -0.7638, -0.0465, -1.1517, 0.7468, 0.2570],
  9626. [ 0.6592, -0.3707, 1.6703, 0.0753, -0.2731, 0.2695, 0.3758, 0.2453],
  9627. [ 0.8878, -0.2623, 1.4946, -0.6248, -0.5640, -0.3283, 0.7205, 0.1871],
  9628. [-0.2709, -0.9534, 1.8355, -0.6016, -0.2469, -1.0011, 0.8533, 0.1493],
  9629. [ 0.1519, -0.6594, 1.1395, -0.7464, -0.7456, -0.9452, -0.0113, 0.1914],
  9630. [ 0.5785, -0.4321, 1.6872, 0.1249, -0.4040, 0.3933, 0.3312, 0.1839],
  9631. [ 0.5743, -0.4212, 0.8302, -1.1150, -0.6334, -1.2068, 0.3029, 0.2081],
  9632. [ 0.6235, -0.3960, 1.6506, 0.2356, -0.4930, 0.2425, 0.3186, 0.1754]],
  9633. device='cuda:0', grad_fn=<AddmmBackward>)
  9634. landmarks are: tensor([[[-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  9635. 0.3799],
  9636. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  9637. 0.4162],
  9638. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  9639. 0.2890],
  9640. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  9641. 0.2676],
  9642. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  9643. 0.2776],
  9644. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  9645. 0.0682],
  9646. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  9647. 0.2576],
  9648. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  9649. 0.1390]]], device='cuda:0')
  9650. loss_train_step before backward: tensor(0.1352, device='cuda:0', grad_fn=<MseLossBackward>)
  9651. loss_train_step after backward: tensor(0.1352, device='cuda:0', grad_fn=<MseLossBackward>)
  9652. loss_train: 2.107771832495928
  9653. step: 40
  9654. running loss: 0.05269429581239819
  9655.  
  9656. Train Steps: 40/90 Loss: 0.0527 torch.Size([8, 600, 800])
  9657. torch.Size([8, 8])
  9658. tensor([[ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  9659. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  9660. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  9661. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  9662. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  9663. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  9664. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  9665. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578]],
  9666. device='cuda:0', dtype=torch.float64)
  9667. predictions are: tensor([[-1.4297, -1.6886, 0.9586, -1.0350, -0.4966, -1.1245, 0.2422, 0.2725],
  9668. [ 0.7484, -0.3261, 1.7147, 0.2348, -0.1303, 0.2234, 0.4167, 0.1816],
  9669. [ 0.9006, -0.1798, 1.8771, -0.0190, -0.2798, -0.6128, 0.7785, 0.1212],
  9670. [ 0.9955, -0.1387, 1.5056, -0.5418, -0.7577, -0.3477, 0.2791, 0.1715],
  9671. [ 1.1263, -0.0555, 1.6218, -0.5745, -0.5147, -0.7123, 0.5116, 0.1374],
  9672. [ 0.1350, -0.6184, 1.1729, -1.1085, -0.3779, -0.8162, 0.4339, 0.3186],
  9673. [ 0.9295, -0.2291, 1.6967, 0.4022, -0.3601, 0.3717, 0.5515, 0.1648],
  9674. [-2.0216, -2.0805, 1.1421, -0.9266, -0.5279, -0.9488, 0.2146, 0.2698]],
  9675. device='cuda:0', grad_fn=<AddmmBackward>)
  9676. landmarks are: tensor([[[-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  9677. 0.2006],
  9678. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  9679. 0.2237],
  9680. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  9681. 0.3692],
  9682. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  9683. 0.2567],
  9684. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  9685. 0.2139],
  9686. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  9687. 0.2853],
  9688. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  9689. 0.1698],
  9690. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  9691. 0.2905]]], device='cuda:0')
  9692. loss_train_step before backward: tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward>)
  9693. loss_train_step after backward: tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward>)
  9694. loss_train: 2.1670092418789864
  9695. step: 41
  9696. running loss: 0.05285388394826796
  9697. Train Steps: 41/90 Loss: 0.0529 torch.Size([8, 600, 800])
  9698. torch.Size([8, 8])
  9699. tensor([[0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  9700. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  9701. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  9702. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  9703. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517],
  9704. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  9705. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  9706. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071]],
  9707. device='cuda:0', dtype=torch.float64)
  9708. predictions are: tensor([[-0.3570, -1.0477, 1.9500, -0.7166, -0.2661, -0.7335, 0.7896, 0.2005],
  9709. [ 0.1600, -0.7055, 1.7179, -0.2601, -0.1441, 0.0563, 0.3919, 0.2460],
  9710. [ 0.2115, -0.6359, 1.6255, -0.0376, -0.6835, -0.6661, 0.2499, 0.1468],
  9711. [-0.0534, -0.8461, 1.5375, 0.2503, -0.5311, -0.0212, 0.3671, 0.3205],
  9712. [ 0.3429, -0.5866, 1.6651, -0.2636, -0.2702, 0.2513, 0.4242, 0.2724],
  9713. [ 0.3025, -0.6347, 1.5513, -0.8119, -0.4023, -0.8750, 0.6761, 0.1629],
  9714. [ 0.1845, -0.6954, 1.6102, 0.1688, -0.5439, -0.2238, 0.3499, 0.2069],
  9715. [ 0.6012, -0.4584, 1.0800, -1.4243, -0.6784, -1.1147, 0.3999, 0.1815]],
  9716. device='cuda:0', grad_fn=<AddmmBackward>)
  9717. landmarks are: tensor([[[ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  9718. 0.2676],
  9719. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  9720. 0.2853],
  9721. [ 0.5379, -0.4358, 1.7326, 0.1852, -0.6058, -0.5461, 0.0684,
  9722. -0.0310],
  9723. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  9724. 0.5316],
  9725. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  9726. 0.2622],
  9727. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  9728. 0.1821],
  9729. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  9730. 0.1159],
  9731. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  9732. 0.0562]]], device='cuda:0')
  9733. loss_train_step before backward: tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward>)
  9734. loss_train_step after backward: tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward>)
  9735. loss_train: 2.229224521666765
  9736. step: 42
  9737. running loss: 0.05307677432539917
  9738. Train Steps: 42/90 Loss: 0.0531 torch.Size([8, 600, 800])
  9739. torch.Size([8, 8])
  9740. tensor([[0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  9741. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  9742. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  9743. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  9744. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  9745. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  9746. [0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637],
  9747. [0.6064, 0.3953, 0.8738, 0.4417, 0.3663, 0.4683, 0.5511, 0.5416]],
  9748. device='cuda:0', dtype=torch.float64)
  9749. predictions are: tensor([[ 0.2737, -0.6350, 1.8644, -0.3020, -0.5419, -0.4866, 0.5516, 0.1753],
  9750. [-0.2903, -0.9783, 1.4274, -0.8604, -0.4192, -1.0997, 0.3088, 0.1842],
  9751. [ 0.2797, -0.6562, 1.8521, 0.2928, -0.4158, 0.0558, 0.6270, 0.1605],
  9752. [ 0.1652, -0.7392, 1.9001, -0.0229, -0.1119, 0.4007, 0.5122, 0.2274],
  9753. [ 0.1744, -0.7025, 0.9219, -1.1211, -0.4517, -1.2485, 0.2254, 0.2856],
  9754. [ 0.4882, -0.4664, 1.4131, -0.6096, -0.4171, -0.6723, 0.5737, 0.3040],
  9755. [ 0.2635, -0.6419, 1.5242, -0.7674, -0.6309, -0.7327, 0.2655, 0.2337],
  9756. [ 0.0690, -0.8091, 1.8354, -0.1112, -0.5163, 0.0057, 0.4869, 0.1616]],
  9757. device='cuda:0', grad_fn=<AddmmBackward>)
  9758. landmarks are: tensor([[[ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  9759. 0.2464],
  9760. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  9761. 0.0111],
  9762. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  9763. 0.0851],
  9764. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  9765. 0.2699],
  9766. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  9767. 0.2747],
  9768. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  9769. 0.3469],
  9770. [ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  9771. 0.3177],
  9772. [ 0.5149, -0.4603, 1.7499, -0.2459, -0.5942, -0.1227, 0.2596,
  9773. 0.2155]]], device='cuda:0')
  9774. loss_train_step before backward: tensor(0.0456, device='cuda:0', grad_fn=<MseLossBackward>)
  9775. loss_train_step after backward: tensor(0.0456, device='cuda:0', grad_fn=<MseLossBackward>)
  9776. loss_train: 2.2748365253210068
  9777. step: 43
  9778. running loss: 0.052903175007465275
  9779. Train Steps: 43/90 Loss: 0.0529 torch.Size([8, 600, 800])
  9780. torch.Size([8, 8])
  9781. tensor([[0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  9782. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  9783. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  9784. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  9785. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  9786. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  9787. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  9788. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533]],
  9789. device='cuda:0', dtype=torch.float64)
  9790. predictions are: tensor([[ 0.5413, -0.4571, 1.9170, 0.0479, -0.6285, 0.0270, 0.2009, 0.2187],
  9791. [-0.0423, -0.8500, 1.2509, -0.7857, -0.3819, -0.8803, 0.3350, 0.2688],
  9792. [ 0.3422, -0.5660, 1.1678, -0.6439, -0.4835, -0.6990, 0.2194, 0.2989],
  9793. [ 0.1666, -0.7358, 1.9808, -0.2059, -0.4849, 0.0364, 0.7351, 0.1599],
  9794. [ 0.1013, -0.7613, 1.7859, -0.6040, -0.0864, -0.9437, 0.7968, 0.1880],
  9795. [ 0.3649, -0.5743, 1.5560, -0.5668, -0.5240, -0.5518, 0.4174, 0.1397],
  9796. [-0.6398, -1.2337, 1.2423, -0.8344, -0.2962, -1.1112, 0.2853, 0.2156],
  9797. [ 0.5759, -0.4420, 1.3873, -0.7166, -0.5027, -0.4597, 0.4913, 0.2565]],
  9798. device='cuda:0', grad_fn=<AddmmBackward>)
  9799. landmarks are: tensor([[[ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  9800. 0.4348],
  9801. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  9802. 0.2906],
  9803. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  9804. 0.3546],
  9805. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  9806. 0.1080],
  9807. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  9808. 0.1467],
  9809. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  9810. -0.1031],
  9811. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  9812. 0.0261],
  9813. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  9814. 0.2699]]], device='cuda:0')
  9815. loss_train_step before backward: tensor(0.1343, device='cuda:0', grad_fn=<MseLossBackward>)
  9816. loss_train_step after backward: tensor(0.1343, device='cuda:0', grad_fn=<MseLossBackward>)
  9817. loss_train: 2.4091132134199142
  9818. step: 44
  9819. running loss: 0.054752573032270775
  9820.  
  9821. Train Steps: 44/90 Loss: 0.0548 torch.Size([8, 600, 800])
  9822. torch.Size([8, 8])
  9823. tensor([[0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  9824. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  9825. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  9826. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  9827. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  9828. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  9829. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  9830. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583]],
  9831. device='cuda:0', dtype=torch.float64)
  9832. predictions are: tensor([[ 0.4334, -0.5116, 1.3480, -0.8113, -0.3142, -1.0172, 0.4388, 0.3419],
  9833. [ 0.4893, -0.5194, 1.3963, -1.1550, -0.5044, -1.0069, 0.5392, 0.1921],
  9834. [ 0.0556, -0.8011, 2.0050, 0.2513, -0.3090, 0.1978, 0.3072, 0.1363],
  9835. [ 0.0547, -0.7857, 1.8429, -0.2424, -0.5380, -0.0357, 0.3545, 0.2218],
  9836. [ 0.0402, -0.8175, 1.9599, 0.0763, -0.3227, 0.1221, 0.5820, 0.1758],
  9837. [ 0.4812, -0.4551, 1.8308, 0.2619, -0.5223, -0.2912, 0.3599, 0.2569],
  9838. [-0.0621, -0.8441, 1.1563, -1.2337, -0.5207, -1.1930, 0.2766, 0.2215],
  9839. [ 0.6473, -0.4163, 1.2970, -1.1117, -0.4648, -1.1489, 0.4737, 0.2342]],
  9840. device='cuda:0', grad_fn=<AddmmBackward>)
  9841. landmarks are: tensor([[[ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  9842. 0.5401],
  9843. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  9844. 0.2391],
  9845. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  9846. 0.0467],
  9847. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  9848. 0.3267],
  9849. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  9850. 0.1627],
  9851. [ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  9852. 0.4547],
  9853. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  9854. 0.0712],
  9855. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  9856. 0.2930]]], device='cuda:0')
  9857. loss_train_step before backward: tensor(0.0466, device='cuda:0', grad_fn=<MseLossBackward>)
  9858. loss_train_step after backward: tensor(0.0466, device='cuda:0', grad_fn=<MseLossBackward>)
  9859. loss_train: 2.45572542399168
  9860. step: 45
  9861. running loss: 0.054571676088704
  9862. Train Steps: 45/90 Loss: 0.0546 torch.Size([8, 600, 800])
  9863. torch.Size([8, 8])
  9864. tensor([[0.6266, 0.4101, 0.8350, 0.2333, 0.3950, 0.2950, 0.6264, 0.4921],
  9865. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  9866. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  9867. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  9868. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  9869. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  9870. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  9871. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436]],
  9872. device='cuda:0', dtype=torch.float64)
  9873. predictions are: tensor([[ 0.0486, -0.7520, 1.5484, -1.2891, -0.3776, -1.1524, 0.5029, 0.2081],
  9874. [ 0.1276, -0.7314, 1.7045, 0.1468, -0.5277, -0.3232, 0.3239, 0.1693],
  9875. [ 0.1799, -0.6887, 1.7231, -0.0090, -0.3742, 0.0133, 0.1609, 0.1769],
  9876. [ 0.4219, -0.5362, 1.5284, -0.9328, -0.6049, -0.6821, 0.3582, 0.3489],
  9877. [ 0.5471, -0.4507, 1.6436, 0.3289, -0.4051, -0.3247, 0.3472, 0.3031],
  9878. [ 0.4886, -0.4759, 1.6206, -1.0411, -0.2340, -1.1404, 0.6254, 0.2247],
  9879. [ 0.5113, -0.4774, 1.1860, -1.2704, -0.5188, -1.0736, 0.4048, 0.2197],
  9880. [ 0.2363, -0.6918, 1.8009, -0.0398, -0.4113, 0.2251, 0.6258, 0.2378]],
  9881. device='cuda:0', grad_fn=<AddmmBackward>)
  9882. landmarks are: tensor([[[ 0.6081, -0.3918, 1.5709, -1.2082, -0.4614, -0.9233, 0.6072,
  9883. -0.0129],
  9884. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  9885. 0.1159],
  9886. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  9887. 0.0467],
  9888. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  9889. 0.5624],
  9890. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  9891. 0.4624],
  9892. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  9893. 0.2050],
  9894. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  9895. 0.2391],
  9896. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  9897. 0.2249]]], device='cuda:0')
  9898. loss_train_step before backward: tensor(0.0342, device='cuda:0', grad_fn=<MseLossBackward>)
  9899. loss_train_step after backward: tensor(0.0342, device='cuda:0', grad_fn=<MseLossBackward>)
  9900. loss_train: 2.489884562790394
  9901. step: 46
  9902. running loss: 0.05412792527805204
  9903. Train Steps: 46/90 Loss: 0.0541 torch.Size([8, 600, 800])
  9904. torch.Size([8, 8])
  9905. tensor([[0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  9906. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  9907. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  9908. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  9909. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  9910. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  9911. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  9912. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986]],
  9913. device='cuda:0', dtype=torch.float64)
  9914. predictions are: tensor([[ 0.2156, -0.7264, 1.8884, 0.1304, -0.4089, 0.0797, 0.6120, 0.1767],
  9915. [ 0.5065, -0.4851, 1.3740, -1.1749, -0.4529, -0.8285, 0.6044, 0.2467],
  9916. [ 0.7207, -0.3375, 1.1234, -1.1218, -0.3663, -1.1669, 0.2888, 0.2777],
  9917. [ 0.5620, -0.4515, 1.7631, -0.4039, -0.5657, -0.5033, 0.4060, 0.2434],
  9918. [ 0.3018, -0.6048, 1.0069, -1.1920, -0.3891, -1.2506, 0.2564, 0.3108],
  9919. [ 0.4506, -0.5106, 1.7971, -0.1529, -0.6035, -0.4831, 0.2787, 0.1326],
  9920. [ 0.1461, -0.7076, 1.6684, -0.1707, -0.4278, 0.0296, 0.3463, 0.2320],
  9921. [ 0.3512, -0.5647, 1.8268, -0.5372, -0.2307, -1.0289, 0.5388, 0.2037]],
  9922. device='cuda:0', grad_fn=<AddmmBackward>)
  9923. landmarks are: tensor([[[ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  9924. 0.0851],
  9925. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  9926. 0.1621],
  9927. [ 0.5850, -0.3925, 1.0513, -1.3467, -0.3517, -1.2620, 0.4739,
  9928. 0.1544],
  9929. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  9930. 0.1544],
  9931. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  9932. 0.3007],
  9933. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  9934. 0.1824],
  9935. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  9936. 0.2386],
  9937. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  9938. 0.0171]]], device='cuda:0')
  9939. loss_train_step before backward: tensor(0.0191, device='cuda:0', grad_fn=<MseLossBackward>)
  9940. loss_train_step after backward: tensor(0.0191, device='cuda:0', grad_fn=<MseLossBackward>)
  9941. loss_train: 2.5090342573821545
  9942. step: 47
  9943. running loss: 0.053383707603875626
  9944. Train Steps: 47/90 Loss: 0.0534 torch.Size([8, 600, 800])
  9945. torch.Size([8, 8])
  9946. tensor([[0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  9947. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  9948. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  9949. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  9950. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  9951. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633],
  9952. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  9953. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064]],
  9954. device='cuda:0', dtype=torch.float64)
  9955. predictions are: tensor([[ 0.8475, -0.2794, 1.7623, -0.0957, -0.4256, 0.2351, 0.4581, 0.2182],
  9956. [-0.2862, -0.9827, 1.5954, -1.0876, -0.1128, -1.1886, 0.7696, 0.2542],
  9957. [ 0.5297, -0.4046, 1.3062, -0.6987, -0.7591, -0.5133, 0.2072, 0.2336],
  9958. [ 0.7029, -0.3222, 0.8991, -1.0768, -0.5859, -1.2088, 0.0907, 0.2763],
  9959. [ 0.4878, -0.4625, 1.5844, -0.8308, -0.2686, -1.0829, 0.5105, 0.2126],
  9960. [ 0.3900, -0.5851, 1.5981, -1.0304, -0.2450, -1.2939, 0.9065, 0.1962],
  9961. [ 0.4773, -0.5220, 1.6869, -0.1609, -0.5247, 0.0040, 0.3232, 0.2207],
  9962. [ 0.4895, -0.4908, 1.6441, 0.0550, -0.2706, -0.1646, 0.1716, 0.2209]],
  9963. device='cuda:0', grad_fn=<AddmmBackward>)
  9964. landmarks are: tensor([[[ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  9965. 0.0682],
  9966. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  9967. 0.2730],
  9968. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  9969. 0.2386],
  9970. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  9971. 0.1890],
  9972. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  9973. 0.0051],
  9974. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  9975. 0.3157],
  9976. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  9977. 0.2545],
  9978. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  9979. 0.0532]]], device='cuda:0')
  9980. loss_train_step before backward: tensor(0.0418, device='cuda:0', grad_fn=<MseLossBackward>)
  9981.  
  9982. loss_train_step after backward: tensor(0.0418, device='cuda:0', grad_fn=<MseLossBackward>)
  9983. loss_train: 2.550849635154009
  9984. step: 48
  9985. running loss: 0.05314270073237518
  9986. Train Steps: 48/90 Loss: 0.0531 torch.Size([8, 600, 800])
  9987. torch.Size([8, 8])
  9988. tensor([[0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  9989. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  9990. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  9991. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  9992. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  9993. [0.6086, 0.3998, 0.8788, 0.4450, 0.4025, 0.4650, 0.5306, 0.5103],
  9994. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  9995. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617]],
  9996. device='cuda:0', dtype=torch.float64)
  9997. predictions are: tensor([[ 0.5748, -0.4237, 1.6063, -0.8094, -0.6753, -0.6006, 0.4739, 0.1426],
  9998. [ 0.6394, -0.3932, 1.5600, -0.2398, -0.4541, -0.4561, 0.6120, 0.2591],
  9999. [ 0.7896, -0.2924, 1.2072, -1.4725, -0.2467, -1.6366, 0.4556, 0.2659],
  10000. [ 0.6717, -0.3560, 1.6344, -0.4148, -0.4480, -0.3918, 0.3761, 0.2047],
  10001. [ 0.5630, -0.4586, 1.6663, -0.2600, -0.5572, -0.5696, 0.4639, 0.1523],
  10002. [ 0.3004, -0.6163, 1.5867, -0.7224, -0.5165, -0.5790, 0.2084, 0.2126],
  10003. [ 0.4216, -0.5652, 1.7460, -0.4298, -0.1611, -0.1235, 0.5190, 0.2736],
  10004. [ 0.5407, -0.4184, 1.4882, -0.1265, -0.2424, -0.5134, 0.2740, 0.2863]],
  10005. device='cuda:0', grad_fn=<AddmmBackward>)
  10006. landmarks are: tensor([[[ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  10007. -0.0099],
  10008. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  10009. 0.3745],
  10010. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  10011. 0.2442],
  10012. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  10013. 0.1005],
  10014. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  10015. 0.0111],
  10016. [ 0.5253, -0.4392, 1.7730, -0.2305, -0.4268, -0.1381, 0.1651,
  10017. 0.0712],
  10018. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  10019. 0.2083],
  10020. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  10021. 0.3084]]], device='cuda:0')
  10022. loss_train_step before backward: tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward>)
  10023. loss_train_step after backward: tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward>)
  10024. loss_train: 2.607935193926096
  10025. step: 49
  10026. running loss: 0.05322316722298155
  10027. Train Steps: 49/90 Loss: 0.0532 torch.Size([8, 600, 800])
  10028. torch.Size([8, 8])
  10029. tensor([[0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  10030. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  10031. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  10032. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  10033. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  10034. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  10035. [0.6184, 0.4079, 0.8350, 0.3700, 0.3675, 0.2883, 0.5312, 0.5783],
  10036. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334]],
  10037. device='cuda:0', dtype=torch.float64)
  10038. predictions are: tensor([[ 0.6072, -0.3902, 1.6371, -0.2984, -0.5227, -0.1801, 0.3244, 0.2093],
  10039. [ 0.7488, -0.2995, 1.2322, -1.1851, -0.3223, -1.2072, 0.5751, 0.2034],
  10040. [-0.4687, -1.0840, 0.9513, -1.2575, -0.3393, -1.3697, 0.1948, 0.2901],
  10041. [ 1.0454, -0.1078, 1.6811, -0.6875, -0.4405, -0.7529, 0.4998, 0.2144],
  10042. [ 0.6249, -0.4240, 1.7408, 0.0835, -0.1700, 0.0287, 0.4339, 0.1851],
  10043. [ 0.5893, -0.3850, 1.3182, -1.1520, -0.3977, -0.9190, 0.5694, 0.2199],
  10044. [ 1.0067, -0.1159, 1.5522, -0.5882, -0.5079, -0.9046, 0.2085, 0.2066],
  10045. [ 0.7296, -0.3669, 1.8127, -0.0611, -0.4475, -0.2764, 0.6066, 0.1349]],
  10046. device='cuda:0', grad_fn=<AddmmBackward>)
  10047. landmarks are: tensor([[[ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  10048. 0.3267],
  10049. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  10050. 0.2468],
  10051. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  10052. 0.3604],
  10053. [ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  10054. 0.3315],
  10055. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  10056. 0.0942],
  10057. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  10058. 0.1621],
  10059. [ 0.5704, -0.4019, 1.5709, -0.5769, -0.5885, -0.9541, 0.1679,
  10060. 0.3854],
  10061. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  10062. 0.1779]]], device='cuda:0')
  10063. loss_train_step before backward: tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward>)
  10064. loss_train_step after backward: tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward>)
  10065. loss_train: 2.6973820067942142
  10066. step: 50
  10067. running loss: 0.05394764013588429
  10068. Train Steps: 50/90 Loss: 0.0539 torch.Size([8, 600, 800])
  10069. torch.Size([8, 8])
  10070. tensor([[0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  10071. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  10072. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  10073. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  10074. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  10075. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  10076. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  10077. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466]],
  10078. device='cuda:0', dtype=torch.float64)
  10079. predictions are: tensor([[ 0.7791, -0.2850, 1.6467, -0.0968, -0.3366, -0.3221, 0.2981, 0.1525],
  10080. [ 0.5286, -0.4658, 1.6174, -0.9831, -0.3909, -0.7397, 0.8328, 0.1719],
  10081. [ 0.4610, -0.5079, 1.6431, -0.6665, -0.5766, -0.4751, 0.6097, 0.1839],
  10082. [ 0.6320, -0.3769, 1.6806, -0.2920, -0.2413, -0.3868, 0.5874, 0.1817],
  10083. [ 0.5876, -0.3599, 0.9087, -1.2984, -0.4308, -1.4225, 0.2108, 0.2846],
  10084. [ 0.6575, -0.3667, 1.7049, -0.3855, -0.1634, -0.2377, 0.4880, 0.2273],
  10085. [ 0.9322, -0.1638, 1.4860, -0.7307, -0.6229, -0.9279, 0.2114, 0.2237],
  10086. [ 0.5982, -0.3987, 1.6030, -0.1148, -0.2391, -0.3081, 0.3186, 0.1958]],
  10087. device='cuda:0', grad_fn=<AddmmBackward>)
  10088. landmarks are: tensor([[[ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  10089. 0.0467],
  10090. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  10091. 0.2890],
  10092. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  10093. 0.2083],
  10094. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  10095. 0.1474],
  10096. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  10097. 0.3546],
  10098. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  10099. 0.3007],
  10100. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  10101. 0.4348],
  10102. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  10103. 0.2386]]], device='cuda:0')
  10104. loss_train_step before backward: tensor(0.0397, device='cuda:0', grad_fn=<MseLossBackward>)
  10105. loss_train_step after backward: tensor(0.0397, device='cuda:0', grad_fn=<MseLossBackward>)
  10106. loss_train: 2.7370548360049725
  10107. step: 51
  10108. running loss: 0.05366774188245044
  10109. Train Steps: 51/90 Loss: 0.0537 torch.Size([8, 600, 800])
  10110. torch.Size([8, 8])
  10111. tensor([[0.6184, 0.4079, 0.8350, 0.3700, 0.3675, 0.2883, 0.5312, 0.5783],
  10112. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  10113. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  10114. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  10115. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  10116. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  10117. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  10118. [0.6289, 0.4024, 0.9088, 0.4567, 0.3937, 0.5633, 0.7058, 0.5609]],
  10119. device='cuda:0', dtype=torch.float64)
  10120. predictions are: tensor([[ 0.8567, -0.1718, 1.3547, -0.7763, -0.4955, -0.9446, 0.0881, 0.2427],
  10121. [ 0.5651, -0.4153, 1.5431, -0.3089, -0.4450, -0.5726, 0.3844, 0.1504],
  10122. [ 0.6591, -0.3766, 1.6432, -0.2126, -0.3674, 0.1996, 0.5802, 0.2341],
  10123. [ 0.4659, -0.4568, 1.6246, -1.0287, -0.2502, -1.0492, 0.6522, 0.2027],
  10124. [ 0.4960, -0.4170, 1.1506, -1.3285, -0.1680, -1.3687, 0.4071, 0.2298],
  10125. [ 0.8298, -0.2185, 1.5897, -0.2481, -0.4702, -0.4676, 0.2961, 0.1988],
  10126. [ 0.5850, -0.4000, 1.5434, -0.1594, -0.4074, -0.6108, 0.4559, 0.1936],
  10127. [ 0.7825, -0.3099, 1.6470, -0.3506, -0.3493, 0.2103, 0.7165, 0.2178]],
  10128. device='cuda:0', grad_fn=<AddmmBackward>)
  10129. landmarks are: tensor([[[ 0.5704, -0.4019, 1.5709, -0.5769, -0.5885, -0.9541, 0.1679,
  10130. 0.3854],
  10131. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  10132. 0.0472],
  10133. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  10134. 0.2035],
  10135. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  10136. 0.3050],
  10137. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  10138. 0.2083],
  10139. [ 0.6096, -0.4046, 1.8249, -0.0072, -0.6115, -0.3537, 0.6182,
  10140. 0.0928],
  10141. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  10142. 0.2516],
  10143. [ 0.6191, -0.4273, 1.9115, -0.1766, -0.4672, 0.3161, 0.9741,
  10144. 0.3050]]], device='cuda:0')
  10145. loss_train_step before backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  10146. loss_train_step after backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  10147. loss_train: 2.775506906211376
  10148. step: 52
  10149. running loss: 0.05337513281175724
  10150.  
  10151. Train Steps: 52/90 Loss: 0.0534 torch.Size([8, 600, 800])
  10152. torch.Size([8, 8])
  10153. tensor([[0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  10154. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  10155. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  10156. [ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  10157. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  10158. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  10159. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  10160. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967]],
  10161. device='cuda:0', dtype=torch.float64)
  10162. predictions are: tensor([[ 1.2758, -0.0035, 1.7499, -0.0705, -0.1819, 0.2553, 0.6336, 0.2368],
  10163. [ 1.0472, -0.1138, 1.7491, -0.2063, -0.3777, 0.2831, 0.5343, 0.2114],
  10164. [ 1.0555, -0.0865, 1.6605, -0.5979, -0.5562, -0.4504, 0.5985, 0.0961],
  10165. [-0.9829, -1.4003, 1.5955, -1.0695, 0.0910, -1.2272, 0.8067, 0.2447],
  10166. [ 1.1451, -0.0027, 1.6130, 0.1069, -0.5170, -0.5456, 0.3886, 0.1717],
  10167. [-0.4768, -1.0166, 0.8050, -1.3387, -0.3480, -1.3481, 0.2209, 0.2965],
  10168. [ 0.7727, -0.2133, 1.0725, -1.0082, -0.5601, -0.6336, 0.1684, 0.2660],
  10169. [ 1.1011, 0.0046, 1.6445, -0.3508, -0.3602, -0.9335, 0.4613, 0.1539]],
  10170. device='cuda:0', grad_fn=<AddmmBackward>)
  10171. landmarks are: tensor([[[ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  10172. 0.2237],
  10173. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  10174. 0.3161],
  10175. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  10176. -0.0670],
  10177. [-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  10178. 0.3638],
  10179. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  10180. 0.1698],
  10181. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  10182. 0.2699],
  10183. [ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  10184. 0.1710],
  10185. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  10186. 0.0081]]], device='cuda:0')
  10187. loss_train_step before backward: tensor(0.1587, device='cuda:0', grad_fn=<MseLossBackward>)
  10188. loss_train_step after backward: tensor(0.1587, device='cuda:0', grad_fn=<MseLossBackward>)
  10189. loss_train: 2.9342208728194237
  10190. step: 53
  10191. running loss: 0.05536265797772497
  10192. Train Steps: 53/90 Loss: 0.0554 torch.Size([8, 600, 800])
  10193. torch.Size([8, 8])
  10194. tensor([[0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  10195. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  10196. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  10197. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  10198. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  10199. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  10200. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  10201. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183]],
  10202. device='cuda:0', dtype=torch.float64)
  10203. predictions are: tensor([[ 0.3557, -0.4607, 1.3432, -0.7182, -0.4009, -1.1316, 0.1919, 0.2739],
  10204. [ 0.6425, -0.3514, 1.5266, -0.1332, -0.3826, -0.3711, 0.5698, 0.1939],
  10205. [ 0.3685, -0.5062, 1.3575, -1.2130, -0.1406, -1.5512, 0.6332, 0.1769],
  10206. [ 0.6780, -0.3683, 1.8085, -0.1522, -0.3207, 0.1319, 0.8006, 0.1867],
  10207. [ 0.9286, -0.1924, 1.7689, 0.0137, -0.3892, 0.0995, 0.7076, 0.1731],
  10208. [ 0.7650, -0.2433, 1.5615, -0.4926, -0.5390, -0.5534, 0.2164, 0.2737],
  10209. [ 0.5087, -0.3998, 1.2703, -0.8557, -0.5282, -0.6876, 0.2457, 0.2515],
  10210. [ 0.8064, -0.2767, 1.7967, -0.1745, -0.3430, 0.2104, 0.6670, 0.1899]],
  10211. device='cuda:0', grad_fn=<AddmmBackward>)
  10212. landmarks are: tensor([[[ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  10213. 0.3928],
  10214. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  10215. 0.2356],
  10216. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  10217. 0.1917],
  10218. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  10219. 0.1554],
  10220. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  10221. 0.2196],
  10222. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  10223. 0.3238],
  10224. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  10225. 0.3198],
  10226. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  10227. 0.1082]]], device='cuda:0')
  10228. loss_train_step before backward: tensor(0.0291, device='cuda:0', grad_fn=<MseLossBackward>)
  10229. loss_train_step after backward: tensor(0.0291, device='cuda:0', grad_fn=<MseLossBackward>)
  10230. loss_train: 2.9632861856371164
  10231. step: 54
  10232. running loss: 0.054875670104391046
  10233. Train Steps: 54/90 Loss: 0.0549 torch.Size([8, 600, 800])
  10234. torch.Size([8, 8])
  10235. tensor([[0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  10236. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  10237. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  10238. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  10239. [0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533],
  10240. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  10241. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  10242. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183]],
  10243. device='cuda:0', dtype=torch.float64)
  10244. predictions are: tensor([[ 0.4483, -0.4180, 1.0823, -1.1483, -0.1529, -1.1096, 0.4683, 0.3558],
  10245. [ 0.5588, -0.3981, 1.7192, -0.2750, -0.4433, -0.2098, 0.4805, 0.2380],
  10246. [ 0.4985, -0.4167, 1.3104, -0.8960, -0.5438, -0.5640, 0.4597, 0.2455],
  10247. [ 0.8661, -0.2295, 1.7761, 0.4190, -0.2540, 0.1397, 0.5771, 0.2036],
  10248. [ 0.8158, -0.2632, 1.8079, 0.3212, -0.3979, 0.0774, 0.5858, 0.1922],
  10249. [ 0.8015, -0.2651, 1.9091, -0.0199, -0.4642, -0.2573, 0.7678, 0.1320],
  10250. [ 0.0030, -0.7220, 1.4453, -0.7867, -0.5837, -0.7954, 0.2402, 0.1659],
  10251. [ 0.5133, -0.4323, 1.2798, -1.3046, -0.2583, -1.3138, 0.6630, 0.1580]],
  10252. device='cuda:0', grad_fn=<AddmmBackward>)
  10253. landmarks are: tensor([[[ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  10254. 0.5702],
  10255. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  10256. 0.4145],
  10257. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  10258. 0.3694],
  10259. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  10260. 0.2853],
  10261. [ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  10262. 0.2699],
  10263. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  10264. 0.1499],
  10265. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  10266. 0.1133],
  10267. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  10268. 0.1082]]], device='cuda:0')
  10269. loss_train_step before backward: tensor(0.1432, device='cuda:0', grad_fn=<MseLossBackward>)
  10270. loss_train_step after backward: tensor(0.1432, device='cuda:0', grad_fn=<MseLossBackward>)
  10271. loss_train: 3.106526607647538
  10272. step: 55
  10273. running loss: 0.05648230195722797
  10274. Train Steps: 55/90 Loss: 0.0565 torch.Size([8, 600, 800])
  10275. torch.Size([8, 8])
  10276. tensor([[0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  10277. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  10278. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  10279. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  10280. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  10281. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  10282. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  10283. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167]],
  10284. device='cuda:0', dtype=torch.float64)
  10285. predictions are: tensor([[ 1.0553e+00, -1.5796e-01, 2.0803e+00, 3.1226e-01, -3.8757e-01,
  10286. 6.7862e-01, 8.9026e-01, 1.5629e-01],
  10287. [ 1.4193e-01, -6.1169e-01, 1.3132e+00, -9.7362e-01, -2.6433e-01,
  10288. -1.0044e+00, 5.2136e-01, 2.8896e-01],
  10289. [ 9.9363e-01, -7.4630e-02, 1.8583e+00, 3.2327e-02, -3.5001e-01,
  10290. -7.8548e-01, 6.0284e-01, 1.4803e-01],
  10291. [ 5.2145e-01, -3.7143e-01, 1.2435e+00, -8.4906e-01, -4.3652e-01,
  10292. -8.5257e-01, 4.4860e-01, 3.1134e-01],
  10293. [ 1.3241e+00, -6.1965e-04, 2.0147e+00, 5.9596e-02, -4.7098e-01,
  10294. 5.4668e-01, 9.9321e-01, 1.6055e-01],
  10295. [ 4.0170e-01, -4.5806e-01, 1.1629e+00, -9.4310e-01, -3.3796e-01,
  10296. -9.8315e-01, 4.4373e-01, 2.4660e-01],
  10297. [ 5.9641e-01, -3.5358e-01, 1.0719e+00, -7.0736e-01, -5.0569e-01,
  10298. -7.0185e-01, 2.7299e-01, 3.3588e-01],
  10299. [-1.0682e+00, -1.4444e+00, 1.2887e+00, -8.3251e-01, -4.0688e-01,
  10300. -9.9458e-01, 2.4550e-01, 2.2370e-01]], device='cuda:0',
  10301. grad_fn=<AddmmBackward>)
  10302. landmarks are: tensor([[[ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  10303. 0.1082],
  10304. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  10305. 0.1698],
  10306. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  10307. 0.0081],
  10308. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  10309. 0.3546],
  10310. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  10311. 0.1715],
  10312. [ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  10313. 0.3267],
  10314. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  10315. 0.4103],
  10316. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  10317. 0.1005]]], device='cuda:0')
  10318. loss_train_step before backward: tensor(0.0860, device='cuda:0', grad_fn=<MseLossBackward>)
  10319. loss_train_step after backward: tensor(0.0860, device='cuda:0', grad_fn=<MseLossBackward>)
  10320.  
  10321. loss_train: 3.1925710681825876
  10322. step: 56
  10323. running loss: 0.05701019764611764
  10324. Train Steps: 56/90 Loss: 0.0570 torch.Size([8, 600, 800])
  10325. torch.Size([8, 8])
  10326. tensor([[0.6272, 0.4045, 0.8538, 0.5900, 0.3750, 0.4417, 0.5989, 0.4649],
  10327. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  10328. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  10329. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  10330. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  10331. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  10332. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  10333. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175]],
  10334. device='cuda:0', dtype=torch.float64)
  10335. predictions are: tensor([[ 0.7179, -0.3238, 1.7458, 0.3163, -0.5806, -0.1069, 0.5669, 0.1582],
  10336. [ 0.0706, -0.6531, 0.9820, -1.0993, -0.2456, -1.0041, 0.3436, 0.3978],
  10337. [ 0.5253, -0.4076, 1.7337, 0.1074, -0.3820, 0.2137, 0.4023, 0.2355],
  10338. [ 0.5145, -0.4474, 2.0043, -0.2206, -0.2732, -0.6411, 0.8709, 0.1705],
  10339. [ 0.6235, -0.4090, 1.7221, 0.4188, -0.5392, 0.1507, 0.6613, 0.1973],
  10340. [ 0.6203, -0.3780, 1.6743, -0.5646, -0.6705, -0.1017, 0.4486, 0.2820],
  10341. [ 0.3270, -0.5656, 1.5257, -1.1182, -0.2016, -1.1584, 0.8714, 0.2187],
  10342. [ 0.1576, -0.6544, 1.0196, -1.1413, -0.4234, -1.1670, 0.3124, 0.2487]],
  10343. device='cuda:0', grad_fn=<AddmmBackward>)
  10344. landmarks are: tensor([[[ 6.1085e-01, -4.1771e-01, 1.6575e+00, 4.3926e-01, -5.5381e-01,
  10345. -2.4588e-01, 4.8055e-01, -1.3847e-01],
  10346. [ 6.1010e-01, -3.1524e-01, 1.0166e+00, -7.5396e-01, -2.2633e-02,
  10347. -1.4468e+00, 2.8226e-01, 5.7018e-01],
  10348. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  10349. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  10350. [ 6.2236e-01, -4.3453e-01, 1.9404e+00, -2.9207e-01, -3.1709e-01,
  10351. -8.7714e-01, 1.0655e+00, 2.1421e-01],
  10352. [ 6.1201e-01, -4.3711e-01, 1.7037e+00, 4.7005e-01, -5.8268e-01,
  10353. -2.2633e-02, 5.3538e-01, -1.3313e-01],
  10354. [ 5.5196e-01, -4.2371e-01, 1.6691e+00, -7.6936e-01, -6.5774e-01,
  10355. -3.4596e-01, 3.8152e-01, 2.9299e-01],
  10356. [ 6.0855e-01, -4.0839e-01, 1.5536e+00, -1.1466e+00, -7.4596e-02,
  10357. -1.4853e+00, 6.2979e-01, 8.5142e-02],
  10358. [ 5.4648e-01, -4.2140e-01, 9.3002e-01, -1.2620e+00, -3.9215e-01,
  10359. -1.3852e+00, 2.0618e-01, 1.0428e-01]]], device='cuda:0')
  10360. loss_train_step before backward: tensor(0.0330, device='cuda:0', grad_fn=<MseLossBackward>)
  10361. loss_train_step after backward: tensor(0.0330, device='cuda:0', grad_fn=<MseLossBackward>)
  10362. loss_train: 3.2255628500133753
  10363. step: 57
  10364. running loss: 0.056588821930059215
  10365. Train Steps: 57/90 Loss: 0.0566 torch.Size([8, 600, 800])
  10366. torch.Size([8, 8])
  10367. tensor([[0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  10368. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  10369. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  10370. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  10371. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  10372. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  10373. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  10374. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235]],
  10375. device='cuda:0', dtype=torch.float64)
  10376. predictions are: tensor([[ 0.6005, -0.4291, 1.6331, 0.1981, -0.4927, 0.1141, 0.6502, 0.2158],
  10377. [ 0.3800, -0.5244, 1.5364, 0.2919, -0.3730, 0.0861, 0.3863, 0.3102],
  10378. [ 0.3911, -0.4867, 1.4536, -0.7373, -0.5116, -0.8875, 0.3204, 0.2352],
  10379. [ 0.3081, -0.5687, 1.7045, -0.6232, -0.4642, -0.9397, 0.6238, 0.1902],
  10380. [ 0.3725, -0.4843, 1.4808, 0.0960, -0.5485, -0.2804, 0.3564, 0.3270],
  10381. [ 0.3914, -0.4865, 1.5987, -1.1421, -0.3147, -0.9816, 0.8374, 0.2485],
  10382. [ 0.4910, -0.4554, 1.6362, -0.9180, -0.3677, -1.0994, 0.7497, 0.2050],
  10383. [ 0.3051, -0.6135, 1.6622, -0.1353, -0.3918, 0.2559, 0.6588, 0.2314]],
  10384. device='cuda:0', grad_fn=<AddmmBackward>)
  10385. landmarks are: tensor([[[ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  10386. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  10387. [ 5.8799e-01, -3.6051e-01, 1.7037e+00, 3.2379e-01, -2.9400e-01,
  10388. -7.6520e-02, 3.1801e-01, 3.1609e-01],
  10389. [ 5.7113e-01, -4.0146e-01, 1.6979e+00, -6.7698e-01, -5.3649e-01,
  10390. -1.0619e+00, 1.7122e-01, 1.4937e-01],
  10391. [ 6.1351e-01, -3.8406e-01, 1.8654e+00, -5.1532e-01, -4.6143e-01,
  10392. -1.0619e+00, 6.1946e-01, -4.8817e-03],
  10393. [ 5.7852e-01, -3.6867e-01, 1.6806e+00, 2.3911e-01, -5.7691e-01,
  10394. -4.6143e-01, 3.1801e-01, 4.5466e-01],
  10395. [ 6.0837e-01, -4.0762e-01, 1.6806e+00, -9.6182e-01, -2.9977e-01,
  10396. -9.6952e-01, 6.3557e-01, 1.4673e-01],
  10397. [ 6.1282e-01, -3.8283e-01, 1.7499e+00, -8.3865e-01, -3.3441e-01,
  10398. -1.2620e+00, 5.7925e-01, -2.6256e-02],
  10399. [ 5.7625e-01, -4.7064e-01, 1.7754e+00, -9.8417e-02, -3.6803e-01,
  10400. 2.3803e-01, 6.2770e-01, 1.3223e-01]]], device='cuda:0')
  10401. loss_train_step before backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  10402. loss_train_step after backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  10403. loss_train: 3.2434706911444664
  10404. step: 58
  10405. running loss: 0.05592190846800804
  10406. Train Steps: 58/90 Loss: 0.0559 torch.Size([8, 600, 800])
  10407. torch.Size([8, 8])
  10408. tensor([[0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  10409. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  10410. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  10411. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  10412. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  10413. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  10414. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  10415. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617]],
  10416. device='cuda:0', dtype=torch.float64)
  10417. predictions are: tensor([[ 0.6097, -0.3595, 1.6705, -0.0305, -0.4489, -0.0061, 0.5127, 0.2028],
  10418. [ 0.6639, -0.3332, 1.6342, -0.4861, -0.7198, -0.5016, 0.3668, 0.2877],
  10419. [ 0.5705, -0.3734, 1.9512, -0.2589, -0.3449, -1.1658, 0.9691, 0.1807],
  10420. [ 0.6820, -0.3269, 1.5413, -0.0517, -0.5332, -0.0984, 0.6546, 0.2289],
  10421. [ 0.2860, -0.6007, 1.7352, -0.1885, -0.3268, -0.1205, 0.5123, 0.2239],
  10422. [ 0.6428, -0.3875, 1.7646, -0.3212, -0.3645, 0.1299, 0.7426, 0.2294],
  10423. [-1.0394, -1.4764, 0.8833, -1.3383, -0.4541, -1.6894, 0.2561, 0.2452],
  10424. [ 0.6094, -0.3865, 1.7440, -0.0939, -0.2608, -0.1809, 0.4635, 0.2568]],
  10425. device='cuda:0', grad_fn=<AddmmBackward>)
  10426. landmarks are: tensor([[[ 0.5614, -0.4586, 1.7587, 0.0641, -0.2998, 0.1712, 0.4958,
  10427. 0.1170],
  10428. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  10429. 0.3238],
  10430. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  10431. 0.3692],
  10432. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  10433. 0.1768],
  10434. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  10435. 0.2622],
  10436. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  10437. 0.2006],
  10438. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  10439. 0.2699],
  10440. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  10441. 0.3087]]], device='cuda:0')
  10442. loss_train_step before backward: tensor(0.0746, device='cuda:0', grad_fn=<MseLossBackward>)
  10443. loss_train_step after backward: tensor(0.0746, device='cuda:0', grad_fn=<MseLossBackward>)
  10444. loss_train: 3.3181116357445717
  10445. step: 59
  10446. running loss: 0.05623918026685715
  10447. Train Steps: 59/90 Loss: 0.0562 torch.Size([8, 600, 800])
  10448. torch.Size([8, 8])
  10449. tensor([[0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  10450. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  10451. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  10452. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  10453. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  10454. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  10455. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  10456. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837]],
  10457. device='cuda:0', dtype=torch.float64)
  10458. predictions are: tensor([[ 0.5722, -0.3972, 1.2615, -0.8737, -0.5309, -0.9137, 0.4895, 0.1950],
  10459. [ 0.2688, -0.6062, 1.5072, -0.8471, -0.5606, -0.7359, 0.5700, 0.1372],
  10460. [ 0.5582, -0.3715, 1.6745, -0.5818, -0.3719, -1.0065, 0.5898, 0.1881],
  10461. [ 0.4482, -0.5203, 2.0914, 0.4037, -0.2245, 0.3096, 0.6900, 0.1714],
  10462. [ 0.6675, -0.3792, 2.0147, 0.5004, -0.4290, 0.4757, 0.7432, 0.1545],
  10463. [ 0.7220, -0.3007, 1.1824, -0.7761, -0.4194, -1.0112, 0.4273, 0.3017],
  10464. [-1.0870, -1.5275, 1.1445, -0.9036, -0.3555, -1.3402, 0.3323, 0.2497],
  10465. [ 0.6270, -0.3712, 1.2397, -0.6168, -0.5985, -0.6370, 0.3945, 0.3137]],
  10466. device='cuda:0', grad_fn=<AddmmBackward>)
  10467. landmarks are: tensor([[[ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  10468. 0.0862],
  10469. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  10470. -0.0108],
  10471. [ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  10472. 0.2134],
  10473. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  10474. 0.3392],
  10475. [ 0.5784, -0.4088, 1.7268, 0.0467, -0.3344, 0.0697, 0.5490,
  10476. 0.2545],
  10477. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  10478. 0.3808],
  10479. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  10480. 0.3469],
  10481. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  10482. 0.4103]]], device='cuda:0')
  10483. loss_train_step before backward: tensor(0.0950, device='cuda:0', grad_fn=<MseLossBackward>)
  10484.  
  10485. loss_train_step after backward: tensor(0.0950, device='cuda:0', grad_fn=<MseLossBackward>)
  10486. loss_train: 3.413125194609165
  10487. step: 60
  10488. running loss: 0.05688541991015275
  10489. Train Steps: 60/90 Loss: 0.0569 torch.Size([8, 600, 800])
  10490. torch.Size([8, 8])
  10491. tensor([[0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  10492. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  10493. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  10494. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  10495. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  10496. [0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  10497. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  10498. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783]],
  10499. device='cuda:0', dtype=torch.float64)
  10500. predictions are: tensor([[ 0.4477, -0.4989, 1.0241, -1.1866, -0.4538, -1.1541, 0.3545, 0.2349],
  10501. [ 0.5304, -0.4797, 1.9840, -0.0666, -0.5513, -0.0591, 0.9308, 0.1303],
  10502. [ 0.3024, -0.5637, 1.5836, -0.9812, -0.3989, -1.0223, 0.4467, 0.1653],
  10503. [ 0.1767, -0.6606, 1.9765, -0.0760, -0.2892, -0.9039, 0.8481, 0.2020],
  10504. [ 0.3131, -0.5527, 1.3676, -0.6091, -0.6676, -0.2343, 0.2590, 0.2547],
  10505. [ 0.3597, -0.5725, 1.6503, 0.4191, -0.3494, 0.0670, 0.4046, 0.2217],
  10506. [ 0.6185, -0.4473, 1.8138, 0.3166, -0.5707, -0.0937, 0.6552, 0.1352],
  10507. [ 0.1686, -0.6116, 1.1855, -1.0051, -0.2213, -1.1281, 0.3396, 0.3605]],
  10508. device='cuda:0', grad_fn=<AddmmBackward>)
  10509. landmarks are: tensor([[[ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  10510. 0.2576],
  10511. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  10512. 0.2516],
  10513. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  10514. 0.0851],
  10515. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  10516. 0.3692],
  10517. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  10518. 0.2386],
  10519. [ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  10520. -0.0911],
  10521. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  10522. 0.0291],
  10523. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  10524. 0.3854]]], device='cuda:0')
  10525. loss_train_step before backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  10526. loss_train_step after backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  10527. loss_train: 3.433107813820243
  10528. step: 61
  10529. running loss: 0.05628045596426628
  10530. Train Steps: 61/90 Loss: 0.0563 torch.Size([8, 600, 800])
  10531. torch.Size([8, 8])
  10532. tensor([[0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  10533. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  10534. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  10535. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  10536. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  10537. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  10538. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  10539. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689]],
  10540. device='cuda:0', dtype=torch.float64)
  10541. predictions are: tensor([[ 0.1825, -0.7061, 1.7562, -0.5810, -0.2417, -0.6851, 0.8891, 0.1766],
  10542. [ 0.5891, -0.4146, 1.3659, -0.8705, -0.2362, -1.3972, 0.5131, 0.2131],
  10543. [ 0.7430, -0.3105, 1.0501, -0.8250, -0.3662, -1.2392, 0.3054, 0.2914],
  10544. [ 0.6278, -0.3860, 1.5139, -0.6035, -0.6098, -0.5631, 0.4918, 0.1655],
  10545. [ 0.0770, -0.7091, 1.4412, -0.5819, -0.5632, -0.9197, 0.1810, 0.1949],
  10546. [ 0.3116, -0.6728, 1.9799, 0.2008, -0.3828, 0.4249, 0.8613, 0.1679],
  10547. [-0.1072, -0.8606, 1.7340, -0.0695, -0.4591, -0.2890, 0.4195, 0.2378],
  10548. [ 0.4073, -0.5107, 1.4580, -0.4866, -0.6220, -0.3523, 0.3635, 0.2498]],
  10549. device='cuda:0', grad_fn=<AddmmBackward>)
  10550. landmarks are: tensor([[[ 0.6224, -0.4105, 1.9173, -0.7771, -0.1030, -0.7308, 1.1532,
  10551. 0.1875],
  10552. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  10553. 0.2442],
  10554. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  10555. 0.3808],
  10556. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  10557. 0.0942],
  10558. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  10559. 0.2776],
  10560. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  10561. 0.1082],
  10562. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  10563. 0.4145],
  10564. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  10565. 0.3417]]], device='cuda:0')
  10566. loss_train_step before backward: tensor(0.0419, device='cuda:0', grad_fn=<MseLossBackward>)
  10567. loss_train_step after backward: tensor(0.0419, device='cuda:0', grad_fn=<MseLossBackward>)
  10568. loss_train: 3.4750487077981234
  10569. step: 62
  10570. running loss: 0.056049172706421346
  10571. Train Steps: 62/90 Loss: 0.0560 torch.Size([8, 600, 800])
  10572. torch.Size([8, 8])
  10573. tensor([[0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  10574. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  10575. [0.6203, 0.4021, 0.8780, 0.5031, 0.3667, 0.3882, 0.5842, 0.5405],
  10576. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  10577. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  10578. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  10579. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  10580. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272]],
  10581. device='cuda:0', dtype=torch.float64)
  10582. predictions are: tensor([[ 0.5372, -0.4427, 1.7632, 0.0029, -0.1842, -0.0286, 0.4543, 0.2477],
  10583. [ 0.7022, -0.3753, 2.0274, -0.0909, -0.5449, -0.0211, 0.7920, 0.0436],
  10584. [ 0.8202, -0.2692, 1.8586, 0.2130, -0.6447, -0.3823, 0.6089, 0.0845],
  10585. [-1.2660, -1.6953, 0.9615, -1.1883, -0.3203, -1.5984, 0.1894, 0.2762],
  10586. [ 0.4728, -0.4804, 1.6838, -0.2210, -0.3768, 0.2081, 0.5723, 0.2581],
  10587. [ 0.0046, -0.7779, 1.0222, -0.8906, -0.4931, -1.0298, 0.2306, 0.3229],
  10588. [ 1.1376, -0.0465, 1.2655, -0.9522, -0.3285, -1.1190, 0.5421, 0.3597],
  10589. [ 0.4906, -0.4482, 1.6257, -0.5826, -0.4980, -1.0188, 0.3590, 0.1793]],
  10590. device='cuda:0', grad_fn=<AddmmBackward>)
  10591. landmarks are: tensor([[[ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  10592. 0.3007],
  10593. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  10594. -0.0490],
  10595. [ 0.5791, -0.4289, 1.7694, 0.0379, -0.5923, -0.4927, 0.4126,
  10596. 0.2107],
  10597. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  10598. 0.3469],
  10599. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  10600. 0.3047],
  10601. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  10602. 0.4085],
  10603. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  10604. 0.6084],
  10605. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  10606. 0.1494]]], device='cuda:0')
  10607. loss_train_step before backward: tensor(0.0488, device='cuda:0', grad_fn=<MseLossBackward>)
  10608. loss_train_step after backward: tensor(0.0488, device='cuda:0', grad_fn=<MseLossBackward>)
  10609. loss_train: 3.523830173537135
  10610. step: 63
  10611. running loss: 0.055933812278367225
  10612. Train Steps: 63/90 Loss: 0.0559 torch.Size([8, 600, 800])
  10613. torch.Size([8, 8])
  10614. tensor([[0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  10615. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  10616. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  10617. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  10618. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  10619. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993],
  10620. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  10621. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344]],
  10622. device='cuda:0', dtype=torch.float64)
  10623. predictions are: tensor([[ 0.2926, -0.6040, 1.6742, -0.2913, -0.0972, -0.4117, 0.4652, 0.2531],
  10624. [ 0.4361, -0.5205, 1.5725, 0.0129, -0.3745, -0.1130, 0.4582, 0.2891],
  10625. [ 0.4407, -0.5717, 1.6980, -0.5028, -0.3800, 0.0268, 0.6957, 0.2434],
  10626. [ 0.6617, -0.4029, 1.7236, -0.1642, -0.4997, -0.3592, 0.7090, 0.1786],
  10627. [ 0.1602, -0.6668, 1.5842, -0.4179, -0.6784, -0.8125, 0.2578, 0.2007],
  10628. [ 0.6501, -0.3948, 0.9773, -1.4541, -0.3942, -1.6491, 0.1857, 0.2270],
  10629. [ 0.2614, -0.6123, 1.6131, -0.0798, -0.4499, -0.5095, 0.4385, 0.2353],
  10630. [ 0.2661, -0.6166, 1.6872, -0.4090, -0.5893, -0.7739, 0.3292, 0.1672]],
  10631. device='cuda:0', grad_fn=<AddmmBackward>)
  10632. landmarks are: tensor([[[ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  10633. 0.0862],
  10634. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  10635. 0.3007],
  10636. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  10637. 0.1082],
  10638. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  10639. 0.0851],
  10640. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  10641. 0.2071],
  10642. [ 0.5384, -0.4393, 0.9762, -1.1851, -0.4210, -1.3852, 0.1712,
  10643. 0.0201],
  10644. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  10645. 0.2391],
  10646. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  10647. 0.1824]]], device='cuda:0')
  10648. loss_train_step before backward: tensor(0.0479, device='cuda:0', grad_fn=<MseLossBackward>)
  10649. loss_train_step after backward: tensor(0.0479, device='cuda:0', grad_fn=<MseLossBackward>)
  10650. loss_train: 3.5717637445777655
  10651. step: 64
  10652. running loss: 0.055808808509027585
  10653.  
  10654. Train Steps: 64/90 Loss: 0.0558 torch.Size([8, 600, 800])
  10655. torch.Size([8, 8])
  10656. tensor([[0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  10657. [0.6110, 0.4047, 0.8700, 0.4483, 0.3713, 0.3967, 0.5088, 0.5517],
  10658. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  10659. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  10660. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  10661. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  10662. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  10663. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791]],
  10664. device='cuda:0', dtype=torch.float64)
  10665. predictions are: tensor([[ 0.1179, -0.7341, 0.9864, -1.3143, -0.3100, -1.6252, 0.2862, 0.2487],
  10666. [-0.0459, -0.8347, 1.5879, -0.2601, -0.5802, -0.5579, 0.1200, 0.2064],
  10667. [ 0.1300, -0.7234, 1.6999, -0.2421, -0.2803, -0.0950, 0.4022, 0.2162],
  10668. [ 0.7086, -0.3531, 1.8816, -0.3375, -0.4554, -0.5277, 0.5610, 0.2529],
  10669. [ 0.6942, -0.3544, 1.5433, -0.5519, -0.6117, -0.6795, 0.2996, 0.1721],
  10670. [ 0.4877, -0.4784, 1.4619, -0.0209, -0.3364, -0.2908, 0.5970, 0.2885],
  10671. [ 0.5985, -0.3888, 1.0590, -1.0507, -0.5366, -0.9573, 0.2380, 0.2933],
  10672. [ 0.4173, -0.5434, 1.8164, -0.0607, -0.3924, -0.0882, 0.5622, 0.1204]],
  10673. device='cuda:0', grad_fn=<AddmmBackward>)
  10674. landmarks are: tensor([[[ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  10675. 0.2906],
  10676. [ 0.5363, -0.4168, 1.7326, -0.2151, -0.5711, -0.4537, 0.0640,
  10677. 0.2622],
  10678. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  10679. 0.2545],
  10680. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  10681. 0.3238],
  10682. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  10683. -0.1151],
  10684. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  10685. 0.3585],
  10686. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  10687. 0.3315],
  10688. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  10689. -0.0731]]], device='cuda:0')
  10690. loss_train_step before backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  10691. loss_train_step after backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  10692. loss_train: 3.6078634057193995
  10693. step: 65
  10694. running loss: 0.05550559085722153
  10695. Train Steps: 65/90 Loss: 0.0555 torch.Size([8, 600, 800])
  10696. torch.Size([8, 8])
  10697. tensor([[0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  10698. [0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  10699. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  10700. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  10701. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  10702. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  10703. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  10704. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950]],
  10705. device='cuda:0', dtype=torch.float64)
  10706. predictions are: tensor([[ 0.6163, -0.4138, 1.7250, -0.3640, -0.5013, -0.7299, 0.5247, 0.1902],
  10707. [ 0.5455, -0.4279, 1.6308, -0.4267, -0.2563, -0.1842, 0.3521, 0.2184],
  10708. [ 0.4818, -0.4494, 1.5292, -0.1557, -0.1983, -0.3982, 0.2413, 0.2642],
  10709. [ 0.6494, -0.3782, 1.5309, -0.6403, -0.3890, -0.0985, 0.4624, 0.2583],
  10710. [ 0.2372, -0.6260, 1.3226, -0.8351, -0.6079, -0.6038, 0.2684, 0.2611],
  10711. [-0.0703, -0.8515, 1.4496, -0.6823, -0.6232, -1.0105, 0.1126, 0.2541],
  10712. [ 0.3390, -0.5573, 1.5586, -0.0887, -0.4338, -0.5858, 0.3697, 0.2282],
  10713. [ 0.6466, -0.4126, 1.6265, -0.0297, -0.4755, -0.4721, 0.5771, 0.1254]],
  10714. device='cuda:0', grad_fn=<AddmmBackward>)
  10715. landmarks are: tensor([[[ 6.0964e-01, -4.0462e-01, 1.8249e+00, -7.2363e-03, -6.1155e-01,
  10716. -3.5366e-01, 6.1824e-01, 9.2841e-02],
  10717. [ 5.6449e-01, -3.7968e-01, 1.8249e+00, -6.8822e-02, -2.8822e-01,
  10718. 3.8537e-01, 3.7891e-01, 6.5205e-02],
  10719. [ 5.4475e-01, -3.8383e-01, 1.7037e+00, 1.7752e-01, -1.4965e-01,
  10720. 1.4673e-01, 1.1283e-01, 2.4313e-01],
  10721. [ 5.4169e-01, -4.3549e-01, 1.8018e+00, -3.3826e-01, -3.9792e-01,
  10722. 2.6220e-01, 5.1432e-01, 2.6220e-01],
  10723. [ 5.3672e-01, -4.2941e-01, 1.5709e+00, -4.9992e-01, -6.6928e-01,
  10724. -3.0747e-01, 2.4546e-01, 3.5585e-01],
  10725. [ 5.6969e-01, -4.1132e-01, 1.7499e+00, -2.7667e-01, -6.4042e-01,
  10726. -7.1547e-01, 1.5756e-01, 4.0319e-01],
  10727. [ 6.1149e-01, -3.7244e-01, 1.7557e+00, 3.4688e-01, -4.4411e-01,
  10728. -1.0731e-01, 4.9122e-01, 2.3911e-01],
  10729. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  10730. -9.1917e-02, 6.7064e-01, 4.6189e-04]]], device='cuda:0')
  10731. loss_train_step before backward: tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward>)
  10732. loss_train_step after backward: tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward>)
  10733. loss_train: 3.6683297883719206
  10734. step: 66
  10735. running loss: 0.055580754369271526
  10736. Train Steps: 66/90 Loss: 0.0556 torch.Size([8, 600, 800])
  10737. torch.Size([8, 8])
  10738. tensor([[0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  10739. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  10740. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  10741. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  10742. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  10743. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  10744. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  10745. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483]],
  10746. device='cuda:0', dtype=torch.float64)
  10747. predictions are: tensor([[ 0.3850, -0.5190, 1.6111, 0.1055, -0.3750, -0.2330, 0.2022, 0.1973],
  10748. [ 0.3577, -0.5619, 1.4013, -1.0461, -0.6647, -0.5698, 0.4761, 0.2041],
  10749. [ 0.6324, -0.3384, 1.5729, -0.1080, -0.1719, -0.2944, 0.2511, 0.2831],
  10750. [ 0.1516, -0.6485, 1.5047, 0.1610, -0.4048, -0.4003, 0.2617, 0.3252],
  10751. [ 0.3335, -0.5744, 1.6998, -0.5424, -0.5618, -0.9373, 0.3913, 0.1944],
  10752. [ 0.6777, -0.3749, 1.0782, -1.4071, -0.6146, -1.0976, 0.3684, 0.1518],
  10753. [ 0.3836, -0.5650, 1.5613, 0.1353, -0.2767, -0.2953, 0.2244, 0.2116],
  10754. [ 0.7497, -0.3079, 1.7789, -0.4326, -0.5525, -0.0923, 0.4460, 0.1365]],
  10755. device='cuda:0', grad_fn=<AddmmBackward>)
  10756. landmarks are: tensor([[[ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  10757. 0.2048],
  10758. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  10759. 0.2391],
  10760. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  10761. 0.4239],
  10762. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  10763. 0.4470],
  10764. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  10765. 0.2203],
  10766. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  10767. 0.0622],
  10768. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  10769. -0.0610],
  10770. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  10771. 0.2468]]], device='cuda:0')
  10772. loss_train_step before backward: tensor(0.0281, device='cuda:0', grad_fn=<MseLossBackward>)
  10773. loss_train_step after backward: tensor(0.0281, device='cuda:0', grad_fn=<MseLossBackward>)
  10774. loss_train: 3.6964302863925695
  10775. step: 67
  10776. running loss: 0.05517060128944134
  10777. Train Steps: 67/90 Loss: 0.0552 torch.Size([8, 600, 800])
  10778. torch.Size([8, 8])
  10779. tensor([[0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  10780. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  10781. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  10782. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  10783. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  10784. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  10785. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  10786. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611]],
  10787. device='cuda:0', dtype=torch.float64)
  10788. predictions are: tensor([[ 1.0962, -0.0146, 1.2800, -0.4273, -0.4927, -0.5402, 0.3793, 0.2654],
  10789. [ 1.1303, 0.0088, 1.7883, 0.1866, -0.6208, -0.2242, 0.3961, 0.1948],
  10790. [-0.9555, -1.3945, 0.9320, -1.0741, -0.2958, -1.0923, 0.1046, 0.3117],
  10791. [-0.2414, -0.9752, 1.8767, -0.6888, -0.1368, -0.7230, 0.9422, 0.2153],
  10792. [ 1.2111, 0.0026, 1.0614, -0.9498, -0.4365, -1.0711, 0.2465, 0.1665],
  10793. [-0.9628, -1.4400, 1.3093, -0.5955, -0.5826, -0.5954, -0.0528, 0.1944],
  10794. [ 0.7971, -0.2340, 1.3919, -0.7441, -0.5827, -0.6364, 0.2316, 0.2503],
  10795. [ 1.2873, 0.0838, 1.7751, 0.3542, -0.3632, 0.3964, 0.1676, 0.1421]],
  10796. device='cuda:0', grad_fn=<AddmmBackward>)
  10797. landmarks are: tensor([[[ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  10798. 0.3469],
  10799. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  10800. 0.3777],
  10801. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  10802. 0.3084],
  10803. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  10804. 0.2676],
  10805. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  10806. 0.0213],
  10807. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  10808. 0.1133],
  10809. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  10810. 0.3392],
  10811. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  10812. 0.3057]]], device='cuda:0')
  10813. loss_train_step before backward: tensor(0.2376, device='cuda:0', grad_fn=<MseLossBackward>)
  10814. loss_train_step after backward: tensor(0.2376, device='cuda:0', grad_fn=<MseLossBackward>)
  10815. loss_train: 3.9340319838374853
  10816. step: 68
  10817. running loss: 0.05785341152702184
  10818.  
  10819. Train Steps: 68/90 Loss: 0.0579 torch.Size([8, 600, 800])
  10820. torch.Size([8, 8])
  10821. tensor([[0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  10822. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  10823. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  10824. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  10825. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  10826. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  10827. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  10828. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133]],
  10829. device='cuda:0', dtype=torch.float64)
  10830. predictions are: tensor([[ 0.9220, -0.1580, 1.0716, -1.1080, -0.4721, -0.9665, 0.4439, 0.2881],
  10831. [ 0.9092, -0.1540, 1.7848, 0.5763, -0.4562, 0.3608, 0.1721, 0.1350],
  10832. [ 1.0781, -0.0502, 1.5693, -0.8404, -0.4444, -0.5808, 0.4128, 0.2579],
  10833. [ 0.7694, -0.1921, 1.6814, 0.1707, -0.6954, -0.4038, 0.1699, 0.1999],
  10834. [-1.3740, -1.7090, 1.0674, -0.9417, -0.4480, -0.9951, 0.0507, 0.2347],
  10835. [ 0.7294, -0.2306, 1.4294, -0.7451, -0.2152, -0.9191, 0.3202, 0.2228],
  10836. [-0.9718, -1.4156, 0.8144, -1.1385, -0.3027, -1.2208, 0.0989, 0.3416],
  10837. [ 1.0325, -0.1115, 1.8781, 0.3365, -0.4912, 0.4340, 0.5514, 0.0747]],
  10838. device='cuda:0', grad_fn=<AddmmBackward>)
  10839. landmarks are: tensor([[[ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  10840. 0.3161],
  10841. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  10842. 0.2048],
  10843. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  10844. 0.3392],
  10845. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  10846. 0.3778],
  10847. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  10848. 0.2183],
  10849. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  10850. 0.2083],
  10851. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  10852. 0.3700],
  10853. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  10854. 0.0851]]], device='cuda:0')
  10855. loss_train_step before backward: tensor(0.1133, device='cuda:0', grad_fn=<MseLossBackward>)
  10856. loss_train_step after backward: tensor(0.1133, device='cuda:0', grad_fn=<MseLossBackward>)
  10857. loss_train: 4.047340488061309
  10858. step: 69
  10859. running loss: 0.05865710852262766
  10860. Train Steps: 69/90 Loss: 0.0587 torch.Size([8, 600, 800])
  10861. torch.Size([8, 8])
  10862. tensor([[0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  10863. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  10864. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  10865. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  10866. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  10867. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  10868. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  10869. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317]],
  10870. device='cuda:0', dtype=torch.float64)
  10871. predictions are: tensor([[ 0.5268, -0.4157, 1.5812, -0.0265, -0.1701, -0.2196, 0.0827, 0.2199],
  10872. [ 0.4279, -0.4902, 1.4951, 0.0641, -0.5407, -0.0932, 0.2282, 0.2088],
  10873. [ 0.0935, -0.7143, 1.5847, -0.2925, -0.2550, -0.1841, 0.1801, 0.1760],
  10874. [ 0.5612, -0.4071, 1.5233, -0.3984, -0.5938, -0.1783, 0.2074, 0.2572],
  10875. [ 0.4294, -0.4534, 1.4494, -0.5346, -0.3546, 0.1353, 0.2257, 0.2259],
  10876. [ 0.4408, -0.4619, 1.5718, -0.1829, -0.6354, -0.6182, 0.2701, 0.2355],
  10877. [ 0.2905, -0.6043, 1.6711, -1.0866, -0.3326, -1.1208, 0.8237, 0.2227],
  10878. [ 0.6131, -0.3707, 1.5938, 0.0196, -0.6678, -0.7217, 0.3395, 0.1753]],
  10879. device='cuda:0', grad_fn=<AddmmBackward>)
  10880. landmarks are: tensor([[[ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  10881. 0.1544],
  10882. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  10883. 0.1544],
  10884. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  10885. -0.0039],
  10886. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  10887. 0.3161],
  10888. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  10889. 0.2936],
  10890. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  10891. 0.2545],
  10892. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  10893. 0.3050],
  10894. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  10895. 0.1698]]], device='cuda:0')
  10896. loss_train_step before backward: tensor(0.0292, device='cuda:0', grad_fn=<MseLossBackward>)
  10897. loss_train_step after backward: tensor(0.0292, device='cuda:0', grad_fn=<MseLossBackward>)
  10898. loss_train: 4.076580006629229
  10899. step: 70
  10900. running loss: 0.05823685723756041
  10901. Train Steps: 70/90 Loss: 0.0582 torch.Size([8, 600, 800])
  10902. torch.Size([8, 8])
  10903. tensor([[0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  10904. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  10905. [0.6086, 0.3998, 0.8788, 0.4450, 0.4025, 0.4650, 0.5306, 0.5103],
  10906. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  10907. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  10908. [0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378],
  10909. [0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  10910. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412]],
  10911. device='cuda:0', dtype=torch.float64)
  10912. predictions are: tensor([[ 0.0387, -0.7622, 1.2751, -0.9462, -0.5724, -1.0365, 0.1144, 0.2447],
  10913. [ 0.3928, -0.5237, 1.6429, -0.0807, -0.3716, -0.0862, 0.2124, 0.1810],
  10914. [ 0.3224, -0.5755, 1.7140, -0.3758, -0.4884, -0.1473, 0.1929, 0.1669],
  10915. [ 0.5737, -0.3796, 1.5390, -0.4548, -0.5041, -0.2859, 0.1710, 0.2812],
  10916. [ 0.4217, -0.4986, 1.6079, 0.0801, -0.4330, -0.0176, 0.3749, 0.2277],
  10917. [ 0.2513, -0.5825, 1.6658, 0.0256, -0.5307, -0.3036, 0.2110, 0.2185],
  10918. [ 0.7274, -0.3245, 1.5881, -0.7377, -0.4621, -1.0521, 0.7483, 0.1522],
  10919. [ 0.5020, -0.4279, 1.5960, 0.1977, -0.1573, -0.0532, 0.2000, 0.2492]],
  10920. device='cuda:0', grad_fn=<AddmmBackward>)
  10921. landmarks are: tensor([[[ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  10922. 0.2138],
  10923. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  10924. 0.1854],
  10925. [ 0.5253, -0.4392, 1.7730, -0.2305, -0.4268, -0.1381, 0.1651,
  10926. 0.0712],
  10927. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  10928. 0.4145],
  10929. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  10930. 0.1544],
  10931. [ 0.5435, -0.4045, 1.7557, 0.0851, -0.5307, -0.2844, 0.0172,
  10932. 0.1980],
  10933. [ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  10934. 0.0539],
  10935. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  10936. 0.2138]]], device='cuda:0')
  10937. loss_train_step before backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  10938. loss_train_step after backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  10939. loss_train: 4.095911048352718
  10940. step: 71
  10941. running loss: 0.05768888800496787
  10942. Train Steps: 71/90 Loss: 0.0577 torch.Size([8, 600, 800])
  10943. torch.Size([8, 8])
  10944. tensor([[0.6277, 0.4013, 0.8888, 0.4767, 0.3600, 0.3567, 0.6148, 0.4672],
  10945. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  10946. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  10947. [0.6151, 0.4058, 0.7068, 0.2680, 0.3400, 0.4083, 0.5775, 0.5733],
  10948. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  10949. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  10950. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  10951. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012]],
  10952. device='cuda:0', dtype=torch.float64)
  10953. predictions are: tensor([[ 0.5969, -0.4272, 1.8214, -0.2437, -0.6127, -0.7385, 0.4143, 0.1130],
  10954. [ 0.2856, -0.6078, 1.3131, -1.0711, -0.6239, -0.5276, 0.3054, 0.2557],
  10955. [ 0.5606, -0.4006, 1.7808, 0.4420, -0.3751, -0.0319, 0.2513, 0.2444],
  10956. [ 0.3458, -0.5758, 1.1444, -1.0937, -0.6510, -0.5539, 0.1815, 0.3004],
  10957. [ 0.5171, -0.4272, 1.7789, 0.4450, -0.2649, 0.0206, 0.1874, 0.2545],
  10958. [ 0.3801, -0.5404, 1.8297, -0.2141, -0.4082, 0.2344, 0.2679, 0.1173],
  10959. [ 0.0454, -0.7213, 1.2479, -0.9528, -0.0633, -1.2849, 0.2315, 0.3592],
  10960. [ 0.6147, -0.4189, 1.8836, 0.2746, -0.5885, -0.2440, 0.4363, 0.1093]],
  10961. device='cuda:0', grad_fn=<AddmmBackward>)
  10962. landmarks are: tensor([[[ 0.6132, -0.4324, 1.8192, -0.0842, -0.6231, -0.6385, 0.5537,
  10963. -0.1278],
  10964. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  10965. 0.2545],
  10966. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  10967. 0.3007],
  10968. [ 0.5552, -0.4113, 0.9790, -1.0480, -0.7155, -0.3998, 0.3815,
  10969. 0.3623],
  10970. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  10971. 0.3161],
  10972. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  10973. -0.0322],
  10974. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  10975. 0.5624],
  10976. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  10977. 0.0291]]], device='cuda:0')
  10978. loss_train_step before backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  10979. loss_train_step after backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  10980. loss_train: 4.11814627237618
  10981. step: 72
  10982. running loss: 0.05719647600522472
  10983.  
  10984. Train Steps: 72/90 Loss: 0.0572 torch.Size([8, 600, 800])
  10985. torch.Size([8, 8])
  10986. tensor([[0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915],
  10987. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  10988. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  10989. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  10990. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  10991. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  10992. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402],
  10993. [0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471]],
  10994. device='cuda:0', dtype=torch.float64)
  10995. predictions are: tensor([[ 0.6401, -0.3275, 1.9039, 0.0135, -0.5674, -0.7047, 0.5180, 0.0962],
  10996. [ 0.5311, -0.3679, 1.7335, 0.1201, -0.2505, 0.2096, 0.0463, 0.1490],
  10997. [ 0.7563, -0.2695, 1.7467, -0.0610, -0.3387, 0.3851, 0.3857, 0.1715],
  10998. [-1.4279, -1.7449, 0.9868, -1.1764, -0.1548, -1.2947, 0.2669, 0.3564],
  10999. [ 0.2403, -0.5642, 1.0672, -0.7588, -0.5522, -0.9347, 0.0379, 0.3111],
  11000. [ 0.7850, -0.2328, 1.5708, -0.5475, -0.5102, -0.8937, 0.2295, 0.2070],
  11001. [ 0.9283, -0.1462, 1.5625, 0.1236, -0.4814, -0.0100, 0.1466, 0.2467],
  11002. [ 0.2391, -0.6283, 1.9438, -0.2441, -0.3081, -0.1375, 0.7502, 0.2023]],
  11003. device='cuda:0', grad_fn=<AddmmBackward>)
  11004. landmarks are: tensor([[[ 0.6148, -0.3918, 1.8942, -0.1920, -0.5423, -0.8002, 0.6414,
  11005. -0.0156],
  11006. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  11007. 0.0682],
  11008. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  11009. 0.2314],
  11010. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  11011. 0.3623],
  11012. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  11013. 0.3931],
  11014. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  11015. 0.1494],
  11016. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  11017. 0.2093],
  11018. [ 0.6454, -0.3623, 1.9346, -0.4460, -0.4961, -0.2921, 1.1642,
  11019. 0.2409]]], device='cuda:0')
  11020. loss_train_step before backward: tensor(0.0410, device='cuda:0', grad_fn=<MseLossBackward>)
  11021. loss_train_step after backward: tensor(0.0410, device='cuda:0', grad_fn=<MseLossBackward>)
  11022. loss_train: 4.15917850472033
  11023. step: 73
  11024. running loss: 0.05697504800986754
  11025. Train Steps: 73/90 Loss: 0.0570 torch.Size([8, 600, 800])
  11026. torch.Size([8, 8])
  11027. tensor([[0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  11028. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  11029. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  11030. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  11031. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  11032. [0.6300, 0.4102, 0.9088, 0.4433, 0.4088, 0.3067, 0.6820, 0.5540],
  11033. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  11034. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136]],
  11035. device='cuda:0', dtype=torch.float64)
  11036. predictions are: tensor([[ 0.0255, -0.7414, 1.0145, -1.0360, -0.3244, -1.0102, 0.2996, 0.3519],
  11037. [ 0.1935, -0.6416, 0.8982, -0.9045, -0.4853, -0.9969, 0.0657, 0.2896],
  11038. [ 0.5508, -0.4163, 1.8753, -0.2968, -0.3653, -0.9057, 0.3999, 0.1318],
  11039. [ 0.9391, -0.2031, 1.1864, -0.7964, -0.4275, -0.8836, 0.3701, 0.3034],
  11040. [ 0.3174, -0.5763, 1.8704, 0.0961, -0.6383, -0.0635, 0.1696, 0.1344],
  11041. [ 0.0848, -0.7070, 2.0174, -0.0102, -0.3566, -0.5104, 0.5992, 0.1564],
  11042. [ 0.4316, -0.5112, 1.8690, 0.0852, -0.5426, 0.1211, 0.4263, 0.1277],
  11043. [ 0.3346, -0.5371, 1.7998, 0.2516, -0.0975, 0.4123, 0.1748, 0.1796]],
  11044. device='cuda:0', grad_fn=<AddmmBackward>)
  11045. landmarks are: tensor([[[ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  11046. 0.2622],
  11047. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  11048. 0.3546],
  11049. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  11050. -0.0529],
  11051. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  11052. 0.3854],
  11053. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  11054. 0.0919],
  11055. [ 0.6240, -0.3912, 1.9115, -0.2382, -0.3979, -0.8694, 0.8644,
  11056. 0.2730],
  11057. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  11058. 0.1779],
  11059. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  11060. 0.0862]]], device='cuda:0')
  11061. loss_train_step before backward: tensor(0.0431, device='cuda:0', grad_fn=<MseLossBackward>)
  11062. loss_train_step after backward: tensor(0.0431, device='cuda:0', grad_fn=<MseLossBackward>)
  11063. loss_train: 4.202301474288106
  11064. step: 74
  11065. running loss: 0.05678785776065008
  11066. Train Steps: 74/90 Loss: 0.0568 torch.Size([8, 600, 800])
  11067. torch.Size([8, 8])
  11068. tensor([[0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  11069. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  11070. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  11071. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  11072. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  11073. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  11074. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  11075. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383]],
  11076. device='cuda:0', dtype=torch.float64)
  11077. predictions are: tensor([[ 0.7725, -0.2617, 1.3868, -1.0722, -0.2079, -1.3805, 0.5797, 0.2321],
  11078. [ 0.7794, -0.2949, 1.9241, 0.0387, -0.4490, 0.2553, 0.8479, 0.1340],
  11079. [ 0.8670, -0.1966, 1.7308, 0.3913, -0.4143, -0.0618, 0.3734, 0.2194],
  11080. [ 0.5301, -0.4200, 1.6865, -0.3245, -0.6355, -0.6120, 0.1663, 0.2268],
  11081. [ 0.5905, -0.3883, 1.7943, -0.0852, -0.4299, 0.0460, 0.2930, 0.1580],
  11082. [-1.6482, -1.9028, 1.1660, -1.1783, -0.2913, -1.2421, 0.1438, 0.2935],
  11083. [ 0.5850, -0.3715, 1.7286, 0.1431, -0.5558, -0.2252, 0.1153, 0.2125],
  11084. [ 0.5957, -0.3554, 1.7312, -0.0205, -0.2870, -0.0232, 0.1938, 0.1764]],
  11085. device='cuda:0', grad_fn=<AddmmBackward>)
  11086. landmarks are: tensor([[[ 6.1577e-01, -4.2249e-01, 1.3307e+00, -1.3253e+00, -1.9244e-01,
  11087. -1.3252e+00, 6.7213e-01, 1.7271e-01],
  11088. [ 6.4212e-01, -3.6953e-01, 1.7788e+00, 2.3557e-02, -4.8453e-01,
  11089. 1.5443e-01, 1.1971e+00, 2.1955e-01],
  11090. [ 5.8909e-01, -3.5574e-01, 1.7326e+00, 3.3918e-01, -4.2102e-01,
  11091. -1.2271e-01, 3.2379e-01, 3.0069e-01],
  11092. [ 5.6969e-01, -4.1132e-01, 1.7499e+00, -2.7667e-01, -6.4042e-01,
  11093. -7.1547e-01, 1.5756e-01, 4.0319e-01],
  11094. [ 5.2500e-01, -4.6613e-01, 1.7383e+00, -7.6520e-02, -4.2679e-01,
  11095. -2.2633e-02, 2.5348e-01, 2.0347e-01],
  11096. [-2.2859e+00, -2.2859e+00, 9.0115e-01, -1.4006e+00, -4.6721e-01,
  11097. -1.1928e+00, 1.3421e-01, 1.3734e-01],
  11098. [ 5.4515e-01, -4.0670e-01, 1.7557e+00, 5.4350e-02, -4.9607e-01,
  11099. -3.3056e-01, 1.3228e-01, 4.3063e-01],
  11100. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  11101. -6.8822e-02, 2.3086e-01, 2.0046e-01]]], device='cuda:0')
  11102. loss_train_step before backward: tensor(0.0209, device='cuda:0', grad_fn=<MseLossBackward>)
  11103. loss_train_step after backward: tensor(0.0209, device='cuda:0', grad_fn=<MseLossBackward>)
  11104. loss_train: 4.223247792571783
  11105. step: 75
  11106. running loss: 0.056309970567623775
  11107. Train Steps: 75/90 Loss: 0.0563 torch.Size([8, 600, 800])
  11108. torch.Size([8, 8])
  11109. tensor([[0.6199, 0.4065, 0.7598, 0.2385, 0.4317, 0.1981, 0.5933, 0.5221],
  11110. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  11111. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  11112. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  11113. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  11114. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  11115. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  11116. [0.6216, 0.4100, 0.7350, 0.2067, 0.4325, 0.2050, 0.5950, 0.5333]],
  11117. device='cuda:0', dtype=torch.float64)
  11118. predictions are: tensor([[ 0.7325, -0.3244, 1.1943, -0.8618, -0.3379, -0.9226, 0.3813, 0.1958],
  11119. [ 0.6158, -0.3913, 1.6816, 0.5930, -0.4862, 0.2030, 0.3024, 0.2457],
  11120. [ 0.6307, -0.3547, 1.6683, -0.4211, -0.6285, -0.4675, 0.1638, 0.1631],
  11121. [ 0.6086, -0.3802, 1.9739, -0.0922, -0.4960, -0.5134, 0.4618, 0.1108],
  11122. [-1.6262, -1.8678, 1.7056, -0.6897, 0.0506, -0.6270, 0.7561, 0.2796],
  11123. [ 0.5644, -0.3997, 1.8604, -0.3902, -0.3610, -0.6911, 0.5889, 0.1362],
  11124. [ 0.6110, -0.4007, 1.1670, -0.8371, -0.5049, -0.6734, 0.3403, 0.2276],
  11125. [ 0.6246, -0.3696, 1.0815, -0.8941, -0.3092, -1.0043, 0.2052, 0.3066]],
  11126. device='cuda:0', grad_fn=<AddmmBackward>)
  11127. landmarks are: tensor([[[ 0.5774, -0.4082, 1.2235, -1.1844, -0.2919, -1.3709, 0.4544,
  11128. 0.1256],
  11129. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  11130. 0.5401],
  11131. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  11132. 0.1005],
  11133. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  11134. -0.0049],
  11135. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  11136. 0.2783],
  11137. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  11138. -0.0263],
  11139. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  11140. 0.1390],
  11141. [ 0.5853, -0.3920, 1.1090, -1.3313, -0.2882, -1.3390, 0.4624,
  11142. 0.1775]]], device='cuda:0')
  11143. loss_train_step before backward: tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward>)
  11144.  
  11145. loss_train_step after backward: tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward>)
  11146. loss_train: 4.284526634961367
  11147. step: 76
  11148. running loss: 0.05637535046001798
  11149. Train Steps: 76/90 Loss: 0.0564 torch.Size([8, 600, 800])
  11150. torch.Size([8, 8])
  11151. tensor([[0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  11152. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  11153. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  11154. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  11155. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  11156. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  11157. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  11158. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279]],
  11159. device='cuda:0', dtype=torch.float64)
  11160. predictions are: tensor([[ 0.5418, -0.4318, 1.7813, 0.4587, -0.0794, -0.2210, 0.4923, 0.2903],
  11161. [ 0.6229, -0.4087, 0.9010, -1.1260, -0.3065, -1.4490, 0.2739, 0.3452],
  11162. [ 0.7011, -0.3479, 1.7164, -0.6893, -0.4533, -0.8815, 0.4622, 0.2529],
  11163. [ 0.3350, -0.5665, 1.7980, -0.4537, -0.5948, -0.7768, 0.2783, 0.1598],
  11164. [ 0.2740, -0.6352, 1.6905, -0.5705, -0.6383, -0.4217, 0.5188, 0.1312],
  11165. [ 0.2169, -0.6774, 1.7397, -0.1561, -0.3435, -0.0342, 0.6219, 0.1825],
  11166. [ 0.1279, -0.7503, 1.7811, -0.0669, -0.4797, -0.1236, 0.4468, 0.1145],
  11167. [ 0.4340, -0.5311, 1.8522, -0.1038, -0.4461, -0.0288, 0.4235, 0.1248]],
  11168. device='cuda:0', grad_fn=<AddmmBackward>)
  11169. landmarks are: tensor([[[ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  11170. 0.4470],
  11171. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  11172. 0.3808],
  11173. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  11174. 0.1698],
  11175. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  11176. 0.0851],
  11177. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  11178. 0.0236],
  11179. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  11180. 0.1608],
  11181. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  11182. -0.0534],
  11183. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  11184. 0.1525]]], device='cuda:0')
  11185. loss_train_step before backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  11186. loss_train_step after backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  11187. loss_train: 4.306571505963802
  11188. step: 77
  11189. running loss: 0.055929500077451975
  11190. Train Steps: 77/90 Loss: 0.0559 torch.Size([8, 600, 800])
  11191. torch.Size([8, 8])
  11192. tensor([[0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  11193. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  11194. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  11195. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  11196. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  11197. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  11198. [0.6197, 0.3986, 0.8800, 0.4617, 0.4188, 0.4783, 0.5687, 0.5550],
  11199. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467]],
  11200. device='cuda:0', dtype=torch.float64)
  11201. predictions are: tensor([[ 0.2123, -0.6681, 1.4267, -0.7008, -0.3961, -1.0789, 0.4470, 0.1575],
  11202. [ 0.6287, -0.4280, 1.9480, -0.2461, -0.6259, -0.2741, 0.5778, 0.1985],
  11203. [ 0.2384, -0.6014, 1.5249, -0.6004, -0.1790, -0.7868, 0.4314, 0.3348],
  11204. [ 0.2662, -0.6620, 1.6252, -0.7981, -0.0459, -1.2227, 0.8659, 0.1341],
  11205. [ 0.3869, -0.5725, 1.1212, -0.8591, -0.5330, -0.8021, 0.4060, 0.2322],
  11206. [ 0.6979, -0.3889, 1.9113, -0.0834, -0.5975, -0.2396, 0.4525, 0.2011],
  11207. [ 0.1241, -0.7364, 1.8760, 0.2413, -0.3607, 0.2421, 0.2625, 0.1373],
  11208. [ 0.4837, -0.5007, 1.1885, -0.8307, -0.4771, -0.9443, 0.4297, 0.1917]],
  11209. device='cuda:0', grad_fn=<AddmmBackward>)
  11210. landmarks are: tensor([[[ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  11211. 0.2043],
  11212. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  11213. 0.3315],
  11214. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  11215. 0.4008],
  11216. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  11217. 0.1020],
  11218. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  11219. 0.2699],
  11220. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  11221. 0.1929],
  11222. [ 0.5763, -0.4450, 1.7788, -0.1535, -0.3517, -0.0765, 0.3411,
  11223. 0.2776],
  11224. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  11225. 0.2391]]], device='cuda:0')
  11226. loss_train_step before backward: tensor(0.0397, device='cuda:0', grad_fn=<MseLossBackward>)
  11227. loss_train_step after backward: tensor(0.0397, device='cuda:0', grad_fn=<MseLossBackward>)
  11228. loss_train: 4.346283700317144
  11229. step: 78
  11230. running loss: 0.05572158590150185
  11231. Train Steps: 78/90 Loss: 0.0557 torch.Size([8, 600, 800])
  11232. torch.Size([8, 8])
  11233. tensor([[0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  11234. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  11235. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  11236. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  11237. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  11238. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  11239. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  11240. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927]],
  11241. device='cuda:0', dtype=torch.float64)
  11242. predictions are: tensor([[ 0.2503, -0.6194, 1.6771, -0.5663, -0.2092, -0.0134, 0.4559, 0.2668],
  11243. [ 0.4025, -0.5215, 1.7636, -0.3499, -0.2321, 0.0510, 0.4189, 0.2570],
  11244. [ 0.3624, -0.5574, 1.6009, -0.4521, -0.5776, -0.7097, 0.4002, 0.2726],
  11245. [ 0.4997, -0.5109, 1.9008, -0.2579, -0.4983, -0.6274, 0.6899, 0.2027],
  11246. [ 0.3547, -0.6100, 1.7118, -0.0586, -0.3042, -0.1724, 0.6228, 0.1929],
  11247. [ 0.8087, -0.3421, 1.1945, -1.4183, -0.5040, -1.5953, 0.5418, 0.1857],
  11248. [ 0.5330, -0.4932, 1.7886, 0.0924, -0.4707, -0.4936, 0.5452, 0.1295],
  11249. [ 0.4743, -0.5207, 1.8230, 0.0724, -0.5959, -0.6447, 0.4366, 0.1072]],
  11250. device='cuda:0', grad_fn=<AddmmBackward>)
  11251. landmarks are: tensor([[[ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  11252. 0.2936],
  11253. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  11254. 0.0682],
  11255. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  11256. 0.2853],
  11257. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  11258. 0.1499],
  11259. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  11260. 0.1176],
  11261. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  11262. 0.0772],
  11263. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  11264. -0.0049],
  11265. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  11266. -0.0102]]], device='cuda:0')
  11267. loss_train_step before backward: tensor(0.0373, device='cuda:0', grad_fn=<MseLossBackward>)
  11268. loss_train_step after backward: tensor(0.0373, device='cuda:0', grad_fn=<MseLossBackward>)
  11269. loss_train: 4.3835613541305065
  11270. step: 79
  11271. running loss: 0.055488118406715276
  11272. Train Steps: 79/90 Loss: 0.0555 torch.Size([8, 600, 800])
  11273. torch.Size([8, 8])
  11274. tensor([[0.6332, 0.4128, 0.9200, 0.3517, 0.4400, 0.3833, 0.7461, 0.5494],
  11275. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  11276. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  11277. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  11278. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  11279. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  11280. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  11281. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585]],
  11282. device='cuda:0', dtype=torch.float64)
  11283. predictions are: tensor([[ 0.2519, -0.6683, 1.8736, -0.7073, -0.3280, -0.7509, 1.0281, 0.1443],
  11284. [ 0.2991, -0.6456, 1.4643, -0.8791, -0.6811, -1.1794, 0.2277, 0.1704],
  11285. [ 0.4103, -0.5468, 1.4818, -1.0196, -0.6254, -0.7361, 0.6622, 0.1772],
  11286. [ 0.6202, -0.4099, 1.7969, 0.1244, -0.5959, -0.7569, 0.3795, 0.1859],
  11287. [ 0.4177, -0.5366, 1.7767, 0.0455, -0.1893, -0.0683, 0.3880, 0.1860],
  11288. [ 0.6376, -0.4223, 1.7051, 0.2728, -0.3978, -0.2228, 0.6107, 0.2835],
  11289. [ 0.7116, -0.3657, 1.2793, -1.2706, -0.4624, -1.1501, 0.7176, 0.1937],
  11290. [ 0.3611, -0.5519, 1.7906, -0.4244, -0.2106, 0.0961, 0.5442, 0.1985]],
  11291. device='cuda:0', grad_fn=<AddmmBackward>)
  11292. landmarks are: tensor([[[ 0.6388, -0.3792, 1.9635, -0.6616, -0.2536, -0.5153, 1.1605,
  11293. 0.2516],
  11294. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  11295. 0.3220],
  11296. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  11297. 0.1159],
  11298. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  11299. 0.3392],
  11300. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  11301. 0.2386],
  11302. [ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  11303. 0.5393],
  11304. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  11305. 0.1621],
  11306. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  11307. 0.2936]]], device='cuda:0')
  11308. loss_train_step before backward: tensor(0.0244, device='cuda:0', grad_fn=<MseLossBackward>)
  11309.  
  11310. loss_train_step after backward: tensor(0.0244, device='cuda:0', grad_fn=<MseLossBackward>)
  11311. loss_train: 4.407923875376582
  11312. step: 80
  11313. running loss: 0.055099048442207275
  11314. Train Steps: 80/90 Loss: 0.0551 torch.Size([8, 600, 800])
  11315. torch.Size([8, 8])
  11316. tensor([[0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  11317. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  11318. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  11319. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  11320. [0.6100, 0.4071, 0.7601, 0.3444, 0.3400, 0.4117, 0.5625, 0.5617],
  11321. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  11322. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  11323. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110]],
  11324. device='cuda:0', dtype=torch.float64)
  11325. predictions are: tensor([[ 3.5290e-01, -6.1397e-01, 1.9549e+00, -5.3336e-03, -2.9136e-01,
  11326. -7.2324e-02, 9.3207e-01, 1.6320e-01],
  11327. [ 2.8469e-01, -6.2809e-01, 1.9445e+00, -2.0434e-04, -1.3079e-01,
  11328. -2.2070e-02, 6.3742e-01, 2.1544e-01],
  11329. [ 3.5060e-01, -5.5138e-01, 1.1136e+00, -1.1509e+00, -2.4896e-01,
  11330. -1.5926e+00, 4.1498e-01, 2.8779e-01],
  11331. [ 6.6889e-01, -3.9197e-01, 1.8542e+00, 2.6315e-01, -2.2090e-01,
  11332. -2.3001e-01, 3.9280e-01, 1.7063e-01],
  11333. [ 4.6131e-01, -4.7106e-01, 1.4068e+00, -8.2631e-01, -7.4783e-01,
  11334. -6.5008e-01, 4.4228e-01, 2.2298e-01],
  11335. [ 8.3234e-01, -2.7670e-01, 1.0542e+00, -1.0518e+00, -7.1007e-01,
  11336. -1.0961e+00, 3.9934e-01, 2.9696e-01],
  11337. [ 2.8947e-01, -6.0541e-01, 1.5527e+00, -9.9893e-01, -6.6533e-01,
  11338. -6.2536e-01, 7.8111e-01, 1.6534e-01],
  11339. [ 6.4313e-01, -4.2306e-01, 2.0376e+00, -1.2549e-01, -4.8717e-01,
  11340. -1.5416e-01, 5.7382e-01, 1.1506e-01]], device='cuda:0',
  11341. grad_fn=<AddmmBackward>)
  11342. landmarks are: tensor([[[ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  11343. 0.1661],
  11344. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  11345. 0.2083],
  11346. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  11347. 0.3931],
  11348. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  11349. 0.2364],
  11350. [ 0.5318, -0.4056, 1.2249, -0.6949, -0.7155, -0.3844, 0.3122,
  11351. 0.3084],
  11352. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  11353. 0.3854],
  11354. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  11355. 0.1390],
  11356. [ 0.5711, -0.3788, 1.8249, -0.1766, -0.4672, 0.2160, 0.3625,
  11357. 0.0742]]], device='cuda:0')
  11358. loss_train_step before backward: tensor(0.0296, device='cuda:0', grad_fn=<MseLossBackward>)
  11359. loss_train_step after backward: tensor(0.0296, device='cuda:0', grad_fn=<MseLossBackward>)
  11360. loss_train: 4.4374978970736265
  11361. step: 81
  11362. running loss: 0.05478392465522996
  11363. Train Steps: 81/90 Loss: 0.0548 torch.Size([8, 600, 800])
  11364. torch.Size([8, 8])
  11365. tensor([[ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  11366. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  11367. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  11368. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  11369. [0.6152, 0.4131, 0.6863, 0.2567, 0.3625, 0.3300, 0.5765, 0.5305],
  11370. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  11371. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280],
  11372. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103]],
  11373. device='cuda:0', dtype=torch.float64)
  11374. predictions are: tensor([[ 0.1934, -0.6862, 2.0995, -0.3841, -0.2928, -0.8127, 1.0653, 0.1940],
  11375. [ 0.3868, -0.5774, 1.4899, -1.2743, -0.2030, -1.3073, 0.9704, 0.1167],
  11376. [ 0.1129, -0.7319, 1.4276, -0.8536, -0.6659, -0.9510, 0.3433, 0.1963],
  11377. [ 0.9127, -0.1787, 1.4410, -0.5508, -0.5565, -0.6560, 0.6148, 0.2726],
  11378. [ 0.6915, -0.3389, 1.0534, -1.0535, -0.6616, -0.7224, 0.4801, 0.2981],
  11379. [ 0.5534, -0.4577, 1.8698, 0.1757, -0.1685, 0.1346, 0.3258, 0.1852],
  11380. [ 0.5698, -0.4565, 1.8043, 0.2670, -0.2506, 0.2621, 0.3408, 0.1853],
  11381. [ 0.3866, -0.5505, 0.9395, -1.1604, -0.5641, -1.0599, 0.3823, 0.2258]],
  11382. device='cuda:0', grad_fn=<AddmmBackward>)
  11383. landmarks are: tensor([[[-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  11384. 0.2890],
  11385. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  11386. -0.0530],
  11387. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  11388. -0.0220],
  11389. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  11390. 0.3469],
  11391. [ 0.5557, -0.3779, 0.8838, -1.1004, -0.6115, -0.7617, 0.3769,
  11392. 0.1644],
  11393. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  11394. 0.0532],
  11395. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  11396. 0.1530],
  11397. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  11398. 0.0712]]], device='cuda:0')
  11399. loss_train_step before backward: tensor(0.1651, device='cuda:0', grad_fn=<MseLossBackward>)
  11400. loss_train_step after backward: tensor(0.1651, device='cuda:0', grad_fn=<MseLossBackward>)
  11401. loss_train: 4.602609543129802
  11402. step: 82
  11403. running loss: 0.05612938467231465
  11404. Train Steps: 82/90 Loss: 0.0561 torch.Size([8, 600, 800])
  11405. torch.Size([8, 8])
  11406. tensor([[0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  11407. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  11408. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  11409. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  11410. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  11411. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  11412. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  11413. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702]],
  11414. device='cuda:0', dtype=torch.float64)
  11415. predictions are: tensor([[ 0.6205, -0.3294, 1.2714, -1.1643, -0.4718, -0.8882, 0.4508, 0.2994],
  11416. [ 0.8339, -0.2433, 1.6666, -0.0028, -0.2328, 0.1562, 0.3314, 0.2164],
  11417. [-0.2367, -0.9609, 1.5820, -1.1476, -0.0225, -0.9568, 1.1855, 0.2878],
  11418. [ 1.3021, 0.0271, 1.6371, 0.3666, -0.7279, -0.3856, 0.4049, 0.1173],
  11419. [ 0.8664, -0.2550, 1.7417, -0.1421, -0.6307, -0.0862, 0.6780, 0.1225],
  11420. [ 0.2749, -0.5678, 1.1647, -1.2503, -0.3124, -1.2384, 0.3588, 0.2341],
  11421. [ 1.0003, -0.1206, 1.5467, -0.5714, -0.7366, -0.1394, 0.3882, 0.1260],
  11422. [-0.8779, -1.3588, 1.7350, -0.7833, -0.1671, -0.9548, 0.8598, 0.2712]],
  11423. device='cuda:0', grad_fn=<AddmmBackward>)
  11424. landmarks are: tensor([[[ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  11425. 0.1852],
  11426. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  11427. 0.0862],
  11428. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  11429. 0.5188],
  11430. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  11431. 0.1982],
  11432. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  11433. 0.0774],
  11434. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  11435. -0.0168],
  11436. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  11437. 0.0840],
  11438. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  11439. 0.3478]]], device='cuda:0')
  11440. loss_train_step before backward: tensor(0.1799, device='cuda:0', grad_fn=<MseLossBackward>)
  11441. loss_train_step after backward: tensor(0.1799, device='cuda:0', grad_fn=<MseLossBackward>)
  11442. loss_train: 4.782462088391185
  11443. step: 83
  11444. running loss: 0.05762002516133958
  11445. Train Steps: 83/90 Loss: 0.0576 torch.Size([8, 600, 800])
  11446. torch.Size([8, 8])
  11447. tensor([[ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  11448. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  11449. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  11450. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  11451. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  11452. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  11453. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133],
  11454. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103]],
  11455. device='cuda:0', dtype=torch.float64)
  11456. predictions are: tensor([[-1.6758, -1.8790, 0.9515, -1.1832, -0.3921, -1.2005, 0.1190, 0.2377],
  11457. [ 0.6928, -0.3176, 1.7793, -0.5673, -0.5725, -0.8589, 0.5203, 0.2073],
  11458. [ 0.6950, -0.3005, 1.5411, -0.6932, -0.5098, -0.0067, 0.7635, 0.2678],
  11459. [ 0.8057, -0.2322, 1.5274, -0.7015, -0.6557, -0.4211, 0.5909, 0.1877],
  11460. [ 0.8430, -0.2581, 1.7463, 0.0786, -0.2258, 0.1675, 0.8384, 0.2404],
  11461. [ 0.8383, -0.2479, 1.3780, -1.2788, -0.1072, -1.4723, 0.6900, 0.1429],
  11462. [ 0.7669, -0.3051, 1.6815, 0.1584, -0.2706, 0.1765, 0.6218, 0.2041],
  11463. [ 0.6534, -0.3386, 1.4837, -0.7632, -0.6079, -0.6089, 0.3371, 0.2506]],
  11464. device='cuda:0', grad_fn=<AddmmBackward>)
  11465. landmarks are: tensor([[[-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  11466. 0.1073],
  11467. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  11468. 0.2442],
  11469. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  11470. 0.2083],
  11471. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  11472. 0.2391],
  11473. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  11474. 0.1661],
  11475. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  11476. -0.0369],
  11477. [ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  11478. 0.0852],
  11479. [ 0.5886, -0.3784, 1.4554, -0.9079, -0.6577, -0.4845, 0.3440,
  11480. 0.0712]]], device='cuda:0')
  11481. loss_train_step before backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  11482. loss_train_step after backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  11483. loss_train: 4.803826930001378
  11484. step: 84
  11485. running loss: 0.057188415833349736
  11486.  
  11487. Train Steps: 84/90 Loss: 0.0572 torch.Size([8, 600, 800])
  11488. torch.Size([8, 8])
  11489. tensor([[0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  11490. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  11491. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  11492. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  11493. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  11494. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  11495. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  11496. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496]],
  11497. device='cuda:0', dtype=torch.float64)
  11498. predictions are: tensor([[ 0.5288, -0.4258, 1.6598, 0.0234, -0.6744, -0.2807, 0.2428, 0.2266],
  11499. [ 0.9124, -0.1514, 0.9119, -1.0870, -0.1578, -1.0845, 0.3587, 0.3047],
  11500. [ 0.5259, -0.4405, 1.5958, -0.1026, -0.4962, 0.0710, 0.4900, 0.2501],
  11501. [ 0.4467, -0.4996, 1.2111, -1.1375, -0.1979, -1.1565, 0.5828, 0.1334],
  11502. [ 0.8034, -0.2387, 1.4822, -0.5721, -0.6348, -0.1920, 0.4950, 0.1476],
  11503. [ 0.0750, -0.6879, 1.3695, -0.9216, -0.2341, -0.8327, 0.4966, 0.2875],
  11504. [-0.2534, -0.9799, 1.8873, -0.7545, -0.4268, -0.6145, 1.0349, 0.0990],
  11505. [ 0.2832, -0.5986, 1.6411, -0.9750, -0.3327, -0.7753, 0.6956, 0.1492]],
  11506. device='cuda:0', grad_fn=<AddmmBackward>)
  11507. landmarks are: tensor([[[ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  11508. 0.4357],
  11509. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  11510. 0.5702],
  11511. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  11512. 0.3968],
  11513. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  11514. 0.2083],
  11515. [ 0.5444, -0.3852, 1.3786, -0.5409, -0.6924, -0.4229, 0.1791,
  11516. 0.2341],
  11517. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  11518. 0.4008],
  11519. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  11520. 0.1390],
  11521. [ 0.5790, -0.4031, 1.6915, -0.9564, -0.4152, -1.1063, 0.4425,
  11522. 0.2528]]], device='cuda:0')
  11523. loss_train_step before backward: tensor(0.0526, device='cuda:0', grad_fn=<MseLossBackward>)
  11524. loss_train_step after backward: tensor(0.0526, device='cuda:0', grad_fn=<MseLossBackward>)
  11525. loss_train: 4.856406262144446
  11526. step: 85
  11527. running loss: 0.057134191319346425
  11528. Train Steps: 85/90 Loss: 0.0571 torch.Size([8, 600, 800])
  11529. torch.Size([8, 8])
  11530. tensor([[0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  11531. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  11532. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  11533. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  11534. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  11535. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  11536. [0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  11537. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617]],
  11538. device='cuda:0', dtype=torch.float64)
  11539. predictions are: tensor([[ 1.3328e-01, -6.7352e-01, 1.6691e+00, -2.4416e-01, -1.3594e-01,
  11540. -3.2876e-04, 4.3535e-01, 2.3712e-01],
  11541. [ 5.2176e-01, -4.1727e-01, 1.4926e+00, -8.6348e-01, -5.5333e-01,
  11542. -1.8318e-01, 7.7127e-01, 2.5558e-01],
  11543. [ 9.9327e-01, -1.1433e-01, 1.0954e+00, -1.3476e+00, -2.7377e-01,
  11544. -1.3365e+00, 3.8144e-01, 1.8049e-01],
  11545. [-8.2795e-01, -1.3359e+00, 1.9219e+00, -7.7653e-01, -3.3671e-01,
  11546. -8.4426e-01, 9.5188e-01, 1.5540e-01],
  11547. [ 4.9690e-01, -4.4354e-01, 1.7715e+00, 3.1300e-02, -6.5161e-01,
  11548. -6.7309e-01, 5.1132e-01, 5.7911e-02],
  11549. [ 7.3540e-01, -2.5406e-01, 9.1125e-01, -1.3418e+00, -4.7364e-01,
  11550. -1.1851e+00, 3.1099e-01, 2.4200e-01],
  11551. [ 4.7442e-01, -4.5498e-01, 1.7000e+00, -1.5574e-01, -2.9064e-01,
  11552. 1.7565e-01, 4.3889e-01, 2.0958e-01],
  11553. [ 6.5780e-01, -3.2612e-01, 1.6180e+00, -1.8878e-01, -3.5431e-01,
  11554. 1.8572e-02, 3.9815e-01, 2.2789e-01]], device='cuda:0',
  11555. grad_fn=<AddmmBackward>)
  11556. landmarks are: tensor([[[ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  11557. 0.2853],
  11558. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  11559. 0.2083],
  11560. [ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  11561. 0.1545],
  11562. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  11563. 0.2676],
  11564. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  11565. -0.0049],
  11566. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  11567. 0.3392],
  11568. [ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  11569. 0.0652],
  11570. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  11571. 0.3084]]], device='cuda:0')
  11572. loss_train_step before backward: tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward>)
  11573. loss_train_step after backward: tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward>)
  11574. loss_train: 4.923488324508071
  11575. step: 86
  11576. running loss: 0.05724986423846594
  11577. Train Steps: 86/90 Loss: 0.0572 torch.Size([8, 600, 800])
  11578. torch.Size([8, 8])
  11579. tensor([[0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  11580. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  11581. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  11582. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  11583. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  11584. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  11585. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  11586. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667]],
  11587. device='cuda:0', dtype=torch.float64)
  11588. predictions are: tensor([[ 0.6679, -0.3393, 1.1044, -1.2029, -0.5126, -0.9637, 0.2172, 0.1473],
  11589. [ 0.2462, -0.6525, 1.7013, 0.3707, -0.3928, 0.1506, 0.3154, 0.2182],
  11590. [ 0.2769, -0.6023, 1.5248, -1.0627, -0.4206, -0.9832, 0.6722, 0.0666],
  11591. [ 0.6292, -0.3429, 1.2376, -1.0654, -0.3068, -0.9931, 0.4548, 0.3508],
  11592. [-0.0074, -0.7957, 1.7611, -0.6247, -0.3023, -0.7269, 0.8707, 0.0755],
  11593. [ 0.5369, -0.4352, 1.6622, -0.9727, -0.4015, -0.7603, 0.5024, 0.2316],
  11594. [ 0.2221, -0.6411, 1.7975, -0.0278, -0.1875, 0.1898, 0.6727, 0.1995],
  11595. [ 0.5766, -0.3768, 1.0787, -1.0031, -0.5580, -0.6710, 0.2390, 0.2642]],
  11596. device='cuda:0', grad_fn=<AddmmBackward>)
  11597. landmarks are: tensor([[[ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  11598. 0.0802],
  11599. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  11600. -0.1061],
  11601. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  11602. -0.0220],
  11603. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  11604. 0.6084],
  11605. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  11606. 0.1821],
  11607. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  11608. 0.3392],
  11609. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  11610. 0.1474],
  11611. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  11612. 0.3315]]], device='cuda:0')
  11613. loss_train_step before backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  11614. loss_train_step after backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  11615. loss_train: 4.947322266176343
  11616. step: 87
  11617. running loss: 0.05686577317444073
  11618. Train Steps: 87/90 Loss: 0.0569 torch.Size([8, 600, 800])
  11619. torch.Size([8, 8])
  11620. tensor([[0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366],
  11621. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  11622. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  11623. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  11624. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  11625. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  11626. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  11627. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533]],
  11628. device='cuda:0', dtype=torch.float64)
  11629. predictions are: tensor([[ 0.7241, -0.3271, 1.7330, 0.0022, -0.4415, -0.4059, 0.5559, 0.1113],
  11630. [ 0.8021, -0.2346, 1.5974, -0.6172, -0.2946, -0.7826, 0.7004, 0.1298],
  11631. [ 0.5272, -0.4370, 1.6671, -0.8570, -0.4961, -0.7450, 0.4616, 0.1232],
  11632. [-0.0215, -0.7598, 0.7726, -1.3853, -0.3094, -1.2399, 0.1006, 0.2363],
  11633. [ 0.6110, -0.3637, 1.6312, -1.1276, -0.2190, -0.9056, 0.7891, 0.1843],
  11634. [ 0.5471, -0.3935, 1.6186, -0.3462, -0.4808, -0.3456, 0.2056, 0.2678],
  11635. [ 1.0903, -0.1401, 1.7994, -0.1475, -0.3498, 0.5473, 0.7149, 0.1603],
  11636. [-1.3033, -1.6128, 1.1779, -0.9719, -0.4504, -0.8305, 0.2302, 0.2690]],
  11637. device='cuda:0', grad_fn=<AddmmBackward>)
  11638. landmarks are: tensor([[[ 0.6273, -0.4249, 1.7095, 0.1159, -0.5480, -0.4306, 1.0910,
  11639. 0.1928],
  11640. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  11641. 0.2035],
  11642. [ 0.5799, -0.4329, 1.7210, -0.7694, -0.5711, -0.8771, 0.3988,
  11643. 0.0774],
  11644. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  11645. 0.2071],
  11646. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  11647. 0.1467],
  11648. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  11649. 0.1852],
  11650. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  11651. 0.1082],
  11652. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  11653. 0.2699]]], device='cuda:0')
  11654. loss_train_step before backward: tensor(0.0496, device='cuda:0', grad_fn=<MseLossBackward>)
  11655. loss_train_step after backward: tensor(0.0496, device='cuda:0', grad_fn=<MseLossBackward>)
  11656. loss_train: 4.99695965833962
  11657. step: 88
  11658. running loss: 0.056783632481132044
  11659.  
  11660. Train Steps: 88/90 Loss: 0.0568 torch.Size([8, 600, 800])
  11661. torch.Size([8, 8])
  11662. tensor([[0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  11663. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  11664. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  11665. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  11666. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  11667. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  11668. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  11669. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879]],
  11670. device='cuda:0', dtype=torch.float64)
  11671. predictions are: tensor([[ 0.5584, -0.4093, 1.1146, -1.4048, -0.2779, -1.3822, 0.1954, 0.1406],
  11672. [ 0.4821, -0.4613, 1.6472, -0.0517, -0.4324, -0.3837, 0.1814, 0.2442],
  11673. [ 0.4873, -0.4168, 1.3685, -0.8206, -0.5818, -0.4522, 0.2436, 0.1914],
  11674. [ 0.3995, -0.5603, 1.7979, -0.0745, -0.4099, -0.0866, 0.7555, 0.1212],
  11675. [ 0.0065, -0.7383, 0.9568, -1.1590, -0.3999, -1.0661, 0.2975, 0.3177],
  11676. [ 0.6278, -0.4072, 1.7102, -0.8546, -0.5490, -0.6138, 0.4779, 0.2245],
  11677. [ 0.0327, -0.7839, 1.8877, -0.2893, -0.2485, -0.4808, 0.8511, 0.2126],
  11678. [ 0.7731, -0.3011, 1.7908, -0.3452, -0.3399, 0.2271, 0.5904, 0.0849]],
  11679. device='cuda:0', grad_fn=<AddmmBackward>)
  11680. landmarks are: tensor([[[ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  11681. 0.0774],
  11682. [ 0.5452, -0.4067, 1.7557, 0.0543, -0.4961, -0.3306, 0.1323,
  11683. 0.4306],
  11684. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  11685. 0.2386],
  11686. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  11687. 0.1385],
  11688. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  11689. 0.4085],
  11690. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  11691. 0.3392],
  11692. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  11693. 0.4386],
  11694. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  11695. -0.0322]]], device='cuda:0')
  11696. loss_train_step before backward: tensor(0.0316, device='cuda:0', grad_fn=<MseLossBackward>)
  11697. loss_train_step after backward: tensor(0.0316, device='cuda:0', grad_fn=<MseLossBackward>)
  11698. loss_train: 5.028513407334685
  11699. step: 89
  11700. running loss: 0.05650015064420995
  11701. Train Steps: 89/90 Loss: 0.0565 torch.Size([8, 600, 800])
  11702. torch.Size([8, 8])
  11703. tensor([[0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  11704. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  11705. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  11706. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  11707. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  11708. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  11709. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  11710. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100]],
  11711. device='cuda:0', dtype=torch.float64)
  11712. predictions are: tensor([[ 0.4825, -0.4272, 0.9730, -1.4118, -0.4009, -1.3373, 0.0767, 0.2495],
  11713. [ 0.4915, -0.4617, 1.9515, -0.4588, -0.5543, -0.2200, 0.6500, 0.0742],
  11714. [ 0.3416, -0.6033, 1.6379, -0.0055, -0.4627, -0.4151, 0.4429, 0.1592],
  11715. [ 0.4801, -0.4831, 1.6780, -0.1948, -0.3423, -0.0419, 0.2214, 0.2790],
  11716. [ 0.6173, -0.4038, 1.7523, -0.1950, -0.3700, 0.1127, 0.7578, 0.2431],
  11717. [ 0.5661, -0.4204, 1.8014, -0.4218, -0.4077, 0.0485, 0.4907, 0.2373],
  11718. [ 0.0555, -0.7193, 0.9680, -1.5541, -0.2692, -1.6329, 0.2577, 0.1827],
  11719. [ 0.4184, -0.5378, 1.6813, -0.1549, -0.4171, -0.3171, 0.5697, 0.1647]],
  11720. device='cuda:0', grad_fn=<AddmmBackward>)
  11721. landmarks are: tensor([[[ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  11722. 0.2776],
  11723. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  11724. -0.0490],
  11725. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  11726. -0.1492],
  11727. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  11728. 0.3777],
  11729. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  11730. 0.2249],
  11731. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  11732. 0.2776],
  11733. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  11734. 0.1253],
  11735. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  11736. 0.0697]]], device='cuda:0')
  11737. loss_train_step before backward: tensor(0.0333, device='cuda:0', grad_fn=<MseLossBackward>)
  11738. loss_train_step after backward: tensor(0.0333, device='cuda:0', grad_fn=<MseLossBackward>)
  11739. loss_train: 5.0618322510272264
  11740. step: 90
  11741. running loss: 0.05624258056696918
  11742. Valid Steps: 10/10 Loss: nan 62
  11743. --------------------------------------------------
  11744. Epoch: 3 Train Loss: 0.0562 Valid Loss: nan
  11745. --------------------------------------------------
  11746. size of train loader is: 90
  11747. torch.Size([8, 600, 800])
  11748. torch.Size([8, 8])
  11749. tensor([[0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  11750. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  11751. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  11752. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  11753. [0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  11754. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  11755. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  11756. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567]],
  11757. device='cuda:0', dtype=torch.float64)
  11758. predictions are: tensor([[ 0.7934, -0.2856, 1.6860, 0.1092, -0.3487, 0.0531, 0.2048, 0.2442],
  11759. [ 0.6889, -0.3477, 1.0870, -1.3416, -0.3528, -1.3638, 0.1548, 0.2013],
  11760. [ 0.5929, -0.4533, 1.6458, -0.0300, -0.2567, 0.1042, 0.5948, 0.2456],
  11761. [-1.2841, -1.6451, 1.3930, -0.9300, -0.5634, -0.8736, 0.1785, 0.2065],
  11762. [ 0.2508, -0.6173, 1.6443, -0.9053, -0.2038, -0.8371, 0.8204, 0.1669],
  11763. [ 0.7218, -0.3298, 1.5397, -1.0182, -0.5050, -0.7588, 0.8013, 0.1396],
  11764. [ 0.9012, -0.2219, 1.7789, -0.3461, -0.6196, -0.1334, 0.4337, 0.0805],
  11765. [ 0.8209, -0.2396, 1.5937, -0.2505, -0.5622, -0.4064, 0.3184, 0.2603]],
  11766. device='cuda:0', grad_fn=<AddmmBackward>)
  11767. landmarks are: tensor([[[ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  11768. 0.2522],
  11769. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  11770. 0.0774],
  11771. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  11772. 0.1004],
  11773. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  11774. 0.1133],
  11775. [ 0.6224, -0.4105, 1.9173, -0.7771, -0.1030, -0.7308, 1.1532,
  11776. 0.1875],
  11777. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  11778. 0.1608],
  11779. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  11780. -0.0670],
  11781. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  11782. 0.2853]]], device='cuda:0')
  11783. loss_train_step before backward: tensor(0.0408, device='cuda:0', grad_fn=<MseLossBackward>)
  11784. loss_train_step after backward: tensor(0.0408, device='cuda:0', grad_fn=<MseLossBackward>)
  11785. loss_train: 0.0408310666680336
  11786. step: 1
  11787. running loss: 0.0408310666680336
  11788. Train Steps: 1/90 Loss: 0.0408 torch.Size([8, 600, 800])
  11789. torch.Size([8, 8])
  11790. tensor([[0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  11791. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  11792. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  11793. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  11794. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  11795. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  11796. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  11797. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967]],
  11798. device='cuda:0', dtype=torch.float64)
  11799. predictions are: tensor([[ 0.8029, -0.2294, 1.0461, -1.3274, -0.4808, -1.3214, 0.4222, 0.1729],
  11800. [ 0.5322, -0.4257, 1.7850, -0.4723, -0.6244, -0.5832, 0.4501, 0.2225],
  11801. [-1.7818, -1.9189, 1.1634, -1.3966, -0.2579, -1.3634, 0.2830, 0.2149],
  11802. [ 0.7616, -0.3080, 1.6486, -0.0197, -0.4939, -0.2841, 0.5924, 0.1066],
  11803. [ 0.7523, -0.2829, 1.6721, -0.1539, -0.2369, -0.1656, 0.1428, 0.1686],
  11804. [ 0.8615, -0.2260, 1.7055, -0.0355, -0.3871, 0.1315, 0.7918, 0.1862],
  11805. [ 0.6541, -0.3519, 1.6196, -0.1458, -0.3515, -0.2593, 0.2668, 0.1777],
  11806. [ 0.7497, -0.3061, 1.7884, -0.3122, -0.4508, 0.1585, 0.5595, 0.2249]],
  11807. device='cuda:0', grad_fn=<AddmmBackward>)
  11808. landmarks are: tensor([[[ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  11809. 0.2930],
  11810. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  11811. 0.3238],
  11812. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  11813. 0.3238],
  11814. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  11815. 0.0697],
  11816. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  11817. 0.3392],
  11818. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  11819. 0.3371],
  11820. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  11821. 0.3700],
  11822. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  11823. 0.4701]]], device='cuda:0')
  11824. loss_train_step before backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  11825. loss_train_step after backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  11826. loss_train: 0.06501925364136696
  11827. step: 2
  11828. running loss: 0.03250962682068348
  11829.  
  11830. Train Steps: 2/90 Loss: 0.0325 torch.Size([8, 600, 800])
  11831. torch.Size([8, 8])
  11832. tensor([[0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  11833. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  11834. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  11835. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  11836. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  11837. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  11838. [0.6161, 0.4099, 0.8738, 0.4383, 0.3788, 0.5483, 0.5605, 0.5019],
  11839. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268]],
  11840. device='cuda:0', dtype=torch.float64)
  11841. predictions are: tensor([[ 0.2261, -0.6299, 1.5691, 0.0380, -0.4303, -0.4064, 0.3217, 0.2605],
  11842. [ 0.8775, -0.2186, 1.6144, -0.0903, -0.2743, -0.0483, 0.2540, 0.2187],
  11843. [ 0.4941, -0.4669, 1.6542, 0.0592, -0.4179, 0.0067, 0.4888, 0.2468],
  11844. [ 0.6490, -0.3877, 1.5852, 0.0381, -0.5231, -0.2220, 0.4692, 0.1378],
  11845. [ 0.6293, -0.3672, 1.8195, -0.9589, -0.4476, -1.1585, 0.6918, 0.1580],
  11846. [-0.9213, -1.3341, 1.0464, -1.5667, -0.3857, -1.5674, 0.3233, 0.1719],
  11847. [ 0.8097, -0.2308, 1.6492, -0.5242, -0.5474, 0.1092, 0.4527, 0.1488],
  11848. [ 0.6409, -0.3545, 1.6522, -0.3213, -0.3163, -0.0979, 0.5912, 0.1635]],
  11849. device='cuda:0', grad_fn=<AddmmBackward>)
  11850. landmarks are: tensor([[[ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  11851. 0.3238],
  11852. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  11853. 0.2364],
  11854. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  11855. 0.3161],
  11856. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  11857. -0.1385],
  11858. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  11859. 0.1082],
  11860. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  11861. 0.1343],
  11862. [ 0.5597, -0.3928, 1.7499, -0.2613, -0.5365, 0.2468, 0.3028,
  11863. 0.0321],
  11864. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  11865. 0.1474]]], device='cuda:0')
  11866. loss_train_step before backward: tensor(0.0751, device='cuda:0', grad_fn=<MseLossBackward>)
  11867. loss_train_step after backward: tensor(0.0751, device='cuda:0', grad_fn=<MseLossBackward>)
  11868. loss_train: 0.1400858722627163
  11869. step: 3
  11870. running loss: 0.04669529075423876
  11871. Train Steps: 3/90 Loss: 0.0467 torch.Size([8, 600, 800])
  11872. torch.Size([8, 8])
  11873. tensor([[0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  11874. [0.6201, 0.4102, 0.7288, 0.2417, 0.4150, 0.2383, 0.6100, 0.5500],
  11875. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  11876. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  11877. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050],
  11878. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  11879. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  11880. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750]],
  11881. device='cuda:0', dtype=torch.float64)
  11882. predictions are: tensor([[ 0.3854, -0.5699, 1.7729, -0.4065, -0.3826, -0.5799, 0.8162, 0.0487],
  11883. [ 0.4473, -0.4987, 1.2553, -0.9025, -0.4371, -1.0451, 0.5099, 0.1875],
  11884. [ 0.3850, -0.5415, 1.2425, -1.1285, -0.3311, -1.2141, 0.4639, 0.1034],
  11885. [ 0.4943, -0.4585, 1.7603, -0.3231, -0.4710, -0.5697, 0.3823, 0.2806],
  11886. [ 0.5609, -0.4599, 1.7936, 0.3726, -0.2832, 0.3955, 0.2943, 0.1781],
  11887. [ 0.3167, -0.5832, 1.6743, 0.1032, -0.5132, 0.2972, 0.2819, 0.1813],
  11888. [ 0.0717, -0.6920, 1.2379, -0.9312, -0.3837, -0.9721, 0.3222, 0.3046],
  11889. [ 0.5122, -0.4441, 1.2345, -0.7984, -0.4852, -0.8042, 0.5456, 0.2060]],
  11890. device='cuda:0', grad_fn=<AddmmBackward>)
  11891. landmarks are: tensor([[[ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  11892. 0.1821],
  11893. [ 0.5784, -0.3913, 1.0801, -1.1697, -0.3691, -1.1851, 0.5316,
  11894. 0.2545],
  11895. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  11896. 0.1082],
  11897. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  11898. 0.3928],
  11899. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  11900. 0.0467],
  11901. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  11902. 0.2386],
  11903. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  11904. 0.2853],
  11905. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  11906. 0.3700]]], device='cuda:0')
  11907. loss_train_step before backward: tensor(0.0287, device='cuda:0', grad_fn=<MseLossBackward>)
  11908. loss_train_step after backward: tensor(0.0287, device='cuda:0', grad_fn=<MseLossBackward>)
  11909. loss_train: 0.16878480091691017
  11910. step: 4
  11911. running loss: 0.04219620022922754
  11912. Train Steps: 4/90 Loss: 0.0422 torch.Size([8, 600, 800])
  11913. torch.Size([8, 8])
  11914. tensor([[0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  11915. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  11916. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  11917. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  11918. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  11919. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  11920. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  11921. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683]],
  11922. device='cuda:0', dtype=torch.float64)
  11923. predictions are: tensor([[ 0.6402, -0.3300, 1.6367, -0.5436, -0.4823, -0.6285, 0.3887, 0.2062],
  11924. [ 0.4304, -0.5247, 1.8311, -0.0857, -0.2697, 0.3819, 0.6370, 0.2235],
  11925. [ 0.3012, -0.6414, 1.6228, 0.3746, -0.3542, -0.0797, 0.5618, 0.0932],
  11926. [ 0.3471, -0.5312, 1.0608, -0.9703, -0.4720, -0.8061, 0.3146, 0.2213],
  11927. [ 0.3248, -0.5650, 1.7027, -0.1101, -0.4417, -0.2336, 0.5059, 0.1623],
  11928. [ 0.3386, -0.5307, 1.7406, -0.2570, -0.3301, -1.0203, 0.5861, 0.1280],
  11929. [ 0.3174, -0.5268, 1.0960, -0.8999, -0.4709, -0.9923, 0.1387, 0.2535],
  11930. [ 0.6184, -0.4022, 1.6616, -0.6118, -0.5818, -0.3922, 0.4269, 0.2213]],
  11931. device='cuda:0', grad_fn=<AddmmBackward>)
  11932. landmarks are: tensor([[[ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  11933. 0.3315],
  11934. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  11935. 0.4701],
  11936. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  11937. -0.1492],
  11938. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  11939. 0.3315],
  11940. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  11941. 0.2314],
  11942. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  11943. 0.0081],
  11944. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  11945. 0.3931],
  11946. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  11947. 0.3392]]], device='cuda:0')
  11948. loss_train_step before backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  11949. loss_train_step after backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  11950. loss_train: 0.18524960055947304
  11951. step: 5
  11952. running loss: 0.037049920111894605
  11953. Train Steps: 5/90 Loss: 0.0370 torch.Size([8, 600, 800])
  11954. torch.Size([8, 8])
  11955. tensor([[0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  11956. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  11957. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  11958. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  11959. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  11960. [0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  11961. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  11962. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783]],
  11963. device='cuda:0', dtype=torch.float64)
  11964. predictions are: tensor([[ 0.2791, -0.5424, 1.3593, -0.6483, -0.5082, -0.7606, 0.2373, 0.3004],
  11965. [ 0.5529, -0.4208, 1.3162, -0.7741, -0.5420, -0.8749, 0.5742, 0.2522],
  11966. [ 0.5527, -0.4374, 1.6764, 0.2120, -0.1778, 0.1175, 0.2001, 0.1639],
  11967. [ 0.7011, -0.3902, 1.7922, 0.3820, -0.5591, 0.0326, 0.7921, 0.0431],
  11968. [ 0.1883, -0.6151, 1.7248, -0.4770, -0.3421, -1.0000, 0.5109, 0.1547],
  11969. [ 0.2386, -0.6325, 1.7365, 0.1798, -0.4045, 0.3961, 0.4558, 0.1295],
  11970. [ 0.3358, -0.5460, 1.2014, -1.0744, -0.4078, -1.0060, 0.5095, 0.1908],
  11971. [ 0.3464, -0.4803, 1.1684, -0.9478, -0.2323, -1.0542, 0.3087, 0.2845]],
  11972. device='cuda:0', grad_fn=<AddmmBackward>)
  11973. landmarks are: tensor([[[ 0.5935, -0.3558, 1.3284, -0.6924, -0.5249, -0.9618, 0.3353,
  11974. 0.3084],
  11975. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  11976. 0.3777],
  11977. [ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  11978. 0.1544],
  11979. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  11980. 0.0291],
  11981. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  11982. 0.0171],
  11983. [ 0.5614, -0.4586, 1.7587, 0.0641, -0.2998, 0.1712, 0.4958,
  11984. 0.1170],
  11985. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  11986. 0.2622],
  11987. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  11988. 0.3854]]], device='cuda:0')
  11989. loss_train_step before backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  11990. loss_train_step after backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  11991. loss_train: 0.21053649485111237
  11992. step: 6
  11993. running loss: 0.03508941580851873
  11994.  
  11995. Train Steps: 6/90 Loss: 0.0351 torch.Size([8, 600, 800])
  11996. torch.Size([8, 8])
  11997. tensor([[0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  11998. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  11999. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  12000. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  12001. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  12002. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700],
  12003. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  12004. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167]],
  12005. device='cuda:0', dtype=torch.float64)
  12006. predictions are: tensor([[ 0.3029, -0.6244, 1.8468, 0.1460, -0.4225, 0.1632, 0.9719, 0.1582],
  12007. [ 0.3994, -0.5348, 1.6714, 0.0397, -0.2388, -0.1771, 0.2345, 0.1581],
  12008. [ 0.2754, -0.6236, 1.7249, 0.0636, -0.3578, -0.0518, 0.3006, 0.1270],
  12009. [ 0.6174, -0.3559, 1.3701, -0.3050, -0.6034, -0.3570, 0.1214, 0.1833],
  12010. [ 0.5716, -0.4054, 1.5687, -0.6477, -0.6942, -0.6264, 0.4524, 0.2152],
  12011. [ 0.2340, -0.6259, 1.7155, -0.2797, -0.4494, 0.2091, 0.7213, 0.2117],
  12012. [ 0.6382, -0.3643, 1.3742, -0.9335, -0.3079, -1.3957, 0.6677, 0.2151],
  12013. [ 0.5772, -0.3455, 1.0543, -0.8894, -0.1617, -1.3255, 0.2601, 0.3533]],
  12014. device='cuda:0', grad_fn=<AddmmBackward>)
  12015. landmarks are: tensor([[[ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  12016. 0.1554],
  12017. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  12018. -0.0039],
  12019. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  12020. 0.0051],
  12021. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  12022. 0.1552],
  12023. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  12024. 0.2622],
  12025. [ 0.5671, -0.3988, 1.7499, -0.4614, -0.5423, 0.3007, 0.5894,
  12026. 0.3469],
  12027. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  12028. 0.1879],
  12029. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  12030. 0.5624]]], device='cuda:0')
  12031. loss_train_step before backward: tensor(0.0187, device='cuda:0', grad_fn=<MseLossBackward>)
  12032. loss_train_step after backward: tensor(0.0187, device='cuda:0', grad_fn=<MseLossBackward>)
  12033. loss_train: 0.22919072955846786
  12034. step: 7
  12035. running loss: 0.03274153279406684
  12036. Train Steps: 7/90 Loss: 0.0327 torch.Size([8, 600, 800])
  12037. torch.Size([8, 8])
  12038. tensor([[0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  12039. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  12040. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  12041. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  12042. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  12043. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  12044. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  12045. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875]],
  12046. device='cuda:0', dtype=torch.float64)
  12047. predictions are: tensor([[ 0.5962, -0.3807, 1.8008, -0.0904, -0.3684, 0.2387, 0.6538, 0.1876],
  12048. [ 0.5492, -0.4183, 1.7119, -0.1476, -0.3619, 0.1762, 0.4529, 0.2305],
  12049. [ 0.7731, -0.3102, 1.6519, 0.2326, -0.3488, -0.1404, 0.5892, 0.1673],
  12050. [ 0.7477, -0.2326, 1.3266, -0.5177, -0.3959, -0.8787, 0.3715, 0.3245],
  12051. [ 0.8838, -0.2180, 1.6062, 0.3130, -0.3376, -0.1118, 0.7455, 0.2682],
  12052. [-1.4788, -1.7508, 1.1179, -1.3049, -0.2588, -1.3062, 0.2117, 0.2637],
  12053. [ 0.8055, -0.2542, 1.6588, -0.3911, -0.6106, -0.3597, 0.4233, 0.1606],
  12054. [ 0.9708, -0.1498, 1.6112, -0.6890, -0.6115, -0.9635, 0.1644, 0.1881]],
  12055. device='cuda:0', grad_fn=<AddmmBackward>)
  12056. landmarks are: tensor([[[ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  12057. 0.0851],
  12058. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  12059. 0.2622],
  12060. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  12061. 0.0697],
  12062. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  12063. 0.3469],
  12064. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  12065. 0.3745],
  12066. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  12067. 0.3238],
  12068. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  12069. 0.0236],
  12070. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  12071. -0.0340]]], device='cuda:0')
  12072. loss_train_step before backward: tensor(0.0315, device='cuda:0', grad_fn=<MseLossBackward>)
  12073. loss_train_step after backward: tensor(0.0315, device='cuda:0', grad_fn=<MseLossBackward>)
  12074. loss_train: 0.2607172168791294
  12075. step: 8
  12076. running loss: 0.032589652109891176
  12077. Train Steps: 8/90 Loss: 0.0326 torch.Size([8, 600, 800])
  12078. torch.Size([8, 8])
  12079. tensor([[0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  12080. [0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471],
  12081. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  12082. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495],
  12083. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  12084. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  12085. [0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  12086. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578]],
  12087. device='cuda:0', dtype=torch.float64)
  12088. predictions are: tensor([[ 0.9991, -0.1294, 1.8289, -0.3092, -0.4135, -0.4943, 0.7495, 0.1788],
  12089. [ 0.6798, -0.3583, 1.8032, -0.0833, -0.4193, -0.0604, 0.7310, 0.2062],
  12090. [-1.1939, -1.5435, 1.6261, -0.7515, -0.1293, -1.0238, 0.6422, 0.2504],
  12091. [ 1.0001, -0.1213, 1.0754, -0.6870, -0.5014, -0.7288, 0.2028, 0.2405],
  12092. [ 1.0468, -0.0862, 1.6703, 0.3435, -0.3764, 0.3130, 0.1611, 0.1331],
  12093. [ 0.9204, -0.1412, 1.6262, 0.0114, -0.5259, -0.2258, 0.2021, 0.2598],
  12094. [ 0.7783, -0.2752, 1.5301, -0.8552, -0.2124, -1.0131, 0.8405, 0.2358],
  12095. [-0.8339, -1.2837, 1.0198, -0.9123, -0.5547, -0.8795, 0.0556, 0.2826]],
  12096. device='cuda:0', grad_fn=<AddmmBackward>)
  12097. landmarks are: tensor([[[ 6.3883e-01, -3.6231e-01, 1.9173e+00, -7.3857e-01, -3.5173e-01,
  12098. -5.8460e-01, 1.1495e+00, 2.6764e-01],
  12099. [ 6.4542e-01, -3.6231e-01, 1.9346e+00, -4.4604e-01, -4.9607e-01,
  12100. -2.9207e-01, 1.1642e+00, 2.4092e-01],
  12101. [-2.2859e+00, -2.2859e+00, 1.8249e+00, -8.0015e-01, 4.0878e-02,
  12102. -1.2543e+00, 8.0590e-01, 3.0505e-01],
  12103. [ 5.4417e-01, -3.8545e-01, 1.0224e+00, -9.5412e-01, -6.1155e-01,
  12104. -9.2333e-01, 1.7452e-01, 2.5215e-01],
  12105. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  12106. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  12107. [ 6.0722e-01, -3.2394e-01, 1.8423e+00, -3.5366e-01, -4.9607e-01,
  12108. -3.9215e-01, 2.0831e-01, 1.8522e-01],
  12109. [ 6.0425e-01, -4.1045e-01, 1.5478e+00, -1.2082e+00, -1.2079e-01,
  12110. -1.0927e+00, 9.7040e-01, 3.1574e-01],
  12111. [-2.2859e+00, -2.2859e+00, 1.1020e+00, -1.0994e+00, -5.3649e-01,
  12112. -1.0542e+00, 5.4227e-02, 2.9047e-01]]], device='cuda:0')
  12113. loss_train_step before backward: tensor(0.1190, device='cuda:0', grad_fn=<MseLossBackward>)
  12114. loss_train_step after backward: tensor(0.1190, device='cuda:0', grad_fn=<MseLossBackward>)
  12115. loss_train: 0.3797225020825863
  12116. step: 9
  12117. running loss: 0.042191389120287366
  12118. Train Steps: 9/90 Loss: 0.0422 torch.Size([8, 600, 800])
  12119. torch.Size([8, 8])
  12120. tensor([[0.6275, 0.4157, 0.8337, 0.5800, 0.3763, 0.4200, 0.5547, 0.6125],
  12121. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  12122. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  12123. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  12124. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  12125. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  12126. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  12127. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528]],
  12128. device='cuda:0', dtype=torch.float64)
  12129. predictions are: tensor([[ 1.2359, 0.0152, 1.4352, 0.4591, -0.4579, -0.1886, 0.3458, 0.3827],
  12130. [-1.4108, -1.7165, 1.6278, -0.9198, -0.0999, -1.1243, 0.6107, 0.2600],
  12131. [ 1.0880, -0.0631, 1.4730, -0.7942, -0.2523, -1.2433, 0.1780, 0.2025],
  12132. [ 0.9040, -0.1922, 1.7536, -0.0645, -0.4241, 0.4290, 0.6224, 0.1873],
  12133. [ 0.9999, -0.1657, 1.5762, -0.5998, -0.5918, -0.5274, 0.6032, 0.1100],
  12134. [ 0.6061, -0.3682, 1.4800, -0.3083, -0.6131, -0.1629, 0.2296, 0.2176],
  12135. [ 0.9515, -0.1362, 1.5629, -0.2965, -0.5961, -0.2386, 0.4166, 0.2649],
  12136. [-0.7224, -1.2803, 1.7950, -0.7486, -0.2483, -0.8924, 0.8542, 0.2345]],
  12137. device='cuda:0', grad_fn=<AddmmBackward>)
  12138. landmarks are: tensor([[[ 0.6124, -0.3658, 1.5651, 0.3931, -0.5480, -0.3460, 0.2761,
  12139. 0.5431],
  12140. [-2.2859, -2.2859, 1.8249, -0.8002, 0.0409, -1.2543, 0.8059,
  12141. 0.3050],
  12142. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  12143. -0.0368],
  12144. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  12145. 0.0851],
  12146. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  12147. -0.0220],
  12148. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  12149. 0.3559],
  12150. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  12151. 0.2930],
  12152. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  12153. 0.2676]]], device='cuda:0')
  12154. loss_train_step before backward: tensor(0.1079, device='cuda:0', grad_fn=<MseLossBackward>)
  12155. loss_train_step after backward: tensor(0.1079, device='cuda:0', grad_fn=<MseLossBackward>)
  12156. loss_train: 0.48758096620440483
  12157. step: 10
  12158. running loss: 0.048758096620440484
  12159.  
  12160. Train Steps: 10/90 Loss: 0.0488 torch.Size([8, 600, 800])
  12161. torch.Size([8, 8])
  12162. tensor([[0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  12163. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  12164. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  12165. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  12166. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  12167. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  12168. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  12169. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901]],
  12170. device='cuda:0', dtype=torch.float64)
  12171. predictions are: tensor([[ 0.7067, -0.3148, 1.0492, -1.0354, -0.4981, -0.9338, 0.3020, 0.3286],
  12172. [-0.7523, -1.2924, 0.9029, -1.2760, -0.3634, -1.3894, 0.3071, 0.3262],
  12173. [ 0.6640, -0.3744, 1.8604, -0.2007, -0.5467, 0.1417, 0.5132, 0.2404],
  12174. [ 0.5437, -0.4182, 1.7214, 0.1975, -0.6007, -0.5034, 0.4236, 0.2390],
  12175. [ 0.3511, -0.5864, 1.7093, -0.9693, 0.0304, -1.2827, 1.0219, 0.1822],
  12176. [ 1.1674, -0.0858, 1.8699, -0.0512, -0.5583, -0.3091, 0.7732, 0.1525],
  12177. [ 0.3252, -0.5765, 1.7152, 0.1841, -0.2517, 0.2405, 0.2954, 0.2331],
  12178. [ 0.3638, -0.5548, 1.8978, -0.1514, -0.4938, -0.0809, 0.1914, 0.1650]],
  12179. device='cuda:0', grad_fn=<AddmmBackward>)
  12180. landmarks are: tensor([[[ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  12181. 0.3315],
  12182. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  12183. 0.3604],
  12184. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  12185. 0.1775],
  12186. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  12187. 0.2058],
  12188. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  12189. 0.1821],
  12190. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  12191. 0.0325],
  12192. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  12193. 0.0851],
  12194. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  12195. -0.0220]]], device='cuda:0')
  12196. loss_train_step before backward: tensor(0.0692, device='cuda:0', grad_fn=<MseLossBackward>)
  12197. loss_train_step after backward: tensor(0.0692, device='cuda:0', grad_fn=<MseLossBackward>)
  12198. loss_train: 0.5567609034478664
  12199. step: 11
  12200. running loss: 0.05061462758616968
  12201. Train Steps: 11/90 Loss: 0.0506 torch.Size([8, 600, 800])
  12202. torch.Size([8, 8])
  12203. tensor([[0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  12204. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  12205. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  12206. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  12207. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  12208. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  12209. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  12210. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402]],
  12211. device='cuda:0', dtype=torch.float64)
  12212. predictions are: tensor([[ 0.3899, -0.5611, 1.6083, -1.0398, -0.0411, -1.4380, 0.9611, 0.1850],
  12213. [ 0.7063, -0.3622, 1.7582, -0.4214, -0.6344, -0.0607, 0.7025, 0.2027],
  12214. [ 0.0398, -0.7886, 1.7258, -0.0711, -0.5843, 0.0780, 0.3114, 0.1939],
  12215. [ 0.3534, -0.5398, 1.6284, -0.9779, -0.2579, -1.2172, 0.6238, 0.2286],
  12216. [ 0.5881, -0.3905, 1.2062, -1.0493, -0.2944, -1.2115, 0.6174, 0.4106],
  12217. [ 0.1641, -0.6547, 1.5900, -0.0401, -0.4739, 0.0842, 0.2363, 0.2308],
  12218. [ 0.3576, -0.5340, 1.6793, -0.2877, -0.6649, -0.5644, 0.2157, 0.2440],
  12219. [ 0.3927, -0.5486, 1.7002, 0.2642, -0.4248, -0.0980, 0.4854, 0.1575]],
  12220. device='cuda:0', grad_fn=<AddmmBackward>)
  12221. landmarks are: tensor([[[ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  12222. 0.1020],
  12223. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  12224. 0.2083],
  12225. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  12226. 0.3469],
  12227. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  12228. 0.2043],
  12229. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  12230. 0.6084],
  12231. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  12232. 0.2386],
  12233. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  12234. 0.4032],
  12235. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  12236. 0.2091]]], device='cuda:0')
  12237. loss_train_step before backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  12238. loss_train_step after backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  12239. loss_train: 0.5767896324396133
  12240. step: 12
  12241. running loss: 0.04806580270330111
  12242. Train Steps: 12/90 Loss: 0.0481 torch.Size([8, 600, 800])
  12243. torch.Size([8, 8])
  12244. tensor([[0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  12245. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  12246. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  12247. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  12248. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  12249. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  12250. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  12251. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240]],
  12252. device='cuda:0', dtype=torch.float64)
  12253. predictions are: tensor([[ 0.7066, -0.3359, 1.6617, 0.1113, -0.4845, 0.2730, 0.3180, 0.1751],
  12254. [ 0.6655, -0.3258, 1.6267, 0.1583, -0.5994, -0.3720, 0.3459, 0.2149],
  12255. [ 0.7973, -0.2172, 1.5151, -0.6836, -0.6012, -0.6649, 0.2786, 0.2913],
  12256. [ 0.7946, -0.2888, 1.9036, -0.3246, -0.5414, -0.2549, 0.8325, 0.2533],
  12257. [ 0.5353, -0.4337, 1.5933, -0.9831, -0.0078, -1.1072, 0.9309, 0.2004],
  12258. [ 0.3392, -0.5292, 1.6934, -0.5276, -0.3595, -1.0432, 0.5401, 0.1994],
  12259. [-2.1027, -2.1584, 1.0679, -0.8955, -0.4812, -0.9877, 0.2749, 0.2430],
  12260. [ 0.5163, -0.4084, 1.4821, -1.0341, -0.1654, -1.1220, 0.6254, 0.2533]],
  12261. device='cuda:0', grad_fn=<AddmmBackward>)
  12262. landmarks are: tensor([[[ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  12263. 0.0711],
  12264. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  12265. 0.1698],
  12266. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  12267. 0.1698],
  12268. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  12269. 0.2676],
  12270. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  12271. 0.1821],
  12272. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  12273. -0.0529],
  12274. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  12275. 0.2183],
  12276. [ 0.6088, -0.4015, 1.6113, -1.0696, -0.0861, -1.4545, 0.6051,
  12277. 0.1343]]], device='cuda:0')
  12278. loss_train_step before backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  12279. loss_train_step after backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  12280. loss_train: 0.5947947613894939
  12281. step: 13
  12282. running loss: 0.045753443183807224
  12283. Train Steps: 13/90 Loss: 0.0458 torch.Size([8, 600, 800])
  12284. torch.Size([8, 8])
  12285. tensor([[0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  12286. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  12287. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  12288. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  12289. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  12290. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  12291. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  12292. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800]],
  12293. device='cuda:0', dtype=torch.float64)
  12294. predictions are: tensor([[ 0.8568, -0.1986, 1.7606, -0.0271, -0.2534, -0.0415, 0.1967, 0.1760],
  12295. [ 1.1717, -0.0319, 1.6136, -0.6131, -0.6550, -0.5300, 0.3238, 0.1442],
  12296. [ 1.0539, -0.1441, 1.7893, -0.6783, -0.5686, -0.2087, 0.8835, 0.2074],
  12297. [ 1.0515, -0.1461, 1.7092, -0.7597, -0.5884, -0.7283, 0.6856, 0.1205],
  12298. [ 0.7875, -0.2442, 1.7666, 0.2316, -0.5501, -0.6627, 0.4504, 0.2163],
  12299. [-2.0296, -2.1249, 1.2080, -0.9242, -0.4599, -1.0183, 0.2166, 0.2925],
  12300. [-1.3036, -1.6394, 1.8677, -0.7513, 0.0723, -1.0658, 1.0924, 0.3734],
  12301. [ 0.5397, -0.3751, 1.1715, -0.8596, -0.4805, -1.1048, 0.2473, 0.3443]],
  12302. device='cuda:0', grad_fn=<AddmmBackward>)
  12303. landmarks are: tensor([[[ 5.3508e-01, -4.1527e-01, 1.7326e+00, -4.5727e-02, -2.2139e-01,
  12304. -4.6642e-02, 4.3431e-02, 2.2284e-01],
  12305. [ 5.2061e-01, -4.6028e-01, 1.4670e+00, -4.7683e-01, -6.5774e-01,
  12306. -3.9985e-01, 1.8356e-01, 2.0831e-03],
  12307. [ 6.1083e-01, -4.2731e-01, 1.8711e+00, -6.6159e-01, -5.7691e-01,
  12308. -1.9969e-01, 9.1557e-01, 1.5543e-01],
  12309. [ 6.0306e-01, -4.3072e-01, 1.7268e+00, -8.0015e-01, -6.0577e-01,
  12310. -6.4619e-01, 6.4417e-01, -2.1963e-02],
  12311. [ 5.6966e-01, -4.5138e-01, 1.7420e+00, 2.6720e-01, -6.0553e-01,
  12312. -6.3118e-01, 3.4489e-01, 2.0578e-01],
  12313. [-2.2859e+00, -2.2859e+00, 1.2030e+00, -1.0288e+00, -4.9607e-01,
  12314. -1.1081e+00, 8.1293e-02, 3.1609e-01],
  12315. [-2.2859e+00, -2.2859e+00, 1.8192e+00, -8.5404e-01, 1.4480e-01,
  12316. -9.8491e-01, 1.0143e+00, 4.8673e-01],
  12317. [ 5.5484e-01, -3.9360e-01, 1.1634e+00, -8.1049e-01, -5.1917e-01,
  12318. -1.0696e+00, 2.3718e-01, 3.9307e-01]]], device='cuda:0')
  12319. loss_train_step before backward: tensor(0.0493, device='cuda:0', grad_fn=<MseLossBackward>)
  12320. loss_train_step after backward: tensor(0.0493, device='cuda:0', grad_fn=<MseLossBackward>)
  12321. loss_train: 0.644109707325697
  12322. step: 14
  12323. running loss: 0.04600783623754978
  12324.  
  12325. Train Steps: 14/90 Loss: 0.0460 torch.Size([8, 600, 800])
  12326. torch.Size([8, 8])
  12327. tensor([[0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  12328. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  12329. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  12330. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  12331. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  12332. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  12333. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  12334. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567]],
  12335. device='cuda:0', dtype=torch.float64)
  12336. predictions are: tensor([[ 0.3045, -0.5674, 1.3769, -0.9429, -0.6118, -0.4503, 0.2990, 0.2750],
  12337. [ 0.0977, -0.6868, 1.3143, -0.7793, 0.0222, -1.2691, 0.4035, 0.3906],
  12338. [ 0.4517, -0.4892, 1.5790, -0.6596, -0.6443, -0.5839, 0.3201, 0.2341],
  12339. [ 0.0941, -0.8263, 1.9781, -0.0808, -0.4988, 0.1383, 0.6655, 0.1129],
  12340. [ 0.4164, -0.5374, 1.9136, 0.3085, -0.5462, -0.6897, 0.5370, 0.1564],
  12341. [ 0.2482, -0.6505, 2.1673, -0.2775, -0.6107, -0.3451, 0.8151, 0.0446],
  12342. [-0.0211, -0.7762, 1.3772, -0.9917, -0.2255, -1.2161, 0.5604, 0.3626],
  12343. [ 0.3111, -0.6232, 1.2350, -1.1596, -0.4139, -1.2741, 0.4848, 0.2642]],
  12344. device='cuda:0', grad_fn=<AddmmBackward>)
  12345. landmarks are: tensor([[[ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  12346. 0.1193],
  12347. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  12348. 0.5624],
  12349. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  12350. 0.3417],
  12351. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  12352. 0.1449],
  12353. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  12354. 0.2058],
  12355. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  12356. -0.0400],
  12357. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  12358. 0.2853],
  12359. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  12360. 0.2853]]], device='cuda:0')
  12361. loss_train_step before backward: tensor(0.0427, device='cuda:0', grad_fn=<MseLossBackward>)
  12362. loss_train_step after backward: tensor(0.0427, device='cuda:0', grad_fn=<MseLossBackward>)
  12363. loss_train: 0.6868270449340343
  12364. step: 15
  12365. running loss: 0.04578846966226895
  12366. Train Steps: 15/90 Loss: 0.0458 torch.Size([8, 600, 800])
  12367. torch.Size([8, 8])
  12368. tensor([[0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  12369. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  12370. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  12371. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  12372. [0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  12373. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  12374. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  12375. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667]],
  12376. device='cuda:0', dtype=torch.float64)
  12377. predictions are: tensor([[ 0.4056, -0.5116, 1.7553, -0.5207, -0.1930, -1.2530, 0.6542, 0.2057],
  12378. [ 0.0376, -0.7179, 1.3283, -0.9410, -0.3670, -1.1820, 0.3219, 0.2579],
  12379. [ 0.7586, -0.2953, 1.6136, -0.7672, -0.5980, -0.7300, 0.5055, 0.2464],
  12380. [ 1.1241, -0.0934, 1.7848, -0.3410, -0.5859, -0.2160, 0.5642, 0.0793],
  12381. [ 0.6242, -0.3637, 1.8110, -0.4475, -0.5276, -0.6335, 0.5430, 0.2081],
  12382. [-2.5332, -2.4693, 1.1160, -0.8603, -0.3118, -1.1134, 0.3019, 0.2916],
  12383. [ 0.6375, -0.3858, 1.7093, 0.0144, -0.3216, -0.1430, 0.4885, 0.1177],
  12384. [ 0.4408, -0.4880, 1.7590, -0.6851, -0.6015, -0.5339, 0.6534, 0.3028]],
  12385. device='cuda:0', grad_fn=<AddmmBackward>)
  12386. landmarks are: tensor([[[ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  12387. -0.0529],
  12388. [ 0.5798, -0.4156, 1.3977, -1.0388, -0.4672, -1.1004, 0.3469,
  12389. 0.1082],
  12390. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  12391. 0.1753],
  12392. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  12393. -0.0670],
  12394. [ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  12395. 0.2464],
  12396. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  12397. 0.2183],
  12398. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  12399. 0.0159],
  12400. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  12401. 0.3315]]], device='cuda:0')
  12402. loss_train_step before backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  12403. loss_train_step after backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  12404. loss_train: 0.7119743004441261
  12405. step: 16
  12406. running loss: 0.04449839377775788
  12407. Train Steps: 16/90 Loss: 0.0445 torch.Size([8, 600, 800])
  12408. torch.Size([8, 8])
  12409. tensor([[0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  12410. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  12411. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  12412. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  12413. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  12414. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  12415. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  12416. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  12417. device='cuda:0', dtype=torch.float64)
  12418. predictions are: tensor([[-0.5698, -1.1630, 1.7988, -1.0738, 0.0985, -1.2631, 0.9678, 0.2631],
  12419. [ 0.6247, -0.3964, 1.8911, -0.4913, -0.7389, -0.3246, 0.3989, 0.1941],
  12420. [-1.1609, -1.5773, 1.9380, -0.7570, -0.0841, -1.2592, 0.9371, 0.2391],
  12421. [ 0.4757, -0.5144, 1.6757, 0.2291, -0.5092, -0.3942, 0.3250, 0.1567],
  12422. [ 0.1884, -0.6917, 1.8490, -0.1794, -0.5994, 0.2266, 0.3432, 0.1332],
  12423. [ 0.6206, -0.3816, 1.1967, -1.1353, -0.5213, -1.1738, 0.2903, 0.2247],
  12424. [ 0.6793, -0.3524, 1.1073, -1.2023, -0.6062, -1.0704, 0.3309, 0.2422],
  12425. [ 0.5047, -0.4610, 1.5853, 0.0454, -0.5763, -0.2399, 0.3652, 0.1877]],
  12426. device='cuda:0', grad_fn=<AddmmBackward>)
  12427. landmarks are: tensor([[[ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  12428. 0.2142],
  12429. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  12430. 0.3161],
  12431. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  12432. 0.2142],
  12433. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  12434. 0.1313],
  12435. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  12436. 0.1082],
  12437. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  12438. 0.1390],
  12439. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  12440. 0.2699],
  12441. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  12442. 0.1768]]], device='cuda:0')
  12443. loss_train_step before backward: tensor(0.1294, device='cuda:0', grad_fn=<MseLossBackward>)
  12444. loss_train_step after backward: tensor(0.1294, device='cuda:0', grad_fn=<MseLossBackward>)
  12445. loss_train: 0.8413371220231056
  12446. step: 17
  12447. running loss: 0.04949041894253563
  12448. Train Steps: 17/90 Loss: 0.0495 torch.Size([8, 600, 800])
  12449. torch.Size([8, 8])
  12450. tensor([[0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  12451. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  12452. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  12453. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  12454. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  12455. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  12456. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  12457. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500]],
  12458. device='cuda:0', dtype=torch.float64)
  12459. predictions are: tensor([[ 0.3496, -0.6161, 1.8231, -0.7200, -0.6343, -0.1043, 0.8363, 0.1154],
  12460. [ 0.2936, -0.5610, 1.7201, -0.4867, -0.2092, -0.3321, 0.2514, 0.2062],
  12461. [ 0.5884, -0.4009, 1.6049, 0.0735, -0.1333, -0.5680, 0.4170, 0.2590],
  12462. [-0.0426, -0.8502, 1.6135, 0.1152, -0.2904, -0.5447, 0.2721, 0.1971],
  12463. [-0.1033, -0.8852, 2.0310, -0.9600, -0.3148, -1.1868, 1.0985, 0.2178],
  12464. [ 0.2483, -0.6758, 1.7849, -0.3754, -0.3378, -0.4320, 0.2930, 0.1095],
  12465. [-0.0405, -0.8126, 1.6816, -0.3414, -0.7438, -0.7737, 0.2725, 0.1434],
  12466. [ 0.3748, -0.5497, 1.3174, -1.2418, -0.7503, -0.8426, 0.5530, 0.2293]],
  12467. device='cuda:0', grad_fn=<AddmmBackward>)
  12468. landmarks are: tensor([[[ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  12469. 0.1005],
  12470. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  12471. 0.2853],
  12472. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  12473. 0.2997],
  12474. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  12475. -0.0610],
  12476. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  12477. 0.2676],
  12478. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  12479. 0.0051],
  12480. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  12481. 0.3854],
  12482. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  12483. 0.2545]]], device='cuda:0')
  12484. loss_train_step before backward: tensor(0.0813, device='cuda:0', grad_fn=<MseLossBackward>)
  12485. loss_train_step after backward: tensor(0.0813, device='cuda:0', grad_fn=<MseLossBackward>)
  12486. loss_train: 0.9225974231958389
  12487. step: 18
  12488. running loss: 0.05125541239976883
  12489.  
  12490. Train Steps: 18/90 Loss: 0.0513 torch.Size([8, 600, 800])
  12491. torch.Size([8, 8])
  12492. tensor([[0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  12493. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  12494. [0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567],
  12495. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  12496. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  12497. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  12498. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  12499. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719]],
  12500. device='cuda:0', dtype=torch.float64)
  12501. predictions are: tensor([[ 0.4430, -0.4844, 1.7350, -0.4449, -0.5268, -0.4250, 0.4806, 0.1754],
  12502. [ 0.7304, -0.3097, 1.7664, -0.6020, -0.5014, -0.2737, 0.5494, 0.1550],
  12503. [ 0.8088, -0.2873, 1.7017, -0.1383, -0.4139, -0.1332, 0.5881, 0.2076],
  12504. [-2.3069, -2.3295, 1.1612, -1.1341, -0.2896, -1.2715, 0.1326, 0.3356],
  12505. [ 0.6132, -0.3375, 1.7022, -0.2673, -0.5030, -0.4217, 0.3474, 0.1730],
  12506. [ 0.4882, -0.4704, 1.8124, -0.1721, -0.5237, -0.8142, 0.6059, 0.0388],
  12507. [ 0.4792, -0.4727, 1.7930, -0.9632, -0.2783, -1.1860, 0.7636, 0.1998],
  12508. [ 0.5194, -0.4366, 1.5938, -0.0664, -0.4184, -0.2661, 0.3575, 0.1813]],
  12509. device='cuda:0', grad_fn=<AddmmBackward>)
  12510. landmarks are: tensor([[[ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  12511. 0.1159],
  12512. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  12513. 0.1775],
  12514. [ 0.5770, -0.3918, 1.7961, 0.1544, -0.5480, 0.1467, 0.4450,
  12515. 0.2853],
  12516. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  12517. 0.2853],
  12518. [ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  12519. 0.2657],
  12520. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  12521. -0.0049],
  12522. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  12523. 0.1082],
  12524. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  12525. -0.1061]]], device='cuda:0')
  12526. loss_train_step before backward: tensor(0.0290, device='cuda:0', grad_fn=<MseLossBackward>)
  12527. loss_train_step after backward: tensor(0.0290, device='cuda:0', grad_fn=<MseLossBackward>)
  12528. loss_train: 0.9516376163810492
  12529. step: 19
  12530. running loss: 0.050086190335844695
  12531. Train Steps: 19/90 Loss: 0.0501 torch.Size([8, 600, 800])
  12532. torch.Size([8, 8])
  12533. tensor([[0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  12534. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  12535. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  12536. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883],
  12537. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  12538. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  12539. [0.6199, 0.4093, 0.7913, 0.2533, 0.4288, 0.2467, 0.5975, 0.5700],
  12540. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933]],
  12541. device='cuda:0', dtype=torch.float64)
  12542. predictions are: tensor([[ 0.1724, -0.7311, 1.9600, -0.4847, -0.5312, -0.7648, 0.7926, 0.1386],
  12543. [ 0.4509, -0.5342, 1.4227, -1.0582, -0.5859, -0.7999, 0.5457, 0.1146],
  12544. [ 0.0037, -0.8193, 1.9162, -0.4894, -0.6796, -0.5751, 0.5336, 0.0400],
  12545. [-0.0795, -0.8154, 1.1245, -0.8385, -0.5245, -0.8974, 0.2899, 0.3562],
  12546. [ 0.7510, -0.2744, 1.6003, -0.7833, -0.2182, -1.1405, 0.3211, 0.1225],
  12547. [ 0.1794, -0.6694, 1.7174, 0.0391, -0.2750, 0.1796, 0.3027, 0.1166],
  12548. [-0.3175, -1.0336, 1.3863, -1.1355, -0.3639, -1.0212, 0.5602, 0.2073],
  12549. [ 0.6083, -0.3555, 1.6484, 0.3436, -0.0741, -0.2059, 0.3531, 0.2449]],
  12550. device='cuda:0', grad_fn=<AddmmBackward>)
  12551. landmarks are: tensor([[[ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  12552. 0.1390],
  12553. [ 0.5477, -0.4413, 1.3688, -0.8771, -0.6115, -0.8771, 0.4104,
  12554. 0.0467],
  12555. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  12556. 0.0620],
  12557. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  12558. 0.4316],
  12559. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  12560. -0.0368],
  12561. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  12562. 0.2386],
  12563. [ 0.5771, -0.3955, 1.3688, -1.1158, -0.3055, -1.1466, 0.4739,
  12564. 0.3469],
  12565. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  12566. 0.4547]]], device='cuda:0')
  12567. loss_train_step before backward: tensor(0.0521, device='cuda:0', grad_fn=<MseLossBackward>)
  12568. loss_train_step after backward: tensor(0.0521, device='cuda:0', grad_fn=<MseLossBackward>)
  12569. loss_train: 1.0037182997912169
  12570. step: 20
  12571. running loss: 0.05018591498956084
  12572. Train Steps: 20/90 Loss: 0.0502 torch.Size([8, 600, 800])
  12573. torch.Size([8, 8])
  12574. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  12575. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  12576. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  12577. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  12578. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  12579. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  12580. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  12581. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717]],
  12582. device='cuda:0', dtype=torch.float64)
  12583. predictions are: tensor([[ 0.1581, -0.7393, 1.1670, -1.3299, -0.6123, -1.1580, 0.3761, 0.1508],
  12584. [ 0.7792, -0.3083, 1.7652, 0.1693, -0.4503, -0.1500, 0.5473, 0.1806],
  12585. [-0.0364, -0.8090, 1.1568, -1.1909, -0.6619, -0.9205, 0.3632, 0.2406],
  12586. [ 0.1614, -0.6613, 1.7122, -0.0781, -0.0744, -0.1382, 0.0251, 0.1446],
  12587. [ 0.1000, -0.7275, 1.7813, -0.1652, -0.1890, -0.0821, 0.1867, 0.1571],
  12588. [ 0.4845, -0.4482, 1.8444, -0.0939, -0.4233, -0.6957, 0.6399, 0.1452],
  12589. [ 0.5154, -0.4710, 1.9175, -0.6788, -0.4608, -0.8603, 0.9891, 0.1327],
  12590. [ 0.1317, -0.7220, 1.7761, -0.2175, -0.3860, -0.1320, 0.3566, 0.1352]],
  12591. device='cuda:0', grad_fn=<AddmmBackward>)
  12592. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  12593. 0.0562],
  12594. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  12595. 0.3007],
  12596. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  12597. 0.3007],
  12598. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  12599. 0.0532],
  12600. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  12601. 0.3392],
  12602. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  12603. 0.1661],
  12604. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  12605. 0.2890],
  12606. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  12607. 0.3546]]], device='cuda:0')
  12608. loss_train_step before backward: tensor(0.0353, device='cuda:0', grad_fn=<MseLossBackward>)
  12609. loss_train_step after backward: tensor(0.0353, device='cuda:0', grad_fn=<MseLossBackward>)
  12610. loss_train: 1.0390332210808992
  12611. step: 21
  12612. running loss: 0.049477772432423774
  12613. Train Steps: 21/90 Loss: 0.0495 torch.Size([8, 600, 800])
  12614. torch.Size([8, 8])
  12615. tensor([[0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  12616. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  12617. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  12618. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  12619. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  12620. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  12621. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  12622. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517]],
  12623. device='cuda:0', dtype=torch.float64)
  12624. predictions are: tensor([[ 0.5319, -0.4074, 1.9047, -0.0513, -0.4148, -0.4593, 0.4412, 0.1348],
  12625. [ 0.2248, -0.6662, 1.6434, -0.0576, -0.4394, -0.2607, 0.5983, 0.2211],
  12626. [ 0.5160, -0.4834, 1.7566, 0.1108, -0.4688, 0.0316, 0.6468, 0.1698],
  12627. [ 0.5514, -0.4455, 1.8779, 0.2109, -0.5295, -0.2038, 0.3353, -0.0306],
  12628. [ 0.0569, -0.7394, 0.9787, -1.4228, -0.3317, -1.4684, 0.0992, 0.2083],
  12629. [ 0.1960, -0.6464, 1.6755, -0.2134, -0.4800, 0.0778, 0.1021, 0.1230],
  12630. [ 0.3866, -0.5533, 2.0356, -0.8076, -0.3010, -0.5609, 0.8130, 0.1686],
  12631. [ 0.2819, -0.5713, 1.0122, -1.2399, -0.3901, -1.1646, 0.2829, 0.3324]],
  12632. device='cuda:0', grad_fn=<AddmmBackward>)
  12633. landmarks are: tensor([[[ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  12634. 0.1661],
  12635. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  12636. 0.3745],
  12637. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  12638. 0.3745],
  12639. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  12640. -0.0102],
  12641. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  12642. 0.0261],
  12643. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  12644. 0.2386],
  12645. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  12646. 0.2676],
  12647. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  12648. 0.2622]]], device='cuda:0')
  12649. loss_train_step before backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  12650. loss_train_step after backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  12651. loss_train: 1.0764061901718378
  12652. step: 22
  12653. running loss: 0.0489275540987199
  12654.  
  12655. Train Steps: 22/90 Loss: 0.0489 torch.Size([8, 600, 800])
  12656. torch.Size([8, 8])
  12657. tensor([[0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  12658. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  12659. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  12660. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  12661. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  12662. [0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297],
  12663. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  12664. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879]],
  12665. device='cuda:0', dtype=torch.float64)
  12666. predictions are: tensor([[ 0.4221, -0.4916, 1.3856, -0.8910, -0.5794, -0.8885, 0.3294, 0.2227],
  12667. [ 0.3831, -0.5018, 1.5959, 0.2377, -0.1456, -0.1022, 0.0904, 0.2351],
  12668. [ 0.6868, -0.3415, 1.8932, -0.6819, -0.1232, -1.1595, 0.8876, 0.1838],
  12669. [ 0.5910, -0.4053, 1.6661, -0.5671, -0.6732, -0.4688, 0.3958, 0.1051],
  12670. [ 0.2762, -0.5875, 1.6663, 0.0127, -0.2104, -0.0351, 0.2161, 0.1858],
  12671. [ 0.2888, -0.6276, 1.7013, 0.0176, -0.4367, -0.1943, 0.6267, 0.1648],
  12672. [ 0.4352, -0.4806, 1.5642, -0.6004, -0.6763, -0.3811, 0.2263, 0.1577],
  12673. [ 0.2547, -0.6514, 1.8138, -0.4008, -0.4382, 0.1134, 0.4997, 0.0756]],
  12674. device='cuda:0', grad_fn=<AddmmBackward>)
  12675. landmarks are: tensor([[[ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  12676. 0.3087],
  12677. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  12678. 0.2138],
  12679. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  12680. 0.2142],
  12681. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  12682. -0.0611],
  12683. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  12684. 0.0851],
  12685. [ 0.6207, -0.4466, 1.7326, 0.1621, -0.5480, -0.1073, 0.9704,
  12686. 0.1608],
  12687. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  12688. 0.3559],
  12689. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  12690. -0.0322]]], device='cuda:0')
  12691. loss_train_step before backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  12692. loss_train_step after backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  12693. loss_train: 1.0940845366567373
  12694. step: 23
  12695. running loss: 0.04756889289811901
  12696. Train Steps: 23/90 Loss: 0.0476 torch.Size([8, 600, 800])
  12697. torch.Size([8, 8])
  12698. tensor([[0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  12699. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  12700. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  12701. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496],
  12702. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  12703. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  12704. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  12705. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717]],
  12706. device='cuda:0', dtype=torch.float64)
  12707. predictions are: tensor([[ 0.4754, -0.4291, 0.9876, -0.9167, -0.4275, -0.9420, 0.2557, 0.2084],
  12708. [ 0.5949, -0.3673, 0.9835, -0.8483, -0.4139, -1.0030, 0.3359, 0.2510],
  12709. [-1.5239, -1.7801, 1.4724, -0.5498, -0.4969, -0.6206, 0.1061, 0.2190],
  12710. [ 1.0447, -0.0863, 1.6853, -0.6476, -0.2820, -0.6336, 0.6414, 0.1602],
  12711. [ 0.7545, -0.2793, 1.3460, -0.7836, -0.4708, -0.6146, 0.4870, 0.2678],
  12712. [ 0.8902, -0.1837, 1.6729, -0.4024, -0.5099, -0.6107, 0.3860, 0.1088],
  12713. [ 0.6083, -0.3687, 1.9450, 0.3126, -0.4421, 0.1083, 0.5850, 0.1294],
  12714. [ 0.5531, -0.4151, 1.8876, 0.2921, -0.2572, 0.2739, 0.4322, 0.0999]],
  12715. device='cuda:0', grad_fn=<AddmmBackward>)
  12716. landmarks are: tensor([[[ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  12717. 0.0712],
  12718. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  12719. 0.3852],
  12720. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  12721. 0.1133],
  12722. [ 0.5790, -0.4031, 1.6915, -0.9564, -0.4152, -1.1063, 0.4425,
  12723. 0.2528],
  12724. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  12725. 0.2853],
  12726. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  12727. 0.1005],
  12728. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  12729. 0.1159],
  12730. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  12731. 0.3546]]], device='cuda:0')
  12732. loss_train_step before backward: tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward>)
  12733. loss_train_step after backward: tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward>)
  12734. loss_train: 1.1515279468148947
  12735. step: 24
  12736. running loss: 0.04798033111728728
  12737. Train Steps: 24/90 Loss: 0.0480 torch.Size([8, 600, 800])
  12738. torch.Size([8, 8])
  12739. tensor([[0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  12740. [0.6289, 0.4081, 0.8720, 0.3487, 0.3900, 0.3183, 0.6703, 0.5376],
  12741. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  12742. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  12743. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280],
  12744. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  12745. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  12746. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683]],
  12747. device='cuda:0', dtype=torch.float64)
  12748. predictions are: tensor([[ 0.5418, -0.4124, 1.8235, -0.1119, -0.3812, 0.1074, 0.7229, 0.1254],
  12749. [ 0.6203, -0.3487, 1.6785, -0.5720, -0.4225, -0.8041, 0.6948, 0.1912],
  12750. [-1.7598, -1.9331, 1.1522, -1.0600, -0.4270, -0.9675, -0.0287, 0.3160],
  12751. [ 1.1561, -0.0339, 1.7192, 0.2305, -0.5978, -0.1364, 0.6343, 0.0543],
  12752. [ 0.7348, -0.2362, 1.6043, 0.1218, -0.2008, 0.1591, 0.0928, 0.1539],
  12753. [ 0.6645, -0.3278, 1.6605, 0.1640, -0.3562, 0.2098, 0.6699, 0.1587],
  12754. [ 0.8523, -0.1380, 1.3972, -0.5103, -0.4060, -0.9285, 0.1484, 0.2288],
  12755. [ 0.9301, -0.1348, 1.4233, -0.9516, -0.4670, -0.7360, 0.4224, 0.2452]],
  12756. device='cuda:0', grad_fn=<AddmmBackward>)
  12757. landmarks are: tensor([[[ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  12758. -0.0881],
  12759. [ 0.6191, -0.4008, 1.7420, -0.6753, -0.4845, -0.8156, 0.8101,
  12760. 0.1974],
  12761. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  12762. 0.1005],
  12763. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  12764. -0.1278],
  12765. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  12766. 0.1530],
  12767. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  12768. 0.1176],
  12769. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  12770. 0.2261],
  12771. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  12772. 0.3392]]], device='cuda:0')
  12773. loss_train_step before backward: tensor(0.0297, device='cuda:0', grad_fn=<MseLossBackward>)
  12774. loss_train_step after backward: tensor(0.0297, device='cuda:0', grad_fn=<MseLossBackward>)
  12775. loss_train: 1.1811874378472567
  12776. step: 25
  12777. running loss: 0.04724749751389026
  12778. Train Steps: 25/90 Loss: 0.0472 torch.Size([8, 600, 800])
  12779. torch.Size([8, 8])
  12780. tensor([[0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  12781. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  12782. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  12783. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  12784. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  12785. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  12786. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  12787. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600]],
  12788. device='cuda:0', dtype=torch.float64)
  12789. predictions are: tensor([[ 1.1092, -0.0598, 1.7175, -0.5010, -0.7258, -0.0769, 0.5840, 0.1207],
  12790. [ 0.7990, -0.2687, 1.0544, -0.9522, -0.4777, -1.0258, 0.1616, 0.2518],
  12791. [ 0.6795, -0.3569, 1.8876, 0.3645, -0.4024, 0.2626, 0.5803, 0.1490],
  12792. [ 0.8305, -0.2397, 1.7730, -0.4483, -0.3952, -0.6633, 0.7930, 0.1416],
  12793. [ 1.0673, -0.0639, 1.7255, 0.5401, -0.5086, -0.2005, 0.5255, 0.2547],
  12794. [ 0.7767, -0.2754, 1.1634, -1.0008, -0.5500, -0.8639, 0.2313, 0.1580],
  12795. [-1.7676, -1.9638, 1.1525, -1.1372, -0.3661, -1.0775, 0.0339, 0.3052],
  12796. [ 0.5077, -0.4275, 1.8660, 0.0588, -0.0673, 0.2542, 0.3526, 0.2022]],
  12797. device='cuda:0', grad_fn=<AddmmBackward>)
  12798. landmarks are: tensor([[[ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  12799. 0.2365],
  12800. [ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  12801. 0.2776],
  12802. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  12803. 0.1544],
  12804. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  12805. 0.2035],
  12806. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  12807. 0.4778],
  12808. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  12809. 0.0802],
  12810. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  12811. 0.1373],
  12812. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  12813. 0.3007]]], device='cuda:0')
  12814. loss_train_step before backward: tensor(0.0428, device='cuda:0', grad_fn=<MseLossBackward>)
  12815.  
  12816. loss_train_step after backward: tensor(0.0428, device='cuda:0', grad_fn=<MseLossBackward>)
  12817. loss_train: 1.2239569071680307
  12818. step: 26
  12819. running loss: 0.047075265660308875
  12820. Train Steps: 26/90 Loss: 0.0471 torch.Size([8, 600, 800])
  12821. torch.Size([8, 8])
  12822. tensor([[0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  12823. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  12824. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  12825. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  12826. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  12827. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  12828. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  12829. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892]],
  12830. device='cuda:0', dtype=torch.float64)
  12831. predictions are: tensor([[ 0.5252, -0.4151, 1.6701, 0.0175, -0.1096, 0.1072, 0.4594, 0.2154],
  12832. [ 0.4531, -0.4956, 1.5928, 0.0686, -0.4088, 0.0361, 0.6365, 0.2085],
  12833. [ 0.2903, -0.5712, 1.5617, -0.4637, -0.6604, -0.6051, 0.1524, 0.2101],
  12834. [ 0.3504, -0.5716, 1.7172, -0.3043, -0.4345, 0.1715, 0.5451, 0.1113],
  12835. [ 0.3246, -0.5665, 1.6040, -0.0296, -0.3346, 0.0444, 0.3115, 0.2818],
  12836. [ 0.7752, -0.2857, 1.4962, -0.7700, -0.5900, -0.9204, 0.3944, 0.1760],
  12837. [ 1.0919, -0.0991, 1.5440, -0.8091, -0.4919, -1.0663, 0.7723, 0.1144],
  12838. [ 0.3260, -0.5237, 1.5657, -0.0825, -0.6330, -0.5299, 0.1789, 0.2688]],
  12839. device='cuda:0', grad_fn=<AddmmBackward>)
  12840. landmarks are: tensor([[[ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  12841. 0.0592],
  12842. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  12843. 0.1715],
  12844. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  12845. 0.2567],
  12846. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  12847. -0.0322],
  12848. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  12849. 0.3777],
  12850. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  12851. 0.1005],
  12852. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  12853. -0.0957],
  12854. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  12855. 0.4357]]], device='cuda:0')
  12856. loss_train_step before backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  12857. loss_train_step after backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  12858. loss_train: 1.2489608246833086
  12859. step: 27
  12860. running loss: 0.046257808321604026
  12861. Train Steps: 27/90 Loss: 0.0463 torch.Size([8, 600, 800])
  12862. torch.Size([8, 8])
  12863. tensor([[0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  12864. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  12865. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  12866. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  12867. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  12868. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  12869. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  12870. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083]],
  12871. device='cuda:0', dtype=torch.float64)
  12872. predictions are: tensor([[ 0.4644, -0.4701, 1.7021, 0.0982, -0.1020, 0.1515, 0.2594, 0.2304],
  12873. [ 0.6701, -0.3498, 1.1743, -1.0372, -0.5572, -0.7721, 0.4599, 0.2256],
  12874. [ 0.5408, -0.4026, 1.7313, 0.0126, -0.4380, -0.1173, 0.1420, 0.1929],
  12875. [ 0.6182, -0.3839, 1.3790, -0.8283, -0.5608, -0.8546, 0.4777, 0.1537],
  12876. [ 0.7149, -0.3733, 1.9399, 0.0853, -0.4579, 0.1658, 0.8671, 0.1258],
  12877. [ 0.4842, -0.4774, 1.7424, 0.0258, -0.5271, -0.1801, 0.4708, 0.1866],
  12878. [ 0.0581, -0.7235, 1.0430, -0.9465, -0.4204, -1.1660, 0.2980, 0.3445],
  12879. [ 0.5249, -0.4811, 1.8443, -0.2301, -0.6742, -0.5042, 0.4780, 0.0843]],
  12880. device='cuda:0', grad_fn=<AddmmBackward>)
  12881. landmarks are: tensor([[[ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  12882. 0.3007],
  12883. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  12884. 0.1621],
  12885. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  12886. 0.2409],
  12887. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  12888. 0.1080],
  12889. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  12890. 0.1313],
  12891. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  12892. 0.2314],
  12893. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  12894. 0.5855],
  12895. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  12896. 0.0620]]], device='cuda:0')
  12897. loss_train_step before backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  12898. loss_train_step after backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  12899. loss_train: 1.2669219318777323
  12900. step: 28
  12901. running loss: 0.04524721185277615
  12902. Train Steps: 28/90 Loss: 0.0452 torch.Size([8, 600, 800])
  12903. torch.Size([8, 8])
  12904. tensor([[0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  12905. [0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378],
  12906. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  12907. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  12908. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  12909. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  12910. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  12911. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719]],
  12912. device='cuda:0', dtype=torch.float64)
  12913. predictions are: tensor([[ 0.3292, -0.6127, 1.6667, 0.2913, -0.3799, 0.2480, 0.4851, 0.1940],
  12914. [ 0.5045, -0.4484, 1.7734, 0.2048, -0.5201, -0.0983, 0.3444, 0.1669],
  12915. [ 0.9764, -0.1649, 1.7343, -0.0197, -0.3502, 0.1187, 0.3336, 0.2008],
  12916. [ 0.6445, -0.4002, 1.4565, -1.2108, -0.2055, -1.2694, 0.7895, 0.1524],
  12917. [ 0.4371, -0.5265, 1.5985, -0.6078, -0.6801, -0.6091, 0.4320, 0.1052],
  12918. [ 0.9756, -0.1525, 1.5874, 0.0874, -0.4362, -0.7796, 0.5513, 0.2914],
  12919. [-0.1907, -0.9122, 1.2446, -1.0707, -0.4485, -0.9089, 0.2790, 0.2335],
  12920. [ 0.3977, -0.5413, 1.5528, -0.5059, -0.7190, -0.1582, 0.2814, 0.1526]],
  12921. device='cuda:0', grad_fn=<AddmmBackward>)
  12922. landmarks are: tensor([[[ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  12923. 0.1698],
  12924. [ 0.5435, -0.4045, 1.7557, 0.0851, -0.5307, -0.2844, 0.0172,
  12925. 0.1980],
  12926. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  12927. 0.3057],
  12928. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  12929. 0.1020],
  12930. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  12931. 0.1963],
  12932. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  12933. 0.5762],
  12934. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  12935. 0.3007],
  12936. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  12937. 0.3559]]], device='cuda:0')
  12938. loss_train_step before backward: tensor(0.1221, device='cuda:0', grad_fn=<MseLossBackward>)
  12939. loss_train_step after backward: tensor(0.1221, device='cuda:0', grad_fn=<MseLossBackward>)
  12940. loss_train: 1.3889758083969355
  12941. step: 29
  12942. running loss: 0.04789571753092881
  12943. Train Steps: 29/90 Loss: 0.0479 torch.Size([8, 600, 800])
  12944. torch.Size([8, 8])
  12945. tensor([[0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  12946. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  12947. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  12948. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  12949. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  12950. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  12951. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  12952. [0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373]],
  12953. device='cuda:0', dtype=torch.float64)
  12954. predictions are: tensor([[ 0.6447, -0.3391, 1.0203, -1.0295, -0.2438, -1.3132, 0.3005, 0.3568],
  12955. [ 0.7181, -0.3352, 1.7661, -0.0676, -0.5545, 0.0418, 0.3674, 0.1823],
  12956. [ 0.3253, -0.6027, 1.8249, -0.0198, -0.5174, 0.2183, 0.4973, 0.1816],
  12957. [ 1.0088, -0.1655, 1.8082, -0.0407, -0.3024, 0.0897, 0.3959, 0.1048],
  12958. [ 0.6614, -0.4317, 1.8519, -0.5815, -0.5667, -0.8422, 0.6848, 0.1938],
  12959. [-0.8125, -1.3321, 1.0198, -1.1514, -0.5100, -1.2320, 0.2646, 0.2864],
  12960. [ 0.6633, -0.3855, 1.5774, -0.5996, -0.7283, -0.3927, 0.4222, 0.1267],
  12961. [ 0.8054, -0.3088, 1.6503, 0.4464, -0.5051, -0.2037, 0.5452, 0.1913]],
  12962. device='cuda:0', grad_fn=<AddmmBackward>)
  12963. landmarks are: tensor([[[ 6.1010e-01, -3.1524e-01, 1.0166e+00, -7.5396e-01, -2.2633e-02,
  12964. -1.4468e+00, 2.8226e-01, 5.7018e-01],
  12965. [ 5.3684e-01, -4.4057e-01, 1.7730e+00, -1.7660e-01, -5.2494e-01,
  12966. -5.3426e-02, 2.3141e-01, 3.4688e-01],
  12967. [ 5.7760e-01, -4.4842e-01, 1.8249e+00, -1.8430e-01, -5.4226e-01,
  12968. 1.1594e-01, 5.5473e-01, 1.9292e-01],
  12969. [ 5.2494e-01, -4.4734e-01, 1.7326e+00, -9.1917e-02, -2.0162e-01,
  12970. 1.5443e-01, 1.7328e-01, 4.1158e-02],
  12971. [ 5.7921e-01, -4.0523e-01, 1.8214e+00, -6.5874e-01, -5.3842e-01,
  12972. -8.9239e-01, 4.3812e-01, 2.4425e-01],
  12973. [-2.2859e+00, -2.2859e+00, 9.4385e-01, -9.9666e-01, -4.6143e-01,
  12974. -1.1851e+00, 2.4679e-01, 4.0188e-01],
  12975. [ 5.2061e-01, -4.6028e-01, 1.4670e+00, -4.7683e-01, -6.5774e-01,
  12976. -3.9985e-01, 1.8356e-01, 2.0831e-03],
  12977. [ 5.6801e-01, -4.5619e-01, 1.5697e+00, 4.9469e-01, -4.9038e-01,
  12978. -1.5026e-01, 3.5357e-01, 1.9563e-01]]], device='cuda:0')
  12979. loss_train_step before backward: tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward>)
  12980. loss_train_step after backward: tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward>)
  12981. loss_train: 1.4559749905019999
  12982. step: 30
  12983. running loss: 0.048532499683399996
  12984.  
  12985. Train Steps: 30/90 Loss: 0.0485 torch.Size([8, 600, 800])
  12986. torch.Size([8, 8])
  12987. tensor([[0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  12988. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  12989. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  12990. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  12991. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  12992. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  12993. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  12994. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938]],
  12995. device='cuda:0', dtype=torch.float64)
  12996. predictions are: tensor([[ 0.3969, -0.5640, 1.6768, 0.0966, -0.4565, -0.4329, 0.6561, 0.2496],
  12997. [ 0.2968, -0.6093, 1.6604, -0.1043, -0.5758, -0.1632, 0.3509, 0.3169],
  12998. [ 0.7539, -0.3650, 1.8065, -0.1882, -0.5726, -0.0869, 0.6342, 0.1433],
  12999. [ 0.2691, -0.5931, 1.1348, -1.0432, -0.6014, -1.0747, 0.2123, 0.2751],
  13000. [ 0.8217, -0.2588, 1.6736, -0.1274, -0.1709, -0.0524, 0.2523, 0.2500],
  13001. [ 0.5199, -0.5038, 1.1993, -1.2389, -0.5359, -1.1787, 0.5091, 0.2795],
  13002. [ 0.3096, -0.5846, 1.7719, -0.4621, -0.6384, -0.5422, 0.2241, 0.1382],
  13003. [ 0.4792, -0.4978, 1.7307, 0.2366, -0.4688, -0.1269, 0.5286, 0.1288]],
  13004. device='cuda:0', grad_fn=<AddmmBackward>)
  13005. landmarks are: tensor([[[ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  13006. 0.3692],
  13007. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  13008. 0.5239],
  13009. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  13010. 0.0774],
  13011. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  13012. 0.3931],
  13013. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  13014. 0.3087],
  13015. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  13016. 0.3007],
  13017. [ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  13018. -0.0310],
  13019. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  13020. -0.0049]]], device='cuda:0')
  13021. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  13022. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  13023. loss_train: 1.4763062540441751
  13024. step: 31
  13025. running loss: 0.04762278238852178
  13026. Train Steps: 31/90 Loss: 0.0476 torch.Size([8, 600, 800])
  13027. torch.Size([8, 8])
  13028. tensor([[0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  13029. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  13030. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  13031. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  13032. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483],
  13033. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  13034. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  13035. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167]],
  13036. device='cuda:0', dtype=torch.float64)
  13037. predictions are: tensor([[ 0.2273, -0.6596, 1.1092, -0.9489, -0.6768, -0.8663, 0.0910, 0.2431],
  13038. [ 0.7486, -0.3217, 1.6883, 0.0425, -0.3411, -0.1704, 0.2981, 0.2276],
  13039. [ 0.5208, -0.4361, 1.6414, 0.4044, -0.4322, -0.2129, 0.3308, 0.3269],
  13040. [-0.0311, -0.8324, 1.0396, -1.3393, -0.3552, -1.6871, 0.3319, 0.1816],
  13041. [ 0.7902, -0.3247, 1.8514, -0.2893, -0.5331, -0.0267, 0.5042, 0.1592],
  13042. [ 0.3829, -0.5580, 1.7809, 0.2276, -0.5510, -0.3927, 0.5745, 0.2348],
  13043. [ 0.6664, -0.3745, 1.8520, -0.2423, -0.4796, 0.2054, 0.6264, 0.1599],
  13044. [ 0.4054, -0.5725, 1.5891, -0.7661, -0.6209, -0.6981, 0.5075, 0.3368]],
  13045. device='cuda:0', grad_fn=<AddmmBackward>)
  13046. landmarks are: tensor([[[ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  13047. 0.1710],
  13048. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  13049. 0.3700],
  13050. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  13051. 0.3007],
  13052. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  13053. 0.0261],
  13054. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  13055. 0.2468],
  13056. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  13057. 0.1608],
  13058. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  13059. 0.0851],
  13060. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  13061. 0.5624]]], device='cuda:0')
  13062. loss_train_step before backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  13063. loss_train_step after backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  13064. loss_train: 1.4978971872478724
  13065. step: 32
  13066. running loss: 0.04680928710149601
  13067. Train Steps: 32/90 Loss: 0.0468 torch.Size([8, 600, 800])
  13068. torch.Size([8, 8])
  13069. tensor([[0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  13070. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  13071. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  13072. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  13073. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  13074. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  13075. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  13076. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118]],
  13077. device='cuda:0', dtype=torch.float64)
  13078. predictions are: tensor([[ 0.6682, -0.3635, 1.1771, -0.8218, -0.3968, -0.9152, 0.4136, 0.3601],
  13079. [ 0.6833, -0.3600, 1.7315, -0.4808, -0.6057, -0.7120, 0.4325, 0.1391],
  13080. [-1.7206, -1.9316, 1.4490, -0.7641, -0.6125, -0.7112, 0.2333, 0.2175],
  13081. [ 0.4376, -0.4658, 1.5066, -0.4000, -0.4101, -0.9178, 0.2045, 0.2454],
  13082. [ 0.2897, -0.5951, 1.3823, -0.8484, -0.4510, -0.7861, 0.5288, 0.2703],
  13083. [ 1.0572, -0.1334, 1.7365, 0.1202, -0.3583, 0.3940, 0.6201, 0.1901],
  13084. [ 1.1275, -0.1140, 1.7753, 0.0943, -0.6044, -0.1970, 0.5039, 0.1713],
  13085. [ 0.6546, -0.3253, 1.1122, -0.6033, -0.3702, -0.9839, 0.1899, 0.3367]],
  13086. device='cuda:0', grad_fn=<AddmmBackward>)
  13087. landmarks are: tensor([[[ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  13088. 0.6084],
  13089. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  13090. 0.1000],
  13091. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  13092. 0.1133],
  13093. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  13094. 0.2261],
  13095. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  13096. 0.2160],
  13097. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  13098. 0.1982],
  13099. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  13100. 0.1768],
  13101. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  13102. 0.5401]]], device='cuda:0')
  13103. loss_train_step before backward: tensor(0.0360, device='cuda:0', grad_fn=<MseLossBackward>)
  13104. loss_train_step after backward: tensor(0.0360, device='cuda:0', grad_fn=<MseLossBackward>)
  13105. loss_train: 1.533901834860444
  13106. step: 33
  13107. running loss: 0.04648187378364982
  13108. Train Steps: 33/90 Loss: 0.0465 torch.Size([8, 600, 800])
  13109. torch.Size([8, 8])
  13110. tensor([[0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  13111. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  13112. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  13113. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  13114. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  13115. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  13116. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  13117. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483]],
  13118. device='cuda:0', dtype=torch.float64)
  13119. predictions are: tensor([[ 0.1480, -0.7081, 1.4007, -0.5825, -0.5700, -1.0408, 0.2384, 0.2237],
  13120. [ 0.5896, -0.4433, 1.4925, -0.8253, -0.5779, -0.3485, 0.6271, 0.2747],
  13121. [ 0.3425, -0.5901, 1.0766, -0.9527, -0.5053, -1.1356, 0.2093, 0.2348],
  13122. [ 0.8501, -0.2678, 1.8594, 0.1508, -0.2696, 0.3967, 0.5798, 0.2531],
  13123. [ 0.2669, -0.6123, 1.8149, -0.1087, -0.3577, -0.8990, 0.6010, 0.2930],
  13124. [ 0.7211, -0.3709, 1.6834, -0.3010, -0.6311, -0.5038, 0.3394, 0.2056],
  13125. [ 0.0754, -0.7388, 1.3125, -0.8194, -0.4243, -1.1414, 0.2379, 0.2833],
  13126. [ 0.3136, -0.6088, 1.6698, -0.2275, -0.5166, -0.0057, 0.3620, 0.2574]],
  13127. device='cuda:0', grad_fn=<AddmmBackward>)
  13128. landmarks are: tensor([[[ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  13129. 0.2138],
  13130. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  13131. 0.1390],
  13132. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  13133. 0.0802],
  13134. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  13135. 0.0928],
  13136. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  13137. 0.1608],
  13138. [ 0.5783, -0.4216, 1.6847, -0.5078, -0.6732, -0.5377, 0.4752,
  13139. 0.0839],
  13140. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  13141. 0.3700],
  13142. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  13143. 0.2468]]], device='cuda:0')
  13144. loss_train_step before backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  13145. loss_train_step after backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  13146. loss_train: 1.5591852515935898
  13147. step: 34
  13148. running loss: 0.04585838975275264
  13149.  
  13150. Train Steps: 34/90 Loss: 0.0459 torch.Size([8, 600, 800])
  13151. torch.Size([8, 8])
  13152. tensor([[0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  13153. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  13154. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  13155. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  13156. [0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  13157. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  13158. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  13159. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136]],
  13160. device='cuda:0', dtype=torch.float64)
  13161. predictions are: tensor([[ 0.3723, -0.5713, 1.5412, -1.1410, -0.4123, -1.2833, 0.7458, 0.2572],
  13162. [-0.0439, -0.7983, 1.3700, -0.6209, -0.6206, -1.1788, 0.1694, 0.3199],
  13163. [ 0.4568, -0.5009, 1.5959, -0.0868, -0.5835, -0.4344, 0.1355, 0.2190],
  13164. [ 0.3854, -0.5706, 1.7432, -0.5431, -0.6401, -0.9886, 0.6589, 0.2581],
  13165. [ 0.6753, -0.3385, 1.6879, -0.1744, -0.3901, 0.1000, 0.3988, 0.2561],
  13166. [ 0.6335, -0.3926, 1.5830, -0.1774, -0.4380, -0.2220, 0.5967, 0.2536],
  13167. [ 0.2948, -0.5686, 1.6185, -0.0778, -0.3593, -0.0700, 0.2592, 0.2595],
  13168. [ 0.4754, -0.4777, 1.6022, -0.0768, -0.2555, -0.0874, 0.2974, 0.2777]],
  13169. device='cuda:0', grad_fn=<AddmmBackward>)
  13170. landmarks are: tensor([[[ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  13171. 0.1467],
  13172. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  13173. 0.3928],
  13174. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  13175. 0.1854],
  13176. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  13177. 0.1390],
  13178. [ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  13179. 0.0652],
  13180. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  13181. 0.1627],
  13182. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  13183. 0.1146],
  13184. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  13185. 0.0862]]], device='cuda:0')
  13186. loss_train_step before backward: tensor(0.0343, device='cuda:0', grad_fn=<MseLossBackward>)
  13187. loss_train_step after backward: tensor(0.0343, device='cuda:0', grad_fn=<MseLossBackward>)
  13188. loss_train: 1.593443851917982
  13189. step: 35
  13190. running loss: 0.04552696719765663
  13191. Train Steps: 35/90 Loss: 0.0455 torch.Size([8, 600, 800])
  13192. torch.Size([8, 8])
  13193. tensor([[0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  13194. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791],
  13195. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  13196. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  13197. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  13198. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  13199. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  13200. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980]],
  13201. device='cuda:0', dtype=torch.float64)
  13202. predictions are: tensor([[ 0.1774, -0.6739, 1.3619, -1.0813, -0.2807, -1.6227, 0.5180, 0.2143],
  13203. [ 0.3338, -0.5876, 1.7390, -0.0251, -0.5067, -0.1704, 0.4971, 0.2085],
  13204. [ 0.4705, -0.4790, 1.7364, -0.0638, -0.3783, 0.0956, 0.4293, 0.2739],
  13205. [ 0.6925, -0.3200, 1.7505, -0.1045, -0.3952, 0.1059, 0.3062, 0.2407],
  13206. [ 0.6138, -0.3833, 1.7019, -0.2001, -0.2819, 0.0471, 0.4653, 0.3456],
  13207. [ 0.4023, -0.5554, 1.5965, -0.7829, -0.4790, -1.2861, 0.6305, 0.2734],
  13208. [ 0.3821, -0.5534, 1.6308, -0.1025, -0.5651, -0.0953, 0.3352, 0.2354],
  13209. [ 0.2864, -0.6015, 1.1239, -0.9904, -0.6295, -1.1959, 0.0964, 0.2094]],
  13210. device='cuda:0', grad_fn=<AddmmBackward>)
  13211. landmarks are: tensor([[[ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  13212. -0.0370],
  13213. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  13214. -0.0731],
  13215. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  13216. 0.0928],
  13217. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  13218. 0.0682],
  13219. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  13220. 0.4316],
  13221. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  13222. 0.1931],
  13223. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  13224. 0.0688],
  13225. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  13226. 0.0141]]], device='cuda:0')
  13227. loss_train_step before backward: tensor(0.0277, device='cuda:0', grad_fn=<MseLossBackward>)
  13228. loss_train_step after backward: tensor(0.0277, device='cuda:0', grad_fn=<MseLossBackward>)
  13229. loss_train: 1.6211165934801102
  13230. step: 36
  13231. running loss: 0.045031016485558614
  13232. Train Steps: 36/90 Loss: 0.0450 torch.Size([8, 600, 800])
  13233. torch.Size([8, 8])
  13234. tensor([[0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  13235. [0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  13236. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  13237. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  13238. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  13239. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  13240. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  13241. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320]],
  13242. device='cuda:0', dtype=torch.float64)
  13243. predictions are: tensor([[ 0.3947, -0.4847, 1.5870, -0.3033, -0.5490, -0.3614, 0.0847, 0.3221],
  13244. [ 0.1355, -0.6723, 1.1828, -1.0753, -0.4606, -1.4371, 0.2556, 0.1990],
  13245. [ 0.5287, -0.4141, 1.7355, -0.2123, -0.3593, 0.2886, 0.3807, 0.2076],
  13246. [ 0.3074, -0.5518, 1.6790, -0.8450, -0.1968, -1.2325, 0.5182, 0.1985],
  13247. [ 0.5691, -0.4298, 1.5528, -0.9136, -0.3392, -1.1796, 0.6582, 0.2453],
  13248. [ 0.5131, -0.4907, 1.6979, 0.1381, -0.5536, -0.2265, 0.5239, 0.1741],
  13249. [ 0.5242, -0.4441, 1.7725, -0.1746, -0.4777, 0.0534, 0.4184, 0.2524],
  13250. [ 0.4037, -0.5380, 1.6122, -0.0100, -0.4977, -0.0729, 0.4697, 0.2294]],
  13251. device='cuda:0', grad_fn=<AddmmBackward>)
  13252. landmarks are: tensor([[[ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  13253. 0.4145],
  13254. [ 0.5707, -0.4189, 1.2707, -1.2467, -0.4095, -1.3082, 0.3758,
  13255. 0.0928],
  13256. [ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  13257. 0.1929],
  13258. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  13259. 0.0051],
  13260. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  13261. 0.2050],
  13262. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  13263. 0.0851],
  13264. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  13265. 0.2776],
  13266. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  13267. 0.1715]]], device='cuda:0')
  13268. loss_train_step before backward: tensor(0.0234, device='cuda:0', grad_fn=<MseLossBackward>)
  13269. loss_train_step after backward: tensor(0.0234, device='cuda:0', grad_fn=<MseLossBackward>)
  13270. loss_train: 1.6445499509572983
  13271. step: 37
  13272. running loss: 0.04444729597181887
  13273. Train Steps: 37/90 Loss: 0.0444 torch.Size([8, 600, 800])
  13274. torch.Size([8, 8])
  13275. tensor([[0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  13276. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  13277. [0.6100, 0.4071, 0.7601, 0.3444, 0.3400, 0.4117, 0.5625, 0.5617],
  13278. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  13279. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  13280. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  13281. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  13282. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519]],
  13283. device='cuda:0', dtype=torch.float64)
  13284. predictions are: tensor([[ 0.1872, -0.6722, 1.8496, -0.0055, -0.4651, -0.0681, 0.4674, 0.1633],
  13285. [ 0.4701, -0.4734, 1.5983, -1.1720, -0.0912, -1.0880, 0.6450, 0.1887],
  13286. [ 0.2988, -0.5591, 1.3431, -0.8010, -0.6583, -0.3453, 0.2976, 0.2991],
  13287. [ 0.4385, -0.4926, 1.5840, -0.5594, -0.6529, -0.5741, 0.2479, 0.1788],
  13288. [ 0.5675, -0.4378, 1.8293, 0.2816, -0.5209, -0.2343, 0.4806, 0.1298],
  13289. [ 0.4914, -0.4685, 1.6776, -0.5615, -0.5379, -0.7593, 0.4647, 0.1668],
  13290. [ 0.6671, -0.3534, 1.2841, -1.0860, -0.1890, -1.3536, 0.4186, 0.2550],
  13291. [ 0.5687, -0.3997, 1.7216, 0.1144, -0.1886, 0.1014, 0.2823, 0.2538]],
  13292. device='cuda:0', grad_fn=<AddmmBackward>)
  13293. landmarks are: tensor([[[ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  13294. 0.0313],
  13295. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  13296. -0.0369],
  13297. [ 0.5318, -0.4056, 1.2249, -0.6949, -0.7155, -0.3844, 0.3122,
  13298. 0.3084],
  13299. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  13300. -0.1151],
  13301. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  13302. -0.0102],
  13303. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  13304. 0.1963],
  13305. [ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  13306. 0.1545],
  13307. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  13308. 0.2634]]], device='cuda:0')
  13309. loss_train_step before backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  13310.  
  13311. loss_train_step after backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  13312. loss_train: 1.6591525804251432
  13313. step: 38
  13314. running loss: 0.04366191001118798
  13315. Train Steps: 38/90 Loss: 0.0437 torch.Size([8, 600, 800])
  13316. torch.Size([8, 8])
  13317. tensor([[0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  13318. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  13319. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  13320. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  13321. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  13322. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  13323. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  13324. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933]],
  13325. device='cuda:0', dtype=torch.float64)
  13326. predictions are: tensor([[ 6.9073e-01, -3.3128e-01, 1.5764e+00, -1.0210e+00, -4.4448e-01,
  13327. -1.1284e+00, 5.1971e-01, 9.0985e-02],
  13328. [ 7.7653e-01, -2.6876e-01, 1.7526e+00, 9.8295e-04, -1.8860e-01,
  13329. -1.1193e-01, 3.4547e-01, 1.6992e-01],
  13330. [ 8.5491e-01, -2.1427e-01, 1.9309e+00, -2.1968e-01, -3.7515e-01,
  13331. 3.5782e-01, 5.1594e-01, 1.0342e-01],
  13332. [ 5.4454e-01, -4.1243e-01, 1.8518e+00, -1.7703e-01, -1.7207e-01,
  13333. -6.9722e-02, 5.0051e-01, 1.7933e-01],
  13334. [ 8.4427e-01, -2.5028e-01, 1.1858e+00, -1.1193e+00, -4.6734e-01,
  13335. -1.2457e+00, 5.1291e-01, 1.8033e-01],
  13336. [-1.3002e+00, -1.5918e+00, 1.1560e+00, -1.2955e+00, -2.7973e-01,
  13337. -1.4764e+00, 3.8677e-01, 2.7004e-01],
  13338. [ 6.1068e-01, -3.7035e-01, 1.7309e+00, -1.0349e-02, -3.6074e-01,
  13339. 1.1573e-01, 3.6811e-01, 1.5947e-01],
  13340. [ 6.7004e-01, -2.9821e-01, 1.7256e+00, 2.0917e-01, -6.2269e-01,
  13341. -4.3491e-01, 3.2126e-01, 2.6025e-01]], device='cuda:0',
  13342. grad_fn=<AddmmBackward>)
  13343. landmarks are: tensor([[[ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  13344. 0.0807],
  13345. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  13346. 0.2237],
  13347. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  13348. 0.0682],
  13349. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  13350. 0.2853],
  13351. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  13352. 0.2930],
  13353. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  13354. 0.3623],
  13355. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  13356. 0.2386],
  13357. [ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  13358. 0.4547]]], device='cuda:0')
  13359. loss_train_step before backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  13360. loss_train_step after backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  13361. loss_train: 1.7016998585313559
  13362. step: 39
  13363. running loss: 0.0436333297059322
  13364. Train Steps: 39/90 Loss: 0.0436 torch.Size([8, 600, 800])
  13365. torch.Size([8, 8])
  13366. tensor([[0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771],
  13367. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  13368. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  13369. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  13370. [0.6086, 0.3998, 0.8788, 0.4450, 0.4025, 0.4650, 0.5306, 0.5103],
  13371. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  13372. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  13373. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717]],
  13374. device='cuda:0', dtype=torch.float64)
  13375. predictions are: tensor([[ 0.4242, -0.5076, 1.9139, -0.3800, -0.3886, -0.0722, 0.5852, 0.0703],
  13376. [ 0.6892, -0.3367, 1.8315, -0.3075, -0.3468, -0.2121, 0.3945, 0.1449],
  13377. [ 0.5346, -0.4161, 1.7029, -0.1029, -0.4170, -0.3621, 0.4635, 0.3057],
  13378. [ 0.5330, -0.4363, 1.8144, -0.1320, -0.4021, -0.2648, 0.4028, 0.0935],
  13379. [ 0.4335, -0.4818, 1.7706, -0.5227, -0.3796, -0.3209, 0.2563, 0.1315],
  13380. [ 0.5602, -0.4312, 1.8075, -0.1298, -0.2862, -0.0801, 0.4577, 0.1479],
  13381. [ 0.6446, -0.3702, 1.8362, -0.1281, -0.4253, -0.1565, 0.6927, 0.0867],
  13382. [ 0.4386, -0.4931, 1.0271, -1.2705, -0.3864, -1.4639, 0.2277, 0.2080]],
  13383. device='cuda:0', grad_fn=<AddmmBackward>)
  13384. landmarks are: tensor([[[ 0.6072, -0.4247, 1.8711, -0.0842, -0.5307, 0.1005, 0.6771,
  13385. -0.0821],
  13386. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  13387. 0.2035],
  13388. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  13389. 0.3161],
  13390. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  13391. 0.0919],
  13392. [ 0.5253, -0.4392, 1.7730, -0.2305, -0.4268, -0.1381, 0.1651,
  13393. 0.0712],
  13394. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  13395. 0.0711],
  13396. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  13397. 0.1385],
  13398. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  13399. 0.3546]]], device='cuda:0')
  13400. loss_train_step before backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  13401. loss_train_step after backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  13402. loss_train: 1.7223987337201834
  13403. step: 40
  13404. running loss: 0.04305996834300459
  13405. Train Steps: 40/90 Loss: 0.0431 torch.Size([8, 600, 800])
  13406. torch.Size([8, 8])
  13407. tensor([[0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  13408. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  13409. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  13410. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  13411. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  13412. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  13413. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  13414. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343]],
  13415. device='cuda:0', dtype=torch.float64)
  13416. predictions are: tensor([[ 9.7662e-01, -1.1745e-01, 1.6946e+00, -1.8736e-02, -2.7298e-01,
  13417. 1.1961e-01, 6.4769e-01, 1.2871e-01],
  13418. [ 8.3737e-01, -2.2624e-01, 1.7305e+00, -1.1073e-03, -3.4214e-01,
  13419. -1.4048e-01, 4.8221e-01, 1.4542e-01],
  13420. [ 6.4155e-01, -3.4631e-01, 1.7510e+00, -1.0764e-01, -2.6191e-01,
  13421. -6.1281e-02, 3.9667e-01, 7.9823e-02],
  13422. [ 7.0425e-01, -2.9291e-01, 1.8040e+00, -2.7007e-01, -4.8139e-01,
  13423. -3.5236e-01, 3.2093e-01, 1.1178e-01],
  13424. [ 8.2886e-01, -2.0781e-01, 1.6514e+00, 6.9484e-02, -3.7936e-01,
  13425. -2.4129e-02, 2.7950e-01, 1.7206e-01],
  13426. [-1.6621e+00, -1.8554e+00, 1.2965e+00, -1.3455e+00, -3.9351e-01,
  13427. -1.0603e+00, 1.3691e-01, 1.4077e-01],
  13428. [ 7.7488e-01, -2.3785e-01, 1.8051e+00, -5.3855e-01, -4.5368e-01,
  13429. -4.5824e-01, 4.3108e-01, 2.1553e-01],
  13430. [ 8.9303e-01, -1.7966e-01, 1.6875e+00, -8.4745e-01, -2.5337e-01,
  13431. -1.0233e+00, 7.5601e-01, 7.6916e-02]], device='cuda:0',
  13432. grad_fn=<AddmmBackward>)
  13433. landmarks are: tensor([[[ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  13434. 0.1176],
  13435. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  13436. 0.1979],
  13437. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  13438. 0.0159],
  13439. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  13440. 0.0919],
  13441. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  13442. -0.1061],
  13443. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  13444. 0.1005],
  13445. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  13446. 0.3238],
  13447. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  13448. 0.1821]]], device='cuda:0')
  13449. loss_train_step before backward: tensor(0.0354, device='cuda:0', grad_fn=<MseLossBackward>)
  13450. loss_train_step after backward: tensor(0.0354, device='cuda:0', grad_fn=<MseLossBackward>)
  13451. loss_train: 1.757778873667121
  13452. step: 41
  13453. running loss: 0.04287265545529563
  13454.  
  13455. Train Steps: 41/90 Loss: 0.0429 torch.Size([8, 600, 800])
  13456. torch.Size([8, 8])
  13457. tensor([[0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  13458. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993],
  13459. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  13460. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  13461. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  13462. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  13463. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  13464. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131]],
  13465. device='cuda:0', dtype=torch.float64)
  13466. predictions are: tensor([[ 0.5364, -0.4022, 1.7602, -0.2904, -0.5344, -0.4302, 0.1283, 0.1212],
  13467. [ 0.6020, -0.3860, 1.1146, -1.0672, -0.2285, -1.3674, 0.2108, 0.0569],
  13468. [ 0.5184, -0.4487, 1.8782, 0.1548, -0.1674, 0.3226, 0.6550, 0.1418],
  13469. [ 0.6975, -0.3259, 1.4950, -0.8409, -0.2680, -0.8396, 0.5728, 0.1666],
  13470. [ 0.5019, -0.4184, 1.5995, -0.2894, -0.3780, -0.9116, 0.2311, 0.1745],
  13471. [ 0.4203, -0.4804, 1.6434, -0.4923, -0.5403, -0.3176, 0.3912, 0.0179],
  13472. [ 0.0798, -0.6898, 1.6994, -0.5779, -0.3896, 0.1759, 0.8041, 0.1626],
  13473. [ 0.5689, -0.4070, 1.7062, -0.3296, -0.4752, -0.0741, 0.4950, 0.0697]],
  13474. device='cuda:0', grad_fn=<AddmmBackward>)
  13475. landmarks are: tensor([[[ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  13476. 0.2567],
  13477. [ 0.5384, -0.4393, 0.9762, -1.1851, -0.4210, -1.3852, 0.1712,
  13478. 0.0201],
  13479. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  13480. 0.2391],
  13481. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  13482. 0.2160],
  13483. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  13484. 0.3928],
  13485. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  13486. 0.0021],
  13487. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  13488. 0.2083],
  13489. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  13490. 0.0840]]], device='cuda:0')
  13491. loss_train_step before backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  13492. loss_train_step after backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  13493. loss_train: 1.778610149398446
  13494. step: 42
  13495. running loss: 0.042347860699963005
  13496. Train Steps: 42/90 Loss: 0.0423 torch.Size([8, 600, 800])
  13497. torch.Size([8, 8])
  13498. tensor([[0.6161, 0.4099, 0.8738, 0.4383, 0.3788, 0.5483, 0.5605, 0.5019],
  13499. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  13500. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  13501. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  13502. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  13503. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  13504. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  13505. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438]],
  13506. device='cuda:0', dtype=torch.float64)
  13507. predictions are: tensor([[ 0.3502, -0.5350, 1.8028, -0.1968, -0.4146, 0.5732, 0.5760, 0.0674],
  13508. [ 0.7001, -0.2969, 1.4979, -0.3223, -0.5520, -0.0171, 0.1787, 0.0619],
  13509. [ 0.5623, -0.3918, 1.8224, -0.2495, -0.3759, -0.4400, 0.4877, 0.2254],
  13510. [ 0.4395, -0.4990, 1.0913, -1.0361, -0.3294, -1.1480, 0.3250, 0.1471],
  13511. [ 0.3808, -0.5393, 1.5022, -0.8524, -0.3207, -0.9561, 0.5060, 0.0491],
  13512. [ 0.5369, -0.4363, 1.2601, -0.9757, -0.3010, -1.1186, 0.2567, 0.0580],
  13513. [ 0.4902, -0.4967, 1.9258, 0.1589, -0.4215, 0.2360, 0.8296, 0.0872],
  13514. [ 0.4893, -0.4287, 1.6650, -0.4043, -0.3079, -0.8211, 0.2554, 0.1332]],
  13515. device='cuda:0', grad_fn=<AddmmBackward>)
  13516. landmarks are: tensor([[[ 0.5597, -0.3928, 1.7499, -0.2613, -0.5365, 0.2468, 0.3028,
  13517. 0.0321],
  13518. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  13519. 0.1552],
  13520. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  13521. 0.3928],
  13522. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  13523. 0.2906],
  13524. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  13525. 0.1195],
  13526. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  13527. 0.0774],
  13528. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  13529. 0.1779],
  13530. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  13531. 0.2261]]], device='cuda:0')
  13532. loss_train_step before backward: tensor(0.0289, device='cuda:0', grad_fn=<MseLossBackward>)
  13533. loss_train_step after backward: tensor(0.0289, device='cuda:0', grad_fn=<MseLossBackward>)
  13534. loss_train: 1.8074938002973795
  13535. step: 43
  13536. running loss: 0.04203473954179952
  13537. Train Steps: 43/90 Loss: 0.0420 torch.Size([8, 600, 800])
  13538. torch.Size([8, 8])
  13539. tensor([[0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  13540. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  13541. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  13542. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  13543. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  13544. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  13545. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  13546. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519]],
  13547. device='cuda:0', dtype=torch.float64)
  13548. predictions are: tensor([[ 0.7905, -0.2252, 1.6335, -0.0263, -0.6232, -0.1224, 0.1979, 0.1167],
  13549. [ 0.7494, -0.2658, 1.4417, -1.1422, -0.2417, -1.3671, 0.5485, 0.0467],
  13550. [-1.5169, -1.7478, 1.5878, -1.2802, -0.0359, -1.0986, 0.6142, 0.1493],
  13551. [ 0.7136, -0.3303, 1.8095, 0.1998, -0.4240, 0.2751, 0.4201, 0.1101],
  13552. [ 0.9599, -0.1700, 1.7080, 0.1720, -0.4273, 0.1289, 0.6565, 0.1152],
  13553. [ 0.6922, -0.3478, 1.7639, -0.0507, -0.5437, 0.0132, 0.4204, 0.0642],
  13554. [ 0.7462, -0.2894, 1.2072, -1.1087, -0.6579, -0.7699, 0.3299, 0.0590],
  13555. [ 0.7810, -0.2467, 1.7174, 0.1712, -0.2060, 0.1815, 0.2094, 0.1444]],
  13556. device='cuda:0', grad_fn=<AddmmBackward>)
  13557. landmarks are: tensor([[[ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  13558. -0.1181],
  13559. [ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  13560. -0.0370],
  13561. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  13562. 0.3104],
  13563. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  13564. 0.0711],
  13565. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  13566. 0.0774],
  13567. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  13568. -0.0534],
  13569. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  13570. 0.0622],
  13571. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  13572. 0.2634]]], device='cuda:0')
  13573. loss_train_step before backward: tensor(0.0319, device='cuda:0', grad_fn=<MseLossBackward>)
  13574. loss_train_step after backward: tensor(0.0319, device='cuda:0', grad_fn=<MseLossBackward>)
  13575. loss_train: 1.8393607195466757
  13576. step: 44
  13577. running loss: 0.041803652716969904
  13578. Train Steps: 44/90 Loss: 0.0418 torch.Size([8, 600, 800])
  13579. torch.Size([8, 8])
  13580. tensor([[0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  13581. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  13582. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  13583. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367],
  13584. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  13585. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133],
  13586. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  13587. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064]],
  13588. device='cuda:0', dtype=torch.float64)
  13589. predictions are: tensor([[ 0.4716, -0.4719, 1.7441, -0.2225, -0.5760, -0.4219, 0.7062, 0.1232],
  13590. [ 0.5111, -0.4207, 1.4883, -0.2494, -0.6212, -0.3269, 0.2111, 0.1063],
  13591. [ 0.5906, -0.4036, 1.6814, -0.0946, -0.4266, -0.0143, 0.4353, 0.0676],
  13592. [ 0.7047, -0.3238, 1.6344, -1.1320, -0.3182, -1.2865, 0.5688, 0.0724],
  13593. [ 0.4475, -0.5090, 1.6610, -0.0321, -0.5360, -0.1445, 0.3971, 0.0563],
  13594. [ 0.3423, -0.5918, 1.6331, -0.1741, -0.3868, 0.2066, 0.6619, 0.1233],
  13595. [ 0.3358, -0.5321, 1.5918, -0.2288, -0.3002, -0.1307, 0.2582, 0.1861],
  13596. [ 0.6290, -0.3624, 1.6425, -0.1294, -0.1318, -0.0388, 0.1791, 0.0794]],
  13597. device='cuda:0', grad_fn=<AddmmBackward>)
  13598. landmarks are: tensor([[[ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  13599. 0.1499],
  13600. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  13601. -0.1181],
  13602. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  13603. 0.1005],
  13604. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  13605. 0.1929],
  13606. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  13607. 0.0919],
  13608. [ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  13609. 0.0852],
  13610. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  13611. 0.3057],
  13612. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  13613. 0.0532]]], device='cuda:0')
  13614. loss_train_step before backward: tensor(0.0137, device='cuda:0', grad_fn=<MseLossBackward>)
  13615.  
  13616. loss_train_step after backward: tensor(0.0137, device='cuda:0', grad_fn=<MseLossBackward>)
  13617. loss_train: 1.8530531292781234
  13618. step: 45
  13619. running loss: 0.04117895842840274
  13620. Train Steps: 45/90 Loss: 0.0412 torch.Size([8, 600, 800])
  13621. torch.Size([8, 8])
  13622. tensor([[ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  13623. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  13624. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  13625. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  13626. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  13627. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  13628. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  13629. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433]],
  13630. device='cuda:0', dtype=torch.float64)
  13631. predictions are: tensor([[-2.0062, -2.1088, 1.2378, -1.1293, -0.6208, -0.9271, 0.1880, 0.1063],
  13632. [ 0.6630, -0.3410, 1.7287, 0.0418, -0.1805, 0.1816, 0.3918, 0.1792],
  13633. [ 0.6831, -0.3443, 1.8144, -0.0936, -0.5714, 0.2910, 0.6572, 0.0492],
  13634. [ 0.7003, -0.3176, 1.2593, -1.1093, -0.1448, -1.5150, 0.5180, 0.0846],
  13635. [ 0.9637, -0.1827, 1.7292, 0.3907, -0.4397, 0.2822, 0.5706, 0.0913],
  13636. [ 1.0779, -0.0850, 1.2507, -0.9365, -0.5781, -0.9499, 0.3741, 0.0290],
  13637. [ 0.6943, -0.2916, 1.5082, -0.5144, -0.6949, -0.6832, 0.2075, 0.1789],
  13638. [ 0.9264, -0.1761, 1.7016, 0.2059, -0.1610, 0.0985, 0.3311, 0.1391]],
  13639. device='cuda:0', grad_fn=<AddmmBackward>)
  13640. landmarks are: tensor([[[-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  13641. 0.1253],
  13642. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  13643. 0.3007],
  13644. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  13645. 0.1449],
  13646. [ 0.5999, -0.4236, 1.2880, -1.4083, -0.0630, -1.6393, 0.4584,
  13647. -0.0208],
  13648. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  13649. 0.1698],
  13650. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  13651. -0.1031],
  13652. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  13653. 0.2237],
  13654. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  13655. 0.2237]]], device='cuda:0')
  13656. loss_train_step before backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  13657. loss_train_step after backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  13658. loss_train: 1.8797959005460143
  13659. step: 46
  13660. running loss: 0.04086512827273944
  13661. Train Steps: 46/90 Loss: 0.0409 torch.Size([8, 600, 800])
  13662. torch.Size([8, 8])
  13663. tensor([[0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  13664. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  13665. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  13666. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  13667. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  13668. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  13669. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  13670. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967]],
  13671. device='cuda:0', dtype=torch.float64)
  13672. predictions are: tensor([[ 0.4136, -0.5211, 1.6518, -0.5711, -0.4877, -1.1473, 0.1868, 0.0327],
  13673. [ 0.0622, -0.7807, 1.6220, 0.0317, -0.5489, -0.1672, 0.4488, 0.2454],
  13674. [ 0.1679, -0.6337, 1.3389, -0.7607, -0.6656, -0.5568, 0.2576, 0.1309],
  13675. [ 0.6829, -0.3497, 1.8155, -0.0984, -0.4948, 0.0420, 0.4061, 0.0627],
  13676. [ 0.4903, -0.4681, 1.6231, 0.1573, -0.1295, -0.0120, 0.1925, 0.1658],
  13677. [ 0.7352, -0.3283, 1.3336, -1.2855, -0.3736, -1.1986, 0.5552, 0.1144],
  13678. [ 0.6767, -0.3760, 1.6842, 0.2048, -0.3348, 0.2051, 0.7426, 0.0626],
  13679. [ 0.5668, -0.4108, 1.6528, -0.3251, -0.5824, 0.0828, 0.4796, 0.0241]],
  13680. device='cuda:0', grad_fn=<AddmmBackward>)
  13681. landmarks are: tensor([[[ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  13682. 0.0021],
  13683. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  13684. 0.5239],
  13685. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  13686. 0.3417],
  13687. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  13688. 0.1775],
  13689. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  13690. 0.4239],
  13691. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  13692. 0.2776],
  13693. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  13694. 0.1176],
  13695. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  13696. 0.0081]]], device='cuda:0')
  13697. loss_train_step before backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  13698. loss_train_step after backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  13699. loss_train: 1.8977786405012012
  13700. step: 47
  13701. running loss: 0.040378268946834064
  13702. Train Steps: 47/90 Loss: 0.0404 torch.Size([8, 600, 800])
  13703. torch.Size([8, 8])
  13704. tensor([[0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200],
  13705. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  13706. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  13707. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  13708. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  13709. [0.6192, 0.3980, 0.7078, 0.2750, 0.4250, 0.2100, 0.5450, 0.5783],
  13710. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  13711. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783]],
  13712. device='cuda:0', dtype=torch.float64)
  13713. predictions are: tensor([[ 0.6224, -0.3776, 1.7414, -0.8322, -0.2218, -0.8424, 0.5022, 0.0806],
  13714. [ 0.4926, -0.5226, 1.6715, 0.2126, -0.5110, 0.1479, 0.4177, 0.2301],
  13715. [ 0.5360, -0.4621, 1.0516, -1.1743, -0.4601, -0.9034, 0.2978, 0.1392],
  13716. [ 0.8273, -0.2386, 1.7271, 0.1335, -0.6301, -0.1857, 0.1177, 0.0842],
  13717. [ 1.0371, -0.1818, 1.8480, 0.4197, -0.5808, -0.2250, 0.4951, 0.0019],
  13718. [-1.5094, -1.7850, 1.0574, -1.0092, -0.3379, -0.9945, 0.2675, 0.1895],
  13719. [ 0.6967, -0.3592, 1.9175, -0.3306, -0.5247, -0.1906, 0.6084, 0.0473],
  13720. [ 0.7549, -0.3261, 1.1601, -0.8692, -0.4138, -0.8388, 0.4756, 0.2019]],
  13721. device='cuda:0', grad_fn=<AddmmBackward>)
  13722. landmarks are: tensor([[[ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  13723. 0.1159],
  13724. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  13725. 0.5239],
  13726. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  13727. 0.2853],
  13728. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  13729. 0.2071],
  13730. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  13731. -0.0957],
  13732. [ 0.5742, -0.4474, 0.9834, -1.0159, -0.3229, -1.3159, 0.2314,
  13733. 0.3854],
  13734. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  13735. 0.1544],
  13736. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  13737. 0.3854]]], device='cuda:0')
  13738. loss_train_step before backward: tensor(0.1265, device='cuda:0', grad_fn=<MseLossBackward>)
  13739. loss_train_step after backward: tensor(0.1265, device='cuda:0', grad_fn=<MseLossBackward>)
  13740. loss_train: 2.0243153674528003
  13741. step: 48
  13742. running loss: 0.04217323682193334
  13743. Train Steps: 48/90 Loss: 0.0422 torch.Size([8, 600, 800])
  13744. torch.Size([8, 8])
  13745. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  13746. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  13747. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  13748. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  13749. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378],
  13750. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  13751. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  13752. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334]],
  13753. device='cuda:0', dtype=torch.float64)
  13754. predictions are: tensor([[ 0.5666, -0.4526, 1.4781, -0.7345, -0.4664, -0.7452, 0.4017, 0.1356],
  13755. [ 0.3569, -0.5902, 1.4038, -0.7881, -0.1524, -1.2387, 0.5315, 0.1132],
  13756. [ 0.8075, -0.3212, 1.7756, -0.3874, -0.5380, -0.8027, 0.3158, 0.0359],
  13757. [ 0.4889, -0.5159, 1.4719, -0.5841, -0.6540, -0.5052, 0.1248, 0.1664],
  13758. [ 0.3145, -0.6566, 1.7905, 0.4144, -0.3301, 0.5480, 0.6483, 0.1989],
  13759. [ 0.2731, -0.6563, 1.5606, -0.4530, -0.5923, -0.3571, 0.4636, 0.1154],
  13760. [ 0.4306, -0.5213, 1.4185, -0.5322, -0.6252, -0.2094, 0.3687, 0.1786],
  13761. [ 0.3540, -0.5800, 1.2383, -0.7893, -0.4970, -0.7637, 0.4088, 0.1234]],
  13762. device='cuda:0', grad_fn=<AddmmBackward>)
  13763. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  13764. 0.2699],
  13765. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  13766. 0.1917],
  13767. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  13768. 0.1000],
  13769. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  13770. 0.2776],
  13771. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  13772. 0.1982],
  13773. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  13774. 0.2006],
  13775. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  13776. 0.2776],
  13777. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  13778. 0.1779]]], device='cuda:0')
  13779. loss_train_step before backward: tensor(0.0430, device='cuda:0', grad_fn=<MseLossBackward>)
  13780. loss_train_step after backward: tensor(0.0430, device='cuda:0', grad_fn=<MseLossBackward>)
  13781. loss_train: 2.067306305281818
  13782. step: 49
  13783. running loss: 0.04218992459758812
  13784.  
  13785. Train Steps: 49/90 Loss: 0.0422 torch.Size([8, 600, 800])
  13786. torch.Size([8, 8])
  13787. tensor([[0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  13788. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  13789. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  13790. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  13791. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  13792. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  13793. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  13794. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533]],
  13795. device='cuda:0', dtype=torch.float64)
  13796. predictions are: tensor([[ 0.5385, -0.4836, 1.2245, -0.9226, -0.4233, -1.0781, 0.2606, 0.1285],
  13797. [ 0.6310, -0.4203, 1.2385, -0.8954, -0.5206, -0.7738, 0.6003, 0.1909],
  13798. [ 0.7104, -0.3214, 1.5186, -0.3326, -0.2686, -0.7922, 0.3363, 0.3189],
  13799. [ 0.8336, -0.3251, 1.8312, -0.2580, -0.6616, -0.3110, 0.6699, 0.0044],
  13800. [ 0.6117, -0.4478, 1.7861, 0.4758, -0.2638, 0.4468, 0.2286, 0.1295],
  13801. [ 0.6076, -0.4409, 1.5538, -0.6097, -0.7504, -0.3698, 0.2756, 0.2015],
  13802. [ 0.5570, -0.4618, 1.5436, -0.8213, -0.4644, -0.8386, 0.4805, 0.1029],
  13803. [-1.1730, -1.5919, 0.9783, -1.0332, -0.4394, -1.1426, 0.3340, 0.2623]],
  13804. device='cuda:0', grad_fn=<AddmmBackward>)
  13805. landmarks are: tensor([[[ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  13806. 0.0774],
  13807. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  13808. 0.2391],
  13809. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  13810. 0.5882],
  13811. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  13812. -0.0670],
  13813. [ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  13814. 0.0261],
  13815. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  13816. 0.2776],
  13817. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  13818. 0.0807],
  13819. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  13820. 0.2699]]], device='cuda:0')
  13821. loss_train_step before backward: tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward>)
  13822. loss_train_step after backward: tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward>)
  13823. loss_train: 2.1241164905950427
  13824. step: 50
  13825. running loss: 0.04248232981190085
  13826. Train Steps: 50/90 Loss: 0.0425 torch.Size([8, 600, 800])
  13827. torch.Size([8, 8])
  13828. tensor([[0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  13829. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  13830. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  13831. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  13832. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  13833. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  13834. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  13835. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417]],
  13836. device='cuda:0', dtype=torch.float64)
  13837. predictions are: tensor([[ 0.7524, -0.3048, 1.7285, 0.0559, -0.5789, -0.3614, 0.4482, 0.2964],
  13838. [ 0.6012, -0.4074, 1.7178, -0.2578, -0.3618, 0.1045, 0.5429, 0.2140],
  13839. [ 0.7497, -0.3409, 1.7492, 0.1629, -0.3651, 0.2797, 0.8453, 0.2304],
  13840. [-1.1396, -1.5549, 1.0833, -1.2028, -0.4997, -1.1879, 0.1421, 0.2040],
  13841. [ 0.7176, -0.3714, 1.7701, -0.4835, -0.6730, -0.7595, 0.3634, 0.0367],
  13842. [ 0.5878, -0.4171, 1.6346, 0.3001, -0.3926, -0.0520, 0.1840, 0.1566],
  13843. [ 0.6174, -0.4194, 1.3560, -1.0567, -0.6214, -1.0043, 0.3839, 0.2182],
  13844. [ 0.4703, -0.5073, 1.3387, -1.1426, -0.4838, -1.0649, 0.5185, 0.2052]],
  13845. device='cuda:0', grad_fn=<AddmmBackward>)
  13846. landmarks are: tensor([[[ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  13847. 0.3623],
  13848. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  13849. 0.3161],
  13850. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  13851. 0.3371],
  13852. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  13853. 0.2853],
  13854. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  13855. 0.0620],
  13856. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  13857. 0.2048],
  13858. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  13859. 0.3392],
  13860. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  13861. 0.2160]]], device='cuda:0')
  13862. loss_train_step before backward: tensor(0.0363, device='cuda:0', grad_fn=<MseLossBackward>)
  13863. loss_train_step after backward: tensor(0.0363, device='cuda:0', grad_fn=<MseLossBackward>)
  13864. loss_train: 2.1603687768802047
  13865. step: 51
  13866. running loss: 0.04236017209569029
  13867. Train Steps: 51/90 Loss: 0.0424 torch.Size([8, 600, 800])
  13868. torch.Size([8, 8])
  13869. tensor([[0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  13870. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280],
  13871. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  13872. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  13873. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  13874. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  13875. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  13876. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649]],
  13877. device='cuda:0', dtype=torch.float64)
  13878. predictions are: tensor([[ 0.7951, -0.3181, 1.3667, -0.9975, -0.6434, -0.7699, 0.4930, 0.1455],
  13879. [ 0.6817, -0.3643, 1.6849, -0.0330, -0.1792, -0.0081, 0.2371, 0.2157],
  13880. [ 0.5805, -0.4193, 1.4511, -0.7298, -0.5682, -1.1159, 0.2997, 0.2842],
  13881. [ 0.7572, -0.3580, 1.8490, -0.1689, -0.4425, 0.1329, 0.8386, 0.1823],
  13882. [-1.5188, -1.8176, 1.2768, -1.1645, -0.4267, -1.1418, 0.3316, 0.2596],
  13883. [ 0.8045, -0.2769, 1.7545, -0.1248, -0.5806, -0.3896, 0.5359, 0.3604],
  13884. [ 0.3195, -0.5944, 1.3143, -1.0067, -0.6936, -0.9331, 0.1250, 0.2017],
  13885. [ 0.8338, -0.3000, 1.6501, 0.2392, -0.5147, -0.1556, 0.5634, 0.1801]],
  13886. device='cuda:0', grad_fn=<AddmmBackward>)
  13887. landmarks are: tensor([[[ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  13888. 0.0942],
  13889. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  13890. 0.1530],
  13891. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  13892. 0.3928],
  13893. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  13894. 0.1236],
  13895. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  13896. 0.3007],
  13897. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  13898. 0.3623],
  13899. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  13900. 0.3220],
  13901. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  13902. -0.1385]]], device='cuda:0')
  13903. loss_train_step before backward: tensor(0.0298, device='cuda:0', grad_fn=<MseLossBackward>)
  13904. loss_train_step after backward: tensor(0.0298, device='cuda:0', grad_fn=<MseLossBackward>)
  13905. loss_train: 2.1901937695220113
  13906. step: 52
  13907. running loss: 0.04211911095234637
  13908. Train Steps: 52/90 Loss: 0.0421 torch.Size([8, 600, 800])
  13909. torch.Size([8, 8])
  13910. tensor([[0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  13911. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  13912. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  13913. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  13914. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  13915. [0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  13916. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  13917. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436]],
  13918. device='cuda:0', dtype=torch.float64)
  13919. predictions are: tensor([[ 0.2910, -0.6319, 0.8737, -1.2362, -0.5089, -1.1692, 0.2117, 0.3007],
  13920. [ 0.5419, -0.4641, 1.7910, -0.0319, -0.4816, 0.1344, 0.4855, 0.1718],
  13921. [ 0.4724, -0.5371, 1.8747, -0.3285, -0.5541, -0.7206, 0.4187, 0.2375],
  13922. [ 0.4847, -0.4866, 1.0764, -1.1323, -0.4219, -1.1624, 0.3798, 0.4126],
  13923. [ 0.3838, -0.5823, 1.7736, -0.6931, -0.6253, -0.8531, 0.3493, 0.2185],
  13924. [ 0.4651, -0.5428, 1.7617, 0.0150, -0.6195, 0.0082, 0.4829, 0.1659],
  13925. [-0.0310, -0.8469, 1.2318, -1.2809, -0.3572, -1.3031, 0.5550, 0.2932],
  13926. [ 0.6677, -0.3943, 1.7676, 0.1537, -0.4608, 0.2785, 0.6763, 0.2784]],
  13927. device='cuda:0', grad_fn=<AddmmBackward>)
  13928. landmarks are: tensor([[[ 5.4827e-01, -3.9908e-01, 8.0300e-01, -1.2159e+00, -5.0185e-01,
  13929. -1.1928e+00, 2.6243e-01, 3.8516e-01],
  13930. [ 6.0716e-01, -4.2502e-01, 1.8249e+00, -7.2363e-03, -4.0370e-01,
  13931. 1.0824e-01, 6.7296e-01, -8.8090e-02],
  13932. [ 6.0935e-01, -3.9469e-01, 1.8885e+00, -2.9977e-01, -5.7691e-01,
  13933. -6.7698e-01, 6.0670e-01, 1.0054e-01],
  13934. [ 5.6871e-01, -4.0878e-01, 1.0397e+00, -1.1466e+00, -3.1132e-01,
  13935. -1.1928e+00, 4.6813e-01, 5.8553e-01],
  13936. [ 5.7921e-01, -4.0523e-01, 1.8214e+00, -6.5874e-01, -5.3842e-01,
  13937. -8.9239e-01, 4.3812e-01, 2.4425e-01],
  13938. [ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  13939. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  13940. [ 5.9169e-01, -3.8607e-01, 1.0455e+00, -1.3698e+00, -2.8822e-01,
  13941. -1.1928e+00, 6.0670e-01, 2.0831e-01],
  13942. [ 6.4212e-01, -3.8157e-01, 1.7037e+00, 1.9292e-01, -4.0370e-01,
  13943. 2.3911e-01, 1.1861e+00, 2.2489e-01]]], device='cuda:0')
  13944. loss_train_step before backward: tensor(0.0241, device='cuda:0', grad_fn=<MseLossBackward>)
  13945. loss_train_step after backward: tensor(0.0241, device='cuda:0', grad_fn=<MseLossBackward>)
  13946. loss_train: 2.2142448211088777
  13947. step: 53
  13948. running loss: 0.04177820417186562
  13949.  
  13950. Train Steps: 53/90 Loss: 0.0418 torch.Size([8, 600, 800])
  13951. torch.Size([8, 8])
  13952. tensor([[0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  13953. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  13954. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  13955. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  13956. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  13957. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  13958. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  13959. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749]],
  13960. device='cuda:0', dtype=torch.float64)
  13961. predictions are: tensor([[ 2.5260e-02, -7.6672e-01, 1.0277e+00, -1.2165e+00, -3.4002e-01,
  13962. -1.3102e+00, 4.8023e-01, 3.9226e-01],
  13963. [ 6.2153e-01, -4.3315e-01, 1.9337e+00, 1.7966e-03, -5.1253e-01,
  13964. 9.0811e-02, 5.9042e-01, 1.6422e-01],
  13965. [ 4.9724e-01, -5.0812e-01, 1.6399e+00, -7.6851e-01, -6.8466e-01,
  13966. -7.5338e-01, 3.2359e-01, 3.3033e-01],
  13967. [ 6.1532e-01, -4.3510e-01, 1.4187e+00, -8.1107e-01, -6.2200e-01,
  13968. -7.1508e-01, 4.0486e-01, 1.7140e-01],
  13969. [ 3.6046e-01, -5.7041e-01, 1.3250e+00, -1.0281e+00, -6.1943e-01,
  13970. -6.3158e-01, 4.3742e-01, 2.4319e-01],
  13971. [ 3.0706e-01, -6.2405e-01, 1.9129e+00, -7.9856e-01, -4.4438e-01,
  13972. -9.1659e-01, 7.7821e-01, 1.9522e-01],
  13973. [ 5.9681e-01, -4.0429e-01, 1.6356e+00, 4.3390e-01, -3.5430e-01,
  13974. -3.2069e-01, 4.2337e-01, 4.7371e-01],
  13975. [ 2.7878e-01, -6.1629e-01, 1.1768e+00, -9.2799e-01, -6.1763e-01,
  13976. -7.4626e-01, 2.4131e-01, 3.0193e-01]], device='cuda:0',
  13977. grad_fn=<AddmmBackward>)
  13978. landmarks are: tensor([[[ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  13979. 0.2622],
  13980. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  13981. 0.2237],
  13982. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  13983. 0.3315],
  13984. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  13985. 0.0942],
  13986. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  13987. 0.2237],
  13988. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  13989. 0.1390],
  13990. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  13991. 0.4470],
  13992. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  13993. 0.3694]]], device='cuda:0')
  13994. loss_train_step before backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  13995. loss_train_step after backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  13996. loss_train: 2.2317135045304894
  13997. step: 54
  13998. running loss: 0.04132802786167573
  13999. Train Steps: 54/90 Loss: 0.0413 torch.Size([8, 600, 800])
  14000. torch.Size([8, 8])
  14001. tensor([[0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  14002. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  14003. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  14004. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103],
  14005. [0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  14006. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  14007. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  14008. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197]],
  14009. device='cuda:0', dtype=torch.float64)
  14010. predictions are: tensor([[ 0.3991, -0.5190, 1.6326, -0.1913, -0.3595, -0.1455, 0.4408, 0.2888],
  14011. [ 0.2619, -0.6540, 1.8745, -0.3648, -0.5207, -0.9587, 0.7523, 0.2107],
  14012. [ 0.3949, -0.5408, 0.8073, -1.4307, -0.5081, -1.3098, 0.3159, 0.3495],
  14013. [ 0.3794, -0.5318, 1.4255, -1.1229, -0.7340, -0.7321, 0.3473, 0.2941],
  14014. [ 0.3057, -0.5531, 1.3458, -1.0888, -0.5595, -1.1431, 0.3626, 0.4253],
  14015. [ 0.6391, -0.3797, 1.6804, 0.1259, -0.4331, -0.0430, 0.4921, 0.3337],
  14016. [ 0.5814, -0.4455, 1.7452, -0.0697, -0.6352, -0.1981, 0.7558, 0.1840],
  14017. [ 0.3373, -0.5463, 1.6790, -0.1625, -0.2885, -0.1123, 0.2628, 0.2724]],
  14018. device='cuda:0', grad_fn=<AddmmBackward>)
  14019. landmarks are: tensor([[[ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  14020. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  14021. [ 6.2730e-01, -4.2490e-01, 1.8654e+00, -6.1124e-02, -4.6721e-01,
  14022. -6.6928e-01, 1.0910e+00, 1.9818e-01],
  14023. [ 5.4827e-01, -3.9908e-01, 8.0300e-01, -1.2159e+00, -5.0185e-01,
  14024. -1.1928e+00, 2.6243e-01, 3.8516e-01],
  14025. [ 5.8863e-01, -3.7837e-01, 1.4554e+00, -9.0793e-01, -6.5774e-01,
  14026. -4.8453e-01, 3.4395e-01, 7.1216e-02],
  14027. [ 5.9348e-01, -3.5581e-01, 1.3284e+00, -6.9238e-01, -5.2494e-01,
  14028. -9.6182e-01, 3.3533e-01, 3.0839e-01],
  14029. [ 5.7419e-01, -3.7921e-01, 1.6460e+00, 3.0839e-01, -3.4596e-01,
  14030. 1.4673e-01, 4.1617e-01, 3.1609e-01],
  14031. [ 6.0589e-01, -4.1768e-01, 1.8087e+00, 1.9408e-01, -4.8680e-01,
  14032. -4.1391e-02, 8.0095e-01, 1.3848e-01],
  14033. [ 5.7696e-01, -3.6243e-01, 1.7326e+00, 5.4350e-02, -1.4965e-01,
  14034. 3.2379e-01, 2.3775e-01, 1.1464e-01]]], device='cuda:0')
  14035. loss_train_step before backward: tensor(0.0297, device='cuda:0', grad_fn=<MseLossBackward>)
  14036. loss_train_step after backward: tensor(0.0297, device='cuda:0', grad_fn=<MseLossBackward>)
  14037. loss_train: 2.261423231102526
  14038. step: 55
  14039. running loss: 0.04111678602004593
  14040. Train Steps: 55/90 Loss: 0.0411 torch.Size([8, 600, 800])
  14041. torch.Size([8, 8])
  14042. tensor([[0.6118, 0.4052, 0.8463, 0.3917, 0.3538, 0.3450, 0.5053, 0.5593],
  14043. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  14044. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  14045. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  14046. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  14047. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  14048. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  14049. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804]],
  14050. device='cuda:0', dtype=torch.float64)
  14051. predictions are: tensor([[ 0.0752, -0.7276, 1.4581, -0.7417, -0.6950, -0.7660, 0.0415, 0.3244],
  14052. [ 0.3550, -0.5610, 1.6460, -0.5112, -0.6129, -0.5533, 0.4340, 0.2236],
  14053. [ 0.4733, -0.4840, 1.6904, -0.1513, -0.3921, -0.0886, 0.5491, 0.2488],
  14054. [ 0.5271, -0.4809, 1.5573, 0.0957, -0.5033, -0.2430, 0.6557, 0.2935],
  14055. [ 0.3911, -0.4719, 1.0264, -1.1537, -0.1195, -1.2667, 0.3460, 0.4831],
  14056. [ 0.4838, -0.4367, 1.6707, -0.3050, -0.5068, -0.9674, 0.4554, 0.3163],
  14057. [ 0.3380, -0.5800, 1.6796, -0.6661, -0.6049, -0.2165, 0.6289, 0.3577],
  14058. [ 0.7290, -0.3204, 1.6073, -0.8694, -0.6387, -0.6692, 0.6848, 0.1262]],
  14059. device='cuda:0', grad_fn=<AddmmBackward>)
  14060. landmarks are: tensor([[[ 0.5399, -0.4142, 1.6229, -0.4768, -0.6520, -0.6924, 0.0481,
  14061. 0.2972],
  14062. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  14063. 0.0467],
  14064. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  14065. 0.1005],
  14066. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  14067. -0.1331],
  14068. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  14069. 0.5624],
  14070. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  14071. 0.1852],
  14072. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  14073. 0.3161],
  14074. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  14075. -0.0670]]], device='cuda:0')
  14076. loss_train_step before backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  14077. loss_train_step after backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  14078. loss_train: 2.296431795693934
  14079. step: 56
  14080. running loss: 0.04100771063739168
  14081. Train Steps: 56/90 Loss: 0.0410 torch.Size([8, 600, 800])
  14082. torch.Size([8, 8])
  14083. tensor([[0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  14084. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  14085. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  14086. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  14087. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  14088. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  14089. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  14090. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524]],
  14091. device='cuda:0', dtype=torch.float64)
  14092. predictions are: tensor([[-0.5338, -1.0908, 1.0218, -1.2956, -0.2762, -1.3676, 0.3314, 0.2925],
  14093. [ 0.7514, -0.3161, 1.7225, -0.0812, -0.4777, -0.1617, 0.6445, 0.1176],
  14094. [ 0.6451, -0.3701, 1.8502, -0.3280, -0.4483, -0.7106, 0.7212, 0.2513],
  14095. [ 0.7114, -0.2943, 1.5651, -0.8324, -0.6431, -0.5288, 0.6222, 0.2602],
  14096. [ 0.7963, -0.2482, 1.6338, -0.7183, -0.6423, -0.4676, 0.5556, 0.3234],
  14097. [-0.1757, -0.8331, 1.1903, -0.9809, -0.4011, -1.0549, 0.2312, 0.3846],
  14098. [ 0.4617, -0.4524, 1.3170, -0.5441, -0.5445, -0.7966, 0.2700, 0.4307],
  14099. [ 0.5571, -0.3778, 1.7054, 0.1239, -0.4832, -0.2008, 0.3696, 0.2623]],
  14100. device='cuda:0', grad_fn=<AddmmBackward>)
  14101. landmarks are: tensor([[[ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  14102. 0.1343],
  14103. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  14104. -0.0534],
  14105. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  14106. 0.1005],
  14107. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  14108. 0.2622],
  14109. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  14110. 0.3392],
  14111. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  14112. 0.3777],
  14113. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  14114. 0.4470],
  14115. [ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  14116. 0.2657]]], device='cuda:0')
  14117. loss_train_step before backward: tensor(0.1399, device='cuda:0', grad_fn=<MseLossBackward>)
  14118.  
  14119. loss_train_step after backward: tensor(0.1399, device='cuda:0', grad_fn=<MseLossBackward>)
  14120. loss_train: 2.436326772905886
  14121. step: 57
  14122. running loss: 0.042742574963261164
  14123. Train Steps: 57/90 Loss: 0.0427 torch.Size([8, 600, 800])
  14124. torch.Size([8, 8])
  14125. tensor([[0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  14126. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  14127. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  14128. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  14129. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  14130. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  14131. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  14132. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183]],
  14133. device='cuda:0', dtype=torch.float64)
  14134. predictions are: tensor([[ 3.8910e-01, -4.9305e-01, 1.6736e+00, -1.0089e+00, -2.0297e-01,
  14135. -1.2898e+00, 8.2985e-01, 3.0091e-01],
  14136. [ 4.2471e-01, -4.7600e-01, 1.7696e+00, -1.4306e-01, -4.9965e-01,
  14137. -9.5795e-02, 7.4937e-01, 2.1200e-01],
  14138. [ 5.2550e-01, -4.1549e-01, 1.6856e+00, -5.4736e-01, -4.8786e-01,
  14139. -3.7032e-01, 7.5352e-01, 2.1056e-01],
  14140. [ 4.8281e-01, -4.3335e-01, 1.8100e+00, 1.3539e-03, -3.4686e-01,
  14141. 2.0120e-01, 5.2785e-01, 3.4740e-01],
  14142. [ 4.8238e-01, -4.4421e-01, 1.1127e+00, -1.1223e+00, -4.4218e-01,
  14143. -1.2524e+00, 3.8058e-01, 2.7940e-01],
  14144. [ 2.9010e-01, -5.9548e-01, 1.1687e+00, -1.0469e+00, -6.2078e-01,
  14145. -1.0666e+00, 3.2697e-01, 1.9013e-01],
  14146. [ 3.8660e-01, -4.7169e-01, 1.3892e+00, -2.7819e-01, -6.6921e-01,
  14147. -3.4179e-01, -8.3418e-02, 1.6513e-01],
  14148. [ 4.1583e-01, -4.8280e-01, 1.3151e+00, -8.3128e-01, -5.0556e-01,
  14149. -9.7859e-01, 4.4635e-01, 5.0129e-01]], device='cuda:0',
  14150. grad_fn=<AddmmBackward>)
  14151. landmarks are: tensor([[[ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  14152. 0.3157],
  14153. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  14154. 0.2249],
  14155. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  14156. 0.2890],
  14157. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  14158. 0.4701],
  14159. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  14160. 0.2058],
  14161. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  14162. 0.0562],
  14163. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  14164. 0.1552],
  14165. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  14166. 0.5701]]], device='cuda:0')
  14167. loss_train_step before backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  14168. loss_train_step after backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  14169. loss_train: 2.4578881757333875
  14170. step: 58
  14171. running loss: 0.04237738234023082
  14172. Train Steps: 58/90 Loss: 0.0424 torch.Size([8, 600, 800])
  14173. torch.Size([8, 8])
  14174. tensor([[0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  14175. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  14176. [0.6272, 0.4045, 0.8538, 0.5900, 0.3750, 0.4417, 0.5989, 0.4649],
  14177. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  14178. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  14179. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  14180. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  14181. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433]],
  14182. device='cuda:0', dtype=torch.float64)
  14183. predictions are: tensor([[ 0.4276, -0.4216, 1.0481, -1.0719, -0.1652, -1.3034, 0.2338, 0.3338],
  14184. [ 0.6741, -0.2671, 1.6596, 0.0128, -0.5760, -0.7280, 0.2549, 0.2385],
  14185. [ 0.5957, -0.3851, 1.6734, 0.3216, -0.6498, -0.2558, 0.4546, 0.1138],
  14186. [ 0.6606, -0.3073, 1.7693, -0.5237, -0.6310, -0.6105, 0.7902, 0.2340],
  14187. [-0.8477, -1.3076, 1.6011, -1.1105, 0.0148, -1.0858, 0.9775, 0.3887],
  14188. [ 0.6939, -0.2546, 1.6675, -0.2473, -0.4186, 0.2012, 0.3346, 0.2056],
  14189. [ 0.5684, -0.3351, 1.5003, -1.0045, -0.4395, -0.9511, 0.5698, 0.2595],
  14190. [ 0.5738, -0.3424, 1.1729, -1.0006, -0.6760, -0.5028, 0.3477, 0.2576]],
  14191. device='cuda:0', grad_fn=<AddmmBackward>)
  14192. landmarks are: tensor([[[ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  14193. 0.2160],
  14194. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  14195. 0.1852],
  14196. [ 0.6109, -0.4177, 1.6575, 0.4393, -0.5538, -0.2459, 0.4805,
  14197. -0.1385],
  14198. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  14199. 0.2890],
  14200. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  14201. 0.3371],
  14202. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  14203. 0.2699],
  14204. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  14205. 0.1467],
  14206. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  14207. 0.2237]]], device='cuda:0')
  14208. loss_train_step before backward: tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward>)
  14209. loss_train_step after backward: tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward>)
  14210. loss_train: 2.520900216884911
  14211. step: 59
  14212. running loss: 0.04272712232008324
  14213. Train Steps: 59/90 Loss: 0.0427 torch.Size([8, 600, 800])
  14214. torch.Size([8, 8])
  14215. tensor([[0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  14216. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  14217. [0.6314, 0.4107, 0.8750, 0.5100, 0.3788, 0.4900, 0.7121, 0.5864],
  14218. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  14219. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  14220. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  14221. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  14222. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927]],
  14223. device='cuda:0', dtype=torch.float64)
  14224. predictions are: tensor([[ 0.9893, -0.0856, 1.4816, -1.0489, -0.1731, -1.3726, 0.6884, 0.1718],
  14225. [ 0.5411, -0.3862, 1.4689, 0.1822, -0.3924, -0.1881, 0.3981, 0.4081],
  14226. [ 0.5717, -0.3800, 1.8185, 0.0153, -0.4474, -0.1558, 0.8028, 0.2387],
  14227. [ 0.0362, -0.6552, 1.6265, -0.2109, -0.3773, -0.2945, 0.1722, 0.2111],
  14228. [ 0.5384, -0.3899, 1.8012, -0.2197, -0.4780, -0.1419, 0.7585, 0.1865],
  14229. [ 0.3051, -0.5194, 1.7123, -0.9239, -0.4580, -0.9475, 0.5561, 0.2275],
  14230. [-0.0521, -0.7613, 1.2508, -1.1285, -0.5612, -0.7800, 0.2824, 0.3768],
  14231. [ 0.6793, -0.2890, 1.6110, -0.4560, -0.6494, -0.4286, 0.3983, 0.0995]],
  14232. device='cuda:0', grad_fn=<AddmmBackward>)
  14233. landmarks are: tensor([[[ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  14234. 0.0953],
  14235. [ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  14236. 0.5393],
  14237. [ 0.6306, -0.3888, 1.7557, 0.0697, -0.5365, -0.0226, 1.0033,
  14238. 0.4226],
  14239. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  14240. 0.1439],
  14241. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  14242. 0.2302],
  14243. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  14244. 0.1390],
  14245. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  14246. 0.3469],
  14247. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  14248. -0.0099]]], device='cuda:0')
  14249. loss_train_step before backward: tensor(0.0357, device='cuda:0', grad_fn=<MseLossBackward>)
  14250. loss_train_step after backward: tensor(0.0357, device='cuda:0', grad_fn=<MseLossBackward>)
  14251. loss_train: 2.5565678672865033
  14252. step: 60
  14253. running loss: 0.04260946445477506
  14254. Train Steps: 60/90 Loss: 0.0426 torch.Size([8, 600, 800])
  14255. torch.Size([8, 8])
  14256. tensor([[0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  14257. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  14258. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  14259. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  14260. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  14261. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  14262. [0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  14263. [0.6110, 0.4047, 0.8700, 0.4483, 0.3713, 0.3967, 0.5088, 0.5517]],
  14264. device='cuda:0', dtype=torch.float64)
  14265. predictions are: tensor([[ 0.7788, -0.2101, 1.7978, -0.4085, -0.6473, -0.3535, 0.1756, 0.1227],
  14266. [ 0.8946, -0.1416, 1.6702, -0.9497, 0.0064, -1.1562, 0.9449, 0.2182],
  14267. [ 0.9714, -0.1470, 1.8020, 0.1940, -0.4284, 0.0314, 0.6996, 0.1681],
  14268. [-0.5611, -1.1197, 0.9617, -1.1811, -0.3930, -1.2175, 0.3303, 0.3160],
  14269. [-1.0809, -1.4155, 0.9003, -1.1566, -0.3876, -1.1537, 0.2993, 0.4127],
  14270. [ 0.6877, -0.3139, 1.9421, 0.1481, -0.5822, -0.3625, 0.5538, 0.1134],
  14271. [ 0.7454, -0.2486, 1.7348, -0.7554, -0.2176, -0.6656, 0.9340, 0.1684],
  14272. [ 0.8294, -0.1889, 1.6893, -0.1422, -0.6164, -0.2008, 0.1228, 0.2367]],
  14273. device='cuda:0', grad_fn=<AddmmBackward>)
  14274. landmarks are: tensor([[[ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  14275. -0.0310],
  14276. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  14277. 0.2356],
  14278. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  14279. 0.1979],
  14280. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  14281. 0.1013],
  14282. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  14283. 0.4543],
  14284. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  14285. -0.0049],
  14286. [ 0.6224, -0.4105, 1.9173, -0.7771, -0.1030, -0.7308, 1.1532,
  14287. 0.1875],
  14288. [ 0.5363, -0.4168, 1.7326, -0.2151, -0.5711, -0.4537, 0.0640,
  14289. 0.2622]]], device='cuda:0')
  14290. loss_train_step before backward: tensor(0.0806, device='cuda:0', grad_fn=<MseLossBackward>)
  14291. loss_train_step after backward: tensor(0.0806, device='cuda:0', grad_fn=<MseLossBackward>)
  14292. loss_train: 2.6371513130143285
  14293. step: 61
  14294. running loss: 0.04323198873793981
  14295.  
  14296. Train Steps: 61/90 Loss: 0.0432 torch.Size([8, 600, 800])
  14297. torch.Size([8, 8])
  14298. tensor([[0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  14299. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  14300. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  14301. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  14302. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  14303. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  14304. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  14305. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517]],
  14306. device='cuda:0', dtype=torch.float64)
  14307. predictions are: tensor([[ 0.5904, -0.3481, 1.3853, -0.9300, -0.7038, -0.5478, 0.6628, 0.1901],
  14308. [ 0.7472, -0.2219, 1.4910, -0.8652, -0.2222, -1.3944, 0.4443, 0.2165],
  14309. [ 0.5629, -0.3763, 1.8600, -0.0448, -0.2762, -0.1915, 0.5234, 0.1410],
  14310. [ 0.7760, -0.2245, 1.2375, -0.9950, -0.6542, -0.6808, 0.6083, 0.2506],
  14311. [-2.2670, -2.2596, 1.1679, -1.1750, -0.4814, -1.3681, 0.2612, 0.2891],
  14312. [ 0.9036, -0.1748, 1.7474, 0.1289, -0.1123, -0.3393, 0.3888, 0.2046],
  14313. [ 0.9780, -0.1009, 1.8675, -0.0857, -0.2561, -0.0475, 0.7317, 0.1477],
  14314. [ 0.9501, -0.1388, 1.8309, -0.0459, -0.2355, 0.0528, 0.6644, 0.2409]],
  14315. device='cuda:0', grad_fn=<AddmmBackward>)
  14316. landmarks are: tensor([[[ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  14317. 0.2545],
  14318. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  14319. 0.2083],
  14320. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  14321. 0.2622],
  14322. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  14323. 0.3546],
  14324. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  14325. 0.1373],
  14326. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  14327. 0.2237],
  14328. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  14329. 0.2237],
  14330. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  14331. 0.2622]]], device='cuda:0')
  14332. loss_train_step before backward: tensor(0.0268, device='cuda:0', grad_fn=<MseLossBackward>)
  14333. loss_train_step after backward: tensor(0.0268, device='cuda:0', grad_fn=<MseLossBackward>)
  14334. loss_train: 2.6639770111069083
  14335. step: 62
  14336. running loss: 0.04296737114688562
  14337. Train Steps: 62/90 Loss: 0.0430 torch.Size([8, 600, 800])
  14338. torch.Size([8, 8])
  14339. tensor([[0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  14340. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  14341. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  14342. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  14343. [0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  14344. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  14345. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  14346. [0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748]],
  14347. device='cuda:0', dtype=torch.float64)
  14348. predictions are: tensor([[ 0.3569, -0.4949, 1.6938, -0.3559, -0.2054, 0.1943, 0.5201, 0.1686],
  14349. [ 0.4867, -0.4273, 1.7035, -0.3954, -0.6700, -0.4678, 0.2266, 0.1097],
  14350. [ 0.6877, -0.3373, 1.6928, 0.1891, -0.4250, -0.0477, 0.4994, 0.1601],
  14351. [-0.9558, -1.3822, 1.5410, -1.2279, 0.1464, -1.2743, 0.9212, 0.3460],
  14352. [ 0.9958, -0.1204, 1.7140, -0.5015, -0.3964, -0.9068, 0.7189, 0.0435],
  14353. [ 0.8597, -0.1777, 1.4339, -1.0562, -0.4009, -0.8427, 0.4997, 0.2891],
  14354. [ 0.3033, -0.5074, 1.3019, -0.7391, -0.6111, -0.5300, 0.2686, 0.2457],
  14355. [ 0.5942, -0.3914, 1.8203, 0.0827, -0.3343, -0.6801, 0.7941, 0.2058]],
  14356. device='cuda:0', grad_fn=<AddmmBackward>)
  14357. landmarks are: tensor([[[ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  14358. 0.2936],
  14359. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  14360. 0.0862],
  14361. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  14362. 0.1544],
  14363. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  14364. 0.2730],
  14365. [ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  14366. 0.0539],
  14367. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  14368. 0.3392],
  14369. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  14370. 0.3417],
  14371. [ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  14372. 0.3692]]], device='cuda:0')
  14373. loss_train_step before backward: tensor(0.0702, device='cuda:0', grad_fn=<MseLossBackward>)
  14374. loss_train_step after backward: tensor(0.0702, device='cuda:0', grad_fn=<MseLossBackward>)
  14375. loss_train: 2.7341925194486976
  14376. step: 63
  14377. running loss: 0.043399881261090435
  14378. Train Steps: 63/90 Loss: 0.0434 torch.Size([8, 600, 800])
  14379. torch.Size([8, 8])
  14380. tensor([[0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  14381. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  14382. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  14383. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  14384. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  14385. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  14386. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  14387. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097]],
  14388. device='cuda:0', dtype=torch.float64)
  14389. predictions are: tensor([[ 0.8489, -0.2227, 1.7997, -0.5051, -0.4486, -0.5622, 0.6693, 0.2327],
  14390. [ 0.2771, -0.5652, 1.6160, -0.3772, -0.4482, -0.3172, 0.3491, 0.1680],
  14391. [ 0.1536, -0.6882, 1.8718, -0.3745, -0.4070, 0.1483, 0.8937, 0.1137],
  14392. [ 0.5407, -0.3957, 1.7259, -0.1100, -0.5389, -0.6844, 0.4568, 0.2921],
  14393. [ 0.3525, -0.5436, 0.8690, -1.2150, -0.4159, -1.3178, 0.2979, 0.2886],
  14394. [ 0.5503, -0.4333, 1.7132, 0.0185, -0.0879, -0.1173, 0.5199, 0.1360],
  14395. [ 0.4545, -0.4887, 1.8710, -0.6144, -0.2999, -1.2758, 0.7149, 0.0996],
  14396. [ 0.3100, -0.5452, 1.8769, -0.2250, -0.1633, 0.1682, 0.5864, 0.1355]],
  14397. device='cuda:0', grad_fn=<AddmmBackward>)
  14398. landmarks are: tensor([[[ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  14399. 0.3238],
  14400. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  14401. 0.3265],
  14402. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  14403. 0.1005],
  14404. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  14405. 0.3161],
  14406. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  14407. 0.3546],
  14408. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  14409. 0.0851],
  14410. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  14411. -0.0049],
  14412. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  14413. 0.0682]]], device='cuda:0')
  14414. loss_train_step before backward: tensor(0.0240, device='cuda:0', grad_fn=<MseLossBackward>)
  14415. loss_train_step after backward: tensor(0.0240, device='cuda:0', grad_fn=<MseLossBackward>)
  14416. loss_train: 2.7581892935559154
  14417. step: 64
  14418. running loss: 0.04309670771181118
  14419. Train Steps: 64/90 Loss: 0.0431 torch.Size([8, 600, 800])
  14420. torch.Size([8, 8])
  14421. tensor([[0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  14422. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  14423. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  14424. [0.6239, 0.4206, 0.8750, 0.5400, 0.3688, 0.4850, 0.5737, 0.5700],
  14425. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  14426. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  14427. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  14428. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167]],
  14429. device='cuda:0', dtype=torch.float64)
  14430. predictions are: tensor([[ 0.5196, -0.4510, 1.7051, -0.8963, -0.5621, -1.1083, 0.6279, 0.0341],
  14431. [ 0.4282, -0.4812, 1.6406, -0.0781, 0.0335, -0.6546, 0.3637, 0.3195],
  14432. [ 0.3719, -0.5328, 1.7015, -0.3336, -0.2812, -0.1746, 0.2990, 0.2221],
  14433. [ 0.5406, -0.4317, 1.7712, -0.1215, -0.4843, -0.2928, 0.5235, 0.1871],
  14434. [ 0.6402, -0.3560, 1.6619, 0.0413, -0.3322, -0.5363, 0.4270, 0.3390],
  14435. [ 0.6243, -0.4074, 1.6774, -0.2420, -0.3619, -0.3324, 0.7050, 0.0932],
  14436. [ 0.3252, -0.5740, 1.8606, -0.2420, -0.3334, 0.1080, 0.7974, 0.2020],
  14437. [ 0.1856, -0.6645, 1.8283, -0.6080, -0.4700, 0.0561, 0.7195, 0.0907]],
  14438. device='cuda:0', grad_fn=<AddmmBackward>)
  14439. landmarks are: tensor([[[ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  14440. 0.1963],
  14441. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  14442. 0.4547],
  14443. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  14444. 0.3777],
  14445. [ 0.5960, -0.3430, 1.7557, 0.2083, -0.5827, -0.0457, 0.3642,
  14446. 0.3469],
  14447. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  14448. 0.4624],
  14449. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  14450. 0.0774],
  14451. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  14452. 0.3157],
  14453. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  14454. 0.1005]]], device='cuda:0')
  14455. loss_train_step before backward: tensor(0.0390, device='cuda:0', grad_fn=<MseLossBackward>)
  14456. loss_train_step after backward: tensor(0.0390, device='cuda:0', grad_fn=<MseLossBackward>)
  14457. loss_train: 2.797200477682054
  14458. step: 65
  14459. running loss: 0.04303385350280083
  14460.  
  14461. Train Steps: 65/90 Loss: 0.0430 torch.Size([8, 600, 800])
  14462. torch.Size([8, 8])
  14463. tensor([[0.6203, 0.4078, 0.8800, 0.5083, 0.3900, 0.5000, 0.6100, 0.5583],
  14464. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  14465. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  14466. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  14467. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  14468. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  14469. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  14470. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044]],
  14471. device='cuda:0', dtype=torch.float64)
  14472. predictions are: tensor([[ 0.6687, -0.3593, 1.8971, 0.1707, -0.4330, 0.0961, 0.6451, 0.1299],
  14473. [ 0.5644, -0.4138, 1.7877, 0.0097, -0.0366, -0.0669, 0.4079, 0.2327],
  14474. [ 0.7685, -0.2672, 1.7709, -0.5620, -0.6552, -0.2216, 0.4247, 0.1788],
  14475. [-1.0692, -1.4496, 1.1144, -1.0959, -0.2064, -1.3422, 0.3366, 0.3403],
  14476. [ 0.3732, -0.5458, 1.8620, 0.0651, -0.0702, -0.0228, 0.4075, 0.1777],
  14477. [ 0.4668, -0.4828, 1.4026, -0.9949, -0.5788, -0.5876, 0.6636, 0.2020],
  14478. [ 0.5879, -0.4394, 1.9501, 0.2348, -0.5701, -0.4968, 0.7669, 0.0505],
  14479. [ 0.9447, -0.1949, 1.2377, -1.2274, -0.2411, -1.2837, 0.5303, 0.2160]],
  14480. device='cuda:0', grad_fn=<AddmmBackward>)
  14481. landmarks are: tensor([[[ 0.5794, -0.4023, 1.7788, 0.0620, -0.4845, 0.0236, 0.5316,
  14482. 0.2930],
  14483. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  14484. 0.3087],
  14485. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  14486. 0.0802],
  14487. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  14488. 0.3084],
  14489. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  14490. 0.3392],
  14491. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  14492. 0.2237],
  14493. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  14494. -0.0957],
  14495. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  14496. 0.0438]]], device='cuda:0')
  14497. loss_train_step before backward: tensor(0.0485, device='cuda:0', grad_fn=<MseLossBackward>)
  14498. loss_train_step after backward: tensor(0.0485, device='cuda:0', grad_fn=<MseLossBackward>)
  14499. loss_train: 2.845730713568628
  14500. step: 66
  14501. running loss: 0.04311713202376709
  14502. Train Steps: 66/90 Loss: 0.0431 torch.Size([8, 600, 800])
  14503. torch.Size([8, 8])
  14504. tensor([[0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  14505. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  14506. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  14507. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  14508. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  14509. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  14510. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  14511. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528]],
  14512. device='cuda:0', dtype=torch.float64)
  14513. predictions are: tensor([[ 0.3285, -0.5892, 1.8296, -0.5351, -0.5713, -0.4515, 0.6056, 0.1702],
  14514. [ 0.1763, -0.6597, 1.6175, 0.2585, -0.3035, 0.0659, 0.3303, 0.1897],
  14515. [ 0.4622, -0.5033, 1.6857, -0.1942, -0.5921, -0.4273, 0.6031, 0.1828],
  14516. [ 0.2868, -0.5815, 1.7712, -0.0843, -0.2788, 0.4183, 0.5205, 0.2098],
  14517. [ 0.4892, -0.4744, 1.8808, -0.3870, -0.2168, -0.9448, 0.8276, 0.1716],
  14518. [ 0.4710, -0.4649, 1.6061, 0.1596, -0.1887, 0.1203, 0.1593, 0.2353],
  14519. [ 0.7560, -0.3035, 1.0503, -1.2743, -0.3153, -1.2866, 0.1925, 0.1969],
  14520. [ 0.5216, -0.4476, 1.9730, -0.6449, -0.3307, -0.5987, 0.9147, 0.1548]],
  14521. device='cuda:0', grad_fn=<AddmmBackward>)
  14522. landmarks are: tensor([[[ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  14523. 0.1544],
  14524. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  14525. 0.2237],
  14526. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  14527. 0.1768],
  14528. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  14529. 0.0928],
  14530. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  14531. 0.2142],
  14532. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  14533. 0.2364],
  14534. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  14535. 0.0774],
  14536. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  14537. 0.2676]]], device='cuda:0')
  14538. loss_train_step before backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  14539. loss_train_step after backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  14540. loss_train: 2.86319727730006
  14541. step: 67
  14542. running loss: 0.042734287720896415
  14543. Train Steps: 67/90 Loss: 0.0427 torch.Size([8, 600, 800])
  14544. torch.Size([8, 8])
  14545. tensor([[0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  14546. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  14547. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  14548. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  14549. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  14550. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  14551. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  14552. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960]],
  14553. device='cuda:0', dtype=torch.float64)
  14554. predictions are: tensor([[ 0.4266, -0.5112, 1.7698, 0.0365, -0.0220, 0.1191, 0.4562, 0.2976],
  14555. [ 0.4087, -0.5572, 1.9169, 0.0073, -0.5026, 0.2506, 0.6863, 0.1113],
  14556. [ 0.1075, -0.7343, 1.3653, -0.8740, -0.4800, -0.9601, 0.2076, 0.2042],
  14557. [ 0.3999, -0.5319, 1.7445, -0.3835, -0.6190, -0.5022, 0.2338, 0.1659],
  14558. [ 0.5842, -0.4576, 1.6458, -0.9018, -0.4912, -0.6226, 1.0400, 0.1461],
  14559. [ 0.7194, -0.3208, 1.6277, 0.1032, -0.2578, -0.7793, 0.5120, 0.4292],
  14560. [ 0.5912, -0.4189, 1.2441, -1.0201, -0.4948, -0.9039, 0.3610, 0.1170],
  14561. [ 0.3899, -0.5879, 1.9004, 0.0208, -0.1882, 0.1316, 0.4283, 0.0949]],
  14562. device='cuda:0', grad_fn=<AddmmBackward>)
  14563. landmarks are: tensor([[[ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  14564. 0.3007],
  14565. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  14566. 0.2237],
  14567. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  14568. -0.0220],
  14569. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  14570. 0.0851],
  14571. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  14572. 0.1608],
  14573. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  14574. 0.5762],
  14575. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  14576. -0.1031],
  14577. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  14578. 0.0051]]], device='cuda:0')
  14579. loss_train_step before backward: tensor(0.0202, device='cuda:0', grad_fn=<MseLossBackward>)
  14580. loss_train_step after backward: tensor(0.0202, device='cuda:0', grad_fn=<MseLossBackward>)
  14581. loss_train: 2.883371683768928
  14582. step: 68
  14583. running loss: 0.042402524761307764
  14584. Train Steps: 68/90 Loss: 0.0424 torch.Size([8, 600, 800])
  14585. torch.Size([8, 8])
  14586. tensor([[0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  14587. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  14588. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  14589. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  14590. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  14591. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  14592. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  14593. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633]],
  14594. device='cuda:0', dtype=torch.float64)
  14595. predictions are: tensor([[ 1.0256, -0.1258, 1.8074, -0.7311, -0.2773, -0.7034, 0.7876, 0.1885],
  14596. [-1.4408, -1.7286, 1.1651, -1.0770, -0.1554, -0.9629, 0.2680, 0.3037],
  14597. [ 0.9199, -0.2048, 1.3228, -1.0172, -0.2033, -1.1164, 0.5515, 0.1754],
  14598. [ 1.0787, -0.1060, 1.6983, -0.5107, -0.6539, -0.3158, 0.4087, 0.2556],
  14599. [-1.2559, -1.5952, 1.3378, -0.7338, -0.5142, -0.7789, 0.1824, 0.2635],
  14600. [ 0.8443, -0.2714, 1.8309, -0.3378, -0.5479, -0.5533, 0.6412, 0.0626],
  14601. [ 0.9600, -0.2078, 1.8367, 0.3667, -0.4265, 0.3660, 0.4879, 0.1222],
  14602. [ 0.9529, -0.1759, 1.7623, 0.5614, -0.3391, 0.2584, 0.3591, 0.2860]],
  14603. device='cuda:0', grad_fn=<AddmmBackward>)
  14604. landmarks are: tensor([[[ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  14605. 0.1467],
  14606. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  14607. 0.3238],
  14608. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  14609. 0.2203],
  14610. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  14611. 0.3315],
  14612. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  14613. 0.2699],
  14614. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  14615. 0.1963],
  14616. [ 0.5767, -0.4396, 1.6782, 0.1905, -0.3844, 0.0308, 0.4588,
  14617. 0.0855],
  14618. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  14619. 0.3161]]], device='cuda:0')
  14620. loss_train_step before backward: tensor(0.0832, device='cuda:0', grad_fn=<MseLossBackward>)
  14621. loss_train_step after backward: tensor(0.0832, device='cuda:0', grad_fn=<MseLossBackward>)
  14622. loss_train: 2.9666087506338954
  14623. step: 69
  14624. running loss: 0.042994329719331814
  14625.  
  14626. Train Steps: 69/90 Loss: 0.0430 torch.Size([8, 600, 800])
  14627. torch.Size([8, 8])
  14628. tensor([[0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  14629. [0.6339, 0.4102, 0.8588, 0.3133, 0.4425, 0.2117, 0.6417, 0.5089],
  14630. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  14631. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  14632. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  14633. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  14634. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  14635. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395]],
  14636. device='cuda:0', dtype=torch.float64)
  14637. predictions are: tensor([[ 0.0945, -0.7125, 1.0857, -0.9566, -0.3616, -0.9317, 0.1844, 0.2622],
  14638. [ 0.6179, -0.4146, 1.6800, -0.5893, -0.2319, -0.8998, 0.7288, 0.1170],
  14639. [ 0.4128, -0.5567, 1.8628, 0.3670, -0.6036, -0.1763, 0.3295, 0.0783],
  14640. [-0.0069, -0.8548, 1.7534, -0.8855, 0.1549, -1.0048, 0.9400, 0.2685],
  14641. [ 0.4008, -0.5571, 1.9227, -0.1961, -0.5610, -0.1070, 0.5655, 0.1825],
  14642. [ 0.7813, -0.2972, 1.7793, -0.0681, -0.6172, -0.1469, 0.3549, 0.2691],
  14643. [ 0.6439, -0.3781, 1.7482, -0.2119, -0.6423, 0.3156, 0.2430, 0.1745],
  14644. [ 0.5604, -0.4501, 1.1170, -1.0097, -0.3723, -0.8632, 0.3318, 0.2643]],
  14645. device='cuda:0', grad_fn=<AddmmBackward>)
  14646. landmarks are: tensor([[[ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  14647. 0.3267],
  14648. [ 0.6421, -0.3912, 1.6806, -0.8386, -0.2420, -1.3082, 0.6780,
  14649. 0.0646],
  14650. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  14651. -0.0049],
  14652. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  14653. 0.2142],
  14654. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  14655. 0.1544],
  14656. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  14657. 0.1544],
  14658. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  14659. 0.2776],
  14660. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  14661. 0.2058]]], device='cuda:0')
  14662. loss_train_step before backward: tensor(0.0494, device='cuda:0', grad_fn=<MseLossBackward>)
  14663. loss_train_step after backward: tensor(0.0494, device='cuda:0', grad_fn=<MseLossBackward>)
  14664. loss_train: 3.0159969767555594
  14665. step: 70
  14666. running loss: 0.043085671096507995
  14667. Train Steps: 70/90 Loss: 0.0431 torch.Size([8, 600, 800])
  14668. torch.Size([8, 8])
  14669. tensor([[0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  14670. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  14671. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  14672. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  14673. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  14674. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  14675. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  14676. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117]],
  14677. device='cuda:0', dtype=torch.float64)
  14678. predictions are: tensor([[ 0.6908, -0.4021, 1.8993, 0.1808, -0.5602, -0.0866, 0.6491, 0.1600],
  14679. [ 0.3828, -0.5673, 1.8360, -0.3507, -0.4966, 0.0851, 0.3386, 0.1186],
  14680. [ 0.7606, -0.3255, 1.8966, 0.1732, -0.3291, 0.5183, 0.7372, 0.2568],
  14681. [ 0.5708, -0.4434, 1.7218, -0.5815, -0.7062, -0.3660, 0.2640, 0.0845],
  14682. [ 0.6328, -0.3785, 1.7117, 0.1811, -0.4657, -0.6712, 0.3862, 0.3782],
  14683. [ 0.5071, -0.4653, 1.1100, -1.0328, -0.0600, -1.3080, 0.1529, 0.3689],
  14684. [-0.3958, -1.1060, 1.3111, -1.2376, -0.3739, -0.9371, 0.3930, 0.2738],
  14685. [ 0.4604, -0.5685, 1.9232, -0.0375, -0.5582, -0.0750, 0.5697, 0.0881]],
  14686. device='cuda:0', grad_fn=<AddmmBackward>)
  14687. landmarks are: tensor([[[ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  14688. 0.1608],
  14689. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  14690. 0.2468],
  14691. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  14692. 0.3371],
  14693. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  14694. 0.2365],
  14695. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  14696. 0.5612],
  14697. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  14698. 0.5702],
  14699. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  14700. 0.3315],
  14701. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  14702. 0.0774]]], device='cuda:0')
  14703. loss_train_step before backward: tensor(0.0906, device='cuda:0', grad_fn=<MseLossBackward>)
  14704. loss_train_step after backward: tensor(0.0906, device='cuda:0', grad_fn=<MseLossBackward>)
  14705. loss_train: 3.1066278582438827
  14706. step: 71
  14707. running loss: 0.043755321947096935
  14708. Train Steps: 71/90 Loss: 0.0438 torch.Size([8, 600, 800])
  14709. torch.Size([8, 8])
  14710. tensor([[0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  14711. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  14712. [0.6317, 0.4038, 0.8287, 0.5900, 0.3800, 0.4717, 0.6295, 0.4986],
  14713. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  14714. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  14715. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  14716. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  14717. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250]],
  14718. device='cuda:0', dtype=torch.float64)
  14719. predictions are: tensor([[ 0.5412, -0.4559, 1.7843, 0.0259, -0.2841, 0.1660, 0.2377, 0.1969],
  14720. [ 0.6741, -0.3356, 1.8233, -0.4519, -0.2874, -1.1560, 0.4323, 0.2217],
  14721. [ 0.7896, -0.3125, 1.7426, 0.3888, -0.6745, -0.0785, 0.5314, 0.1593],
  14722. [ 0.6071, -0.4343, 1.7290, -0.3111, -0.7544, -0.4238, 0.3074, 0.0894],
  14723. [-1.1140, -1.5608, 1.7046, -0.9713, 0.0438, -1.1867, 0.8088, 0.3351],
  14724. [ 0.4090, -0.5324, 1.3724, -0.7669, -0.7136, -0.0075, 0.4359, 0.2871],
  14725. [ 0.6645, -0.3611, 1.7667, 0.1716, -0.2005, 0.3721, 0.2576, 0.2559],
  14726. [ 0.7018, -0.3551, 1.2018, -1.1815, -0.5421, -0.9914, 0.5265, 0.1972]],
  14727. device='cuda:0', grad_fn=<AddmmBackward>)
  14728. landmarks are: tensor([[[ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  14729. 0.2622],
  14730. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  14731. 0.0171],
  14732. [ 0.6320, -0.4206, 1.5420, 0.4393, -0.5307, -0.1073, 0.6216,
  14733. 0.0171],
  14734. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  14735. -0.0611],
  14736. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  14737. 0.3799],
  14738. [ 0.5432, -0.4224, 1.3284, -0.8540, -0.6866, -0.0226, 0.4077,
  14739. 0.3177],
  14740. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  14741. 0.0592],
  14742. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  14743. 0.1390]]], device='cuda:0')
  14744. loss_train_step before backward: tensor(0.0398, device='cuda:0', grad_fn=<MseLossBackward>)
  14745. loss_train_step after backward: tensor(0.0398, device='cuda:0', grad_fn=<MseLossBackward>)
  14746. loss_train: 3.146448607556522
  14747. step: 72
  14748. running loss: 0.043700675104951694
  14749. Train Steps: 72/90 Loss: 0.0437 torch.Size([8, 600, 800])
  14750. torch.Size([8, 8])
  14751. tensor([[0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  14752. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  14753. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  14754. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  14755. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  14756. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  14757. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  14758. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633]],
  14759. device='cuda:0', dtype=torch.float64)
  14760. predictions are: tensor([[ 0.5118, -0.4524, 1.7195, -0.3490, -0.4138, -0.5709, 0.4172, 0.3501],
  14761. [ 1.0943, -0.0776, 1.6530, -0.0977, -0.2364, -0.7991, 0.5785, 0.3261],
  14762. [ 0.6776, -0.4029, 1.9237, -0.5634, -0.6072, -0.3619, 0.7648, 0.0746],
  14763. [ 1.0923, -0.1342, 1.7725, -0.4052, -0.6281, 0.1162, 0.4874, 0.1301],
  14764. [ 0.6887, -0.3659, 1.7554, 0.0926, -0.3180, 0.2316, 0.3344, 0.1946],
  14765. [ 0.6969, -0.3097, 1.6428, 0.0207, -0.5718, -0.5985, 0.2854, 0.2422],
  14766. [-2.1434, -2.2292, 1.0703, -1.2591, -0.3749, -1.2681, 0.2250, 0.1873],
  14767. [ 0.3197, -0.6014, 1.0105, -1.1921, -0.3945, -1.0479, 0.4393, 0.2994]],
  14768. device='cuda:0', grad_fn=<AddmmBackward>)
  14769. landmarks are: tensor([[[ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  14770. 0.3928],
  14771. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  14772. 0.5822],
  14773. [ 0.6077, -0.3965, 1.8480, -0.6539, -0.6231, -0.4537, 0.6216,
  14774. -0.0220],
  14775. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  14776. 0.2776],
  14777. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  14778. 0.3238],
  14779. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  14780. 0.3778],
  14781. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  14782. 0.1373],
  14783. [ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  14784. 0.3161]]], device='cuda:0')
  14785. loss_train_step before backward: tensor(0.0283, device='cuda:0', grad_fn=<MseLossBackward>)
  14786. loss_train_step after backward: tensor(0.0283, device='cuda:0', grad_fn=<MseLossBackward>)
  14787. loss_train: 3.174727371893823
  14788. step: 73
  14789. running loss: 0.043489416053340044
  14790.  
  14791. Train Steps: 73/90 Loss: 0.0435 torch.Size([8, 600, 800])
  14792. torch.Size([8, 8])
  14793. tensor([[0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  14794. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  14795. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  14796. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  14797. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  14798. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402],
  14799. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  14800. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  14801. device='cuda:0', dtype=torch.float64)
  14802. predictions are: tensor([[ 0.5926, -0.4584, 1.1286, -1.4791, -0.3460, -1.2189, 0.5719, 0.2300],
  14803. [ 0.2274, -0.6594, 1.7152, -0.5702, -0.6758, -0.4601, 0.1921, 0.1128],
  14804. [ 0.6375, -0.3545, 1.6312, -0.4032, -0.2160, -0.9396, 0.4620, 0.3717],
  14805. [ 0.2176, -0.6772, 1.8095, -0.1802, -0.4826, -0.6983, 0.5700, 0.1636],
  14806. [ 0.0604, -0.7763, 1.6917, 0.1112, -0.4883, -0.2882, 0.1321, 0.1681],
  14807. [ 0.4266, -0.5131, 1.5818, -0.1841, -0.4556, -0.1109, 0.2273, 0.2884],
  14808. [ 0.5517, -0.4476, 1.8382, -0.2390, -0.5477, -0.2693, 0.7168, 0.2239],
  14809. [ 0.4387, -0.5354, 1.6025, -0.0815, -0.5076, 0.0810, 0.6287, 0.2390]],
  14810. device='cuda:0', grad_fn=<AddmmBackward>)
  14811. landmarks are: tensor([[[ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  14812. 0.2468],
  14813. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  14814. 0.0862],
  14815. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  14816. 0.5822],
  14817. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  14818. 0.0081],
  14819. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  14820. -0.0370],
  14821. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  14822. 0.2093],
  14823. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  14824. 0.1499],
  14825. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  14826. 0.1768]]], device='cuda:0')
  14827. loss_train_step before backward: tensor(0.0268, device='cuda:0', grad_fn=<MseLossBackward>)
  14828. loss_train_step after backward: tensor(0.0268, device='cuda:0', grad_fn=<MseLossBackward>)
  14829. loss_train: 3.2015545638278127
  14830. step: 74
  14831. running loss: 0.04326425086253801
  14832. Train Steps: 74/90 Loss: 0.0433 torch.Size([8, 600, 800])
  14833. torch.Size([8, 8])
  14834. tensor([[0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  14835. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  14836. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  14837. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  14838. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  14839. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  14840. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  14841. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274]],
  14842. device='cuda:0', dtype=torch.float64)
  14843. predictions are: tensor([[ 0.4025, -0.5363, 1.6971, 0.1246, -0.1701, 0.1078, 0.2141, 0.2565],
  14844. [ 0.4167, -0.5550, 1.7186, -0.4311, -0.7491, -0.2282, 0.5160, 0.2378],
  14845. [ 0.3892, -0.5351, 1.5867, 0.4916, -0.4973, -0.3103, 0.2211, 0.4570],
  14846. [-0.0709, -0.8842, 1.3462, -1.3077, -0.3917, -1.4341, 0.6078, 0.1435],
  14847. [ 0.5810, -0.4226, 1.7171, -0.1685, -0.4232, 0.1927, 0.2545, 0.2298],
  14848. [ 0.3430, -0.6123, 1.4879, -1.0594, -0.5487, -1.2002, 0.5690, 0.0772],
  14849. [ 0.7413, -0.3250, 1.6692, -0.4937, -0.6821, 0.0267, 0.6439, 0.2146],
  14850. [ 0.1623, -0.6903, 1.6709, -0.8004, -0.1233, -1.2627, 0.6041, 0.2084]],
  14851. device='cuda:0', grad_fn=<AddmmBackward>)
  14852. landmarks are: tensor([[[ 5.5635e-01, -3.8422e-01, 1.7268e+00, 1.0054e-01, -2.4997e-02,
  14853. 3.2255e-01, 2.6581e-01, 8.6245e-02],
  14854. [ 5.7783e-01, -4.3934e-01, 1.8018e+00, -4.6143e-01, -6.6928e-01,
  14855. -1.3811e-01, 5.4896e-01, 2.0831e-01],
  14856. [ 6.0381e-01, -3.4642e-01, 1.7037e+00, 3.9307e-01, -4.4411e-01,
  14857. -2.6128e-01, 3.0069e-01, 4.6236e-01],
  14858. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  14859. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  14860. [ 5.4990e-01, -4.2249e-01, 1.8018e+00, -2.9207e-01, -3.0554e-01,
  14861. 5.4350e-02, 4.0462e-01, 2.6990e-01],
  14862. [ 6.0421e-01, -4.2248e-01, 1.5420e+00, -1.2082e+00, -4.7298e-01,
  14863. -1.0311e+00, 6.3800e-01, -2.1963e-02],
  14864. [ 6.0098e-01, -3.8961e-01, 1.7326e+00, -5.6921e-01, -6.2887e-01,
  14865. 8.1601e-03, 5.0277e-01, 1.0054e-01],
  14866. [ 6.5365e-01, -3.7194e-01, 1.6979e+00, -8.6174e-01, -1.6859e-02,
  14867. -1.3621e+00, 6.9257e-01, 1.5008e-01]]], device='cuda:0')
  14868. loss_train_step before backward: tensor(0.0287, device='cuda:0', grad_fn=<MseLossBackward>)
  14869. loss_train_step after backward: tensor(0.0287, device='cuda:0', grad_fn=<MseLossBackward>)
  14870. loss_train: 3.2302527902647853
  14871. step: 75
  14872. running loss: 0.04307003720353047
  14873. Train Steps: 75/90 Loss: 0.0431 torch.Size([8, 600, 800])
  14874. torch.Size([8, 8])
  14875. tensor([[ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  14876. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  14877. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  14878. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  14879. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  14880. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  14881. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  14882. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290]],
  14883. device='cuda:0', dtype=torch.float64)
  14884. predictions are: tensor([[-1.8661, -2.0538, 1.2785, -0.8249, -0.6488, -0.8578, 0.1658, 0.2023],
  14885. [ 0.6903, -0.3068, 1.8189, 0.1420, -0.4976, -0.8075, 0.3031, 0.2389],
  14886. [ 0.7957, -0.2790, 1.3134, -0.9248, -0.5435, -0.9453, 0.2031, 0.1206],
  14887. [ 0.9262, -0.2276, 1.8351, 0.1683, -0.3136, 0.3725, 0.7447, 0.2883],
  14888. [ 0.6961, -0.3637, 1.4982, -1.0795, -0.2947, -1.1262, 0.6684, 0.2113],
  14889. [-0.1521, -0.8515, 1.1088, -1.1953, -0.3039, -1.4054, 0.2218, 0.2412],
  14890. [ 0.8814, -0.2470, 1.7744, 0.1652, -0.3566, 0.0847, 0.4990, 0.2598],
  14891. [ 0.7957, -0.3254, 1.6967, -0.7133, -0.7268, -0.3437, 0.6567, 0.1718]],
  14892. device='cuda:0', grad_fn=<AddmmBackward>)
  14893. landmarks are: tensor([[[-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  14894. 0.2837],
  14895. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  14896. 0.1852],
  14897. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  14898. -0.1031],
  14899. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  14900. 0.1661],
  14901. [ 0.6141, -0.4153, 1.4208, -1.2697, -0.2940, -1.0234, 0.8644,
  14902. 0.1715],
  14903. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  14904. 0.1343],
  14905. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  14906. 0.1627],
  14907. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  14908. 0.1576]]], device='cuda:0')
  14909. loss_train_step before backward: tensor(0.0314, device='cuda:0', grad_fn=<MseLossBackward>)
  14910. loss_train_step after backward: tensor(0.0314, device='cuda:0', grad_fn=<MseLossBackward>)
  14911. loss_train: 3.2616537315770984
  14912. step: 76
  14913. running loss: 0.042916496468119715
  14914. Train Steps: 76/90 Loss: 0.0429 torch.Size([8, 600, 800])
  14915. torch.Size([8, 8])
  14916. tensor([[0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  14917. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  14918. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  14919. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  14920. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  14921. [0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954],
  14922. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  14923. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083]],
  14924. device='cuda:0', dtype=torch.float64)
  14925. predictions are: tensor([[ 0.5106, -0.4525, 1.8837, 0.1418, -0.5735, -0.5365, 0.4087, 0.0735],
  14926. [ 0.7139, -0.3620, 1.7725, 0.1793, -0.4467, 0.1089, 0.4679, 0.1903],
  14927. [ 0.2135, -0.6826, 1.3965, -1.3342, -0.2621, -1.3666, 0.6790, 0.1654],
  14928. [ 0.5085, -0.4804, 1.4542, -1.1903, -0.2808, -1.1662, 0.6581, 0.2043],
  14929. [ 0.0263, -0.7549, 0.9504, -1.1005, -0.4628, -1.2502, 0.0552, 0.2227],
  14930. [ 0.5397, -0.4609, 1.7287, -0.2117, -0.5355, -0.0586, 0.2339, 0.0983],
  14931. [ 0.2517, -0.6470, 1.7428, 0.1414, -0.4972, -0.3696, 0.7320, 0.2673],
  14932. [ 0.2752, -0.5864, 1.6242, -0.6104, -0.6357, -0.2963, 0.3731, 0.3826]],
  14933. device='cuda:0', grad_fn=<AddmmBackward>)
  14934. landmarks are: tensor([[[ 6.2730e-01, -4.1045e-01, 1.8480e+00, 1.0824e-01, -5.5381e-01,
  14935. -5.0762e-01, 6.4140e-01, -4.8817e-03],
  14936. [ 5.9082e-01, -4.3664e-01, 1.7557e+00, 1.3903e-01, -5.1917e-01,
  14937. 1.3133e-01, 6.5289e-01, 2.3557e-02],
  14938. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  14939. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  14940. [ 6.1413e-01, -4.1527e-01, 1.4208e+00, -1.2697e+00, -2.9400e-01,
  14941. -1.0234e+00, 8.6439e-01, 1.7146e-01],
  14942. [ 5.4700e-01, -4.0808e-01, 8.4919e-01, -1.0773e+00, -5.3072e-01,
  14943. -1.1620e+00, 9.1240e-02, 1.8903e-01],
  14944. [ 5.2269e-01, -4.6151e-01, 1.6575e+00, -1.3041e-01, -5.0762e-01,
  14945. -1.4935e-02, 1.8150e-01, 2.0831e-03],
  14946. [ 6.2236e-01, -4.0323e-01, 1.5940e+00, 2.9299e-01, -5.7691e-01,
  14947. -2.6898e-01, 8.8998e-01, 2.5161e-01],
  14948. [ 5.7742e-01, -3.8684e-01, 1.6286e+00, -5.6921e-01, -6.4619e-01,
  14949. -2.7667e-01, 5.1432e-01, 5.2394e-01]]], device='cuda:0')
  14950. loss_train_step before backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  14951. loss_train_step after backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  14952. loss_train: 3.2847120529040694
  14953. step: 77
  14954. running loss: 0.04265859808966324
  14955.  
  14956. Train Steps: 77/90 Loss: 0.0427 torch.Size([8, 600, 800])
  14957. torch.Size([8, 8])
  14958. tensor([[0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  14959. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  14960. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  14961. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  14962. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  14963. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  14964. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  14965. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850]],
  14966. device='cuda:0', dtype=torch.float64)
  14967. predictions are: tensor([[ 0.3915, -0.5025, 1.7193, -0.3797, -0.6087, -1.2569, 0.5107, 0.0821],
  14968. [ 0.4523, -0.4895, 1.5831, -0.5257, -0.6798, -0.7597, 0.3999, 0.1821],
  14969. [ 0.3838, -0.5686, 1.6145, -0.2962, -0.6730, -0.5379, 0.5283, 0.3127],
  14970. [ 0.1110, -0.6749, 1.5092, -0.0243, -0.5125, -0.6090, 0.4088, 0.3631],
  14971. [ 0.3467, -0.5665, 1.6822, -0.2644, -0.0797, -0.4045, 0.2067, 0.1177],
  14972. [ 0.7551, -0.3455, 1.6826, -0.6358, -0.4583, 0.0169, 0.7260, 0.1225],
  14973. [ 0.3825, -0.5697, 1.6859, -0.4049, -0.2606, -0.2820, 0.3845, 0.1126],
  14974. [ 0.4185, -0.5269, 1.6859, -0.5249, -0.1563, -0.1265, 0.5731, 0.2411]],
  14975. device='cuda:0', grad_fn=<AddmmBackward>)
  14976. landmarks are: tensor([[[ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  14977. 0.1852],
  14978. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  14979. 0.2853],
  14980. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  14981. 0.5239],
  14982. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  14983. 0.4470],
  14984. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  14985. 0.0532],
  14986. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  14987. 0.2622],
  14988. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  14989. 0.2622],
  14990. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  14991. 0.4162]]], device='cuda:0')
  14992. loss_train_step before backward: tensor(0.0481, device='cuda:0', grad_fn=<MseLossBackward>)
  14993. loss_train_step after backward: tensor(0.0481, device='cuda:0', grad_fn=<MseLossBackward>)
  14994. loss_train: 3.33284895028919
  14995. step: 78
  14996. running loss: 0.042728832696015254
  14997. Train Steps: 78/90 Loss: 0.0427 torch.Size([8, 600, 800])
  14998. torch.Size([8, 8])
  14999. tensor([[0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  15000. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456],
  15001. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  15002. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  15003. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  15004. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583],
  15005. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  15006. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413]],
  15007. device='cuda:0', dtype=torch.float64)
  15008. predictions are: tensor([[ 1.4889, 0.1334, 1.8088, -0.1667, -0.6862, -0.3736, 0.5403, 0.0498],
  15009. [ 1.3320, 0.0668, 1.7552, 0.3750, -0.3791, 0.2351, 0.4607, 0.2350],
  15010. [-1.3916, -1.6578, 0.9473, -1.2229, -0.4628, -1.2002, 0.2467, 0.2536],
  15011. [ 0.9997, -0.1110, 1.7093, -0.5094, -0.6704, -0.7536, 0.3662, 0.0959],
  15012. [ 0.9938, -0.1120, 1.7601, 0.2227, -0.2643, 0.1579, 0.2913, 0.1372],
  15013. [-0.9061, -1.3098, 0.9455, -1.1612, -0.3852, -1.3221, 0.2039, 0.2837],
  15014. [-1.6012, -1.8199, 1.1570, -1.0037, -0.5747, -1.0591, 0.2236, 0.2229],
  15015. [ 1.1578, -0.0632, 1.7333, -1.0920, 0.0493, -1.0529, 1.2628, 0.2168]],
  15016. device='cuda:0', grad_fn=<AddmmBackward>)
  15017. landmarks are: tensor([[[ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  15018. -0.0611],
  15019. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  15020. 0.2341],
  15021. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  15022. 0.2930],
  15023. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  15024. -0.0340],
  15025. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  15026. 0.0682],
  15027. [-2.2859, -2.2859, 0.9922, -1.2021, -0.3229, -1.4314, 0.1044,
  15028. 0.2930],
  15029. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  15030. 0.3161],
  15031. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  15032. 0.2142]]], device='cuda:0')
  15033. loss_train_step before backward: tensor(0.1332, device='cuda:0', grad_fn=<MseLossBackward>)
  15034. loss_train_step after backward: tensor(0.1332, device='cuda:0', grad_fn=<MseLossBackward>)
  15035. loss_train: 3.4660702189430594
  15036. step: 79
  15037. running loss: 0.043874306568899485
  15038. Train Steps: 79/90 Loss: 0.0439 torch.Size([8, 600, 800])
  15039. torch.Size([8, 8])
  15040. tensor([[0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  15041. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  15042. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  15043. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  15044. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  15045. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  15046. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  15047. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700]],
  15048. device='cuda:0', dtype=torch.float64)
  15049. predictions are: tensor([[ 0.4458, -0.5032, 1.5592, 0.0993, -0.4399, -0.3817, 0.4723, 0.1310],
  15050. [ 0.7403, -0.2708, 1.5286, -0.8189, -0.5177, -0.9784, 0.4248, 0.1831],
  15051. [ 0.1945, -0.5920, 1.5142, -0.3926, -0.6283, -0.8031, 0.0536, 0.2479],
  15052. [ 0.6446, -0.3842, 1.5927, -0.0636, -0.3261, -0.2536, 0.5394, 0.1778],
  15053. [ 0.1360, -0.7198, 1.8964, -0.9149, -0.2398, -0.8776, 1.0256, 0.1518],
  15054. [ 0.2770, -0.6113, 1.6559, -0.1666, -0.4320, -0.4876, 0.1736, 0.1383],
  15055. [ 0.2104, -0.6595, 1.6697, -0.1950, -0.4642, -0.4355, 0.3429, 0.0977],
  15056. [ 0.4589, -0.4922, 1.5949, -0.6927, -0.3965, 0.1450, 0.6767, 0.2705]],
  15057. device='cuda:0', grad_fn=<AddmmBackward>)
  15058. landmarks are: tensor([[[ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  15059. -0.1492],
  15060. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  15061. 0.1621],
  15062. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  15063. 0.4357],
  15064. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  15065. 0.0697],
  15066. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  15067. 0.2676],
  15068. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  15069. 0.1854],
  15070. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  15071. 0.0313],
  15072. [ 0.5671, -0.3988, 1.7499, -0.4614, -0.5423, 0.3007, 0.5894,
  15073. 0.3469]]], device='cuda:0')
  15074. loss_train_step before backward: tensor(0.0359, device='cuda:0', grad_fn=<MseLossBackward>)
  15075. loss_train_step after backward: tensor(0.0359, device='cuda:0', grad_fn=<MseLossBackward>)
  15076. loss_train: 3.502012967132032
  15077. step: 80
  15078. running loss: 0.0437751620891504
  15079. Train Steps: 80/90 Loss: 0.0438 torch.Size([8, 600, 800])
  15080. torch.Size([8, 8])
  15081. tensor([[0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  15082. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  15083. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  15084. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  15085. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  15086. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  15087. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  15088. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973]],
  15089. device='cuda:0', dtype=torch.float64)
  15090. predictions are: tensor([[ 0.4675, -0.4482, 1.5720, -0.3319, -0.5601, -0.4890, 0.3313, 0.2283],
  15091. [ 0.4698, -0.4146, 1.3785, -1.0504, -0.3257, -1.3054, 0.3977, 0.1078],
  15092. [ 0.1245, -0.6607, 1.5465, -0.6004, -0.4580, -1.0717, 0.1884, 0.1108],
  15093. [ 0.6066, -0.3798, 1.5851, -0.5191, -0.5383, -0.1436, 0.3088, 0.0781],
  15094. [ 0.0988, -0.7262, 1.8452, -0.4678, -0.2128, -0.6663, 1.0411, 0.2591],
  15095. [ 0.5097, -0.4873, 1.5568, -0.0783, -0.3597, 0.2482, 0.9797, 0.3026],
  15096. [ 0.5244, -0.4431, 1.5430, 0.2526, -0.2678, -0.0672, 0.1750, 0.1631],
  15097. [-0.1690, -0.8363, 1.3229, -0.9650, -0.4343, -1.2110, 0.2810, 0.0549]],
  15098. device='cuda:0', grad_fn=<AddmmBackward>)
  15099. landmarks are: tensor([[[ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  15100. 0.2853],
  15101. [ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  15102. 0.2134],
  15103. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  15104. 0.0021],
  15105. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  15106. 0.0502],
  15107. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  15108. 0.4600],
  15109. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  15110. 0.3425],
  15111. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  15112. -0.0610],
  15113. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  15114. 0.0111]]], device='cuda:0')
  15115. loss_train_step before backward: tensor(0.0330, device='cuda:0', grad_fn=<MseLossBackward>)
  15116. loss_train_step after backward: tensor(0.0330, device='cuda:0', grad_fn=<MseLossBackward>)
  15117. loss_train: 3.53500113543123
  15118. step: 81
  15119. running loss: 0.043641989326311484
  15120.  
  15121. Train Steps: 81/90 Loss: 0.0436 torch.Size([8, 600, 800])
  15122. torch.Size([8, 8])
  15123. tensor([[0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  15124. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  15125. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  15126. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  15127. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  15128. [0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637],
  15129. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  15130. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136]],
  15131. device='cuda:0', dtype=torch.float64)
  15132. predictions are: tensor([[ 0.2931, -0.5850, 1.3665, -1.0628, -0.4258, -1.0431, 0.5518, 0.2436],
  15133. [ 0.7559, -0.2991, 1.5757, -1.0323, -0.1496, -1.3116, 0.6911, 0.1442],
  15134. [ 0.7068, -0.3175, 1.2592, -1.1584, -0.2464, -1.3062, 0.4130, 0.1583],
  15135. [ 0.2576, -0.6200, 1.7675, 0.3444, -0.5498, 0.0901, 0.4331, 0.1720],
  15136. [ 0.3448, -0.5905, 1.7996, 0.2079, -0.4959, 0.1073, 0.7317, 0.1350],
  15137. [-0.2655, -0.9400, 1.5480, -0.6480, -0.6969, -0.6634, 0.2014, 0.1471],
  15138. [ 0.2986, -0.5727, 1.7204, 0.2381, -0.0618, 0.0382, 0.2197, 0.1804],
  15139. [ 0.2452, -0.6121, 1.0176, -1.1555, -0.5223, -1.0575, 0.2831, 0.1055]],
  15140. device='cuda:0', grad_fn=<AddmmBackward>)
  15141. landmarks are: tensor([[[ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  15142. 0.3315],
  15143. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  15144. 0.0851],
  15145. [ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  15146. 0.1545],
  15147. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  15148. 0.1544],
  15149. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  15150. 0.0851],
  15151. [ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  15152. 0.3177],
  15153. [ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  15154. 0.1544],
  15155. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  15156. 0.0862]]], device='cuda:0')
  15157. loss_train_step before backward: tensor(0.0293, device='cuda:0', grad_fn=<MseLossBackward>)
  15158. loss_train_step after backward: tensor(0.0293, device='cuda:0', grad_fn=<MseLossBackward>)
  15159. loss_train: 3.564255858771503
  15160. step: 82
  15161. running loss: 0.04346653486306711
  15162. Train Steps: 82/90 Loss: 0.0435 torch.Size([8, 600, 800])
  15163. torch.Size([8, 8])
  15164. tensor([[0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  15165. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  15166. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  15167. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  15168. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  15169. [0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  15170. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  15171. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217]],
  15172. device='cuda:0', dtype=torch.float64)
  15173. predictions are: tensor([[ 0.9934, -0.1945, 1.8464, -0.3701, -0.3761, -0.5561, 0.9081, 0.0323],
  15174. [ 1.0571, -0.0771, 1.3978, -0.8396, -0.1539, -1.1052, 0.5071, 0.1309],
  15175. [-1.6352, -1.8696, 1.1451, -0.8900, -0.4603, -0.8711, 0.1760, 0.1800],
  15176. [ 0.6482, -0.3183, 1.6749, -0.8900, -0.1365, -0.8788, 0.6645, 0.0612],
  15177. [-1.4340, -1.7223, 0.8990, -1.0310, -0.4178, -1.1867, 0.1727, 0.2790],
  15178. [ 0.7065, -0.3046, 1.7416, 0.1067, -0.4849, 0.2435, 0.4102, 0.1512],
  15179. [ 0.6215, -0.3323, 1.6901, -0.1141, -0.5998, -0.5355, 0.1440, 0.1141],
  15180. [ 0.9429, -0.1613, 1.1300, -0.8821, -0.3557, -0.9696, 0.4113, 0.3535]],
  15181. device='cuda:0', grad_fn=<AddmmBackward>)
  15182. landmarks are: tensor([[[ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  15183. 0.1821],
  15184. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  15185. 0.2237],
  15186. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  15187. 0.2853],
  15188. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  15189. -0.0209],
  15190. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  15191. 0.2699],
  15192. [ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  15193. 0.2296],
  15194. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  15195. 0.2837],
  15196. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  15197. 0.5855]]], device='cuda:0')
  15198. loss_train_step before backward: tensor(0.0665, device='cuda:0', grad_fn=<MseLossBackward>)
  15199. loss_train_step after backward: tensor(0.0665, device='cuda:0', grad_fn=<MseLossBackward>)
  15200. loss_train: 3.630719925276935
  15201. step: 83
  15202. running loss: 0.043743613557553435
  15203. Train Steps: 83/90 Loss: 0.0437 torch.Size([8, 600, 800])
  15204. torch.Size([8, 8])
  15205. tensor([[0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  15206. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  15207. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  15208. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  15209. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  15210. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  15211. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  15212. [0.6199, 0.4065, 0.7598, 0.2385, 0.4317, 0.1981, 0.5933, 0.5221]],
  15213. device='cuda:0', dtype=torch.float64)
  15214. predictions are: tensor([[ 1.1672, -0.0103, 1.4356, -0.7056, -0.6808, -0.2443, 0.4589, 0.0789],
  15215. [ 1.2498, 0.1052, 1.4687, -0.1174, -0.2292, -0.6798, 0.1431, 0.2818],
  15216. [-1.0567, -1.4895, 1.6280, -0.8708, 0.0069, -0.7950, 0.9648, 0.2630],
  15217. [-0.4714, -1.0502, 1.8932, -0.3346, -0.0877, -0.7876, 0.8404, 0.2231],
  15218. [-1.2858, -1.5904, 1.0354, -0.9126, -0.5178, -1.0090, 0.1041, 0.1625],
  15219. [ 1.2956, 0.0862, 1.2792, -0.7547, -0.2526, -1.0581, 0.2798, 0.0854],
  15220. [-1.0856, -1.4630, 1.2056, -0.8829, -0.5616, -0.7047, 0.3875, 0.2448],
  15221. [ 1.5989, 0.2509, 1.3222, -0.8339, -0.3640, -0.9206, 0.3607, 0.0468]],
  15222. device='cuda:0', grad_fn=<AddmmBackward>)
  15223. landmarks are: tensor([[[ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  15224. 0.2237],
  15225. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  15226. 0.5882],
  15227. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  15228. 0.3371],
  15229. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  15230. 0.3478],
  15231. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  15232. 0.3238],
  15233. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  15234. 0.2442],
  15235. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  15236. 0.3315],
  15237. [ 0.5774, -0.4082, 1.2235, -1.1844, -0.2919, -1.3709, 0.4544,
  15238. 0.1256]]], device='cuda:0')
  15239. loss_train_step before backward: tensor(0.2647, device='cuda:0', grad_fn=<MseLossBackward>)
  15240. loss_train_step after backward: tensor(0.2647, device='cuda:0', grad_fn=<MseLossBackward>)
  15241. loss_train: 3.8954066587612033
  15242. step: 84
  15243. running loss: 0.04637388879477623
  15244. Train Steps: 84/90 Loss: 0.0464 torch.Size([8, 600, 800])
  15245. torch.Size([8, 8])
  15246. tensor([[0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  15247. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  15248. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  15249. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  15250. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  15251. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  15252. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  15253. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207]],
  15254. device='cuda:0', dtype=torch.float64)
  15255. predictions are: tensor([[ 0.0092, -0.7831, 1.4251, -0.8901, -0.6195, -0.3991, 0.4450, 0.2552],
  15256. [ 0.1866, -0.6944, 1.7594, -0.0529, -0.4564, 0.0751, 0.3812, 0.1549],
  15257. [ 0.4072, -0.4985, 1.0225, -1.0642, -0.3926, -1.3225, 0.2822, 0.2517],
  15258. [-0.3008, -0.9750, 1.1834, -1.0713, -0.5787, -0.8064, 0.1357, 0.1497],
  15259. [ 0.4684, -0.5414, 1.8716, 0.1877, -0.3996, 0.2120, 0.9094, 0.1500],
  15260. [ 0.7999, -0.2541, 1.8295, -0.6501, -0.4471, -1.0200, 0.4277, 0.0413],
  15261. [ 0.4781, -0.4347, 1.6580, 0.4612, 0.0516, -0.3173, 0.2600, 0.3793],
  15262. [ 0.3030, -0.6041, 1.5122, -1.0825, -0.1982, -1.4243, 0.6538, 0.1128]],
  15263. device='cuda:0', grad_fn=<AddmmBackward>)
  15264. landmarks are: tensor([[[ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  15265. 0.2776],
  15266. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  15267. 0.1929],
  15268. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  15269. 0.2391],
  15270. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  15271. 0.0442],
  15272. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  15273. 0.2196],
  15274. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  15275. 0.1000],
  15276. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  15277. 0.4547],
  15278. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  15279. 0.1193]]], device='cuda:0')
  15280. loss_train_step before backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  15281. loss_train_step after backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  15282. loss_train: 3.9328551990911365
  15283. step: 85
  15284. running loss: 0.04626888469518984
  15285.  
  15286. Train Steps: 85/90 Loss: 0.0463 torch.Size([8, 600, 800])
  15287. torch.Size([8, 8])
  15288. tensor([[0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  15289. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  15290. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  15291. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  15292. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  15293. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  15294. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  15295. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552]],
  15296. device='cuda:0', dtype=torch.float64)
  15297. predictions are: tensor([[ 0.3836, -0.5184, 1.6498, 0.0154, -0.1134, 0.1239, 0.3044, 0.1965],
  15298. [ 0.4918, -0.4554, 1.6638, 0.0633, -0.2440, 0.0597, 0.2894, 0.1129],
  15299. [ 0.7150, -0.2920, 1.2913, -1.2055, -0.1567, -1.4490, 0.4141, 0.1894],
  15300. [ 0.7872, -0.2240, 1.7332, -0.0770, -0.4979, -1.0182, 0.3480, 0.1206],
  15301. [ 0.5916, -0.3943, 1.0506, -1.1736, -0.5250, -1.0944, 0.4367, 0.2910],
  15302. [ 0.5973, -0.3884, 1.6319, 0.2809, -0.4084, 0.0409, 0.4515, 0.2362],
  15303. [ 0.1417, -0.6834, 1.4807, -0.8859, -0.7096, -0.4316, 0.4162, 0.2001],
  15304. [-2.0467, -2.1798, 1.6085, -1.1863, -0.0272, -1.3415, 0.9383, 0.2650]],
  15305. device='cuda:0', grad_fn=<AddmmBackward>)
  15306. landmarks are: tensor([[[ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  15307. 0.0592],
  15308. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  15309. 0.0082],
  15310. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  15311. 0.1850],
  15312. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  15313. 0.1852],
  15314. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  15315. 0.3700],
  15316. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  15317. 0.3161],
  15318. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  15319. 0.2391],
  15320. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  15321. 0.2783]]], device='cuda:0')
  15322. loss_train_step before backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  15323. loss_train_step after backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  15324. loss_train: 3.9474326334893703
  15325. step: 86
  15326. running loss: 0.04590037945917873
  15327. Train Steps: 86/90 Loss: 0.0459 torch.Size([8, 600, 800])
  15328. torch.Size([8, 8])
  15329. tensor([[0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  15330. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  15331. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  15332. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  15333. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  15334. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  15335. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  15336. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400]],
  15337. device='cuda:0', dtype=torch.float64)
  15338. predictions are: tensor([[ 0.3863, -0.5068, 1.3909, -1.0064, -0.0798, -1.3737, 0.4426, 0.1917],
  15339. [ 0.0985, -0.7115, 1.3916, -1.2851, -0.0720, -1.3754, 0.7241, 0.2478],
  15340. [ 0.3931, -0.5064, 1.5499, -0.4864, -0.6317, -0.7154, 0.0686, 0.1628],
  15341. [ 0.2412, -0.6454, 1.5829, 0.1082, -0.1753, 0.0653, 0.2417, 0.1627],
  15342. [ 0.0780, -0.7639, 1.7483, -0.3355, -0.5922, -0.1877, 0.5523, 0.0529],
  15343. [ 0.2777, -0.6107, 1.5568, 0.3643, -0.1859, -0.3246, 0.4243, 0.4047],
  15344. [ 0.1649, -0.6641, 1.2672, -1.1711, -0.3359, -1.0829, 0.6421, 0.2771],
  15345. [-0.1123, -0.8771, 1.6413, -0.5845, -0.6554, -0.2488, 0.6509, 0.2595]],
  15346. device='cuda:0', grad_fn=<AddmmBackward>)
  15347. landmarks are: tensor([[[ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  15348. 0.2083],
  15349. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  15350. 0.2083],
  15351. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  15352. 0.2567],
  15353. [ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  15354. 0.0261],
  15355. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  15356. -0.0670],
  15357. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  15358. 0.4470],
  15359. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  15360. 0.2160],
  15361. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  15362. 0.2083]]], device='cuda:0')
  15363. loss_train_step before backward: tensor(0.0403, device='cuda:0', grad_fn=<MseLossBackward>)
  15364. loss_train_step after backward: tensor(0.0403, device='cuda:0', grad_fn=<MseLossBackward>)
  15365. loss_train: 3.9877162650227547
  15366. step: 87
  15367. running loss: 0.04583581913819258
  15368. Train Steps: 87/90 Loss: 0.0458 torch.Size([8, 600, 800])
  15369. torch.Size([8, 8])
  15370. tensor([[0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  15371. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  15372. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  15373. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  15374. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  15375. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  15376. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  15377. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896]],
  15378. device='cuda:0', dtype=torch.float64)
  15379. predictions are: tensor([[ 0.1744, -0.6968, 1.5299, -1.1521, -0.1250, -1.4734, 0.6400, 0.1067],
  15380. [ 0.4351, -0.5575, 1.7017, 0.2760, -0.1643, 0.3751, 0.4155, 0.1889],
  15381. [-0.1450, -0.9232, 1.6934, -1.1407, -0.0424, -1.2464, 1.1251, 0.2949],
  15382. [ 0.1820, -0.6939, 1.7591, -0.4505, -0.2610, -1.0295, 0.6851, 0.1865],
  15383. [ 0.4787, -0.4771, 1.3901, -0.4078, -0.5066, -0.3232, 0.0269, 0.1471],
  15384. [ 0.1439, -0.7145, 1.1538, -1.0634, -0.5412, -0.6070, 0.4496, 0.3232],
  15385. [ 0.1047, -0.7455, 1.5241, -0.7351, -0.6339, -0.3523, 0.4122, 0.2333],
  15386. [ 0.3210, -0.5923, 1.4436, -0.4391, -0.5093, -0.9542, 0.0538, 0.3497]],
  15387. device='cuda:0', grad_fn=<AddmmBackward>)
  15388. landmarks are: tensor([[[ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  15389. -0.0583],
  15390. [ 0.5450, -0.4706, 1.7643, 0.0722, -0.3708, 0.3200, 0.4854,
  15391. 0.0612],
  15392. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  15393. 0.2944],
  15394. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  15395. 0.2035],
  15396. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  15397. 0.1552],
  15398. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  15399. 0.3546],
  15400. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  15401. 0.2391],
  15402. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  15403. 0.4374]]], device='cuda:0')
  15404. loss_train_step before backward: tensor(0.0404, device='cuda:0', grad_fn=<MseLossBackward>)
  15405. loss_train_step after backward: tensor(0.0404, device='cuda:0', grad_fn=<MseLossBackward>)
  15406. loss_train: 4.0281651839613914
  15407. step: 88
  15408. running loss: 0.04577460436319763
  15409. Train Steps: 88/90 Loss: 0.0458 torch.Size([8, 600, 800])
  15410. torch.Size([8, 8])
  15411. tensor([[0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  15412. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240],
  15413. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  15414. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  15415. [0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947],
  15416. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  15417. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  15418. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100]],
  15419. device='cuda:0', dtype=torch.float64)
  15420. predictions are: tensor([[ 0.1915, -0.6440, 1.4687, -0.5500, -0.6943, -0.3780, 0.1095, 0.2380],
  15421. [ 0.3804, -0.5327, 1.4882, -1.2403, -0.1517, -1.4743, 0.5692, 0.2154],
  15422. [-0.0196, -0.8108, 1.5399, -0.0779, -0.3252, 0.0614, 0.3196, 0.2752],
  15423. [ 0.3610, -0.5834, 1.6524, -0.2101, -0.6242, -0.3816, 0.5197, 0.1405],
  15424. [ 0.4290, -0.5124, 1.3662, -1.4068, -0.0729, -1.5972, 0.5732, 0.2222],
  15425. [ 0.1196, -0.7140, 1.5856, -0.2194, -0.1171, -0.0294, 0.3316, 0.3566],
  15426. [ 0.1048, -0.7306, 1.9049, -0.7238, -0.1563, -1.2254, 0.9249, 0.1957],
  15427. [ 0.2424, -0.6750, 1.5581, 0.0550, -0.4404, -0.0346, 0.5450, 0.2040]],
  15428. device='cuda:0', grad_fn=<AddmmBackward>)
  15429. landmarks are: tensor([[[ 5.3672e-01, -4.2941e-01, 1.5709e+00, -4.9992e-01, -6.6928e-01,
  15430. -3.0747e-01, 2.4546e-01, 3.5585e-01],
  15431. [ 6.0878e-01, -4.0146e-01, 1.6113e+00, -1.0696e+00, -8.6143e-02,
  15432. -1.4545e+00, 6.0510e-01, 1.3434e-01],
  15433. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  15434. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  15435. [ 6.1742e-01, -4.4897e-01, 1.8885e+00, -9.9615e-02, -4.8453e-01,
  15436. -3.6905e-01, 9.8137e-01, 1.7146e-01],
  15437. [ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  15438. -1.5777e+00, 6.0099e-01, -9.2270e-04],
  15439. [ 5.5052e-01, -4.2071e-01, 1.7095e+00, -5.3426e-02, -5.0936e-02,
  15440. 1.0502e-01, 3.8730e-01, 3.0069e-01],
  15441. [ 6.1083e-01, -4.2008e-01, 1.9346e+00, -5.5381e-01, -1.4965e-01,
  15442. -1.0773e+00, 1.0545e+00, 2.1421e-01],
  15443. [ 6.2361e-01, -4.3441e-01, 1.6171e+00, 1.8522e-01, -3.4018e-01,
  15444. 2.3557e-02, 6.4711e-01, 6.9746e-02]]], device='cuda:0')
  15445. loss_train_step before backward: tensor(0.0387, device='cuda:0', grad_fn=<MseLossBackward>)
  15446. loss_train_step after backward: tensor(0.0387, device='cuda:0', grad_fn=<MseLossBackward>)
  15447. loss_train: 4.066847592592239
  15448. step: 89
  15449. running loss: 0.04569491677069932
  15450.  
  15451. Train Steps: 89/90 Loss: 0.0457 torch.Size([8, 600, 800])
  15452. torch.Size([8, 8])
  15453. tensor([[0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  15454. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  15455. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  15456. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  15457. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  15458. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  15459. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  15460. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600]],
  15461. device='cuda:0', dtype=torch.float64)
  15462. predictions are: tensor([[ 0.2890, -0.5716, 1.3113, -1.2958, -0.1987, -1.5838, 0.4590, 0.2383],
  15463. [ 0.2683, -0.5812, 1.4407, -1.0742, -0.1550, -1.5367, 0.4240, 0.2070],
  15464. [ 0.4971, -0.4523, 1.5860, -0.8335, -0.6447, -0.9323, 0.5781, 0.2279],
  15465. [ 0.2467, -0.6203, 1.7023, -0.1982, -0.2799, -0.1041, 0.2939, 0.1046],
  15466. [ 0.2707, -0.6597, 1.7397, -0.2222, -0.5196, 0.0379, 0.8742, 0.2198],
  15467. [ 0.2934, -0.6259, 1.6778, -0.0822, -0.4994, -0.3037, 0.4800, 0.2324],
  15468. [ 0.1104, -0.7315, 1.6631, -0.0197, -0.1773, -0.1624, 0.3443, 0.3367],
  15469. [ 0.1810, -0.6591, 1.6120, -0.3214, -0.1508, -0.0314, 0.4300, 0.3403]],
  15470. device='cuda:0', grad_fn=<AddmmBackward>)
  15471. landmarks are: tensor([[[ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  15472. 0.1850],
  15473. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  15474. 0.2083],
  15475. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  15476. 0.2083],
  15477. [ 0.5249, -0.4473, 1.7326, -0.0919, -0.2016, 0.1544, 0.1733,
  15478. 0.0412],
  15479. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  15480. 0.1004],
  15481. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  15482. 0.3777],
  15483. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  15484. 0.4171],
  15485. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  15486. 0.3007]]], device='cuda:0')
  15487. loss_train_step before backward: tensor(0.0306, device='cuda:0', grad_fn=<MseLossBackward>)
  15488. loss_train_step after backward: tensor(0.0306, device='cuda:0', grad_fn=<MseLossBackward>)
  15489. loss_train: 4.097452521324158
  15490. step: 90
  15491. running loss: 0.04552725023693509
  15492. Valid Steps: 10/10 Loss: nan 5.8477
  15493. --------------------------------------------------
  15494. Epoch: 4 Train Loss: 0.0455 Valid Loss: nan
  15495. --------------------------------------------------
  15496. size of train loader is: 90
  15497. torch.Size([8, 600, 800])
  15498. torch.Size([8, 8])
  15499. tensor([[0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954],
  15500. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  15501. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  15502. [0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  15503. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  15504. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  15505. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  15506. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999]],
  15507. device='cuda:0', dtype=torch.float64)
  15508. predictions are: tensor([[ 3.4651e-01, -5.8417e-01, 1.7318e+00, -5.1866e-01, -5.5468e-01,
  15509. -4.1584e-01, 3.5147e-01, 5.9733e-02],
  15510. [ 2.0160e-01, -6.7345e-01, 1.7936e+00, -4.8521e-01, -6.1855e-02,
  15511. -4.0095e-01, 5.5372e-01, 2.8475e-01],
  15512. [ 4.4827e-01, -4.2845e-01, 1.4146e+00, -5.0683e-01, -5.0848e-01,
  15513. -1.2103e+00, 2.3973e-01, 5.2721e-01],
  15514. [ 5.1592e-01, -4.7822e-01, 1.7209e+00, -1.5612e-01, -4.5384e-01,
  15515. -2.8481e-01, 7.0564e-01, 1.2522e-01],
  15516. [ 7.6344e-01, -2.9085e-01, 1.7067e+00, 8.7751e-04, -4.5148e-01,
  15517. -2.4599e-01, 6.7884e-01, 2.8083e-01],
  15518. [ 2.3650e-01, -6.3350e-01, 1.7368e+00, -3.9993e-01, -3.5953e-02,
  15519. -4.3623e-01, 3.3012e-01, 2.6307e-01],
  15520. [ 3.1048e-01, -5.8417e-01, 1.7569e+00, -4.4972e-01, -6.0495e-02,
  15521. -4.0298e-01, 5.7915e-01, 3.2222e-01],
  15522. [ 1.8989e-01, -6.7958e-01, 1.7583e+00, -5.6773e-01, -4.8253e-01,
  15523. -2.4003e-01, 4.2579e-01, 8.0821e-02]], device='cuda:0',
  15524. grad_fn=<AddmmBackward>)
  15525. landmarks are: tensor([[[ 0.5227, -0.4615, 1.6575, -0.1304, -0.5076, -0.0149, 0.1815,
  15526. 0.0021],
  15527. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  15528. 0.2853],
  15529. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  15530. 0.5071],
  15531. [ 0.6010, -0.4321, 1.6517, 0.2160, -0.4210, 0.0774, 0.6356,
  15532. 0.0313],
  15533. [ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  15534. 0.3315],
  15535. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  15536. 0.3806],
  15537. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  15538. 0.3007],
  15539. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  15540. 0.0231]]], device='cuda:0')
  15541. loss_train_step before backward: tensor(0.0548, device='cuda:0', grad_fn=<MseLossBackward>)
  15542. loss_train_step after backward: tensor(0.0548, device='cuda:0', grad_fn=<MseLossBackward>)
  15543. loss_train: 0.054758865386247635
  15544. step: 1
  15545. running loss: 0.054758865386247635
  15546. Train Steps: 1/90 Loss: 0.0548 torch.Size([8, 600, 800])
  15547. torch.Size([8, 8])
  15548. tensor([[0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  15549. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  15550. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  15551. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  15552. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  15553. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  15554. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  15555. [0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200]],
  15556. device='cuda:0', dtype=torch.float64)
  15557. predictions are: tensor([[ 0.3067, -0.5911, 1.3730, -1.0648, -0.3434, -0.9991, 0.5182, 0.3448],
  15558. [-0.3291, -0.9670, 1.0663, -1.0819, -0.3201, -1.1403, 0.2702, 0.3937],
  15559. [ 0.5365, -0.4417, 1.6636, -1.0241, -0.0103, -1.3002, 0.7841, 0.2095],
  15560. [ 0.7065, -0.3506, 1.7970, -0.1609, -0.5044, 0.1665, 0.2508, 0.1114],
  15561. [-0.1420, -0.8803, 1.4987, -0.7562, -0.4674, -0.4524, 0.4285, 0.3405],
  15562. [ 0.6437, -0.3572, 1.7996, -0.9246, -0.2193, -0.9633, 0.7583, 0.2072],
  15563. [ 0.3890, -0.5329, 1.5026, -0.9721, -0.3509, -1.0259, 0.4017, 0.1881],
  15564. [ 0.6239, -0.4407, 1.8843, 0.4963, -0.4543, 0.0053, 0.5245, 0.1646]],
  15565. device='cuda:0', grad_fn=<AddmmBackward>)
  15566. landmarks are: tensor([[[ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  15567. 0.3315],
  15568. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  15569. 0.2622],
  15570. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  15571. 0.1020],
  15572. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  15573. 0.0502],
  15574. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  15575. 0.3469],
  15576. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  15577. 0.1467],
  15578. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  15579. 0.2043],
  15580. [ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  15581. 0.1159]]], device='cuda:0')
  15582. loss_train_step before backward: tensor(0.0447, device='cuda:0', grad_fn=<MseLossBackward>)
  15583. loss_train_step after backward: tensor(0.0447, device='cuda:0', grad_fn=<MseLossBackward>)
  15584. loss_train: 0.09948705509305
  15585. step: 2
  15586. running loss: 0.049743527546525
  15587. Train Steps: 2/90 Loss: 0.0497 torch.Size([8, 600, 800])
  15588. torch.Size([8, 8])
  15589. tensor([[0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  15590. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  15591. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  15592. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  15593. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  15594. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  15595. [0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378],
  15596. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950]],
  15597. device='cuda:0', dtype=torch.float64)
  15598. predictions are: tensor([[ 0.5210, -0.4563, 1.7610, -0.8858, -0.2437, -0.7401, 0.9069, 0.1881],
  15599. [ 0.2435, -0.5746, 1.7808, -0.4829, -0.3414, -1.1378, 0.3184, 0.3190],
  15600. [-0.1094, -0.8018, 0.9690, -1.3126, -0.3771, -1.2953, 0.2717, 0.4078],
  15601. [ 0.4078, -0.5230, 1.8003, -0.1228, -0.0185, 0.1290, 0.4568, 0.3150],
  15602. [ 0.7459, -0.3426, 1.8601, 0.1211, -0.5755, -0.1134, 0.6215, 0.1065],
  15603. [ 0.4384, -0.4892, 1.4912, -1.1436, -0.3577, -1.0383, 0.4101, 0.1810],
  15604. [ 0.6986, -0.3227, 1.7810, 0.1030, -0.4969, -0.2094, 0.2139, 0.2080],
  15605. [ 0.7046, -0.3568, 1.7441, 0.0391, -0.2582, 0.1621, 0.4744, 0.1544]],
  15606. device='cuda:0', grad_fn=<AddmmBackward>)
  15607. landmarks are: tensor([[[ 6.2236e-01, -4.1045e-01, 1.9173e+00, -7.7706e-01, -1.0299e-01,
  15608. -7.3084e-01, 1.1532e+00, 1.8749e-01],
  15609. [ 5.8995e-01, -3.9323e-01, 1.8307e+00, -3.9215e-01, -4.2679e-01,
  15610. -1.1851e+00, 3.7575e-01, 1.9292e-01],
  15611. [ 5.7131e-01, -3.6712e-01, 8.6651e-01, -1.0696e+00, -3.6905e-01,
  15612. -1.2236e+00, 3.5266e-01, 2.6220e-01],
  15613. [ 5.3712e-01, -4.2517e-01, 1.7037e+00, -6.8822e-02, -3.4180e-02,
  15614. 6.2048e-02, 3.7575e-01, 2.8530e-01],
  15615. [ 6.2401e-01, -4.3212e-01, 1.8423e+00, 1.8522e-01, -5.8845e-01,
  15616. -1.6120e-01, 6.9623e-01, 1.1149e-02],
  15617. [ 5.7898e-01, -4.0793e-01, 1.5929e+00, -1.0630e+00, -4.7294e-01,
  15618. -1.0725e+00, 4.1374e-01, 8.0707e-02],
  15619. [ 5.4353e-01, -4.0454e-01, 1.7557e+00, 8.5142e-02, -5.3072e-01,
  15620. -2.8437e-01, 1.7213e-02, 1.9805e-01],
  15621. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  15622. 5.4350e-02, 4.9700e-01, 4.6189e-04]]], device='cuda:0')
  15623. loss_train_step before backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  15624. loss_train_step after backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  15625. loss_train: 0.12145851366221905
  15626. step: 3
  15627. running loss: 0.040486171220739685
  15628.  
  15629. Train Steps: 3/90 Loss: 0.0405 torch.Size([8, 600, 800])
  15630. torch.Size([8, 8])
  15631. tensor([[0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  15632. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  15633. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  15634. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  15635. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  15636. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  15637. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  15638. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519]],
  15639. device='cuda:0', dtype=torch.float64)
  15640. predictions are: tensor([[ 0.5027, -0.4413, 1.8971, -0.8446, -0.2785, -1.2732, 0.7965, 0.1499],
  15641. [ 0.3700, -0.5806, 1.7208, 0.2440, -0.2295, 0.1421, 0.3970, 0.1733],
  15642. [ 0.4950, -0.4589, 1.1742, -1.2359, -0.5166, -1.0659, 0.2792, 0.1711],
  15643. [ 0.6150, -0.3365, 1.7022, 0.1509, -0.4928, -0.4111, 0.5337, 0.3872],
  15644. [ 0.6815, -0.3452, 1.8120, -0.0561, -0.2128, 0.1955, 0.3699, 0.1365],
  15645. [ 0.2446, -0.5919, 1.4378, -0.8585, -0.5198, -0.8801, 0.1190, 0.2465],
  15646. [ 0.7320, -0.2839, 1.4079, -1.1618, -0.3278, -1.2204, 0.5434, 0.2279],
  15647. [ 0.4952, -0.4617, 1.7817, 0.0618, -0.1303, 0.2405, 0.4049, 0.2265]],
  15648. device='cuda:0', grad_fn=<AddmmBackward>)
  15649. landmarks are: tensor([[[ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  15650. -0.0263],
  15651. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  15652. -0.0610],
  15653. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  15654. 0.0802],
  15655. [ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  15656. 0.4547],
  15657. [ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  15658. 0.2228],
  15659. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  15660. 0.2776],
  15661. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  15662. 0.1852],
  15663. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  15664. 0.2634]]], device='cuda:0')
  15665. loss_train_step before backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  15666. loss_train_step after backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  15667. loss_train: 0.13915947452187538
  15668. step: 4
  15669. running loss: 0.034789868630468845
  15670. Train Steps: 4/90 Loss: 0.0348 torch.Size([8, 600, 800])
  15671. torch.Size([8, 8])
  15672. tensor([[0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  15673. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  15674. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  15675. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  15676. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  15677. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  15678. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  15679. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467]],
  15680. device='cuda:0', dtype=torch.float64)
  15681. predictions are: tensor([[ 0.8880, -0.1930, 1.3037, -0.9538, -0.5272, -0.8709, 0.3894, 0.2118],
  15682. [ 0.7731, -0.2506, 1.6970, 0.1314, -0.1712, 0.3505, 0.3391, 0.2241],
  15683. [-1.9436, -2.0312, 1.3338, -0.8958, -0.3679, -1.0223, 0.3111, 0.2546],
  15684. [ 0.9518, -0.1705, 1.7189, -0.3662, -0.5749, -0.1627, 0.4393, 0.1420],
  15685. [ 0.7302, -0.2546, 1.4106, -1.0633, -0.1283, -1.3372, 0.4802, 0.2443],
  15686. [ 0.9238, -0.1728, 1.6986, -0.2053, -0.4794, -0.0917, 0.3199, 0.2095],
  15687. [ 0.9332, -0.1299, 1.6650, -0.8772, -0.2057, -1.0746, 0.5534, 0.1711],
  15688. [ 0.8415, -0.2139, 1.7384, 0.2925, -0.3925, -0.0505, 0.5245, 0.2025]],
  15689. device='cuda:0', grad_fn=<AddmmBackward>)
  15690. landmarks are: tensor([[[ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  15691. 0.2335],
  15692. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  15693. 0.2386],
  15694. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  15695. 0.2853],
  15696. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  15697. 0.0840],
  15698. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  15699. 0.1850],
  15700. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  15701. 0.3265],
  15702. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  15703. 0.2043],
  15704. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  15705. 0.2391]]], device='cuda:0')
  15706. loss_train_step before backward: tensor(0.0299, device='cuda:0', grad_fn=<MseLossBackward>)
  15707. loss_train_step after backward: tensor(0.0299, device='cuda:0', grad_fn=<MseLossBackward>)
  15708. loss_train: 0.16904453001916409
  15709. step: 5
  15710. running loss: 0.033808906003832816
  15711. Train Steps: 5/90 Loss: 0.0338 torch.Size([8, 600, 800])
  15712. torch.Size([8, 8])
  15713. tensor([[0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050],
  15714. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  15715. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  15716. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  15717. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  15718. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  15719. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  15720. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575]],
  15721. device='cuda:0', dtype=torch.float64)
  15722. predictions are: tensor([[ 0.8357, -0.2498, 1.7605, 0.2656, -0.2423, 0.1694, 0.2467, 0.1434],
  15723. [ 0.9518, -0.1559, 1.2529, -0.8951, -0.6224, -0.6567, 0.3689, 0.2523],
  15724. [ 0.6504, -0.3560, 1.8047, -0.0042, -0.0985, 0.1004, 0.2837, 0.2233],
  15725. [ 0.8765, -0.1998, 1.3278, -0.8894, -0.6295, -0.8862, 0.1980, 0.1767],
  15726. [ 0.8432, -0.2417, 1.7446, -0.0057, -0.4000, 0.3157, 0.2729, 0.1645],
  15727. [ 0.6089, -0.3450, 1.5589, -0.3284, -0.5271, -1.1253, 0.0505, 0.2763],
  15728. [-0.9919, -1.4238, 1.7263, -1.0578, 0.1417, -1.2524, 1.0073, 0.2014],
  15729. [ 1.0442, -0.1350, 1.7510, -0.6142, -0.4799, -0.3495, 0.8260, 0.1358]],
  15730. device='cuda:0', grad_fn=<AddmmBackward>)
  15731. landmarks are: tensor([[[ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  15732. 0.0467],
  15733. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  15734. 0.3546],
  15735. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  15736. 0.2853],
  15737. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  15738. 0.2545],
  15739. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  15740. 0.3047],
  15741. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  15742. 0.3928],
  15743. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  15744. 0.2463],
  15745. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  15746. 0.2890]]], device='cuda:0')
  15747. loss_train_step before backward: tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward>)
  15748. loss_train_step after backward: tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward>)
  15749. loss_train: 0.2331299614161253
  15750. step: 6
  15751. running loss: 0.038854993569354214
  15752. Train Steps: 6/90 Loss: 0.0389 torch.Size([8, 600, 800])
  15753. torch.Size([8, 8])
  15754. tensor([[0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  15755. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  15756. [0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  15757. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  15758. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  15759. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  15760. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  15761. [0.6151, 0.4058, 0.7068, 0.2680, 0.3400, 0.4083, 0.5775, 0.5733]],
  15762. device='cuda:0', dtype=torch.float64)
  15763. predictions are: tensor([[ 0.9756, -0.1992, 1.7893, -0.4266, -0.4919, -0.2887, 0.6990, 0.1151],
  15764. [ 0.9571, -0.1918, 1.1712, -1.0054, -0.2589, -1.1467, 0.5271, 0.2481],
  15765. [ 0.8672, -0.2019, 1.5381, -0.4543, -0.4556, -0.7202, 0.2660, 0.1861],
  15766. [ 0.8332, -0.2177, 1.7749, -0.5389, 0.0245, -1.0307, 0.5606, 0.1816],
  15767. [ 0.7884, -0.2923, 1.8857, -0.3090, -0.4546, -0.6597, 0.4157, 0.1693],
  15768. [-2.0707, -2.1505, 1.0834, -0.9208, -0.3323, -0.9233, 0.0729, 0.2109],
  15769. [ 1.1957, -0.0154, 1.8045, -0.1536, -0.4955, 0.1855, 0.2426, 0.1583],
  15770. [ 0.8495, -0.2346, 1.1987, -0.7389, -0.6078, -0.2832, 0.3070, 0.2877]],
  15771. device='cuda:0', grad_fn=<AddmmBackward>)
  15772. landmarks are: tensor([[[ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  15773. 0.1080],
  15774. [ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  15775. 0.1852],
  15776. [ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  15777. 0.3087],
  15778. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  15779. 0.1501],
  15780. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  15781. 0.2442],
  15782. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  15783. 0.2930],
  15784. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  15785. 0.2776],
  15786. [ 0.5552, -0.4113, 0.9790, -1.0480, -0.7155, -0.3998, 0.3815,
  15787. 0.3623]]], device='cuda:0')
  15788. loss_train_step before backward: tensor(0.0500, device='cuda:0', grad_fn=<MseLossBackward>)
  15789. loss_train_step after backward: tensor(0.0500, device='cuda:0', grad_fn=<MseLossBackward>)
  15790. loss_train: 0.28310741670429707
  15791. step: 7
  15792. running loss: 0.04044391667204244
  15793.  
  15794. Train Steps: 7/90 Loss: 0.0404 torch.Size([8, 600, 800])
  15795. torch.Size([8, 8])
  15796. tensor([[0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  15797. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  15798. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  15799. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  15800. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  15801. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  15802. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  15803. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461]],
  15804. device='cuda:0', dtype=torch.float64)
  15805. predictions are: tensor([[ 0.7177, -0.2844, 1.2895, -0.7119, -0.6197, -0.5738, 0.1653, 0.3376],
  15806. [ 0.6297, -0.4088, 1.2134, -1.3051, -0.3212, -1.3260, 0.5060, 0.2098],
  15807. [ 0.5482, -0.4027, 1.6650, 0.0851, -0.4617, -0.6359, 0.1926, 0.2705],
  15808. [ 0.6680, -0.3811, 1.8350, -0.1524, -0.4657, -0.6388, 0.6130, 0.1218],
  15809. [ 0.6451, -0.3880, 1.7837, 0.0488, -0.2782, 0.2239, 0.3377, 0.1277],
  15810. [ 0.6347, -0.3732, 1.6429, -0.5697, -0.4933, 0.0440, 0.5640, 0.2210],
  15811. [ 0.7459, -0.3111, 1.7528, -0.4887, -0.6403, -0.4226, 0.3598, 0.0651],
  15812. [ 0.6221, -0.3853, 1.7191, 0.1670, -0.1029, 0.1177, 0.2200, 0.1834]],
  15813. device='cuda:0', grad_fn=<AddmmBackward>)
  15814. landmarks are: tensor([[[ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  15815. 0.4036],
  15816. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  15817. 0.2622],
  15818. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  15819. 0.3392],
  15820. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  15821. 0.0472],
  15822. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  15823. 0.0390],
  15824. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  15825. 0.2545],
  15826. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  15827. 0.0236],
  15828. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  15829. 0.2364]]], device='cuda:0')
  15830. loss_train_step before backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  15831. loss_train_step after backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  15832. loss_train: 0.289715682156384
  15833. step: 8
  15834. running loss: 0.036214460269548
  15835. Train Steps: 8/90 Loss: 0.0362 torch.Size([8, 600, 800])
  15836. torch.Size([8, 8])
  15837. tensor([[0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  15838. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  15839. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  15840. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  15841. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  15842. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  15843. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  15844. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136]],
  15845. device='cuda:0', dtype=torch.float64)
  15846. predictions are: tensor([[ 1.1728, -0.0307, 1.7745, -0.4279, -0.6014, -0.7678, 0.3550, 0.1150],
  15847. [ 1.1965, -0.0361, 1.7375, -0.0554, -0.5987, 0.2345, 0.5089, 0.1112],
  15848. [-1.2754, -1.6184, 1.6297, -0.9376, 0.1132, -0.9360, 0.9832, 0.2434],
  15849. [ 0.9482, -0.2055, 1.7096, 0.2033, -0.3678, 0.2868, 0.2874, 0.2983],
  15850. [ 0.8853, -0.1925, 1.5021, -1.0313, -0.1642, -1.0260, 0.5182, 0.1084],
  15851. [ 0.8353, -0.2145, 1.0419, -0.7815, -0.5458, -0.8351, 0.1290, 0.3244],
  15852. [-0.7671, -1.2577, 1.3239, -0.5202, -0.6450, -0.6157, 0.0111, 0.2329],
  15853. [ 0.9063, -0.2047, 0.9747, -0.9788, -0.5142, -1.0113, 0.2779, 0.1766]],
  15854. device='cuda:0', grad_fn=<AddmmBackward>)
  15855. landmarks are: tensor([[[ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  15856. 0.1000],
  15857. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  15858. 0.0081],
  15859. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  15860. 0.2463],
  15861. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  15862. 0.3777],
  15863. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  15864. -0.0369],
  15865. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  15866. 0.3315],
  15867. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  15868. 0.2837],
  15869. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  15870. 0.0862]]], device='cuda:0')
  15871. loss_train_step before backward: tensor(0.1240, device='cuda:0', grad_fn=<MseLossBackward>)
  15872. loss_train_step after backward: tensor(0.1240, device='cuda:0', grad_fn=<MseLossBackward>)
  15873. loss_train: 0.41375276912003756
  15874. step: 9
  15875. running loss: 0.045972529902226396
  15876. Train Steps: 9/90 Loss: 0.0460 torch.Size([8, 600, 800])
  15877. torch.Size([8, 8])
  15878. tensor([[0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  15879. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  15880. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  15881. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  15882. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  15883. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  15884. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  15885. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567]],
  15886. device='cuda:0', dtype=torch.float64)
  15887. predictions are: tensor([[ 0.9313, -0.2026, 1.4965, -0.8860, -0.4646, -0.8344, 0.7200, 0.1272],
  15888. [-1.7722, -1.9497, 1.0401, -1.0044, -0.4755, -0.9832, 0.1582, 0.2319],
  15889. [ 1.1622, -0.0263, 1.8426, -0.0205, -0.6599, -0.2158, 0.2817, 0.1618],
  15890. [ 1.0712, -0.1175, 1.1899, -1.1806, -0.3783, -1.2676, 0.5125, 0.1718],
  15891. [ 1.0987, -0.0886, 1.7554, 0.2702, -0.3929, 0.3518, 0.2888, 0.1255],
  15892. [ 0.8446, -0.2262, 1.7078, 0.0515, -0.3860, 0.2727, 0.2133, 0.2586],
  15893. [ 1.0712, -0.1029, 1.5134, -0.9648, -0.2017, -1.2557, 0.7378, 0.2042],
  15894. [-1.1009, -1.4880, 1.1267, -0.8914, -0.5174, -0.8465, 0.0194, 0.3053]],
  15895. device='cuda:0', grad_fn=<AddmmBackward>)
  15896. landmarks are: tensor([[[ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  15897. 0.1214],
  15898. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  15899. 0.1073],
  15900. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  15901. 0.0774],
  15902. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  15903. 0.1082],
  15904. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  15905. 0.0467],
  15906. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  15907. 0.3238],
  15908. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  15909. 0.0851],
  15910. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  15911. 0.2853]]], device='cuda:0')
  15912. loss_train_step before backward: tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward>)
  15913. loss_train_step after backward: tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward>)
  15914. loss_train: 0.4962860615924001
  15915. step: 10
  15916. running loss: 0.04962860615924001
  15917. Train Steps: 10/90 Loss: 0.0496 torch.Size([8, 600, 800])
  15918. torch.Size([8, 8])
  15919. tensor([[0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  15920. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  15921. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  15922. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  15923. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  15924. [0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  15925. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  15926. [0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378]],
  15927. device='cuda:0', dtype=torch.float64)
  15928. predictions are: tensor([[ 1.0878, -0.1095, 1.6107, -0.0532, -0.4727, -0.1721, 0.7642, 0.1889],
  15929. [ 0.8507, -0.2066, 1.5986, -0.0028, -0.3621, 0.0362, 0.4501, 0.2864],
  15930. [ 0.8927, -0.2078, 1.7943, -0.2751, -0.5363, -0.4577, 0.5687, 0.1468],
  15931. [ 0.6973, -0.3176, 1.6548, -0.6774, -0.6204, -0.6440, 0.2402, 0.1518],
  15932. [ 0.7442, -0.2523, 1.3724, -0.8019, -0.6210, -0.5154, 0.2633, 0.2536],
  15933. [ 0.6057, -0.3823, 1.5197, 0.0231, -0.3128, -0.0456, 0.1714, 0.1913],
  15934. [-2.1630, -2.2389, 1.0234, -1.2700, -0.4265, -1.2075, 0.2050, 0.1823],
  15935. [ 0.8390, -0.2155, 1.6746, -0.1264, -0.5022, -0.4144, 0.1339, 0.1871]],
  15936. device='cuda:0', grad_fn=<AddmmBackward>)
  15937. landmarks are: tensor([[[ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  15938. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  15939. [ 5.7419e-01, -3.7921e-01, 1.6460e+00, 3.0839e-01, -3.4596e-01,
  15940. 1.4673e-01, 4.1617e-01, 3.1609e-01],
  15941. [ 6.0964e-01, -4.0462e-01, 1.8249e+00, -7.2363e-03, -6.1155e-01,
  15942. -3.5366e-01, 6.1824e-01, 9.2841e-02],
  15943. [ 5.2355e-01, -4.2731e-01, 1.7499e+00, -4.3064e-01, -5.8268e-01,
  15944. -4.6143e-01, 1.6505e-01, 8.6245e-02],
  15945. [ 5.4440e-01, -3.8522e-01, 1.3786e+00, -5.4087e-01, -6.9238e-01,
  15946. -4.2294e-01, 1.7915e-01, 2.3412e-01],
  15947. [ 5.1316e-01, -4.7360e-01, 1.6171e+00, 3.5458e-01, -3.4596e-01,
  15948. 1.2363e-01, 1.4038e-01, -9.1096e-02],
  15949. [-2.2859e+00, -2.2859e+00, 1.0513e+00, -1.2851e+00, -4.4411e-01,
  15950. -1.2313e+00, 2.2057e-01, 1.0729e-01],
  15951. [ 5.4353e-01, -4.0454e-01, 1.7557e+00, 8.5142e-02, -5.3072e-01,
  15952. -2.8437e-01, 1.7213e-02, 1.9805e-01]]], device='cuda:0')
  15953. loss_train_step before backward: tensor(0.0259, device='cuda:0', grad_fn=<MseLossBackward>)
  15954. loss_train_step after backward: tensor(0.0259, device='cuda:0', grad_fn=<MseLossBackward>)
  15955. loss_train: 0.5221390677616
  15956. step: 11
  15957. running loss: 0.047467187978327274
  15958.  
  15959. Train Steps: 11/90 Loss: 0.0475 torch.Size([8, 600, 800])
  15960. torch.Size([8, 8])
  15961. tensor([[0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  15962. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  15963. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  15964. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  15965. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  15966. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  15967. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  15968. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667]],
  15969. device='cuda:0', dtype=torch.float64)
  15970. predictions are: tensor([[ 0.3029, -0.5813, 1.6058, 0.2992, -0.4347, -0.2948, 0.2373, 0.4066],
  15971. [ 0.1432, -0.7466, 1.3805, -1.3673, -0.3420, -1.3187, 0.7347, 0.0626],
  15972. [ 0.1686, -0.6956, 1.5923, 0.0621, -0.4416, -0.2541, 0.3519, 0.1528],
  15973. [ 0.2014, -0.6436, 1.2887, -0.8800, -0.6039, 0.0331, 0.3587, 0.2998],
  15974. [ 0.5978, -0.4018, 1.1764, -1.0731, -0.6076, -0.8882, 0.0660, 0.0662],
  15975. [ 0.5845, -0.4183, 1.5968, -0.8787, -0.6331, -0.9194, 0.3063, 0.0992],
  15976. [ 0.5553, -0.4389, 1.4506, -1.0662, -0.4033, -1.0708, 0.5415, 0.1191],
  15977. [ 0.3629, -0.5407, 1.6632, 0.1891, -0.4559, 0.0866, 0.4513, 0.2735]],
  15978. device='cuda:0', grad_fn=<AddmmBackward>)
  15979. landmarks are: tensor([[[ 6.0381e-01, -3.4642e-01, 1.7037e+00, 3.9307e-01, -4.4411e-01,
  15980. -2.6128e-01, 3.0069e-01, 4.6236e-01],
  15981. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  15982. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  15983. [ 5.8915e-01, -4.5504e-01, 1.5132e+00, 3.5458e-01, -3.6905e-01,
  15984. -1.5350e-01, 3.8152e-01, 1.4673e-01],
  15985. [ 5.4319e-01, -4.2240e-01, 1.3284e+00, -8.5404e-01, -6.8661e-01,
  15986. -2.2633e-02, 4.0770e-01, 3.1769e-01],
  15987. [ 5.2194e-01, -4.5504e-01, 1.1415e+00, -9.1962e-01, -6.4042e-01,
  15988. -9.3872e-01, 1.8562e-01, 1.4106e-02],
  15989. [ 5.4825e-01, -4.2490e-01, 1.5305e+00, -7.3857e-01, -6.1155e-01,
  15990. -8.6944e-01, 3.3533e-01, 1.0054e-01],
  15991. [ 5.7962e-01, -3.8776e-01, 1.3688e+00, -1.0542e+00, -4.0947e-01,
  15992. -1.1312e+00, 5.8938e-01, 1.9292e-01],
  15993. [ 5.8528e-01, -3.6135e-01, 1.6806e+00, 2.9299e-01, -4.4988e-01,
  15994. 1.0054e-01, 3.8152e-01, 3.3149e-01]]], device='cuda:0')
  15995. loss_train_step before backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  15996. loss_train_step after backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  15997. loss_train: 0.5421810066327453
  15998. step: 12
  15999. running loss: 0.04518175055272877
  16000. Train Steps: 12/90 Loss: 0.0452 torch.Size([8, 600, 800])
  16001. torch.Size([8, 8])
  16002. tensor([[0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  16003. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  16004. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  16005. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  16006. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  16007. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  16008. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  16009. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467]],
  16010. device='cuda:0', dtype=torch.float64)
  16011. predictions are: tensor([[ 0.1219, -0.7227, 1.8549, -0.1560, -0.5318, -0.7085, 0.7696, 0.0714],
  16012. [ 0.8323, -0.2219, 1.6331, -0.1667, -0.2122, 0.0865, 0.1752, 0.2409],
  16013. [-2.4100, -2.4214, 0.8703, -1.1893, -0.4963, -1.1885, 0.1118, 0.2354],
  16014. [ 0.7064, -0.3345, 1.2014, -1.1894, -0.3038, -1.3511, 0.4325, 0.1430],
  16015. [ 0.6720, -0.3316, 1.6616, -0.2564, -0.6401, -0.3004, 0.3643, 0.1793],
  16016. [ 0.5241, -0.4137, 1.6657, -0.1205, -0.2329, 0.3921, 0.3336, 0.2425],
  16017. [ 0.4922, -0.4644, 1.7609, -0.4795, -0.7322, -0.6432, 0.3411, 0.0464],
  16018. [ 0.9622, -0.1731, 0.8906, -1.0965, -0.5967, -1.1497, 0.3895, 0.2532]],
  16019. device='cuda:0', grad_fn=<AddmmBackward>)
  16020. landmarks are: tensor([[[ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  16021. 0.1982],
  16022. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  16023. 0.3007],
  16024. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  16025. 0.3604],
  16026. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  16027. 0.2083],
  16028. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  16029. 0.2314],
  16030. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  16031. 0.2083],
  16032. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  16033. 0.0620],
  16034. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  16035. 0.2391]]], device='cuda:0')
  16036. loss_train_step before backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  16037. loss_train_step after backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  16038. loss_train: 0.5627054637297988
  16039. step: 13
  16040. running loss: 0.04328503567152298
  16041. Train Steps: 13/90 Loss: 0.0433 torch.Size([8, 600, 800])
  16042. torch.Size([8, 8])
  16043. tensor([[0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  16044. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  16045. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  16046. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  16047. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  16048. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456],
  16049. [0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  16050. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528]],
  16051. device='cuda:0', dtype=torch.float64)
  16052. predictions are: tensor([[ 0.4958, -0.4315, 1.4636, 0.0741, -0.4305, -0.2701, 0.1757, 0.2284],
  16053. [ 0.0142, -0.7257, 1.3866, -0.4004, -0.6804, -0.9269, 0.1312, 0.2729],
  16054. [ 0.4388, -0.4977, 1.5452, -0.0589, -0.6108, -0.3443, 0.2965, 0.2244],
  16055. [ 0.1248, -0.7289, 1.5169, -1.3572, -0.3329, -1.3349, 0.9413, 0.0911],
  16056. [ 0.2870, -0.6169, 1.5969, -0.4151, -0.4717, 0.0487, 0.7505, 0.2085],
  16057. [ 0.3186, -0.5650, 1.4995, -0.1835, -0.3716, 0.0049, 0.0432, 0.1541],
  16058. [ 0.1244, -0.6726, 1.3800, -0.3604, -0.4168, -0.0753, -0.0819, 0.1340],
  16059. [ 0.3934, -0.5537, 1.8068, -0.5702, -0.5608, -0.6095, 0.8026, 0.1045]],
  16060. device='cuda:0', grad_fn=<AddmmBackward>)
  16061. landmarks are: tensor([[[ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  16062. 0.3161],
  16063. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  16064. 0.4393],
  16065. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  16066. 0.3161],
  16067. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  16068. 0.2944],
  16069. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  16070. 0.2035],
  16071. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  16072. 0.2341],
  16073. [ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  16074. 0.1530],
  16075. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  16076. 0.2676]]], device='cuda:0')
  16077. loss_train_step before backward: tensor(0.0514, device='cuda:0', grad_fn=<MseLossBackward>)
  16078. loss_train_step after backward: tensor(0.0514, device='cuda:0', grad_fn=<MseLossBackward>)
  16079. loss_train: 0.6141552468761802
  16080. step: 14
  16081. running loss: 0.043868231919727156
  16082. Train Steps: 14/90 Loss: 0.0439 torch.Size([8, 600, 800])
  16083. torch.Size([8, 8])
  16084. tensor([[0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  16085. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  16086. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  16087. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  16088. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  16089. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  16090. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  16091. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083]],
  16092. device='cuda:0', dtype=torch.float64)
  16093. predictions are: tensor([[ 0.1153, -0.7137, 1.8762, -0.4651, -0.3093, -0.7997, 0.9198, 0.2673],
  16094. [ 0.2380, -0.6188, 1.6252, -0.5804, -0.7252, -0.4364, 0.3297, 0.1032],
  16095. [ 0.4029, -0.5418, 1.0334, -1.3869, -0.4907, -1.4458, 0.2220, 0.0935],
  16096. [ 0.4753, -0.5046, 1.0829, -1.3684, -0.6306, -1.0880, 0.3981, 0.0556],
  16097. [ 0.0737, -0.7363, 1.5422, 0.0759, -0.5337, -0.1861, 0.7105, 0.2673],
  16098. [ 0.2822, -0.5751, 1.5885, -0.0442, -0.2840, -0.0404, 0.1796, 0.1596],
  16099. [ 0.2269, -0.6090, 1.6293, -0.0549, -0.2520, 0.0713, 0.2031, 0.1629],
  16100. [-0.0072, -0.7856, 1.5862, -0.1222, -0.6186, -0.3006, 0.3431, 0.3637]],
  16101. device='cuda:0', grad_fn=<AddmmBackward>)
  16102. landmarks are: tensor([[[ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  16103. 0.4600],
  16104. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  16105. 0.0236],
  16106. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  16107. 0.0774],
  16108. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  16109. 0.0562],
  16110. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  16111. 0.3745],
  16112. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  16113. 0.0851],
  16114. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  16115. 0.0764],
  16116. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  16117. 0.5239]]], device='cuda:0')
  16118. loss_train_step before backward: tensor(0.0415, device='cuda:0', grad_fn=<MseLossBackward>)
  16119. loss_train_step after backward: tensor(0.0415, device='cuda:0', grad_fn=<MseLossBackward>)
  16120. loss_train: 0.6556800110265613
  16121. step: 15
  16122. running loss: 0.04371200073510408
  16123.  
  16124. Train Steps: 15/90 Loss: 0.0437 torch.Size([8, 600, 800])
  16125. torch.Size([8, 8])
  16126. tensor([[0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  16127. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  16128. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  16129. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  16130. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  16131. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  16132. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  16133. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683]],
  16134. device='cuda:0', dtype=torch.float64)
  16135. predictions are: tensor([[ 0.1218, -0.6983, 1.2977, -0.7802, -0.6482, -0.9329, 0.1384, 0.3076],
  16136. [ 0.1443, -0.6555, 1.6092, -0.6454, -0.6445, -0.6126, 0.2774, 0.1033],
  16137. [ 0.3040, -0.5442, 1.3830, -0.0120, -0.4510, -0.2879, 0.3900, 0.3919],
  16138. [ 0.0439, -0.7803, 1.1903, -1.3528, -0.3130, -1.4106, 0.5307, 0.1385],
  16139. [ 0.4143, -0.5202, 1.7113, -0.1068, -0.4546, 0.0416, 0.4255, 0.0655],
  16140. [ 0.3109, -0.5906, 1.6933, -0.0469, -0.5008, -0.4294, 0.8705, 0.1147],
  16141. [ 0.1866, -0.6275, 1.6986, -0.3177, -0.2417, 0.3220, 0.5624, 0.1782],
  16142. [ 0.2944, -0.5437, 1.5597, -0.0388, -0.5235, -0.6436, 0.3104, 0.2505]],
  16143. device='cuda:0', grad_fn=<AddmmBackward>)
  16144. landmarks are: tensor([[[ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  16145. 0.4374],
  16146. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  16147. 0.0862],
  16148. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  16149. 0.5401],
  16150. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  16151. 0.0928],
  16152. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  16153. 0.0663],
  16154. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  16155. 0.2516],
  16156. [ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  16157. 0.1929],
  16158. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  16159. 0.3392]]], device='cuda:0')
  16160. loss_train_step before backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  16161. loss_train_step after backward: tensor(0.0385, device='cuda:0', grad_fn=<MseLossBackward>)
  16162. loss_train: 0.6941816275939345
  16163. step: 16
  16164. running loss: 0.04338635172462091
  16165. Train Steps: 16/90 Loss: 0.0434 torch.Size([8, 600, 800])
  16166. torch.Size([8, 8])
  16167. tensor([[0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  16168. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  16169. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  16170. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  16171. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  16172. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  16173. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  16174. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367]],
  16175. device='cuda:0', dtype=torch.float64)
  16176. predictions are: tensor([[ 2.7160e-01, -6.1288e-01, 1.3024e+00, -1.0790e+00, -2.4634e-01,
  16177. -1.3686e+00, 5.0634e-01, 1.6069e-01],
  16178. [ 2.6692e-01, -5.8733e-01, 1.6549e+00, 1.7750e-01, -2.6255e-01,
  16179. 1.4141e-01, 3.5143e-01, 1.6915e-01],
  16180. [ 3.3903e-01, -5.6775e-01, 1.0713e+00, -1.1558e+00, -2.5916e-01,
  16181. -1.4428e+00, 3.9940e-01, 2.0511e-01],
  16182. [ 4.3410e-01, -5.4499e-01, 1.1180e+00, -1.2465e+00, -5.6629e-01,
  16183. -1.0447e+00, 5.5686e-01, 4.9847e-02],
  16184. [ 2.5437e-01, -6.0803e-01, 1.7518e+00, 1.5235e-01, -4.2358e-01,
  16185. 4.0426e-02, 5.6769e-01, 1.3766e-01],
  16186. [ 6.4946e-04, -7.1879e-01, 1.5425e+00, 7.2002e-03, -6.0888e-01,
  16187. -6.5312e-01, 2.5940e-01, 3.6687e-01],
  16188. [ 1.4826e-01, -6.5294e-01, 1.8039e+00, -3.0606e-01, -5.9294e-01,
  16189. -5.2833e-02, 6.3769e-01, 2.8626e-01],
  16190. [ 8.7252e-02, -6.8236e-01, 1.6944e+00, -4.0593e-01, -6.6378e-01,
  16191. -3.7071e-01, 5.3112e-01, 2.8553e-01]], device='cuda:0',
  16192. grad_fn=<AddmmBackward>)
  16193. landmarks are: tensor([[[ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  16194. 0.2237],
  16195. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  16196. 0.0851],
  16197. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  16198. 0.2006],
  16199. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  16200. 0.0772],
  16201. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  16202. 0.1005],
  16203. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  16204. 0.4393],
  16205. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  16206. 0.3161],
  16207. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  16208. 0.1929]]], device='cuda:0')
  16209. loss_train_step before backward: tensor(0.0320, device='cuda:0', grad_fn=<MseLossBackward>)
  16210. loss_train_step after backward: tensor(0.0320, device='cuda:0', grad_fn=<MseLossBackward>)
  16211. loss_train: 0.7261817371472716
  16212. step: 17
  16213. running loss: 0.04271657277336892
  16214. Train Steps: 17/90 Loss: 0.0427 torch.Size([8, 600, 800])
  16215. torch.Size([8, 8])
  16216. tensor([[0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  16217. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  16218. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  16219. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  16220. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  16221. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  16222. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  16223. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767]],
  16224. device='cuda:0', dtype=torch.float64)
  16225. predictions are: tensor([[ 0.9092, -0.1473, 1.7510, -0.4465, -0.6588, -0.6622, 0.2803, 0.0766],
  16226. [ 0.6855, -0.2995, 1.7302, -0.2893, -0.4286, 0.1628, 0.6664, 0.2222],
  16227. [ 0.5960, -0.4104, 1.4210, -1.1680, -0.3207, -1.3542, 0.9038, 0.1072],
  16228. [ 0.5793, -0.3802, 1.6687, 0.1535, -0.4748, -0.2674, 0.5813, 0.1793],
  16229. [-2.6504, -2.5917, 1.0145, -1.4165, -0.4417, -1.2874, 0.2440, 0.2193],
  16230. [ 0.6755, -0.2863, 1.4774, 0.1994, -0.5063, -0.2944, 0.5160, 0.4400],
  16231. [ 0.4113, -0.4544, 1.6717, 0.0710, -0.1949, -0.0334, 0.2397, 0.2295],
  16232. [ 0.6982, -0.2907, 1.6843, -0.0253, -0.4022, 0.0244, 0.4109, 0.3028]],
  16233. device='cuda:0', grad_fn=<AddmmBackward>)
  16234. landmarks are: tensor([[[ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  16235. -0.0310],
  16236. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  16237. 0.2622],
  16238. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  16239. 0.1193],
  16240. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  16241. 0.2091],
  16242. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  16243. 0.1373],
  16244. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  16245. 0.5401],
  16246. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  16247. 0.2634],
  16248. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  16249. 0.3777]]], device='cuda:0')
  16250. loss_train_step before backward: tensor(0.0168, device='cuda:0', grad_fn=<MseLossBackward>)
  16251. loss_train_step after backward: tensor(0.0168, device='cuda:0', grad_fn=<MseLossBackward>)
  16252. loss_train: 0.7429619831964374
  16253. step: 18
  16254. running loss: 0.04127566573313541
  16255. Train Steps: 18/90 Loss: 0.0413 torch.Size([8, 600, 800])
  16256. torch.Size([8, 8])
  16257. tensor([[0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  16258. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  16259. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  16260. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  16261. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  16262. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  16263. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  16264. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433]],
  16265. device='cuda:0', dtype=torch.float64)
  16266. predictions are: tensor([[ 0.1537, -0.7204, 1.6356, -0.8018, -0.6451, -0.8134, 0.7579, 0.1320],
  16267. [ 0.5381, -0.3980, 1.6382, -0.0354, -0.6471, -0.7040, 0.4174, 0.4160],
  16268. [ 0.3666, -0.4972, 1.6796, -0.2601, -0.1986, 0.0435, 0.4511, 0.3033],
  16269. [ 0.2557, -0.5845, 1.7455, 0.0321, -0.1672, 0.1011, 0.3273, 0.2243],
  16270. [ 0.2479, -0.6265, 1.6954, 0.2720, -0.5356, -0.2905, 0.6293, 0.1359],
  16271. [ 0.5597, -0.4278, 1.1547, -1.2702, -0.3355, -1.5681, 0.3867, 0.1769],
  16272. [ 0.3058, -0.5402, 1.7025, -0.1812, -0.2044, 0.0503, 0.5050, 0.2742],
  16273. [ 0.2479, -0.6194, 1.8035, -0.1138, -0.5522, -0.0488, 0.5325, 0.2004]],
  16274. device='cuda:0', grad_fn=<AddmmBackward>)
  16275. landmarks are: tensor([[[ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  16276. -0.0220],
  16277. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  16278. 0.3161],
  16279. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  16280. 0.3007],
  16281. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  16282. 0.0592],
  16283. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  16284. -0.0049],
  16285. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  16286. 0.1855],
  16287. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  16288. 0.2237],
  16289. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  16290. 0.2237]]], device='cuda:0')
  16291. loss_train_step before backward: tensor(0.0247, device='cuda:0', grad_fn=<MseLossBackward>)
  16292. loss_train_step after backward: tensor(0.0247, device='cuda:0', grad_fn=<MseLossBackward>)
  16293. loss_train: 0.7676935633644462
  16294. step: 19
  16295. running loss: 0.04040492438760243
  16296.  
  16297. Train Steps: 19/90 Loss: 0.0404 torch.Size([8, 600, 800])
  16298. torch.Size([8, 8])
  16299. tensor([[0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  16300. [ nan, nan, 0.8850, 0.2817, 0.5112, 0.2183, 0.7184, 0.5436],
  16301. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  16302. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  16303. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  16304. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  16305. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  16306. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933]],
  16307. device='cuda:0', dtype=torch.float64)
  16308. predictions are: tensor([[ 0.5391, -0.4111, 1.8399, 0.5539, -0.5385, -0.3105, 0.1539, 0.1573],
  16309. [-0.4865, -1.1033, 1.7536, -0.9170, 0.0708, -1.0576, 1.1059, 0.2863],
  16310. [ 0.7090, -0.2659, 1.6790, -0.7104, -0.3165, -0.8219, 0.6182, 0.2112],
  16311. [ 1.0314, -0.0671, 1.9320, 0.0433, -0.5273, 0.1994, 0.5365, 0.3001],
  16312. [ 0.7391, -0.2983, 1.1664, -1.0349, -0.3136, -0.9762, 0.4261, 0.2512],
  16313. [ 0.9982, -0.1675, 1.8577, 0.0253, -0.5594, -0.2516, 0.6394, 0.1182],
  16314. [ 0.6368, -0.3559, 1.2847, -0.8534, -0.4753, -0.6293, 0.4588, 0.2208],
  16315. [-2.1450, -2.2038, 0.8288, -1.1550, -0.3983, -1.0886, 0.1174, 0.3643]],
  16316. device='cuda:0', grad_fn=<AddmmBackward>)
  16317. landmarks are: tensor([[[ 0.5379, -0.4358, 1.7326, 0.1852, -0.6058, -0.5461, 0.0684,
  16318. -0.0310],
  16319. [-2.2859, -2.2859, 1.8018, -0.9849, 0.0755, -1.2774, 1.0326,
  16320. 0.2249],
  16321. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  16322. 0.1467],
  16323. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  16324. 0.3161],
  16325. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  16326. 0.2622],
  16327. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  16328. 0.0697],
  16329. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  16330. 0.1779],
  16331. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  16332. 0.4543]]], device='cuda:0')
  16333. loss_train_step before backward: tensor(0.1029, device='cuda:0', grad_fn=<MseLossBackward>)
  16334. loss_train_step after backward: tensor(0.1029, device='cuda:0', grad_fn=<MseLossBackward>)
  16335. loss_train: 0.8706217845901847
  16336. step: 20
  16337. running loss: 0.04353108922950923
  16338. Train Steps: 20/90 Loss: 0.0435 torch.Size([8, 600, 800])
  16339. torch.Size([8, 8])
  16340. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  16341. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  16342. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  16343. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  16344. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  16345. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  16346. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  16347. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991]],
  16348. device='cuda:0', dtype=torch.float64)
  16349. predictions are: tensor([[ 0.5395, -0.4382, 1.1486, -1.2259, -0.4905, -0.8644, 0.3337, 0.1198],
  16350. [ 0.6198, -0.3472, 1.6669, -0.0291, -0.5057, -0.2221, 0.2427, 0.3126],
  16351. [ 0.4126, -0.5339, 1.4331, -1.0436, -0.2162, -1.1185, 0.6102, 0.1433],
  16352. [ 0.5501, -0.4162, 1.8176, -0.2285, -0.5117, 0.0819, 0.6617, 0.2014],
  16353. [ 0.6478, -0.3610, 1.6992, 0.5170, -0.4537, 0.1087, 0.4591, 0.1850],
  16354. [ 0.1851, -0.6295, 1.3142, -0.7649, -0.5219, -0.7357, -0.0488, 0.2572],
  16355. [ 0.2418, -0.6364, 1.9933, 0.0325, -0.2490, -0.7881, 0.7903, 0.2832],
  16356. [-0.4642, -1.0908, 1.9517, -0.5161, -0.0796, -0.6657, 1.0323, 0.3870]],
  16357. device='cuda:0', grad_fn=<AddmmBackward>)
  16358. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  16359. 0.0562],
  16360. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  16361. 0.2853],
  16362. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  16363. 0.1193],
  16364. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  16365. 0.0985],
  16366. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  16367. -0.1331],
  16368. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  16369. 0.2776],
  16370. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  16371. 0.3692],
  16372. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  16373. 0.4814]]], device='cuda:0')
  16374. loss_train_step before backward: tensor(0.0475, device='cuda:0', grad_fn=<MseLossBackward>)
  16375. loss_train_step after backward: tensor(0.0475, device='cuda:0', grad_fn=<MseLossBackward>)
  16376. loss_train: 0.9181526629254222
  16377. step: 21
  16378. running loss: 0.04372155537740106
  16379. Train Steps: 21/90 Loss: 0.0437 torch.Size([8, 600, 800])
  16380. torch.Size([8, 8])
  16381. tensor([[0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  16382. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  16383. [0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  16384. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  16385. [0.6205, 0.4081, 0.8950, 0.4017, 0.3788, 0.4700, 0.5963, 0.5667],
  16386. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  16387. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  16388. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356]],
  16389. device='cuda:0', dtype=torch.float64)
  16390. predictions are: tensor([[ 0.0581, -0.7464, 1.3099, -1.2809, -0.1847, -1.5320, 0.3973, 0.1047],
  16391. [ 0.4789, -0.4865, 2.0377, 0.2317, -0.4262, 0.3754, 0.9245, 0.2274],
  16392. [ 0.2831, -0.5276, 1.3031, -0.8277, -0.5686, -0.3106, 0.3127, 0.3282],
  16393. [-0.0833, -0.8177, 1.0154, -1.2084, -0.3860, -1.3190, 0.2106, 0.2604],
  16394. [ 0.7950, -0.2507, 1.9152, -0.1057, -0.5803, 0.0395, 0.5121, 0.2700],
  16395. [ 0.3878, -0.5124, 1.9157, 0.1641, -0.0578, 0.0620, 0.4092, 0.2649],
  16396. [ 0.6601, -0.3920, 1.8787, 0.6277, -0.4979, 0.0237, 0.6823, 0.2055],
  16397. [ 0.4764, -0.4623, 1.5466, -0.8331, -0.2431, -1.1635, 0.6208, 0.2329]],
  16398. device='cuda:0', grad_fn=<AddmmBackward>)
  16399. landmarks are: tensor([[[ 5.8284e-01, -4.4175e-01, 1.2476e+00, -1.3929e+00, -1.7275e-01,
  16400. -1.5700e+00, 4.6937e-01, -2.4798e-02],
  16401. [ 6.0260e-01, -4.4175e-01, 1.8654e+00, -8.4219e-02, -4.4411e-01,
  16402. 2.6220e-01, 9.2654e-01, 1.5543e-01],
  16403. [ 5.5087e-01, -3.7983e-01, 1.2129e+00, -8.6944e-01, -6.9815e-01,
  16404. -2.6128e-01, 3.8302e-01, 1.1931e-01],
  16405. [ 5.2315e-01, -4.1886e-01, 9.3580e-01, -1.4006e+00, -3.9215e-01,
  16406. -1.3698e+00, 2.5553e-01, 2.9064e-01],
  16407. [ 5.7991e-01, -4.0115e-01, 1.8480e+00, -4.3064e-01, -5.3649e-01,
  16408. -1.1501e-01, 4.6813e-01, 3.3149e-01],
  16409. [ 5.3712e-01, -4.2517e-01, 1.7037e+00, -6.8822e-02, -3.4180e-02,
  16410. 6.2048e-02, 3.7575e-01, 2.8530e-01],
  16411. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  16412. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  16413. [ 6.1742e-01, -4.2249e-01, 1.4975e+00, -1.1709e+00, -3.1736e-01,
  16414. -1.1806e+00, 6.5391e-01, 1.8793e-01]]], device='cuda:0')
  16415. loss_train_step before backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  16416. loss_train_step after backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  16417. loss_train: 0.9488857751712203
  16418. step: 22
  16419. running loss: 0.043131171598691835
  16420. Train Steps: 22/90 Loss: 0.0431 torch.Size([8, 600, 800])
  16421. torch.Size([8, 8])
  16422. tensor([[0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947],
  16423. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  16424. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  16425. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  16426. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  16427. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  16428. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  16429. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567]],
  16430. device='cuda:0', dtype=torch.float64)
  16431. predictions are: tensor([[ 0.4515, -0.4720, 1.4325, -1.0735, -0.0188, -1.3452, 0.6986, 0.1841],
  16432. [ 0.6504, -0.3483, 1.7911, -0.2205, -0.5954, -0.4333, 0.2837, 0.1217],
  16433. [ 0.1686, -0.6797, 1.4327, -0.8897, -0.3231, -1.0884, 0.6743, 0.1728],
  16434. [ 0.2799, -0.5739, 1.7917, 0.1795, -0.2080, 0.2609, 0.3030, 0.1324],
  16435. [ 0.0126, -0.7755, 1.7338, -0.6765, -0.5620, -0.7782, 0.6809, 0.1863],
  16436. [ 0.5867, -0.3887, 1.3940, -0.7872, -0.4405, -0.8869, 0.5255, 0.3176],
  16437. [ 0.5458, -0.4143, 1.7265, -0.0424, -0.4915, -0.1369, 0.3132, 0.2854],
  16438. [ 0.4597, -0.4834, 1.8259, 0.0604, -0.1184, 0.2290, 0.6608, 0.2708]],
  16439. device='cuda:0', grad_fn=<AddmmBackward>)
  16440. landmarks are: tensor([[[ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  16441. -1.5777e+00, 6.0099e-01, -9.2270e-04],
  16442. [ 5.5953e-01, -3.9877e-01, 1.7672e+00, -4.4604e-01, -5.5381e-01,
  16443. -5.3841e-01, 8.2802e-02, -3.0981e-02],
  16444. [ 5.8851e-01, -4.4288e-01, 1.4266e+00, -9.9261e-01, -4.3834e-01,
  16445. -1.2313e+00, 4.2276e-01, 1.1948e-01],
  16446. [ 5.5155e-01, -4.2249e-01, 1.7788e+00, -5.3426e-02, -2.0162e-01,
  16447. 1.9292e-01, 1.5683e-01, 6.8210e-02],
  16448. [ 5.7991e-01, -4.3295e-01, 1.7210e+00, -7.6936e-01, -5.7113e-01,
  16449. -8.7714e-01, 3.9885e-01, 7.7444e-02],
  16450. [ 5.8747e-01, -3.8876e-01, 1.3111e+00, -8.8483e-01, -4.6143e-01,
  16451. -9.8491e-01, 5.2009e-01, 2.6220e-01],
  16452. [ 5.4405e-01, -3.9969e-01, 1.7326e+00, -2.2279e-01, -4.4411e-01,
  16453. -2.9207e-01, 2.9551e-02, 2.4088e-01],
  16454. [ 5.5978e-01, -4.2731e-01, 1.7152e+00, -1.2271e-01, -6.4698e-03,
  16455. 1.9169e-01, 5.1432e-01, 2.8530e-01]]], device='cuda:0')
  16456. loss_train_step before backward: tensor(0.0256, device='cuda:0', grad_fn=<MseLossBackward>)
  16457. loss_train_step after backward: tensor(0.0256, device='cuda:0', grad_fn=<MseLossBackward>)
  16458. loss_train: 0.974448068998754
  16459. step: 23
  16460. running loss: 0.042367307347771915
  16461.  
  16462. Train Steps: 23/90 Loss: 0.0424 torch.Size([8, 600, 800])
  16463. torch.Size([8, 8])
  16464. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  16465. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  16466. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  16467. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  16468. [0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  16469. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  16470. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  16471. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679]],
  16472. device='cuda:0', dtype=torch.float64)
  16473. predictions are: tensor([[ 0.5464, -0.4343, 1.5575, -0.8826, -0.4123, -0.6552, 0.5500, 0.2263],
  16474. [ 0.8880, -0.2405, 1.9189, -0.1182, -0.5029, -0.3676, 0.4924, 0.2121],
  16475. [ 0.0587, -0.7420, 0.9993, -1.1595, -0.2452, -1.3513, 0.2003, 0.2672],
  16476. [ 0.3428, -0.5721, 1.6978, -0.4107, -0.5528, -0.2838, 0.3479, 0.0575],
  16477. [ 0.1762, -0.6208, 1.4553, -0.6422, -0.3622, -0.7972, 0.3625, 0.3719],
  16478. [ 0.4635, -0.4896, 1.5542, -0.8813, -0.2341, -1.0112, 0.6000, 0.1013],
  16479. [ 0.6053, -0.4251, 1.9318, -0.4953, -0.3275, -0.9114, 0.6566, 0.1574],
  16480. [ 0.3713, -0.5982, 1.8847, 0.3658, -0.2720, 0.4730, 0.9611, 0.2410]],
  16481. device='cuda:0', grad_fn=<AddmmBackward>)
  16482. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  16483. 0.2699],
  16484. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  16485. 0.1544],
  16486. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  16487. 0.3007],
  16488. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  16489. 0.0021],
  16490. [ 0.5935, -0.3558, 1.3284, -0.6924, -0.5249, -0.9618, 0.3353,
  16491. 0.3084],
  16492. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  16493. 0.1929],
  16494. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  16495. 0.1544],
  16496. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  16497. 0.3371]]], device='cuda:0')
  16498. loss_train_step before backward: tensor(0.0266, device='cuda:0', grad_fn=<MseLossBackward>)
  16499. loss_train_step after backward: tensor(0.0266, device='cuda:0', grad_fn=<MseLossBackward>)
  16500. loss_train: 1.001086718402803
  16501. step: 24
  16502. running loss: 0.04171194660011679
  16503. Train Steps: 24/90 Loss: 0.0417 torch.Size([8, 600, 800])
  16504. torch.Size([8, 8])
  16505. tensor([[0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  16506. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  16507. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  16508. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  16509. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  16510. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  16511. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  16512. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200]],
  16513. device='cuda:0', dtype=torch.float64)
  16514. predictions are: tensor([[ 0.1870, -0.6556, 1.0506, -1.2502, -0.2470, -1.4751, 0.2263, 0.1088],
  16515. [ 0.9500, -0.1776, 1.8741, -0.2319, -0.6673, -0.1799, 0.6115, 0.2558],
  16516. [ 0.5001, -0.4606, 1.8854, 0.0563, -0.1951, 0.3606, 0.6289, 0.2175],
  16517. [ 0.3553, -0.5747, 1.8311, -0.1599, -0.5016, 0.1822, 0.3915, 0.0840],
  16518. [ 0.4626, -0.5170, 1.5021, -1.0981, -0.1401, -1.4030, 0.7077, 0.1556],
  16519. [ 0.5643, -0.4305, 1.2420, -1.1086, -0.3508, -1.2393, 0.2733, 0.1198],
  16520. [ 0.5204, -0.5165, 1.8178, 0.2130, -0.5849, -0.0536, 0.5791, 0.3442],
  16521. [ 0.3039, -0.5933, 1.8124, -0.8292, -0.2101, -1.0178, 0.6856, 0.2138]],
  16522. device='cuda:0', grad_fn=<AddmmBackward>)
  16523. landmarks are: tensor([[[ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  16524. 0.0261],
  16525. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  16526. 0.1929],
  16527. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  16528. 0.2237],
  16529. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  16530. 0.0231],
  16531. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  16532. 0.1467],
  16533. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  16534. 0.0774],
  16535. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  16536. 0.5239],
  16537. [ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  16538. 0.1159]]], device='cuda:0')
  16539. loss_train_step before backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  16540. loss_train_step after backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  16541. loss_train: 1.0197177669033408
  16542. step: 25
  16543. running loss: 0.040788710676133634
  16544. Train Steps: 25/90 Loss: 0.0408 torch.Size([8, 600, 800])
  16545. torch.Size([8, 8])
  16546. tensor([[0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385],
  16547. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  16548. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  16549. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  16550. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  16551. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  16552. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  16553. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388]],
  16554. device='cuda:0', dtype=torch.float64)
  16555. predictions are: tensor([[ 0.6903, -0.3480, 1.6033, -1.1603, -0.2271, -1.2476, 0.8479, 0.1206],
  16556. [ 0.9546, -0.2341, 1.9506, -0.1557, -0.5827, -0.3543, 0.8376, 0.1278],
  16557. [ 0.7325, -0.3103, 1.4645, -1.0865, -0.5483, -0.8621, 0.4646, 0.2128],
  16558. [ 0.9658, -0.1793, 1.7586, 0.3576, -0.2545, -0.2151, 0.4456, 0.2952],
  16559. [ 0.6139, -0.3888, 1.7524, 0.0334, -0.2684, 0.1579, 0.3302, 0.1551],
  16560. [ 0.9975, -0.1532, 1.7208, -0.8041, -0.6586, -0.6190, 0.5044, 0.1213],
  16561. [-1.4734, -1.7306, 1.0105, -1.3044, -0.3757, -1.4271, 0.1577, 0.2327],
  16562. [ 0.5141, -0.4748, 1.8513, -0.0350, -0.0525, -0.0404, 0.2714, 0.1178]],
  16563. device='cuda:0', grad_fn=<AddmmBackward>)
  16564. landmarks are: tensor([[[ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  16565. 0.2012],
  16566. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  16567. 0.1768],
  16568. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  16569. 0.3392],
  16570. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  16571. 0.4470],
  16572. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  16573. 0.2386],
  16574. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  16575. 0.1753],
  16576. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  16577. 0.2006],
  16578. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  16579. 0.2026]]], device='cuda:0')
  16580. loss_train_step before backward: tensor(0.0308, device='cuda:0', grad_fn=<MseLossBackward>)
  16581. loss_train_step after backward: tensor(0.0308, device='cuda:0', grad_fn=<MseLossBackward>)
  16582. loss_train: 1.0505003025755286
  16583. step: 26
  16584. running loss: 0.04040385779136649
  16585. Train Steps: 26/90 Loss: 0.0404 torch.Size([8, 600, 800])
  16586. torch.Size([8, 8])
  16587. tensor([[0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  16588. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  16589. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  16590. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  16591. [0.6182, 0.3998, 0.8793, 0.4191, 0.3552, 0.4285, 0.6038, 0.5312],
  16592. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  16593. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  16594. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852]],
  16595. device='cuda:0', dtype=torch.float64)
  16596. predictions are: tensor([[ 0.3545, -0.5765, 1.8130, -0.4768, -0.5115, -0.0557, 0.6404, 0.3101],
  16597. [ 0.8690, -0.2657, 1.8614, -0.3410, -0.3643, -1.1425, 0.4606, -0.0299],
  16598. [ 0.5647, -0.4242, 1.6549, -0.8860, -0.5752, -0.6408, 0.4819, 0.1474],
  16599. [ 0.5902, -0.3918, 1.2179, -1.2495, -0.3850, -1.0606, 0.3993, 0.0960],
  16600. [ 0.7421, -0.3249, 1.7175, -0.5679, -0.5654, -0.3985, 0.4766, 0.1935],
  16601. [ 0.3850, -0.5400, 1.6495, -1.0489, -0.2069, -1.1659, 0.7564, 0.1570],
  16602. [ 0.6308, -0.3960, 1.5943, 0.2649, -0.3435, -0.1843, 0.4090, 0.3099],
  16603. [ 0.4256, -0.5386, 1.7622, -0.0179, -0.1365, -0.0189, 0.2498, 0.2253]],
  16604. device='cuda:0', grad_fn=<AddmmBackward>)
  16605. landmarks are: tensor([[[ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  16606. 0.5085],
  16607. [ 0.6116, -0.3898, 1.8654, -0.1997, -0.4788, -1.1081, 0.4367,
  16608. -0.0637],
  16609. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  16610. 0.2622],
  16611. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  16612. 0.1390],
  16613. [ 0.5697, -0.4393, 1.7754, -0.3503, -0.6453, -0.3067, 0.5028,
  16614. 0.1677],
  16615. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  16616. 0.2050],
  16617. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  16618. 0.5239],
  16619. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  16620. 0.4171]]], device='cuda:0')
  16621. loss_train_step before backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  16622.  
  16623. loss_train_step after backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  16624. loss_train: 1.0623777024447918
  16625. step: 27
  16626. running loss: 0.039347322312770064
  16627. Train Steps: 27/90 Loss: 0.0393 torch.Size([8, 600, 800])
  16628. torch.Size([8, 8])
  16629. tensor([[0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  16630. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  16631. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  16632. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  16633. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700],
  16634. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  16635. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  16636. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823]],
  16637. device='cuda:0', dtype=torch.float64)
  16638. predictions are: tensor([[ 1.0085, -0.1871, 1.8592, -0.1330, -0.5335, -0.2461, 0.5151, 0.1121],
  16639. [ 0.3415, -0.6384, 1.7394, -0.0560, -0.5300, -0.2992, 0.4617, 0.3580],
  16640. [ 0.3285, -0.5683, 1.3489, -1.0629, -0.3567, -1.1883, 0.1364, 0.1996],
  16641. [ 0.9330, -0.2222, 1.7962, -0.3420, -0.4949, -0.8077, 0.4360, 0.1853],
  16642. [ 0.1978, -0.6507, 1.7339, -0.5420, -0.4382, 0.2163, 0.6497, 0.2670],
  16643. [ 0.5605, -0.4510, 1.8137, -0.1079, -0.2602, 0.0344, 0.3814, 0.2185],
  16644. [ 0.6950, -0.3404, 1.2603, -1.1607, -0.5204, -0.9337, 0.4292, 0.1559],
  16645. [ 0.6403, -0.3981, 1.6608, -1.2186, -0.1359, -1.5327, 0.6665, -0.0350]],
  16646. device='cuda:0', grad_fn=<AddmmBackward>)
  16647. landmarks are: tensor([[[ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  16648. 0.1159],
  16649. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  16650. 0.5239],
  16651. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  16652. 0.3700],
  16653. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  16654. 0.2699],
  16655. [ 0.5671, -0.3988, 1.7499, -0.4614, -0.5423, 0.3007, 0.5894,
  16656. 0.3469],
  16657. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  16658. 0.3084],
  16659. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  16660. 0.3007],
  16661. [ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  16662. -0.0583]]], device='cuda:0')
  16663. loss_train_step before backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  16664. loss_train_step after backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  16665. loss_train: 1.081544168293476
  16666. step: 28
  16667. running loss: 0.03862657743905272
  16668. Train Steps: 28/90 Loss: 0.0386 torch.Size([8, 600, 800])
  16669. torch.Size([8, 8])
  16670. tensor([[0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  16671. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  16672. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  16673. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  16674. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  16675. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  16676. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  16677. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783]],
  16678. device='cuda:0', dtype=torch.float64)
  16679. predictions are: tensor([[ 7.0282e-01, -3.5619e-01, 1.7135e+00, -4.1727e-02, -3.3237e-01,
  16680. 1.0901e-02, 6.6772e-01, 2.1084e-01],
  16681. [ 3.8480e-01, -5.4974e-01, 1.7183e+00, -4.0325e-01, -5.3389e-01,
  16682. -2.2765e-01, 2.6194e-01, 2.6075e-01],
  16683. [ 7.6077e-01, -3.0297e-01, 1.5522e+00, -1.4613e+00, -3.3689e-01,
  16684. -1.3400e+00, 7.1667e-01, 7.7529e-02],
  16685. [ 7.0844e-01, -3.7311e-01, 1.6807e+00, 2.1612e-01, -2.8488e-01,
  16686. -1.6373e-01, 1.3775e-01, 1.9161e-01],
  16687. [ 9.8953e-01, -1.7994e-01, 1.8835e+00, -4.4454e-01, -4.4358e-01,
  16688. -1.2113e+00, 4.9894e-01, 5.9100e-02],
  16689. [ 2.3141e-01, -6.8316e-01, 1.7980e+00, -3.3082e-01, -5.0640e-01,
  16690. 9.5241e-05, 7.1420e-01, 2.7764e-01],
  16691. [ 4.2223e-01, -5.0048e-01, 1.6832e+00, -6.2590e-01, -5.5156e-01,
  16692. -1.7219e-01, 3.4742e-01, 2.4207e-01],
  16693. [ 7.0103e-01, -3.0725e-01, 9.7545e-01, -1.3389e+00, -4.3456e-01,
  16694. -1.3520e+00, 1.6919e-01, 2.4624e-01]], device='cuda:0',
  16695. grad_fn=<AddmmBackward>)
  16696. landmarks are: tensor([[[ 6.0425e-01, -4.2731e-01, 1.6920e+00, 1.8595e-01, -2.7171e-01,
  16697. 1.4059e-01, 7.9965e-01, 1.0043e-01],
  16698. [ 5.3684e-01, -4.4057e-01, 1.7730e+00, -1.7660e-01, -5.2494e-01,
  16699. -5.3426e-02, 2.3141e-01, 3.4688e-01],
  16700. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  16701. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  16702. [ 5.1928e-01, -4.6990e-01, 1.5767e+00, 4.0077e-01, -2.4203e-01,
  16703. 7.7444e-02, 1.1776e-01, -6.1038e-02],
  16704. [ 6.1161e-01, -3.8976e-01, 1.8654e+00, -1.9969e-01, -4.7875e-01,
  16705. -1.1081e+00, 4.3668e-01, -6.3661e-02],
  16706. [ 5.9436e-01, -4.4897e-01, 1.8643e+00, -6.5918e-02, -5.1472e-01,
  16707. 1.2348e-01, 7.6842e-01, 1.0043e-01],
  16708. [ 5.5456e-01, -4.6205e-01, 1.7788e+00, -4.2294e-01, -5.1917e-01,
  16709. -2.2633e-02, 4.2771e-01, 2.4681e-01],
  16710. [ 5.4827e-01, -3.9908e-01, 8.0300e-01, -1.2159e+00, -5.0185e-01,
  16711. -1.1928e+00, 2.6243e-01, 3.8516e-01]]], device='cuda:0')
  16712. loss_train_step before backward: tensor(0.0218, device='cuda:0', grad_fn=<MseLossBackward>)
  16713. loss_train_step after backward: tensor(0.0218, device='cuda:0', grad_fn=<MseLossBackward>)
  16714. loss_train: 1.1033018305897713
  16715. step: 29
  16716. running loss: 0.03804489070999211
  16717. Train Steps: 29/90 Loss: 0.0380 torch.Size([8, 600, 800])
  16718. torch.Size([8, 8])
  16719. tensor([[0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  16720. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  16721. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  16722. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  16723. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  16724. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  16725. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700],
  16726. [0.6339, 0.4102, 0.8588, 0.3133, 0.4425, 0.2117, 0.6417, 0.5089]],
  16727. device='cuda:0', dtype=torch.float64)
  16728. predictions are: tensor([[ 0.9041, -0.2328, 1.4413, -1.2928, -0.3322, -1.1886, 0.6267, 0.0711],
  16729. [ 0.7592, -0.2912, 1.6034, -0.9775, -0.1320, -1.3031, 0.6796, 0.1741],
  16730. [-1.2913, -1.6136, 0.9918, -1.1419, -0.4308, -1.3234, 0.0654, 0.2949],
  16731. [ 0.8360, -0.2591, 1.3810, -0.9939, -0.5174, -1.0080, 0.2762, 0.1503],
  16732. [ 0.7807, -0.3532, 1.7547, 0.2277, -0.4817, 0.1521, 0.4084, 0.1783],
  16733. [ 0.7861, -0.2807, 1.6459, -0.4515, -0.6758, -0.4393, 0.1187, 0.3166],
  16734. [ 0.4825, -0.4640, 1.7166, -0.4412, -0.5613, 0.3670, 0.6141, 0.3111],
  16735. [ 0.8659, -0.2588, 1.6902, -0.7670, -0.2796, -1.1250, 0.6830, 0.1375]],
  16736. device='cuda:0', grad_fn=<AddmmBackward>)
  16737. landmarks are: tensor([[[ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  16738. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  16739. [ 6.4707e-01, -3.8397e-01, 1.5767e+00, -1.0311e+00, -4.5727e-02,
  16740. -1.5007e+00, 6.8892e-01, 1.0199e-01],
  16741. [-2.2859e+00, -2.2859e+00, 1.0712e+00, -1.2085e+00, -3.8060e-01,
  16742. -1.3929e+00, 7.5520e-02, 2.0062e-01],
  16743. [ 5.7985e-01, -4.1555e-01, 1.3977e+00, -1.0388e+00, -4.6721e-01,
  16744. -1.1004e+00, 3.4688e-01, 1.0824e-01],
  16745. [ 5.7673e-01, -4.3957e-01, 1.6782e+00, 1.9046e-01, -3.8437e-01,
  16746. 3.0841e-02, 4.5876e-01, 8.5521e-02],
  16747. [ 5.5813e-01, -3.9120e-01, 1.6460e+00, -5.2302e-01, -6.1732e-01,
  16748. -5.9230e-01, 6.8107e-02, 4.3475e-01],
  16749. [ 5.6715e-01, -3.9885e-01, 1.7499e+00, -4.6143e-01, -5.4226e-01,
  16750. 3.0069e-01, 5.8938e-01, 3.4688e-01],
  16751. [ 6.4212e-01, -3.9120e-01, 1.6806e+00, -8.3865e-01, -2.4203e-01,
  16752. -1.3082e+00, 6.7795e-01, 6.4585e-02]]], device='cuda:0')
  16753. loss_train_step before backward: tensor(0.0340, device='cuda:0', grad_fn=<MseLossBackward>)
  16754. loss_train_step after backward: tensor(0.0340, device='cuda:0', grad_fn=<MseLossBackward>)
  16755. loss_train: 1.1373316459357738
  16756. step: 30
  16757. running loss: 0.0379110548645258
  16758.  
  16759. Train Steps: 30/90 Loss: 0.0379 torch.Size([8, 600, 800])
  16760. torch.Size([8, 8])
  16761. tensor([[0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  16762. [0.6192, 0.3980, 0.7078, 0.2750, 0.4250, 0.2100, 0.5450, 0.5783],
  16763. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  16764. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  16765. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  16766. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  16767. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  16768. [0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533]],
  16769. device='cuda:0', dtype=torch.float64)
  16770. predictions are: tensor([[ 0.9908, -0.1592, 1.7502, -0.3743, -0.6669, -0.1327, 0.2648, 0.2209],
  16771. [-0.1769, -0.8809, 1.1025, -1.1944, -0.3271, -1.3661, 0.1683, 0.3038],
  16772. [-0.9808, -1.4234, 1.6078, -1.3676, 0.0597, -1.3673, 0.7059, 0.2835],
  16773. [-1.0429, -1.4503, 0.9365, -1.3842, -0.4058, -1.4962, 0.0476, 0.3043],
  16774. [ 1.3095, 0.0057, 1.8528, 0.1808, -0.6550, -0.1029, 0.3944, 0.2550],
  16775. [ 1.3513, 0.0706, 1.4051, -1.2822, -0.5891, -1.0075, 0.4432, -0.0362],
  16776. [ 1.3579, 0.0215, 1.8816, 0.1004, -0.4905, 0.3744, 0.8456, 0.2072],
  16777. [ 1.0344, -0.1677, 1.8004, 0.2043, -0.4927, -0.0642, 0.3500, 0.2197]],
  16778. device='cuda:0', grad_fn=<AddmmBackward>)
  16779. landmarks are: tensor([[[ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  16780. 0.3267],
  16781. [ 0.5742, -0.4474, 0.9834, -1.0159, -0.3229, -1.3159, 0.2314,
  16782. 0.3854],
  16783. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  16784. 0.3104],
  16785. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  16786. 0.2699],
  16787. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  16788. 0.3161],
  16789. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  16790. -0.0108],
  16791. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  16792. 0.3371],
  16793. [ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  16794. 0.2699]]], device='cuda:0')
  16795. loss_train_step before backward: tensor(0.1383, device='cuda:0', grad_fn=<MseLossBackward>)
  16796. loss_train_step after backward: tensor(0.1383, device='cuda:0', grad_fn=<MseLossBackward>)
  16797. loss_train: 1.2756343595683575
  16798. step: 31
  16799. running loss: 0.04114949546994701
  16800. Train Steps: 31/90 Loss: 0.0411 torch.Size([8, 600, 800])
  16801. torch.Size([8, 8])
  16802. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  16803. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  16804. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  16805. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  16806. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  16807. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  16808. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  16809. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166]],
  16810. device='cuda:0', dtype=torch.float64)
  16811. predictions are: tensor([[ 0.7756, -0.2943, 1.5082, -1.1577, -0.5133, -0.9230, 0.4684, 0.1807],
  16812. [ 0.3804, -0.5261, 0.9433, -1.4339, -0.4707, -1.3062, 0.1094, 0.1210],
  16813. [ 0.6888, -0.3697, 1.7758, -0.6519, -0.3946, -1.1142, 0.5529, 0.1363],
  16814. [ 0.6840, -0.3646, 1.5596, 0.2019, -0.4157, -0.2509, 0.2369, 0.3986],
  16815. [ 0.8092, -0.3029, 1.7801, -0.0520, -0.4425, -0.0876, 0.3524, 0.1252],
  16816. [ 0.6672, -0.3370, 1.2757, -1.0965, -0.4721, -1.1377, 0.3404, 0.3186],
  16817. [ 0.3779, -0.5995, 1.8432, -0.2514, -0.4791, 0.1413, 0.7156, 0.2372],
  16818. [ 0.3615, -0.6130, 1.7762, -0.2651, -0.5145, 0.0278, 0.5792, 0.2315]],
  16819. device='cuda:0', grad_fn=<AddmmBackward>)
  16820. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  16821. 0.2699],
  16822. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  16823. 0.0712],
  16824. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  16825. 0.2035],
  16826. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  16827. 0.5239],
  16828. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  16829. 0.1005],
  16830. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  16831. 0.5624],
  16832. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  16833. 0.1554],
  16834. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  16835. 0.1004]]], device='cuda:0')
  16836. loss_train_step before backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  16837. loss_train_step after backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  16838. loss_train: 1.2920843735337257
  16839. step: 32
  16840. running loss: 0.04037763667292893
  16841. Train Steps: 32/90 Loss: 0.0404 torch.Size([8, 600, 800])
  16842. torch.Size([8, 8])
  16843. tensor([[0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  16844. [0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  16845. [0.6177, 0.4086, 0.8738, 0.3950, 0.3775, 0.5600, 0.6225, 0.5700],
  16846. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  16847. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  16848. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  16849. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  16850. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938]],
  16851. device='cuda:0', dtype=torch.float64)
  16852. predictions are: tensor([[ 0.7272, -0.3183, 1.7046, -0.5656, -0.4559, -1.0896, 0.1794, 0.1725],
  16853. [ 0.4934, -0.5156, 1.8159, -0.1265, -0.5439, -0.0894, 0.4923, 0.2124],
  16854. [ 0.6612, -0.3344, 1.7433, -0.5302, -0.4852, 0.2510, 0.5717, 0.3081],
  16855. [ 0.7566, -0.2804, 1.0319, -1.3667, -0.4885, -1.1770, 0.3090, 0.1345],
  16856. [ 0.6595, -0.3936, 1.5598, 0.0052, -0.4803, -0.1097, 0.5725, 0.2791],
  16857. [-0.9094, -1.3789, 1.0018, -1.3468, -0.2830, -1.5701, 0.1808, 0.3358],
  16858. [ 0.7135, -0.3099, 1.2355, -1.1843, -0.5799, -0.8957, 0.4245, 0.2362],
  16859. [ 0.8254, -0.3237, 1.8059, 0.2547, -0.4740, -0.2230, 0.5220, 0.1259]],
  16860. device='cuda:0', grad_fn=<AddmmBackward>)
  16861. landmarks are: tensor([[[ 5.4850e-01, -4.2094e-01, 1.6691e+00, -4.1524e-01, -5.2494e-01,
  16862. -1.1081e+00, 7.2521e-02, 2.0831e-03],
  16863. [ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  16864. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  16865. [ 5.6715e-01, -3.9885e-01, 1.7499e+00, -4.6143e-01, -5.4226e-01,
  16866. 3.0069e-01, 5.8938e-01, 3.4688e-01],
  16867. [ 5.0531e-01, -4.2810e-01, 8.9538e-01, -1.3698e+00, -5.4226e-01,
  16868. -1.1389e+00, 2.4525e-01, 8.6245e-02],
  16869. [ 6.2895e-01, -4.3453e-01, 1.3794e+00, 3.6792e-01, -4.8453e-01,
  16870. 3.8953e-02, 9.2654e-01, 1.9283e-01],
  16871. [-2.2859e+00, -2.2859e+00, 6.7598e-01, -1.4083e+00, -3.2864e-01,
  16872. -1.4160e+00, 2.4873e-01, 3.4688e-01],
  16873. [ 5.4660e-01, -4.0805e-01, 1.0668e+00, -1.1764e+00, -6.2887e-01,
  16874. -7.6166e-01, 4.8545e-01, 3.0069e-01],
  16875. [ 6.3949e-01, -4.2132e-01, 1.7037e+00, 3.6228e-01, -4.3256e-01,
  16876. -1.0731e-01, 6.5602e-01, -4.8817e-03]]], device='cuda:0')
  16877. loss_train_step before backward: tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward>)
  16878. loss_train_step after backward: tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward>)
  16879. loss_train: 1.3506991527974606
  16880. step: 33
  16881. running loss: 0.0409302773574988
  16882. Train Steps: 33/90 Loss: 0.0409 torch.Size([8, 600, 800])
  16883. torch.Size([8, 8])
  16884. tensor([[0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  16885. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  16886. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  16887. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  16888. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  16889. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  16890. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  16891. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364]],
  16892. device='cuda:0', dtype=torch.float64)
  16893. predictions are: tensor([[ 0.3825, -0.5192, 1.5531, -0.5483, -0.5774, -0.2306, 0.2690, 0.1452],
  16894. [ 0.3526, -0.5745, 1.5906, 0.1417, -0.4948, -0.4045, 0.2288, 0.1579],
  16895. [ 0.5171, -0.4502, 1.0703, -1.4119, -0.5305, -1.0881, 0.4877, 0.2627],
  16896. [ 0.4865, -0.4936, 1.6517, -0.4755, -0.5666, -0.7995, 0.4503, 0.1849],
  16897. [ 0.8655, -0.1874, 1.4872, -0.2307, -0.6180, -0.7052, 0.3166, 0.3255],
  16898. [ 0.4165, -0.5100, 1.6322, -0.2517, -0.3476, -0.0160, 0.4465, 0.2920],
  16899. [ 0.4606, -0.5201, 1.6801, -0.0939, -0.3939, 0.0481, 0.4526, 0.2095],
  16900. [ 0.4394, -0.4942, 1.3631, -1.2998, -0.2485, -1.3518, 0.7349, 0.1318]],
  16901. device='cuda:0', grad_fn=<AddmmBackward>)
  16902. landmarks are: tensor([[[ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  16903. 0.0502],
  16904. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  16905. -0.0370],
  16906. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  16907. 0.3007],
  16908. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  16909. 0.2203],
  16910. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  16911. 0.4393],
  16912. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  16913. 0.3084],
  16914. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  16915. 0.0390],
  16916. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  16917. 0.1917]]], device='cuda:0')
  16918. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  16919.  
  16920. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  16921. loss_train: 1.3644524635747075
  16922. step: 34
  16923. running loss: 0.04013095481102081
  16924. Train Steps: 34/90 Loss: 0.0401 torch.Size([8, 600, 800])
  16925. torch.Size([8, 8])
  16926. tensor([[0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  16927. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  16928. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  16929. [0.6110, 0.4047, 0.8700, 0.4483, 0.3713, 0.3967, 0.5088, 0.5517],
  16930. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  16931. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  16932. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  16933. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544]],
  16934. device='cuda:0', dtype=torch.float64)
  16935. predictions are: tensor([[ 0.5411, -0.4536, 1.7278, -0.3899, -0.5399, -0.1135, 0.6217, 0.1842],
  16936. [ 0.3986, -0.5291, 1.6807, -0.3776, -0.6092, -0.5501, 0.3713, 0.1663],
  16937. [ 0.6661, -0.3267, 1.3198, -0.6602, -0.6227, -0.4715, 0.1822, 0.1441],
  16938. [ 0.3818, -0.5150, 1.5559, -0.4041, -0.6201, -0.5724, 0.1614, 0.2175],
  16939. [ 0.3520, -0.6014, 1.6483, 0.0400, -0.4569, -0.2901, 0.5195, 0.1823],
  16940. [ 0.7070, -0.3190, 1.6861, -0.3544, -0.1871, 0.0213, 0.5974, 0.2302],
  16941. [ 0.5853, -0.4072, 1.4730, 0.1342, -0.3969, -0.3106, 0.5202, 0.4160],
  16942. [ 0.1553, -0.6436, 0.8552, -1.3981, -0.4279, -1.4607, 0.2782, 0.2042]],
  16943. device='cuda:0', grad_fn=<AddmmBackward>)
  16944. landmarks are: tensor([[[ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  16945. 0.1775],
  16946. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  16947. 0.0774],
  16948. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  16949. 0.1552],
  16950. [ 0.5363, -0.4168, 1.7326, -0.2151, -0.5711, -0.4537, 0.0640,
  16951. 0.2622],
  16952. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  16953. 0.1979],
  16954. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  16955. 0.2699],
  16956. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  16957. 0.5239],
  16958. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  16959. 0.2747]]], device='cuda:0')
  16960. loss_train_step before backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  16961. loss_train_step after backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  16962. loss_train: 1.3845558362081647
  16963. step: 35
  16964. running loss: 0.03955873817737613
  16965. Train Steps: 35/90 Loss: 0.0396 torch.Size([8, 600, 800])
  16966. torch.Size([8, 8])
  16967. tensor([[0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297],
  16968. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  16969. [0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915],
  16970. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  16971. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  16972. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  16973. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  16974. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917]],
  16975. device='cuda:0', dtype=torch.float64)
  16976. predictions are: tensor([[ 0.2897, -0.6276, 1.5647, -0.0474, -0.4891, -0.2550, 0.5759, 0.1923],
  16977. [ 0.5408, -0.4012, 1.5358, 0.0289, -0.3157, -0.0208, 0.1720, 0.2009],
  16978. [ 0.5524, -0.4431, 1.6840, -0.4082, -0.5403, -0.9415, 0.4238, 0.0553],
  16979. [ 0.4974, -0.4879, 1.6445, -0.0998, -0.4748, -0.0273, 0.3334, 0.1735],
  16980. [ 0.5754, -0.4577, 1.6794, -0.2655, -0.5683, -0.5576, 0.6392, 0.2151],
  16981. [ 0.2067, -0.6470, 0.9056, -1.5566, -0.5469, -1.1697, 0.3692, 0.1897],
  16982. [ 0.6249, -0.3607, 1.5125, -0.7481, -0.5763, -0.1067, 0.5937, 0.2508],
  16983. [ 0.3513, -0.5097, 1.4105, 0.1475, -0.3911, -0.3318, 0.2325, 0.4419]],
  16984. device='cuda:0', grad_fn=<AddmmBackward>)
  16985. landmarks are: tensor([[[ 0.6207, -0.4466, 1.7326, 0.1621, -0.5480, -0.1073, 0.9704,
  16986. 0.1608],
  16987. [ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  16988. 0.2522],
  16989. [ 0.6148, -0.3918, 1.8942, -0.1920, -0.5423, -0.8002, 0.6414,
  16990. -0.0156],
  16991. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  16992. 0.0663],
  16993. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  16994. 0.1768],
  16995. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  16996. 0.2699],
  16997. [ 0.6010, -0.3896, 1.7326, -0.5692, -0.6289, 0.0082, 0.5028,
  16998. 0.1005],
  16999. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  17000. 0.4470]]], device='cuda:0')
  17001. loss_train_step before backward: tensor(0.0228, device='cuda:0', grad_fn=<MseLossBackward>)
  17002. loss_train_step after backward: tensor(0.0228, device='cuda:0', grad_fn=<MseLossBackward>)
  17003. loss_train: 1.4073562482371926
  17004. step: 36
  17005. running loss: 0.039093229117699795
  17006. Train Steps: 36/90 Loss: 0.0391 torch.Size([8, 600, 800])
  17007. torch.Size([8, 8])
  17008. tensor([[0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  17009. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  17010. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  17011. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  17012. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  17013. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583],
  17014. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  17015. [0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297]],
  17016. device='cuda:0', dtype=torch.float64)
  17017. predictions are: tensor([[ 0.6089, -0.3586, 0.9983, -1.0574, -0.4327, -1.0262, 0.4522, 0.3104],
  17018. [ 0.7212, -0.3187, 1.2293, -1.0060, -0.4093, -1.1530, 0.3823, 0.1102],
  17019. [ 0.9051, -0.1809, 1.4924, -0.3170, -0.7052, -0.3290, 0.1440, 0.1669],
  17020. [ 0.1922, -0.6328, 0.9536, -0.8334, -0.5797, -0.8038, 0.2082, 0.3640],
  17021. [ 0.9224, -0.2444, 2.0366, 0.1023, -0.4859, 0.4914, 0.9817, 0.1094],
  17022. [-2.0891, -2.1434, 1.0060, -1.0435, -0.4197, -1.1671, 0.2153, 0.2539],
  17023. [ 0.3065, -0.5146, 1.1554, -0.6968, -0.1279, -1.0569, 0.2675, 0.3804],
  17024. [ 0.7788, -0.3376, 1.8395, 0.3493, -0.5287, 0.0480, 0.6786, 0.0816]],
  17025. device='cuda:0', grad_fn=<AddmmBackward>)
  17026. landmarks are: tensor([[[ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  17027. 0.2622],
  17028. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  17029. 0.1449],
  17030. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  17031. 0.2206],
  17032. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  17033. 0.4085],
  17034. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  17035. 0.1554],
  17036. [-2.2859, -2.2859, 0.9922, -1.2021, -0.3229, -1.4314, 0.1044,
  17037. 0.2930],
  17038. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  17039. 0.5624],
  17040. [ 0.6207, -0.4466, 1.7326, 0.1621, -0.5480, -0.1073, 0.9704,
  17041. 0.1608]]], device='cuda:0')
  17042. loss_train_step before backward: tensor(0.0270, device='cuda:0', grad_fn=<MseLossBackward>)
  17043. loss_train_step after backward: tensor(0.0270, device='cuda:0', grad_fn=<MseLossBackward>)
  17044. loss_train: 1.4343694495037198
  17045. step: 37
  17046. running loss: 0.038766741878478915
  17047. Train Steps: 37/90 Loss: 0.0388 torch.Size([8, 600, 800])
  17048. torch.Size([8, 8])
  17049. tensor([[0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  17050. [0.6161, 0.4055, 0.8675, 0.3867, 0.3713, 0.4033, 0.5195, 0.5162],
  17051. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  17052. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  17053. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  17054. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  17055. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  17056. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433]],
  17057. device='cuda:0', dtype=torch.float64)
  17058. predictions are: tensor([[-1.0315, -1.4505, 0.8585, -1.1804, -0.3616, -1.3684, 0.2596, 0.2981],
  17059. [ 0.3760, -0.4742, 1.6197, -0.2871, -0.5844, -0.3497, 0.1494, 0.1322],
  17060. [ 0.2731, -0.5802, 0.7607, -1.3135, -0.4940, -1.0363, 0.2531, 0.2214],
  17061. [ 0.6946, -0.3087, 1.6473, 0.2415, -0.1956, 0.1741, 0.4767, 0.1525],
  17062. [ 0.7139, -0.3329, 1.4853, 0.1988, -0.4484, 0.0563, 0.7421, 0.2211],
  17063. [ 0.5019, -0.4580, 1.7091, -0.0458, -0.5463, -0.2297, 0.5223, 0.2264],
  17064. [ 0.7135, -0.3331, 1.8205, -0.2745, -0.5317, -0.6166, 0.6577, 0.1887],
  17065. [ 0.4978, -0.4209, 1.3890, -0.5404, -0.6099, -0.6694, 0.2540, 0.2692]],
  17066. device='cuda:0', grad_fn=<AddmmBackward>)
  17067. landmarks are: tensor([[[ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  17068. 0.2699],
  17069. [ 0.5598, -0.4129, 1.7210, -0.4999, -0.5711, -0.4229, 0.1136,
  17070. 0.0983],
  17071. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  17072. 0.0712],
  17073. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  17074. 0.0851],
  17075. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  17076. 0.1928],
  17077. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  17078. 0.2314],
  17079. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  17080. 0.1390],
  17081. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  17082. 0.2237]]], device='cuda:0')
  17083. loss_train_step before backward: tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward>)
  17084.  
  17085. loss_train_step after backward: tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward>)
  17086. loss_train: 1.501950633712113
  17087. step: 38
  17088. running loss: 0.03952501667663455
  17089. Train Steps: 38/90 Loss: 0.0395 torch.Size([8, 600, 800])
  17090. torch.Size([8, 8])
  17091. tensor([[0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  17092. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  17093. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  17094. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  17095. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  17096. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  17097. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  17098. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090]],
  17099. device='cuda:0', dtype=torch.float64)
  17100. predictions are: tensor([[ 0.6832, -0.3513, 1.7042, -0.1977, -0.6291, -0.4616, 0.5176, 0.1659],
  17101. [-0.7401, -1.2939, 1.7845, -0.6514, -0.1847, -0.8358, 1.0248, 0.2050],
  17102. [-0.5645, -1.1050, 0.7261, -1.0714, -0.4450, -1.3088, 0.0884, 0.2421],
  17103. [ 0.6336, -0.3166, 1.6069, 0.0188, -0.1684, 0.2818, 0.4854, 0.2356],
  17104. [ 0.6863, -0.3263, 1.6596, 0.1793, -0.3551, 0.1340, 0.4881, 0.2052],
  17105. [ 0.6414, -0.3296, 1.4893, -0.1288, -0.5712, -0.1099, 0.2392, 0.1740],
  17106. [ 0.4698, -0.4321, 0.7184, -0.8961, -0.6497, -0.8492, 0.1134, 0.3681],
  17107. [ 0.7837, -0.2923, 1.5828, -0.4301, -0.5045, -0.8921, 0.5768, 0.0597]],
  17108. device='cuda:0', grad_fn=<AddmmBackward>)
  17109. landmarks are: tensor([[[ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  17110. 0.2464],
  17111. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  17112. 0.2676],
  17113. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  17114. 0.2071],
  17115. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  17116. 0.3007],
  17117. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  17118. 0.2391],
  17119. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  17120. 0.3265],
  17121. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  17122. 0.4103],
  17123. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  17124. 0.0652]]], device='cuda:0')
  17125. loss_train_step before backward: tensor(0.0914, device='cuda:0', grad_fn=<MseLossBackward>)
  17126. loss_train_step after backward: tensor(0.0914, device='cuda:0', grad_fn=<MseLossBackward>)
  17127. loss_train: 1.5933644147589803
  17128. step: 39
  17129. running loss: 0.04085549781433283
  17130. Train Steps: 39/90 Loss: 0.0409 torch.Size([8, 600, 800])
  17131. torch.Size([8, 8])
  17132. tensor([[0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  17133. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  17134. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  17135. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  17136. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  17137. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  17138. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  17139. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567]],
  17140. device='cuda:0', dtype=torch.float64)
  17141. predictions are: tensor([[ 0.5238, -0.3950, 1.2829, -0.8842, -0.3780, -1.2504, 0.3666, 0.1162],
  17142. [ 0.2301, -0.5965, 1.5215, 0.3388, -0.3021, -0.0835, 0.4180, 0.1480],
  17143. [ 0.3454, -0.4980, 1.4978, 0.1416, -0.5490, -0.5785, 0.3343, 0.2566],
  17144. [ 0.5529, -0.4195, 1.7595, -0.3212, -0.4820, 0.2027, 0.8572, 0.1335],
  17145. [ 0.3021, -0.5822, 1.6934, -0.0044, -0.4441, -0.0950, 0.3973, 0.1461],
  17146. [ 0.3611, -0.5352, 0.9858, -1.2857, -0.5901, -1.0377, 0.4483, 0.2478],
  17147. [ 0.2816, -0.5578, 1.3447, -0.7849, -0.6097, -0.5858, 0.5139, 0.3761],
  17148. [ 0.3448, -0.5351, 1.4953, 0.3681, -0.2450, -0.1087, 0.2777, 0.2207]],
  17149. device='cuda:0', grad_fn=<AddmmBackward>)
  17150. landmarks are: tensor([[[ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  17151. 0.2134],
  17152. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  17153. 0.2237],
  17154. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  17155. 0.3392],
  17156. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  17157. 0.1005],
  17158. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  17159. 0.2035],
  17160. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  17161. 0.3007],
  17162. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  17163. 0.5624],
  17164. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  17165. 0.2853]]], device='cuda:0')
  17166. loss_train_step before backward: tensor(0.0166, device='cuda:0', grad_fn=<MseLossBackward>)
  17167. loss_train_step after backward: tensor(0.0166, device='cuda:0', grad_fn=<MseLossBackward>)
  17168. loss_train: 1.610002956353128
  17169. step: 40
  17170. running loss: 0.0402500739088282
  17171. Train Steps: 40/90 Loss: 0.0403 torch.Size([8, 600, 800])
  17172. torch.Size([8, 8])
  17173. tensor([[0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  17174. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  17175. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  17176. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  17177. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  17178. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  17179. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  17180. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103]],
  17181. device='cuda:0', dtype=torch.float64)
  17182. predictions are: tensor([[ 0.5868, -0.4193, 1.2456, -0.9690, -0.5729, -0.7326, 0.5721, 0.2117],
  17183. [ 0.3966, -0.4664, 1.5337, -0.4057, -0.4873, 0.2182, 0.5452, 0.3014],
  17184. [-0.0431, -0.8257, 0.8331, -1.1309, -0.4279, -1.1973, 0.2385, 0.2226],
  17185. [ 0.3674, -0.5902, 1.4668, -0.8268, -0.2956, -1.1755, 0.6494, 0.1242],
  17186. [ 0.3705, -0.5327, 1.7229, 0.2829, -0.4762, -0.2262, 0.2493, 0.2158],
  17187. [ 0.4006, -0.4981, 1.2489, -0.7730, -0.3574, -1.0831, 0.3577, 0.2296],
  17188. [ 0.3442, -0.6000, 1.7299, 0.7331, -0.4478, 0.0127, 0.5833, 0.1481],
  17189. [ 0.3361, -0.5357, 1.5195, -0.5111, -0.5457, -0.3380, 0.4007, 0.2688]],
  17190. device='cuda:0', grad_fn=<AddmmBackward>)
  17191. landmarks are: tensor([[[ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  17192. 0.1779],
  17193. [ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  17194. 0.0862],
  17195. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  17196. 0.1013],
  17197. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  17198. 0.1193],
  17199. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  17200. 0.3854],
  17201. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  17202. 0.1852],
  17203. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  17204. -0.1331],
  17205. [ 0.5886, -0.3784, 1.4554, -0.9079, -0.6577, -0.4845, 0.3440,
  17206. 0.0712]]], device='cuda:0')
  17207. loss_train_step before backward: tensor(0.0313, device='cuda:0', grad_fn=<MseLossBackward>)
  17208. loss_train_step after backward: tensor(0.0313, device='cuda:0', grad_fn=<MseLossBackward>)
  17209. loss_train: 1.6413122108206153
  17210. step: 41
  17211. running loss: 0.040032005141966226
  17212. Train Steps: 41/90 Loss: 0.0400 torch.Size([8, 600, 800])
  17213. torch.Size([8, 8])
  17214. tensor([[0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  17215. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  17216. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  17217. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  17218. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  17219. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  17220. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  17221. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758]],
  17222. device='cuda:0', dtype=torch.float64)
  17223. predictions are: tensor([[ 0.7870, -0.2595, 1.2943, -1.1052, -0.3462, -1.0785, 0.7152, 0.2656],
  17224. [ 0.4789, -0.4572, 1.4920, 0.2105, -0.5343, -0.1205, 0.1726, 0.2225],
  17225. [ 0.6183, -0.3261, 1.4758, 0.0889, -0.4249, 0.0699, 0.1858, 0.2688],
  17226. [ 0.7325, -0.2322, 1.4474, -0.0852, -0.2401, 0.0818, 0.2022, 0.2692],
  17227. [ 0.6747, -0.3397, 1.6252, -0.1277, -0.6790, -0.1723, 0.4741, 0.0560],
  17228. [ 0.2175, -0.6533, 1.6239, -0.7552, -0.1979, -1.1170, 0.7941, 0.1465],
  17229. [-1.5191, -1.7626, 1.4842, -0.8116, -0.1347, -1.1538, 0.5951, 0.3030],
  17230. [ 0.6647, -0.3226, 1.5790, 0.1086, -0.5153, 0.0848, 0.4939, 0.1292]],
  17231. device='cuda:0', grad_fn=<AddmmBackward>)
  17232. landmarks are: tensor([[[ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  17233. 0.3157],
  17234. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  17235. 0.3777],
  17236. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  17237. 0.3084],
  17238. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  17239. 0.2853],
  17240. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  17241. -0.0670],
  17242. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  17243. 0.2142],
  17244. [-2.2859, -2.2859, 1.8249, -0.8002, 0.0409, -1.2543, 0.8059,
  17245. 0.3050],
  17246. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  17247. -0.0881]]], device='cuda:0')
  17248. loss_train_step before backward: tensor(0.0408, device='cuda:0', grad_fn=<MseLossBackward>)
  17249. loss_train_step after backward: tensor(0.0408, device='cuda:0', grad_fn=<MseLossBackward>)
  17250. loss_train: 1.682096759788692
  17251. step: 42
  17252. running loss: 0.040049922852111716
  17253.  
  17254. Train Steps: 42/90 Loss: 0.0400 torch.Size([8, 600, 800])
  17255. torch.Size([8, 8])
  17256. tensor([[0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  17257. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  17258. [0.6151, 0.4058, 0.7068, 0.2680, 0.3400, 0.4083, 0.5775, 0.5733],
  17259. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  17260. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  17261. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  17262. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  17263. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150]],
  17264. device='cuda:0', dtype=torch.float64)
  17265. predictions are: tensor([[ 0.5004, -0.4306, 1.6711, -0.3141, -0.1863, 0.1056, 0.4462, 0.1948],
  17266. [ 0.3833, -0.5706, 1.7636, 0.1744, -0.3820, -0.0903, 0.6075, 0.1104],
  17267. [ 0.7137, -0.3340, 1.0047, -1.1597, -0.6519, -0.5842, 0.4302, 0.3509],
  17268. [ 0.2005, -0.6191, 1.5591, -0.4497, -0.5971, -1.0111, 0.1772, 0.1835],
  17269. [ 0.3202, -0.6021, 1.6128, 0.3261, -0.4215, -0.4935, 0.3956, 0.1628],
  17270. [ 0.4754, -0.4941, 1.8339, -0.1144, -0.4388, -0.0946, 0.6142, 0.1738],
  17271. [ 0.4219, -0.4805, 1.3762, -0.5846, -0.5242, -1.1056, 0.2978, 0.3035],
  17272. [ 0.3386, -0.5356, 1.7691, -0.1034, -0.1531, 0.1973, 0.6431, 0.2470]],
  17273. device='cuda:0', grad_fn=<AddmmBackward>)
  17274. landmarks are: tensor([[[ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  17275. 0.2936],
  17276. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  17277. 0.0236],
  17278. [ 0.5552, -0.4113, 0.9790, -1.0480, -0.7155, -0.3998, 0.3815,
  17279. 0.3623],
  17280. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  17281. 0.2116],
  17282. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  17283. 0.1544],
  17284. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  17285. 0.2237],
  17286. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  17287. 0.3928],
  17288. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  17289. 0.0928]]], device='cuda:0')
  17290. loss_train_step before backward: tensor(0.0167, device='cuda:0', grad_fn=<MseLossBackward>)
  17291. loss_train_step after backward: tensor(0.0167, device='cuda:0', grad_fn=<MseLossBackward>)
  17292. loss_train: 1.6988404570147395
  17293. step: 43
  17294. running loss: 0.03950791760499394
  17295. Train Steps: 43/90 Loss: 0.0395 torch.Size([8, 600, 800])
  17296. torch.Size([8, 8])
  17297. tensor([[0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  17298. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  17299. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  17300. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  17301. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  17302. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  17303. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  17304. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667]],
  17305. device='cuda:0', dtype=torch.float64)
  17306. predictions are: tensor([[ 0.7240, -0.3647, 1.4197, -1.1986, -0.3715, -1.4628, 0.6403, 0.0908],
  17307. [ 0.3467, -0.5586, 1.7756, -0.1293, -0.4171, -0.0376, 0.5929, 0.1243],
  17308. [ 0.5438, -0.4304, 1.6915, 0.2665, -0.4031, -0.1974, 0.4155, 0.2774],
  17309. [ 0.4697, -0.4414, 1.6029, 0.1337, -0.1995, -0.1209, 0.1611, 0.2092],
  17310. [ 0.1763, -0.6875, 1.6918, -0.0366, -0.4339, -0.2375, 0.3021, 0.2240],
  17311. [ 0.3239, -0.5864, 1.5668, 0.0814, -0.3454, 0.1129, 0.7768, 0.3226],
  17312. [ 0.5229, -0.4454, 1.6353, -0.4913, -0.5194, -0.0920, 0.3297, 0.1946],
  17313. [ 0.4346, -0.4854, 1.6011, -0.7661, -0.5156, -0.7754, 0.4753, 0.2727]],
  17314. device='cuda:0', grad_fn=<AddmmBackward>)
  17315. landmarks are: tensor([[[ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  17316. 0.1193],
  17317. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  17318. -0.0881],
  17319. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  17320. 0.3007],
  17321. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  17322. 0.2431],
  17323. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  17324. 0.3777],
  17325. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  17326. 0.3425],
  17327. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  17328. 0.2468],
  17329. [ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  17330. 0.3315]]], device='cuda:0')
  17331. loss_train_step before backward: tensor(0.0154, device='cuda:0', grad_fn=<MseLossBackward>)
  17332. loss_train_step after backward: tensor(0.0154, device='cuda:0', grad_fn=<MseLossBackward>)
  17333. loss_train: 1.7142196567729115
  17334. step: 44
  17335. running loss: 0.03895953765392981
  17336. Train Steps: 44/90 Loss: 0.0390 torch.Size([8, 600, 800])
  17337. torch.Size([8, 8])
  17338. tensor([[ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  17339. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  17340. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  17341. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  17342. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  17343. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  17344. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  17345. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649]],
  17346. device='cuda:0', dtype=torch.float64)
  17347. predictions are: tensor([[-1.8981, -2.0774, 1.7373, -1.0459, 0.1501, -1.2919, 0.9771, 0.2549],
  17348. [ 0.6542, -0.3248, 1.6869, 0.0199, -0.3070, 0.0515, 0.1334, 0.2514],
  17349. [ 0.7948, -0.2716, 1.4147, -0.7527, -0.6649, -0.6969, 0.3543, 0.1676],
  17350. [ 0.5800, -0.3888, 1.8255, -0.1103, -0.1156, 0.1581, 0.5761, 0.3198],
  17351. [ 0.7730, -0.2810, 1.3485, -0.9682, -0.6464, -0.4463, 0.5706, 0.2872],
  17352. [ 0.5955, -0.4088, 1.9148, 0.0193, -0.5055, 0.0592, 0.5711, 0.1925],
  17353. [ 0.5736, -0.3881, 0.9811, -1.1537, -0.4690, -1.4067, 0.1148, 0.1811],
  17354. [ 0.9616, -0.1831, 1.7293, 0.5908, -0.5086, -0.0755, 0.4916, 0.0809]],
  17355. device='cuda:0', grad_fn=<AddmmBackward>)
  17356. landmarks are: tensor([[[-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  17357. 0.2463],
  17358. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  17359. 0.4032],
  17360. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  17361. 0.0942],
  17362. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  17363. 0.4162],
  17364. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  17365. 0.2545],
  17366. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  17367. 0.2237],
  17368. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  17369. -0.0580],
  17370. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  17371. -0.1385]]], device='cuda:0')
  17372. loss_train_step before backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  17373. loss_train_step after backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  17374. loss_train: 1.7298358231782913
  17375. step: 45
  17376. running loss: 0.0384407960706287
  17377. Train Steps: 45/90 Loss: 0.0384 torch.Size([8, 600, 800])
  17378. torch.Size([8, 8])
  17379. tensor([[ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  17380. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  17381. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  17382. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  17383. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  17384. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  17385. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  17386. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350]],
  17387. device='cuda:0', dtype=torch.float64)
  17388. predictions are: tensor([[-2.2043, -2.2418, 1.7081, -0.8358, -0.0276, -1.0152, 0.8084, 0.2407],
  17389. [ 0.5243, -0.4429, 1.9431, -0.0100, -0.6092, 0.0366, 0.5699, 0.1601],
  17390. [ 0.6887, -0.3278, 1.3823, -0.8020, -0.3371, -1.0292, 0.6584, 0.2193],
  17391. [ 0.6709, -0.3032, 1.7437, 0.0247, -0.1854, 0.2688, 0.3536, 0.2386],
  17392. [ 0.9483, -0.1798, 1.2172, -0.9029, -0.1352, -1.4696, 0.4495, 0.1328],
  17393. [ 0.6183, -0.3735, 1.6392, -0.4924, -0.5940, 0.1497, 0.6687, 0.2686],
  17394. [ 0.6845, -0.2976, 1.3550, -0.4397, -0.6997, -0.2449, 0.1676, 0.2389],
  17395. [ 0.7395, -0.2648, 1.2949, -0.8578, -0.2455, -1.1228, 0.3436, 0.2488]],
  17396. device='cuda:0', grad_fn=<AddmmBackward>)
  17397. landmarks are: tensor([[[-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  17398. 0.2783],
  17399. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  17400. 0.1390],
  17401. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  17402. 0.1879],
  17403. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  17404. 0.2853],
  17405. [ 0.5999, -0.4236, 1.2880, -1.4083, -0.0630, -1.6393, 0.4584,
  17406. -0.0208],
  17407. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  17408. 0.2083],
  17409. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  17410. 0.2386],
  17411. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  17412. 0.1850]]], device='cuda:0')
  17413. loss_train_step before backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  17414. loss_train_step after backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  17415. loss_train: 1.7548013236373663
  17416. step: 46
  17417. running loss: 0.038147854861681874
  17418.  
  17419. Train Steps: 46/90 Loss: 0.0381 torch.Size([8, 600, 800])
  17420. torch.Size([8, 8])
  17421. tensor([[0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  17422. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  17423. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  17424. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  17425. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  17426. [0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  17427. [0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297],
  17428. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507]],
  17429. device='cuda:0', dtype=torch.float64)
  17430. predictions are: tensor([[ 0.5808, -0.4027, 1.7523, 0.1851, -0.2221, 0.0181, 0.2749, 0.2247],
  17431. [ 0.1685, -0.6521, 1.8133, -0.9287, -0.1096, -1.2804, 0.6237, 0.1164],
  17432. [ 0.5971, -0.3892, 1.8052, -0.2200, -0.3549, 0.2286, 0.5063, 0.3570],
  17433. [-1.4883, -1.7690, 1.2798, -1.1738, -0.4054, -1.2219, 0.2785, 0.2763],
  17434. [ 0.4992, -0.4773, 1.9323, -0.2267, -0.4326, 0.3214, 0.7804, 0.2136],
  17435. [ 0.7130, -0.3289, 1.7113, 0.3647, -0.3429, 0.0021, 0.2070, 0.1561],
  17436. [ 0.6170, -0.4312, 1.7823, 0.1004, -0.4980, -0.1354, 0.7443, 0.1665],
  17437. [ 1.4584, 0.1012, 1.0517, -1.3167, -0.5159, -1.1998, 0.3566, 0.2365]],
  17438. device='cuda:0', grad_fn=<AddmmBackward>)
  17439. landmarks are: tensor([[[ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  17440. 0.2364],
  17441. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  17442. 0.0051],
  17443. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  17444. 0.4701],
  17445. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  17446. 0.2853],
  17447. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  17448. 0.1082],
  17449. [ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  17450. -0.0911],
  17451. [ 0.6207, -0.4466, 1.7326, 0.1621, -0.5480, -0.1073, 0.9704,
  17452. 0.1608],
  17453. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  17454. 0.2576]]], device='cuda:0')
  17455. loss_train_step before backward: tensor(0.0435, device='cuda:0', grad_fn=<MseLossBackward>)
  17456. loss_train_step after backward: tensor(0.0435, device='cuda:0', grad_fn=<MseLossBackward>)
  17457. loss_train: 1.7982591893523932
  17458. step: 47
  17459. running loss: 0.038260833816008366
  17460. Train Steps: 47/90 Loss: 0.0383 torch.Size([8, 600, 800])
  17461. torch.Size([8, 8])
  17462. tensor([[0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  17463. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  17464. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  17465. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  17466. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  17467. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  17468. [0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  17469. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268]],
  17470. device='cuda:0', dtype=torch.float64)
  17471. predictions are: tensor([[ 0.5740, -0.4570, 1.2343, -1.2853, -0.3430, -1.3086, 0.2643, 0.1285],
  17472. [ 0.7208, -0.4197, 1.9882, 0.2828, -0.5127, -0.1009, 0.7220, 0.0963],
  17473. [-1.0776, -1.5501, 1.2808, -1.1677, -0.3018, -1.2895, 0.2042, 0.2265],
  17474. [ 0.6298, -0.4848, 2.0928, -0.0428, -0.5081, -0.2292, 0.8535, 0.1820],
  17475. [ 0.9159, -0.2347, 1.5106, -0.9483, -0.3872, -0.8938, 0.5857, 0.3830],
  17476. [ 0.3516, -0.5812, 1.9792, 0.1283, -0.3523, 0.1517, 0.2751, 0.1903],
  17477. [ 0.7296, -0.3684, 1.1634, -1.1615, -0.5584, -0.6658, 0.1552, 0.3173],
  17478. [ 0.5119, -0.5072, 1.9833, -0.0225, -0.1524, 0.3139, 0.7481, 0.1937]],
  17479. device='cuda:0', grad_fn=<AddmmBackward>)
  17480. landmarks are: tensor([[[ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  17481. -0.0580],
  17482. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  17483. -0.1278],
  17484. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  17485. 0.2006],
  17486. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  17487. 0.1768],
  17488. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  17489. 0.5624],
  17490. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  17491. 0.2589],
  17492. [ 0.5049, -0.4428, 0.8692, -0.9581, -0.6693, -0.8386, 0.0897,
  17493. 0.2589],
  17494. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  17495. 0.1474]]], device='cuda:0')
  17496. loss_train_step before backward: tensor(0.0539, device='cuda:0', grad_fn=<MseLossBackward>)
  17497. loss_train_step after backward: tensor(0.0539, device='cuda:0', grad_fn=<MseLossBackward>)
  17498. loss_train: 1.852201757952571
  17499. step: 48
  17500. running loss: 0.038587536624011896
  17501. Train Steps: 48/90 Loss: 0.0386 torch.Size([8, 600, 800])
  17502. torch.Size([8, 8])
  17503. tensor([[0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  17504. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  17505. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  17506. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  17507. [0.6163, 0.4006, 0.8788, 0.4683, 0.3663, 0.4883, 0.5887, 0.5017],
  17508. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  17509. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  17510. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222]],
  17511. device='cuda:0', dtype=torch.float64)
  17512. predictions are: tensor([[ 0.3295, -0.5814, 1.8805, -0.0697, -0.5494, -0.1917, 0.4035, 0.2892],
  17513. [ 0.7263, -0.3292, 1.8847, -0.2392, -0.1815, 0.3605, 0.5436, 0.2755],
  17514. [-1.5498, -1.8469, 1.1289, -1.4847, -0.3832, -1.3001, 0.2906, 0.2223],
  17515. [ 0.7428, -0.3750, 1.4495, -1.3152, -0.2427, -1.3279, 0.7417, 0.0372],
  17516. [ 0.4533, -0.5365, 1.8424, -0.2498, -0.5483, 0.0561, 0.5313, 0.1250],
  17517. [ 0.5942, -0.4407, 1.8397, 0.1174, -0.5398, -0.1064, 0.4411, 0.2406],
  17518. [ 0.7884, -0.3214, 1.8269, 0.0239, -0.3524, 0.1700, 0.4697, 0.1303],
  17519. [ 0.9849, -0.1455, 1.5928, -0.6527, -0.0722, -1.1593, 0.4756, 0.3225]],
  17520. device='cuda:0', grad_fn=<AddmmBackward>)
  17521. landmarks are: tensor([[[ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  17522. 0.3623],
  17523. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  17524. 0.4316],
  17525. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  17526. 0.2930],
  17527. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  17528. 0.1575],
  17529. [ 0.5609, -0.4354, 1.7730, -0.1227, -0.5942, -0.0303, 0.4335,
  17530. 0.0313],
  17531. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  17532. 0.3161],
  17533. [ 0.5784, -0.4088, 1.7268, 0.0467, -0.3344, 0.0697, 0.5490,
  17534. 0.2545],
  17535. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  17536. 0.5882]]], device='cuda:0')
  17537. loss_train_step before backward: tensor(0.0276, device='cuda:0', grad_fn=<MseLossBackward>)
  17538. loss_train_step after backward: tensor(0.0276, device='cuda:0', grad_fn=<MseLossBackward>)
  17539. loss_train: 1.8798270765691996
  17540. step: 49
  17541. running loss: 0.03836381788916734
  17542. Train Steps: 49/90 Loss: 0.0384 torch.Size([8, 600, 800])
  17543. torch.Size([8, 8])
  17544. tensor([[0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  17545. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  17546. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  17547. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  17548. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  17549. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  17550. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  17551. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980]],
  17552. device='cuda:0', dtype=torch.float64)
  17553. predictions are: tensor([[ 0.0420, -0.7969, 1.9109, -0.8322, -0.1011, -0.8858, 0.9601, 0.1443],
  17554. [ 0.6866, -0.3095, 1.7257, -0.0317, -0.5664, -0.5953, 0.2935, 0.1853],
  17555. [ 0.2108, -0.6950, 1.9938, -0.5592, -0.2313, -0.8180, 0.9008, 0.1145],
  17556. [ 0.5528, -0.4017, 1.3345, -1.0168, -0.2567, -1.0105, 0.4153, 0.2544],
  17557. [ 0.6255, -0.3738, 1.1034, -1.1191, -0.5814, -0.7942, 0.3894, 0.3216],
  17558. [ 0.7603, -0.3225, 1.7301, 0.1145, -0.2304, 0.4093, 0.1185, 0.0922],
  17559. [-1.5151, -1.8184, 1.7782, -0.8214, -0.0171, -0.7889, 0.8844, 0.3772],
  17560. [ 0.9260, -0.1868, 1.1814, -1.0478, -0.6314, -0.6874, 0.0614, 0.0822]],
  17561. device='cuda:0', grad_fn=<AddmmBackward>)
  17562. landmarks are: tensor([[[ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  17563. 0.2142],
  17564. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  17565. 0.1852],
  17566. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  17567. 0.2142],
  17568. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  17569. 0.2549],
  17570. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  17571. 0.3546],
  17572. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  17573. 0.0532],
  17574. [-2.2859, -2.2859, 1.8192, -0.8540, 0.1448, -0.9849, 1.0143,
  17575. 0.4867],
  17576. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  17577. 0.0141]]], device='cuda:0')
  17578. loss_train_step before backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  17579. loss_train_step after backward: tensor(0.0425, device='cuda:0', grad_fn=<MseLossBackward>)
  17580. loss_train: 1.9223244320601225
  17581. step: 50
  17582. running loss: 0.03844648864120245
  17583.  
  17584. Train Steps: 50/90 Loss: 0.0384 torch.Size([8, 600, 800])
  17585. torch.Size([8, 8])
  17586. tensor([[0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  17587. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  17588. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  17589. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  17590. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  17591. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  17592. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  17593. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496]],
  17594. device='cuda:0', dtype=torch.float64)
  17595. predictions are: tensor([[ 0.5079, -0.4253, 1.7334, -0.5518, -0.2087, -1.0789, 0.5205, 0.1830],
  17596. [-2.1959, -2.2539, 1.6896, -0.8953, 0.1348, -0.9927, 0.8918, 0.3466],
  17597. [ 0.7811, -0.3041, 1.3094, -1.1007, -0.1904, -1.1196, 0.6205, 0.1609],
  17598. [ 0.6017, -0.3955, 1.7478, -0.2562, -0.3932, -0.8967, 0.5031, 0.0947],
  17599. [ 0.5943, -0.3944, 1.5952, -0.4495, -0.6258, -0.1813, 0.4599, 0.2885],
  17600. [ 0.5591, -0.3863, 1.4813, -0.8121, -0.5755, -0.7021, 0.1551, 0.1755],
  17601. [ 0.7742, -0.2851, 1.6700, -0.2640, -0.4691, 0.5642, 0.4217, 0.1421],
  17602. [ 0.5294, -0.4214, 1.5105, -0.9518, -0.3016, -0.8068, 0.4605, 0.2259]],
  17603. device='cuda:0', grad_fn=<AddmmBackward>)
  17604. landmarks are: tensor([[[ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  17605. 0.0171],
  17606. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  17607. 0.3799],
  17608. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  17609. 0.1917],
  17610. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  17611. 0.0081],
  17612. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  17613. 0.1929],
  17614. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  17615. 0.1005],
  17616. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  17617. 0.0772],
  17618. [ 0.5790, -0.4031, 1.6915, -0.9564, -0.4152, -1.1063, 0.4425,
  17619. 0.2528]]], device='cuda:0')
  17620. loss_train_step before backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  17621. loss_train_step after backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  17622. loss_train: 1.9353253524750471
  17623. step: 51
  17624. running loss: 0.037947555930883274
  17625. Train Steps: 51/90 Loss: 0.0379 torch.Size([8, 600, 800])
  17626. torch.Size([8, 8])
  17627. tensor([[0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  17628. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  17629. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  17630. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  17631. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  17632. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  17633. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  17634. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510]],
  17635. device='cuda:0', dtype=torch.float64)
  17636. predictions are: tensor([[ 0.7340, -0.3327, 1.4879, -1.1681, -0.0782, -1.3344, 0.7709, 0.1514],
  17637. [-0.8746, -1.3776, 1.0971, -1.3145, -0.2678, -1.3062, 0.2473, 0.3377],
  17638. [ 1.0725, -0.1333, 1.8916, -0.2227, -0.3438, 0.3868, 0.5975, 0.2453],
  17639. [ 1.0992, -0.1554, 1.8354, 0.2487, -0.5583, -0.2261, 0.6530, 0.0657],
  17640. [ 0.5148, -0.4407, 1.8467, -0.5045, -0.5949, -0.5906, 0.3270, 0.1523],
  17641. [ 0.8868, -0.2235, 1.5971, -1.0558, -0.2848, -1.0580, 0.6227, 0.1622],
  17642. [-2.1556, -2.2283, 1.1792, -1.2546, -0.2982, -1.1205, 0.3752, 0.3032],
  17643. [ 0.7901, -0.2864, 1.8163, 0.0887, -0.4164, 0.0258, 0.2030, 0.1948]],
  17644. device='cuda:0', grad_fn=<AddmmBackward>)
  17645. landmarks are: tensor([[[ 0.6158, -0.4225, 1.3307, -1.3253, -0.1924, -1.3252, 0.6721,
  17646. 0.1727],
  17647. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  17648. 0.3604],
  17649. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  17650. 0.3161],
  17651. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  17652. -0.1278],
  17653. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  17654. 0.0851],
  17655. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  17656. 0.1929],
  17657. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  17658. 0.2930],
  17659. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  17660. 0.2589]]], device='cuda:0')
  17661. loss_train_step before backward: tensor(0.0704, device='cuda:0', grad_fn=<MseLossBackward>)
  17662. loss_train_step after backward: tensor(0.0704, device='cuda:0', grad_fn=<MseLossBackward>)
  17663. loss_train: 2.0057187657803297
  17664. step: 52
  17665. running loss: 0.038571514726544805
  17666. Train Steps: 52/90 Loss: 0.0386 torch.Size([8, 600, 800])
  17667. torch.Size([8, 8])
  17668. tensor([[0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  17669. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  17670. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  17671. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  17672. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  17673. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  17674. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  17675. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196]],
  17676. device='cuda:0', dtype=torch.float64)
  17677. predictions are: tensor([[-0.0896, -0.8350, 1.8853, -0.9877, -0.0115, -1.3491, 0.7882, 0.0851],
  17678. [ 0.2664, -0.6331, 1.5328, -0.9256, -0.5753, -0.5936, 0.5557, 0.4303],
  17679. [ 0.2831, -0.6234, 1.7790, -0.2026, -0.5764, -0.2057, 0.4492, 0.1349],
  17680. [ 0.2364, -0.6552, 1.3299, -1.3268, -0.1236, -1.4516, 0.5103, 0.1620],
  17681. [ 0.4781, -0.5272, 1.7003, 0.0702, -0.4299, -0.1375, 0.4306, 0.1112],
  17682. [ 0.4198, -0.5174, 1.7888, -0.1580, -0.2072, 0.1132, 0.0995, 0.0633],
  17683. [ 0.4876, -0.4862, 1.3988, -1.0940, -0.6574, -0.4401, 0.6009, 0.2054],
  17684. [ 0.3655, -0.5576, 1.7252, -0.1082, -0.3145, -0.9504, 0.4736, 0.3978]],
  17685. device='cuda:0', grad_fn=<AddmmBackward>)
  17686. landmarks are: tensor([[[ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  17687. 0.0051],
  17688. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  17689. 0.5624],
  17690. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  17691. 0.1159],
  17692. [ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  17693. 0.1545],
  17694. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  17695. 0.2091],
  17696. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  17697. 0.0682],
  17698. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  17699. 0.2545],
  17700. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  17701. 0.5762]]], device='cuda:0')
  17702. loss_train_step before backward: tensor(0.0279, device='cuda:0', grad_fn=<MseLossBackward>)
  17703. loss_train_step after backward: tensor(0.0279, device='cuda:0', grad_fn=<MseLossBackward>)
  17704. loss_train: 2.0335935931652784
  17705. step: 53
  17706. running loss: 0.038369690437080724
  17707. Train Steps: 53/90 Loss: 0.0384 torch.Size([8, 600, 800])
  17708. torch.Size([8, 8])
  17709. tensor([[0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  17710. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  17711. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  17712. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  17713. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  17714. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  17715. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  17716. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235]],
  17717. device='cuda:0', dtype=torch.float64)
  17718. predictions are: tensor([[ 0.4297, -0.4967, 1.6639, -0.1452, -0.3522, -0.0779, 0.1092, 0.1016],
  17719. [-0.0545, -0.8022, 1.8791, -0.6957, -0.2669, -1.4643, 0.7409, 0.1956],
  17720. [ 0.1286, -0.6560, 1.5928, -0.6839, -0.3915, -1.2792, 0.3740, 0.2566],
  17721. [ 0.2547, -0.6250, 1.2035, -1.4607, -0.3059, -1.5024, 0.5547, 0.1377],
  17722. [-0.0957, -0.8061, 1.3868, -1.1668, -0.4368, -1.0446, 0.5488, 0.2840],
  17723. [ 0.9410, -0.2207, 1.7451, -0.2033, -0.2315, 0.1644, 0.6318, 0.2716],
  17724. [ 0.5294, -0.4676, 1.7483, -0.0365, -0.1930, -0.0027, 0.2473, 0.0986],
  17725. [ 0.0932, -0.7754, 1.6980, -0.1735, -0.4596, 0.0964, 0.6184, 0.1822]],
  17726. device='cuda:0', grad_fn=<AddmmBackward>)
  17727. landmarks are: tensor([[[ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  17728. 0.2228],
  17729. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  17730. 0.0171],
  17731. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  17732. 0.2261],
  17733. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  17734. 0.1082],
  17735. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  17736. 0.1852],
  17737. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  17738. 0.2237],
  17739. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  17740. 0.0532],
  17741. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  17742. 0.1322]]], device='cuda:0')
  17743. loss_train_step before backward: tensor(0.0433, device='cuda:0', grad_fn=<MseLossBackward>)
  17744. loss_train_step after backward: tensor(0.0433, device='cuda:0', grad_fn=<MseLossBackward>)
  17745. loss_train: 2.076877860352397
  17746. step: 54
  17747. running loss: 0.03846070111763698
  17748.  
  17749. Train Steps: 54/90 Loss: 0.0385 torch.Size([8, 600, 800])
  17750. torch.Size([8, 8])
  17751. tensor([[0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  17752. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  17753. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  17754. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  17755. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  17756. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  17757. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  17758. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279]],
  17759. device='cuda:0', dtype=torch.float64)
  17760. predictions are: tensor([[ 0.4562, -0.5427, 1.6782, 0.0694, -0.4969, -0.1446, 0.6702, 0.2226],
  17761. [-0.1811, -0.8887, 1.0253, -1.2883, -0.3301, -1.3747, 0.0681, 0.2783],
  17762. [ 0.8465, -0.3035, 1.8925, -0.1580, -0.5932, -0.4709, 0.5199, 0.1389],
  17763. [ 0.0712, -0.7317, 1.5243, -1.0640, -0.3472, -1.1446, 0.3364, 0.2090],
  17764. [ 0.4380, -0.5539, 1.8446, 0.0722, -0.3768, 0.1330, 0.3437, 0.1530],
  17765. [-0.0180, -0.8051, 1.5171, -1.2229, -0.1305, -1.3399, 0.7107, 0.2390],
  17766. [-0.0261, -0.8366, 1.5963, -1.1512, -0.2253, -1.3229, 0.6682, 0.1688],
  17767. [ 0.6177, -0.4220, 1.8000, -0.2515, -0.5198, -0.0278, 0.3949, 0.1956]],
  17768. device='cuda:0', grad_fn=<AddmmBackward>)
  17769. landmarks are: tensor([[[ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  17770. 0.2356],
  17771. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  17772. 0.2071],
  17773. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  17774. 0.0325],
  17775. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  17776. 0.2043],
  17777. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  17778. 0.0711],
  17779. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  17780. 0.1917],
  17781. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  17782. 0.1193],
  17783. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  17784. 0.1525]]], device='cuda:0')
  17785. loss_train_step before backward: tensor(0.0463, device='cuda:0', grad_fn=<MseLossBackward>)
  17786. loss_train_step after backward: tensor(0.0463, device='cuda:0', grad_fn=<MseLossBackward>)
  17787. loss_train: 2.1231579910963774
  17788. step: 55
  17789. running loss: 0.03860287256538868
  17790. Train Steps: 55/90 Loss: 0.0386 torch.Size([8, 600, 800])
  17791. torch.Size([8, 8])
  17792. tensor([[0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  17793. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  17794. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  17795. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  17796. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  17797. [0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  17798. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  17799. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933]],
  17800. device='cuda:0', dtype=torch.float64)
  17801. predictions are: tensor([[ 0.3630, -0.5458, 1.6351, 0.1872, -0.3983, -0.4754, 0.3092, 0.3913],
  17802. [ 0.2263, -0.6256, 1.3120, -1.3146, -0.4408, -1.4280, 0.5027, 0.2511],
  17803. [ 0.2667, -0.6203, 1.8972, -0.3692, -0.3622, -0.1678, 0.5342, 0.2368],
  17804. [ 0.2488, -0.6262, 1.3356, -1.1459, -0.5657, -0.8258, 0.5429, 0.2466],
  17805. [ 0.3914, -0.5923, 1.8955, -0.0133, -0.4285, -0.2241, 0.6273, 0.0103],
  17806. [ 0.0806, -0.7299, 1.6935, -0.6597, -0.4001, 0.0085, 0.5942, 0.2190],
  17807. [ 0.4726, -0.4565, 1.3884, -1.1786, -0.5101, -1.2969, 0.1848, -0.0156],
  17808. [ 0.4982, -0.4523, 1.7932, 0.2545, 0.0606, -0.6184, 0.3437, 0.3104]],
  17809. device='cuda:0', grad_fn=<AddmmBackward>)
  17810. landmarks are: tensor([[[ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  17811. 0.5401],
  17812. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  17813. 0.3546],
  17814. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  17815. 0.2776],
  17816. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  17817. 0.3546],
  17818. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  17819. 0.0236],
  17820. [ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  17821. 0.2966],
  17822. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  17823. -0.1031],
  17824. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  17825. 0.4547]]], device='cuda:0')
  17826. loss_train_step before backward: tensor(0.0382, device='cuda:0', grad_fn=<MseLossBackward>)
  17827. loss_train_step after backward: tensor(0.0382, device='cuda:0', grad_fn=<MseLossBackward>)
  17828. loss_train: 2.161322994157672
  17829. step: 56
  17830. running loss: 0.038595053467101285
  17831. Train Steps: 56/90 Loss: 0.0386 torch.Size([8, 600, 800])
  17832. torch.Size([8, 8])
  17833. tensor([[0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  17834. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050],
  17835. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  17836. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  17837. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  17838. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  17839. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  17840. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433]],
  17841. device='cuda:0', dtype=torch.float64)
  17842. predictions are: tensor([[ 0.4092, -0.5138, 1.8144, -0.1999, -0.3258, -0.0545, 0.4307, 0.1656],
  17843. [ 0.4702, -0.4808, 1.7870, -0.0377, -0.1724, -0.1545, 0.3535, 0.1485],
  17844. [ 0.3143, -0.5592, 1.5140, 0.1310, -0.4379, -0.4050, 0.2350, 0.4357],
  17845. [ 0.6361, -0.4048, 1.8149, -0.2947, -0.5310, -0.4568, 0.6891, 0.1461],
  17846. [ 0.0101, -0.7609, 1.3474, -1.3365, -0.3493, -1.3944, 0.4397, 0.2876],
  17847. [ 0.4153, -0.5429, 1.7749, -0.1072, -0.4279, -0.2432, 0.6392, 0.1070],
  17848. [ 0.1730, -0.6428, 1.2906, -1.3643, -0.2571, -1.6480, 0.3724, 0.1490],
  17849. [ 0.5979, -0.4057, 1.8060, -0.3230, -0.5050, -0.1868, 0.4154, 0.1172]],
  17850. device='cuda:0', grad_fn=<AddmmBackward>)
  17851. landmarks are: tensor([[[ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  17852. 0.1390],
  17853. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  17854. 0.0467],
  17855. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  17856. 0.5401],
  17857. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  17858. 0.1779],
  17859. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  17860. 0.3315],
  17861. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  17862. 0.0851],
  17863. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  17864. 0.2203],
  17865. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  17866. 0.2237]]], device='cuda:0')
  17867. loss_train_step before backward: tensor(0.0283, device='cuda:0', grad_fn=<MseLossBackward>)
  17868. loss_train_step after backward: tensor(0.0283, device='cuda:0', grad_fn=<MseLossBackward>)
  17869. loss_train: 2.189621262252331
  17870. step: 57
  17871. running loss: 0.03841440810969001
  17872. Train Steps: 57/90 Loss: 0.0384 torch.Size([8, 600, 800])
  17873. torch.Size([8, 8])
  17874. tensor([[0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  17875. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  17876. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  17877. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  17878. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  17879. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  17880. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  17881. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136]],
  17882. device='cuda:0', dtype=torch.float64)
  17883. predictions are: tensor([[ 0.6948, -0.3456, 1.8998, 0.0423, -0.1258, 0.0501, 0.6125, 0.2276],
  17884. [ 0.3303, -0.5843, 1.8655, 0.0207, -0.4595, -0.1592, 0.3264, 0.0907],
  17885. [ 0.1220, -0.6186, 1.3515, -0.9253, -0.1465, -1.4670, 0.3551, 0.3518],
  17886. [ 0.5260, -0.4394, 1.9115, -0.1421, -0.3737, 0.0497, 0.5564, 0.1762],
  17887. [ 0.0102, -0.7211, 1.0825, -1.0281, -0.4573, -1.3510, 0.0147, 0.2470],
  17888. [ 0.3063, -0.5432, 1.2584, -1.0544, -0.5468, -1.2192, 0.4297, 0.2727],
  17889. [ 0.4030, -0.5388, 1.8117, 0.1530, -0.4069, 0.0941, 0.9434, 0.1687],
  17890. [ 0.5400, -0.4138, 1.0428, -1.2295, -0.5807, -1.2244, 0.2741, 0.0920]],
  17891. device='cuda:0', grad_fn=<AddmmBackward>)
  17892. landmarks are: tensor([[[ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  17893. 0.2237],
  17894. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  17895. 0.2035],
  17896. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  17897. 0.3854],
  17898. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  17899. 0.3161],
  17900. [ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  17901. 0.2776],
  17902. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  17903. 0.3546],
  17904. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  17905. 0.2249],
  17906. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  17907. 0.0862]]], device='cuda:0')
  17908. loss_train_step before backward: tensor(0.0236, device='cuda:0', grad_fn=<MseLossBackward>)
  17909. loss_train_step after backward: tensor(0.0236, device='cuda:0', grad_fn=<MseLossBackward>)
  17910. loss_train: 2.213260428979993
  17911. step: 58
  17912. running loss: 0.038159662568620564
  17913.  
  17914. Train Steps: 58/90 Loss: 0.0382 torch.Size([8, 600, 800])
  17915. torch.Size([8, 8])
  17916. tensor([[0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  17917. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  17918. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  17919. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  17920. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  17921. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  17922. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  17923. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006]],
  17924. device='cuda:0', dtype=torch.float64)
  17925. predictions are: tensor([[ 0.7516, -0.2493, 1.6080, -0.1194, -0.3354, -0.4171, 0.2348, 0.2148],
  17926. [ 0.1629, -0.6173, 1.6239, -0.3986, -0.4561, 0.0161, 0.4742, 0.1740],
  17927. [ 0.4031, -0.4658, 1.5838, 0.0052, -0.1537, -0.3175, 0.1387, 0.2543],
  17928. [ 0.5602, -0.4197, 1.6715, -0.3033, -0.3595, -0.1238, 0.5330, 0.2328],
  17929. [ 0.4136, -0.4696, 1.6398, -1.0198, -0.4677, -1.4931, 0.7789, 0.1734],
  17930. [ 0.2517, -0.6238, 1.5922, 0.0767, -0.4577, -0.4736, 0.5105, 0.1944],
  17931. [ 0.7147, -0.2776, 1.5206, -0.6886, -0.5991, -0.2994, 0.6749, 0.2496],
  17932. [ 0.4535, -0.4406, 1.5970, 0.0072, -0.1969, -0.2337, 0.1553, 0.1555]],
  17933. device='cuda:0', grad_fn=<AddmmBackward>)
  17934. landmarks are: tensor([[[ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  17935. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  17936. [ 5.3759e-01, -3.9030e-01, 1.7095e+00, -3.2286e-01, -4.7298e-01,
  17937. 4.7005e-01, 3.8714e-01, 7.7228e-02],
  17938. [ 5.3181e-01, -4.3102e-01, 1.6864e+00, 5.4350e-02, -1.5543e-01,
  17939. 1.3133e-01, 6.3480e-02, 2.6342e-01],
  17940. [ 5.9602e-01, -4.1016e-01, 1.8018e+00, -1.6120e-01, -3.3441e-01,
  17941. 1.1594e-01, 5.4896e-01, 2.3141e-01],
  17942. [ 6.1742e-01, -4.2008e-01, 1.7309e+00, -8.7840e-01, -4.7351e-01,
  17943. -9.5238e-01, 6.2423e-01, 1.9310e-01],
  17944. [ 5.7748e-01, -4.6066e-01, 1.6741e+00, 1.9623e-01, -4.0362e-01,
  17945. -1.2115e-01, 4.5876e-01, 1.9786e-01],
  17946. [ 6.0098e-01, -3.8961e-01, 1.7326e+00, -5.6921e-01, -6.2887e-01,
  17947. 8.1601e-03, 5.0277e-01, 1.0054e-01],
  17948. [ 5.2408e-01, -4.4696e-01, 1.6806e+00, 1.3133e-01, -1.6120e-01,
  17949. 1.9292e-01, 3.3778e-01, 2.6129e-02]]], device='cuda:0')
  17950. loss_train_step before backward: tensor(0.0338, device='cuda:0', grad_fn=<MseLossBackward>)
  17951. loss_train_step after backward: tensor(0.0338, device='cuda:0', grad_fn=<MseLossBackward>)
  17952. loss_train: 2.2470400538295507
  17953. step: 59
  17954. running loss: 0.038085424641178825
  17955. Train Steps: 59/90 Loss: 0.0381 torch.Size([8, 600, 800])
  17956. torch.Size([8, 8])
  17957. tensor([[0.6277, 0.4013, 0.8888, 0.4767, 0.3600, 0.3567, 0.6148, 0.4672],
  17958. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411],
  17959. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  17960. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  17961. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  17962. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  17963. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  17964. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679]],
  17965. device='cuda:0', dtype=torch.float64)
  17966. predictions are: tensor([[ 1.4318, 0.1613, 1.6839, -0.1669, -0.6021, -0.5390, 0.4439, 0.0423],
  17967. [ 1.2904, 0.1413, 1.4333, -0.7264, -0.3609, -1.2067, 0.1633, 0.1794],
  17968. [ 1.0495, -0.0377, 1.2722, -0.9776, -0.3320, -1.2180, 0.2905, 0.1976],
  17969. [ 1.0321, -0.0924, 1.4443, 0.2232, -0.4871, 0.0177, 0.6999, 0.2629],
  17970. [ 0.9761, -0.0933, 1.1736, -1.0616, -0.5285, -0.7053, 0.4697, 0.2521],
  17971. [-1.8286, -1.9014, 1.0395, -0.8848, -0.4785, -1.0044, 0.0752, 0.2423],
  17972. [ 0.9323, -0.1344, 1.6433, 0.1998, -0.2636, 0.3281, 0.3945, 0.1279],
  17973. [-2.3898, -2.3125, 1.5499, -0.9304, 0.1178, -1.0389, 0.9971, 0.3760]],
  17974. device='cuda:0', grad_fn=<AddmmBackward>)
  17975. landmarks are: tensor([[[ 0.6132, -0.4324, 1.8192, -0.0842, -0.6231, -0.6385, 0.5537,
  17976. -0.1278],
  17977. [ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  17978. 0.2134],
  17979. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  17980. 0.0928],
  17981. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  17982. 0.3478],
  17983. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  17984. 0.1621],
  17985. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  17986. 0.2183],
  17987. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  17988. 0.0764],
  17989. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  17990. 0.3371]]], device='cuda:0')
  17991. loss_train_step before backward: tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward>)
  17992. loss_train_step after backward: tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward>)
  17993. loss_train: 2.3147859629243612
  17994. step: 60
  17995. running loss: 0.038579766048739354
  17996. Train Steps: 60/90 Loss: 0.0386 torch.Size([8, 600, 800])
  17997. torch.Size([8, 8])
  17998. tensor([[0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  17999. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  18000. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  18001. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  18002. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  18003. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  18004. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  18005. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600]],
  18006. device='cuda:0', dtype=torch.float64)
  18007. predictions are: tensor([[ 0.6984, -0.3234, 1.5211, -0.3551, -0.5158, -0.1597, 0.2934, 0.1677],
  18008. [ 0.3330, -0.5850, 1.6220, -0.5140, -0.4023, 0.2297, 0.7771, 0.2031],
  18009. [ 0.2629, -0.6181, 1.7049, 0.1271, -0.3293, -0.2368, 0.1755, 0.1922],
  18010. [ 0.8531, -0.1939, 1.6120, -0.5787, -0.4479, -0.9063, 0.3136, 0.2825],
  18011. [ 0.6014, -0.4231, 1.7773, 0.0603, -0.4681, -0.4661, 0.7059, 0.1404],
  18012. [ 0.3605, -0.4942, 1.2824, -0.5865, -0.5712, -0.4829, 0.1422, 0.3245],
  18013. [ 0.4777, -0.4718, 1.7059, -0.5215, -0.2062, -0.9239, 0.8412, 0.1175],
  18014. [ 0.3245, -0.5201, 1.0536, -1.0747, -0.4880, -0.8538, 0.3860, 0.3297]],
  18015. device='cuda:0', grad_fn=<AddmmBackward>)
  18016. landmarks are: tensor([[[ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  18017. 0.0840],
  18018. [ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  18019. 0.1159],
  18020. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  18021. 0.1854],
  18022. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  18023. 0.1698],
  18024. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  18025. 0.0325],
  18026. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  18027. 0.3417],
  18028. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  18029. 0.1821],
  18030. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  18031. 0.3007]]], device='cuda:0')
  18032. loss_train_step before backward: tensor(0.0159, device='cuda:0', grad_fn=<MseLossBackward>)
  18033. loss_train_step after backward: tensor(0.0159, device='cuda:0', grad_fn=<MseLossBackward>)
  18034. loss_train: 2.330700110644102
  18035. step: 61
  18036. running loss: 0.038208198535149215
  18037. Train Steps: 61/90 Loss: 0.0382 torch.Size([8, 600, 800])
  18038. torch.Size([8, 8])
  18039. tensor([[0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  18040. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  18041. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  18042. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  18043. [0.6100, 0.4071, 0.7601, 0.3444, 0.3400, 0.4117, 0.5625, 0.5617],
  18044. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  18045. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  18046. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058]],
  18047. device='cuda:0', dtype=torch.float64)
  18048. predictions are: tensor([[ 0.5166, -0.4363, 1.5673, 0.4389, -0.3340, 0.1185, 0.6154, 0.3582],
  18049. [ 0.7376, -0.2867, 1.6665, -0.9273, -0.1881, -1.2132, 0.7366, 0.0424],
  18050. [ 1.0151, -0.0670, 1.6360, 0.0200, -0.5590, -0.5761, 0.2286, 0.3074],
  18051. [-1.9647, -2.0599, 1.0725, -0.9805, -0.3861, -0.9972, 0.1053, 0.3411],
  18052. [ 0.7916, -0.2394, 1.3005, -0.7080, -0.6687, -0.2677, 0.3271, 0.2352],
  18053. [ 0.7570, -0.3201, 1.7928, -0.0304, -0.3660, 0.1177, 0.9711, 0.0881],
  18054. [ 0.8833, -0.1852, 1.0046, -1.0671, -0.4564, -1.1528, 0.3791, 0.2964],
  18055. [ 0.7265, -0.2935, 1.6835, -0.2477, -0.4694, -0.0076, 0.2798, 0.0503]],
  18056. device='cuda:0', grad_fn=<AddmmBackward>)
  18057. landmarks are: tensor([[[ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  18058. 0.5393],
  18059. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  18060. 0.0953],
  18061. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  18062. 0.4393],
  18063. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  18064. 0.4543],
  18065. [ 0.5318, -0.4056, 1.2249, -0.6949, -0.7155, -0.3844, 0.3122,
  18066. 0.3084],
  18067. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  18068. 0.1608],
  18069. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  18070. 0.2391],
  18071. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  18072. 0.0502]]], device='cuda:0')
  18073. loss_train_step before backward: tensor(0.0206, device='cuda:0', grad_fn=<MseLossBackward>)
  18074. loss_train_step after backward: tensor(0.0206, device='cuda:0', grad_fn=<MseLossBackward>)
  18075. loss_train: 2.351294633001089
  18076. step: 62
  18077. running loss: 0.03792410698388853
  18078.  
  18079. Train Steps: 62/90 Loss: 0.0379 torch.Size([8, 600, 800])
  18080. torch.Size([8, 8])
  18081. tensor([[0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  18082. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  18083. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  18084. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  18085. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  18086. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  18087. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  18088. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433]],
  18089. device='cuda:0', dtype=torch.float64)
  18090. predictions are: tensor([[ 0.9962, -0.0934, 1.1704, -0.8884, -0.5775, -0.9059, 0.1283, 0.0411],
  18091. [ 0.5343, -0.3708, 0.9757, -1.0411, -0.3740, -1.2404, 0.1549, 0.3203],
  18092. [ 0.6687, -0.3089, 1.6206, -0.1213, -0.5958, -0.6372, 0.2967, 0.3001],
  18093. [ 0.9464, -0.1766, 1.5838, 0.2979, -0.3140, 0.3399, 1.1289, 0.2496],
  18094. [ 0.8749, -0.1664, 1.7403, -0.0485, -0.2417, 0.4094, 0.6488, 0.1518],
  18095. [-2.2750, -2.2735, 1.1797, -0.9250, -0.4382, -1.0054, 0.2959, 0.2726],
  18096. [ 0.6862, -0.2847, 1.3516, -0.7464, -0.5798, -1.0829, 0.1398, 0.1386],
  18097. [ 0.9209, -0.1630, 1.7334, -0.0049, -0.1730, 0.2321, 0.8091, 0.1891]],
  18098. device='cuda:0', grad_fn=<AddmmBackward>)
  18099. landmarks are: tensor([[[ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  18100. 0.0141],
  18101. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  18102. 0.3469],
  18103. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  18104. 0.4032],
  18105. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  18106. 0.3425],
  18107. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  18108. 0.0682],
  18109. [-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  18110. 0.1253],
  18111. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  18112. -0.0220],
  18113. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  18114. 0.2237]]], device='cuda:0')
  18115. loss_train_step before backward: tensor(0.0234, device='cuda:0', grad_fn=<MseLossBackward>)
  18116. loss_train_step after backward: tensor(0.0234, device='cuda:0', grad_fn=<MseLossBackward>)
  18117. loss_train: 2.3746544364839792
  18118. step: 63
  18119. running loss: 0.03769292756323776
  18120. Train Steps: 63/90 Loss: 0.0377 torch.Size([8, 600, 800])
  18121. torch.Size([8, 8])
  18122. tensor([[0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  18123. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  18124. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  18125. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  18126. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  18127. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  18128. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  18129. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583]],
  18130. device='cuda:0', dtype=torch.float64)
  18131. predictions are: tensor([[ 0.7226, -0.3009, 1.7418, -0.4842, -0.5559, -0.6611, 0.4734, 0.2265],
  18132. [ 0.4656, -0.4734, 1.4132, -0.7718, -0.6248, -0.4430, 0.5061, 0.1726],
  18133. [ 0.5246, -0.4583, 1.6505, 0.0021, -0.4564, 0.2503, 0.5228, 0.1319],
  18134. [ 0.3909, -0.5617, 1.6733, 0.2320, -0.2253, 0.2285, 0.9119, 0.1082],
  18135. [ 0.7132, -0.3086, 0.9763, -0.9335, -0.6716, -0.7552, 0.1523, 0.2934],
  18136. [ 0.4919, -0.4394, 1.6127, 0.4938, -0.3679, -0.0914, 0.3918, 0.3192],
  18137. [ 0.6757, -0.3431, 1.2730, -1.1612, -0.1780, -1.3853, 0.4469, 0.1643],
  18138. [ 0.1408, -0.6819, 1.6216, -0.6210, -0.6415, -0.3399, 0.3708, 0.2362]],
  18139. device='cuda:0', grad_fn=<AddmmBackward>)
  18140. landmarks are: tensor([[[ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  18141. 0.3315],
  18142. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  18143. 0.1159],
  18144. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  18145. 0.0688],
  18146. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  18147. 0.1004],
  18148. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  18149. 0.3315],
  18150. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  18151. 0.3007],
  18152. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  18153. 0.2083],
  18154. [ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  18155. 0.2930]]], device='cuda:0')
  18156. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  18157. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  18158. loss_train: 2.3852399922907352
  18159. step: 64
  18160. running loss: 0.03726937487954274
  18161. Train Steps: 64/90 Loss: 0.0373 torch.Size([8, 600, 800])
  18162. torch.Size([8, 8])
  18163. tensor([[0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  18164. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  18165. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  18166. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  18167. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  18168. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  18169. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  18170. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300]],
  18171. device='cuda:0', dtype=torch.float64)
  18172. predictions are: tensor([[-0.2325, -0.9602, 1.2720, -1.0271, -0.3637, -0.9876, 0.4289, 0.2526],
  18173. [ 0.4505, -0.5013, 1.8136, 0.0927, -0.1843, 0.4526, 0.6604, 0.1773],
  18174. [ 0.8687, -0.2430, 1.0114, -1.1226, -0.5207, -0.9863, 0.3914, 0.2113],
  18175. [ 0.6572, -0.3616, 1.5121, -0.5709, -0.6501, -0.3371, 0.4752, 0.4255],
  18176. [ 0.7217, -0.3336, 1.3004, -1.0443, -0.2111, -1.2127, 0.4349, 0.1557],
  18177. [ 0.3431, -0.5483, 1.2653, -0.8805, -0.6536, -0.6157, 0.3194, 0.1887],
  18178. [ 0.3079, -0.6517, 1.7307, 0.5960, -0.5675, 0.1268, 0.7210, 0.0536],
  18179. [ 0.6070, -0.3925, 1.6147, -0.2691, -0.6091, -0.5846, 0.4420, 0.1639]],
  18180. device='cuda:0', grad_fn=<AddmmBackward>)
  18181. landmarks are: tensor([[[ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  18182. 0.1698],
  18183. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  18184. 0.2237],
  18185. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  18186. 0.2930],
  18187. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  18188. 0.5624],
  18189. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  18190. 0.2083],
  18191. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  18192. 0.2545],
  18193. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  18194. 0.0261],
  18195. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  18196. 0.1621]]], device='cuda:0')
  18197. loss_train_step before backward: tensor(0.0348, device='cuda:0', grad_fn=<MseLossBackward>)
  18198. loss_train_step after backward: tensor(0.0348, device='cuda:0', grad_fn=<MseLossBackward>)
  18199. loss_train: 2.420039724558592
  18200. step: 65
  18201. running loss: 0.03723138037782449
  18202. Train Steps: 65/90 Loss: 0.0372 torch.Size([8, 600, 800])
  18203. torch.Size([8, 8])
  18204. tensor([[0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  18205. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  18206. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  18207. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  18208. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  18209. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  18210. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  18211. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667]],
  18212. device='cuda:0', dtype=torch.float64)
  18213. predictions are: tensor([[ 0.5645, -0.4307, 1.5633, -0.5971, -0.4191, -0.9917, 0.6887, 0.1340],
  18214. [ 0.7224, -0.3567, 1.5991, -0.2279, -0.4591, 0.3066, 0.8598, 0.1349],
  18215. [ 0.2056, -0.6534, 1.6414, -0.3374, -0.5785, -0.4410, 0.4228, 0.3512],
  18216. [ 0.9953, -0.1275, 1.5085, -0.5903, -0.7189, -0.6876, 0.1175, 0.0700],
  18217. [ 0.3773, -0.5384, 1.5414, -0.1393, -0.3429, 0.0346, 0.3330, 0.2650],
  18218. [ 0.5671, -0.4097, 1.5155, 0.2661, -0.4947, -0.1401, 0.4437, 0.1082],
  18219. [ 0.5217, -0.4431, 1.5807, -0.2839, -0.1187, 0.0570, 0.4562, 0.2333],
  18220. [ 0.3458, -0.5701, 1.5426, -0.6712, -0.6604, -0.4480, 0.5075, 0.3324]],
  18221. device='cuda:0', grad_fn=<AddmmBackward>)
  18222. landmarks are: tensor([[[ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  18223. 0.2035],
  18224. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  18225. 0.1554],
  18226. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  18227. 0.3238],
  18228. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  18229. 0.0851],
  18230. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  18231. 0.3084],
  18232. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  18233. 0.2391],
  18234. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  18235. 0.2853],
  18236. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  18237. 0.3315]]], device='cuda:0')
  18238. loss_train_step before backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  18239. loss_train_step after backward: tensor(0.0216, device='cuda:0', grad_fn=<MseLossBackward>)
  18240. loss_train: 2.4416198935359716
  18241. step: 66
  18242. running loss: 0.03699424081115109
  18243.  
  18244. Train Steps: 66/90 Loss: 0.0370 torch.Size([8, 600, 800])
  18245. torch.Size([8, 8])
  18246. tensor([[0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  18247. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  18248. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  18249. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  18250. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  18251. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  18252. [0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874],
  18253. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633]],
  18254. device='cuda:0', dtype=torch.float64)
  18255. predictions are: tensor([[ 0.5820, -0.4485, 1.6251, -0.0173, -0.6775, 0.0058, 0.4772, 0.1054],
  18256. [ 0.8377, -0.2557, 1.0665, -1.3392, -0.4191, -1.2162, 0.4193, 0.1196],
  18257. [ 0.7974, -0.2742, 1.7813, -0.2587, -0.6334, -0.5775, 0.6602, 0.2203],
  18258. [ 0.5028, -0.4743, 1.6421, -0.0655, -0.2851, 0.0431, 0.2469, 0.1449],
  18259. [ 0.6925, -0.3438, 1.5984, -0.0479, -0.4077, 0.1826, 0.6601, 0.2109],
  18260. [-1.8189, -2.0004, 1.1048, -1.0873, -0.5757, -0.9374, 0.1628, 0.3239],
  18261. [ 0.8944, -0.1868, 1.5583, 0.3516, -0.4822, 0.1158, 0.2916, 0.2641],
  18262. [ 0.9293, -0.2237, 1.5071, -1.1302, -0.2633, -1.0934, 1.0246, 0.1812]],
  18263. device='cuda:0', grad_fn=<AddmmBackward>)
  18264. landmarks are: tensor([[[ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  18265. -0.0534],
  18266. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  18267. 0.1082],
  18268. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  18269. 0.1005],
  18270. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  18271. -0.0039],
  18272. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  18273. 0.1474],
  18274. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  18275. 0.1005],
  18276. [ 0.5453, -0.4091, 1.7499, 0.1390, -0.2940, -0.0996, 0.1300,
  18277. 0.4272],
  18278. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  18279. 0.3157]]], device='cuda:0')
  18280. loss_train_step before backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  18281. loss_train_step after backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  18282. loss_train: 2.466248968616128
  18283. step: 67
  18284. running loss: 0.03680968609874818
  18285. Train Steps: 67/90 Loss: 0.0368 torch.Size([8, 600, 800])
  18286. torch.Size([8, 8])
  18287. tensor([[0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  18288. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  18289. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  18290. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  18291. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  18292. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  18293. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  18294. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433]],
  18295. device='cuda:0', dtype=torch.float64)
  18296. predictions are: tensor([[ 0.5870, -0.4610, 1.3650, -1.2479, -0.2693, -0.9599, 0.7566, 0.1759],
  18297. [ 0.4017, -0.5527, 1.6589, -0.4986, -0.6020, -0.2526, 0.3103, 0.3728],
  18298. [ 0.7367, -0.3825, 1.8921, 0.1706, -0.5680, -0.3303, 0.6146, -0.0270],
  18299. [ 0.3524, -0.5784, 1.2265, -1.1055, -0.5940, -0.6406, 0.4431, 0.2381],
  18300. [ 0.4678, -0.5461, 1.7167, -0.0406, -0.5576, -0.2412, 0.6385, 0.1505],
  18301. [ 0.4932, -0.5308, 1.5870, 0.1907, -0.4714, 0.0821, 0.8611, 0.1655],
  18302. [ 0.6406, -0.3934, 1.2931, -0.9672, -0.4253, -0.9065, 0.1885, 0.2612],
  18303. [ 0.3304, -0.5758, 1.4735, -0.6033, -0.6111, -0.6446, 0.1847, 0.2778]],
  18304. device='cuda:0', grad_fn=<AddmmBackward>)
  18305. landmarks are: tensor([[[ 0.6141, -0.4153, 1.4208, -1.2697, -0.2940, -1.0234, 0.8644,
  18306. 0.1715],
  18307. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  18308. 0.3238],
  18309. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  18310. -0.0049],
  18311. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  18312. 0.2545],
  18313. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  18314. 0.1082],
  18315. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  18316. 0.2356],
  18317. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  18318. 0.3700],
  18319. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  18320. 0.2237]]], device='cuda:0')
  18321. loss_train_step before backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  18322. loss_train_step after backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  18323. loss_train: 2.479281820356846
  18324. step: 68
  18325. running loss: 0.036460026769953614
  18326. Train Steps: 68/90 Loss: 0.0365 torch.Size([8, 600, 800])
  18327. torch.Size([8, 8])
  18328. tensor([[0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  18329. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  18330. [0.6203, 0.4078, 0.8800, 0.5083, 0.3900, 0.5000, 0.6100, 0.5583],
  18331. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  18332. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  18333. [0.6216, 0.4100, 0.7350, 0.2067, 0.4325, 0.2050, 0.5950, 0.5333],
  18334. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  18335. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064]],
  18336. device='cuda:0', dtype=torch.float64)
  18337. predictions are: tensor([[ 0.4208, -0.5286, 1.5660, -0.6811, -0.6707, -0.0938, 0.6795, 0.2433],
  18338. [ 0.4844, -0.5045, 1.7132, -0.2291, -0.6871, -0.6187, 0.3231, 0.2310],
  18339. [ 0.5048, -0.5052, 1.8143, 0.1818, -0.5250, 0.1356, 0.5827, 0.1163],
  18340. [ 0.4867, -0.5049, 1.7367, -0.1605, -0.5433, -0.1209, 0.4980, 0.3073],
  18341. [ 0.8457, -0.3071, 1.1189, -1.3358, -0.4476, -1.1324, 0.6848, 0.1563],
  18342. [ 0.5788, -0.4468, 1.1256, -1.3333, -0.3039, -1.3215, 0.4436, 0.2026],
  18343. [ 0.4527, -0.5231, 1.6824, -0.2289, -0.6501, -0.3667, 0.5120, 0.2052],
  18344. [ 0.2446, -0.6634, 1.8283, 0.1008, -0.0463, 0.0247, 0.2871, 0.1155]],
  18345. device='cuda:0', grad_fn=<AddmmBackward>)
  18346. landmarks are: tensor([[[ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  18347. 0.2083],
  18348. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  18349. 0.4032],
  18350. [ 0.5794, -0.4023, 1.7788, 0.0620, -0.4845, 0.0236, 0.5316,
  18351. 0.2930],
  18352. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  18353. 0.3161],
  18354. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  18355. 0.2468],
  18356. [ 0.5853, -0.3920, 1.1090, -1.3313, -0.2882, -1.3390, 0.4624,
  18357. 0.1775],
  18358. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  18359. 0.2853],
  18360. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  18361. 0.0532]]], device='cuda:0')
  18362. loss_train_step before backward: tensor(0.0102, device='cuda:0', grad_fn=<MseLossBackward>)
  18363. loss_train_step after backward: tensor(0.0102, device='cuda:0', grad_fn=<MseLossBackward>)
  18364. loss_train: 2.4894718173891306
  18365. step: 69
  18366. running loss: 0.03607930170129175
  18367. Train Steps: 69/90 Loss: 0.0361 torch.Size([8, 600, 800])
  18368. torch.Size([8, 8])
  18369. tensor([[0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  18370. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  18371. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  18372. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  18373. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  18374. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  18375. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  18376. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550]],
  18377. device='cuda:0', dtype=torch.float64)
  18378. predictions are: tensor([[ 0.4360, -0.4805, 1.6811, -0.2378, -0.3917, 0.2554, 0.4442, 0.2100],
  18379. [ 0.7784, -0.3134, 1.6368, -0.8815, -0.3902, -1.1743, 0.6127, 0.2010],
  18380. [ 0.4541, -0.5240, 1.7817, 0.1039, -0.5630, -0.0397, 0.6083, 0.1318],
  18381. [ 0.6691, -0.3933, 0.9687, -1.3212, -0.6521, -1.1426, 0.4844, 0.1541],
  18382. [ 0.1000, -0.7177, 1.7854, -0.0132, -0.3303, -0.0130, 0.2209, 0.1332],
  18383. [ 0.6156, -0.4212, 1.1427, -1.2524, -0.5990, -1.0458, 0.6910, 0.2183],
  18384. [ 0.3454, -0.6151, 1.7236, 0.0457, -0.5889, -0.2072, 0.4643, 0.2432],
  18385. [ 0.4638, -0.4857, 1.7544, -0.1624, -0.1677, -0.1337, 0.4243, 0.2240]],
  18386. device='cuda:0', grad_fn=<AddmmBackward>)
  18387. landmarks are: tensor([[[ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  18388. 0.2936],
  18389. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  18390. 0.2043],
  18391. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  18392. 0.1005],
  18393. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  18394. 0.0862],
  18395. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  18396. 0.0682],
  18397. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  18398. 0.2391],
  18399. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  18400. 0.3777],
  18401. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  18402. 0.2776]]], device='cuda:0')
  18403. loss_train_step before backward: tensor(0.0172, device='cuda:0', grad_fn=<MseLossBackward>)
  18404. loss_train_step after backward: tensor(0.0172, device='cuda:0', grad_fn=<MseLossBackward>)
  18405. loss_train: 2.506653221324086
  18406. step: 70
  18407. running loss: 0.03580933173320123
  18408.  
  18409. Train Steps: 70/90 Loss: 0.0358 torch.Size([8, 600, 800])
  18410. torch.Size([8, 8])
  18411. tensor([[0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  18412. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  18413. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  18414. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  18415. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  18416. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  18417. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  18418. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250]],
  18419. device='cuda:0', dtype=torch.float64)
  18420. predictions are: tensor([[ 0.8442, -0.2878, 1.8822, -0.1673, -0.3492, -1.0421, 0.6640, 0.0426],
  18421. [ 0.7231, -0.3500, 1.3377, -0.9462, -0.5609, -0.9033, 0.3942, 0.3295],
  18422. [ 0.1892, -0.6626, 1.2548, -0.9844, -0.6395, -0.4658, 0.4720, 0.2314],
  18423. [ 0.4308, -0.5277, 1.1750, -1.1513, -0.5298, -0.9072, 0.5386, 0.2045],
  18424. [ 0.3504, -0.5871, 1.8031, -0.1725, -0.5336, -0.3180, 0.3269, 0.2640],
  18425. [ 0.2974, -0.5743, 1.7718, 0.0869, -0.1664, 0.3221, 0.2445, 0.2308],
  18426. [ 0.6129, -0.4227, 1.6943, -0.1902, -0.5263, 0.1815, 0.7341, 0.1576],
  18427. [ 0.4973, -0.4933, 1.8406, -0.6789, -0.4059, -0.7973, 0.6918, 0.1629]],
  18428. device='cuda:0', grad_fn=<AddmmBackward>)
  18429. landmarks are: tensor([[[ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  18430. 0.0081],
  18431. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  18432. 0.3392],
  18433. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  18434. 0.2545],
  18435. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  18436. 0.1779],
  18437. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  18438. 0.2930],
  18439. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  18440. 0.0622],
  18441. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  18442. 0.1715],
  18443. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  18444. 0.1390]]], device='cuda:0')
  18445. loss_train_step before backward: tensor(0.0133, device='cuda:0', grad_fn=<MseLossBackward>)
  18446. loss_train_step after backward: tensor(0.0133, device='cuda:0', grad_fn=<MseLossBackward>)
  18447. loss_train: 2.5199545985087752
  18448. step: 71
  18449. running loss: 0.03549231828885599
  18450. Train Steps: 71/90 Loss: 0.0355 torch.Size([8, 600, 800])
  18451. torch.Size([8, 8])
  18452. tensor([[0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  18453. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  18454. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  18455. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  18456. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  18457. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  18458. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  18459. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267]],
  18460. device='cuda:0', dtype=torch.float64)
  18461. predictions are: tensor([[ 0.5248, -0.4641, 1.7781, -0.0666, -0.2967, -0.0768, 0.3448, 0.2732],
  18462. [ 0.6372, -0.3929, 1.7426, -0.5425, -0.6774, -0.6999, 0.3333, 0.1048],
  18463. [ 0.3841, -0.5738, 1.0240, -1.3658, -0.5510, -0.8458, 0.6108, 0.2919],
  18464. [ 0.4925, -0.4407, 1.6825, -0.1932, -0.6649, -0.5765, 0.1744, 0.2428],
  18465. [ 0.3824, -0.5599, 1.7717, 0.1097, -0.2361, 0.2542, 0.5080, 0.1504],
  18466. [ 0.6134, -0.4053, 1.7990, -0.2906, -0.3894, 0.1740, 0.5379, 0.2180],
  18467. [ 0.6294, -0.4055, 1.8176, -0.1581, -0.6121, -0.5588, 0.3933, 0.0921],
  18468. [ 0.5168, -0.5085, 1.4544, -1.3228, -0.1340, -1.4168, 0.8669, 0.1577]],
  18469. device='cuda:0', grad_fn=<AddmmBackward>)
  18470. landmarks are: tensor([[[ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  18471. 0.3057],
  18472. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  18473. 0.0851],
  18474. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  18475. 0.2699],
  18476. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  18477. 0.2468],
  18478. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  18479. 0.0764],
  18480. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  18481. 0.2699],
  18482. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  18483. 0.1824],
  18484. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  18485. 0.1467]]], device='cuda:0')
  18486. loss_train_step before backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  18487. loss_train_step after backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  18488. loss_train: 2.5260266615077853
  18489. step: 72
  18490. running loss: 0.03508370363205257
  18491. Train Steps: 72/90 Loss: 0.0351 torch.Size([8, 600, 800])
  18492. torch.Size([8, 8])
  18493. tensor([[0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  18494. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  18495. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  18496. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  18497. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  18498. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  18499. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  18500. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778]],
  18501. device='cuda:0', dtype=torch.float64)
  18502. predictions are: tensor([[ 0.6334, -0.4061, 1.6728, -1.1904, -0.2485, -1.1383, 0.6056, 0.1502],
  18503. [ 0.3768, -0.5504, 1.8360, 0.0306, -0.2621, 0.2948, 0.3617, 0.1141],
  18504. [ 0.7082, -0.3276, 1.7454, 0.2261, -0.4818, -0.0875, 0.3203, 0.2773],
  18505. [ 0.4360, -0.5399, 1.2143, -1.1695, -0.4310, -1.0023, 0.5435, 0.3108],
  18506. [ 0.7105, -0.3180, 1.7618, -0.0368, -0.3727, -0.7612, 0.3573, 0.3785],
  18507. [ 0.3095, -0.5736, 1.6237, -0.7393, -0.6324, -0.0113, 0.5981, 0.2196],
  18508. [ 0.5194, -0.4909, 1.8626, 0.1112, -0.5627, -0.3060, 0.6890, 0.1156],
  18509. [ 0.3677, -0.5692, 1.1701, -1.4718, -0.4682, -1.2223, 0.2472, 0.0670]],
  18510. device='cuda:0', grad_fn=<AddmmBackward>)
  18511. landmarks are: tensor([[[ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  18512. 0.1621],
  18513. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  18514. 0.0764],
  18515. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  18516. 0.3007],
  18517. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  18518. 0.3854],
  18519. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  18520. 0.5762],
  18521. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  18522. 0.2083],
  18523. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  18524. 0.2516],
  18525. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  18526. -0.0791]]], device='cuda:0')
  18527. loss_train_step before backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  18528. loss_train_step after backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  18529. loss_train: 2.5383365219458938
  18530. step: 73
  18531. running loss: 0.03477173317734101
  18532. Train Steps: 73/90 Loss: 0.0348 torch.Size([8, 600, 800])
  18533. torch.Size([8, 8])
  18534. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  18535. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  18536. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  18537. [0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  18538. [0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  18539. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  18540. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  18541. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350]],
  18542. device='cuda:0', dtype=torch.float64)
  18543. predictions are: tensor([[ 5.4418e-01, -4.4780e-01, 1.1559e+00, -1.3561e+00, -5.1064e-01,
  18544. -1.0292e+00, 4.7806e-01, 1.2951e-01],
  18545. [-1.2765e+00, -1.6316e+00, 1.6362e+00, -1.2697e+00, 1.1559e-01,
  18546. -9.7170e-01, 9.1181e-01, 3.6843e-01],
  18547. [ 8.5290e-01, -2.6447e-01, 1.9745e+00, -1.9718e-01, -5.8324e-01,
  18548. -2.4832e-01, 6.2102e-01, 1.3964e-01],
  18549. [ 6.6774e-01, -3.8083e-01, 1.7173e+00, 6.7244e-04, -4.7820e-01,
  18550. -1.5158e-01, 5.3323e-01, 1.8132e-01],
  18551. [ 6.6050e-01, -3.5493e-01, 1.7779e+00, -1.7826e-01, -1.4851e-01,
  18552. 1.2158e-01, 2.9447e-01, 1.5800e-01],
  18553. [ 1.0210e+00, -1.2668e-01, 1.6734e+00, -6.9517e-01, -6.8150e-01,
  18554. -4.4491e-01, 4.3289e-01, 2.1880e-01],
  18555. [ 6.1925e-01, -3.6422e-01, 1.4968e+00, -5.0518e-01, -4.9594e-01,
  18556. -1.0194e+00, 1.9179e-01, 3.0572e-01],
  18557. [ 7.5316e-01, -3.0276e-01, 1.7571e+00, -1.9632e-03, -4.9168e-01,
  18558. -3.3726e-01, 1.9005e-01, 1.0943e-01]], device='cuda:0',
  18559. grad_fn=<AddmmBackward>)
  18560. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  18561. 0.0562],
  18562. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  18563. 0.3371],
  18564. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  18565. 0.1390],
  18566. [ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  18567. 0.2237],
  18568. [ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  18569. 0.2930],
  18570. [ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  18571. 0.2930],
  18572. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  18573. 0.3928],
  18574. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  18575. 0.1854]]], device='cuda:0')
  18576. loss_train_step before backward: tensor(0.0367, device='cuda:0', grad_fn=<MseLossBackward>)
  18577. loss_train_step after backward: tensor(0.0367, device='cuda:0', grad_fn=<MseLossBackward>)
  18578. loss_train: 2.5750327026471496
  18579. step: 74
  18580. running loss: 0.03479773922496148
  18581.  
  18582. Train Steps: 74/90 Loss: 0.0348 torch.Size([8, 600, 800])
  18583. torch.Size([8, 8])
  18584. tensor([[0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  18585. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  18586. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  18587. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  18588. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  18589. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  18590. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  18591. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433]],
  18592. device='cuda:0', dtype=torch.float64)
  18593. predictions are: tensor([[ 0.5096, -0.4283, 1.7634, -0.3190, -0.4290, -0.4513, 0.0348, 0.2677],
  18594. [ 0.3356, -0.5704, 1.5252, -1.1793, -0.3212, -1.1210, 0.4800, 0.1549],
  18595. [ 0.5342, -0.4191, 1.7516, -0.4826, -0.4391, 0.1963, 0.6230, 0.2563],
  18596. [ 0.5286, -0.4179, 1.7052, -0.2810, -0.3513, 0.1736, 0.3214, 0.2292],
  18597. [ 0.6839, -0.3655, 1.7865, 0.1565, -0.4345, -0.2359, 0.5560, 0.0668],
  18598. [ 0.5197, -0.4576, 1.6927, -0.9587, -0.3475, -1.0610, 0.6220, 0.1999],
  18599. [ 0.7338, -0.3127, 1.4894, -0.0715, -0.4081, -0.2553, 0.6845, 0.3432],
  18600. [ 0.4452, -0.4472, 1.5220, -0.7479, -0.5569, -0.9219, 0.1381, 0.2604]],
  18601. device='cuda:0', grad_fn=<AddmmBackward>)
  18602. landmarks are: tensor([[[ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  18603. 0.2409],
  18604. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  18605. 0.0807],
  18606. [ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  18607. 0.1852],
  18608. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  18609. 0.3047],
  18610. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  18611. -0.0049],
  18612. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  18613. 0.1931],
  18614. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  18615. 0.3585],
  18616. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  18617. 0.2237]]], device='cuda:0')
  18618. loss_train_step before backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  18619. loss_train_step after backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  18620. loss_train: 2.5915102371945977
  18621. step: 75
  18622. running loss: 0.0345534698292613
  18623. Train Steps: 75/90 Loss: 0.0346 torch.Size([8, 600, 800])
  18624. torch.Size([8, 8])
  18625. tensor([[0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  18626. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  18627. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  18628. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  18629. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  18630. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  18631. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  18632. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960]],
  18633. device='cuda:0', dtype=torch.float64)
  18634. predictions are: tensor([[ 0.2447, -0.6079, 1.0104, -1.2852, -0.3396, -1.1869, 0.1303, 0.1883],
  18635. [-0.0586, -0.8399, 1.7326, -1.1093, 0.0978, -0.9643, 0.9543, 0.2626],
  18636. [ 0.6468, -0.3746, 1.8626, 0.2272, -0.6019, -0.0139, 0.5560, 0.1825],
  18637. [ 0.6586, -0.3544, 1.8994, -0.1186, -0.5412, -0.0036, 0.1801, 0.2295],
  18638. [ 0.6833, -0.3836, 1.8911, -0.0879, -0.6091, -0.1609, 0.6603, 0.1590],
  18639. [ 0.1767, -0.6590, 1.0074, -1.3677, -0.3177, -1.2696, 0.1919, 0.1461],
  18640. [ 0.6589, -0.3171, 1.5171, -0.1376, -0.4783, -0.5075, 0.2700, 0.4525],
  18641. [ 0.7460, -0.2777, 1.8169, -0.8115, -0.1521, -0.7355, 0.5067, 0.1502]],
  18642. device='cuda:0', grad_fn=<AddmmBackward>)
  18643. landmarks are: tensor([[[ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  18644. 0.1253],
  18645. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  18646. 0.3050],
  18647. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  18648. 0.1608],
  18649. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  18650. 0.3087],
  18651. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  18652. 0.1768],
  18653. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  18654. 0.0261],
  18655. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  18656. 0.5071],
  18657. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  18658. 0.0051]]], device='cuda:0')
  18659. loss_train_step before backward: tensor(0.0396, device='cuda:0', grad_fn=<MseLossBackward>)
  18660. loss_train_step after backward: tensor(0.0396, device='cuda:0', grad_fn=<MseLossBackward>)
  18661. loss_train: 2.6311407880857587
  18662. step: 76
  18663. running loss: 0.03462027352744419
  18664. Train Steps: 76/90 Loss: 0.0346 torch.Size([8, 600, 800])
  18665. torch.Size([8, 8])
  18666. tensor([[0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  18667. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  18668. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  18669. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  18670. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  18671. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  18672. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  18673. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407]],
  18674. device='cuda:0', dtype=torch.float64)
  18675. predictions are: tensor([[ 0.5096, -0.4109, 1.4637, -0.8476, -0.5801, -0.3472, 0.3674, 0.1769],
  18676. [ 0.8256, -0.1998, 1.7899, -0.3321, -0.4646, -0.4428, 0.3457, 0.2799],
  18677. [-1.3500, -1.6118, 1.2457, -1.3102, -0.3704, -1.1211, 0.2283, 0.2938],
  18678. [ 0.8079, -0.2665, 1.8021, 0.1917, -0.4374, -0.2552, 0.4940, 0.0330],
  18679. [ 0.8357, -0.2062, 1.8751, -0.1593, -0.4265, 0.0671, 0.5050, 0.2274],
  18680. [ 0.6870, -0.3474, 1.9166, -0.1231, -0.2887, -0.2234, 0.7814, 0.2500],
  18681. [ 0.5397, -0.4013, 1.2299, -1.1997, 0.0241, -1.3590, 0.4714, 0.2773],
  18682. [ 0.7879, -0.2330, 1.6780, -0.3961, -0.5048, -0.8428, 0.1642, 0.2339]],
  18683. device='cuda:0', grad_fn=<AddmmBackward>)
  18684. landmarks are: tensor([[[ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  18685. 0.0351],
  18686. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  18687. 0.1852],
  18688. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  18689. 0.2853],
  18690. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  18691. -0.0102],
  18692. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  18693. 0.1775],
  18694. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  18695. 0.4386],
  18696. [ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  18697. 0.2160],
  18698. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  18699. 0.2116]]], device='cuda:0')
  18700. loss_train_step before backward: tensor(0.0323, device='cuda:0', grad_fn=<MseLossBackward>)
  18701. loss_train_step after backward: tensor(0.0323, device='cuda:0', grad_fn=<MseLossBackward>)
  18702. loss_train: 2.6634310306981206
  18703. step: 77
  18704. running loss: 0.03459001338568988
  18705. Train Steps: 77/90 Loss: 0.0346 torch.Size([8, 600, 800])
  18706. torch.Size([8, 8])
  18707. tensor([[0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  18708. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  18709. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  18710. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  18711. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  18712. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  18713. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  18714. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967]],
  18715. device='cuda:0', dtype=torch.float64)
  18716. predictions are: tensor([[ 0.4709, -0.4453, 1.0841, -1.2571, -0.3121, -1.3903, 0.4219, 0.4682],
  18717. [ 0.5359, -0.4140, 1.8498, -0.2117, -0.0671, 0.0072, 0.5131, 0.3493],
  18718. [ 0.7026, -0.3289, 1.8133, -0.0557, -0.2773, -0.1168, 0.3260, 0.2713],
  18719. [ 0.3245, -0.5751, 1.8032, -0.2144, -0.1927, 0.1364, 0.4431, 0.2329],
  18720. [ 0.6127, -0.4122, 1.7185, -0.8684, -0.6133, -0.9153, 0.6240, 0.0393],
  18721. [ 0.4521, -0.5100, 1.7841, -0.8017, -0.4028, -1.2877, 0.5973, 0.0130],
  18722. [ 0.4815, -0.4352, 1.6452, -0.2379, -0.5157, -0.3379, 0.2251, 0.3758],
  18723. [ 0.7428, -0.3001, 1.7455, -0.2779, -0.5834, -0.0526, 0.3788, 0.1368]],
  18724. device='cuda:0', grad_fn=<AddmmBackward>)
  18725. landmarks are: tensor([[[ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  18726. 0.5855],
  18727. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  18728. 0.4162],
  18729. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  18730. 0.3084],
  18731. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  18732. 0.2006],
  18733. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  18734. -0.0220],
  18735. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  18736. -0.0957],
  18737. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  18738. 0.3968],
  18739. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  18740. 0.0081]]], device='cuda:0')
  18741. loss_train_step before backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  18742. loss_train_step after backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  18743. loss_train: 2.6766006434336305
  18744. step: 78
  18745. running loss: 0.03431539286453372
  18746.  
  18747. Train Steps: 78/90 Loss: 0.0343 torch.Size([8, 600, 800])
  18748. torch.Size([8, 8])
  18749. tensor([[0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  18750. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  18751. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  18752. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  18753. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  18754. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  18755. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  18756. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719]],
  18757. device='cuda:0', dtype=torch.float64)
  18758. predictions are: tensor([[ 0.5273, -0.4399, 1.8495, -0.1630, -0.2124, -0.1018, 0.4078, 0.2698],
  18759. [ 0.5313, -0.4043, 1.3250, -1.3841, -0.2848, -1.3463, 0.4527, 0.3200],
  18760. [ 0.6812, -0.3249, 1.7316, -0.3940, -0.4961, -0.0325, 0.3028, 0.1664],
  18761. [ 0.5938, -0.4122, 1.8738, -0.2503, -0.4744, -0.6442, 0.5637, 0.1794],
  18762. [ 0.7607, -0.2876, 1.7610, -0.0193, -0.2895, 0.1308, 0.7129, 0.3571],
  18763. [ 0.5551, -0.4227, 1.8155, 0.0922, -0.4076, -0.4884, 0.3522, 0.0836],
  18764. [ 0.4960, -0.4693, 1.6879, -0.8681, -0.4898, -0.7002, 0.5810, 0.1831],
  18765. [ 0.3679, -0.5129, 1.5779, -0.5601, -0.5443, -0.5261, 0.1086, 0.2616]],
  18766. device='cuda:0', grad_fn=<AddmmBackward>)
  18767. landmarks are: tensor([[[ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  18768. 0.2391],
  18769. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  18770. 0.3315],
  18771. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  18772. 0.0081],
  18773. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  18774. 0.0325],
  18775. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  18776. 0.2249],
  18777. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  18778. -0.0102],
  18779. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  18780. 0.1080],
  18781. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  18782. 0.3559]]], device='cuda:0')
  18783. loss_train_step before backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  18784. loss_train_step after backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  18785. loss_train: 2.6960538187995553
  18786. step: 79
  18787. running loss: 0.0341272635291083
  18788. Train Steps: 79/90 Loss: 0.0341 torch.Size([8, 600, 800])
  18789. torch.Size([8, 8])
  18790. tensor([[0.6262, 0.4085, 0.8438, 0.3150, 0.4025, 0.2633, 0.6339, 0.4810],
  18791. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  18792. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  18793. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  18794. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  18795. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  18796. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  18797. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197]],
  18798. device='cuda:0', dtype=torch.float64)
  18799. predictions are: tensor([[ 0.6406, -0.3394, 1.5624, -0.9658, -0.4175, -1.0238, 0.4895, 0.0445],
  18800. [ 0.8191, -0.2232, 1.7964, -0.2992, -0.5615, -0.4212, 0.4417, 0.3493],
  18801. [ 0.4210, -0.5028, 1.7112, -0.0776, -0.3531, 0.2189, 0.5235, 0.2024],
  18802. [ 0.3600, -0.5230, 1.3145, -1.0232, -0.6596, -0.3986, 0.5122, 0.2381],
  18803. [ 0.4282, -0.4474, 1.7761, -0.7220, -0.1502, -1.1927, 0.5608, 0.2853],
  18804. [ 0.2045, -0.6083, 1.6021, -1.0291, -0.0299, -1.2599, 0.7801, 0.2161],
  18805. [ 0.6250, -0.3410, 1.7121, 0.1525, -0.6350, -0.5269, 0.2029, 0.1414],
  18806. [ 0.5669, -0.3527, 1.7078, 0.0535, -0.1782, 0.1812, 0.2248, 0.2197]],
  18807. device='cuda:0', grad_fn=<AddmmBackward>)
  18808. landmarks are: tensor([[[ 0.6064, -0.3990, 1.6113, -0.8309, -0.4268, -1.0696, 0.6421,
  18809. -0.0640],
  18810. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  18811. 0.3238],
  18812. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  18813. 0.1322],
  18814. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  18815. 0.2545],
  18816. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  18817. 0.1554],
  18818. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  18819. 0.2356],
  18820. [ 0.5379, -0.4358, 1.7326, 0.1852, -0.6058, -0.5461, 0.0684,
  18821. -0.0310],
  18822. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  18823. 0.1146]]], device='cuda:0')
  18824. loss_train_step before backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  18825. loss_train_step after backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  18826. loss_train: 2.7083711810410023
  18827. step: 80
  18828. running loss: 0.03385463976301253
  18829. Train Steps: 80/90 Loss: 0.0339 torch.Size([8, 600, 800])
  18830. torch.Size([8, 8])
  18831. tensor([[0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  18832. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  18833. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  18834. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  18835. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  18836. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  18837. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  18838. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209]],
  18839. device='cuda:0', dtype=torch.float64)
  18840. predictions are: tensor([[ 0.7237, -0.3149, 1.8418, -0.0973, -0.3929, 0.4974, 0.4936, 0.1480],
  18841. [ 0.5533, -0.4386, 2.0288, -0.0327, -0.5607, -0.3373, 0.6171, 0.0117],
  18842. [ 0.6416, -0.3521, 1.0816, -1.1016, -0.4769, -1.0356, 0.4465, 0.2484],
  18843. [-0.0895, -0.8211, 1.0411, -1.2723, -0.3167, -1.3586, 0.1415, 0.1784],
  18844. [ 0.0629, -0.7368, 2.1032, -0.5214, -0.1178, -1.0612, 0.8426, 0.1643],
  18845. [ 0.6451, -0.3647, 1.2101, -1.0310, -0.4915, -0.8103, 0.5724, 0.2705],
  18846. [ 0.6988, -0.3193, 1.5759, -0.4323, -0.6370, -0.3351, 0.2304, 0.1933],
  18847. [ 0.6208, -0.3282, 1.7503, -0.0942, -0.2058, -0.9515, 0.4224, 0.3945]],
  18848. device='cuda:0', grad_fn=<AddmmBackward>)
  18849. landmarks are: tensor([[[ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  18850. 0.3047],
  18851. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  18852. 0.1005],
  18853. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  18854. 0.2391],
  18855. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  18856. 0.2699],
  18857. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  18858. 0.2890],
  18859. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  18860. 0.3700],
  18861. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  18862. 0.2206],
  18863. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  18864. 0.5822]]], device='cuda:0')
  18865. loss_train_step before backward: tensor(0.1471, device='cuda:0', grad_fn=<MseLossBackward>)
  18866. loss_train_step after backward: tensor(0.1471, device='cuda:0', grad_fn=<MseLossBackward>)
  18867. loss_train: 2.855488333851099
  18868. step: 81
  18869. running loss: 0.03525294239322344
  18870. Train Steps: 81/90 Loss: 0.0353 torch.Size([8, 600, 800])
  18871. torch.Size([8, 8])
  18872. tensor([[ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  18873. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  18874. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  18875. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  18876. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  18877. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  18878. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402],
  18879. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301]],
  18880. device='cuda:0', dtype=torch.float64)
  18881. predictions are: tensor([[-1.1345, -1.4592, 0.8842, -1.3519, -0.4274, -1.4106, 0.0831, 0.2845],
  18882. [ 0.6571, -0.3376, 1.7894, 0.0479, -0.3040, -0.0971, 0.2572, 0.1928],
  18883. [ 0.6914, -0.2991, 1.3371, -1.1903, -0.2251, -1.5271, 0.3750, 0.1489],
  18884. [ 0.8150, -0.2614, 1.6584, -0.8945, -0.5536, -0.6788, 0.8310, 0.1009],
  18885. [ 0.7828, -0.2719, 1.6696, 0.2097, -0.3416, 0.3041, 0.8104, 0.3228],
  18886. [ 0.4134, -0.5005, 1.9845, -0.5028, -0.5451, -0.6079, 0.6033, 0.1341],
  18887. [ 0.7405, -0.2666, 1.6761, 0.0836, -0.4790, -0.1078, 0.1919, 0.2615],
  18888. [ 0.7103, -0.3291, 1.7885, 0.0517, -0.3564, -0.0208, 0.6138, 0.1718]],
  18889. device='cuda:0', grad_fn=<AddmmBackward>)
  18890. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 8.0331e-01, -1.1250e+00, -3.8637e-01,
  18891. -1.3082e+00, 1.1262e-01, 4.5430e-01],
  18892. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  18893. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  18894. [ 5.7870e-01, -4.0862e-01, 1.3535e+00, -1.2794e+00, -1.7640e-01,
  18895. -1.4891e+00, 4.6447e-01, 2.4425e-01],
  18896. [ 6.0919e-01, -4.2490e-01, 1.6402e+00, -1.0465e+00, -4.6721e-01,
  18897. -6.6928e-01, 8.8267e-01, 1.6077e-01],
  18898. [ 6.3060e-01, -4.1527e-01, 1.5141e+00, 2.2241e-01, -3.6905e-01,
  18899. 2.6220e-01, 1.0033e+00, 3.4245e-01],
  18900. [ 6.0733e-01, -4.0577e-01, 1.8885e+00, -4.9992e-01, -5.9423e-01,
  18901. -4.7683e-01, 6.4134e-01, 1.5443e-01],
  18902. [ 5.4249e-01, -4.0670e-01, 1.5543e+00, 2.4057e-02, -5.5958e-01,
  18903. -1.3811e-01, 1.0049e-01, 2.0932e-01],
  18904. [ 6.0095e-01, -4.5619e-01, 1.7198e+00, -9.0441e-03, -3.4644e-01,
  18905. 1.0758e-02, 6.2944e-01, 1.6266e-01]]], device='cuda:0')
  18906. loss_train_step before backward: tensor(0.0413, device='cuda:0', grad_fn=<MseLossBackward>)
  18907. loss_train_step after backward: tensor(0.0413, device='cuda:0', grad_fn=<MseLossBackward>)
  18908. loss_train: 2.8967771902680397
  18909. step: 82
  18910. running loss: 0.03532655110082975
  18911.  
  18912. Train Steps: 82/90 Loss: 0.0353 torch.Size([8, 600, 800])
  18913. torch.Size([8, 8])
  18914. tensor([[0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  18915. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  18916. [0.6182, 0.3998, 0.8793, 0.4191, 0.3552, 0.4285, 0.6038, 0.5312],
  18917. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  18918. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  18919. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  18920. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  18921. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533]],
  18922. device='cuda:0', dtype=torch.float64)
  18923. predictions are: tensor([[ 0.7146, -0.3538, 1.8599, 0.1712, -0.4480, 0.1083, 0.5213, 0.0950],
  18924. [ 0.6914, -0.3237, 1.8138, -0.0676, -0.1364, 0.2315, 0.5159, 0.2180],
  18925. [ 0.7692, -0.2724, 1.7680, -0.3090, -0.5663, -0.4063, 0.5210, 0.2294],
  18926. [ 0.6687, -0.3124, 1.3652, -0.8803, -0.4324, -1.0893, 0.5859, 0.3320],
  18927. [ 0.5855, -0.3619, 1.7856, -0.5942, -0.4860, -0.7473, 0.4492, 0.2532],
  18928. [ 0.6554, -0.3291, 1.1327, -1.2360, -0.4624, -1.1226, 0.3796, 0.2043],
  18929. [ 0.8600, -0.2718, 1.8370, 0.4075, -0.4948, -0.0732, 0.7471, 0.0575],
  18930. [-1.5150, -1.7410, 0.9122, -1.3620, -0.3742, -1.4723, 0.1188, 0.2358]],
  18931. device='cuda:0', grad_fn=<AddmmBackward>)
  18932. landmarks are: tensor([[[ 5.7829e-01, -4.3634e-01, 1.7724e+00, 4.3211e-02, -5.1531e-01,
  18933. 8.7136e-02, 4.8401e-01, 6.6263e-02],
  18934. [ 5.5260e-01, -4.3510e-01, 1.7672e+00, -1.9199e-01, -1.7852e-01,
  18935. 2.6990e-01, 5.2587e-01, 2.6990e-01],
  18936. [ 5.6966e-01, -4.3934e-01, 1.7754e+00, -3.5028e-01, -6.4527e-01,
  18937. -3.0670e-01, 5.0278e-01, 1.6774e-01],
  18938. [ 5.9151e-01, -3.6821e-01, 1.2187e+00, -1.2313e+00, -4.3256e-01,
  18939. -9.5412e-01, 5.7783e-01, 3.7768e-01],
  18940. [ 5.7829e-01, -3.9330e-01, 1.6748e+00, -6.1540e-01, -5.7691e-01,
  18941. -6.4619e-01, 4.7968e-01, 3.3149e-01],
  18942. [ 5.3557e-01, -4.2171e-01, 1.0339e+00, -1.4776e+00, -5.0762e-01,
  18943. -1.1081e+00, 4.2194e-01, 2.8530e-01],
  18944. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  18945. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  18946. [-2.2859e+00, -2.2859e+00, 7.0230e-01, -1.3883e+00, -4.2679e-01,
  18947. -1.3621e+00, 8.1293e-02, 2.6990e-01]]], device='cuda:0')
  18948. loss_train_step before backward: tensor(0.0244, device='cuda:0', grad_fn=<MseLossBackward>)
  18949. loss_train_step after backward: tensor(0.0244, device='cuda:0', grad_fn=<MseLossBackward>)
  18950. loss_train: 2.921171437948942
  18951. step: 83
  18952. running loss: 0.03519483660179448
  18953. Train Steps: 83/90 Loss: 0.0352 torch.Size([8, 600, 800])
  18954. torch.Size([8, 8])
  18955. tensor([[0.6260, 0.4120, 0.8013, 0.2350, 0.4888, 0.1533, 0.6281, 0.4895],
  18956. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  18957. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  18958. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  18959. [0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  18960. [0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  18961. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  18962. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483]],
  18963. device='cuda:0', dtype=torch.float64)
  18964. predictions are: tensor([[ 0.3414, -0.5336, 1.3901, -1.0815, -0.1304, -1.4158, 0.6134, 0.1596],
  18965. [ 0.5834, -0.4411, 1.6709, 0.4052, -0.5984, 0.0808, 0.5935, 0.1417],
  18966. [ 0.3512, -0.5651, 1.7264, -0.7843, -0.0953, -1.0059, 0.9068, 0.1935],
  18967. [ 0.4498, -0.4207, 1.3572, -0.9040, -0.5169, -0.8613, 0.3319, 0.2744],
  18968. [ 0.3137, -0.5197, 1.1709, -1.0104, -0.5328, -1.2113, 0.2474, 0.1146],
  18969. [ 0.5019, -0.4251, 1.6912, 0.0891, -0.2694, 0.3256, 0.5324, 0.2705],
  18970. [ 0.3252, -0.5454, 1.1839, -1.0608, -0.4705, -1.1051, 0.3983, 0.2607],
  18971. [ 0.4924, -0.4734, 1.8682, -0.0788, -0.6548, 0.1146, 0.5234, 0.1737]],
  18972. device='cuda:0', grad_fn=<AddmmBackward>)
  18973. landmarks are: tensor([[[ 0.6053, -0.3830, 1.4150, -1.2005, -0.0284, -1.5777, 0.6154,
  18974. -0.0250],
  18975. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  18976. 0.0697],
  18977. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  18978. 0.2730],
  18979. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  18980. 0.1852],
  18981. [ 0.5707, -0.4189, 1.2707, -1.2467, -0.4095, -1.3082, 0.3758,
  18982. 0.0928],
  18983. [ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  18984. 0.1236],
  18985. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  18986. 0.1698],
  18987. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  18988. 0.2468]]], device='cuda:0')
  18989. loss_train_step before backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  18990. loss_train_step after backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  18991. loss_train: 2.9391067922115326
  18992. step: 84
  18993. running loss: 0.034989366573946815
  18994. Train Steps: 84/90 Loss: 0.0350 torch.Size([8, 600, 800])
  18995. torch.Size([8, 8])
  18996. tensor([[0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  18997. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  18998. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  18999. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  19000. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  19001. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  19002. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  19003. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285]],
  19004. device='cuda:0', dtype=torch.float64)
  19005. predictions are: tensor([[ 0.3572, -0.5497, 1.8215, -0.4146, -0.5355, -0.3716, 0.3348, 0.2300],
  19006. [ 0.5134, -0.4433, 1.6347, -0.5314, -0.6411, -0.5109, 0.4675, 0.2653],
  19007. [ 0.3472, -0.5754, 1.7767, -0.6031, -0.3520, -1.0399, 0.7266, 0.1543],
  19008. [ 0.5444, -0.4306, 1.1022, -1.4533, -0.3904, -1.3121, 0.5611, 0.1790],
  19009. [ 0.3579, -0.5079, 1.5207, 0.2874, -0.3740, -0.3332, 0.2718, 0.4807],
  19010. [ 0.6658, -0.3873, 1.7824, -0.3300, -0.4989, 0.1572, 0.8910, 0.1273],
  19011. [ 0.5774, -0.4470, 1.5978, 0.1259, -0.3104, 0.0424, 0.7856, 0.1582],
  19012. [ 0.4544, -0.4687, 1.3953, -0.5208, -0.5736, -0.3778, 0.0729, 0.1174]],
  19013. device='cuda:0', grad_fn=<AddmmBackward>)
  19014. landmarks are: tensor([[[ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  19015. 0.2930],
  19016. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  19017. 0.2930],
  19018. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  19019. 0.2035],
  19020. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  19021. 0.2468],
  19022. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  19023. 0.4470],
  19024. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  19025. 0.1715],
  19026. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  19027. 0.1176],
  19028. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  19029. 0.1552]]], device='cuda:0')
  19030. loss_train_step before backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  19031. loss_train_step after backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  19032. loss_train: 2.948201633989811
  19033. step: 85
  19034. running loss: 0.03468472510576248
  19035. Train Steps: 85/90 Loss: 0.0347 torch.Size([8, 600, 800])
  19036. torch.Size([8, 8])
  19037. tensor([[0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  19038. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  19039. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  19040. [0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  19041. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  19042. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  19043. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  19044. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100]],
  19045. device='cuda:0', dtype=torch.float64)
  19046. predictions are: tensor([[ 0.4660, -0.5156, 1.7767, -0.2449, -0.3343, 0.1230, 0.6427, 0.1392],
  19047. [ 0.3637, -0.5195, 1.6345, -0.0874, -0.6553, -0.6107, 0.3418, 0.3022],
  19048. [ 0.4526, -0.5204, 1.7592, -0.2958, -0.4045, 0.2497, 0.6422, 0.1193],
  19049. [ 0.0573, -0.7052, 1.4025, -0.9575, -0.4882, -1.0913, 0.3891, 0.2999],
  19050. [ 0.4061, -0.4735, 1.1699, -0.8911, -0.0988, -1.4151, 0.2780, 0.3841],
  19051. [ 0.5552, -0.4399, 1.6502, 0.2949, -0.3972, 0.1041, 0.5352, 0.2250],
  19052. [ 0.5542, -0.4346, 1.0822, -1.1684, -0.5267, -1.0174, 0.6169, 0.2570],
  19053. [ 0.7242, -0.3797, 1.7948, -0.4427, -0.6509, -0.5013, 0.7786, 0.0073]],
  19054. device='cuda:0', grad_fn=<AddmmBackward>)
  19055. landmarks are: tensor([[[ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  19056. 0.2314],
  19057. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  19058. 0.3161],
  19059. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  19060. 0.2622],
  19061. [ 0.5935, -0.3558, 1.3284, -0.6924, -0.5249, -0.9618, 0.3353,
  19062. 0.3084],
  19063. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  19064. 0.5624],
  19065. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  19066. 0.3161],
  19067. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  19068. 0.3700],
  19069. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  19070. 0.0697]]], device='cuda:0')
  19071. loss_train_step before backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  19072. loss_train_step after backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  19073. loss_train: 2.964329108595848
  19074. step: 86
  19075. running loss: 0.034468943123207536
  19076.  
  19077. Train Steps: 86/90 Loss: 0.0345 torch.Size([8, 600, 800])
  19078. torch.Size([8, 8])
  19079. tensor([[0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  19080. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  19081. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  19082. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  19083. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  19084. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  19085. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  19086. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717]],
  19087. device='cuda:0', dtype=torch.float64)
  19088. predictions are: tensor([[ 0.5998, -0.3945, 1.2492, -1.0363, -0.3124, -1.2346, 0.6505, 0.1615],
  19089. [ 0.4399, -0.5304, 1.5987, 0.2052, -0.2732, 0.2001, 0.5628, 0.1825],
  19090. [ 0.4002, -0.4918, 1.2865, -1.0020, -0.2786, -1.2601, 0.4286, 0.2335],
  19091. [ 0.5183, -0.4353, 1.5123, -0.2794, -0.6870, -0.2431, 0.3356, 0.1993],
  19092. [ 0.1278, -0.6566, 1.4739, -1.0337, -0.1406, -1.3200, 0.6354, 0.1578],
  19093. [ 0.4852, -0.4609, 1.6576, -0.2034, -0.3438, 0.3765, 0.6157, 0.1554],
  19094. [-0.0316, -0.7990, 1.7789, -0.2751, -0.6377, -0.7240, 0.6715, 0.2198],
  19095. [ 0.5022, -0.4296, 1.0507, -1.0560, -0.6059, -0.9220, 0.4741, 0.3350]],
  19096. device='cuda:0', grad_fn=<AddmmBackward>)
  19097. landmarks are: tensor([[[ 6.1577e-01, -4.2249e-01, 1.3307e+00, -1.3253e+00, -1.9244e-01,
  19098. -1.3252e+00, 6.7213e-01, 1.7271e-01],
  19099. [ 5.5484e-01, -4.6823e-01, 1.7309e+00, 9.6578e-02, -1.3942e-01,
  19100. 1.7573e-01, 5.0451e-01, 9.4188e-02],
  19101. [ 5.7679e-01, -4.0308e-01, 1.3838e+00, -1.1527e+00, -2.1876e-01,
  19102. -1.4216e+00, 4.3790e-01, 1.8502e-01],
  19103. [ 5.3672e-01, -4.2941e-01, 1.5709e+00, -4.9992e-01, -6.6928e-01,
  19104. -3.0747e-01, 2.4546e-01, 3.5585e-01],
  19105. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  19106. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  19107. [ 5.1155e-01, -4.3318e-01, 1.7557e+00, -3.1517e-01, -2.5358e-01,
  19108. 3.9307e-01, 4.1387e-01, 2.9364e-01],
  19109. [ 6.1114e-01, -3.8276e-01, 1.8885e+00, -3.8445e-01, -5.6536e-01,
  19110. -8.0785e-01, 5.6628e-01, 1.3903e-01],
  19111. [ 5.7460e-01, -3.8822e-01, 1.1436e+00, -1.2005e+00, -4.9030e-01,
  19112. -1.0157e+00, 4.3926e-01, 3.5458e-01]]], device='cuda:0')
  19113. loss_train_step before backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  19114. loss_train_step after backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  19115. loss_train: 2.9893352556973696
  19116. step: 87
  19117. running loss: 0.03436017535284333
  19118. Train Steps: 87/90 Loss: 0.0344 torch.Size([8, 600, 800])
  19119. torch.Size([8, 8])
  19120. tensor([[0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  19121. [0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  19122. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  19123. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  19124. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  19125. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  19126. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  19127. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960]],
  19128. device='cuda:0', dtype=torch.float64)
  19129. predictions are: tensor([[ 0.6628, -0.3783, 1.3547, 0.0378, -0.5396, -0.2219, 0.7363, 0.3387],
  19130. [ 0.9989, -0.0989, 1.0561, -1.0009, -0.3688, -1.1186, 0.2621, 0.3592],
  19131. [ 0.8307, -0.2395, 1.6155, -0.5370, -0.7173, -0.2707, 0.4068, 0.0687],
  19132. [-2.1859, -2.2229, 1.5529, -1.2666, 0.0458, -1.3234, 0.9324, 0.2525],
  19133. [ 0.4735, -0.4862, 1.6272, -0.1025, -0.5379, -0.1717, 0.3618, 0.0620],
  19134. [ 0.6799, -0.3520, 1.6324, -0.1560, -0.4966, 0.0338, 0.2962, 0.1715],
  19135. [ 0.6859, -0.3553, 1.3792, 0.0354, -0.5202, -0.0513, 0.8590, 0.3345],
  19136. [ 0.6793, -0.2859, 1.6432, -0.9845, -0.1492, -1.2886, 0.5025, 0.1337]],
  19137. device='cuda:0', grad_fn=<AddmmBackward>)
  19138. landmarks are: tensor([[[ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  19139. 0.3745],
  19140. [ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  19141. 0.3808],
  19142. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  19143. 0.0236],
  19144. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  19145. 0.2783],
  19146. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  19147. 0.0313],
  19148. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  19149. 0.2035],
  19150. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  19151. 0.3478],
  19152. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  19153. 0.0051]]], device='cuda:0')
  19154. loss_train_step before backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  19155. loss_train_step after backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  19156. loss_train: 3.0085563641041517
  19157. step: 88
  19158. running loss: 0.034188140501183545
  19159. Train Steps: 88/90 Loss: 0.0342 torch.Size([8, 600, 800])
  19160. torch.Size([8, 8])
  19161. tensor([[ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  19162. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  19163. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  19164. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  19165. [0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  19166. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  19167. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  19168. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309]],
  19169. device='cuda:0', dtype=torch.float64)
  19170. predictions are: tensor([[-1.8385, -1.9641, 0.9082, -1.2111, -0.4355, -1.1670, 0.1173, 0.2900],
  19171. [ 0.6356, -0.3790, 1.6797, -0.1061, -0.5099, -0.3461, 0.6313, 0.1793],
  19172. [ 0.5199, -0.3973, 1.6923, -0.4086, -0.3310, -0.9304, 0.6163, 0.2632],
  19173. [ 0.7638, -0.3175, 1.7645, -0.4099, -0.4495, -0.4600, 0.9688, 0.2919],
  19174. [ 0.7587, -0.2697, 1.4616, -0.1549, -0.3250, 0.0384, 0.2837, 0.1989],
  19175. [ 0.7750, -0.2476, 1.4770, -0.9351, -0.5789, -0.6013, 0.5758, 0.2528],
  19176. [ 0.6622, -0.3352, 1.5473, -0.1471, -0.1829, -0.0524, 0.2201, 0.1321],
  19177. [ 0.6658, -0.3254, 1.6760, -0.0658, -0.3696, -0.5965, 0.7424, 0.2032]],
  19178. device='cuda:0', grad_fn=<AddmmBackward>)
  19179. landmarks are: tensor([[[-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  19180. 0.4543],
  19181. [ 0.6096, -0.4046, 1.8249, -0.0072, -0.6115, -0.3537, 0.6182,
  19182. 0.0928],
  19183. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  19184. 0.1608],
  19185. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  19186. 0.2676],
  19187. [ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  19188. 0.1530],
  19189. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  19190. 0.2622],
  19191. [ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  19192. 0.2228],
  19193. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  19194. 0.1661]]], device='cuda:0')
  19195. loss_train_step before backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  19196. loss_train_step after backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  19197. loss_train: 3.0263278856873512
  19198. step: 89
  19199. running loss: 0.034003684108846646
  19200. Train Steps: 89/90 Loss: 0.0340 torch.Size([8, 600, 800])
  19201. torch.Size([8, 8])
  19202. tensor([[0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  19203. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  19204. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  19205. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  19206. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  19207. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  19208. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  19209. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297]],
  19210. device='cuda:0', dtype=torch.float64)
  19211. predictions are: tensor([[ 0.2155, -0.6617, 1.7206, -0.2581, -0.0849, -0.0335, 0.5475, 0.2886],
  19212. [ 0.3063, -0.6256, 1.7132, -0.2126, -0.6088, -0.1912, 0.7480, 0.2040],
  19213. [ 0.4653, -0.5070, 1.7394, 0.1501, -0.6849, -0.4636, 0.5853, 0.0483],
  19214. [ 0.5087, -0.4337, 1.2280, -1.1637, -0.1142, -1.4992, 0.4559, 0.2600],
  19215. [ 0.6276, -0.3673, 1.3516, -1.2932, -0.1980, -1.4377, 0.6106, 0.2283],
  19216. [ 0.3026, -0.6008, 1.6122, -0.0452, -0.0811, -0.0767, 0.2343, 0.2728],
  19217. [ 0.5610, -0.3835, 1.2338, -0.8067, -0.7232, -0.4564, 0.3050, 0.3639],
  19218. [ 0.5379, -0.4936, 1.6835, 0.0435, -0.6293, -0.0777, 0.8585, 0.2135]],
  19219. device='cuda:0', grad_fn=<AddmmBackward>)
  19220. landmarks are: tensor([[[ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  19221. 0.2853],
  19222. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  19223. 0.1779],
  19224. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  19225. -0.0957],
  19226. [ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  19227. 0.2160],
  19228. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  19229. 0.2237],
  19230. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  19231. 0.2237],
  19232. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  19233. 0.4036],
  19234. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  19235. 0.1608]]], device='cuda:0')
  19236. loss_train_step before backward: tensor(0.0141, device='cuda:0', grad_fn=<MseLossBackward>)
  19237. loss_train_step after backward: tensor(0.0141, device='cuda:0', grad_fn=<MseLossBackward>)
  19238. loss_train: 3.0404702592641115
  19239. step: 90
  19240. running loss: 0.03378300288071235
  19241.  
  19242. Valid Steps: 10/10 Loss: nan 7.2476
  19243. --------------------------------------------------
  19244. Epoch: 5 Train Loss: 0.0338 Valid Loss: nan
  19245. --------------------------------------------------
  19246. size of train loader is: 90
  19247. torch.Size([8, 600, 800])
  19248. torch.Size([8, 8])
  19249. tensor([[0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  19250. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  19251. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  19252. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  19253. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  19254. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  19255. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  19256. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450]],
  19257. device='cuda:0', dtype=torch.float64)
  19258. predictions are: tensor([[ 0.7542, -0.2940, 1.0693, -1.0823, -0.2846, -1.4095, 0.2587, 0.1636],
  19259. [ 0.4289, -0.4749, 1.8449, -0.2291, -0.3635, -0.8582, 0.6296, 0.2635],
  19260. [ 0.7719, -0.2729, 1.6264, -0.6635, -0.6348, -0.6002, 0.4818, 0.1923],
  19261. [-2.1929, -2.2416, 1.0535, -1.1674, -0.3955, -1.2469, 0.2622, 0.2562],
  19262. [ 0.8213, -0.2376, 0.9933, -1.0158, -0.3735, -1.2595, 0.0756, 0.2700],
  19263. [ 0.7109, -0.3502, 1.7879, 0.0807, -0.3919, 0.4202, 0.9466, 0.2984],
  19264. [ 0.7260, -0.3469, 1.6753, 0.1680, -0.3162, 0.1486, 0.9122, 0.1825],
  19265. [ 0.6985, -0.3393, 1.7840, -0.1376, -0.3363, 0.1751, 0.5855, 0.2307]],
  19266. device='cuda:0', grad_fn=<AddmmBackward>)
  19267. landmarks are: tensor([[[ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  19268. 0.1253],
  19269. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  19270. 0.1608],
  19271. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  19272. 0.1753],
  19273. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  19274. 0.3238],
  19275. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  19276. 0.2747],
  19277. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  19278. 0.3157],
  19279. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  19280. 0.1004],
  19281. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  19282. 0.2314]]], device='cuda:0')
  19283. loss_train_step before backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  19284. loss_train_step after backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  19285. loss_train: 0.009727518074214458
  19286. step: 1
  19287. running loss: 0.009727518074214458
  19288. Train Steps: 1/90 Loss: 0.0097 torch.Size([8, 600, 800])
  19289. torch.Size([8, 8])
  19290. tensor([[0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  19291. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  19292. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  19293. [0.6199, 0.4093, 0.7913, 0.2533, 0.4288, 0.2467, 0.5975, 0.5700],
  19294. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  19295. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  19296. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  19297. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117]],
  19298. device='cuda:0', dtype=torch.float64)
  19299. predictions are: tensor([[ 0.6004, -0.3672, 1.2156, -0.6897, -0.3006, -1.1231, 0.3223, 0.4997],
  19300. [ 0.3149, -0.5709, 1.8053, -0.1810, -0.4348, -0.0823, 0.1140, 0.1113],
  19301. [ 0.3440, -0.6193, 1.6411, 0.4132, -0.2512, 0.0696, 0.2662, 0.1777],
  19302. [ 0.6088, -0.4192, 1.4295, -1.1601, -0.3286, -1.0138, 0.7049, 0.2644],
  19303. [ 0.5523, -0.4556, 1.0715, -1.3078, -0.4542, -1.0982, 0.6409, 0.2777],
  19304. [ 0.4007, -0.5953, 1.8373, -0.6258, -0.2968, -0.8168, 1.0265, 0.0947],
  19305. [ 0.1804, -0.6489, 1.6171, -0.5607, -0.6342, -0.7571, 0.2685, 0.2146],
  19306. [ 0.4799, -0.5429, 1.6780, 0.1912, -0.4269, 0.0378, 0.8408, 0.1385]],
  19307. device='cuda:0', grad_fn=<AddmmBackward>)
  19308. landmarks are: tensor([[[ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  19309. 0.5401],
  19310. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  19311. 0.0893],
  19312. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  19313. -0.0610],
  19314. [ 0.5771, -0.3955, 1.3688, -1.1158, -0.3055, -1.1466, 0.4739,
  19315. 0.3469],
  19316. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  19317. 0.2930],
  19318. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  19319. 0.1821],
  19320. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  19321. 0.2237],
  19322. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  19323. 0.0774]]], device='cuda:0')
  19324. loss_train_step before backward: tensor(0.0148, device='cuda:0', grad_fn=<MseLossBackward>)
  19325. loss_train_step after backward: tensor(0.0148, device='cuda:0', grad_fn=<MseLossBackward>)
  19326. loss_train: 0.024488049559295177
  19327. step: 2
  19328. running loss: 0.012244024779647589
  19329. Train Steps: 2/90 Loss: 0.0122 torch.Size([8, 600, 800])
  19330. torch.Size([8, 8])
  19331. tensor([[0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  19332. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  19333. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  19334. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  19335. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  19336. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  19337. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  19338. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967]],
  19339. device='cuda:0', dtype=torch.float64)
  19340. predictions are: tensor([[ 0.7454, -0.3024, 1.7860, -0.3361, -0.0949, 0.0958, 0.5557, 0.2262],
  19341. [ 0.5253, -0.4278, 1.4045, -0.8717, -0.5915, -0.6161, 0.2637, 0.3010],
  19342. [ 0.6854, -0.3350, 1.7206, -0.0855, -0.2740, -0.0146, 0.3494, 0.2215],
  19343. [ 0.7256, -0.3493, 1.4856, 0.0067, -0.3950, -0.1420, 0.8548, 0.2708],
  19344. [ 0.8537, -0.2916, 1.6853, 0.2443, -0.5348, -0.2137, 0.6321, 0.1528],
  19345. [-1.9638, -2.1107, 1.0300, -1.3369, -0.1977, -1.5700, 0.3303, 0.3528],
  19346. [ 0.7093, -0.3309, 1.8327, -0.2651, -0.5227, -0.4226, 0.3786, 0.1303],
  19347. [ 0.8808, -0.2086, 1.8253, -0.0877, -0.4148, -0.8260, 0.6492, 0.1294]],
  19348. device='cuda:0', grad_fn=<AddmmBackward>)
  19349. landmarks are: tensor([[[ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  19350. 0.2237],
  19351. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  19352. 0.3417],
  19353. [ 0.5784, -0.4088, 1.7268, 0.0467, -0.3344, 0.0697, 0.5490,
  19354. 0.2545],
  19355. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  19356. 0.1928],
  19357. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  19358. 0.0261],
  19359. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  19360. 0.3469],
  19361. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  19362. 0.0919],
  19363. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  19364. 0.0081]]], device='cuda:0')
  19365. loss_train_step before backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  19366. loss_train_step after backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  19367. loss_train: 0.043093412183225155
  19368. step: 3
  19369. running loss: 0.014364470727741718
  19370. Train Steps: 3/90 Loss: 0.0144 torch.Size([8, 600, 800])
  19371. torch.Size([8, 8])
  19372. tensor([[0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  19373. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  19374. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  19375. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  19376. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  19377. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  19378. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  19379. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297]],
  19380. device='cuda:0', dtype=torch.float64)
  19381. predictions are: tensor([[ 0.0854, -0.7300, 1.3343, -1.0758, -0.0698, -1.3501, 0.5538, 0.1221],
  19382. [ 0.4797, -0.4857, 1.3555, -1.0026, -0.2330, -1.1817, 0.5848, 0.1294],
  19383. [ 0.4533, -0.4955, 1.4321, -0.8290, -0.3719, -0.8532, 0.5331, 0.2373],
  19384. [ 0.3314, -0.5476, 1.5791, -0.4780, -0.6127, -0.5765, 0.2331, 0.1541],
  19385. [ 0.3811, -0.5397, 1.6226, 0.3160, -0.5185, -0.2334, 0.2644, 0.2589],
  19386. [ 0.2556, -0.6680, 1.6682, 0.1286, -0.5395, 0.0395, 0.4531, 0.3512],
  19387. [ 0.4959, -0.4210, 1.4818, -0.3671, -0.0721, -0.9667, 0.3686, 0.3975],
  19388. [ 0.6450, -0.4446, 1.6500, -0.9368, -0.5058, -0.4594, 1.1056, 0.0772]],
  19389. device='cuda:0', grad_fn=<AddmmBackward>)
  19390. landmarks are: tensor([[[ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  19391. -0.0168],
  19392. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  19393. 0.0928],
  19394. [ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  19395. 0.2622],
  19396. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  19397. 0.2237],
  19398. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  19399. 0.3392],
  19400. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  19401. 0.5239],
  19402. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  19403. 0.5882],
  19404. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  19405. 0.1608]]], device='cuda:0')
  19406. loss_train_step before backward: tensor(0.0271, device='cuda:0', grad_fn=<MseLossBackward>)
  19407. loss_train_step after backward: tensor(0.0271, device='cuda:0', grad_fn=<MseLossBackward>)
  19408. loss_train: 0.07015109900385141
  19409. step: 4
  19410. running loss: 0.017537774750962853
  19411.  
  19412. Train Steps: 4/90 Loss: 0.0175 torch.Size([8, 600, 800])
  19413. torch.Size([8, 8])
  19414. tensor([[0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  19415. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  19416. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  19417. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  19418. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  19419. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  19420. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  19421. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683]],
  19422. device='cuda:0', dtype=torch.float64)
  19423. predictions are: tensor([[ 0.6732, -0.3474, 1.6743, -0.0082, -0.4961, 0.0134, 0.2572, -0.0216],
  19424. [ 0.8126, -0.2493, 1.6378, 0.0115, -0.5362, 0.0172, 0.2641, 0.2438],
  19425. [ 0.7811, -0.2574, 1.5581, 0.0977, -0.4353, 0.0952, 0.1921, 0.1597],
  19426. [ 0.7708, -0.2707, 1.4945, 0.3949, -0.2718, -0.1890, 0.3506, 0.2391],
  19427. [-2.1231, -2.2121, 1.5529, -1.2340, 0.0463, -1.3679, 1.1119, 0.3009],
  19428. [ 0.6323, -0.3641, 1.6140, 0.1118, -0.1846, -0.1604, 0.1566, 0.1369],
  19429. [ 0.3799, -0.5494, 1.6646, -1.1212, 0.0340, -1.5158, 1.2984, 0.2480],
  19430. [ 0.9152, -0.1758, 1.4520, -1.0302, -0.5784, -0.9599, 0.4555, 0.2445]],
  19431. device='cuda:0', grad_fn=<AddmmBackward>)
  19432. landmarks are: tensor([[[ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  19433. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  19434. [ 5.5393e-01, -4.0308e-01, 1.7168e+00, -5.9398e-02, -3.7483e-01,
  19435. 5.4350e-02, 1.3903e-01, 3.7768e-01],
  19436. [ 5.1784e-01, -4.4796e-01, 1.6748e+00, 6.2048e-02, -2.7667e-01,
  19437. 2.0831e-01, 1.0666e-01, 2.3862e-01],
  19438. [ 5.7258e-01, -4.2487e-01, 1.5824e+00, 3.7768e-01, -9.4206e-02,
  19439. -5.5582e-02, 2.7815e-01, 2.9966e-01],
  19440. [-2.2859e+00, -2.2859e+00, 1.6517e+00, -1.2620e+00, 2.1409e-01,
  19441. -1.1928e+00, 1.1166e+00, 2.4627e-01],
  19442. [ 5.2448e-01, -4.3472e-01, 1.6806e+00, 1.1594e-01, 4.6468e-03,
  19443. 1.2940e-02, 1.0439e-01, 1.5443e-01],
  19444. [ 6.3718e-01, -3.5749e-01, 1.6633e+00, -1.2082e+00, 2.1986e-01,
  19445. -1.2467e+00, 1.1313e+00, 3.0505e-01],
  19446. [ 5.7783e-01, -3.9299e-01, 1.5189e+00, -9.3872e-01, -4.3256e-01,
  19447. -9.1563e-01, 4.8545e-01, 3.3918e-01]]], device='cuda:0')
  19448. loss_train_step before backward: tensor(0.0189, device='cuda:0', grad_fn=<MseLossBackward>)
  19449. loss_train_step after backward: tensor(0.0189, device='cuda:0', grad_fn=<MseLossBackward>)
  19450. loss_train: 0.08904801961034536
  19451. step: 5
  19452. running loss: 0.017809603922069074
  19453. Train Steps: 5/90 Loss: 0.0178 torch.Size([8, 600, 800])
  19454. torch.Size([8, 8])
  19455. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  19456. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  19457. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  19458. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991],
  19459. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  19460. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  19461. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  19462. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131]],
  19463. device='cuda:0', dtype=torch.float64)
  19464. predictions are: tensor([[ 0.4679, -0.5249, 1.1432, -1.3886, -0.4626, -1.0470, 0.5615, 0.1004],
  19465. [ 0.6455, -0.3653, 1.5256, -0.2370, -0.4582, -0.1594, 0.2167, 0.2687],
  19466. [ 0.3983, -0.5051, 1.6557, 0.0228, -0.5898, -0.5597, 0.1420, 0.1631],
  19467. [-0.1206, -0.9222, 1.9298, -0.4981, 0.0381, -0.9257, 1.4428, 0.4271],
  19468. [ 0.5584, -0.3998, 1.7356, -0.2781, -0.2670, -1.1656, 0.4453, 0.2577],
  19469. [ 0.4390, -0.5099, 1.8071, -0.1181, -0.3375, -0.1904, 0.1749, 0.0565],
  19470. [ 0.6322, -0.3949, 1.6822, 0.0830, -0.2574, 0.1128, 0.3545, 0.3131],
  19471. [ 0.5678, -0.4407, 1.5844, -0.4062, -0.5713, -0.2275, 0.3795, 0.1258]],
  19472. device='cuda:0', grad_fn=<AddmmBackward>)
  19473. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  19474. 0.0562],
  19475. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  19476. 0.3265],
  19477. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  19478. 0.2071],
  19479. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  19480. 0.4814],
  19481. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  19482. 0.1929],
  19483. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  19484. -0.0220],
  19485. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  19486. 0.3777],
  19487. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  19488. 0.0840]]], device='cuda:0')
  19489. loss_train_step before backward: tensor(0.0255, device='cuda:0', grad_fn=<MseLossBackward>)
  19490. loss_train_step after backward: tensor(0.0255, device='cuda:0', grad_fn=<MseLossBackward>)
  19491. loss_train: 0.11450012680143118
  19492. step: 6
  19493. running loss: 0.019083354466905195
  19494. Train Steps: 6/90 Loss: 0.0191 torch.Size([8, 600, 800])
  19495. torch.Size([8, 8])
  19496. tensor([[0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  19497. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  19498. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  19499. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  19500. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  19501. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  19502. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  19503. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103]],
  19504. device='cuda:0', dtype=torch.float64)
  19505. predictions are: tensor([[ 0.7570, -0.3084, 1.7813, 0.1175, -0.2729, 0.0054, 0.5814, 0.2380],
  19506. [ 0.6667, -0.3722, 1.4920, -1.2591, -0.1936, -1.2800, 0.9240, 0.1477],
  19507. [ 0.4875, -0.4911, 1.6052, -0.7537, -0.5829, -0.5058, 0.7371, 0.1907],
  19508. [ 0.8956, -0.2000, 1.7388, 0.0653, -0.1816, -0.1037, 0.2166, 0.2962],
  19509. [ 0.8230, -0.2782, 1.6046, 0.5730, -0.1689, -0.0237, 0.2071, 0.1582],
  19510. [-2.3906, -2.3562, 1.1195, -0.9826, -0.3667, -1.1408, 0.1601, 0.2370],
  19511. [ 0.6998, -0.2829, 1.6248, -0.1946, -0.5209, -0.8853, 0.0696, 0.2143],
  19512. [ 0.8486, -0.2305, 1.5716, -0.7333, -0.5215, -0.5948, 0.5211, 0.1786]],
  19513. device='cuda:0', grad_fn=<AddmmBackward>)
  19514. landmarks are: tensor([[[ 5.7760e-01, -4.1093e-01, 1.7326e+00, -2.2633e-02, -3.6328e-01,
  19515. 2.3557e-02, 5.6051e-01, 2.3911e-01],
  19516. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  19517. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  19518. [ 5.6966e-01, -4.5379e-01, 1.5308e+00, -8.7027e-01, -6.5720e-01,
  19519. -3.6388e-01, 5.7392e-01, 1.5759e-01],
  19520. [ 5.4908e-01, -4.2902e-01, 1.7788e+00, -1.0731e-01, -2.6513e-01,
  19521. -1.0731e-01, 2.5553e-01, 3.0567e-01],
  19522. [ 5.1928e-01, -4.6990e-01, 1.5767e+00, 4.0077e-01, -2.4203e-01,
  19523. 7.7444e-02, 1.1776e-01, -6.1038e-02],
  19524. [-2.2859e+00, -2.2859e+00, 1.2469e+00, -1.0288e+00, -4.5566e-01,
  19525. -1.2774e+00, 5.1142e-02, 2.1834e-01],
  19526. [ 5.4700e-01, -3.9515e-01, 1.6377e+00, -4.2531e-01, -6.2887e-01,
  19527. -8.0785e-01, 2.4925e-02, 2.1157e-01],
  19528. [ 5.8863e-01, -3.7837e-01, 1.4554e+00, -9.0793e-01, -6.5774e-01,
  19529. -4.8453e-01, 3.4395e-01, 7.1216e-02]]], device='cuda:0')
  19530. loss_train_step before backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  19531. loss_train_step after backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  19532. loss_train: 0.1331191835924983
  19533. step: 7
  19534. running loss: 0.019017026227499758
  19535. Train Steps: 7/90 Loss: 0.0190 torch.Size([8, 600, 800])
  19536. torch.Size([8, 8])
  19537. tensor([[0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  19538. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  19539. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  19540. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  19541. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  19542. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  19543. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  19544. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550]],
  19545. device='cuda:0', dtype=torch.float64)
  19546. predictions are: tensor([[ 0.7288, -0.3058, 1.7726, -0.3509, -0.5335, -0.3225, 0.3383, 0.4083],
  19547. [ 0.2176, -0.6818, 1.7063, -0.6477, -0.6027, -0.5390, 0.5127, 0.2334],
  19548. [ 0.6948, -0.3953, 1.9897, 0.2174, -0.3004, 0.3106, 0.7040, 0.1262],
  19549. [ 0.3446, -0.6356, 1.5774, -1.2607, 0.0750, -1.6404, 0.7996, 0.0959],
  19550. [ 0.3937, -0.5598, 0.9217, -0.9847, -0.4205, -1.2133, 0.1011, 0.2899],
  19551. [ 0.3524, -0.5586, 1.6655, -0.3946, -0.6244, -0.4767, 0.1380, 0.1607],
  19552. [ 0.5475, -0.4451, 1.7190, 0.6524, -0.0622, -0.1217, 0.2448, 0.2306],
  19553. [ 0.3456, -0.5822, 1.4855, -0.7606, -0.6151, -0.3893, 0.4202, 0.2709]],
  19554. device='cuda:0', grad_fn=<AddmmBackward>)
  19555. landmarks are: tensor([[[ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  19556. 0.5239],
  19557. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  19558. 0.2006],
  19559. [ 0.5990, -0.4256, 1.7499, -0.0380, -0.3979, 0.3315, 0.6529,
  19560. 0.1159],
  19561. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  19562. -0.0530],
  19563. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  19564. 0.3546],
  19565. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  19566. 0.2365],
  19567. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  19568. 0.3084],
  19569. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  19570. 0.2776]]], device='cuda:0')
  19571. loss_train_step before backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  19572. loss_train_step after backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  19573. loss_train: 0.1532347435131669
  19574. step: 8
  19575. running loss: 0.019154342939145863
  19576.  
  19577. Train Steps: 8/90 Loss: 0.0192 torch.Size([8, 600, 800])
  19578. torch.Size([8, 8])
  19579. tensor([[0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  19580. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  19581. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  19582. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  19583. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  19584. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  19585. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517],
  19586. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168]],
  19587. device='cuda:0', dtype=torch.float64)
  19588. predictions are: tensor([[ 0.2550, -0.6382, 1.3415, -1.3801, -0.2225, -1.3262, 0.6423, 0.1599],
  19589. [ 0.5471, -0.4761, 1.7444, 0.2648, -0.4119, -0.1947, 0.4265, 0.1811],
  19590. [ 0.6230, -0.3890, 1.8253, 0.3196, -0.4646, -0.2568, 0.0844, 0.0392],
  19591. [ 0.8241, -0.2153, 1.8669, -0.0251, -0.5363, -0.3031, 0.3125, 0.3552],
  19592. [ 0.9951, -0.1611, 1.9537, -0.3856, -0.5628, -0.2982, 0.3243, 0.1922],
  19593. [ 0.4725, -0.4909, 1.6059, 0.3220, -0.4420, -0.0804, 0.3932, 0.4512],
  19594. [ 0.4065, -0.5371, 1.8867, -0.1379, -0.1220, 0.2303, 0.4275, 0.2397],
  19595. [-0.3573, -1.0397, 0.9568, -1.4847, -0.3793, -1.4299, 0.2651, 0.1650]],
  19596. device='cuda:0', grad_fn=<AddmmBackward>)
  19597. landmarks are: tensor([[[ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  19598. 0.1575],
  19599. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  19600. 0.1313],
  19601. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  19602. -0.0370],
  19603. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  19604. 0.3623],
  19605. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  19606. 0.2930],
  19607. [ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  19608. 0.5393],
  19609. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  19610. 0.2622],
  19611. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  19612. 0.1013]]], device='cuda:0')
  19613. loss_train_step before backward: tensor(0.0303, device='cuda:0', grad_fn=<MseLossBackward>)
  19614. loss_train_step after backward: tensor(0.0303, device='cuda:0', grad_fn=<MseLossBackward>)
  19615. loss_train: 0.18358023930341005
  19616. step: 9
  19617. running loss: 0.020397804367045563
  19618. Train Steps: 9/90 Loss: 0.0204 torch.Size([8, 600, 800])
  19619. torch.Size([8, 8])
  19620. tensor([[0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  19621. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  19622. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  19623. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  19624. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  19625. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  19626. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  19627. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167]],
  19628. device='cuda:0', dtype=torch.float64)
  19629. predictions are: tensor([[ 4.3023e-01, -5.1482e-01, 1.7756e+00, 1.1360e-03, -3.6645e-01,
  19630. -2.6895e-01, 8.9147e-02, 2.8362e-01],
  19631. [ 2.5134e-01, -6.3133e-01, 1.8180e+00, -1.0324e-01, -3.5429e-01,
  19632. 4.1739e-01, 4.8015e-01, 1.5867e-01],
  19633. [ 3.5384e-01, -5.8044e-01, 1.1428e+00, -1.0631e+00, -3.7179e-01,
  19634. -9.1526e-01, 4.6287e-01, 2.6820e-01],
  19635. [ 4.9021e-01, -4.6988e-01, 1.6632e+00, -4.7789e-01, -3.7840e-01,
  19636. -1.0013e+00, 1.3930e-01, 1.6179e-01],
  19637. [ 7.3768e-01, -3.5570e-01, 1.7729e+00, -6.4928e-01, -2.7519e-01,
  19638. -8.5562e-01, 8.7062e-01, 2.3698e-01],
  19639. [ 6.4180e-01, -3.7256e-01, 1.3457e+00, -3.2032e-01, -4.9100e-01,
  19640. -7.8489e-01, 2.0598e-01, 4.0648e-01],
  19641. [ 4.5137e-02, -7.7108e-01, 1.3785e+00, -9.7295e-01, -5.5496e-01,
  19642. -6.3843e-01, 3.7514e-01, 1.5874e-01],
  19643. [ 5.1822e-01, -4.5746e-01, 1.6131e+00, -6.3268e-01, -4.9638e-01,
  19644. -8.6872e-01, 2.3403e-01, 9.5013e-02]], device='cuda:0',
  19645. grad_fn=<AddmmBackward>)
  19646. landmarks are: tensor([[[ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  19647. 0.3087],
  19648. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  19649. 0.0772],
  19650. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  19651. 0.1390],
  19652. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  19653. 0.1494],
  19654. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  19655. 0.3050],
  19656. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  19657. 0.4470],
  19658. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  19659. 0.0412],
  19660. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  19661. 0.1005]]], device='cuda:0')
  19662. loss_train_step before backward: tensor(0.0199, device='cuda:0', grad_fn=<MseLossBackward>)
  19663. loss_train_step after backward: tensor(0.0199, device='cuda:0', grad_fn=<MseLossBackward>)
  19664. loss_train: 0.20348771009594202
  19665. step: 10
  19666. running loss: 0.020348771009594202
  19667. Train Steps: 10/90 Loss: 0.0203 torch.Size([8, 600, 800])
  19668. torch.Size([8, 8])
  19669. tensor([[0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  19670. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  19671. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  19672. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  19673. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  19674. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  19675. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  19676. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835]],
  19677. device='cuda:0', dtype=torch.float64)
  19678. predictions are: tensor([[ 0.3729, -0.5449, 1.6055, -0.3498, -0.5716, -0.1778, 0.1901, 0.2834],
  19679. [ 0.4369, -0.5189, 1.7649, -0.1136, -0.0909, -0.0224, 0.1736, 0.2540],
  19680. [ 0.2000, -0.6297, 1.3461, -1.0150, -0.4848, -1.0933, 0.1059, 0.2289],
  19681. [ 0.4935, -0.4793, 1.7645, -0.2782, -0.5397, -0.1706, 0.3770, 0.3191],
  19682. [ 0.6598, -0.3805, 0.9234, -1.1801, -0.5330, -1.1614, 0.4945, 0.2989],
  19683. [ 0.4239, -0.5186, 1.6509, 0.3934, -0.2377, -0.0880, 0.3082, 0.2429],
  19684. [ 0.3168, -0.5442, 1.8375, -0.1244, -0.4559, -0.0795, 0.3196, 0.0846],
  19685. [ 0.8351, -0.2616, 1.8822, -0.5596, -0.4198, -1.2483, 0.5455, 0.0289]],
  19686. device='cuda:0', grad_fn=<AddmmBackward>)
  19687. landmarks are: tensor([[[ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  19688. 0.3265],
  19689. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  19690. 0.3806],
  19691. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  19692. 0.3700],
  19693. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  19694. 0.3161],
  19695. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  19696. 0.2391],
  19697. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  19698. 0.3084],
  19699. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  19700. 0.1439],
  19701. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  19702. -0.0529]]], device='cuda:0')
  19703. loss_train_step before backward: tensor(0.0111, device='cuda:0', grad_fn=<MseLossBackward>)
  19704. loss_train_step after backward: tensor(0.0111, device='cuda:0', grad_fn=<MseLossBackward>)
  19705. loss_train: 0.2146181659772992
  19706. step: 11
  19707. running loss: 0.019510742361572655
  19708. Train Steps: 11/90 Loss: 0.0195 torch.Size([8, 600, 800])
  19709. torch.Size([8, 8])
  19710. tensor([[0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  19711. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  19712. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  19713. [0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  19714. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  19715. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  19716. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  19717. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517]],
  19718. device='cuda:0', dtype=torch.float64)
  19719. predictions are: tensor([[ 0.4516, -0.5583, 1.8792, 0.0522, -0.5844, -0.0748, 0.2217, 0.0709],
  19720. [ 0.4405, -0.5722, 1.8521, -0.5826, -0.3625, -0.8696, 0.6606, 0.0918],
  19721. [ 0.5997, -0.4428, 1.7636, -0.7638, -0.4621, -0.3558, 0.7902, 0.2362],
  19722. [ 0.2645, -0.6072, 1.2612, -0.9835, -0.6613, -0.3469, 0.1612, 0.2814],
  19723. [ 0.4704, -0.4822, 1.2027, -1.1104, -0.6415, -0.7891, 0.2351, 0.2756],
  19724. [ 0.5423, -0.4085, 1.7679, 0.4169, -0.5631, -0.7001, 0.2094, 0.4311],
  19725. [ 0.4537, -0.5225, 1.8894, 0.1367, -0.0578, 0.1081, 0.0480, 0.0833],
  19726. [ 0.7690, -0.3127, 1.0238, -1.1468, -0.4148, -1.2598, 0.2532, 0.3526]],
  19727. device='cuda:0', grad_fn=<AddmmBackward>)
  19728. landmarks are: tensor([[[ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  19729. -0.0534],
  19730. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  19731. 0.1821],
  19732. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  19733. 0.2890],
  19734. [ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  19735. 0.1193],
  19736. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  19737. 0.3007],
  19738. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  19739. 0.5612],
  19740. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  19741. 0.0532],
  19742. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  19743. 0.2622]]], device='cuda:0')
  19744. loss_train_step before backward: tensor(0.0157, device='cuda:0', grad_fn=<MseLossBackward>)
  19745. loss_train_step after backward: tensor(0.0157, device='cuda:0', grad_fn=<MseLossBackward>)
  19746. loss_train: 0.23029645066708326
  19747. step: 12
  19748. running loss: 0.019191370888923604
  19749.  
  19750. Train Steps: 12/90 Loss: 0.0192 torch.Size([8, 600, 800])
  19751. torch.Size([8, 8])
  19752. tensor([[0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  19753. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  19754. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  19755. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  19756. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  19757. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  19758. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  19759. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461]],
  19760. device='cuda:0', dtype=torch.float64)
  19761. predictions are: tensor([[ 0.4027, -0.4660, 1.7366, -0.1386, -0.4564, -0.1423, 0.1591, 0.1444],
  19762. [ 0.6957, -0.3605, 1.5943, 0.3531, -0.5002, -0.2424, 0.2633, 0.1841],
  19763. [ 0.5300, -0.4568, 1.6870, -0.1113, -0.3307, -0.0143, 0.4898, 0.2449],
  19764. [ 0.6326, -0.3350, 1.5015, -0.6746, -0.6986, -0.8277, 0.0879, 0.2304],
  19765. [ 0.4498, -0.4974, 1.7203, -0.1162, -0.3503, -0.0235, 0.2616, 0.2893],
  19766. [ 0.7554, -0.3196, 1.3230, -1.4331, -0.1000, -1.5792, 0.5366, 0.1289],
  19767. [ 0.3027, -0.6293, 1.6558, -0.7107, -0.6150, -0.2197, 0.6912, 0.2634],
  19768. [ 0.4142, -0.4875, 1.4956, -0.6237, -0.7294, -0.4820, 0.0756, 0.2566]],
  19769. device='cuda:0', grad_fn=<AddmmBackward>)
  19770. landmarks are: tensor([[[ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  19771. 0.1439],
  19772. [ 0.5891, -0.4550, 1.5132, 0.3546, -0.3691, -0.1535, 0.3815,
  19773. 0.1467],
  19774. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  19775. 0.1474],
  19776. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  19777. 0.2237],
  19778. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  19779. 0.3084],
  19780. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  19781. -0.0369],
  19782. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  19783. 0.1554],
  19784. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  19785. 0.2365]]], device='cuda:0')
  19786. loss_train_step before backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  19787. loss_train_step after backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  19788. loss_train: 0.24174558836966753
  19789. step: 13
  19790. running loss: 0.018595814489974424
  19791. Train Steps: 13/90 Loss: 0.0186 torch.Size([8, 600, 800])
  19792. torch.Size([8, 8])
  19793. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  19794. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  19795. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  19796. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  19797. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  19798. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  19799. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  19800. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400]],
  19801. device='cuda:0', dtype=torch.float64)
  19802. predictions are: tensor([[ 0.5512, -0.4012, 1.5784, -0.9252, -0.4582, -0.8089, 0.3276, 0.1340],
  19803. [ 0.4327, -0.5581, 1.7039, 0.5004, -0.5014, 0.0815, 0.4479, 0.0676],
  19804. [ 0.4325, -0.4672, 0.9178, -1.0695, -0.3671, -1.2160, 0.0401, 0.3845],
  19805. [ 0.4380, -0.4994, 1.1840, -1.0801, -0.3987, -0.9658, 0.3837, 0.2877],
  19806. [ 0.4125, -0.4639, 1.6765, -0.6351, -0.6692, -0.6472, 0.0339, 0.1250],
  19807. [ 0.5317, -0.4280, 1.4851, -0.9166, -0.4635, -0.7955, 0.3967, 0.1464],
  19808. [ 0.5392, -0.4849, 1.8711, 0.0163, -0.5591, -0.0264, 0.6641, 0.2175],
  19809. [ 0.4610, -0.4635, 1.2291, -1.0568, -0.2196, -1.1458, 0.3517, 0.3011]],
  19810. device='cuda:0', grad_fn=<AddmmBackward>)
  19811. landmarks are: tensor([[[ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  19812. 0.0851],
  19813. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  19814. -0.1492],
  19815. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  19816. 0.3007],
  19817. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  19818. 0.1698],
  19819. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  19820. -0.0340],
  19821. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  19822. 0.0807],
  19823. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  19824. 0.1779],
  19825. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  19826. 0.2083]]], device='cuda:0')
  19827. loss_train_step before backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  19828. loss_train_step after backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  19829. loss_train: 0.25693511217832565
  19830. step: 14
  19831. running loss: 0.018352508012737547
  19832. Train Steps: 14/90 Loss: 0.0184 torch.Size([8, 600, 800])
  19833. torch.Size([8, 8])
  19834. tensor([[0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  19835. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  19836. [0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  19837. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  19838. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  19839. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  19840. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  19841. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901]],
  19842. device='cuda:0', dtype=torch.float64)
  19843. predictions are: tensor([[ 0.5322, -0.4184, 1.0965, -1.2336, -0.5849, -1.0054, 0.0292, 0.1176],
  19844. [ 0.6723, -0.3306, 0.9867, -1.1890, -0.4479, -1.1556, 0.2707, 0.3578],
  19845. [ 0.4028, -0.5790, 1.8348, 0.1465, -0.5165, 0.0932, 0.5661, 0.0781],
  19846. [ 0.6797, -0.3641, 1.9693, -0.1283, -0.6853, -0.4126, 0.5338, 0.0233],
  19847. [ 0.6101, -0.3995, 1.8501, -0.2459, -0.1648, 0.1547, 0.4233, 0.2387],
  19848. [ 0.5019, -0.4424, 1.6876, 0.3924, -0.2844, -0.1806, 0.2704, 0.4552],
  19849. [ 0.2637, -0.5703, 1.0420, -1.2051, -0.4135, -1.2683, 0.0640, 0.3140],
  19850. [ 0.7188, -0.3408, 1.7550, -0.8725, -0.6918, -0.6287, 0.5274, 0.0789]],
  19851. device='cuda:0', grad_fn=<AddmmBackward>)
  19852. landmarks are: tensor([[[ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  19853. 0.0802],
  19854. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  19855. 0.2622],
  19856. [ 0.6010, -0.4321, 1.6517, 0.2160, -0.4210, 0.0774, 0.6356,
  19857. 0.0313],
  19858. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  19859. 0.1005],
  19860. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  19861. 0.2853],
  19862. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  19863. 0.4470],
  19864. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  19865. 0.3469],
  19866. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  19867. -0.0220]]], device='cuda:0')
  19868. loss_train_step before backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  19869. loss_train_step after backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  19870. loss_train: 0.2669285275042057
  19871. step: 15
  19872. running loss: 0.017795235166947046
  19873. Train Steps: 15/90 Loss: 0.0178 torch.Size([8, 600, 800])
  19874. torch.Size([8, 8])
  19875. tensor([[0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  19876. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  19877. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  19878. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  19879. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  19880. [0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650],
  19881. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  19882. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114]],
  19883. device='cuda:0', dtype=torch.float64)
  19884. predictions are: tensor([[ 7.4917e-01, -2.9123e-01, 1.6643e+00, -7.0021e-02, -5.4613e-01,
  19885. 1.4726e-02, 8.5315e-01, 2.3208e-01],
  19886. [ 8.6743e-01, -1.8532e-01, 1.3006e+00, -1.5328e+00, -2.5562e-01,
  19887. -1.6725e+00, 4.7231e-01, 1.7271e-02],
  19888. [ 5.4636e-01, -3.7996e-01, 1.6489e+00, -4.4702e-01, -2.6623e-01,
  19889. 3.5819e-02, 3.5702e-01, 3.4274e-01],
  19890. [ 4.5332e-01, -4.3862e-01, 1.6072e+00, -5.8392e-01, -5.8043e-01,
  19891. 1.6829e-02, 4.6827e-01, 2.7635e-01],
  19892. [ 5.6296e-01, -3.9525e-01, 1.6733e+00, -2.4120e-01, -5.7210e-01,
  19893. -2.1659e-01, 1.4990e-01, 1.5060e-01],
  19894. [ 5.0192e-01, -4.1994e-01, 1.5758e+00, 1.8359e-01, -5.1492e-01,
  19895. -4.4539e-01, 2.1972e-01, 2.5103e-01],
  19896. [ 5.4839e-01, -4.0392e-01, 1.6198e+00, -1.2432e-01, -5.0563e-01,
  19897. -2.9601e-01, 7.4577e-02, 1.6226e-01],
  19898. [ 5.4278e-01, -4.0608e-01, 1.6447e+00, -8.1759e-02, -3.0073e-01,
  19899. -3.1521e-04, 3.1638e-01, 1.0237e-01]], device='cuda:0',
  19900. grad_fn=<AddmmBackward>)
  19901. landmarks are: tensor([[[ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  19902. 0.2249],
  19903. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  19904. -0.0530],
  19905. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  19906. 0.4316],
  19907. [ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  19908. 0.1852],
  19909. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  19910. 0.2035],
  19911. [ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  19912. 0.3238],
  19913. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  19914. 0.1854],
  19915. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  19916. 0.0764]]], device='cuda:0')
  19917. loss_train_step before backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  19918. loss_train_step after backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  19919. loss_train: 0.2889367938041687
  19920. step: 16
  19921. running loss: 0.018058549612760544
  19922.  
  19923. Train Steps: 16/90 Loss: 0.0181 torch.Size([8, 600, 800])
  19924. torch.Size([8, 8])
  19925. tensor([[0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  19926. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  19927. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  19928. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  19929. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  19930. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  19931. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  19932. [0.6277, 0.4083, 0.8350, 0.2717, 0.4562, 0.1800, 0.5918, 0.4878]],
  19933. device='cuda:0', dtype=torch.float64)
  19934. predictions are: tensor([[ 5.1427e-01, -4.1541e-01, 1.5883e+00, -6.4958e-02, -2.9016e-01,
  19935. 1.5929e-03, 1.6787e-01, 2.4338e-01],
  19936. [ 7.8892e-01, -2.8638e-01, 1.8092e+00, -2.2893e-01, -4.9548e-01,
  19937. 9.6385e-02, 7.4152e-01, 1.4290e-01],
  19938. [ 6.8751e-01, -3.0935e-01, 1.6456e+00, -3.5264e-01, -5.5861e-01,
  19939. -2.3207e-01, 2.7769e-01, 2.3544e-01],
  19940. [ 7.5018e-01, -3.1599e-01, 1.6878e+00, 2.2710e-01, -5.1088e-01,
  19941. -2.6419e-01, 6.2945e-01, 1.2593e-02],
  19942. [ 6.6079e-01, -3.3558e-01, 1.6973e+00, -3.2839e-01, -6.2279e-01,
  19943. -3.0419e-01, 4.1372e-01, 1.6635e-01],
  19944. [ 5.2827e-01, -3.7146e-01, 1.0872e+00, -1.0771e+00, -6.6342e-01,
  19945. -8.6333e-01, 2.2034e-01, 3.3167e-01],
  19946. [ 5.4088e-01, -4.0553e-01, 1.7217e+00, -8.6147e-02, -1.6320e-01,
  19947. 1.2475e-01, 3.7833e-01, 2.1609e-01],
  19948. [ 4.0423e-01, -4.5951e-01, 1.3544e+00, -1.2396e+00, -2.0415e-01,
  19949. -1.3715e+00, 2.6294e-01, 7.7104e-02]], device='cuda:0',
  19950. grad_fn=<AddmmBackward>)
  19951. landmarks are: tensor([[[ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  19952. 0.2386],
  19953. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  19954. 0.1236],
  19955. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  19956. 0.3469],
  19957. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  19958. -0.0049],
  19959. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  19960. 0.0727],
  19961. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  19962. 0.3694],
  19963. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  19964. 0.0592],
  19965. [ 0.6132, -0.4002, 1.5709, -1.0311, -0.1785, -1.4545, 0.4474,
  19966. -0.0328]]], device='cuda:0')
  19967. loss_train_step before backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  19968. loss_train_step after backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  19969. loss_train: 0.3035747576504946
  19970. step: 17
  19971. running loss: 0.017857338685323212
  19972. Train Steps: 17/90 Loss: 0.0179 torch.Size([8, 600, 800])
  19973. torch.Size([8, 8])
  19974. tensor([[0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  19975. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  19976. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  19977. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  19978. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  19979. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  19980. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  19981. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064]],
  19982. device='cuda:0', dtype=torch.float64)
  19983. predictions are: tensor([[ 0.7755, -0.2566, 1.2124, -1.1970, -0.2807, -1.3949, 0.4493, 0.0860],
  19984. [ 0.6724, -0.2987, 1.2744, -0.9307, -0.5428, -0.9535, 0.2306, 0.0451],
  19985. [ 0.5606, -0.4360, 1.8056, -0.0158, -0.4819, 0.1948, 0.5600, 0.1729],
  19986. [ 0.4362, -0.4670, 1.2045, -0.9879, -0.5975, -0.6874, 0.2234, 0.1330],
  19987. [ 0.5636, -0.4414, 1.9031, -0.1640, -0.5636, -0.0504, 0.6355, 0.0259],
  19988. [ 0.7105, -0.3035, 1.0117, -1.1499, -0.4594, -1.1200, 0.4641, 0.2386],
  19989. [ 0.5666, -0.4205, 1.8395, -0.2656, -0.5567, -0.3416, 0.5523, 0.3514],
  19990. [ 0.4156, -0.5127, 1.7689, 0.0910, 0.0355, 0.0478, 0.2672, 0.1672]],
  19991. device='cuda:0', grad_fn=<AddmmBackward>)
  19992. landmarks are: tensor([[[ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  19993. 0.1082],
  19994. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  19995. -0.1031],
  19996. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  19997. 0.1929],
  19998. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  19999. 0.0442],
  20000. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  20001. -0.0670],
  20002. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  20003. 0.2930],
  20004. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  20005. 0.3238],
  20006. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  20007. 0.0532]]], device='cuda:0')
  20008. loss_train_step before backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  20009. loss_train_step after backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  20010. loss_train: 0.3108562519773841
  20011. step: 18
  20012. running loss: 0.01726979177652134
  20013. Train Steps: 18/90 Loss: 0.0173 torch.Size([8, 600, 800])
  20014. torch.Size([8, 8])
  20015. tensor([[0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  20016. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  20017. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  20018. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  20019. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  20020. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  20021. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  20022. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183]],
  20023. device='cuda:0', dtype=torch.float64)
  20024. predictions are: tensor([[ 0.6249, -0.3117, 1.7247, -0.4558, -0.2784, -1.0430, 0.3631, 0.0424],
  20025. [ 0.5624, -0.4253, 1.5911, -1.0202, 0.0873, -1.0461, 0.9152, 0.1176],
  20026. [ 0.4162, -0.4453, 0.9554, -0.9243, -0.5591, -0.8039, 0.1167, 0.2402],
  20027. [ 0.5104, -0.4898, 1.7279, -0.0447, -0.4961, 0.3425, 0.7043, 0.1548],
  20028. [ 0.5848, -0.3563, 1.2298, -1.0580, -0.2116, -1.2383, 0.4013, 0.1006],
  20029. [ 0.5874, -0.3731, 1.3149, -0.9523, -0.3525, -1.0013, 0.5720, 0.1029],
  20030. [ 0.3819, -0.4549, 1.5499, -0.3267, -0.6556, -0.6680, -0.0268, 0.1221],
  20031. [ 0.7683, -0.3051, 1.7793, -0.1137, -0.4840, 0.5970, 0.6887, 0.1274]],
  20032. device='cuda:0', grad_fn=<AddmmBackward>)
  20033. landmarks are: tensor([[[ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  20034. 0.0171],
  20035. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  20036. 0.1982],
  20037. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  20038. 0.3315],
  20039. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  20040. 0.1004],
  20041. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  20042. 0.2237],
  20043. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  20044. 0.1879],
  20045. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  20046. 0.2116],
  20047. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  20048. 0.1082]]], device='cuda:0')
  20049. loss_train_step before backward: tensor(0.0143, device='cuda:0', grad_fn=<MseLossBackward>)
  20050. loss_train_step after backward: tensor(0.0143, device='cuda:0', grad_fn=<MseLossBackward>)
  20051. loss_train: 0.3251751000061631
  20052. step: 19
  20053. running loss: 0.017114478947692795
  20054. Train Steps: 19/90 Loss: 0.0171 torch.Size([8, 600, 800])
  20055. torch.Size([8, 8])
  20056. tensor([[0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  20057. [0.6266, 0.4101, 0.8350, 0.2333, 0.3950, 0.2950, 0.6264, 0.4921],
  20058. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  20059. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  20060. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  20061. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  20062. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  20063. [0.6260, 0.4120, 0.8013, 0.2350, 0.4888, 0.1533, 0.6281, 0.4895]],
  20064. device='cuda:0', dtype=torch.float64)
  20065. predictions are: tensor([[ 6.3753e-01, -3.0106e-01, 1.7238e+00, -5.3725e-01, -4.3524e-01,
  20066. -8.7413e-01, 2.8037e-01, 1.2785e-01],
  20067. [ 7.4946e-01, -2.6226e-01, 1.4602e+00, -1.1061e+00, -3.8495e-01,
  20068. -8.8866e-01, 5.5216e-01, 3.8942e-02],
  20069. [ 5.6102e-01, -3.5893e-01, 1.1527e+00, -1.0360e+00, -5.2439e-01,
  20070. -6.7386e-01, 1.5924e-01, 1.1717e-01],
  20071. [-1.0101e+00, -1.4053e+00, 1.1850e+00, -1.0470e+00, -4.7518e-01,
  20072. -1.0037e+00, -4.8302e-02, 1.9874e-01],
  20073. [ 8.3262e-01, -2.4918e-01, 1.6203e+00, 3.0693e-01, -3.8922e-01,
  20074. 1.4029e-01, 6.9893e-01, 5.8639e-02],
  20075. [ 9.2227e-01, -1.9825e-01, 1.8672e+00, -6.0081e-02, -4.7998e-01,
  20076. 2.9148e-02, 8.5436e-01, 8.6164e-02],
  20077. [ 7.5961e-01, -2.9459e-01, 1.6385e+00, 1.3106e-01, -3.7348e-01,
  20078. 1.4454e-01, 6.9711e-01, 1.6616e-01],
  20079. [ 7.5710e-01, -2.3514e-01, 1.3542e+00, -1.1528e+00, 1.2851e-03,
  20080. -1.4269e+00, 5.6705e-01, 8.8829e-02]], device='cuda:0',
  20081. grad_fn=<AddmmBackward>)
  20082. landmarks are: tensor([[[ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  20083. 0.2139],
  20084. [ 0.6081, -0.3918, 1.5709, -1.2082, -0.4614, -0.9233, 0.6072,
  20085. -0.0129],
  20086. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  20087. 0.0442],
  20088. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  20089. 0.3161],
  20090. [ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  20091. 0.1447],
  20092. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  20093. 0.2516],
  20094. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  20095. 0.1715],
  20096. [ 0.6053, -0.3830, 1.4150, -1.2005, -0.0284, -1.5777, 0.6154,
  20097. -0.0250]]], device='cuda:0')
  20098. loss_train_step before backward: tensor(0.0515, device='cuda:0', grad_fn=<MseLossBackward>)
  20099. loss_train_step after backward: tensor(0.0515, device='cuda:0', grad_fn=<MseLossBackward>)
  20100. loss_train: 0.37666080240160227
  20101. step: 20
  20102. running loss: 0.018833040120080115
  20103.  
  20104. Train Steps: 20/90 Loss: 0.0188 torch.Size([8, 600, 800])
  20105. torch.Size([8, 8])
  20106. tensor([[0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  20107. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  20108. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  20109. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  20110. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  20111. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  20112. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  20113. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960]],
  20114. device='cuda:0', dtype=torch.float64)
  20115. predictions are: tensor([[ 0.4839, -0.5000, 1.6635, 0.1886, -0.3307, -0.3211, 0.7333, 0.2023],
  20116. [ 0.6194, -0.3507, 1.4114, -0.9203, -0.3818, -0.8013, 0.4622, 0.0413],
  20117. [ 0.6624, -0.3586, 1.8314, -0.1974, -0.5329, 0.0903, 0.6837, 0.1530],
  20118. [ 0.8656, -0.2259, 1.5109, -0.8773, -0.4817, -0.4769, 0.8409, 0.1297],
  20119. [ 0.8424, -0.2204, 1.4692, -1.0215, -0.1932, -1.1525, 0.6111, -0.0318],
  20120. [ 0.6292, -0.3355, 1.4958, -0.4595, -0.6039, -0.3666, 0.1997, 0.0866],
  20121. [-0.7059, -1.2208, 0.8391, -1.2020, -0.2385, -1.2981, 0.0876, 0.3023],
  20122. [ 0.7580, -0.2258, 1.6574, -0.7458, -0.0913, -1.0447, 0.4986, 0.0383]],
  20123. device='cuda:0', grad_fn=<AddmmBackward>)
  20124. landmarks are: tensor([[[ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  20125. 0.3692],
  20126. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  20127. 0.0807],
  20128. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  20129. 0.1390],
  20130. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  20131. 0.1608],
  20132. [ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  20133. -0.0583],
  20134. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  20135. -0.1151],
  20136. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  20137. 0.3469],
  20138. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  20139. 0.0051]]], device='cuda:0')
  20140. loss_train_step before backward: tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward>)
  20141. loss_train_step after backward: tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward>)
  20142. loss_train: 0.4566794792190194
  20143. step: 21
  20144. running loss: 0.02174664186757235
  20145. Train Steps: 21/90 Loss: 0.0217 torch.Size([8, 600, 800])
  20146. torch.Size([8, 8])
  20147. tensor([[0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  20148. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  20149. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  20150. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  20151. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  20152. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  20153. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  20154. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391]],
  20155. device='cuda:0', dtype=torch.float64)
  20156. predictions are: tensor([[ 0.7002, -0.3247, 1.2085, -1.4291, -0.0743, -1.4957, 0.4974, -0.0724],
  20157. [ 0.4774, -0.4847, 1.7084, 0.1631, -0.4217, -0.1387, 0.7403, 0.0630],
  20158. [ 0.5838, -0.3842, 1.6920, -0.6905, -0.5661, -0.2903, 0.6077, 0.2382],
  20159. [ 0.5264, -0.4329, 1.6813, -0.0333, -0.4499, -0.3091, 0.4960, 0.1460],
  20160. [ 0.7125, -0.3116, 1.7807, -0.0740, -0.3466, -0.4352, 0.7564, 0.0296],
  20161. [ 0.3954, -0.4781, 1.2758, -0.6132, -0.4806, -0.7404, 0.2370, 0.3153],
  20162. [ 0.7172, -0.2866, 1.5352, -0.8002, -0.5477, -0.3290, 0.5524, 0.1585],
  20163. [ 0.5864, -0.3569, 1.5866, -0.9917, -0.2150, -1.0676, 0.5041, 0.0485]],
  20164. device='cuda:0', grad_fn=<AddmmBackward>)
  20165. landmarks are: tensor([[[ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  20166. -0.0248],
  20167. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  20168. 0.1608],
  20169. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  20170. 0.3315],
  20171. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  20172. 0.2545],
  20173. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  20174. 0.1661],
  20175. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  20176. 0.4470],
  20177. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  20178. 0.2391],
  20179. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  20180. 0.2043]]], device='cuda:0')
  20181. loss_train_step before backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  20182. loss_train_step after backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  20183. loss_train: 0.46885613538324833
  20184. step: 22
  20185. running loss: 0.02131164251742038
  20186. Train Steps: 22/90 Loss: 0.0213 torch.Size([8, 600, 800])
  20187. torch.Size([8, 8])
  20188. tensor([[0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  20189. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  20190. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  20191. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  20192. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  20193. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077],
  20194. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  20195. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683]],
  20196. device='cuda:0', dtype=torch.float64)
  20197. predictions are: tensor([[ 0.6196, -0.3860, 1.7935, 0.0901, -0.3193, 0.3917, 0.6185, 0.0979],
  20198. [ 0.4539, -0.5063, 1.5252, 0.2251, -0.4727, 0.1093, 0.7826, 0.1797],
  20199. [ 0.6377, -0.3392, 1.3309, -1.1378, -0.4062, -1.0118, 0.6385, 0.1555],
  20200. [ 0.4766, -0.4483, 1.3842, -1.0258, -0.1972, -1.3189, 0.4875, 0.1217],
  20201. [ 0.6683, -0.3750, 1.4588, -0.9875, -0.2644, -1.2481, 0.7489, 0.0369],
  20202. [ 0.4246, -0.4852, 1.4205, -0.7114, -0.6263, -0.5640, 0.2431, 0.1097],
  20203. [ 0.5375, -0.3941, 1.6243, -1.0296, -0.0724, -1.3532, 0.6481, 0.0064],
  20204. [ 0.5658, -0.3992, 1.6959, -0.5945, -0.7086, -0.3629, 0.4398, 0.2220]],
  20205. device='cuda:0', grad_fn=<AddmmBackward>)
  20206. landmarks are: tensor([[[ 5.9913e-01, -3.8029e-01, 1.8018e+00, -5.3426e-02, -3.4596e-01,
  20207. 1.8522e-01, 5.3741e-01, 1.3903e-01],
  20208. [ 6.1907e-01, -4.2971e-01, 1.4612e+00, 2.3911e-01, -4.9607e-01,
  20209. 3.1255e-02, 1.1166e+00, 1.7680e-01],
  20210. [ 5.7754e-01, -4.0539e-01, 1.2245e+00, -1.3082e+00, -4.2102e-01,
  20211. -1.0080e+00, 5.4896e-01, 2.7760e-01],
  20212. [ 5.7679e-01, -4.0308e-01, 1.3838e+00, -1.1527e+00, -2.1876e-01,
  20213. -1.4216e+00, 4.3790e-01, 1.8502e-01],
  20214. [ 6.1322e-01, -4.2479e-01, 1.5247e+00, -1.1620e+00, -2.8822e-01,
  20215. -1.3159e+00, 6.5445e-01, 1.1931e-01],
  20216. [ 5.2702e-01, -4.3356e-01, 1.3342e+00, -6.7698e-01, -6.5196e-01,
  20217. -5.3841e-01, 2.3702e-01, 5.9193e-02],
  20218. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  20219. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  20220. [ 5.8672e-01, -3.9369e-01, 1.7499e+00, -7.1547e-01, -6.4042e-01,
  20221. -3.8445e-01, 4.7390e-01, 3.3918e-01]]], device='cuda:0')
  20222. loss_train_step before backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  20223. loss_train_step after backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  20224. loss_train: 0.4768888894468546
  20225. step: 23
  20226. running loss: 0.02073429954116759
  20227. Train Steps: 23/90 Loss: 0.0207 torch.Size([8, 600, 800])
  20228. torch.Size([8, 8])
  20229. tensor([[0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  20230. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  20231. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  20232. [ nan, nan, 0.8850, 0.2817, 0.5112, 0.2183, 0.7184, 0.5436],
  20233. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  20234. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  20235. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  20236. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783]],
  20237. device='cuda:0', dtype=torch.float64)
  20238. predictions are: tensor([[ 6.4015e-01, -3.2741e-01, 1.5286e+00, -5.8203e-01, -2.0736e-01,
  20239. -1.0390e+00, 3.7237e-01, 3.1638e-01],
  20240. [ 7.2093e-01, -2.9143e-01, 1.7759e+00, -1.1026e+00, -2.6972e-01,
  20241. -1.1049e+00, 7.2239e-01, -1.2084e-01],
  20242. [ 8.0535e-01, -2.6231e-01, 1.2904e+00, -1.1777e+00, -3.5370e-01,
  20243. -1.2656e+00, 5.2912e-01, -1.9021e-02],
  20244. [-5.5371e-01, -1.1874e+00, 1.8828e+00, -1.1686e+00, -5.8424e-03,
  20245. -1.0682e+00, 1.1814e+00, 1.2185e-01],
  20246. [ 5.2261e-01, -4.1431e-01, 1.4245e+00, -1.9491e-01, -5.6756e-01,
  20247. -6.1366e-01, 3.0487e-01, 4.5116e-01],
  20248. [ 5.1992e-01, -4.8953e-01, 1.7885e+00, -5.3513e-02, -4.4506e-01,
  20249. 3.5400e-01, 6.2226e-01, 1.5005e-01],
  20250. [ 8.1954e-01, -3.3110e-01, 1.7693e+00, 2.3936e-01, -6.8419e-01,
  20251. -1.6167e-03, 7.2799e-01, 3.1313e-02],
  20252. [ 6.6607e-01, -3.6078e-01, 9.4744e-01, -1.1733e+00, -5.2266e-01,
  20253. -1.1170e+00, 3.4295e-01, 1.2331e-01]], device='cuda:0',
  20254. grad_fn=<AddmmBackward>)
  20255. landmarks are: tensor([[[ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  20256. 0.5882],
  20257. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  20258. -0.0209],
  20259. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  20260. 0.2203],
  20261. [-2.2859, -2.2859, 1.8018, -0.9849, 0.0755, -1.2774, 1.0326,
  20262. 0.2249],
  20263. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  20264. 0.5071],
  20265. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  20266. 0.2391],
  20267. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  20268. 0.0291],
  20269. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  20270. 0.3852]]], device='cuda:0')
  20271. loss_train_step before backward: tensor(0.0837, device='cuda:0', grad_fn=<MseLossBackward>)
  20272. loss_train_step after backward: tensor(0.0837, device='cuda:0', grad_fn=<MseLossBackward>)
  20273. loss_train: 0.5606125611811876
  20274. step: 24
  20275. running loss: 0.02335885671588282
  20276.  
  20277. Train Steps: 24/90 Loss: 0.0234 torch.Size([8, 600, 800])
  20278. torch.Size([8, 8])
  20279. tensor([[0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  20280. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  20281. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  20282. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  20283. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  20284. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  20285. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  20286. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100]],
  20287. device='cuda:0', dtype=torch.float64)
  20288. predictions are: tensor([[ 0.7548, -0.3042, 1.0104, -1.2783, -0.3081, -1.4168, 0.4733, 0.0882],
  20289. [ 0.3597, -0.5199, 1.6652, -0.3600, -0.5313, -0.7199, 0.4997, 0.3743],
  20290. [ 1.0061, -0.1646, 1.8598, -0.2678, -0.5175, 0.0687, 0.8785, 0.2038],
  20291. [-1.9778, -2.1261, 1.0573, -1.3015, -0.3206, -1.1825, 0.1999, 0.2042],
  20292. [ 0.6407, -0.3564, 1.7933, -0.4605, -0.3934, -0.7640, 0.5918, 0.2892],
  20293. [ 0.9847, -0.1499, 1.5094, -1.0364, -0.2792, -1.1041, 0.7410, 0.0412],
  20294. [ 0.8230, -0.2356, 1.6608, -0.5814, -0.5504, -0.7949, 0.4448, 0.0940],
  20295. [ 0.9102, -0.2794, 1.8353, -0.3655, -0.5575, -0.4388, 0.9005, 0.0544]],
  20296. device='cuda:0', grad_fn=<AddmmBackward>)
  20297. landmarks are: tensor([[[ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  20298. 0.2906],
  20299. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  20300. 0.3238],
  20301. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  20302. 0.3161],
  20303. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  20304. 0.2930],
  20305. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  20306. 0.3928],
  20307. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  20308. 0.1929],
  20309. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  20310. 0.2237],
  20311. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  20312. 0.0697]]], device='cuda:0')
  20313. loss_train_step before backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  20314. loss_train_step after backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  20315. loss_train: 0.5856962967664003
  20316. step: 25
  20317. running loss: 0.023427851870656012
  20318. Train Steps: 25/90 Loss: 0.0234 torch.Size([8, 600, 800])
  20319. torch.Size([8, 8])
  20320. tensor([[ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  20321. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  20322. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950],
  20323. [0.6197, 0.3986, 0.8800, 0.4617, 0.4188, 0.4783, 0.5687, 0.5550],
  20324. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  20325. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  20326. [0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  20327. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980]],
  20328. device='cuda:0', dtype=torch.float64)
  20329. predictions are: tensor([[-2.1749, -2.2414, 1.2203, -1.2753, -0.2672, -1.2905, 0.4293, 0.2614],
  20330. [ 0.8052, -0.2676, 1.6369, -0.9690, -0.5289, -1.0819, 0.6849, 0.2336],
  20331. [ 0.7062, -0.3927, 1.7734, 0.1701, -0.3351, 0.0147, 0.6362, 0.0818],
  20332. [ 0.6538, -0.3901, 1.7930, -0.1344, -0.4454, -0.0750, 0.6346, 0.2179],
  20333. [ 0.7714, -0.2682, 1.5192, -1.0016, -0.5511, -1.1028, 0.7895, 0.1417],
  20334. [ 0.8999, -0.1971, 1.8160, -0.1320, -0.1471, 0.0496, 0.6020, 0.2215],
  20335. [ 0.9350, -0.1469, 1.1757, -0.9296, -0.3252, -1.4202, 0.5431, 0.3288],
  20336. [ 0.6527, -0.3576, 1.3160, -0.9865, -0.6031, -1.0946, 0.3418, -0.0273]],
  20337. device='cuda:0', grad_fn=<AddmmBackward>)
  20338. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 9.1750e-01, -1.3947e+00, -3.6905e-01,
  20339. -1.2467e+00, 2.3141e-01, 3.2379e-01],
  20340. [ 5.7783e-01, -3.9299e-01, 1.5189e+00, -9.3872e-01, -4.3256e-01,
  20341. -9.1563e-01, 4.8545e-01, 3.3918e-01],
  20342. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  20343. 5.4350e-02, 4.9700e-01, 4.6189e-04],
  20344. [ 5.7627e-01, -4.4503e-01, 1.7788e+00, -1.5350e-01, -3.5173e-01,
  20345. -7.6520e-02, 3.4111e-01, 2.7760e-01],
  20346. [ 5.9766e-01, -3.7916e-01, 1.2995e+00, -1.0311e+00, -5.1917e-01,
  20347. -8.3865e-01, 5.8360e-01, 2.1601e-01],
  20348. [ 5.5381e-01, -4.1386e-01, 1.7557e+00, -1.8430e-01, -4.5897e-02,
  20349. 1.2417e-01, 4.2194e-01, 2.8530e-01],
  20350. [ 5.8412e-01, -3.5743e-01, 1.0859e+00, -9.5412e-01, -2.8245e-01,
  20351. -1.2851e+00, 3.4601e-01, 3.8081e-01],
  20352. [ 5.2194e-01, -4.5504e-01, 1.1415e+00, -9.1962e-01, -6.4042e-01,
  20353. -9.3872e-01, 1.8562e-01, 1.4106e-02]]], device='cuda:0')
  20354. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  20355. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  20356. loss_train: 0.606036888435483
  20357. step: 26
  20358. running loss: 0.02330911109367242
  20359. Train Steps: 26/90 Loss: 0.0233 torch.Size([8, 600, 800])
  20360. torch.Size([8, 8])
  20361. tensor([[0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  20362. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  20363. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  20364. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578],
  20365. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  20366. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  20367. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  20368. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412]],
  20369. device='cuda:0', dtype=torch.float64)
  20370. predictions are: tensor([[ 8.0656e-01, -2.6370e-01, 1.5694e+00, -7.0661e-01, -6.7750e-01,
  20371. -6.1102e-01, 4.4837e-01, 1.7196e-01],
  20372. [ 8.3816e-01, -2.6449e-01, 1.4815e+00, -9.9043e-01, -6.0364e-01,
  20373. -6.2400e-01, 7.4873e-01, 1.6229e-01],
  20374. [ 7.6048e-01, -3.0167e-01, 1.4651e+00, 1.3264e-01, -4.7946e-01,
  20375. -7.3808e-01, 4.7905e-01, 5.3412e-01],
  20376. [-2.4250e+00, -2.4390e+00, 1.1478e+00, -1.2399e+00, -4.5536e-01,
  20377. -1.1712e+00, 1.5048e-01, 2.7632e-01],
  20378. [ 9.2886e-01, -2.3300e-01, 1.6681e+00, 3.6170e-02, -4.2982e-01,
  20379. -2.4203e-02, 1.0275e+00, 1.7328e-01],
  20380. [ 7.3659e-01, -3.2591e-01, 1.6391e+00, -1.1892e+00, -4.0055e-01,
  20381. -1.3278e+00, 5.5345e-01, 4.1518e-02],
  20382. [ 7.4341e-01, -3.3253e-01, 1.7754e+00, -2.0403e-01, -2.2468e-03,
  20383. -5.2091e-02, 6.5368e-01, 2.7859e-01],
  20384. [ 7.0976e-01, -3.3546e-01, 1.8470e+00, -7.5960e-01, -4.6156e-01,
  20385. -1.2449e+00, 5.1825e-01, 1.3950e-01]], device='cuda:0',
  20386. grad_fn=<AddmmBackward>)
  20387. landmarks are: tensor([[[ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  20388. 0.2365],
  20389. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  20390. 0.1159],
  20391. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  20392. 0.4778],
  20393. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  20394. 0.2905],
  20395. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  20396. 0.1715],
  20397. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  20398. 0.0851],
  20399. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  20400. 0.2853],
  20401. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  20402. 0.2139]]], device='cuda:0')
  20403. loss_train_step before backward: tensor(0.0194, device='cuda:0', grad_fn=<MseLossBackward>)
  20404. loss_train_step after backward: tensor(0.0194, device='cuda:0', grad_fn=<MseLossBackward>)
  20405. loss_train: 0.6254050750285387
  20406. step: 27
  20407. running loss: 0.023163150926982914
  20408. Train Steps: 27/90 Loss: 0.0232 torch.Size([8, 600, 800])
  20409. torch.Size([8, 8])
  20410. tensor([[ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  20411. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  20412. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  20413. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  20414. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  20415. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  20416. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  20417. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133]],
  20418. device='cuda:0', dtype=torch.float64)
  20419. predictions are: tensor([[-2.3912, -2.4006, 1.1279, -1.3163, -0.4300, -1.4060, 0.2300, 0.2982],
  20420. [ 0.8388, -0.2334, 1.3732, -1.0759, -0.6614, -0.8011, 0.6057, 0.2207],
  20421. [ 0.7985, -0.2911, 1.6881, 0.1210, -0.2120, -0.0144, 0.3557, 0.1805],
  20422. [ 0.5698, -0.3962, 1.3641, -0.7297, -0.7064, -0.7499, 0.3289, 0.3488],
  20423. [ 0.6580, -0.3809, 1.7488, -0.0879, -0.1178, -0.1244, 0.4801, 0.3834],
  20424. [ 1.0398, -0.1747, 1.8704, 0.0921, -0.5262, 0.1024, 1.1594, 0.2341],
  20425. [ 0.6474, -0.3854, 1.4655, -1.3019, -0.1727, -1.7691, 0.7337, 0.1894],
  20426. [ 0.5760, -0.4059, 1.7574, -0.5579, -0.7147, -0.9041, 0.3207, 0.1653]],
  20427. device='cuda:0', grad_fn=<AddmmBackward>)
  20428. landmarks are: tensor([[[-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  20429. 0.1373],
  20430. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  20431. 0.2237],
  20432. [ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  20433. 0.0261],
  20434. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  20435. 0.3417],
  20436. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  20437. 0.3007],
  20438. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  20439. 0.2196],
  20440. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  20441. 0.1467],
  20442. [ 0.5393, -0.4294, 1.6575, -0.4075, -0.6635, -0.6308, 0.3296,
  20443. 0.0851]]], device='cuda:0')
  20444. loss_train_step before backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  20445. loss_train_step after backward: tensor(0.0175, device='cuda:0', grad_fn=<MseLossBackward>)
  20446. loss_train: 0.6429185438901186
  20447. step: 28
  20448. running loss: 0.022961376567504237
  20449.  
  20450. Train Steps: 28/90 Loss: 0.0230 torch.Size([8, 600, 800])
  20451. torch.Size([8, 8])
  20452. tensor([[0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  20453. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  20454. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  20455. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  20456. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  20457. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  20458. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  20459. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483]],
  20460. device='cuda:0', dtype=torch.float64)
  20461. predictions are: tensor([[ 0.3600, -0.5704, 1.3240, -1.3796, -0.1798, -1.6076, 0.5185, 0.2673],
  20462. [ 0.5784, -0.3890, 1.7528, -0.3822, -0.4831, 0.4132, 0.5336, 0.2449],
  20463. [ 0.4459, -0.5053, 1.4762, -1.3180, -0.2036, -1.4446, 0.5637, 0.2456],
  20464. [ 0.2246, -0.7033, 1.5671, 0.0254, -0.4486, -0.2696, 0.4713, 0.3428],
  20465. [ 0.5284, -0.4739, 1.8616, -0.5123, -0.5799, -0.8014, 0.6375, 0.2973],
  20466. [ 0.3499, -0.5930, 1.6678, -0.6075, -0.6182, -0.9334, 0.5179, 0.2470],
  20467. [ 0.6549, -0.4208, 1.5748, 0.0875, -0.4565, -0.0380, 0.7645, 0.2367],
  20468. [ 0.0652, -0.7456, 1.5443, -0.4409, -0.7221, -0.7115, 0.0813, 0.4008]],
  20469. device='cuda:0', grad_fn=<AddmmBackward>)
  20470. landmarks are: tensor([[[ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  20471. 0.2237],
  20472. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  20473. 0.0772],
  20474. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  20475. 0.2083],
  20476. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  20477. 0.2091],
  20478. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  20479. 0.1005],
  20480. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  20481. 0.1005],
  20482. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  20483. 0.0774],
  20484. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  20485. 0.2468]]], device='cuda:0')
  20486. loss_train_step before backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  20487. loss_train_step after backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  20488. loss_train: 0.6651229802519083
  20489. step: 29
  20490. running loss: 0.022935275181100286
  20491. Train Steps: 29/90 Loss: 0.0229 torch.Size([8, 600, 800])
  20492. torch.Size([8, 8])
  20493. tensor([[0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  20494. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  20495. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  20496. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  20497. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  20498. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  20499. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  20500. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667]],
  20501. device='cuda:0', dtype=torch.float64)
  20502. predictions are: tensor([[ 0.6743, -0.3775, 1.9492, -0.5144, -0.6510, -0.6040, 0.7542, 0.2366],
  20503. [ 0.4084, -0.5484, 0.8144, -1.2229, -0.4932, -1.3891, 0.2318, 0.3599],
  20504. [ 0.3393, -0.5796, 1.6478, -0.0665, -0.3251, -0.0515, 0.2467, 0.3376],
  20505. [ 0.7025, -0.3827, 1.7598, -0.0448, -0.4856, -0.1389, 0.9078, 0.2428],
  20506. [ 0.4087, -0.5155, 1.7943, -0.0300, -0.2215, 0.2901, 0.3834, 0.2715],
  20507. [ 0.5483, -0.4365, 1.2142, -1.0301, -0.6042, -1.1357, 0.1894, 0.0886],
  20508. [ 0.5886, -0.3989, 1.8939, -0.6754, -0.2331, -1.3781, 0.6624, 0.3241],
  20509. [-1.2400, -1.6479, 1.1698, -1.2162, -0.5687, -1.1057, 0.4281, 0.4191]],
  20510. device='cuda:0', grad_fn=<AddmmBackward>)
  20511. landmarks are: tensor([[[ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  20512. 0.1544],
  20513. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  20514. 0.3852],
  20515. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  20516. 0.3238],
  20517. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  20518. 0.1608],
  20519. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  20520. 0.0622],
  20521. [ 0.4997, -0.4446, 1.1610, -0.9772, -0.6058, -1.0311, 0.1404,
  20522. -0.1031],
  20523. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  20524. 0.1554],
  20525. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  20526. 0.3315]]], device='cuda:0')
  20527. loss_train_step before backward: tensor(0.0337, device='cuda:0', grad_fn=<MseLossBackward>)
  20528. loss_train_step after backward: tensor(0.0337, device='cuda:0', grad_fn=<MseLossBackward>)
  20529. loss_train: 0.6988462079316378
  20530. step: 30
  20531. running loss: 0.02329487359772126
  20532. Train Steps: 30/90 Loss: 0.0233 torch.Size([8, 600, 800])
  20533. torch.Size([8, 8])
  20534. tensor([[0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  20535. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  20536. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  20537. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  20538. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  20539. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  20540. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  20541. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297]],
  20542. device='cuda:0', dtype=torch.float64)
  20543. predictions are: tensor([[ 0.6474, -0.3811, 1.9037, -0.6287, -0.2022, -1.5291, 0.5346, 0.2287],
  20544. [ 0.5797, -0.4225, 1.7740, -0.1589, -0.1278, 0.2441, 0.5273, 0.3165],
  20545. [ 0.3275, -0.6175, 1.7052, -0.4999, -0.6740, -0.2583, 0.5826, 0.3372],
  20546. [ 0.0698, -0.7592, 1.6376, -0.3294, -0.4746, -0.4258, 0.0776, 0.3240],
  20547. [ 0.0830, -0.7637, 0.9233, -1.3943, -0.5709, -1.1773, 0.2773, 0.2900],
  20548. [ 0.2631, -0.6277, 1.5495, -0.5722, -0.5926, -0.8965, 0.4296, 0.3226],
  20549. [ 0.3554, -0.5687, 1.5380, -0.6126, -0.7502, -0.5382, 0.2942, 0.2498],
  20550. [ 0.5028, -0.5089, 1.7308, -0.0581, -0.4410, -0.0810, 0.8824, 0.2342]],
  20551. device='cuda:0', grad_fn=<AddmmBackward>)
  20552. landmarks are: tensor([[[ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  20553. 0.0171],
  20554. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  20555. 0.2699],
  20556. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  20557. 0.2083],
  20558. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  20559. 0.2409],
  20560. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  20561. 0.2699],
  20562. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  20563. 0.1621],
  20564. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  20565. 0.2365],
  20566. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  20567. 0.1608]]], device='cuda:0')
  20568. loss_train_step before backward: tensor(0.0212, device='cuda:0', grad_fn=<MseLossBackward>)
  20569. loss_train_step after backward: tensor(0.0212, device='cuda:0', grad_fn=<MseLossBackward>)
  20570. loss_train: 0.7200348284095526
  20571. step: 31
  20572. running loss: 0.023226929948695244
  20573. Train Steps: 31/90 Loss: 0.0232 torch.Size([8, 600, 800])
  20574. torch.Size([8, 8])
  20575. tensor([[0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  20576. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  20577. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  20578. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  20579. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  20580. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  20581. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  20582. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283]],
  20583. device='cuda:0', dtype=torch.float64)
  20584. predictions are: tensor([[ 0.6033, -0.4310, 1.8310, 0.4091, -0.5672, 0.0558, 0.7620, 0.1504],
  20585. [ 0.8779, -0.2438, 2.1329, -0.3252, -0.5712, -0.5649, 0.7217, 0.2011],
  20586. [-1.6352, -1.8747, 0.9210, -1.2440, -0.4025, -1.2805, 0.1456, 0.4208],
  20587. [-0.6913, -1.2824, 1.0063, -1.2538, -0.3921, -1.3718, 0.0689, 0.3489],
  20588. [ 0.7124, -0.3332, 1.8602, -0.3045, -0.5819, -0.0313, 0.3551, 0.0675],
  20589. [ 0.4150, -0.5009, 1.2186, -1.2239, -0.4369, -1.1337, 0.3174, 0.2731],
  20590. [ 0.6908, -0.3370, 1.6717, 0.3058, -0.4995, -0.0272, 0.5719, 0.5020],
  20591. [ 0.5956, -0.4108, 1.1865, -1.2724, -0.4142, -1.2213, 0.2497, 0.2512]],
  20592. device='cuda:0', grad_fn=<AddmmBackward>)
  20593. landmarks are: tensor([[[ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  20594. -0.1331],
  20595. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  20596. 0.1005],
  20597. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  20598. 0.3700],
  20599. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  20600. 0.2699],
  20601. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  20602. 0.0502],
  20603. [ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  20604. 0.3267],
  20605. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  20606. 0.5401],
  20607. [ 0.5850, -0.3925, 1.0513, -1.3467, -0.3517, -1.2620, 0.4739,
  20608. 0.1544]]], device='cuda:0')
  20609. loss_train_step before backward: tensor(0.1585, device='cuda:0', grad_fn=<MseLossBackward>)
  20610. loss_train_step after backward: tensor(0.1585, device='cuda:0', grad_fn=<MseLossBackward>)
  20611. loss_train: 0.8785099294036627
  20612. step: 32
  20613. running loss: 0.02745343529386446
  20614.  
  20615. Train Steps: 32/90 Loss: 0.0275 torch.Size([8, 600, 800])
  20616. torch.Size([8, 8])
  20617. tensor([[0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  20618. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  20619. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  20620. [0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  20621. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  20622. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  20623. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  20624. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436]],
  20625. device='cuda:0', dtype=torch.float64)
  20626. predictions are: tensor([[ 5.2940e-01, -4.4512e-01, 1.6529e+00, 1.7090e-01, -2.1387e-01,
  20627. 7.7426e-03, 6.9037e-01, 1.7068e-01],
  20628. [ 3.4147e-01, -5.6399e-01, 1.5299e+00, -8.4593e-01, -6.4986e-01,
  20629. -7.0577e-01, 4.4995e-01, 2.9445e-01],
  20630. [-1.7507e-03, -7.9282e-01, 1.6644e+00, -4.0141e-01, -4.2820e-01,
  20631. -1.7175e-01, 1.8599e-01, 1.2021e-01],
  20632. [ 2.9183e-01, -5.5249e-01, 1.0889e+00, -9.9410e-01, -6.0846e-01,
  20633. -4.8721e-01, 2.1527e-01, 3.2583e-01],
  20634. [ 3.6955e-01, -5.1423e-01, 1.5982e+00, -2.9987e-01, -6.4598e-01,
  20635. -8.5654e-01, -3.9592e-02, 2.8502e-01],
  20636. [ 3.0083e-01, -5.7450e-01, 1.6468e+00, -3.0167e-01, -4.3349e-01,
  20637. -5.5919e-01, -3.3376e-02, 2.7009e-01],
  20638. [ 5.5085e-01, -4.4781e-01, 1.8877e+00, -1.4398e-01, -5.1621e-01,
  20639. -3.5603e-01, 8.2913e-01, 1.9243e-01],
  20640. [ 4.9237e-01, -4.7212e-01, 1.7585e+00, -3.4924e-01, -4.0652e-01,
  20641. -2.1576e-01, 8.1910e-01, 3.0801e-01]], device='cuda:0',
  20642. grad_fn=<AddmmBackward>)
  20643. landmarks are: tensor([[[ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  20644. 0.1004],
  20645. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  20646. 0.2006],
  20647. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  20648. 0.0231],
  20649. [ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  20650. 0.1193],
  20651. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  20652. 0.2468],
  20653. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  20654. 0.2409],
  20655. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  20656. 0.2516],
  20657. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  20658. 0.2249]]], device='cuda:0')
  20659. loss_train_step before backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  20660. loss_train_step after backward: tensor(0.0250, device='cuda:0', grad_fn=<MseLossBackward>)
  20661. loss_train: 0.9034913182258606
  20662. step: 33
  20663. running loss: 0.02737852479472305
  20664. Train Steps: 33/90 Loss: 0.0274 torch.Size([8, 600, 800])
  20665. torch.Size([8, 8])
  20666. tensor([[ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  20667. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  20668. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  20669. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  20670. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  20671. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  20672. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  20673. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767]],
  20674. device='cuda:0', dtype=torch.float64)
  20675. predictions are: tensor([[-1.9099, -2.0520, 0.9409, -1.3096, -0.3855, -1.2464, 0.1902, 0.2886],
  20676. [ 0.5154, -0.4495, 1.7163, -0.2839, -0.3076, 0.1952, 0.4860, 0.1330],
  20677. [ 0.5209, -0.4609, 1.6231, -1.0219, -0.5351, -1.0031, 0.5578, 0.1162],
  20678. [ 0.5516, -0.4181, 1.5766, 0.2001, -0.1115, -0.0064, 0.2084, 0.1623],
  20679. [ 0.4060, -0.5142, 1.6260, -0.6436, -0.6285, -0.1200, 0.2998, 0.1566],
  20680. [ 0.7592, -0.2388, 1.3822, -0.2121, -0.4769, -0.7826, 0.2621, 0.4588],
  20681. [ 0.6406, -0.4045, 1.7779, -0.2040, -0.5504, -0.4587, 0.7782, 0.1341],
  20682. [ 0.6576, -0.3083, 1.6359, -0.1900, -0.5963, -0.8407, 0.2722, 0.2160]],
  20683. device='cuda:0', grad_fn=<AddmmBackward>)
  20684. landmarks are: tensor([[[-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  20685. 0.3084],
  20686. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  20687. 0.2314],
  20688. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  20689. 0.1931],
  20690. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  20691. 0.2138],
  20692. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  20693. 0.2776],
  20694. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  20695. 0.5071],
  20696. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  20697. 0.1768],
  20698. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  20699. 0.3778]]], device='cuda:0')
  20700. loss_train_step before backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  20701. loss_train_step after backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  20702. loss_train: 0.9148482903838158
  20703. step: 34
  20704. running loss: 0.026907302658347523
  20705. Train Steps: 34/90 Loss: 0.0269 torch.Size([8, 600, 800])
  20706. torch.Size([8, 8])
  20707. tensor([[0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  20708. [0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385],
  20709. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  20710. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  20711. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  20712. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  20713. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  20714. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436]],
  20715. device='cuda:0', dtype=torch.float64)
  20716. predictions are: tensor([[ 3.4211e-01, -5.5436e-01, 1.4170e+00, 6.1026e-02, -4.8594e-01,
  20717. -1.1325e-01, 7.7582e-01, 3.2171e-01],
  20718. [ 1.4285e-01, -6.6580e-01, 1.4183e+00, -1.1495e+00, -3.2002e-01,
  20719. -1.2133e+00, 6.1003e-01, 2.7405e-01],
  20720. [ 3.6311e-01, -4.9852e-01, 1.6690e+00, -1.9997e-01, -6.7210e-01,
  20721. -5.8863e-01, -4.3973e-02, 1.5990e-01],
  20722. [ 4.6845e-01, -4.8369e-01, 1.6665e+00, -1.5795e-02, -4.8026e-01,
  20723. -1.5836e-03, 2.7498e-01, 9.0587e-02],
  20724. [ 6.5483e-01, -3.1392e-01, 1.6959e+00, 2.6545e-01, -4.1626e-01,
  20725. -8.7995e-02, 4.2136e-01, 2.3797e-01],
  20726. [ 1.4710e-01, -6.7734e-01, 1.7470e+00, -3.3103e-01, -4.3827e-01,
  20727. -2.9471e-01, -9.0514e-03, 3.3535e-02],
  20728. [ 3.4537e-01, -5.5135e-01, 1.1529e+00, -1.3529e+00, -3.9643e-01,
  20729. -1.2332e+00, 2.8598e-01, 1.4165e-01],
  20730. [ 3.7841e-01, -5.3315e-01, 1.7237e+00, -4.0560e-01, -4.5712e-01,
  20731. -7.7054e-02, 7.7512e-01, 2.6182e-01]], device='cuda:0',
  20732. grad_fn=<AddmmBackward>)
  20733. landmarks are: tensor([[[ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  20734. 0.3478],
  20735. [ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  20736. 0.2012],
  20737. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  20738. 0.2071],
  20739. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  20740. 0.0663],
  20741. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  20742. 0.3007],
  20743. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  20744. -0.0220],
  20745. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  20746. 0.0438],
  20747. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  20748. 0.2249]]], device='cuda:0')
  20749. loss_train_step before backward: tensor(0.0243, device='cuda:0', grad_fn=<MseLossBackward>)
  20750. loss_train_step after backward: tensor(0.0243, device='cuda:0', grad_fn=<MseLossBackward>)
  20751. loss_train: 0.9391738977283239
  20752. step: 35
  20753. running loss: 0.02683353993509497
  20754. Train Steps: 35/90 Loss: 0.0268 torch.Size([8, 600, 800])
  20755. torch.Size([8, 8])
  20756. tensor([[0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  20757. [0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  20758. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  20759. [0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  20760. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  20761. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  20762. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  20763. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400]],
  20764. device='cuda:0', dtype=torch.float64)
  20765. predictions are: tensor([[ 0.9853, -0.0791, 1.4641, -0.3702, -0.1446, -1.0620, 0.2074, 0.3532],
  20766. [ 0.7470, -0.2884, 1.5556, -0.9633, -0.2606, -1.1213, 0.5230, 0.1062],
  20767. [ 0.7365, -0.3068, 1.7563, -0.0710, -0.4981, -0.0292, 0.3810, 0.1003],
  20768. [ 0.8464, -0.1846, 1.4369, -0.5832, -0.4998, -0.7952, 0.3272, 0.2525],
  20769. [-1.5989, -1.7973, 0.9184, -0.9933, -0.5291, -0.9933, 0.0321, 0.2860],
  20770. [-1.6922, -1.8783, 1.0217, -1.0603, -0.4737, -1.0298, 0.0809, 0.2151],
  20771. [ 0.7276, -0.3266, 1.7957, 0.2800, -0.4631, 0.1283, 0.7769, -0.0928],
  20772. [ 0.7260, -0.2884, 1.6461, -0.5658, -0.5884, -0.0756, 0.7037, 0.1972]],
  20773. device='cuda:0', grad_fn=<AddmmBackward>)
  20774. landmarks are: tensor([[[ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  20775. 0.5882],
  20776. [ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  20777. 0.1621],
  20778. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  20779. 0.3469],
  20780. [ 0.5935, -0.3558, 1.3284, -0.6924, -0.5249, -0.9618, 0.3353,
  20781. 0.3084],
  20782. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  20783. 0.4543],
  20784. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  20785. 0.2853],
  20786. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  20787. 0.0236],
  20788. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  20789. 0.2083]]], device='cuda:0')
  20790. loss_train_step before backward: tensor(0.0352, device='cuda:0', grad_fn=<MseLossBackward>)
  20791. loss_train_step after backward: tensor(0.0352, device='cuda:0', grad_fn=<MseLossBackward>)
  20792. loss_train: 0.9743791241198778
  20793. step: 36
  20794. running loss: 0.027066086781107716
  20795.  
  20796. Train Steps: 36/90 Loss: 0.0271 torch.Size([8, 600, 800])
  20797. torch.Size([8, 8])
  20798. tensor([[0.6203, 0.4021, 0.8780, 0.5031, 0.3667, 0.3882, 0.5842, 0.5405],
  20799. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  20800. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  20801. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  20802. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  20803. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  20804. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  20805. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749]],
  20806. device='cuda:0', dtype=torch.float64)
  20807. predictions are: tensor([[ 0.6996, -0.3346, 1.8437, 0.1672, -0.5292, -0.3474, 0.3822, -0.0497],
  20808. [ 0.3493, -0.5383, 1.9132, -0.5951, -0.3706, -0.8605, 0.4897, 0.1431],
  20809. [ 0.2542, -0.6049, 1.8101, -0.1032, -0.4832, -0.2194, 0.4467, 0.1163],
  20810. [-0.0646, -0.8031, 0.9565, -0.8911, -0.5063, -0.8299, 0.2433, 0.3494],
  20811. [ 0.7911, -0.2365, 1.7099, 0.5081, -0.3259, -0.1652, 0.2937, 0.3079],
  20812. [ 0.5108, -0.4289, 1.9848, -0.2359, -0.5005, -0.0401, 0.5715, 0.0395],
  20813. [ 0.3191, -0.5725, 1.0183, -1.2563, -0.4272, -0.9802, 0.4102, 0.2090],
  20814. [ 0.2063, -0.6487, 1.2193, -0.8771, -0.5484, -0.6147, 0.2950, 0.2426]],
  20815. device='cuda:0', grad_fn=<AddmmBackward>)
  20816. landmarks are: tensor([[[ 0.5791, -0.4289, 1.7694, 0.0379, -0.5923, -0.4927, 0.4126,
  20817. 0.2107],
  20818. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  20819. 0.1082],
  20820. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  20821. 0.2314],
  20822. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  20823. 0.4085],
  20824. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  20825. 0.4624],
  20826. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  20827. 0.1390],
  20828. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  20829. 0.2930],
  20830. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  20831. 0.3694]]], device='cuda:0')
  20832. loss_train_step before backward: tensor(0.0252, device='cuda:0', grad_fn=<MseLossBackward>)
  20833. loss_train_step after backward: tensor(0.0252, device='cuda:0', grad_fn=<MseLossBackward>)
  20834. loss_train: 0.9995399247854948
  20835. step: 37
  20836. running loss: 0.02701459256177013
  20837. Train Steps: 37/90 Loss: 0.0270 torch.Size([8, 600, 800])
  20838. torch.Size([8, 8])
  20839. tensor([[0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  20840. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  20841. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  20842. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  20843. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  20844. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  20845. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  20846. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800]],
  20847. device='cuda:0', dtype=torch.float64)
  20848. predictions are: tensor([[ 0.4743, -0.4986, 1.7012, 0.2645, -0.5962, -0.0472, 0.6053, -0.0269],
  20849. [ 0.4422, -0.4338, 1.6112, -0.2641, -0.3141, -0.9310, 0.3228, 0.4357],
  20850. [ 0.4612, -0.4605, 1.7693, -0.4304, -0.6406, -0.4055, 0.3712, 0.1926],
  20851. [ 0.3480, -0.5056, 1.7185, -0.0225, -0.2127, 0.2593, 0.2440, 0.0680],
  20852. [ 0.2740, -0.6009, 1.6386, -0.3549, -0.6436, -0.3869, 0.3592, 0.2311],
  20853. [ 0.6209, -0.3838, 1.4577, -1.1062, -0.4147, -0.9839, 0.5374, 0.0921],
  20854. [ 0.1334, -0.7052, 1.5866, 0.1677, -0.4499, -0.1311, 0.4455, 0.1111],
  20855. [ 0.3481, -0.5082, 1.0693, -1.1434, -0.2080, -1.2564, 0.3309, 0.3095]],
  20856. device='cuda:0', grad_fn=<AddmmBackward>)
  20857. landmarks are: tensor([[[ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  20858. 0.0261],
  20859. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  20860. 0.5822],
  20861. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  20862. 0.1544],
  20863. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  20864. 0.1146],
  20865. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  20866. 0.2853],
  20867. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  20868. 0.1929],
  20869. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  20870. 0.1313],
  20871. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  20872. 0.3931]]], device='cuda:0')
  20873. loss_train_step before backward: tensor(0.0145, device='cuda:0', grad_fn=<MseLossBackward>)
  20874. loss_train_step after backward: tensor(0.0145, device='cuda:0', grad_fn=<MseLossBackward>)
  20875. loss_train: 1.0140107097104192
  20876. step: 38
  20877. running loss: 0.026684492360800505
  20878. Train Steps: 38/90 Loss: 0.0267 torch.Size([8, 600, 800])
  20879. torch.Size([8, 8])
  20880. tensor([[0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  20881. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  20882. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  20883. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  20884. [0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  20885. [ nan, nan, 0.8900, 0.3217, 0.5038, 0.2233, 0.6694, 0.5609],
  20886. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  20887. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967]],
  20888. device='cuda:0', dtype=torch.float64)
  20889. predictions are: tensor([[ 0.8678, -0.2009, 1.2378, -0.9185, -0.5161, -0.8553, 0.4915, 0.3090],
  20890. [ 0.9830, -0.1437, 1.6857, 0.4170, -0.5662, -0.0471, 0.5264, -0.0337],
  20891. [-1.3197, -1.6164, 0.8604, -1.1805, -0.3298, -1.2823, 0.1823, 0.3035],
  20892. [ 0.6939, -0.3165, 1.7800, -0.2526, -0.5378, 0.3783, 0.5597, 0.0969],
  20893. [ 0.5649, -0.3764, 1.3641, -0.9624, -0.5757, -0.6402, 0.3433, 0.2319],
  20894. [-1.4869, -1.6870, 1.6115, -0.8906, -0.0766, -1.0723, 0.6136, 0.3026],
  20895. [ 0.9856, -0.0815, 1.6037, 0.4419, -0.2505, -0.1491, 0.2663, 0.3167],
  20896. [ 0.7317, -0.2633, 1.8326, -0.1786, -0.4594, -0.8693, 0.3603, 0.0575]],
  20897. device='cuda:0', grad_fn=<AddmmBackward>)
  20898. landmarks are: tensor([[[ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  20899. 0.3777],
  20900. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  20901. 0.0261],
  20902. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  20903. 0.3469],
  20904. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  20905. 0.1005],
  20906. [ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  20907. 0.2699],
  20908. [-2.2859, -2.2859, 1.8249, -0.8002, 0.0409, -1.2543, 0.8059,
  20909. 0.3050],
  20910. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  20911. 0.4470],
  20912. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  20913. 0.0081]]], device='cuda:0')
  20914. loss_train_step before backward: tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward>)
  20915. loss_train_step after backward: tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward>)
  20916. loss_train: 1.070364617742598
  20917. step: 39
  20918. running loss: 0.027445246608784564
  20919. Train Steps: 39/90 Loss: 0.0274 torch.Size([8, 600, 800])
  20920. torch.Size([8, 8])
  20921. tensor([[0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  20922. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  20923. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  20924. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  20925. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  20926. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  20927. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  20928. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200]],
  20929. device='cuda:0', dtype=torch.float64)
  20930. predictions are: tensor([[ 0.5133, -0.4663, 1.8136, 0.0464, -0.6048, -0.3059, 0.4851, 0.1031],
  20931. [ 0.8636, -0.1945, 1.7741, -0.3626, -0.4596, -0.9356, 0.1393, 0.1064],
  20932. [-1.3675, -1.6747, 0.9541, -1.3097, -0.3199, -1.3510, 0.3645, 0.2582],
  20933. [ 0.8342, -0.1883, 1.7027, -0.1683, -0.4789, -0.1760, 0.1873, 0.3101],
  20934. [-0.7556, -1.2731, 0.9561, -0.9565, -0.4540, -1.0619, 0.3168, 0.3183],
  20935. [ 0.6719, -0.3621, 1.5153, -0.9662, -0.3847, -0.8820, 0.7084, 0.1236],
  20936. [ 0.8573, -0.1882, 1.5670, 0.4527, -0.3737, 0.0536, 0.4860, 0.3803],
  20937. [ 0.7862, -0.2566, 1.8451, 0.0945, -0.3737, 0.4714, 0.6448, 0.1194]],
  20938. device='cuda:0', grad_fn=<AddmmBackward>)
  20939. landmarks are: tensor([[[ 5.9440e-01, -4.5427e-01, 1.8018e+00, 8.1601e-03, -6.0577e-01,
  20940. -4.3064e-01, 4.1617e-01, 1.0824e-01],
  20941. [ 5.4850e-01, -4.2094e-01, 1.6691e+00, -4.1524e-01, -5.2494e-01,
  20942. -1.1081e+00, 7.2521e-02, 2.0831e-03],
  20943. [-2.2859e+00, -2.2859e+00, 7.2217e-01, -1.4930e+00, -3.9215e-01,
  20944. -1.3698e+00, 1.4038e-01, 1.3434e-01],
  20945. [ 5.5525e-01, -3.9923e-01, 1.7557e+00, -2.6898e-01, -4.9030e-01,
  20946. -2.6898e-01, 5.4227e-02, 4.1446e-01],
  20947. [-2.2859e+00, -2.2859e+00, 9.4385e-01, -9.9666e-01, -4.6143e-01,
  20948. -1.1851e+00, 2.4679e-01, 4.0188e-01],
  20949. [ 6.1248e-01, -4.3453e-01, 1.4308e+00, -1.1384e+00, -4.2133e-01,
  20950. -1.0031e+00, 7.1897e-01, 1.2136e-01],
  20951. [ 6.1339e-01, -3.9099e-01, 1.4497e+00, 3.5458e-01, -3.5173e-01,
  20952. -9.1917e-02, 3.2956e-01, 5.2394e-01],
  20953. [ 5.9902e-01, -4.2556e-01, 1.7499e+00, -3.8029e-02, -3.9792e-01,
  20954. 3.3149e-01, 6.5289e-01, 1.1594e-01]]], device='cuda:0')
  20955. loss_train_step before backward: tensor(0.0867, device='cuda:0', grad_fn=<MseLossBackward>)
  20956. loss_train_step after backward: tensor(0.0867, device='cuda:0', grad_fn=<MseLossBackward>)
  20957. loss_train: 1.1570822978392243
  20958. step: 40
  20959. running loss: 0.02892705744598061
  20960.  
  20961. Train Steps: 40/90 Loss: 0.0289 torch.Size([8, 600, 800])
  20962. torch.Size([8, 8])
  20963. tensor([[0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533],
  20964. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  20965. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  20966. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  20967. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  20968. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  20969. [0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471],
  20970. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398]],
  20971. device='cuda:0', dtype=torch.float64)
  20972. predictions are: tensor([[ 0.6094, -0.3628, 1.5813, 0.1503, -0.3496, -0.1345, 0.4158, 0.2550],
  20973. [ 0.6345, -0.3623, 1.7048, -0.3339, -0.5686, -0.4320, 0.3378, 0.0178],
  20974. [-1.7347, -1.9036, 1.1396, -0.9692, -0.5907, -0.9591, 0.2255, 0.2204],
  20975. [ 0.7350, -0.2342, 1.5293, -0.2934, -0.1893, -1.0755, 0.4044, 0.5002],
  20976. [ 0.5159, -0.4508, 1.6632, -0.3091, -0.3144, 0.0313, 0.3703, 0.1639],
  20977. [ 0.6471, -0.3102, 1.6732, -0.2953, -0.5726, -0.5657, 0.2926, 0.3481],
  20978. [ 0.3940, -0.5209, 1.8598, -0.4337, -0.3804, -0.2356, 0.9161, 0.1679],
  20979. [ 0.8231, -0.2564, 1.5874, 0.1697, -0.5144, -0.3017, 0.5055, 0.0932]],
  20980. device='cuda:0', grad_fn=<AddmmBackward>)
  20981. landmarks are: tensor([[[ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  20982. 0.2699],
  20983. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  20984. 0.0467],
  20985. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  20986. 0.2837],
  20987. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  20988. 0.5822],
  20989. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  20990. 0.2545],
  20991. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  20992. 0.3777],
  20993. [ 0.6454, -0.3623, 1.9346, -0.4460, -0.4961, -0.2921, 1.1642,
  20994. 0.2409],
  20995. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  20996. 0.2075]]], device='cuda:0')
  20997. loss_train_step before backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  20998. loss_train_step after backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  20999. loss_train: 1.175681502558291
  21000. step: 41
  21001. running loss: 0.028675158598982706
  21002. Train Steps: 41/90 Loss: 0.0287 torch.Size([8, 600, 800])
  21003. torch.Size([8, 8])
  21004. tensor([[0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  21005. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  21006. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  21007. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  21008. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  21009. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578],
  21010. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  21011. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200]],
  21012. device='cuda:0', dtype=torch.float64)
  21013. predictions are: tensor([[ 1.0867, -0.0981, 1.1628, -0.9375, -0.2822, -1.2437, 0.4180, 0.2015],
  21014. [ 0.9307, -0.1722, 1.8503, -0.2443, -0.6467, -0.3693, 0.4760, 0.2033],
  21015. [ 0.9050, -0.1645, 1.7764, 0.1137, -0.5736, 0.1382, 0.2548, 0.2371],
  21016. [-1.1627, -1.4897, 1.6139, -0.6616, 0.0053, -0.9658, 0.8065, 0.4578],
  21017. [ 1.1114, -0.1139, 1.6950, 0.5100, -0.6381, -0.2213, 0.4249, 0.0464],
  21018. [-1.7602, -1.8987, 1.0080, -0.9613, -0.5353, -1.0438, 0.1584, 0.2675],
  21019. [-0.5237, -1.0626, 1.4513, -1.0196, 0.0815, -1.1053, 0.7325, 0.3350],
  21020. [ 0.8871, -0.2171, 1.4334, -0.6789, -0.6656, -0.4187, 0.4968, 0.2156]],
  21021. device='cuda:0', grad_fn=<AddmmBackward>)
  21022. landmarks are: tensor([[[ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  21023. 0.2203],
  21024. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  21025. 0.1544],
  21026. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  21027. 0.1775],
  21028. [-2.2859, -2.2859, 1.8192, -0.8540, 0.1448, -0.9849, 1.0143,
  21029. 0.4867],
  21030. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  21031. -0.1278],
  21032. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  21033. 0.2905],
  21034. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  21035. 0.2730],
  21036. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  21037. 0.1159]]], device='cuda:0')
  21038. loss_train_step before backward: tensor(0.1006, device='cuda:0', grad_fn=<MseLossBackward>)
  21039. loss_train_step after backward: tensor(0.1006, device='cuda:0', grad_fn=<MseLossBackward>)
  21040. loss_train: 1.2762999096885324
  21041. step: 42
  21042. running loss: 0.0303880930878222
  21043. Train Steps: 42/90 Loss: 0.0304 torch.Size([8, 600, 800])
  21044. torch.Size([8, 8])
  21045. tensor([[0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  21046. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  21047. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  21048. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  21049. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  21050. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  21051. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  21052. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478]],
  21053. device='cuda:0', dtype=torch.float64)
  21054. predictions are: tensor([[ 0.5861, -0.4517, 1.3542, -0.8687, -0.6011, -0.7119, 0.5024, 0.1682],
  21055. [ 0.7095, -0.3213, 1.5826, -0.2131, -0.7450, -0.2024, 0.2908, 0.2557],
  21056. [ 0.6829, -0.3612, 1.0833, -1.0107, -0.4194, -1.0598, 0.4923, 0.3245],
  21057. [-1.2285, -1.5793, 1.0233, -0.6672, -0.4874, -0.9407, 0.3913, 0.3521],
  21058. [ 0.8831, -0.2063, 1.9609, -0.4306, -0.1119, -0.9870, 0.5996, 0.1698],
  21059. [ 0.6656, -0.3915, 1.3575, -0.8236, -0.2261, -1.1903, 0.6117, 0.1950],
  21060. [-1.9736, -2.0531, 1.1866, -0.7312, -0.4399, -0.9817, 0.2848, 0.2794],
  21061. [ 0.5745, -0.4375, 1.3779, -0.8132, -0.2105, -1.1064, 0.5409, 0.2714]],
  21062. device='cuda:0', grad_fn=<AddmmBackward>)
  21063. landmarks are: tensor([[[ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  21064. 0.0562],
  21065. [ 0.5444, -0.3852, 1.3786, -0.5409, -0.6924, -0.4229, 0.1791,
  21066. 0.2341],
  21067. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  21068. 0.2906],
  21069. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  21070. 0.4019],
  21071. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  21072. 0.0051],
  21073. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  21074. 0.1005],
  21075. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  21076. 0.2853],
  21077. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  21078. 0.2442]]], device='cuda:0')
  21079. loss_train_step before backward: tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward>)
  21080. loss_train_step after backward: tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward>)
  21081. loss_train: 1.3449399406090379
  21082. step: 43
  21083. running loss: 0.03127767303741948
  21084. Train Steps: 43/90 Loss: 0.0313 torch.Size([8, 600, 800])
  21085. torch.Size([8, 8])
  21086. tensor([[0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  21087. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197],
  21088. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  21089. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  21090. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  21091. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  21092. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  21093. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142]],
  21094. device='cuda:0', dtype=torch.float64)
  21095. predictions are: tensor([[ 0.5280, -0.4528, 1.7985, -0.1869, -0.4356, -0.3924, 0.1520, 0.1324],
  21096. [ 0.4553, -0.4516, 1.6858, 0.0901, -0.1598, 0.0426, 0.3004, 0.2708],
  21097. [ 0.6611, -0.3818, 1.6391, 0.0695, -0.3394, -0.2443, 0.2703, 0.2813],
  21098. [ 0.5227, -0.4709, 1.6064, 0.1950, -0.3658, -0.1808, 0.7545, 0.2764],
  21099. [ 0.2876, -0.6182, 1.3079, -1.2030, -0.2005, -1.5260, 0.6327, 0.2942],
  21100. [ 0.4826, -0.5128, 1.6825, -0.7884, -0.6276, -0.8875, 0.7476, 0.1812],
  21101. [ 0.6377, -0.3845, 1.6858, -0.0881, -0.5576, -0.0028, 0.5573, 0.2380],
  21102. [-1.4403, -1.7426, 1.4023, -0.8333, -0.6012, -1.0315, 0.3907, 0.2474]],
  21103. device='cuda:0', grad_fn=<AddmmBackward>)
  21104. landmarks are: tensor([[[ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  21105. -0.0220],
  21106. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  21107. 0.1146],
  21108. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  21109. 0.1854],
  21110. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  21111. 0.0697],
  21112. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  21113. 0.0928],
  21114. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  21115. -0.0220],
  21116. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  21117. 0.0688],
  21118. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  21119. 0.0893]]], device='cuda:0')
  21120. loss_train_step before backward: tensor(0.0320, device='cuda:0', grad_fn=<MseLossBackward>)
  21121. loss_train_step after backward: tensor(0.0320, device='cuda:0', grad_fn=<MseLossBackward>)
  21122. loss_train: 1.3768937001004815
  21123. step: 44
  21124. running loss: 0.031293038638647304
  21125.  
  21126. Train Steps: 44/90 Loss: 0.0313 torch.Size([8, 600, 800])
  21127. torch.Size([8, 8])
  21128. tensor([[ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  21129. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  21130. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  21131. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  21132. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  21133. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  21134. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  21135. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583]],
  21136. device='cuda:0', dtype=torch.float64)
  21137. predictions are: tensor([[-1.9036, -2.0651, 1.5527, -1.0373, 0.3358, -1.2065, 1.1035, 0.3857],
  21138. [ 0.7392, -0.3105, 1.2319, -0.7023, -0.4938, -0.9192, 0.4006, 0.3703],
  21139. [ 0.2073, -0.6865, 1.8889, -0.1462, -0.2306, -1.0921, 0.7502, 0.2691],
  21140. [ 0.3774, -0.5846, 1.7424, -0.3205, -0.6016, -0.1874, 0.4186, -0.0711],
  21141. [ 0.6282, -0.4141, 1.4711, -0.7965, -0.6304, -0.2250, 0.5941, 0.2709],
  21142. [ 0.3742, -0.5652, 1.6887, -0.3577, -0.5015, -0.8006, 0.2380, 0.1651],
  21143. [ 0.6018, -0.4007, 1.6369, 0.0416, -0.4545, -0.3304, 0.0900, 0.1834],
  21144. [ 0.3541, -0.5593, 1.5228, -0.5119, -0.6283, -0.5439, 0.4191, 0.2913]],
  21145. device='cuda:0', grad_fn=<AddmmBackward>)
  21146. landmarks are: tensor([[[-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  21147. 0.5188],
  21148. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  21149. 0.3469],
  21150. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  21151. 0.3692],
  21152. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  21153. -0.0670],
  21154. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  21155. 0.2083],
  21156. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  21157. 0.2203],
  21158. [ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  21159. 0.2657],
  21160. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  21161. 0.2930]]], device='cuda:0')
  21162. loss_train_step before backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  21163. loss_train_step after backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  21164. loss_train: 1.3970262268558145
  21165. step: 45
  21166. running loss: 0.031045027263462543
  21167. Train Steps: 45/90 Loss: 0.0310 torch.Size([8, 600, 800])
  21168. torch.Size([8, 8])
  21169. tensor([[0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  21170. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  21171. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  21172. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  21173. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  21174. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  21175. [ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  21176. [0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471]],
  21177. device='cuda:0', dtype=torch.float64)
  21178. predictions are: tensor([[ 0.7793, -0.3316, 1.8120, -0.0791, -0.2213, -0.0297, 0.2753, 0.1217],
  21179. [ 0.7511, -0.3460, 1.6510, -0.1584, -0.7081, -0.2885, 0.1719, 0.1961],
  21180. [ 0.5894, -0.4178, 1.1553, -0.9393, -0.3990, -1.2565, 0.3335, 0.3389],
  21181. [ 0.9679, -0.2385, 1.2764, -1.0876, -0.6151, -0.9484, 0.3991, 0.2344],
  21182. [ 0.7129, -0.3717, 0.9215, -0.8002, -0.5720, -1.0232, 0.1904, 0.3818],
  21183. [-2.0511, -2.0903, 1.6392, -1.0022, 0.1126, -1.3098, 1.0287, 0.2427],
  21184. [-2.1435, -2.1390, 1.6120, -0.9052, 0.1158, -1.2869, 0.8389, 0.2812],
  21185. [ 0.6420, -0.4414, 1.9973, -0.1654, -0.5391, -0.2443, 0.8296, 0.0792]],
  21186. device='cuda:0', grad_fn=<AddmmBackward>)
  21187. landmarks are: tensor([[[ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  21188. 0.2930],
  21189. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  21190. 0.3267],
  21191. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  21192. 0.2853],
  21193. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  21194. 0.2853],
  21195. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  21196. 0.4085],
  21197. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  21198. 0.2463],
  21199. [-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  21200. 0.3638],
  21201. [ 0.6454, -0.3623, 1.9346, -0.4460, -0.4961, -0.2921, 1.1642,
  21202. 0.2409]]], device='cuda:0')
  21203. loss_train_step before backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  21204. loss_train_step after backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  21205. loss_train: 1.4189534233883023
  21206. step: 46
  21207. running loss: 0.030846813551919615
  21208. Train Steps: 46/90 Loss: 0.0308 torch.Size([8, 600, 800])
  21209. torch.Size([8, 8])
  21210. tensor([[0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  21211. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  21212. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  21213. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  21214. [0.6262, 0.4085, 0.8438, 0.3150, 0.4025, 0.2633, 0.6339, 0.4810],
  21215. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  21216. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167],
  21217. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350]],
  21218. device='cuda:0', dtype=torch.float64)
  21219. predictions are: tensor([[-0.1889, -0.9780, 1.7402, -0.4658, -0.6240, -0.6522, 0.4429, 0.1077],
  21220. [ 0.0686, -0.7909, 1.6863, -0.0267, -0.1338, -0.0739, 0.4993, 0.3025],
  21221. [ 0.1904, -0.7449, 1.7578, -0.1275, -0.4826, -0.2689, 0.4755, 0.1531],
  21222. [ 0.1659, -0.7163, 0.8696, -1.2486, -0.6219, -0.9096, 0.4073, 0.4252],
  21223. [ 0.7232, -0.3879, 1.6732, -1.1300, -0.3453, -1.2824, 0.7050, 0.0514],
  21224. [ 0.3838, -0.5893, 1.7987, -0.0436, -0.2872, 0.2436, 0.6770, 0.2404],
  21225. [ 0.0072, -0.8378, 1.6215, -0.9220, -0.4324, -1.1284, 0.3920, 0.1993],
  21226. [ 0.2877, -0.6304, 1.7888, -0.1657, -0.3686, -1.1141, 0.4204, 0.3036]],
  21227. device='cuda:0', grad_fn=<AddmmBackward>)
  21228. landmarks are: tensor([[[ 5.6692e-01, -4.7937e-01, 1.7499e+00, -3.3826e-01, -6.7506e-01,
  21229. -4.2294e-01, 4.9700e-01, -6.1124e-02],
  21230. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  21231. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  21232. [ 5.7263e-01, -4.7952e-01, 1.7788e+00, -1.4935e-02, -5.7113e-01,
  21233. -6.8822e-02, 5.0277e-01, -5.3426e-02],
  21234. [ 5.6796e-01, -4.0046e-01, 8.0300e-01, -1.0542e+00, -6.2887e-01,
  21235. -7.5396e-01, 3.6998e-01, 3.8537e-01],
  21236. [ 6.0641e-01, -3.9900e-01, 1.6113e+00, -8.3095e-01, -4.2679e-01,
  21237. -1.0696e+00, 6.4212e-01, -6.4044e-02],
  21238. [ 5.9902e-01, -4.2556e-01, 1.7499e+00, -3.8029e-02, -3.9792e-01,
  21239. 3.3149e-01, 6.5289e-01, 1.1594e-01],
  21240. [ 5.4825e-01, -4.2490e-01, 1.5305e+00, -7.3857e-01, -6.1155e-01,
  21241. -8.6944e-01, 3.3533e-01, 1.0054e-01],
  21242. [ 5.9007e-01, -4.0000e-01, 1.8423e+00, -6.8822e-02, -5.3072e-01,
  21243. -9.2333e-01, 3.6420e-01, 1.8522e-01]]], device='cuda:0')
  21244. loss_train_step before backward: tensor(0.0493, device='cuda:0', grad_fn=<MseLossBackward>)
  21245. loss_train_step after backward: tensor(0.0493, device='cuda:0', grad_fn=<MseLossBackward>)
  21246. loss_train: 1.4682444604113698
  21247. step: 47
  21248. running loss: 0.031239243838539783
  21249. Train Steps: 47/90 Loss: 0.0312 torch.Size([8, 600, 800])
  21250. torch.Size([8, 8])
  21251. tensor([[0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  21252. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  21253. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  21254. [0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  21255. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  21256. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  21257. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  21258. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317]],
  21259. device='cuda:0', dtype=torch.float64)
  21260. predictions are: tensor([[ 0.8121, -0.2857, 1.8553, -0.0534, -0.1376, 0.1054, 0.5305, 0.2714],
  21261. [-2.7636, -2.6309, 1.3694, -0.9074, -0.3612, -1.1750, 0.5475, 0.2775],
  21262. [ 0.6600, -0.4128, 1.1770, -1.2402, -0.3847, -1.2091, 0.5563, 0.2726],
  21263. [ 0.4320, -0.4988, 1.7527, -0.0355, -0.5599, -0.0758, 0.2460, 0.2057],
  21264. [ 0.6434, -0.4167, 1.8805, 0.2187, -0.4504, 0.0262, 0.4597, 0.1198],
  21265. [ 0.0658, -0.7735, 0.9937, -1.2910, -0.3749, -1.4518, 0.4108, 0.1898],
  21266. [ 0.5898, -0.4576, 1.5912, -1.0806, -0.4569, -1.1443, 0.6867, 0.0462],
  21267. [-0.1678, -0.9171, 1.3631, -1.1337, -0.2762, -1.3283, 0.5493, 0.2750]],
  21268. device='cuda:0', grad_fn=<AddmmBackward>)
  21269. landmarks are: tensor([[[ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  21270. 0.3007],
  21271. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  21272. 0.3315],
  21273. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  21274. 0.2468],
  21275. [ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  21276. 0.2296],
  21277. [ 0.5828, -0.4066, 1.7557, 0.0774, -0.3691, -0.0226, 0.4277,
  21278. 0.1005],
  21279. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  21280. 0.1013],
  21281. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  21282. -0.0220],
  21283. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  21284. 0.1698]]], device='cuda:0')
  21285. loss_train_step before backward: tensor(0.0356, device='cuda:0', grad_fn=<MseLossBackward>)
  21286. loss_train_step after backward: tensor(0.0356, device='cuda:0', grad_fn=<MseLossBackward>)
  21287. loss_train: 1.5038310894742608
  21288. step: 48
  21289. running loss: 0.0313298143640471
  21290.  
  21291. Train Steps: 48/90 Loss: 0.0313 torch.Size([8, 600, 800])
  21292. torch.Size([8, 8])
  21293. tensor([[0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  21294. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  21295. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  21296. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  21297. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  21298. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  21299. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  21300. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993]],
  21301. device='cuda:0', dtype=torch.float64)
  21302. predictions are: tensor([[ 0.2730, -0.6282, 1.9380, -0.1759, -0.0889, 0.0257, 0.2360, 0.1262],
  21303. [ 0.5148, -0.5094, 1.9247, -0.4342, -0.5837, -0.4938, 0.5429, 0.0917],
  21304. [ 0.3095, -0.6562, 1.8017, 0.1408, -0.6035, -0.1369, 0.7252, 0.1669],
  21305. [-0.0043, -0.8408, 1.0899, -1.4017, -0.2449, -1.5586, 0.4209, 0.3265],
  21306. [ 0.3186, -0.6128, 1.1535, -1.3408, -0.5048, -1.0129, 0.7331, 0.4692],
  21307. [ 0.0875, -0.7587, 1.8255, 0.1383, -0.4714, -0.2924, 0.2298, 0.1498],
  21308. [-0.2003, -0.9530, 1.7477, 0.2234, -0.5687, -0.0849, 0.5988, 0.1860],
  21309. [ 0.1707, -0.7150, 1.1711, -1.5067, -0.3215, -1.4711, 0.4139, 0.1151]],
  21310. device='cuda:0', grad_fn=<AddmmBackward>)
  21311. landmarks are: tensor([[[ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  21312. 0.0682],
  21313. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  21314. 0.0467],
  21315. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  21316. 0.0261],
  21317. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  21318. 0.2699],
  21319. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  21320. 0.3700],
  21321. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  21322. -0.0370],
  21323. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  21324. -0.1331],
  21325. [ 0.5384, -0.4393, 0.9762, -1.1851, -0.4210, -1.3852, 0.1712,
  21326. 0.0201]]], device='cuda:0')
  21327. loss_train_step before backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  21328. loss_train_step after backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  21329. loss_train: 1.5566692175343633
  21330. step: 49
  21331. running loss: 0.031768759541517616
  21332. Train Steps: 49/90 Loss: 0.0318 torch.Size([8, 600, 800])
  21333. torch.Size([8, 8])
  21334. tensor([[0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  21335. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240],
  21336. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  21337. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  21338. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  21339. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  21340. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841],
  21341. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196]],
  21342. device='cuda:0', dtype=torch.float64)
  21343. predictions are: tensor([[ 0.3308, -0.5791, 1.6990, -0.1509, -0.1670, 0.1825, 0.3153, 0.1267],
  21344. [ 0.4098, -0.5453, 1.5226, -1.3711, -0.0952, -1.5752, 0.6124, 0.0944],
  21345. [ 0.1309, -0.7259, 1.6941, -0.4025, -0.3071, 0.3146, 0.4373, 0.1410],
  21346. [ 0.5440, -0.4765, 1.5739, -0.0572, -0.5781, -0.0772, 0.4984, 0.0258],
  21347. [ 0.1205, -0.6980, 1.2362, -0.9301, -0.7810, -0.5665, 0.1186, 0.2302],
  21348. [-1.3172, -1.6646, 1.9684, -0.6178, -0.2131, -1.3039, 0.8897, 0.1631],
  21349. [ 0.5473, -0.4987, 1.7234, -0.6042, -0.4938, -0.6665, 0.9100, 0.1871],
  21350. [ 0.4775, -0.4528, 1.5372, -0.2494, -0.4017, -0.9764, 0.2984, 0.4618]],
  21351. device='cuda:0', grad_fn=<AddmmBackward>)
  21352. landmarks are: tensor([[[ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  21353. 0.0592],
  21354. [ 0.6088, -0.4015, 1.6113, -1.0696, -0.0861, -1.4545, 0.6051,
  21355. 0.1343],
  21356. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  21357. 0.2006],
  21358. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  21359. 0.0697],
  21360. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  21361. 0.3417],
  21362. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  21363. 0.2890],
  21364. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  21365. 0.4119],
  21366. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  21367. 0.5762]]], device='cuda:0')
  21368. loss_train_step before backward: tensor(0.0497, device='cuda:0', grad_fn=<MseLossBackward>)
  21369. loss_train_step after backward: tensor(0.0497, device='cuda:0', grad_fn=<MseLossBackward>)
  21370. loss_train: 1.6064054938033223
  21371. step: 50
  21372. running loss: 0.032128109876066444
  21373. Train Steps: 50/90 Loss: 0.0321 torch.Size([8, 600, 800])
  21374. torch.Size([8, 8])
  21375. tensor([[0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  21376. [0.6277, 0.4013, 0.8888, 0.4767, 0.3600, 0.3567, 0.6148, 0.4672],
  21377. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388],
  21378. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  21379. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  21380. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  21381. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  21382. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617]],
  21383. device='cuda:0', dtype=torch.float64)
  21384. predictions are: tensor([[ 0.4499, -0.5199, 1.6845, -0.3348, -0.3485, 0.1269, 0.3157, 0.2084],
  21385. [ 0.6747, -0.3542, 1.6891, -0.3486, -0.6206, -0.6618, 0.4907, 0.0787],
  21386. [ 0.6204, -0.3971, 1.6820, -0.0836, -0.0091, -0.0460, 0.1695, 0.1800],
  21387. [ 0.6887, -0.3090, 1.6003, -0.6434, -0.4770, -1.1085, 0.1139, 0.1487],
  21388. [ 0.4262, -0.4737, 1.1590, -1.4543, -0.3002, -1.2801, 0.6216, 0.1746],
  21389. [ 0.4292, -0.5376, 1.8991, -0.2834, -0.4674, -0.6994, 0.8851, 0.1040],
  21390. [ 0.4682, -0.5118, 1.7642, -0.4536, -0.5753, 0.2361, 0.9281, 0.1673],
  21391. [-2.8165, -2.6293, 1.1189, -1.1107, -0.3079, -1.3337, 0.3717, 0.2679]],
  21392. device='cuda:0', grad_fn=<AddmmBackward>)
  21393. landmarks are: tensor([[[ 5.6039e-01, -4.6197e-01, 1.7961e+00, -1.9969e-01, -3.2286e-01,
  21394. 1.0824e-01, 4.1039e-01, 2.5450e-01],
  21395. [ 6.1322e-01, -4.3241e-01, 1.8192e+00, -8.4219e-02, -6.2309e-01,
  21396. -6.3849e-01, 5.5366e-01, -1.2778e-01],
  21397. [ 5.3095e-01, -4.2456e-01, 1.7037e+00, 7.7444e-02, 1.5763e-02,
  21398. 7.5237e-03, 6.3480e-02, 2.0256e-01],
  21399. [ 5.4850e-01, -4.2094e-01, 1.6691e+00, -4.1524e-01, -5.2494e-01,
  21400. -1.1081e+00, 7.2521e-02, 2.0831e-03],
  21401. [ 6.1248e-01, -4.2731e-01, 1.2807e+00, -1.3253e+00, -2.5737e-01,
  21402. -1.2542e+00, 6.8644e-01, 1.5750e-01],
  21403. [ 6.2730e-01, -4.2490e-01, 1.8654e+00, -6.1124e-02, -4.6721e-01,
  21404. -6.6928e-01, 1.0910e+00, 1.9818e-01],
  21405. [ 6.0095e-01, -4.4175e-01, 1.9346e+00, -2.8437e-01, -5.4804e-01,
  21406. 1.2363e-01, 9.4481e-01, 1.7146e-01],
  21407. [-2.2859e+00, -2.2859e+00, 1.1841e+00, -1.3082e+00, -3.0554e-01,
  21408. -1.3621e+00, 3.0069e-01, 3.0839e-01]]], device='cuda:0')
  21409. loss_train_step before backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  21410. loss_train_step after backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  21411. loss_train: 1.6242366721853614
  21412. step: 51
  21413. running loss: 0.03184777788598748
  21414. Train Steps: 51/90 Loss: 0.0318 torch.Size([8, 600, 800])
  21415. torch.Size([8, 8])
  21416. tensor([[ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  21417. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  21418. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  21419. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  21420. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  21421. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  21422. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  21423. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383]],
  21424. device='cuda:0', dtype=torch.float64)
  21425. predictions are: tensor([[-1.2281, -1.5360, 1.2552, -0.9789, -0.3538, -0.9091, 0.2718, 0.2497],
  21426. [ 1.1770, 0.0143, 1.8093, -0.5852, -0.1964, -1.1055, 0.6296, 0.0711],
  21427. [ 1.0187, -0.1383, 1.4644, -1.1879, -0.4770, -0.8713, 0.7727, -0.0471],
  21428. [ 1.4524, 0.1545, 1.5627, -0.7437, -0.6868, -0.2045, 0.5216, 0.1345],
  21429. [ 1.1354, -0.0355, 1.5601, 0.3532, -0.4657, -0.0231, 0.3850, 0.3366],
  21430. [-2.4087, -2.3484, 1.7172, -1.0239, 0.0941, -1.0496, 0.9831, 0.2392],
  21431. [ 0.8638, -0.1748, 1.5705, -0.4505, -0.6372, -0.3944, 0.0331, 0.1580],
  21432. [-1.9988, -2.0419, 0.9688, -1.1190, -0.3952, -1.2128, 0.0812, 0.2310]],
  21433. device='cuda:0', grad_fn=<AddmmBackward>)
  21434. landmarks are: tensor([[[-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  21435. 0.3007],
  21436. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  21437. 0.0171],
  21438. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  21439. -0.0220],
  21440. [ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  21441. 0.2930],
  21442. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  21443. 0.4624],
  21444. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  21445. 0.2783],
  21446. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  21447. 0.2567],
  21448. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  21449. 0.2006]]], device='cuda:0')
  21450. loss_train_step before backward: tensor(0.0748, device='cuda:0', grad_fn=<MseLossBackward>)
  21451. loss_train_step after backward: tensor(0.0748, device='cuda:0', grad_fn=<MseLossBackward>)
  21452. loss_train: 1.6990172257646918
  21453. step: 52
  21454. running loss: 0.032673408187782534
  21455.  
  21456. Train Steps: 52/90 Loss: 0.0327 torch.Size([8, 600, 800])
  21457. torch.Size([8, 8])
  21458. tensor([[0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  21459. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  21460. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767],
  21461. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  21462. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  21463. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  21464. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  21465. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563]],
  21466. device='cuda:0', dtype=torch.float64)
  21467. predictions are: tensor([[-0.1634, -0.8578, 1.6840, -0.5581, -0.5848, -0.7154, 0.0890, 0.1144],
  21468. [ 0.4708, -0.4999, 1.8414, -0.1520, -0.0150, -0.1076, 0.5225, 0.1580],
  21469. [ 0.2425, -0.6167, 1.7604, -0.0780, -0.2799, 0.0465, 0.4614, 0.2296],
  21470. [ 0.4320, -0.5397, 1.8275, -0.0124, -0.2925, 0.0979, 0.6848, 0.0197],
  21471. [ 0.1199, -0.6968, 1.9107, -0.3066, -0.4233, -0.0754, 0.6837, 0.0897],
  21472. [ 0.6303, -0.3232, 1.3665, -0.7849, -0.5192, -0.9144, 0.5360, 0.3355],
  21473. [ 0.5060, -0.4484, 1.1837, -1.1058, -0.6574, -0.7888, 0.4394, 0.1935],
  21474. [-0.2262, -0.9020, 1.6467, -0.6310, -0.5496, -0.9648, 0.1842, 0.1176]],
  21475. device='cuda:0', grad_fn=<AddmmBackward>)
  21476. landmarks are: tensor([[[ 5.4331e-01, -4.0323e-01, 1.6344e+00, -4.9222e-01, -5.7691e-01,
  21477. -5.8460e-01, 3.5720e-02, 2.5666e-01],
  21478. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  21479. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  21480. [ 5.5393e-01, -4.0308e-01, 1.7168e+00, -5.9398e-02, -3.7483e-01,
  21481. 5.4350e-02, 1.3903e-01, 3.7768e-01],
  21482. [ 5.6680e-01, -4.3056e-01, 1.7730e+00, 6.9746e-02, -4.0370e-01,
  21483. 1.3903e-01, 4.4503e-01, 3.8953e-02],
  21484. [ 6.0035e-01, -3.7467e-01, 1.8885e+00, -1.9969e-01, -5.0185e-01,
  21485. -1.4935e-02, 5.4896e-01, 1.7752e-01],
  21486. [ 5.8320e-01, -3.5928e-01, 1.3515e+00, -6.0770e-01, -5.2494e-01,
  21487. -9.3102e-01, 3.3533e-01, 3.4688e-01],
  21488. [ 5.4186e-01, -4.1601e-01, 1.1810e+00, -8.9394e-01, -6.8083e-01,
  21489. -7.4627e-01, 2.4855e-01, 3.6938e-01],
  21490. [ 5.5606e-01, -3.8337e-01, 1.6229e+00, -5.1532e-01, -6.2309e-01,
  21491. -8.0785e-01, 7.2734e-02, 2.8371e-01]]], device='cuda:0')
  21492. loss_train_step before backward: tensor(0.0443, device='cuda:0', grad_fn=<MseLossBackward>)
  21493. loss_train_step after backward: tensor(0.0443, device='cuda:0', grad_fn=<MseLossBackward>)
  21494. loss_train: 1.7433188473805785
  21495. step: 53
  21496. running loss: 0.03289280844114299
  21497. Train Steps: 53/90 Loss: 0.0329 torch.Size([8, 600, 800])
  21498. torch.Size([8, 8])
  21499. tensor([[0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  21500. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  21501. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  21502. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  21503. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  21504. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  21505. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  21506. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320]],
  21507. device='cuda:0', dtype=torch.float64)
  21508. predictions are: tensor([[ 0.4969, -0.4439, 1.6245, -0.3381, -0.5079, -0.0939, 0.2119, 0.2477],
  21509. [-0.6186, -1.1474, 1.1579, -1.4484, -0.2859, -1.4703, 0.1573, 0.1548],
  21510. [ 0.0448, -0.7621, 1.7929, 0.1244, -0.4749, -0.2750, 0.8188, 0.1702],
  21511. [ 0.3577, -0.5050, 1.1513, -1.2380, -0.5836, -0.7809, 0.4390, 0.2825],
  21512. [ 0.5176, -0.4453, 1.7902, -0.0143, -0.4640, -0.1327, 0.1576, 0.1083],
  21513. [ 0.6601, -0.3388, 1.9378, -0.6587, -0.2862, -1.3708, 0.4818, 0.0354],
  21514. [-0.0375, -0.7674, 1.7133, 0.1232, -0.3605, -0.0799, 0.3183, 0.2255],
  21515. [ 0.5661, -0.4524, 1.9309, -0.3699, -0.4641, 0.2918, 1.0282, 0.1330]],
  21516. device='cuda:0', grad_fn=<AddmmBackward>)
  21517. landmarks are: tensor([[[ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  21518. 0.3265],
  21519. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  21520. 0.1343],
  21521. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  21522. 0.2516],
  21523. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  21524. 0.3007],
  21525. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  21526. 0.1854],
  21527. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  21528. -0.0529],
  21529. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  21530. 0.2391],
  21531. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  21532. 0.1715]]], device='cuda:0')
  21533. loss_train_step before backward: tensor(0.0540, device='cuda:0', grad_fn=<MseLossBackward>)
  21534. loss_train_step after backward: tensor(0.0540, device='cuda:0', grad_fn=<MseLossBackward>)
  21535. loss_train: 1.7973417667672038
  21536. step: 54
  21537. running loss: 0.033284106791985256
  21538. Train Steps: 54/90 Loss: 0.0333 torch.Size([8, 600, 800])
  21539. torch.Size([8, 8])
  21540. tensor([[0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  21541. [0.6289, 0.4024, 0.9088, 0.4567, 0.3937, 0.5633, 0.7058, 0.5609],
  21542. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  21543. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  21544. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  21545. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  21546. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  21547. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600]],
  21548. device='cuda:0', dtype=torch.float64)
  21549. predictions are: tensor([[ 0.6193, -0.2979, 1.2371, -1.2785, -0.4778, -0.9031, 0.4626, 0.2020],
  21550. [ 0.6740, -0.3263, 1.8320, -0.1743, -0.3139, 0.2781, 0.8246, 0.2859],
  21551. [ 0.3821, -0.4890, 1.8163, -0.2113, -0.3938, -0.2797, 0.0329, 0.0312],
  21552. [ 0.8386, -0.1654, 1.7004, -0.5014, -0.6979, -0.4120, 0.3056, 0.0958],
  21553. [ 0.6805, -0.3059, 1.7077, 0.1778, -0.4999, -0.0904, 0.5120, 0.1148],
  21554. [ 0.6076, -0.3326, 1.9301, -0.3129, -0.4152, -0.5163, 0.7245, 0.2601],
  21555. [ 0.6592, -0.3361, 1.6481, 0.1911, -0.3928, -0.1796, 0.3788, 0.1469],
  21556. [-2.6177, -2.5506, 1.3313, -1.1060, -0.2942, -1.1176, 0.2407, 0.2369]],
  21557. device='cuda:0', grad_fn=<AddmmBackward>)
  21558. landmarks are: tensor([[[ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  21559. 0.1621],
  21560. [ 0.6191, -0.4273, 1.9115, -0.1766, -0.4672, 0.3161, 0.9741,
  21561. 0.3050],
  21562. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  21563. -0.0220],
  21564. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  21565. 0.0236],
  21566. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  21567. 0.0851],
  21568. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  21569. 0.2676],
  21570. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  21571. 0.1979],
  21572. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  21573. 0.3007]]], device='cuda:0')
  21574. loss_train_step before backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  21575. loss_train_step after backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  21576. loss_train: 1.8091550571843982
  21577. step: 55
  21578. running loss: 0.0328937283124436
  21579. Train Steps: 55/90 Loss: 0.0329 torch.Size([8, 600, 800])
  21580. torch.Size([8, 8])
  21581. tensor([[0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  21582. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  21583. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  21584. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  21585. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  21586. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  21587. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  21588. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567]],
  21589. device='cuda:0', dtype=torch.float64)
  21590. predictions are: tensor([[ 0.1492, -0.6670, 1.5802, 0.2910, -0.4135, 0.0303, 0.4409, 0.4137],
  21591. [ 0.0904, -0.6878, 1.2486, -1.1853, -0.5766, -0.7854, 0.4236, 0.2221],
  21592. [ 0.7112, -0.3543, 1.6138, -1.0944, -0.4004, -1.0451, 0.4618, -0.0073],
  21593. [ 0.6569, -0.3063, 1.7665, -0.0456, -0.6110, -0.5325, 0.3404, 0.3160],
  21594. [ 0.0950, -0.7382, 1.8449, 0.1953, -0.5241, -0.2591, 0.8265, 0.0738],
  21595. [ 0.1203, -0.6797, 1.9646, -0.3627, -0.5742, -0.3932, 0.5246, 0.2486],
  21596. [ 0.3048, -0.5792, 1.8250, -0.0522, -0.2013, 0.0844, 0.1208, 0.0362],
  21597. [ 0.4090, -0.4900, 1.2181, -1.1421, -0.3401, -1.0661, 0.3066, 0.2915]],
  21598. device='cuda:0', grad_fn=<AddmmBackward>)
  21599. landmarks are: tensor([[[ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  21600. 0.5393],
  21601. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  21602. 0.3007],
  21603. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  21604. 0.0807],
  21605. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  21606. 0.3161],
  21607. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  21608. 0.2516],
  21609. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  21610. 0.3238],
  21611. [ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  21612. 0.2228],
  21613. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  21614. 0.2853]]], device='cuda:0')
  21615. loss_train_step before backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  21616. loss_train_step after backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  21617. loss_train: 1.837601481936872
  21618. step: 56
  21619. running loss: 0.03281431217744414
  21620.  
  21621. Train Steps: 56/90 Loss: 0.0328 torch.Size([8, 600, 800])
  21622. torch.Size([8, 8])
  21623. tensor([[0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  21624. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  21625. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  21626. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  21627. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  21628. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  21629. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  21630. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846]],
  21631. device='cuda:0', dtype=torch.float64)
  21632. predictions are: tensor([[ 1.2243e-01, -7.1268e-01, 1.8774e+00, 6.4187e-02, -6.6555e-01,
  21633. 2.1508e-01, 6.6481e-01, 2.6001e-01],
  21634. [ 1.7363e-01, -6.6750e-01, 1.9018e+00, -4.6164e-02, -6.1875e-01,
  21635. 1.2968e-02, 3.6536e-01, 1.5884e-01],
  21636. [ 9.2766e-02, -7.3770e-01, 1.7641e+00, -1.0756e+00, 6.6186e-02,
  21637. -1.2018e+00, 9.7435e-01, 1.6731e-01],
  21638. [ 8.2140e-01, -2.5627e-01, 1.3991e+00, -1.0600e+00, -3.0525e-01,
  21639. -1.0604e+00, 4.5021e-01, 1.6918e-01],
  21640. [ 1.3324e-01, -6.6895e-01, 9.5730e-01, -1.1570e+00, -5.2132e-01,
  21641. -1.1929e+00, 1.6117e-03, 1.6140e-01],
  21642. [ 2.9194e-01, -5.9492e-01, 1.3999e+00, -1.0445e+00, -2.3796e-01,
  21643. -1.2431e+00, 3.2231e-01, 5.8498e-02],
  21644. [ 3.9386e-01, -4.8484e-01, 1.6187e+00, 4.3420e-01, -6.6633e-01,
  21645. -2.1455e-01, 3.6329e-01, 4.0566e-01],
  21646. [ 4.8454e-01, -4.5625e-01, 1.7858e+00, -7.6451e-02, -6.4586e-01,
  21647. 6.5811e-02, 2.6243e-01, 2.7170e-01]], device='cuda:0',
  21648. grad_fn=<AddmmBackward>)
  21649. landmarks are: tensor([[[ 0.5763, -0.3963, 1.7788, -0.0765, -0.6520, -0.0842, 0.4624,
  21650. 0.2776],
  21651. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  21652. 0.3087],
  21653. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  21654. 0.2944],
  21655. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  21656. 0.1850],
  21657. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  21658. 0.2071],
  21659. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  21660. -0.0168],
  21661. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  21662. 0.4778],
  21663. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  21664. 0.4145]]], device='cuda:0')
  21665. loss_train_step before backward: tensor(0.0451, device='cuda:0', grad_fn=<MseLossBackward>)
  21666. loss_train_step after backward: tensor(0.0451, device='cuda:0', grad_fn=<MseLossBackward>)
  21667. loss_train: 1.8827112754806876
  21668. step: 57
  21669. running loss: 0.03303002237685417
  21670. Train Steps: 57/90 Loss: 0.0330 torch.Size([8, 600, 800])
  21671. torch.Size([8, 8])
  21672. tensor([[0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  21673. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  21674. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  21675. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  21676. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  21677. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  21678. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  21679. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148]],
  21680. device='cuda:0', dtype=torch.float64)
  21681. predictions are: tensor([[ 1.0962, -0.0636, 1.3366, -0.8499, -0.5666, -0.6745, 0.4527, 0.2407],
  21682. [ 0.5959, -0.3922, 1.8984, 0.1088, -0.5427, 0.2683, 0.5982, 0.1676],
  21683. [ 1.0458, -0.0688, 1.2324, -0.9085, -0.1895, -1.3337, 0.2850, 0.2403],
  21684. [-1.5538, -1.7963, 1.3983, -0.8904, -0.4080, -0.8523, 0.2596, 0.2820],
  21685. [ 0.7834, -0.1845, 1.3360, -0.7645, -0.3736, -1.0244, 0.2668, 0.2252],
  21686. [ 1.0495, -0.0705, 2.0186, 0.0522, -0.6195, -0.0223, 0.7219, 0.1308],
  21687. [-2.0917, -2.1628, 1.0026, -1.2713, -0.3786, -1.3109, 0.1309, 0.2826],
  21688. [ 0.8242, -0.2368, 1.9117, 0.2111, -0.6423, -0.1351, 0.4206, 0.0966]],
  21689. device='cuda:0', grad_fn=<AddmmBackward>)
  21690. landmarks are: tensor([[[ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  21691. 0.2853],
  21692. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  21693. 0.1929],
  21694. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  21695. 0.2006],
  21696. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  21697. 0.3007],
  21698. [ 0.5911, -0.4080, 1.2303, -0.9156, -0.3229, -1.2851, 0.4508,
  21699. 0.1852],
  21700. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  21701. 0.1390],
  21702. [-2.2859, -2.2859, 0.7222, -1.4930, -0.3921, -1.3698, 0.1404,
  21703. 0.1343],
  21704. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  21705. 0.0919]]], device='cuda:0')
  21706. loss_train_step before backward: tensor(0.0496, device='cuda:0', grad_fn=<MseLossBackward>)
  21707. loss_train_step after backward: tensor(0.0496, device='cuda:0', grad_fn=<MseLossBackward>)
  21708. loss_train: 1.932359985075891
  21709. step: 58
  21710. running loss: 0.03331655146682571
  21711. Train Steps: 58/90 Loss: 0.0333 torch.Size([8, 600, 800])
  21712. torch.Size([8, 8])
  21713. tensor([[0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  21714. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  21715. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  21716. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  21717. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  21718. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  21719. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  21720. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155]],
  21721. device='cuda:0', dtype=torch.float64)
  21722. predictions are: tensor([[ 0.3482, -0.5847, 1.6769, -0.4344, -0.6912, -0.1510, 0.5420, 0.2736],
  21723. [ 0.4134, -0.4870, 1.6019, -0.5267, -0.6652, -0.7825, 0.3372, 0.1593],
  21724. [ 0.5419, -0.4151, 1.6395, -0.1511, -0.5665, -0.2487, 0.1434, 0.2999],
  21725. [ 0.0570, -0.7853, 1.8228, -0.4909, -0.6013, -0.4838, 0.6780, 0.1995],
  21726. [ 0.5814, -0.4066, 1.7251, -0.4970, -0.4215, -1.3153, 0.4057, 0.0920],
  21727. [ 0.6046, -0.3934, 1.6968, -0.0545, -0.2929, 0.4666, 0.5360, 0.3136],
  21728. [ 0.5320, -0.4514, 1.5537, 0.1591, -0.1326, 0.0026, 0.1167, 0.3526],
  21729. [ 0.3389, -0.5410, 1.5506, -0.9298, -0.3028, -1.3098, 0.5715, 0.1343]],
  21730. device='cuda:0', grad_fn=<AddmmBackward>)
  21731. landmarks are: tensor([[[ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  21732. 0.2083],
  21733. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  21734. 0.1963],
  21735. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  21736. 0.3087],
  21737. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  21738. 0.1544],
  21739. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  21740. -0.0529],
  21741. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  21742. 0.0928],
  21743. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  21744. 0.2237],
  21745. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  21746. 0.0953]]], device='cuda:0')
  21747. loss_train_step before backward: tensor(0.0151, device='cuda:0', grad_fn=<MseLossBackward>)
  21748. loss_train_step after backward: tensor(0.0151, device='cuda:0', grad_fn=<MseLossBackward>)
  21749. loss_train: 1.9474248168990016
  21750. step: 59
  21751. running loss: 0.03300720028642375
  21752. Train Steps: 59/90 Loss: 0.0330 torch.Size([8, 600, 800])
  21753. torch.Size([8, 8])
  21754. tensor([[0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  21755. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  21756. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  21757. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  21758. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  21759. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  21760. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  21761. [0.6090, 0.4045, 0.7250, 0.2100, 0.4075, 0.2300, 0.5476, 0.5663]],
  21762. device='cuda:0', dtype=torch.float64)
  21763. predictions are: tensor([[ 0.3817, -0.5736, 1.9059, -0.1225, -0.4497, -0.2011, 0.2088, 0.1125],
  21764. [ 0.9177, -0.2117, 1.3480, -0.8393, -0.3956, -0.8119, 0.5936, 0.5077],
  21765. [ 0.4320, -0.5735, 1.8279, 0.1515, -0.3319, -0.0194, 0.5533, 0.1154],
  21766. [ 0.4054, -0.5492, 1.9774, 0.1779, -0.5931, -0.5311, 0.6125, 0.0498],
  21767. [ 0.6835, -0.3405, 0.9233, -0.8949, -0.5273, -0.9222, 0.1870, 0.4747],
  21768. [ 0.4931, -0.4520, 1.6901, -0.4726, -0.6711, -0.3948, 0.3562, 0.0879],
  21769. [ 0.4073, -0.5244, 1.8318, -0.3861, -0.5785, -0.7754, 0.4366, 0.1827],
  21770. [-0.1445, -0.8772, 1.1068, -1.2608, -0.4086, -1.1984, 0.1743, 0.3005]],
  21771. device='cuda:0', grad_fn=<AddmmBackward>)
  21772. landmarks are: tensor([[[ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  21773. -0.0220],
  21774. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  21775. 0.5701],
  21776. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  21777. 0.0159],
  21778. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  21779. -0.0049],
  21780. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  21781. 0.4085],
  21782. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  21783. 0.0021],
  21784. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  21785. 0.1005],
  21786. [ 0.5269, -0.4176, 1.0628, -1.3159, -0.4037, -1.2236, 0.2432,
  21787. 0.3297]]], device='cuda:0')
  21788. loss_train_step before backward: tensor(0.0221, device='cuda:0', grad_fn=<MseLossBackward>)
  21789. loss_train_step after backward: tensor(0.0221, device='cuda:0', grad_fn=<MseLossBackward>)
  21790. loss_train: 1.969504582695663
  21791. step: 60
  21792. running loss: 0.03282507637826105
  21793.  
  21794. Train Steps: 60/90 Loss: 0.0328 torch.Size([8, 600, 800])
  21795. torch.Size([8, 8])
  21796. tensor([[0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  21797. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  21798. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  21799. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  21800. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  21801. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  21802. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  21803. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000]],
  21804. device='cuda:0', dtype=torch.float64)
  21805. predictions are: tensor([[ 0.7551, -0.2848, 1.7650, 0.1631, -0.5179, -0.3995, 0.1350, 0.3288],
  21806. [ 0.6782, -0.3846, 1.5860, -1.0260, -0.3997, -1.1093, 0.5274, 0.0610],
  21807. [ 0.6320, -0.3760, 1.7877, -0.3926, -0.4922, -0.0774, 0.3800, 0.2165],
  21808. [-1.5177, -1.8227, 1.0843, -1.3910, -0.4651, -1.3811, 0.1120, 0.2572],
  21809. [ 0.8237, -0.2159, 1.7595, 0.2419, -0.5153, -0.2390, 0.3561, 0.3817],
  21810. [ 0.8449, -0.2290, 1.5374, 0.1570, -0.4488, -0.2010, 0.8125, 0.3838],
  21811. [ 0.3734, -0.5396, 1.2457, -1.0386, -0.6445, -0.7832, 0.1265, 0.0847],
  21812. [ 0.8764, -0.2458, 1.8436, 0.1623, -0.4635, -0.0212, 0.6347, 0.1237]],
  21813. device='cuda:0', grad_fn=<AddmmBackward>)
  21814. landmarks are: tensor([[[ 0.5452, -0.4067, 1.7557, 0.0543, -0.4961, -0.3306, 0.1323,
  21815. 0.4306],
  21816. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  21817. 0.0807],
  21818. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  21819. 0.2468],
  21820. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  21821. 0.3238],
  21822. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  21823. 0.3161],
  21824. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  21825. 0.3478],
  21826. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  21827. 0.0442],
  21828. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  21829. 0.0236]]], device='cuda:0')
  21830. loss_train_step before backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  21831. loss_train_step after backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  21832. loss_train: 1.9937451435253024
  21833. step: 61
  21834. running loss: 0.03268434661516889
  21835. Train Steps: 61/90 Loss: 0.0327 torch.Size([8, 600, 800])
  21836. torch.Size([8, 8])
  21837. tensor([[0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  21838. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  21839. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  21840. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  21841. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  21842. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  21843. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  21844. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280]],
  21845. device='cuda:0', dtype=torch.float64)
  21846. predictions are: tensor([[ 0.3201, -0.6410, 1.7896, -0.1694, -0.4898, 0.0609, 0.4582, 0.2323],
  21847. [ 0.4722, -0.4604, 1.3808, -0.3858, -0.7707, -0.5247, 0.1395, 0.3130],
  21848. [ 0.5414, -0.4888, 1.3641, -1.3285, -0.4477, -1.3795, 0.6508, 0.0505],
  21849. [ 0.3127, -0.6277, 1.7601, -0.0538, -0.2350, -0.0423, 0.4265, 0.3210],
  21850. [ 0.2437, -0.6771, 1.7701, -1.0139, -0.0564, -1.2747, 1.0509, 0.1679],
  21851. [ 0.5388, -0.4299, 1.0035, -1.1597, -0.4715, -1.3582, 0.1529, 0.2767],
  21852. [ 0.8609, -0.2031, 1.7233, 0.0268, -0.7773, -0.6240, 0.2071, 0.1623],
  21853. [ 0.5464, -0.4439, 1.6349, 0.1478, -0.3280, 0.1001, 0.1455, 0.2697]],
  21854. device='cuda:0', grad_fn=<AddmmBackward>)
  21855. landmarks are: tensor([[[ 5.6039e-01, -4.6197e-01, 1.7961e+00, -1.9969e-01, -3.2286e-01,
  21856. 1.0824e-01, 4.1039e-01, 2.5450e-01],
  21857. [ 5.4267e-01, -4.0354e-01, 1.2688e+00, -3.6754e-01, -6.8083e-01,
  21858. -5.4611e-01, 9.5867e-02, 2.2059e-01],
  21859. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  21860. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  21861. [ 5.3712e-01, -4.2517e-01, 1.7037e+00, -6.8822e-02, -3.4180e-02,
  21862. 6.2048e-02, 3.7575e-01, 2.8530e-01],
  21863. [ 6.2072e-01, -3.9360e-01, 1.7788e+00, -1.1235e+00, 1.4480e-01,
  21864. -1.0850e+00, 1.1459e+00, 1.9818e-01],
  21865. [ 5.8505e-01, -3.9246e-01, 1.0513e+00, -1.3467e+00, -3.5173e-01,
  21866. -1.2620e+00, 4.7390e-01, 1.5443e-01],
  21867. [ 5.4434e-01, -3.9938e-01, 1.7499e+00, -1.2271e-01, -6.1732e-01,
  21868. -5.7691e-01, 4.8756e-03, 2.0706e-01],
  21869. [ 5.2021e-01, -4.3818e-01, 1.6460e+00, 1.0824e-01, -2.0286e-01,
  21870. 1.7544e-01, 1.0666e-01, 1.5296e-01]]], device='cuda:0')
  21871. loss_train_step before backward: tensor(0.0184, device='cuda:0', grad_fn=<MseLossBackward>)
  21872. loss_train_step after backward: tensor(0.0184, device='cuda:0', grad_fn=<MseLossBackward>)
  21873. loss_train: 2.0121765499934554
  21874. step: 62
  21875. running loss: 0.03245446048376541
  21876. Train Steps: 62/90 Loss: 0.0325 torch.Size([8, 600, 800])
  21877. torch.Size([8, 8])
  21878. tensor([[0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  21879. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  21880. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  21881. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  21882. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  21883. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  21884. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  21885. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947]],
  21886. device='cuda:0', dtype=torch.float64)
  21887. predictions are: tensor([[ 0.5197, -0.4527, 1.5950, 0.1716, -0.5711, -0.4149, 0.0090, 0.3377],
  21888. [ 0.3744, -0.5529, 1.5663, -1.0771, -0.2237, -1.2708, 0.4707, 0.0513],
  21889. [ 0.5448, -0.4714, 1.7032, -0.2847, -0.6567, -0.5911, 0.5097, 0.0959],
  21890. [ 0.6185, -0.3506, 1.0383, -0.7511, -0.1287, -1.3023, 0.0891, 0.4953],
  21891. [ 0.3769, -0.5777, 1.6381, -0.5963, -0.5831, 0.0237, 0.5714, 0.2753],
  21892. [ 0.5147, -0.4490, 1.7073, -0.1214, -0.4517, 0.0542, 0.3266, 0.3011],
  21893. [ 0.5869, -0.4673, 1.8068, -0.0764, -0.5900, -0.2953, 0.7764, 0.1528],
  21894. [ 0.4651, -0.5418, 1.3631, -1.2766, -0.3952, -1.2271, 0.5598, 0.0800]],
  21895. device='cuda:0', grad_fn=<AddmmBackward>)
  21896. landmarks are: tensor([[[ 5.4515e-01, -4.0670e-01, 1.7557e+00, 5.4350e-02, -4.9607e-01,
  21897. -3.3056e-01, 1.3228e-01, 4.3063e-01],
  21898. [ 6.1264e-01, -3.8707e-01, 1.6229e+00, -1.0773e+00, -2.1316e-01,
  21899. -1.3698e+00, 5.8291e-01, -2.0913e-02],
  21900. [ 6.2200e-01, -4.4357e-01, 1.8711e+00, -3.6905e-01, -6.1732e-01,
  21901. -4.9992e-01, 6.7021e-01, 6.9746e-02],
  21902. [ 6.1611e-01, -3.0754e-01, 1.1678e+00, -6.5000e-01, 8.1293e-02,
  21903. -1.4006e+00, 2.5450e-01, 5.6243e-01],
  21904. [ 5.8412e-01, -4.1986e-01, 1.7961e+00, -6.6928e-01, -6.2309e-01,
  21905. 1.0824e-01, 6.5289e-01, 1.1594e-01],
  21906. [ 5.9677e-01, -3.7252e-01, 1.8423e+00, -1.3811e-01, -4.0370e-01,
  21907. 1.8522e-01, 6.0092e-01, 2.7760e-01],
  21908. [ 6.1742e-01, -4.1286e-01, 1.8711e+00, -1.0731e-01, -5.4804e-01,
  21909. -1.2271e-01, 9.5578e-01, 2.5161e-01],
  21910. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  21911. -1.1312e+00, 6.1950e-01, -9.2270e-04]]], device='cuda:0')
  21912. loss_train_step before backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  21913. loss_train_step after backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  21914. loss_train: 2.0250426745042205
  21915. step: 63
  21916. running loss: 0.03214353451594001
  21917. Train Steps: 63/90 Loss: 0.0321 torch.Size([8, 600, 800])
  21918. torch.Size([8, 8])
  21919. tensor([[0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  21920. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  21921. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  21922. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  21923. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  21924. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  21925. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  21926. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367]],
  21927. device='cuda:0', dtype=torch.float64)
  21928. predictions are: tensor([[ 0.5808, -0.4370, 1.2576, -1.1996, -0.3212, -1.3849, 0.3267, 0.0878],
  21929. [ 0.4906, -0.5313, 1.7542, 0.1598, -0.3029, 0.2531, 0.3300, 0.1995],
  21930. [ 0.3006, -0.5941, 1.0523, -0.8893, -0.6749, -0.6995, 0.1450, 0.3257],
  21931. [ 0.6383, -0.3974, 0.9691, -1.1039, -0.3556, -1.3894, 0.1058, 0.2528],
  21932. [ 0.5203, -0.4946, 1.8813, -0.0241, -0.6237, -0.5090, 0.5620, 0.1526],
  21933. [ 0.4117, -0.5442, 1.3097, -1.0924, -0.3429, -1.2326, 0.5587, 0.1343],
  21934. [ 0.6043, -0.4339, 1.7556, 0.0348, -0.4017, 0.2142, 0.6594, 0.2807],
  21935. [ 0.4688, -0.4926, 1.7983, -0.7584, -0.3287, -1.0427, 0.5270, 0.1824]],
  21936. device='cuda:0', grad_fn=<AddmmBackward>)
  21937. landmarks are: tensor([[[ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  21938. 0.1082],
  21939. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  21940. 0.0764],
  21941. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  21942. 0.3315],
  21943. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  21944. 0.2699],
  21945. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  21946. 0.0472],
  21947. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  21948. 0.1575],
  21949. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  21950. 0.1982],
  21951. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  21952. 0.1929]]], device='cuda:0')
  21953. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  21954. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  21955. loss_train: 2.035658926703036
  21956. step: 64
  21957. running loss: 0.031807170729734935
  21958.  
  21959. Train Steps: 64/90 Loss: 0.0318 torch.Size([8, 600, 800])
  21960. torch.Size([8, 8])
  21961. tensor([[0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  21962. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  21963. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  21964. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  21965. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  21966. [0.6192, 0.3980, 0.7078, 0.2750, 0.4250, 0.2100, 0.5450, 0.5783],
  21967. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  21968. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483]],
  21969. device='cuda:0', dtype=torch.float64)
  21970. predictions are: tensor([[ 1.1619, -0.0507, 1.9458, 0.1117, -0.3936, 0.2390, 0.6420, 0.0908],
  21971. [-0.6746, -1.2440, 0.9450, -1.3181, -0.3175, -1.5303, 0.2282, 0.3076],
  21972. [-0.8266, -1.3301, 1.1158, -1.1625, -0.5268, -1.1397, 0.0964, 0.2674],
  21973. [ 0.9588, -0.1822, 1.7905, 0.1449, -0.5481, -0.2363, 0.5219, 0.3334],
  21974. [ 0.9507, -0.1960, 1.8109, 0.1169, -0.0843, 0.0336, 0.1701, 0.1119],
  21975. [-0.1099, -0.8441, 1.0848, -1.0951, -0.3097, -1.2919, 0.2902, 0.3028],
  21976. [ 1.0059, -0.1478, 1.7145, -0.5904, -0.6488, -0.6710, 0.6253, 0.1184],
  21977. [ 0.9850, -0.1714, 1.1831, -1.1515, -0.3543, -1.2117, 0.5893, 0.1447]],
  21978. device='cuda:0', grad_fn=<AddmmBackward>)
  21979. landmarks are: tensor([[[ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  21980. 0.1390],
  21981. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  21982. 0.3469],
  21983. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  21984. 0.4543],
  21985. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  21986. 0.5239],
  21987. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  21988. 0.0532],
  21989. [ 0.5742, -0.4474, 0.9834, -1.0159, -0.3229, -1.3159, 0.2314,
  21990. 0.3854],
  21991. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  21992. 0.2083],
  21993. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  21994. 0.2468]]], device='cuda:0')
  21995. loss_train_step before backward: tensor(0.1430, device='cuda:0', grad_fn=<MseLossBackward>)
  21996. loss_train_step after backward: tensor(0.1430, device='cuda:0', grad_fn=<MseLossBackward>)
  21997. loss_train: 2.1786455223336816
  21998. step: 65
  21999. running loss: 0.03351762342051818
  22000. Train Steps: 65/90 Loss: 0.0335 torch.Size([8, 600, 800])
  22001. torch.Size([8, 8])
  22002. tensor([[0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  22003. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  22004. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  22005. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  22006. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  22007. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  22008. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  22009. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758]],
  22010. device='cuda:0', dtype=torch.float64)
  22011. predictions are: tensor([[ 0.4607, -0.5076, 1.5616, -0.9819, -0.3880, -1.0047, 0.6830, 0.2139],
  22012. [ 0.2895, -0.5994, 1.3120, -1.0558, -0.5012, -1.1000, 0.1815, 0.0953],
  22013. [ 0.7617, -0.2370, 1.0651, -0.8918, -0.0222, -1.3057, 0.3144, 0.5303],
  22014. [ 0.2737, -0.6040, 1.1433, -1.1580, -0.5218, -0.9390, 0.1412, 0.1010],
  22015. [ 0.6965, -0.3564, 1.6710, -0.2018, -0.2981, -0.0155, 0.4957, 0.2971],
  22016. [ 0.6458, -0.3963, 1.7657, 0.1448, -0.5660, -0.6313, 0.6119, 0.0351],
  22017. [ 0.5802, -0.4325, 1.6830, -0.1799, -0.3756, -0.1435, 0.3684, 0.2465],
  22018. [ 0.6696, -0.3913, 1.7502, -0.2301, -0.3841, -0.0126, 0.6902, 0.1319]],
  22019. device='cuda:0', grad_fn=<AddmmBackward>)
  22020. landmarks are: tensor([[[ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  22021. 0.1931],
  22022. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  22023. -0.0220],
  22024. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  22025. 0.5624],
  22026. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  22027. 0.0141],
  22028. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  22029. 0.2391],
  22030. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  22031. -0.0957],
  22032. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  22033. 0.2035],
  22034. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  22035. -0.0881]]], device='cuda:0')
  22036. loss_train_step before backward: tensor(0.0131, device='cuda:0', grad_fn=<MseLossBackward>)
  22037. loss_train_step after backward: tensor(0.0131, device='cuda:0', grad_fn=<MseLossBackward>)
  22038. loss_train: 2.1917926585301757
  22039. step: 66
  22040. running loss: 0.03320897967469963
  22041. Train Steps: 66/90 Loss: 0.0332 torch.Size([8, 600, 800])
  22042. torch.Size([8, 8])
  22043. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  22044. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  22045. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  22046. [0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  22047. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  22048. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  22049. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  22050. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940]],
  22051. device='cuda:0', dtype=torch.float64)
  22052. predictions are: tensor([[ 0.5727, -0.3898, 1.5611, -0.2527, -0.5054, -0.5357, 0.4417, 0.4269],
  22053. [ 0.4821, -0.4974, 1.6563, -0.2330, -0.2927, -0.1848, 0.4000, 0.1484],
  22054. [ 0.5810, -0.4360, 1.5775, -0.0716, -0.4948, -0.5690, 0.5614, 0.1391],
  22055. [ 1.0774, -0.0504, 1.6881, -0.3434, -0.2318, 0.0752, 0.3415, 0.1202],
  22056. [ 0.6469, -0.3567, 1.6222, -0.0748, -0.4106, -0.3050, 0.4462, 0.2349],
  22057. [ 0.7940, -0.2222, 1.6271, -0.2506, -0.5119, -0.7262, 0.5196, 0.1868],
  22058. [ 0.4953, -0.4453, 1.4948, -1.0337, -0.5386, -0.4044, 0.5632, 0.2785],
  22059. [ 0.4612, -0.5075, 1.6961, -0.4348, -0.0683, -0.3957, 0.2832, 0.0984]],
  22060. device='cuda:0', grad_fn=<AddmmBackward>)
  22061. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  22062. 0.5239],
  22063. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  22064. 0.0390],
  22065. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  22066. 0.2075],
  22067. [ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  22068. 0.0652],
  22069. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  22070. 0.1544],
  22071. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  22072. 0.2545],
  22073. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  22074. 0.2083],
  22075. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  22076. -0.0039]]], device='cuda:0')
  22077. loss_train_step before backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  22078. loss_train_step after backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  22079. loss_train: 2.227865911088884
  22080. step: 67
  22081. running loss: 0.033251730016252
  22082. Train Steps: 67/90 Loss: 0.0333 torch.Size([8, 600, 800])
  22083. torch.Size([8, 8])
  22084. tensor([[0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  22085. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  22086. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  22087. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402],
  22088. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  22089. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  22090. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  22091. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517]],
  22092. device='cuda:0', dtype=torch.float64)
  22093. predictions are: tensor([[ 0.8848, -0.1729, 1.4798, 0.2416, -0.3977, -0.0930, 0.4602, 0.4335],
  22094. [ 0.7835, -0.2613, 1.4584, -1.2296, -0.3859, -1.1383, 0.6709, -0.0248],
  22095. [ 0.8811, -0.2185, 1.4146, -1.4647, -0.0089, -1.5862, 0.7598, 0.0176],
  22096. [ 0.7126, -0.2833, 1.5513, -0.0976, -0.4387, -0.1353, 0.2362, 0.2505],
  22097. [-2.0188, -2.1723, 1.0514, -1.4950, -0.3005, -1.1029, 0.2591, 0.3280],
  22098. [ 0.7695, -0.2286, 1.6170, 0.1916, -0.2849, -0.1186, 0.4334, 0.3344],
  22099. [ 0.7143, -0.2892, 1.6661, 0.1946, -0.4831, -0.2583, 0.2466, 0.0479],
  22100. [ 0.8132, -0.2083, 1.5800, -0.8766, -0.5991, -0.5577, 0.4929, 0.1575]],
  22101. device='cuda:0', grad_fn=<AddmmBackward>)
  22102. landmarks are: tensor([[[ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  22103. 0.5393],
  22104. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  22105. -0.0220],
  22106. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  22107. -0.0530],
  22108. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  22109. 0.2093],
  22110. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  22111. 0.3238],
  22112. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  22113. 0.3161],
  22114. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  22115. -0.0370],
  22116. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  22117. 0.2622]]], device='cuda:0')
  22118. loss_train_step before backward: tensor(0.0155, device='cuda:0', grad_fn=<MseLossBackward>)
  22119. loss_train_step after backward: tensor(0.0155, device='cuda:0', grad_fn=<MseLossBackward>)
  22120. loss_train: 2.243375484831631
  22121. step: 68
  22122. running loss: 0.03299081595340634
  22123.  
  22124. Train Steps: 68/90 Loss: 0.0330 torch.Size([8, 600, 800])
  22125. torch.Size([8, 8])
  22126. tensor([[0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  22127. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  22128. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  22129. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841],
  22130. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  22131. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  22132. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  22133. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350]],
  22134. device='cuda:0', dtype=torch.float64)
  22135. predictions are: tensor([[ 0.5492, -0.3537, 1.0510, -1.1307, -0.1063, -1.2669, 0.3406, 0.4151],
  22136. [ 0.5106, -0.4782, 1.6313, -0.0935, -0.4695, -0.1447, 0.2669, 0.0259],
  22137. [ 0.5940, -0.3389, 1.5285, -0.8920, -0.1874, -1.3273, 0.2889, 0.0553],
  22138. [ 0.6428, -0.3886, 1.6949, -0.4102, -0.3667, -0.6118, 0.9077, 0.2542],
  22139. [ 0.7256, -0.3228, 1.7196, -0.2445, -0.4457, 0.0972, 0.4459, 0.1771],
  22140. [ 0.4534, -0.4983, 1.6209, -0.9948, -0.3314, -0.8475, 0.8452, 0.2427],
  22141. [ 0.5449, -0.4638, 1.6773, -0.2547, -0.5393, -0.0724, 0.4429, 0.1515],
  22142. [ 0.4045, -0.5464, 1.6156, -0.0932, -0.4692, -0.2328, 0.0977, 0.1593]],
  22143. device='cuda:0', grad_fn=<AddmmBackward>)
  22144. landmarks are: tensor([[[ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  22145. 0.3854],
  22146. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  22147. 0.0313],
  22148. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  22149. -0.0368],
  22150. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  22151. 0.4119],
  22152. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  22153. 0.2237],
  22154. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  22155. 0.3050],
  22156. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  22157. 0.0727],
  22158. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  22159. 0.1854]]], device='cuda:0')
  22160. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  22161. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  22162. loss_train: 2.2540173502638936
  22163. step: 69
  22164. running loss: 0.032666918119766575
  22165. Train Steps: 69/90 Loss: 0.0327 torch.Size([8, 600, 800])
  22166. torch.Size([8, 8])
  22167. tensor([[0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  22168. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  22169. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  22170. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  22171. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  22172. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  22173. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  22174. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899]],
  22175. device='cuda:0', dtype=torch.float64)
  22176. predictions are: tensor([[ 0.2508, -0.5467, 0.7966, -1.1588, -0.2903, -1.3747, 0.0383, 0.3953],
  22177. [ 0.5413, -0.4319, 1.3898, -1.3634, -0.2613, -1.1370, 0.5943, 0.0810],
  22178. [ 0.6342, -0.3566, 1.4557, 0.1665, -0.3822, -0.0786, 0.7992, 0.3457],
  22179. [ 0.5728, -0.4382, 1.8137, -0.3345, -0.5790, -0.2428, 0.4343, 0.0768],
  22180. [ 0.9392, -0.1153, 1.6216, -0.5804, -0.5492, -0.3375, 0.1921, 0.1121],
  22181. [ 0.1582, -0.6907, 1.7376, -0.2148, -0.5145, -0.3778, 0.1450, 0.0500],
  22182. [ 0.3844, -0.5329, 1.5189, -0.9580, -0.1783, -1.0164, 0.7031, 0.2159],
  22183. [ 0.4851, -0.4767, 1.8267, -0.0919, -0.3050, -0.2376, 0.7236, 0.2378]],
  22184. device='cuda:0', grad_fn=<AddmmBackward>)
  22185. landmarks are: tensor([[[ 5.5318e-01, -4.2640e-01, 7.6259e-01, -1.1466e+00, -3.9792e-01,
  22186. -1.2928e+00, 2.4936e-01, 3.8081e-01],
  22187. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  22188. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  22189. [ 6.4542e-01, -3.9842e-01, 1.3804e+00, 2.5450e-01, -4.5566e-01,
  22190. -3.8029e-02, 1.1057e+00, 3.4780e-01],
  22191. [ 6.0095e-01, -4.3453e-01, 1.8480e+00, -3.5366e-01, -6.4619e-01,
  22192. -2.6128e-01, 6.5240e-01, -9.9401e-03],
  22193. [ 5.8406e-01, -3.7783e-01, 1.6113e+00, -6.4619e-01, -6.6351e-01,
  22194. -2.5358e-01, 3.5423e-01, 8.0233e-02],
  22195. [ 5.8435e-01, -4.4657e-01, 1.8423e+00, -1.9969e-01, -5.9423e-01,
  22196. -3.9985e-01, 4.2194e-01, 4.6651e-02],
  22197. [ 6.1742e-01, -3.9842e-01, 1.5975e+00, -9.9214e-01, -3.6328e-01,
  22198. -9.9261e-01, 8.2047e-01, 2.0505e-01],
  22199. [ 6.4542e-01, -3.7194e-01, 1.9115e+00, -1.3041e-01, -5.0762e-01,
  22200. -2.8437e-01, 1.0033e+00, 4.3864e-01]]], device='cuda:0')
  22201. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  22202. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  22203. loss_train: 2.2742685051634908
  22204. step: 70
  22205. running loss: 0.032489550073764153
  22206. Train Steps: 70/90 Loss: 0.0325 torch.Size([8, 600, 800])
  22207. torch.Size([8, 8])
  22208. tensor([[0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  22209. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  22210. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  22211. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  22212. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  22213. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  22214. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  22215. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413]],
  22216. device='cuda:0', dtype=torch.float64)
  22217. predictions are: tensor([[ 0.5122, -0.4982, 1.8205, -0.3142, -0.5797, -0.0591, 0.6661, 0.1336],
  22218. [ 0.7927, -0.2415, 1.0857, -1.1362, -0.2013, -1.2924, 0.4452, 0.1942],
  22219. [ 0.3741, -0.4858, 1.5175, -0.3482, -0.5324, -0.6665, 0.0663, 0.2776],
  22220. [ 0.2747, -0.5748, 1.5718, -0.4627, -0.4041, -0.8664, 0.1605, 0.1826],
  22221. [ 0.2877, -0.5945, 1.3762, -0.9632, -0.5021, -0.6231, 0.5349, 0.1469],
  22222. [ 0.4169, -0.4920, 1.3689, -1.1018, -0.2625, -0.9907, 0.6163, 0.2166],
  22223. [ 0.5410, -0.4205, 1.5504, -0.5371, -0.5861, -0.2351, 0.3069, 0.0715],
  22224. [ 0.4781, -0.5026, 1.9161, -0.2707, -0.1580, -0.6887, 0.9722, 0.1813]],
  22225. device='cuda:0', grad_fn=<AddmmBackward>)
  22226. landmarks are: tensor([[[ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  22227. -0.0099],
  22228. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  22229. 0.1449],
  22230. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  22231. 0.2116],
  22232. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  22233. 0.0021],
  22234. [ 0.5477, -0.4413, 1.3688, -0.8771, -0.6115, -0.8771, 0.4104,
  22235. 0.0467],
  22236. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  22237. 0.1929],
  22238. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  22239. 0.0021],
  22240. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  22241. 0.2142]]], device='cuda:0')
  22242. loss_train_step before backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  22243. loss_train_step after backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  22244. loss_train: 2.289423213340342
  22245. step: 71
  22246. running loss: 0.03224539737099073
  22247. Train Steps: 71/90 Loss: 0.0322 torch.Size([8, 600, 800])
  22248. torch.Size([8, 8])
  22249. tensor([[0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  22250. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  22251. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  22252. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  22253. [0.6125, 0.4035, 0.7825, 0.3100, 0.3463, 0.4900, 0.5832, 0.5637],
  22254. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  22255. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  22256. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960]],
  22257. device='cuda:0', dtype=torch.float64)
  22258. predictions are: tensor([[ 0.4479, -0.4506, 1.6853, -0.1913, -0.3362, -0.1246, 0.2974, 0.2190],
  22259. [ 0.4831, -0.4276, 1.6233, 0.2123, -0.4058, -0.0915, 0.4055, 0.2812],
  22260. [ 0.6317, -0.3702, 1.9464, -0.4200, -0.3204, -1.1019, 0.9239, 0.0278],
  22261. [ 0.7079, -0.2363, 1.5972, -0.7340, -0.6275, -0.5334, 0.4059, 0.3556],
  22262. [ 0.3797, -0.4968, 1.3329, -0.9653, -0.6206, -0.1962, 0.4695, 0.2560],
  22263. [ 0.6649, -0.3512, 1.5966, 0.2881, -0.5217, -0.2935, 0.5200, 0.0120],
  22264. [ 0.5794, -0.3805, 1.7459, -0.2830, -0.0878, -0.1662, 0.4798, 0.1850],
  22265. [ 0.6714, -0.3518, 1.7962, -0.2419, -0.2278, -0.1438, 0.3156, 0.0287]],
  22266. device='cuda:0', grad_fn=<AddmmBackward>)
  22267. landmarks are: tensor([[[ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  22268. 0.3084],
  22269. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  22270. 0.3161],
  22271. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  22272. 0.2142],
  22273. [ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  22274. 0.5239],
  22275. [ 0.5432, -0.4224, 1.3284, -0.8540, -0.6866, -0.0226, 0.4077,
  22276. 0.3177],
  22277. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  22278. -0.1492],
  22279. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  22280. 0.2853],
  22281. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  22282. 0.0051]]], device='cuda:0')
  22283. loss_train_step before backward: tensor(0.0154, device='cuda:0', grad_fn=<MseLossBackward>)
  22284. loss_train_step after backward: tensor(0.0154, device='cuda:0', grad_fn=<MseLossBackward>)
  22285. loss_train: 2.304807144217193
  22286. step: 72
  22287. running loss: 0.032011210336349905
  22288.  
  22289. Train Steps: 72/90 Loss: 0.0320 torch.Size([8, 600, 800])
  22290. torch.Size([8, 8])
  22291. tensor([[0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  22292. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  22293. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  22294. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  22295. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  22296. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  22297. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  22298. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250]],
  22299. device='cuda:0', dtype=torch.float64)
  22300. predictions are: tensor([[ 0.5122, -0.4145, 1.0718, -0.8660, -0.4378, -0.9175, 0.5208, 0.2975],
  22301. [ 0.6879, -0.2902, 1.8188, -0.6282, -0.4061, -0.6229, 0.5794, 0.0858],
  22302. [ 0.7078, -0.2872, 1.2850, -1.0183, -0.4095, -0.7490, 0.5825, 0.1415],
  22303. [ 0.7138, -0.3128, 1.8883, 0.1094, -0.5699, -0.3284, 0.4986, 0.0147],
  22304. [ 0.7631, -0.2945, 1.7644, -0.9269, 0.1532, -1.1395, 1.0988, 0.0832],
  22305. [ 0.6894, -0.2747, 1.4439, -0.3181, -0.5894, -0.7208, 0.0107, 0.2779],
  22306. [-2.3025, -2.3297, 1.0130, -1.0680, -0.5892, -0.9831, 0.0336, 0.3642],
  22307. [ 0.8791, -0.1854, 1.9073, -0.1095, -0.5426, -0.0348, 0.5527, 0.0630]],
  22308. device='cuda:0', grad_fn=<AddmmBackward>)
  22309. landmarks are: tensor([[[ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  22310. 0.3700],
  22311. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  22312. 0.1390],
  22313. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  22314. 0.1621],
  22315. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  22316. 0.1005],
  22317. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  22318. 0.1982],
  22319. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  22320. 0.4374],
  22321. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  22322. 0.4543],
  22323. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  22324. 0.1390]]], device='cuda:0')
  22325. loss_train_step before backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  22326. loss_train_step after backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  22327. loss_train: 2.318676040507853
  22328. step: 73
  22329. running loss: 0.03176268548640895
  22330. Train Steps: 73/90 Loss: 0.0318 torch.Size([8, 600, 800])
  22331. torch.Size([8, 8])
  22332. tensor([[0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  22333. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  22334. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  22335. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  22336. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  22337. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  22338. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  22339. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550]],
  22340. device='cuda:0', dtype=torch.float64)
  22341. predictions are: tensor([[ 4.7113e-01, -4.8745e-01, 1.8539e+00, 3.2894e-01, -4.1775e-01,
  22342. -7.5153e-03, 5.0597e-01, 2.3463e-01],
  22343. [ 5.6107e-01, -4.3712e-01, 1.7635e+00, 2.1942e-01, -4.4146e-01,
  22344. -9.3449e-02, 4.3632e-01, 6.4832e-02],
  22345. [ 5.3550e-01, -3.7773e-01, 1.2046e+00, -7.6963e-01, -3.0734e-01,
  22346. -1.2585e+00, 3.2494e-01, 4.1616e-01],
  22347. [ 7.6130e-01, -2.6534e-01, 1.8936e+00, 1.0186e-03, -2.6857e-01,
  22348. 4.8667e-01, 3.9008e-01, 1.2859e-01],
  22349. [ 3.2546e-01, -5.6136e-01, 1.1409e+00, -1.3242e+00, -5.3331e-01,
  22350. -1.1989e+00, 3.7836e-01, 1.0678e-01],
  22351. [ 3.6444e-01, -5.2857e-01, 1.3846e+00, -1.0845e+00, -5.1766e-01,
  22352. -1.0753e+00, 6.7351e-01, 2.3173e-01],
  22353. [ 5.3250e-01, -4.3660e-01, 1.9654e+00, 2.5421e-03, -4.6362e-01,
  22354. -5.2328e-01, 7.3296e-01, 3.7710e-02],
  22355. [ 5.8066e-01, -4.1115e-01, 1.5945e+00, -8.2236e-01, -6.5597e-01,
  22356. -3.0854e-01, 5.7481e-01, 1.6315e-01]], device='cuda:0',
  22357. grad_fn=<AddmmBackward>)
  22358. landmarks are: tensor([[[ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  22359. 0.3007],
  22360. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  22361. 0.2091],
  22362. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  22363. 0.5401],
  22364. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  22365. 0.0412],
  22366. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  22367. 0.2853],
  22368. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  22369. 0.3777],
  22370. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  22371. 0.1661],
  22372. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  22373. 0.2776]]], device='cuda:0')
  22374. loss_train_step before backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  22375. loss_train_step after backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  22376. loss_train: 2.3302313135936856
  22377. step: 74
  22378. running loss: 0.03148961234586062
  22379. Train Steps: 74/90 Loss: 0.0315 torch.Size([8, 600, 800])
  22380. torch.Size([8, 8])
  22381. tensor([[0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874],
  22382. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  22383. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  22384. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  22385. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  22386. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  22387. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  22388. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466]],
  22389. device='cuda:0', dtype=torch.float64)
  22390. predictions are: tensor([[ 0.7608, -0.2662, 1.7774, 0.1798, -0.3807, -0.0089, 0.3839, 0.2495],
  22391. [ 0.3894, -0.5370, 1.4442, -0.7026, -0.7186, -0.3379, 0.3447, 0.1872],
  22392. [ 0.4860, -0.4275, 1.6876, 0.2732, -0.4168, -0.2713, 0.4909, 0.4333],
  22393. [ 0.5600, -0.3997, 1.0086, -1.0654, -0.6472, -1.0534, 0.2950, 0.2712],
  22394. [ 0.7111, -0.3574, 1.9038, -0.0752, -0.6639, -0.4627, 0.6405, 0.0408],
  22395. [ 0.5216, -0.4450, 1.8388, -0.1305, -0.3204, 0.0560, 0.3731, 0.1311],
  22396. [ 0.4902, -0.5181, 1.9518, -0.7413, -0.3985, -0.9655, 1.0865, 0.0022],
  22397. [ 0.5865, -0.3897, 1.7734, 0.0111, -0.2692, 0.1866, 0.3871, 0.1497]],
  22398. device='cuda:0', grad_fn=<AddmmBackward>)
  22399. landmarks are: tensor([[[ 0.5453, -0.4091, 1.7499, 0.1390, -0.2940, -0.0996, 0.1300,
  22400. 0.4272],
  22401. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  22402. 0.2386],
  22403. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  22404. 0.4470],
  22405. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  22406. 0.4103],
  22407. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  22408. 0.1082],
  22409. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  22410. 0.3238],
  22411. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  22412. 0.1821],
  22413. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  22414. 0.2386]]], device='cuda:0')
  22415. loss_train_step before backward: tensor(0.0163, device='cuda:0', grad_fn=<MseLossBackward>)
  22416. loss_train_step after backward: tensor(0.0163, device='cuda:0', grad_fn=<MseLossBackward>)
  22417. loss_train: 2.34652538318187
  22418. step: 75
  22419. running loss: 0.0312870051090916
  22420. Train Steps: 75/90 Loss: 0.0313 torch.Size([8, 600, 800])
  22421. torch.Size([8, 8])
  22422. tensor([[0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  22423. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  22424. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  22425. [0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103],
  22426. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  22427. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  22428. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  22429. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927]],
  22430. device='cuda:0', dtype=torch.float64)
  22431. predictions are: tensor([[ 0.8955, -0.1829, 1.1701, -1.0772, -0.3697, -1.3048, 0.5593, 0.1958],
  22432. [ 0.7101, -0.3358, 1.6189, 0.2893, -0.5472, -0.0433, 0.4882, 0.1745],
  22433. [-0.0980, -0.8081, 1.4499, -1.2712, -0.0374, -1.2084, 0.8850, 0.3341],
  22434. [ 0.5643, -0.3828, 1.7756, -0.2794, -0.7242, -0.0340, 0.4257, 0.1475],
  22435. [ 0.3468, -0.5400, 1.7338, -0.1671, -0.7472, -0.5945, 0.3265, 0.2328],
  22436. [ 0.3623, -0.5074, 1.7292, -0.6107, -0.3487, -1.0112, 0.6881, 0.2868],
  22437. [ 0.6102, -0.4003, 1.6497, 0.1532, -0.3328, 0.2402, 0.4762, 0.1845],
  22438. [ 0.4357, -0.5049, 1.7483, -0.0460, -0.4219, 0.1342, 0.1869, 0.0424]],
  22439. device='cuda:0', grad_fn=<AddmmBackward>)
  22440. landmarks are: tensor([[[ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  22441. 0.2203],
  22442. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  22443. 0.2091],
  22444. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  22445. 0.2730],
  22446. [ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  22447. 0.0712],
  22448. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  22449. 0.2203],
  22450. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  22451. 0.1554],
  22452. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  22453. 0.0942],
  22454. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  22455. -0.0099]]], device='cuda:0')
  22456. loss_train_step before backward: tensor(0.0295, device='cuda:0', grad_fn=<MseLossBackward>)
  22457. loss_train_step after backward: tensor(0.0295, device='cuda:0', grad_fn=<MseLossBackward>)
  22458. loss_train: 2.376007336191833
  22459. step: 76
  22460. running loss: 0.03126325442357675
  22461.  
  22462. Train Steps: 76/90 Loss: 0.0313 torch.Size([8, 600, 800])
  22463. torch.Size([8, 8])
  22464. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  22465. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  22466. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  22467. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  22468. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  22469. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  22470. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  22471. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051]],
  22472. device='cuda:0', dtype=torch.float64)
  22473. predictions are: tensor([[ 6.2599e-01, -3.7787e-01, 1.7324e+00, -1.4953e-03, -5.6675e-01,
  22474. -2.6756e-01, 4.9518e-01, 4.3112e-01],
  22475. [ 6.0591e-01, -4.0288e-01, 1.4897e+00, -9.1640e-01, -6.3901e-01,
  22476. -7.7692e-01, 4.3591e-01, 9.2140e-02],
  22477. [ 3.4257e-01, -5.5844e-01, 1.6558e+00, 1.9338e-01, -4.5376e-01,
  22478. -9.7340e-03, 3.2920e-01, 2.5710e-01],
  22479. [ 4.5453e-01, -4.8078e-01, 1.7472e+00, -1.1293e-01, -2.6900e-01,
  22480. 2.1217e-03, 2.5967e-01, 2.2156e-01],
  22481. [ 6.1328e-01, -3.6578e-01, 1.3096e+00, -7.1024e-01, -6.7487e-01,
  22482. -5.3066e-01, 2.5872e-01, 3.9249e-01],
  22483. [ 5.6314e-01, -4.0142e-01, 1.8560e+00, -1.5741e-01, -1.9763e-01,
  22484. 2.6406e-01, 4.0827e-01, 1.1360e-01],
  22485. [ 5.6209e-01, -4.2365e-01, 1.7095e+00, 1.2593e-01, -4.6443e-01,
  22486. -4.5895e-01, 9.4878e-01, 2.4540e-01],
  22487. [ 7.4072e-01, -3.3453e-01, 1.8828e+00, -1.8974e-01, -5.4737e-01,
  22488. -6.2025e-01, 7.1610e-01, 1.2509e-01]], device='cuda:0',
  22489. grad_fn=<AddmmBackward>)
  22490. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  22491. 0.5239],
  22492. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  22493. 0.0942],
  22494. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  22495. -0.1061],
  22496. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  22497. 0.3238],
  22498. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  22499. 0.4036],
  22500. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  22501. 0.0622],
  22502. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  22503. 0.3692],
  22504. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  22505. 0.0472]]], device='cuda:0')
  22506. loss_train_step before backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  22507. loss_train_step after backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  22508. loss_train: 2.3856922583654523
  22509. step: 77
  22510. running loss: 0.030983016342408472
  22511. Train Steps: 77/90 Loss: 0.0310 torch.Size([8, 600, 800])
  22512. torch.Size([8, 8])
  22513. tensor([[0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  22514. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  22515. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  22516. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  22517. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  22518. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  22519. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  22520. [0.6064, 0.3953, 0.8738, 0.4417, 0.3663, 0.4683, 0.5511, 0.5416]],
  22521. device='cuda:0', dtype=torch.float64)
  22522. predictions are: tensor([[ 0.4816, -0.4621, 1.4665, -0.6807, -0.7312, -0.5035, 0.4855, 0.4826],
  22523. [ 0.3986, -0.5600, 1.7154, 0.1935, -0.3803, 0.1976, 0.4821, 0.1684],
  22524. [ 0.6346, -0.3935, 1.7428, -0.9900, 0.1062, -1.3640, 1.2291, 0.2949],
  22525. [ 0.6019, -0.4224, 1.4777, -0.9274, -0.5007, -0.9511, 0.6558, 0.1184],
  22526. [ 0.4079, -0.5341, 1.7268, -0.0303, -0.6630, -0.3353, 0.3375, 0.2916],
  22527. [ 0.5138, -0.4476, 1.8194, -0.0117, -0.0904, 0.0841, 0.4128, 0.2011],
  22528. [ 0.3823, -0.5219, 0.9403, -0.9047, -0.5712, -1.1431, 0.1388, 0.1978],
  22529. [ 0.5692, -0.4489, 1.8115, -0.0553, -0.6830, -0.0256, 0.2668, 0.1434]],
  22530. device='cuda:0', grad_fn=<AddmmBackward>)
  22531. landmarks are: tensor([[[ 5.7685e-01, -3.8992e-01, 1.3861e+00, -7.7706e-01, -5.8845e-01,
  22532. -5.4611e-01, 5.0277e-01, 5.6243e-01],
  22533. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  22534. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  22535. [ 6.3718e-01, -3.5749e-01, 1.6633e+00, -1.2082e+00, 2.1986e-01,
  22536. -1.2467e+00, 1.1313e+00, 3.0505e-01],
  22537. [ 6.1248e-01, -4.3453e-01, 1.4308e+00, -1.1384e+00, -4.2133e-01,
  22538. -1.0031e+00, 7.1897e-01, 1.2136e-01],
  22539. [ 5.4324e-01, -4.3364e-01, 1.7095e+00, -1.7660e-01, -5.9423e-01,
  22540. -4.8453e-01, 3.0069e-01, 2.8530e-01],
  22541. [ 5.3508e-01, -4.3212e-01, 1.7326e+00, -1.3811e-01, 4.6329e-02,
  22542. 1.0491e-01, 4.1617e-01, 2.7760e-01],
  22543. [ 5.4700e-01, -4.0808e-01, 8.4919e-01, -1.0773e+00, -5.3072e-01,
  22544. -1.1620e+00, 9.1240e-02, 1.8903e-01],
  22545. [ 5.1490e-01, -4.6028e-01, 1.7499e+00, -2.4588e-01, -5.9423e-01,
  22546. -1.2271e-01, 2.5964e-01, 2.1549e-01]]], device='cuda:0')
  22547. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  22548. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  22549. loss_train: 2.3952217008918524
  22550. step: 78
  22551. running loss: 0.03070797052425452
  22552. Train Steps: 78/90 Loss: 0.0307 torch.Size([8, 600, 800])
  22553. torch.Size([8, 8])
  22554. tensor([[0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495],
  22555. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  22556. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378],
  22557. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  22558. [0.6086, 0.3998, 0.8788, 0.4450, 0.4025, 0.4650, 0.5306, 0.5103],
  22559. [0.6314, 0.4107, 0.8750, 0.5100, 0.3788, 0.4900, 0.7121, 0.5864],
  22560. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  22561. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600]],
  22562. device='cuda:0', dtype=torch.float64)
  22563. predictions are: tensor([[ 0.5093, -0.4510, 1.1529, -0.9447, -0.5343, -0.9558, 0.1538, 0.2929],
  22564. [ 0.1427, -0.6651, 1.3357, -0.4493, -0.5945, -0.9460, 0.1704, 0.4914],
  22565. [ 0.6095, -0.4259, 1.8378, 0.1008, -0.3755, 0.2174, 0.8572, 0.2546],
  22566. [ 0.6198, -0.4002, 1.7901, 0.1931, -0.3497, 0.1815, 0.8804, 0.2716],
  22567. [ 0.6056, -0.3894, 1.8245, -0.1414, -0.4505, -0.2102, 0.1380, 0.1016],
  22568. [ 0.6638, -0.3807, 1.8774, 0.2831, -0.4401, -0.0791, 0.8332, 0.2436],
  22569. [ 0.5925, -0.3957, 1.8014, -0.3808, -0.5423, -0.1721, 0.1716, 0.2022],
  22570. [ 0.5354, -0.4287, 1.1695, -1.0155, -0.5159, -0.9060, 0.4118, 0.2849]],
  22571. device='cuda:0', grad_fn=<AddmmBackward>)
  22572. landmarks are: tensor([[[ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  22573. 0.2522],
  22574. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  22575. 0.4470],
  22576. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  22577. 0.1982],
  22578. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  22579. 0.2249],
  22580. [ 0.5253, -0.4392, 1.7730, -0.2305, -0.4268, -0.1381, 0.1651,
  22581. 0.0712],
  22582. [ 0.6306, -0.3888, 1.7557, 0.0697, -0.5365, -0.0226, 1.0033,
  22583. 0.4226],
  22584. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  22585. 0.2776],
  22586. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  22587. 0.3007]]], device='cuda:0')
  22588. loss_train_step before backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  22589. loss_train_step after backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  22590. loss_train: 2.411067308858037
  22591. step: 79
  22592. running loss: 0.03051983935263338
  22593. Train Steps: 79/90 Loss: 0.0305 torch.Size([8, 600, 800])
  22594. torch.Size([8, 8])
  22595. tensor([[0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  22596. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  22597. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583],
  22598. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  22599. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  22600. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  22601. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  22602. [0.6262, 0.4085, 0.8438, 0.3150, 0.4025, 0.2633, 0.6339, 0.4810]],
  22603. device='cuda:0', dtype=torch.float64)
  22604. predictions are: tensor([[ 0.4540, -0.4703, 0.9067, -0.9209, -0.3107, -1.2274, 0.2563, 0.5059],
  22605. [ 0.5799, -0.4351, 1.6240, -0.3646, -0.6393, -0.2595, 0.2720, 0.1308],
  22606. [-1.5526, -1.8142, 0.9907, -1.0273, -0.3385, -1.2593, 0.1713, 0.4376],
  22607. [ 0.6030, -0.4002, 1.0383, -1.0469, -0.4132, -1.0222, 0.5741, 0.3941],
  22608. [ 0.8599, -0.2390, 1.9401, -0.4291, -0.5709, -0.3774, 0.7098, 0.1473],
  22609. [ 0.8415, -0.3189, 1.8656, 0.4869, -0.5526, -0.0591, 0.6731, 0.1598],
  22610. [ 0.6112, -0.4141, 1.7905, -0.2452, -0.4861, 0.1768, 0.4030, 0.2684],
  22611. [ 0.8313, -0.2715, 1.6857, -0.6763, -0.3634, -0.9058, 0.6089, 0.0587]],
  22612. device='cuda:0', grad_fn=<AddmmBackward>)
  22613. landmarks are: tensor([[[ 5.5318e-01, -4.2640e-01, 7.6259e-01, -1.1466e+00, -3.9792e-01,
  22614. -1.2928e+00, 2.4936e-01, 3.8081e-01],
  22615. [ 5.2061e-01, -4.6028e-01, 1.4670e+00, -4.7683e-01, -6.5774e-01,
  22616. -3.9985e-01, 1.8356e-01, 2.0831e-03],
  22617. [-2.2859e+00, -2.2859e+00, 9.9216e-01, -1.2021e+00, -3.2286e-01,
  22618. -1.4314e+00, 1.0439e-01, 2.9299e-01],
  22619. [ 5.9919e-01, -3.9684e-01, 9.3067e-01, -1.3497e+00, -4.7298e-01,
  22620. -1.0465e+00, 5.2587e-01, 2.9299e-01],
  22621. [ 6.0774e-01, -3.9646e-01, 1.8480e+00, -6.5389e-01, -6.2309e-01,
  22622. -4.5373e-01, 6.2155e-01, -2.1963e-02],
  22623. [ 6.2488e-01, -4.3518e-01, 1.8018e+00, 2.5450e-01, -6.1732e-01,
  22624. -1.9969e-01, 6.4006e-01, 2.9135e-02],
  22625. [ 5.5456e-01, -4.6205e-01, 1.7788e+00, -4.2294e-01, -5.1917e-01,
  22626. -2.2633e-02, 4.2771e-01, 2.4681e-01],
  22627. [ 6.0641e-01, -3.9900e-01, 1.6113e+00, -8.3095e-01, -4.2679e-01,
  22628. -1.0696e+00, 6.4212e-01, -6.4044e-02]]], device='cuda:0')
  22629. loss_train_step before backward: tensor(0.0272, device='cuda:0', grad_fn=<MseLossBackward>)
  22630. loss_train_step after backward: tensor(0.0272, device='cuda:0', grad_fn=<MseLossBackward>)
  22631. loss_train: 2.4382315184921026
  22632. step: 80
  22633. running loss: 0.030477893981151284
  22634.  
  22635. Train Steps: 80/90 Loss: 0.0305 torch.Size([8, 600, 800])
  22636. torch.Size([8, 8])
  22637. tensor([[0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  22638. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  22639. [0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  22640. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  22641. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  22642. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  22643. [0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  22644. [0.6192, 0.3980, 0.7078, 0.2750, 0.4250, 0.2100, 0.5450, 0.5783]],
  22645. device='cuda:0', dtype=torch.float64)
  22646. predictions are: tensor([[ 0.6583, -0.3531, 1.5451, -0.6303, -0.7401, -0.6090, 0.5511, 0.2601],
  22647. [ 0.5577, -0.4344, 1.7469, 0.0396, -0.2320, 0.3542, 0.4915, 0.2582],
  22648. [ 0.5700, -0.4197, 1.3435, -1.0377, -0.5919, -0.7790, 0.5803, 0.3046],
  22649. [ 0.4306, -0.4598, 1.5850, 0.0190, -0.3076, -1.0861, 0.4304, 0.5001],
  22650. [ 0.6816, -0.3647, 1.1919, -1.0613, -0.2055, -1.3733, 0.5535, 0.2396],
  22651. [ 0.5564, -0.4769, 1.8245, -0.1644, -0.5580, 0.2945, 0.5149, 0.0401],
  22652. [ 0.4822, -0.5046, 1.7714, -0.1248, -0.1793, 0.1259, 0.3947, 0.1858],
  22653. [-0.4371, -1.0689, 0.9644, -0.8736, -0.3876, -1.3416, 0.3498, 0.4060]],
  22654. device='cuda:0', grad_fn=<AddmmBackward>)
  22655. landmarks are: tensor([[[ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  22656. 0.2083],
  22657. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  22658. 0.2083],
  22659. [ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  22660. 0.2699],
  22661. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  22662. 0.5822],
  22663. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  22664. 0.2083],
  22665. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  22666. -0.0322],
  22667. [ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  22668. 0.2930],
  22669. [ 0.5742, -0.4474, 0.9834, -1.0159, -0.3229, -1.3159, 0.2314,
  22670. 0.3854]]], device='cuda:0')
  22671. loss_train_step before backward: tensor(0.0289, device='cuda:0', grad_fn=<MseLossBackward>)
  22672. loss_train_step after backward: tensor(0.0289, device='cuda:0', grad_fn=<MseLossBackward>)
  22673. loss_train: 2.4671557769179344
  22674. step: 81
  22675. running loss: 0.03045871329528314
  22676. Train Steps: 81/90 Loss: 0.0305 torch.Size([8, 600, 800])
  22677. torch.Size([8, 8])
  22678. tensor([[0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  22679. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  22680. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  22681. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  22682. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  22683. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  22684. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  22685. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869]],
  22686. device='cuda:0', dtype=torch.float64)
  22687. predictions are: tensor([[ 0.3561, -0.5817, 1.6280, -0.5200, -0.6140, 0.0832, 0.4891, 0.2815],
  22688. [ 0.6177, -0.4275, 1.4497, 0.2524, -0.5313, -0.1602, 0.7929, 0.3334],
  22689. [ 0.3869, -0.4878, 1.4759, 0.0193, -0.6202, -0.5727, 0.1075, 0.3970],
  22690. [ 0.6651, -0.3817, 1.7857, -0.0360, -0.4305, 0.4036, 0.5908, 0.1152],
  22691. [ 0.1623, -0.6708, 1.5985, -0.0590, -0.7143, -0.5345, 0.0244, 0.3532],
  22692. [ 0.5097, -0.4573, 1.2580, -1.0156, -0.4474, -0.7448, 0.4199, 0.3221],
  22693. [ 0.6839, -0.3833, 1.6283, -1.0961, 0.1755, -1.2620, 1.0173, 0.3348],
  22694. [ 0.6074, -0.4254, 1.3506, -1.1489, -0.2045, -1.2801, 0.4970, 0.0799]],
  22695. device='cuda:0', grad_fn=<AddmmBackward>)
  22696. landmarks are: tensor([[[ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  22697. 0.2545],
  22698. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  22699. 0.3745],
  22700. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  22701. 0.4393],
  22702. [ 0.5990, -0.4256, 1.7499, -0.0380, -0.3979, 0.3315, 0.6529,
  22703. 0.1159],
  22704. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  22705. 0.4357],
  22706. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  22707. 0.2160],
  22708. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  22709. 0.3050],
  22710. [ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  22711. -0.0370]]], device='cuda:0')
  22712. loss_train_step before backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  22713. loss_train_step after backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  22714. loss_train: 2.478730901144445
  22715. step: 82
  22716. running loss: 0.030228425623712744
  22717. Train Steps: 82/90 Loss: 0.0302 torch.Size([8, 600, 800])
  22718. torch.Size([8, 8])
  22719. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  22720. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  22721. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  22722. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  22723. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  22724. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  22725. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  22726. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044]],
  22727. device='cuda:0', dtype=torch.float64)
  22728. predictions are: tensor([[ 0.1982, -0.6441, 1.4626, -1.0844, -0.4183, -0.8629, 0.2960, 0.2098],
  22729. [ 0.1744, -0.6380, 0.9460, -1.1304, -0.3395, -1.1559, 0.1845, 0.3836],
  22730. [ 0.4829, -0.4581, 1.7923, -0.2788, -0.4446, -0.5581, 0.5883, 0.2422],
  22731. [ 0.5963, -0.3333, 1.1338, -1.0038, -0.1605, -1.0222, 0.3700, 0.4745],
  22732. [ 0.5174, -0.4872, 1.6344, 0.1660, -0.4626, 0.0136, 0.4201, 0.1727],
  22733. [ 0.4432, -0.5566, 1.8790, -0.1467, -0.3513, -0.7157, 0.9092, 0.3290],
  22734. [ 0.6365, -0.4482, 1.6620, 0.3447, -0.5882, 0.0983, 0.6642, 0.0769],
  22735. [ 0.6277, -0.3859, 1.1277, -1.2750, -0.3528, -1.0574, 0.4644, 0.2117]],
  22736. device='cuda:0', grad_fn=<AddmmBackward>)
  22737. landmarks are: tensor([[[ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  22738. 0.0851],
  22739. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  22740. 0.3469],
  22741. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  22742. 0.1608],
  22743. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  22744. 0.3854],
  22745. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  22746. 0.2091],
  22747. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  22748. 0.3692],
  22749. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  22750. -0.1331],
  22751. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  22752. 0.0438]]], device='cuda:0')
  22753. loss_train_step before backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  22754. loss_train_step after backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  22755. loss_train: 2.499280705116689
  22756. step: 83
  22757. running loss: 0.03011181572429746
  22758. Train Steps: 83/90 Loss: 0.0301 torch.Size([8, 600, 800])
  22759. torch.Size([8, 8])
  22760. tensor([[0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  22761. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  22762. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  22763. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  22764. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  22765. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  22766. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  22767. [0.6239, 0.4206, 0.8750, 0.5400, 0.3688, 0.4850, 0.5737, 0.5700]],
  22768. device='cuda:0', dtype=torch.float64)
  22769. predictions are: tensor([[ 0.6278, -0.3582, 1.4195, -0.5272, -0.5106, -0.8733, 0.2839, 0.3572],
  22770. [ 0.6381, -0.4075, 1.6691, -0.0616, -0.2797, 0.1486, 0.6430, 0.1670],
  22771. [ 0.5569, -0.3845, 1.3425, -0.9565, -0.0864, -1.1992, 0.4094, 0.2892],
  22772. [ 0.6495, -0.4110, 1.7332, 0.0540, -0.4006, 0.1699, 0.6011, 0.0674],
  22773. [ 0.7700, -0.2943, 0.8941, -1.3155, -0.2464, -1.4069, 0.3876, 0.2335],
  22774. [-1.6801, -1.9175, 1.2121, -0.9034, -0.5852, -0.9538, 0.2522, 0.3485],
  22775. [ 0.8054, -0.2963, 1.5600, -0.6453, -0.5434, -0.6607, 0.5905, 0.2499],
  22776. [ 0.9652, -0.1676, 1.7356, 0.2161, -0.5124, 0.1078, 0.6526, 0.2850]],
  22777. device='cuda:0', grad_fn=<AddmmBackward>)
  22778. landmarks are: tensor([[[ 5.7790e-01, -3.8397e-01, 1.5420e+00, -4.3064e-01, -5.4226e-01,
  22779. -9.7721e-01, 2.0412e-01, 3.9283e-01],
  22780. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  22781. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  22782. [ 5.9107e-01, -3.8879e-01, 1.4727e+00, -9.5412e-01, -9.1917e-02,
  22783. -1.4930e+00, 3.9885e-01, 2.0831e-01],
  22784. [ 5.7777e-01, -4.3888e-01, 1.7107e+00, 1.1921e-01, -3.9207e-01,
  22785. 8.1507e-02, 4.7413e-01, 7.1077e-02],
  22786. [ 5.5664e-01, -4.1601e-01, 9.9353e-01, -1.3313e+00, -2.8245e-01,
  22787. -1.5161e+00, 2.1441e-01, 1.2532e-01],
  22788. [-2.2859e+00, -2.2859e+00, 1.5074e+00, -1.0388e+00, -5.4226e-01,
  22789. -9.8491e-01, 2.1986e-01, 2.6990e-01],
  22790. [ 5.2546e-01, -4.4950e-01, 1.5651e+00, -4.9992e-01, -5.7113e-01,
  22791. -8.4634e-01, 4.5658e-01, 1.6212e-01],
  22792. [ 5.9601e-01, -3.4305e-01, 1.7557e+00, 2.0831e-01, -5.8268e-01,
  22793. -4.5727e-02, 3.6420e-01, 3.4688e-01]]], device='cuda:0')
  22794. loss_train_step before backward: tensor(0.0224, device='cuda:0', grad_fn=<MseLossBackward>)
  22795. loss_train_step after backward: tensor(0.0224, device='cuda:0', grad_fn=<MseLossBackward>)
  22796. loss_train: 2.5217115683481097
  22797. step: 84
  22798. running loss: 0.03002037581366797
  22799.  
  22800. Train Steps: 84/90 Loss: 0.0300 torch.Size([8, 600, 800])
  22801. torch.Size([8, 8])
  22802. tensor([[0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  22803. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  22804. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  22805. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  22806. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  22807. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  22808. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  22809. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600]],
  22810. device='cuda:0', dtype=torch.float64)
  22811. predictions are: tensor([[ 0.3755, -0.5651, 1.0948, -0.7817, -0.6757, -0.6152, 0.0656, 0.2687],
  22812. [ 0.5311, -0.4885, 1.6368, -0.8579, -0.2738, -1.1269, 0.7426, 0.1522],
  22813. [ 0.5372, -0.4697, 1.4447, -1.0901, -0.2341, -1.2558, 0.6001, 0.1076],
  22814. [ 0.4377, -0.5105, 1.8264, 0.0483, -0.0860, 0.1494, 0.4169, 0.2315],
  22815. [ 0.3859, -0.5386, 0.9109, -1.0271, -0.4228, -1.2534, 0.1069, 0.3340],
  22816. [ 0.7784, -0.3214, 1.5264, -1.0374, -0.1043, -1.2875, 0.6998, 0.2039],
  22817. [ 0.4173, -0.5761, 1.7450, 0.3063, -0.5354, 0.3130, 0.9737, 0.3100],
  22818. [ 0.4244, -0.5139, 1.1205, -0.9749, -0.6412, -0.6767, 0.4314, 0.2827]],
  22819. device='cuda:0', grad_fn=<AddmmBackward>)
  22820. landmarks are: tensor([[[ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  22821. 0.1710],
  22822. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  22823. 0.0953],
  22824. [ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  22825. -0.0370],
  22826. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  22827. 0.2853],
  22828. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  22829. 0.2747],
  22830. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  22831. 0.0851],
  22832. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  22833. 0.3905],
  22834. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  22835. 0.3007]]], device='cuda:0')
  22836. loss_train_step before backward: tensor(0.0115, device='cuda:0', grad_fn=<MseLossBackward>)
  22837. loss_train_step after backward: tensor(0.0115, device='cuda:0', grad_fn=<MseLossBackward>)
  22838. loss_train: 2.5331995971500874
  22839. step: 85
  22840. running loss: 0.029802348201765732
  22841. Train Steps: 85/90 Loss: 0.0298 torch.Size([8, 600, 800])
  22842. torch.Size([8, 8])
  22843. tensor([[0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  22844. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  22845. [0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  22846. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  22847. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  22848. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  22849. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  22850. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800]],
  22851. device='cuda:0', dtype=torch.float64)
  22852. predictions are: tensor([[ 0.3192, -0.5970, 1.7006, 0.2154, -0.0810, 0.0501, 0.5673, 0.2228],
  22853. [ 0.5665, -0.4718, 1.7598, -0.4422, -0.5859, -0.2406, 0.6804, 0.2694],
  22854. [ 0.7055, -0.3615, 1.8326, -0.3187, -0.5280, -0.6149, 0.5665, 0.2291],
  22855. [ 0.2587, -0.6218, 0.9886, -1.2755, -0.3026, -1.5091, 0.3010, 0.1494],
  22856. [ 0.6178, -0.4333, 1.6893, -0.4250, -0.4827, -0.8889, 0.5407, 0.1794],
  22857. [ 0.7328, -0.3638, 1.1332, -1.3629, -0.4475, -1.1089, 0.5656, 0.1385],
  22858. [ 0.4559, -0.5146, 1.7819, -0.2563, -0.3102, 0.2478, 0.6159, 0.2551],
  22859. [ 0.6827, -0.3224, 1.0977, -0.8458, -0.4696, -1.0328, 0.1970, 0.4110]],
  22860. device='cuda:0', grad_fn=<AddmmBackward>)
  22861. landmarks are: tensor([[[ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  22862. 0.0851],
  22863. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  22864. 0.2083],
  22865. [ 0.5791, -0.4127, 1.8442, -0.3985, -0.6031, -0.6154, 0.4473,
  22866. 0.2464],
  22867. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  22868. -0.0580],
  22869. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  22870. 0.1005],
  22871. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  22872. 0.0562],
  22873. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  22874. 0.2622],
  22875. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  22876. 0.3931]]], device='cuda:0')
  22877. loss_train_step before backward: tensor(0.0113, device='cuda:0', grad_fn=<MseLossBackward>)
  22878. loss_train_step after backward: tensor(0.0113, device='cuda:0', grad_fn=<MseLossBackward>)
  22879. loss_train: 2.5444738110527396
  22880. step: 86
  22881. running loss: 0.02958690477968302
  22882. Train Steps: 86/90 Loss: 0.0296 torch.Size([8, 600, 800])
  22883. torch.Size([8, 8])
  22884. tensor([[0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  22885. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  22886. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  22887. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  22888. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  22889. [0.6234, 0.4179, 0.7825, 0.3450, 0.3813, 0.2867, 0.5675, 0.5617],
  22890. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  22891. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917]],
  22892. device='cuda:0', dtype=torch.float64)
  22893. predictions are: tensor([[ 0.3100, -0.6210, 0.9047, -1.3336, -0.3877, -1.2771, 0.5174, 0.1538],
  22894. [ 0.5911, -0.4111, 1.6927, -0.4872, -0.4639, -0.9790, 0.3204, 0.0526],
  22895. [ 0.6158, -0.4260, 1.3063, -1.2585, -0.1382, -1.3125, 0.6621, 0.1757],
  22896. [ 0.7599, -0.2690, 1.0580, -1.0242, -0.0868, -1.2896, 0.4650, 0.4659],
  22897. [ 0.4308, -0.5882, 1.8699, 0.0753, -0.5445, 0.1465, 0.6465, -0.0091],
  22898. [ 0.4604, -0.4707, 1.4312, -0.7649, -0.4340, -0.8856, 0.4767, 0.3702],
  22899. [ 0.1774, -0.7147, 1.8432, -0.1140, -0.2642, 0.0558, 0.2860, -0.0067],
  22900. [ 0.5459, -0.4278, 1.3398, -0.5322, -0.5929, -0.7123, 0.4224, 0.4162]],
  22901. device='cuda:0', grad_fn=<AddmmBackward>)
  22902. landmarks are: tensor([[[ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  22903. 0.1013],
  22904. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  22905. 0.0021],
  22906. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  22907. 0.2083],
  22908. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  22909. 0.5702],
  22910. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  22911. 0.0663],
  22912. [ 0.5935, -0.3558, 1.3284, -0.6924, -0.5249, -0.9618, 0.3353,
  22913. 0.3084],
  22914. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  22915. -0.0099],
  22916. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  22917. 0.4470]]], device='cuda:0')
  22918. loss_train_step before backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  22919. loss_train_step after backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  22920. loss_train: 2.56061180960387
  22921. step: 87
  22922. running loss: 0.029432319650619196
  22923. Train Steps: 87/90 Loss: 0.0294 torch.Size([8, 600, 800])
  22924. torch.Size([8, 8])
  22925. tensor([[0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  22926. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  22927. [0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  22928. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  22929. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  22930. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  22931. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  22932. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167]],
  22933. device='cuda:0', dtype=torch.float64)
  22934. predictions are: tensor([[ 4.6039e-01, -4.2506e-01, 1.4384e+00, -4.5731e-01, -4.3452e-02,
  22935. -1.2264e+00, 3.2788e-01, 3.5845e-01],
  22936. [ 6.0257e-01, -4.3626e-01, 1.1690e+00, -1.2788e+00, -3.3650e-01,
  22937. -1.1651e+00, 6.8741e-01, 1.0520e-01],
  22938. [ 5.2720e-01, -4.8766e-01, 1.6576e+00, -1.2388e+00, -1.2994e-01,
  22939. -1.1635e+00, 1.0622e+00, 1.5645e-01],
  22940. [ 4.8725e-01, -4.7966e-01, 1.4731e+00, -7.5758e-01, -6.2636e-01,
  22941. -6.2725e-01, 5.6555e-01, 3.4666e-01],
  22942. [ 4.4267e-01, -4.8748e-01, 1.3048e+00, -9.8736e-01, -4.8932e-01,
  22943. -9.7766e-01, 2.2468e-01, 9.5480e-02],
  22944. [ 3.4075e-01, -5.4505e-01, 1.4408e+00, -4.8045e-01, -6.5704e-01,
  22945. -4.3574e-01, 2.1275e-01, 1.5534e-01],
  22946. [ 3.3860e-01, -5.9572e-01, 1.7547e+00, -3.4798e-01, -5.4307e-01,
  22947. -8.2032e-02, 4.6923e-01, 4.7698e-02],
  22948. [ 5.7668e-01, -3.5282e-01, 1.1982e+00, -6.6692e-01, -1.3449e-03,
  22949. -1.3082e+00, 3.4176e-01, 3.4211e-01]], device='cuda:0',
  22950. grad_fn=<AddmmBackward>)
  22951. landmarks are: tensor([[[ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  22952. 0.5882],
  22953. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  22954. 0.2622],
  22955. [ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  22956. 0.3157],
  22957. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  22958. 0.5624],
  22959. [ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  22960. 0.3237],
  22961. [ 0.5444, -0.3852, 1.3786, -0.5409, -0.6924, -0.4229, 0.1791,
  22962. 0.2341],
  22963. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  22964. 0.2468],
  22965. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  22966. 0.5624]]], device='cuda:0')
  22967. loss_train_step before backward: tensor(0.0105, device='cuda:0', grad_fn=<MseLossBackward>)
  22968. loss_train_step after backward: tensor(0.0105, device='cuda:0', grad_fn=<MseLossBackward>)
  22969. loss_train: 2.5710743190720677
  22970. step: 88
  22971. running loss: 0.02921675362581895
  22972.  
  22973. Train Steps: 88/90 Loss: 0.0292 torch.Size([8, 600, 800])
  22974. torch.Size([8, 8])
  22975. tensor([[0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  22976. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  22977. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  22978. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  22979. [0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  22980. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  22981. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  22982. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267]],
  22983. device='cuda:0', dtype=torch.float64)
  22984. predictions are: tensor([[ 0.7000, -0.3330, 1.2081, -1.3917, -0.5066, -1.2099, 0.5612, 0.2131],
  22985. [ 0.5759, -0.4134, 1.6561, -0.3017, -0.5498, -0.2371, 0.2067, 0.2265],
  22986. [ 0.5207, -0.4113, 1.6869, -0.0436, -0.5771, -0.3776, 0.2774, 0.1871],
  22987. [ 0.5346, -0.4634, 1.6791, 0.0160, -0.4440, -0.0452, 0.5119, 0.0538],
  22988. [ 0.2992, -0.6279, 1.5847, 0.2346, -0.2637, -0.1236, 0.4955, 0.2122],
  22989. [ 0.4735, -0.4733, 1.6959, -0.1844, -0.1443, -0.1494, 0.2397, 0.2195],
  22990. [ 0.4997, -0.4006, 1.0715, -1.2295, -0.1961, -1.5172, 0.3869, 0.3413],
  22991. [ 0.9420, -0.1883, 1.4086, -1.4380, -0.1689, -1.5866, 0.7342, 0.0748]],
  22992. device='cuda:0', grad_fn=<AddmmBackward>)
  22993. landmarks are: tensor([[[ 5.6966e-01, -4.4656e-01, 1.1973e+00, -1.1871e+00, -4.5712e-01,
  22994. -9.9653e-01, 5.2186e-01, 2.0324e-01],
  22995. [ 5.3684e-01, -4.4057e-01, 1.7730e+00, -1.7660e-01, -5.2494e-01,
  22996. -5.3426e-02, 2.3141e-01, 3.4688e-01],
  22997. [ 5.5289e-01, -3.8106e-01, 1.7788e+00, -3.8029e-02, -5.3072e-01,
  22998. -2.0739e-01, 7.2734e-02, 2.6568e-01],
  22999. [ 5.7777e-01, -4.3888e-01, 1.7107e+00, 1.1921e-01, -3.9207e-01,
  23000. 8.1507e-02, 4.7413e-01, 7.1077e-02],
  23001. [ 5.9107e-01, -4.0805e-01, 1.6460e+00, 3.5458e-01, -2.0739e-01,
  23002. 4.6651e-02, 4.9700e-01, 1.8522e-01],
  23003. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  23004. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  23005. [ 5.8620e-01, -3.5296e-01, 1.1032e+00, -1.0619e+00, -1.4965e-01,
  23006. -1.3852e+00, 3.4111e-01, 3.9307e-01],
  23007. [ 6.0918e-01, -4.1432e-01, 1.4901e+00, -1.2467e+00, -1.2079e-01,
  23008. -1.4006e+00, 6.5866e-01, 1.4673e-01]]], device='cuda:0')
  23009. loss_train_step before backward: tensor(0.0142, device='cuda:0', grad_fn=<MseLossBackward>)
  23010. loss_train_step after backward: tensor(0.0142, device='cuda:0', grad_fn=<MseLossBackward>)
  23011. loss_train: 2.58522439096123
  23012. step: 89
  23013. running loss: 0.02904746506698011
  23014. Train Steps: 89/90 Loss: 0.0290 torch.Size([8, 600, 800])
  23015. torch.Size([8, 8])
  23016. tensor([[0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  23017. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  23018. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  23019. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  23020. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  23021. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  23022. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  23023. [0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385]],
  23024. device='cuda:0', dtype=torch.float64)
  23025. predictions are: tensor([[ 0.5832, -0.3993, 1.1275, -1.2637, -0.5853, -1.0007, -0.0508, -0.0505],
  23026. [ 0.3885, -0.4997, 1.5609, 0.1179, -0.3980, -0.2911, 0.2709, 0.3850],
  23027. [ 0.3156, -0.6031, 1.7021, -0.8399, -0.6414, -0.2453, 0.6654, 0.1443],
  23028. [ 0.7260, -0.3384, 1.6161, 0.0791, -0.5394, -0.3537, 0.7659, 0.1245],
  23029. [ 0.4992, -0.4325, 1.5218, 0.1549, -0.1555, -0.3437, 0.2934, 0.4448],
  23030. [ 0.6640, -0.2715, 1.1294, -0.9919, -0.0219, -1.3958, 0.1330, 0.4381],
  23031. [ 0.6496, -0.3338, 1.8106, -0.5189, -0.3958, -0.9181, 0.5184, 0.1384],
  23032. [ 0.6956, -0.3518, 1.4355, -1.4073, -0.2439, -1.3482, 0.7373, 0.1280]],
  23033. device='cuda:0', grad_fn=<AddmmBackward>)
  23034. landmarks are: tensor([[[ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  23035. 0.0141],
  23036. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  23037. 0.3007],
  23038. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  23039. 0.1554],
  23040. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  23041. 0.2516],
  23042. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  23043. 0.4470],
  23044. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  23045. 0.5624],
  23046. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  23047. 0.1608],
  23048. [ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  23049. 0.2012]]], device='cuda:0')
  23050. loss_train_step before backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  23051. loss_train_step after backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  23052. loss_train: 2.604389033280313
  23053. step: 90
  23054. running loss: 0.02893765592533681
  23055. Valid Steps: 10/10 Loss: nan 7.8799
  23056. --------------------------------------------------
  23057. Epoch: 6 Train Loss: 0.0289 Valid Loss: nan
  23058. --------------------------------------------------
  23059. size of train loader is: 90
  23060. torch.Size([8, 600, 800])
  23061. torch.Size([8, 8])
  23062. tensor([[0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  23063. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  23064. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  23065. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  23066. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  23067. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  23068. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  23069. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467]],
  23070. device='cuda:0', dtype=torch.float64)
  23071. predictions are: tensor([[ 0.6477, -0.3526, 0.9691, -0.9025, -0.4389, -1.1085, 0.2247, 0.2755],
  23072. [ 0.8920, -0.2164, 1.2343, -1.0870, -0.2121, -1.2321, 0.6169, 0.2335],
  23073. [ 0.5558, -0.4183, 1.1495, -1.0581, -0.4915, -0.8478, 0.4433, 0.2620],
  23074. [ 0.5084, -0.4509, 1.4207, -1.0557, -0.0454, -1.4207, 0.5016, 0.1969],
  23075. [-0.0192, -0.7355, 1.4270, -0.7559, -0.2804, -1.0867, 0.2119, 0.3873],
  23076. [ 0.6241, -0.4014, 1.9214, -0.2800, -0.5671, -0.6757, 0.3070, 0.0805],
  23077. [ 0.5517, -0.4502, 1.3219, -1.2073, -0.4492, -1.1858, 0.5526, 0.0171],
  23078. [ 0.4252, -0.5143, 1.6961, -0.5656, -0.6468, -0.3361, 0.3515, 0.2301]],
  23079. device='cuda:0', grad_fn=<AddmmBackward>)
  23080. landmarks are: tensor([[[ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  23081. 0.3546],
  23082. [ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  23083. 0.1852],
  23084. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  23085. 0.2699],
  23086. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  23087. 0.2083],
  23088. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  23089. 0.3777],
  23090. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  23091. 0.0620],
  23092. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  23093. 0.0772],
  23094. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  23095. 0.2391]]], device='cuda:0')
  23096. loss_train_step before backward: tensor(0.1317, device='cuda:0', grad_fn=<MseLossBackward>)
  23097. loss_train_step after backward: tensor(0.1317, device='cuda:0', grad_fn=<MseLossBackward>)
  23098. loss_train: 0.13170002400875092
  23099. step: 1
  23100. running loss: 0.13170002400875092
  23101. Train Steps: 1/90 Loss: 0.1317 torch.Size([8, 600, 800])
  23102. torch.Size([8, 8])
  23103. tensor([[0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  23104. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  23105. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  23106. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  23107. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  23108. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  23109. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  23110. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550]],
  23111. device='cuda:0', dtype=torch.float64)
  23112. predictions are: tensor([[ 0.6647, -0.3062, 1.0944, -1.2538, -0.3591, -1.2520, 0.4543, 0.4699],
  23113. [ 0.3959, -0.5123, 1.6735, -0.1118, -0.0870, -0.0970, 0.0966, 0.1922],
  23114. [ 0.3720, -0.4999, 1.1677, -1.1540, -0.4044, -1.2134, 0.3068, 0.2836],
  23115. [ 0.6326, -0.3810, 1.6411, -0.0633, -0.3244, -0.1243, 0.2366, 0.2300],
  23116. [ 0.6179, -0.3312, 1.6827, -0.9184, -0.2375, -1.5012, 0.2988, -0.0049],
  23117. [ 0.7444, -0.2400, 1.0723, -0.8516, -0.3273, -1.3134, 0.1802, 0.4339],
  23118. [ 0.7338, -0.3491, 1.6987, 0.1139, -0.6360, -0.2006, 0.7904, 0.1141],
  23119. [ 0.5614, -0.3962, 1.7932, -0.2720, -0.4493, 0.1143, 0.6197, 0.2201]],
  23120. device='cuda:0', grad_fn=<AddmmBackward>)
  23121. landmarks are: tensor([[[ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  23122. 0.6084],
  23123. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  23124. 0.3392],
  23125. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  23126. 0.2853],
  23127. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  23128. 0.3700],
  23129. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  23130. -0.0368],
  23131. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  23132. 0.5401],
  23133. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  23134. 0.1608],
  23135. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  23136. 0.2776]]], device='cuda:0')
  23137. loss_train_step before backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  23138. loss_train_step after backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  23139. loss_train: 0.1403241939842701
  23140. step: 2
  23141. running loss: 0.07016209699213505
  23142.  
  23143. Train Steps: 2/90 Loss: 0.0702 torch.Size([8, 600, 800])
  23144. torch.Size([8, 8])
  23145. tensor([[0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  23146. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235],
  23147. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578],
  23148. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  23149. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  23150. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  23151. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  23152. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377]],
  23153. device='cuda:0', dtype=torch.float64)
  23154. predictions are: tensor([[ 0.7319, -0.2171, 1.5618, -0.3020, -0.4572, -0.2303, 0.1329, 0.3098],
  23155. [ 0.8232, -0.2165, 1.7220, -0.2264, -0.2888, 0.0441, 0.4587, 0.1933],
  23156. [-1.7871, -1.9312, 1.1732, -1.2439, -0.4154, -1.3333, 0.0692, 0.2836],
  23157. [ 0.7511, -0.2776, 1.8293, -0.2960, -0.3076, -0.5175, 0.9069, 0.3537],
  23158. [ 0.9328, -0.1419, 1.4058, 0.0273, -0.4443, -0.1959, 0.7334, 0.2985],
  23159. [ 0.9208, -0.1094, 0.9170, -1.5732, -0.3551, -1.5826, 0.2315, 0.1841],
  23160. [ 0.7178, -0.2332, 1.5154, -0.1506, -0.5277, -0.4161, -0.0780, 0.2460],
  23161. [ 0.8859, -0.2005, 1.6186, 0.0542, -0.3882, -0.3113, 0.3717, 0.1910]],
  23162. device='cuda:0', grad_fn=<AddmmBackward>)
  23163. landmarks are: tensor([[[ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  23164. 0.2296],
  23165. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  23166. 0.1322],
  23167. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  23168. 0.2905],
  23169. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  23170. 0.4386],
  23171. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  23172. 0.1928],
  23173. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  23174. 0.2906],
  23175. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  23176. -0.1181],
  23177. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  23178. 0.1979]]], device='cuda:0')
  23179. loss_train_step before backward: tensor(0.0370, device='cuda:0', grad_fn=<MseLossBackward>)
  23180. loss_train_step after backward: tensor(0.0370, device='cuda:0', grad_fn=<MseLossBackward>)
  23181. loss_train: 0.1773393712937832
  23182. step: 3
  23183. running loss: 0.0591131237645944
  23184. Train Steps: 3/90 Loss: 0.0591 torch.Size([8, 600, 800])
  23185. torch.Size([8, 8])
  23186. tensor([[0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  23187. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  23188. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  23189. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  23190. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  23191. [0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  23192. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  23193. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167]],
  23194. device='cuda:0', dtype=torch.float64)
  23195. predictions are: tensor([[ 8.9299e-01, -1.9483e-01, 1.3833e+00, 1.2987e-01, -4.8383e-01,
  23196. -5.3583e-03, 7.4699e-01, 2.4503e-01],
  23197. [-1.8940e+00, -2.0092e+00, 1.3015e+00, -1.1059e+00, -3.3122e-01,
  23198. -1.2012e+00, 2.4633e-01, 2.7320e-01],
  23199. [ 6.9292e-01, -2.6543e-01, 1.1853e+00, -5.9782e-01, -6.0230e-01,
  23200. -8.2772e-01, 1.5278e-01, 4.5867e-01],
  23201. [ 6.5121e-01, -2.5269e-01, 1.3511e+00, -6.1461e-01, -7.2152e-02,
  23202. -1.2816e+00, 1.5690e-01, 5.1567e-01],
  23203. [ 7.7100e-01, -2.4929e-01, 1.3652e+00, -1.1704e+00, -3.3382e-01,
  23204. -1.2479e+00, 6.5034e-01, 1.7962e-01],
  23205. [ 8.6061e-01, -1.8263e-01, 1.6473e+00, -7.0001e-04, -5.0347e-01,
  23206. -9.7541e-02, 1.6001e-01, 6.7358e-02],
  23207. [ 5.2133e-01, -3.6087e-01, 1.4178e+00, -9.9686e-01, -1.1791e-01,
  23208. -1.4057e+00, 3.2734e-01, 2.0587e-01],
  23209. [ 8.5589e-01, -1.9249e-01, 1.6359e+00, -5.9213e-01, -6.1109e-01,
  23210. 4.0864e-02, 5.4792e-01, 2.4353e-01]], device='cuda:0',
  23211. grad_fn=<AddmmBackward>)
  23212. landmarks are: tensor([[[ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  23213. 0.1928],
  23214. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  23215. 0.3007],
  23216. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  23217. 0.4470],
  23218. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  23219. 0.5882],
  23220. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  23221. 0.1879],
  23222. [ 0.5326, -0.4390, 1.7557, 0.0851, -0.5192, -0.0919, 0.3180,
  23223. 0.0620],
  23224. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  23225. 0.2083],
  23226. [ 0.6010, -0.3896, 1.7326, -0.5692, -0.6289, 0.0082, 0.5028,
  23227. 0.1005]]], device='cuda:0')
  23228. loss_train_step before backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  23229. loss_train_step after backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  23230. loss_train: 0.19527801871299744
  23231. step: 4
  23232. running loss: 0.04881950467824936
  23233. Train Steps: 4/90 Loss: 0.0488 torch.Size([8, 600, 800])
  23234. torch.Size([8, 8])
  23235. tensor([[0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  23236. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  23237. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  23238. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  23239. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  23240. [0.6216, 0.4100, 0.7350, 0.2067, 0.4325, 0.2050, 0.5950, 0.5333],
  23241. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  23242. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667]],
  23243. device='cuda:0', dtype=torch.float64)
  23244. predictions are: tensor([[ 0.6983, -0.2865, 1.5583, 0.4364, 0.0205, -0.2002, 0.3845, 0.5493],
  23245. [ 0.6020, -0.3588, 1.7794, -0.0123, -0.0761, 0.4327, 0.5758, 0.3702],
  23246. [ 0.8159, -0.2481, 1.7206, -0.3957, -0.6126, -0.8451, 0.4303, 0.1379],
  23247. [ 0.7543, -0.2461, 1.3220, -0.4106, -0.6687, -0.5468, 0.0829, 0.3590],
  23248. [-0.8455, -1.2990, 1.2776, -1.2102, -0.3380, -1.4762, 0.2634, 0.1421],
  23249. [ 0.4908, -0.4188, 1.0813, -1.3411, -0.3358, -1.4621, 0.4294, 0.2803],
  23250. [ 0.8225, -0.2386, 1.1020, -1.1353, -0.6921, -0.7803, 0.3172, 0.0501],
  23251. [ 0.5905, -0.3740, 1.6765, -0.6473, -0.5600, -0.7175, 0.5019, 0.3938]],
  23252. device='cuda:0', grad_fn=<AddmmBackward>)
  23253. landmarks are: tensor([[[ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  23254. 0.4547],
  23255. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  23256. 0.2083],
  23257. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  23258. 0.1005],
  23259. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  23260. 0.2206],
  23261. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  23262. 0.0231],
  23263. [ 0.5853, -0.3920, 1.1090, -1.3313, -0.2882, -1.3390, 0.4624,
  23264. 0.1775],
  23265. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  23266. 0.0622],
  23267. [ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  23268. 0.3315]]], device='cuda:0')
  23269. loss_train_step before backward: tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward>)
  23270. loss_train_step after backward: tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward>)
  23271. loss_train: 0.25149907171726227
  23272. step: 5
  23273. running loss: 0.05029981434345245
  23274. Train Steps: 5/90 Loss: 0.0503 torch.Size([8, 600, 800])
  23275. torch.Size([8, 8])
  23276. tensor([[0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  23277. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  23278. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  23279. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  23280. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  23281. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  23282. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  23283. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456]],
  23284. device='cuda:0', dtype=torch.float64)
  23285. predictions are: tensor([[ 0.7097, -0.2963, 1.1037, -1.2898, -0.6142, -1.1763, 0.4470, 0.2839],
  23286. [ 0.6372, -0.2858, 0.9849, -0.8955, -0.1584, -1.5070, 0.1930, 0.5510],
  23287. [ 0.6837, -0.3201, 1.6716, 0.2550, -0.1896, 0.0621, 0.3190, 0.2978],
  23288. [ 0.2536, -0.5944, 1.3756, -1.0492, -0.5398, -0.9605, 0.6340, 0.2841],
  23289. [ 0.4375, -0.4863, 1.8205, -0.1297, -0.4469, 0.1487, 0.6756, 0.3328],
  23290. [ 0.0804, -0.6800, 1.4471, -0.7608, -0.4763, -1.2891, 0.1751, 0.0604],
  23291. [ 0.7134, -0.3114, 1.6887, -0.1343, -0.5369, -0.1299, 0.2081, 0.2759],
  23292. [ 0.6029, -0.3714, 1.6532, 0.1362, -0.3379, 0.1308, 0.3406, 0.2828]],
  23293. device='cuda:0', grad_fn=<AddmmBackward>)
  23294. landmarks are: tensor([[[ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  23295. 0.3007],
  23296. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  23297. 0.5702],
  23298. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  23299. 0.2364],
  23300. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  23301. 0.2160],
  23302. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  23303. 0.2776],
  23304. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  23305. 0.0111],
  23306. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  23307. 0.3469],
  23308. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  23309. 0.2341]]], device='cuda:0')
  23310. loss_train_step before backward: tensor(0.0141, device='cuda:0', grad_fn=<MseLossBackward>)
  23311. loss_train_step after backward: tensor(0.0141, device='cuda:0', grad_fn=<MseLossBackward>)
  23312. loss_train: 0.2655968349426985
  23313. step: 6
  23314. running loss: 0.04426613915711641
  23315.  
  23316. Train Steps: 6/90 Loss: 0.0443 torch.Size([8, 600, 800])
  23317. torch.Size([8, 8])
  23318. tensor([[0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  23319. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  23320. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  23321. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  23322. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  23323. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  23324. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  23325. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841]],
  23326. device='cuda:0', dtype=torch.float64)
  23327. predictions are: tensor([[ 0.9006, -0.2117, 1.6638, -0.3467, -0.6132, -0.4659, 0.5123, 0.1801],
  23328. [ 0.5317, -0.3793, 0.8797, -0.9900, -0.5496, -0.9261, 0.0243, 0.3312],
  23329. [ 0.6930, -0.3017, 0.7817, -1.0732, -0.4704, -1.2299, -0.0311, 0.2055],
  23330. [ 0.6957, -0.3161, 1.7998, -0.4552, -0.5499, -0.4094, 0.6199, 0.2619],
  23331. [ 0.6030, -0.3544, 1.2631, -0.3271, -0.5427, -0.2744, -0.1266, 0.2739],
  23332. [-1.6762, -1.8580, 1.8621, -0.7469, 0.1769, -1.1852, 0.8146, 0.5468],
  23333. [ 0.6555, -0.3252, 1.7625, -0.2648, -0.5922, -0.1266, 0.5597, 0.1009],
  23334. [ 0.7671, -0.2935, 1.6871, -0.2076, -0.3535, -0.5524, 0.7757, 0.3876]],
  23335. device='cuda:0', grad_fn=<AddmmBackward>)
  23336. landmarks are: tensor([[[ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  23337. 0.0697],
  23338. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  23339. 0.2476],
  23340. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  23341. 0.1890],
  23342. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  23343. 0.1544],
  23344. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  23345. 0.1552],
  23346. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  23347. 0.3478],
  23348. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  23349. -0.0400],
  23350. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  23351. 0.4119]]], device='cuda:0')
  23352. loss_train_step before backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  23353. loss_train_step after backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  23354. loss_train: 0.2878271918743849
  23355. step: 7
  23356. running loss: 0.04111817026776927
  23357. Train Steps: 7/90 Loss: 0.0411 torch.Size([8, 600, 800])
  23358. torch.Size([8, 8])
  23359. tensor([[0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  23360. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  23361. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  23362. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  23363. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  23364. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  23365. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  23366. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220]],
  23367. device='cuda:0', dtype=torch.float64)
  23368. predictions are: tensor([[ 0.4279, -0.4700, 1.1087, -0.9343, -0.3377, -1.1035, 0.2972, 0.4786],
  23369. [-0.1724, -0.8663, 1.5414, -0.3400, -0.5710, -0.8034, 0.1809, 0.4591],
  23370. [ 0.6113, -0.3749, 1.2179, -1.1382, -0.3679, -1.2327, 0.2952, 0.1828],
  23371. [ 0.8218, -0.2730, 1.8150, -0.3814, -0.7125, -0.3080, 0.3443, 0.1518],
  23372. [ 0.6928, -0.3667, 1.6759, 0.5193, -0.4929, 0.2824, 0.4658, 0.1233],
  23373. [ 0.4151, -0.4984, 0.9299, -1.0047, -0.5191, -1.0346, 0.3536, 0.3316],
  23374. [ 0.2671, -0.6461, 2.0895, -0.5594, -0.3277, -0.3334, 1.0386, 0.3234],
  23375. [ 0.2336, -0.6060, 1.0417, -1.1955, -0.3274, -1.4027, 0.1155, 0.1706]],
  23376. device='cuda:0', grad_fn=<AddmmBackward>)
  23377. landmarks are: tensor([[[ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  23378. 0.3808],
  23379. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  23380. 0.3928],
  23381. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  23382. 0.1449],
  23383. [ 0.5783, -0.4216, 1.6847, -0.5078, -0.6732, -0.5377, 0.4752,
  23384. 0.0839],
  23385. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  23386. -0.1385],
  23387. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  23388. 0.2391],
  23389. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  23390. 0.2676],
  23391. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  23392. 0.1253]]], device='cuda:0')
  23393. loss_train_step before backward: tensor(0.0310, device='cuda:0', grad_fn=<MseLossBackward>)
  23394. loss_train_step after backward: tensor(0.0310, device='cuda:0', grad_fn=<MseLossBackward>)
  23395. loss_train: 0.3187991585582495
  23396. step: 8
  23397. running loss: 0.039849894819781184
  23398. Train Steps: 8/90 Loss: 0.0398 torch.Size([8, 600, 800])
  23399. torch.Size([8, 8])
  23400. tensor([[0.6236, 0.3967, 0.8675, 0.5400, 0.3862, 0.4517, 0.5825, 0.5200],
  23401. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  23402. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  23403. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  23404. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  23405. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  23406. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  23407. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413]],
  23408. device='cuda:0', dtype=torch.float64)
  23409. predictions are: tensor([[ 0.6302, -0.3617, 1.5214, 0.2184, -0.5714, -0.2713, 0.1169, 0.2587],
  23410. [ 0.6184, -0.3406, 1.6832, -0.3059, -0.7060, -0.2061, 0.3594, 0.0877],
  23411. [ 0.6739, -0.3559, 1.5060, 0.3060, -0.6391, -0.1109, 0.3257, 0.1549],
  23412. [ 0.6845, -0.3340, 1.4835, 0.2149, -0.5401, -0.0175, 0.7316, 0.3698],
  23413. [ 0.7103, -0.3030, 1.6602, -0.1140, -0.5570, 0.0523, 0.2161, 0.2177],
  23414. [ 0.6586, -0.3380, 1.3056, -1.1049, -0.5090, -0.9922, 0.3005, 0.1256],
  23415. [-1.3580, -1.6826, 1.5312, -1.0974, 0.1189, -1.1105, 0.7331, 0.5404],
  23416. [ 0.3991, -0.5250, 1.5950, -1.2209, 0.0730, -1.0968, 0.8225, 0.2854]],
  23417. device='cuda:0', grad_fn=<AddmmBackward>)
  23418. landmarks are: tensor([[[ 0.5944, -0.4538, 1.7210, 0.2083, -0.5018, -0.1997, 0.4046,
  23419. 0.1159],
  23420. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  23421. -0.0400],
  23422. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  23423. 0.0261],
  23424. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  23425. 0.3745],
  23426. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  23427. 0.2237],
  23428. [ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  23429. 0.1214],
  23430. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  23431. 0.5188],
  23432. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  23433. 0.2142]]], device='cuda:0')
  23434. loss_train_step before backward: tensor(0.0426, device='cuda:0', grad_fn=<MseLossBackward>)
  23435. loss_train_step after backward: tensor(0.0426, device='cuda:0', grad_fn=<MseLossBackward>)
  23436. loss_train: 0.3614186178892851
  23437. step: 9
  23438. running loss: 0.04015762420992056
  23439. Train Steps: 9/90 Loss: 0.0402 torch.Size([8, 600, 800])
  23440. torch.Size([8, 8])
  23441. tensor([[0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  23442. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  23443. [0.6200, 0.4070, 0.8938, 0.4183, 0.3538, 0.4567, 0.6175, 0.5400],
  23444. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  23445. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  23446. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  23447. [0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  23448. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280]],
  23449. device='cuda:0', dtype=torch.float64)
  23450. predictions are: tensor([[ 0.6971, -0.3688, 1.7350, -0.1732, -0.4029, 0.2110, 0.7087, 0.2211],
  23451. [ 0.4011, -0.5162, 1.1709, -1.1587, -0.3880, -1.3280, 0.4589, 0.3671],
  23452. [ 0.4933, -0.4978, 1.7170, -0.3445, -0.6054, -0.3812, 0.6053, 0.2377],
  23453. [ 0.3137, -0.5505, 1.5822, -0.6377, -0.6560, -1.0371, 0.2575, 0.1115],
  23454. [ 0.5390, -0.4642, 1.6548, 0.1634, -0.3035, -0.1852, 0.5739, 0.1073],
  23455. [ 0.2994, -0.5938, 1.6538, -0.3325, -0.4045, 0.1992, 0.3695, 0.1887],
  23456. [ 0.5082, -0.4512, 1.6077, -0.1040, -0.5408, -0.2585, 0.5207, 0.4175],
  23457. [ 0.4719, -0.4648, 1.5714, 0.0954, -0.1144, -0.0728, 0.1835, 0.2303]],
  23458. device='cuda:0', grad_fn=<AddmmBackward>)
  23459. landmarks are: tensor([[[ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  23460. 0.1082],
  23461. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  23462. 0.3315],
  23463. [ 0.5778, -0.4061, 1.8423, -0.3537, -0.6520, -0.1766, 0.5663,
  23464. 0.2083],
  23465. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  23466. -0.0340],
  23467. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  23468. 0.0159],
  23469. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  23470. 0.0772],
  23471. [ 0.5763, -0.3963, 1.7788, -0.0765, -0.6520, -0.0842, 0.4624,
  23472. 0.2776],
  23473. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  23474. 0.1530]]], device='cuda:0')
  23475. loss_train_step before backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  23476. loss_train_step after backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  23477. loss_train: 0.3753113318234682
  23478. step: 10
  23479. running loss: 0.03753113318234682
  23480.  
  23481. Train Steps: 10/90 Loss: 0.0375 torch.Size([8, 600, 800])
  23482. torch.Size([8, 8])
  23483. tensor([[0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  23484. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  23485. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  23486. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496],
  23487. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  23488. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  23489. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  23490. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317]],
  23491. device='cuda:0', dtype=torch.float64)
  23492. predictions are: tensor([[ 0.1967, -0.6591, 1.7363, -0.0536, -0.5547, -0.1339, 0.6452, 0.2842],
  23493. [ 0.5217, -0.4646, 1.6759, -0.0579, -0.5454, -0.3497, 0.2499, 0.1922],
  23494. [ 0.2723, -0.6024, 1.3251, -1.0565, -0.2461, -1.3451, 0.3772, 0.1343],
  23495. [ 0.2139, -0.6353, 1.6743, -0.9571, -0.2936, -0.9478, 0.5853, 0.1640],
  23496. [ 0.7073, -0.3514, 1.2029, -1.1984, -0.5418, -0.8277, 0.5706, 0.1203],
  23497. [ 0.6006, -0.4165, 1.5692, -0.5432, -0.5794, -0.7226, 0.4796, 0.1666],
  23498. [ 0.5078, -0.4796, 1.7146, 0.1441, -0.4945, -0.1384, 0.4881, 0.3228],
  23499. [ 0.2629, -0.6667, 1.6207, 0.2619, -0.2709, 0.1349, 0.5074, 0.1552]],
  23500. device='cuda:0', grad_fn=<AddmmBackward>)
  23501. landmarks are: tensor([[[ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  23502. 0.3084],
  23503. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  23504. 0.3854],
  23505. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  23506. 0.0928],
  23507. [ 0.5790, -0.4031, 1.6915, -0.9564, -0.4152, -1.1063, 0.4425,
  23508. 0.2528],
  23509. [ 0.5730, -0.4562, 1.2195, -1.2440, -0.5497, -0.7711, 0.5704,
  23510. 0.1779],
  23511. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  23512. 0.1621],
  23513. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  23514. 0.3161],
  23515. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  23516. 0.1698]]], device='cuda:0')
  23517. loss_train_step before backward: tensor(0.0162, device='cuda:0', grad_fn=<MseLossBackward>)
  23518. loss_train_step after backward: tensor(0.0162, device='cuda:0', grad_fn=<MseLossBackward>)
  23519. loss_train: 0.3914999272674322
  23520. step: 11
  23521. running loss: 0.035590902478857475
  23522. Train Steps: 11/90 Loss: 0.0356 torch.Size([8, 600, 800])
  23523. torch.Size([8, 8])
  23524. tensor([[0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  23525. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  23526. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  23527. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  23528. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  23529. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  23530. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  23531. [0.6136, 0.4029, 0.8263, 0.3350, 0.3625, 0.3067, 0.5675, 0.5167]],
  23532. device='cuda:0', dtype=torch.float64)
  23533. predictions are: tensor([[ 0.9551, -0.1943, 1.7838, 0.1884, -0.5463, -0.5159, 0.7997, 0.0161],
  23534. [ 0.8863, -0.2218, 1.0800, -1.0480, -0.5751, -0.7298, 0.4776, 0.0688],
  23535. [-2.0307, -2.0780, 1.1745, -1.1032, -0.3354, -1.3458, 0.2500, 0.2283],
  23536. [ 0.9031, -0.1703, 1.7089, -0.1087, -0.1458, 0.2899, 0.7898, 0.2564],
  23537. [ 0.8976, -0.1821, 1.7356, -0.1796, -0.4199, -0.2579, 0.3009, 0.0515],
  23538. [ 0.9155, -0.2161, 1.6589, 0.0400, -0.2482, -0.0904, 0.4978, 0.2829],
  23539. [-1.8523, -1.9757, 1.3322, -0.7963, -0.5985, -0.8162, 0.2899, 0.2414],
  23540. [ 0.8009, -0.2398, 1.5121, -0.6899, -0.5752, -0.8632, 0.4632, 0.1816]],
  23541. device='cuda:0', grad_fn=<AddmmBackward>)
  23542. landmarks are: tensor([[[ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  23543. -0.0049],
  23544. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  23545. 0.0622],
  23546. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  23547. 0.0231],
  23548. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  23549. 0.1082],
  23550. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  23551. -0.0220],
  23552. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  23553. 0.3700],
  23554. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  23555. 0.1133],
  23556. [ 0.5483, -0.4249, 1.5305, -0.7386, -0.6115, -0.8694, 0.3353,
  23557. 0.1005]]], device='cuda:0')
  23558. loss_train_step before backward: tensor(0.0300, device='cuda:0', grad_fn=<MseLossBackward>)
  23559. loss_train_step after backward: tensor(0.0300, device='cuda:0', grad_fn=<MseLossBackward>)
  23560. loss_train: 0.42152343317866325
  23561. step: 12
  23562. running loss: 0.03512695276488861
  23563. Train Steps: 12/90 Loss: 0.0351 torch.Size([8, 600, 800])
  23564. torch.Size([8, 8])
  23565. tensor([[0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  23566. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  23567. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  23568. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  23569. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  23570. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  23571. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  23572. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320]],
  23573. device='cuda:0', dtype=torch.float64)
  23574. predictions are: tensor([[-0.0789, -0.8634, 1.9075, -0.1872, -0.4406, -0.8748, 0.5152, 0.2647],
  23575. [ 0.1872, -0.6352, 1.2463, -0.5061, 0.0230, -1.0992, 0.3518, 0.4947],
  23576. [ 0.6524, -0.4729, 1.6001, -1.0348, -0.2872, -1.0288, 0.8581, -0.0065],
  23577. [-0.0280, -0.7967, 1.5074, -0.6335, -0.5794, -0.7054, 0.1318, 0.1660],
  23578. [-0.4311, -1.0920, 1.1659, -1.0859, -0.4291, -1.2241, 0.2571, -0.0169],
  23579. [ 0.3784, -0.5783, 1.1265, -1.1726, -0.5293, -0.8971, 0.4713, 0.1641],
  23580. [ 0.4242, -0.5747, 1.4232, -0.9487, -0.6321, -0.5319, 0.5436, 0.0818],
  23581. [ 0.7843, -0.3753, 1.9808, -0.0349, -0.5629, -0.0903, 0.9297, -0.0148]],
  23582. device='cuda:0', grad_fn=<AddmmBackward>)
  23583. landmarks are: tensor([[[ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  23584. 0.1929],
  23585. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  23586. 0.5624],
  23587. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  23588. 0.1193],
  23589. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  23590. 0.2776],
  23591. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  23592. -0.0580],
  23593. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  23594. 0.2853],
  23595. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  23596. 0.2545],
  23597. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  23598. 0.1715]]], device='cuda:0')
  23599. loss_train_step before backward: tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward>)
  23600. loss_train_step after backward: tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward>)
  23601. loss_train: 0.4853547476232052
  23602. step: 13
  23603. running loss: 0.0373349805864004
  23604. Train Steps: 13/90 Loss: 0.0373 torch.Size([8, 600, 800])
  23605. torch.Size([8, 8])
  23606. tensor([[0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  23607. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  23608. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  23609. [0.6261, 0.3987, 0.8688, 0.4917, 0.4300, 0.5333, 0.7010, 0.5309],
  23610. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  23611. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  23612. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  23613. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586]],
  23614. device='cuda:0', dtype=torch.float64)
  23615. predictions are: tensor([[ 0.3884, -0.5688, 1.7313, -0.1300, -0.3147, -0.0134, 0.2209, 0.1419],
  23616. [ 0.3916, -0.5727, 1.6822, -0.3438, -0.6272, -0.4326, 0.3543, 0.1778],
  23617. [ 0.5572, -0.4856, 1.4594, 0.1052, -0.5221, -0.1518, 0.9008, 0.2143],
  23618. [ 0.1300, -0.7581, 1.7953, -0.2225, -0.3607, 0.2561, 0.8635, 0.0762],
  23619. [ 0.4244, -0.4891, 1.6533, -0.0386, -0.3964, -0.9195, 0.3851, 0.3819],
  23620. [ 0.3393, -0.5632, 1.5823, -0.5397, -0.6619, -0.7676, 0.0628, 0.0785],
  23621. [ 0.5327, -0.5028, 1.9065, -0.4265, -0.6527, -0.1407, 0.5415, -0.1797],
  23622. [ 0.2941, -0.6158, 1.6339, -1.2622, 0.2046, -1.5005, 0.8122, 0.0909]],
  23623. device='cuda:0', grad_fn=<AddmmBackward>)
  23624. landmarks are: tensor([[[ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  23625. 0.3700],
  23626. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  23627. 0.2853],
  23628. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  23629. 0.3745],
  23630. [ 0.6059, -0.4442, 1.7268, -0.0149, -0.2998, 0.1775, 0.9521,
  23631. 0.1661],
  23632. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  23633. 0.5762],
  23634. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  23635. 0.2837],
  23636. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  23637. -0.0670],
  23638. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  23639. 0.2944]]], device='cuda:0')
  23640. loss_train_step before backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  23641. loss_train_step after backward: tensor(0.0220, device='cuda:0', grad_fn=<MseLossBackward>)
  23642. loss_train: 0.507318003103137
  23643. step: 14
  23644. running loss: 0.036237000221652646
  23645.  
  23646. Train Steps: 14/90 Loss: 0.0362 torch.Size([8, 600, 800])
  23647. torch.Size([8, 8])
  23648. tensor([[0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  23649. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  23650. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  23651. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  23652. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  23653. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  23654. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  23655. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333]],
  23656. device='cuda:0', dtype=torch.float64)
  23657. predictions are: tensor([[ 0.5010, -0.5033, 1.5258, -1.1736, -0.0400, -1.5058, 0.5740, 0.0958],
  23658. [-0.6502, -1.2076, 1.3271, -1.1346, -0.1043, -1.5780, 0.2231, 0.0820],
  23659. [ 0.1329, -0.7390, 1.6516, 0.0745, -0.3668, 0.2067, 0.9566, 0.2391],
  23660. [ 0.5369, -0.4364, 1.6081, -0.6326, -0.6196, -0.3833, 0.2194, 0.1052],
  23661. [ 0.6469, -0.4278, 1.8764, -0.1909, -0.5821, -0.4823, 0.7569, 0.0944],
  23662. [ 0.5482, -0.4222, 1.8058, -0.0620, -0.5755, -0.1781, 0.4873, 0.2051],
  23663. [ 0.6252, -0.3851, 1.7494, 0.2343, -0.5574, -0.2445, 0.6326, 0.0882],
  23664. [ 0.5591, -0.4175, 1.8093, -0.2406, -0.5084, -0.0182, 0.4032, 0.1271]],
  23665. device='cuda:0', grad_fn=<AddmmBackward>)
  23666. landmarks are: tensor([[[ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  23667. 0.0851],
  23668. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  23669. -0.0168],
  23670. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  23671. 0.3425],
  23672. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  23673. 0.0802],
  23674. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  23675. 0.1768],
  23676. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  23677. 0.3084],
  23678. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  23679. 0.1608],
  23680. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  23681. 0.1775]]], device='cuda:0')
  23682. loss_train_step before backward: tensor(0.0457, device='cuda:0', grad_fn=<MseLossBackward>)
  23683. loss_train_step after backward: tensor(0.0457, device='cuda:0', grad_fn=<MseLossBackward>)
  23684. loss_train: 0.5530113819986582
  23685. step: 15
  23686. running loss: 0.03686742546657721
  23687. Train Steps: 15/90 Loss: 0.0369 torch.Size([8, 600, 800])
  23688. torch.Size([8, 8])
  23689. tensor([[0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  23690. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  23691. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378],
  23692. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  23693. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  23694. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  23695. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  23696. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901]],
  23697. device='cuda:0', dtype=torch.float64)
  23698. predictions are: tensor([[ 5.0703e-01, -4.5975e-01, 1.6656e+00, 3.0593e-01, -4.7732e-01,
  23699. -6.5627e-01, 3.7422e-01, 3.8503e-01],
  23700. [ 2.5524e-01, -6.5057e-01, 1.5289e+00, -9.4455e-01, -6.3493e-01,
  23701. -4.8177e-01, 5.8337e-01, 1.9329e-01],
  23702. [ 2.5623e-01, -6.6214e-01, 1.9205e+00, -1.1357e-01, -4.2664e-01,
  23703. 1.1833e-01, 1.0859e+00, 1.5132e-01],
  23704. [ 5.9606e-01, -4.3202e-01, 9.1692e-01, -1.0829e+00, -4.4209e-01,
  23705. -1.2715e+00, 4.4589e-02, 1.2495e-01],
  23706. [ 2.9305e-01, -6.0549e-01, 1.8639e+00, -2.6410e-02, -2.2537e-01,
  23707. 6.4895e-02, 2.5880e-01, -2.0055e-02],
  23708. [ 2.7239e-01, -6.2210e-01, 1.7858e+00, 4.2429e-02, -1.7373e-01,
  23709. -4.4527e-02, 4.1536e-01, 8.2200e-02],
  23710. [ 4.3774e-01, -5.2086e-01, 1.9156e+00, -2.9562e-01, -3.8331e-01,
  23711. -9.2735e-01, 6.8998e-01, 1.6443e-01],
  23712. [ 6.5677e-01, -3.7615e-01, 1.9344e+00, -6.7801e-01, -5.9268e-01,
  23713. -6.3210e-01, 6.6573e-01, -4.8861e-04]], device='cuda:0',
  23714. grad_fn=<AddmmBackward>)
  23715. landmarks are: tensor([[[ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  23716. 0.4778],
  23717. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  23718. 0.2776],
  23719. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  23720. 0.1982],
  23721. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  23722. 0.1890],
  23723. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  23724. 0.0082],
  23725. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  23726. 0.0851],
  23727. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  23728. 0.1608],
  23729. [ 0.6077, -0.3965, 1.8480, -0.6539, -0.6231, -0.4537, 0.6216,
  23730. -0.0220]]], device='cuda:0')
  23731. loss_train_step before backward: tensor(0.0160, device='cuda:0', grad_fn=<MseLossBackward>)
  23732. loss_train_step after backward: tensor(0.0160, device='cuda:0', grad_fn=<MseLossBackward>)
  23733. loss_train: 0.5689659360796213
  23734. step: 16
  23735. running loss: 0.03556037100497633
  23736. Train Steps: 16/90 Loss: 0.0356 torch.Size([8, 600, 800])
  23737. torch.Size([8, 8])
  23738. tensor([[0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  23739. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  23740. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  23741. [0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  23742. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  23743. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  23744. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  23745. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544]],
  23746. device='cuda:0', dtype=torch.float64)
  23747. predictions are: tensor([[-0.0935, -0.8722, 1.3125, -1.3468, -0.2899, -1.2047, 0.7003, 0.2224],
  23748. [ 0.2963, -0.6498, 2.0224, -0.2893, -0.5738, -0.3291, 0.8886, 0.0073],
  23749. [ 0.6682, -0.4188, 1.9193, 0.1636, -0.6020, -0.1303, 0.5732, 0.0660],
  23750. [ 0.6721, -0.3713, 1.9908, -0.0065, -0.5589, 0.0488, 0.3812, -0.0499],
  23751. [ 0.1340, -0.7117, 1.1896, -1.2837, -0.2576, -1.3935, 0.3966, 0.1664],
  23752. [ 0.5357, -0.4752, 1.9282, 0.1077, -0.5723, -0.4885, 0.5420, 0.1317],
  23753. [ 0.7458, -0.3102, 1.8443, 0.3719, -0.2171, -0.0943, 0.5615, 0.3431],
  23754. [ 0.4249, -0.5251, 1.0434, -1.1636, -0.3758, -1.2958, 0.1229, 0.1956]],
  23755. device='cuda:0', grad_fn=<AddmmBackward>)
  23756. landmarks are: tensor([[[ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  23757. 0.2083],
  23758. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  23759. 0.1715],
  23760. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  23761. 0.2075],
  23762. [ 0.5326, -0.4390, 1.7557, 0.0851, -0.5192, -0.0919, 0.3180,
  23763. 0.0620],
  23764. [ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  23765. 0.3161],
  23766. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  23767. 0.1698],
  23768. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  23769. 0.4470],
  23770. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  23771. 0.2747]]], device='cuda:0')
  23772. loss_train_step before backward: tensor(0.0314, device='cuda:0', grad_fn=<MseLossBackward>)
  23773. loss_train_step after backward: tensor(0.0314, device='cuda:0', grad_fn=<MseLossBackward>)
  23774. loss_train: 0.6003932412713766
  23775. step: 17
  23776. running loss: 0.035317249486551565
  23777. Train Steps: 17/90 Loss: 0.0353 torch.Size([8, 600, 800])
  23778. torch.Size([8, 8])
  23779. tensor([[0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  23780. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  23781. [0.6197, 0.3986, 0.8800, 0.4617, 0.4188, 0.4783, 0.5687, 0.5550],
  23782. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  23783. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  23784. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077],
  23785. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  23786. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875]],
  23787. device='cuda:0', dtype=torch.float64)
  23788. predictions are: tensor([[ 0.3610, -0.5678, 1.9080, 0.1425, -0.2585, 0.2075, 0.4586, 0.0328],
  23789. [ 0.5887, -0.4187, 1.6380, -0.3694, -0.3123, -1.1082, 0.3524, 0.3063],
  23790. [ 0.3034, -0.5894, 1.8729, -0.0846, -0.3672, 0.0066, 0.5765, 0.1857],
  23791. [ 0.2782, -0.6576, 1.9356, -0.0492, -0.4911, -0.0651, 1.0794, 0.1156],
  23792. [ 0.3067, -0.6011, 1.0080, -1.2048, -0.4256, -1.1716, 0.5215, 0.3087],
  23793. [ 0.1235, -0.7251, 1.5411, -0.6893, -0.6735, -0.5725, 0.3647, 0.0733],
  23794. [ 0.6070, -0.4165, 1.3449, -0.9162, -0.1758, -1.4343, 0.4269, 0.1630],
  23795. [ 0.7717, -0.3102, 1.7616, -0.6037, -0.6002, -0.8472, 0.3638, 0.0585]],
  23796. device='cuda:0', grad_fn=<AddmmBackward>)
  23797. landmarks are: tensor([[[ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  23798. 0.0082],
  23799. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  23800. 0.2261],
  23801. [ 0.5763, -0.4450, 1.7788, -0.1535, -0.3517, -0.0765, 0.3411,
  23802. 0.2776],
  23803. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  23804. 0.1608],
  23805. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  23806. 0.3392],
  23807. [ 0.5270, -0.4336, 1.3342, -0.6770, -0.6520, -0.5384, 0.2370,
  23808. 0.0592],
  23809. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  23810. 0.1855],
  23811. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  23812. -0.0340]]], device='cuda:0')
  23813. loss_train_step before backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  23814. loss_train_step after backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  23815. loss_train: 0.618410861119628
  23816. step: 18
  23817. running loss: 0.03435615895109044
  23818.  
  23819. Train Steps: 18/90 Loss: 0.0344 torch.Size([8, 600, 800])
  23820. torch.Size([8, 8])
  23821. tensor([[0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  23822. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  23823. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  23824. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  23825. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  23826. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  23827. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  23828. [0.6092, 0.4001, 0.8638, 0.4867, 0.4288, 0.5367, 0.5484, 0.5064]],
  23829. device='cuda:0', dtype=torch.float64)
  23830. predictions are: tensor([[ 0.1828, -0.6863, 1.7455, -1.3498, 0.0840, -1.6401, 0.8802, 0.0811],
  23831. [ 0.5804, -0.3763, 1.8545, -0.1124, -0.2649, 0.2308, 0.4292, 0.1976],
  23832. [ 0.4637, -0.4524, 1.1475, -0.7110, -0.3402, -1.3154, 0.0892, 0.4226],
  23833. [ 0.5057, -0.4969, 1.9738, -0.3320, -0.3745, -0.6609, 0.8750, 0.2639],
  23834. [ 0.7743, -0.3068, 1.7448, 0.1914, -0.5778, 0.1589, 0.8097, 0.1874],
  23835. [ 0.4554, -0.5175, 1.7897, 0.2008, -0.5382, -0.1848, 0.2942, 0.0439],
  23836. [ 0.6566, -0.3793, 1.5341, 0.1815, -0.5751, -0.1516, 0.8652, 0.2552],
  23837. [ 0.3685, -0.5335, 1.7676, -0.0991, -0.3964, 0.0852, 0.0582, 0.0316]],
  23838. device='cuda:0', grad_fn=<AddmmBackward>)
  23839. landmarks are: tensor([[[ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  23840. 0.2142],
  23841. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  23842. 0.2083],
  23843. [ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  23844. 0.5401],
  23845. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  23846. 0.4600],
  23847. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  23848. 0.3905],
  23849. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  23850. 0.1979],
  23851. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  23852. 0.3478],
  23853. [ 0.5278, -0.4377, 1.7037, -0.0380, -0.3055, 0.1929, 0.2473,
  23854. 0.0532]]], device='cuda:0')
  23855. loss_train_step before backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  23856. loss_train_step after backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  23857. loss_train: 0.6358400098979473
  23858. step: 19
  23859. running loss: 0.033465263678839334
  23860. Train Steps: 19/90 Loss: 0.0335 torch.Size([8, 600, 800])
  23861. torch.Size([8, 8])
  23862. tensor([[0.6100, 0.4071, 0.7601, 0.3444, 0.3400, 0.4117, 0.5625, 0.5617],
  23863. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  23864. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  23865. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  23866. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  23867. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  23868. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  23869. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378]],
  23870. device='cuda:0', dtype=torch.float64)
  23871. predictions are: tensor([[ 0.7286, -0.3021, 1.2757, -0.6294, -0.6770, -0.5504, 0.3182, 0.2894],
  23872. [ 0.6831, -0.3413, 1.7177, 0.1549, -0.2115, -0.1291, 0.4543, 0.2399],
  23873. [ 1.0485, -0.1073, 1.8392, -0.5684, -0.5598, -0.7251, 0.6200, 0.0672],
  23874. [ 0.6044, -0.4001, 1.7955, 0.1472, -0.2306, -0.2585, 0.1774, 0.2846],
  23875. [ 0.6464, -0.3412, 1.8233, -0.2097, -0.3579, 0.0401, 0.5192, 0.2039],
  23876. [ 0.8227, -0.2677, 1.8455, 0.1839, -0.4548, 0.0273, 0.8990, 0.1851],
  23877. [-1.6205, -1.8727, 1.1033, -1.1597, -0.3460, -1.5958, 0.1061, 0.0953],
  23878. [ 0.7472, -0.3128, 1.8387, 0.1208, -0.4073, 0.0710, 1.0212, 0.2521]],
  23879. device='cuda:0', grad_fn=<AddmmBackward>)
  23880. landmarks are: tensor([[[ 5.3178e-01, -4.0564e-01, 1.2249e+00, -6.9494e-01, -7.1547e-01,
  23881. -3.8445e-01, 3.1224e-01, 3.0839e-01],
  23882. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  23883. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  23884. [ 6.0774e-01, -3.9646e-01, 1.8480e+00, -6.5389e-01, -6.2309e-01,
  23885. -4.5373e-01, 6.2155e-01, -2.1963e-02],
  23886. [ 5.5254e-01, -4.4627e-01, 1.7326e+00, 3.1255e-02, -2.5358e-01,
  23887. -6.8822e-02, 1.9677e-01, 3.6998e-01],
  23888. [ 5.4169e-01, -4.3549e-01, 1.8018e+00, -3.3826e-01, -3.9792e-01,
  23889. 2.6220e-01, 5.1432e-01, 2.6220e-01],
  23890. [ 6.4212e-01, -3.6953e-01, 1.7788e+00, 2.3557e-02, -4.8453e-01,
  23891. 1.5443e-01, 1.1971e+00, 2.1955e-01],
  23892. [-2.2859e+00, -2.2859e+00, 1.0361e+00, -1.2021e+00, -4.2102e-01,
  23893. -1.3390e+00, 8.7067e-02, 3.2379e-01],
  23894. [ 6.4212e-01, -3.8638e-01, 1.7961e+00, 5.4350e-02, -4.3834e-01,
  23895. 2.2371e-01, 1.2007e+00, 1.9818e-01]]], device='cuda:0')
  23896. loss_train_step before backward: tensor(0.0273, device='cuda:0', grad_fn=<MseLossBackward>)
  23897. loss_train_step after backward: tensor(0.0273, device='cuda:0', grad_fn=<MseLossBackward>)
  23898. loss_train: 0.6631092224270105
  23899. step: 20
  23900. running loss: 0.033155461121350524
  23901. Train Steps: 20/90 Loss: 0.0332 torch.Size([8, 600, 800])
  23902. torch.Size([8, 8])
  23903. tensor([[0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567],
  23904. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  23905. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  23906. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  23907. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  23908. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  23909. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  23910. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483]],
  23911. device='cuda:0', dtype=torch.float64)
  23912. predictions are: tensor([[ 0.5992, -0.3980, 1.7403, 0.2467, -0.4589, -0.0764, 0.5850, 0.3452],
  23913. [ 0.3023, -0.6008, 1.8628, -0.1265, -0.4278, -0.0498, 1.0072, 0.2887],
  23914. [ 0.8948, -0.2468, 1.3591, -1.4355, -0.3035, -1.3032, 0.6622, 0.1346],
  23915. [ 0.8589, -0.2448, 1.5960, 0.3670, -0.4593, -0.1402, 0.7276, 0.1638],
  23916. [ 0.5828, -0.4151, 1.7459, 0.1039, -0.2371, 0.0888, 0.3880, 0.1641],
  23917. [ 0.5667, -0.4005, 1.7422, 0.1350, -0.4795, -0.4804, 0.1186, 0.3531],
  23918. [ 0.5436, -0.4430, 1.7085, -0.0783, -0.4442, -0.0420, 0.4933, 0.1895],
  23919. [ 0.4270, -0.5031, 1.7202, -0.4630, -0.4792, -0.2533, 0.3859, 0.2487]],
  23920. device='cuda:0', grad_fn=<AddmmBackward>)
  23921. landmarks are: tensor([[[ 5.7696e-01, -3.9176e-01, 1.7961e+00, 1.5443e-01, -5.4804e-01,
  23922. 1.4673e-01, 4.4503e-01, 2.8530e-01],
  23923. [ 6.4212e-01, -3.9120e-01, 1.9115e+00, -8.4219e-02, -4.7298e-01,
  23924. 1.5443e-01, 1.1824e+00, 2.0352e-01],
  23925. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  23926. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  23927. [ 6.5695e-01, -3.9601e-01, 1.5651e+00, 4.1617e-01, -4.6143e-01,
  23928. 7.7444e-02, 7.4375e-01, 1.4474e-01],
  23929. [ 5.4496e-01, -4.7064e-01, 1.7643e+00, 7.2204e-02, -3.7076e-01,
  23930. 3.2001e-01, 4.8543e-01, 6.1219e-02],
  23931. [ 5.4515e-01, -4.0670e-01, 1.7557e+00, 5.4350e-02, -4.9607e-01,
  23932. -3.3056e-01, 1.3228e-01, 4.3063e-01],
  23933. [ 5.4660e-01, -4.7064e-01, 1.7198e+00, -9.0292e-02, -5.7125e-01,
  23934. 1.2613e-01, 4.7328e-01, 6.8827e-02],
  23935. [ 5.5456e-01, -4.6205e-01, 1.7788e+00, -4.2294e-01, -5.1917e-01,
  23936. -2.2633e-02, 4.2771e-01, 2.4681e-01]]], device='cuda:0')
  23937. loss_train_step before backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  23938. loss_train_step after backward: tensor(0.0139, device='cuda:0', grad_fn=<MseLossBackward>)
  23939. loss_train: 0.6769989067688584
  23940. step: 21
  23941. running loss: 0.03223804317946945
  23942. Train Steps: 21/90 Loss: 0.0322 torch.Size([8, 600, 800])
  23943. torch.Size([8, 8])
  23944. tensor([[0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  23945. [0.6152, 0.4131, 0.6863, 0.2567, 0.3625, 0.3300, 0.5765, 0.5305],
  23946. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  23947. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  23948. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  23949. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  23950. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  23951. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400]],
  23952. device='cuda:0', dtype=torch.float64)
  23953. predictions are: tensor([[ 0.6423, -0.4058, 1.3525, -1.2299, -0.0814, -1.5329, 0.4613, 0.1552],
  23954. [ 0.3405, -0.5563, 1.0578, -0.8936, -0.5718, -0.7640, 0.4300, 0.3576],
  23955. [ 0.5428, -0.4354, 1.0600, -0.8942, -0.3129, -1.1778, 0.3834, 0.4182],
  23956. [ 0.7124, -0.3692, 1.7740, 0.6887, -0.4695, -0.0495, 0.6066, 0.1195],
  23957. [ 0.4637, -0.4929, 1.9336, 0.4006, -0.5610, -0.1530, 0.5893, 0.3991],
  23958. [ 0.6304, -0.3523, 1.9097, -0.1257, -0.4233, 0.4380, 0.6059, 0.1707],
  23959. [ 0.7436, -0.3395, 1.3049, -1.1675, -0.4783, -1.1101, 0.5469, 0.1452],
  23960. [ 0.1071, -0.7279, 1.7459, -0.5140, -0.5872, -0.1503, 0.7996, 0.2985]],
  23961. device='cuda:0', grad_fn=<AddmmBackward>)
  23962. landmarks are: tensor([[[ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  23963. -0.0248],
  23964. [ 0.5557, -0.3779, 0.8838, -1.1004, -0.6115, -0.7617, 0.3769,
  23965. 0.1644],
  23966. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  23967. 0.2622],
  23968. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  23969. -0.1492],
  23970. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  23971. 0.3161],
  23972. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  23973. 0.0772],
  23974. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  23975. 0.0772],
  23976. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  23977. 0.2083]]], device='cuda:0')
  23978. loss_train_step before backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  23979. loss_train_step after backward: tensor(0.0238, device='cuda:0', grad_fn=<MseLossBackward>)
  23980. loss_train: 0.7008060766384006
  23981. step: 22
  23982. running loss: 0.031854821665381845
  23983.  
  23984. Train Steps: 22/90 Loss: 0.0319 torch.Size([8, 600, 800])
  23985. torch.Size([8, 8])
  23986. tensor([[0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  23987. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  23988. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  23989. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  23990. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  23991. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  23992. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  23993. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413]],
  23994. device='cuda:0', dtype=torch.float64)
  23995. predictions are: tensor([[ 0.5192, -0.4303, 1.5533, -0.5186, -0.4992, 0.2291, 0.8167, 0.2161],
  23996. [ 0.8398, -0.2164, 1.5734, -0.2260, -0.6431, -0.7362, 0.4513, 0.3491],
  23997. [ 0.7983, -0.2492, 1.6775, -0.1223, -0.1407, 0.0391, 0.6358, 0.2704],
  23998. [-0.8730, -1.3414, 0.9229, -1.2942, -0.4417, -1.3333, 0.1050, 0.1558],
  23999. [ 0.7856, -0.2575, 1.5907, 0.4904, -0.6020, -0.0994, 0.5406, 0.3689],
  24000. [ 0.7232, -0.2932, 1.6110, 0.1631, -0.2535, 0.0306, 0.2218, 0.2326],
  24001. [ 0.7808, -0.2383, 1.7002, 0.0022, -0.2485, 0.3157, 0.6546, 0.3287],
  24002. [ 0.6408, -0.3928, 1.9235, -0.6045, -0.2477, -1.1302, 0.9770, 0.1677]],
  24003. device='cuda:0', grad_fn=<AddmmBackward>)
  24004. landmarks are: tensor([[[ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  24005. 0.2966],
  24006. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  24007. 0.2699],
  24008. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  24009. 0.2853],
  24010. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  24011. 0.1073],
  24012. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  24013. 0.5316],
  24014. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  24015. 0.2634],
  24016. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  24017. 0.2083],
  24018. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  24019. 0.2142]]], device='cuda:0')
  24020. loss_train_step before backward: tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward>)
  24021. loss_train_step after backward: tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward>)
  24022. loss_train: 0.7600116161629558
  24023. step: 23
  24024. running loss: 0.03304398331143286
  24025. Train Steps: 23/90 Loss: 0.0330 torch.Size([8, 600, 800])
  24026. torch.Size([8, 8])
  24027. tensor([[0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  24028. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  24029. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  24030. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950],
  24031. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  24032. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  24033. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  24034. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267]],
  24035. device='cuda:0', dtype=torch.float64)
  24036. predictions are: tensor([[ 0.6867, -0.2904, 1.3013, -0.6740, -0.6040, -0.8209, 0.2258, 0.2238],
  24037. [ 0.7138, -0.2789, 1.6832, 0.0185, -0.3824, 0.1739, 0.3402, 0.2216],
  24038. [ 0.8082, -0.2157, 1.4416, -1.2298, -0.1667, -1.0268, 0.7925, 0.1555],
  24039. [ 0.6891, -0.3364, 1.7066, 0.2175, -0.3908, 0.2481, 0.6137, 0.1848],
  24040. [ 0.6694, -0.3064, 1.0297, -1.0955, -0.3065, -1.2666, 0.5156, 0.3473],
  24041. [ 0.6522, -0.3592, 1.7807, -0.1508, -0.5552, 0.2680, 0.8259, 0.2385],
  24042. [-1.8048, -1.9724, 0.9865, -1.1424, -0.2959, -1.4394, 0.2511, 0.3223],
  24043. [ 0.8061, -0.2563, 1.6035, 0.4277, -0.5191, -0.0406, 0.5202, 0.2413]],
  24044. device='cuda:0', grad_fn=<AddmmBackward>)
  24045. landmarks are: tensor([[[ 5.5319e-01, -3.8879e-01, 1.4727e+00, -7.4627e-01, -5.5381e-01,
  24046. -1.0465e+00, 2.6467e-02, 2.1383e-01],
  24047. [ 5.3508e-01, -4.1527e-01, 1.7326e+00, -4.5727e-02, -2.2139e-01,
  24048. -4.6642e-02, 4.3431e-02, 2.2284e-01],
  24049. [ 6.1270e-01, -3.9438e-01, 1.5189e+00, -1.2467e+00, -1.3233e-01,
  24050. -1.4622e+00, 5.6463e-01, -3.6943e-02],
  24051. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  24052. 5.4350e-02, 4.9700e-01, 4.6189e-04],
  24053. [ 6.0098e-01, -3.8745e-01, 1.0570e+00, -1.3313e+00, -3.1709e-01,
  24054. -1.4160e+00, 3.1224e-01, 3.1609e-01],
  24055. [ 5.7460e-01, -4.7064e-01, 1.8476e+00, -2.3654e-01, -5.0683e-01,
  24056. 2.2450e-01, 6.0688e-01, 1.4491e-01],
  24057. [-2.2859e+00, -2.2859e+00, 6.7598e-01, -1.4083e+00, -3.2864e-01,
  24058. -1.4160e+00, 2.4873e-01, 3.4688e-01],
  24059. [ 5.8915e-01, -4.5504e-01, 1.5132e+00, 3.5458e-01, -3.6905e-01,
  24060. -1.5350e-01, 3.8152e-01, 1.4673e-01]]], device='cuda:0')
  24061. loss_train_step before backward: tensor(0.0274, device='cuda:0', grad_fn=<MseLossBackward>)
  24062. loss_train_step after backward: tensor(0.0274, device='cuda:0', grad_fn=<MseLossBackward>)
  24063. loss_train: 0.7874013772234321
  24064. step: 24
  24065. running loss: 0.032808390717643
  24066. Train Steps: 24/90 Loss: 0.0328 torch.Size([8, 600, 800])
  24067. torch.Size([8, 8])
  24068. tensor([[0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  24069. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  24070. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  24071. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  24072. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  24073. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  24074. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  24075. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150]],
  24076. device='cuda:0', dtype=torch.float64)
  24077. predictions are: tensor([[ 0.5090, -0.4777, 1.5581, 0.3141, -0.4932, 0.0368, 0.8771, 0.3633],
  24078. [ 0.2972, -0.5898, 1.5307, -1.0487, -0.2588, -1.2857, 0.4801, 0.0661],
  24079. [ 0.3602, -0.5758, 1.5941, 0.1848, -0.5014, 0.1306, 0.7942, 0.2363],
  24080. [ 0.6912, -0.3386, 1.7118, -0.7506, -0.3744, -1.1410, 0.4392, 0.1324],
  24081. [ 0.4615, -0.4464, 1.5727, 0.1339, -0.2828, 0.2632, 0.0648, 0.2474],
  24082. [ 0.6099, -0.3904, 0.9968, -1.2696, -0.4457, -0.9995, 0.4334, 0.2862],
  24083. [ 0.7335, -0.3144, 1.1439, -1.0194, -0.5125, -0.8689, 0.5599, 0.4064],
  24084. [ 0.5387, -0.4068, 1.7121, -0.0485, -0.3344, 0.5094, 0.5716, 0.2331]],
  24085. device='cuda:0', grad_fn=<AddmmBackward>)
  24086. landmarks are: tensor([[[ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  24087. 0.3745],
  24088. [ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  24089. -0.0583],
  24090. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  24091. 0.1715],
  24092. [ 0.6128, -0.3828, 1.7499, -0.8386, -0.3344, -1.2620, 0.5792,
  24093. -0.0263],
  24094. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  24095. 0.2386],
  24096. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  24097. 0.2058],
  24098. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  24099. 0.3777],
  24100. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  24101. 0.0928]]], device='cuda:0')
  24102. loss_train_step before backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  24103. loss_train_step after backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  24104. loss_train: 0.8001020578667521
  24105. step: 25
  24106. running loss: 0.032004082314670085
  24107. Train Steps: 25/90 Loss: 0.0320 torch.Size([8, 600, 800])
  24108. torch.Size([8, 8])
  24109. tensor([[0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  24110. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  24111. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  24112. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  24113. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  24114. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  24115. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  24116. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397]],
  24117. device='cuda:0', dtype=torch.float64)
  24118. predictions are: tensor([[ 0.7484, -0.2701, 0.9943, -1.1130, -0.4974, -0.8206, 0.6677, 0.3461],
  24119. [ 0.5576, -0.4452, 1.8740, -0.1048, -0.5938, -0.3413, 0.9014, 0.0819],
  24120. [ 0.8929, -0.1953, 1.1599, -0.9577, -0.4125, -0.6735, 0.6857, 0.4512],
  24121. [ 0.9197, -0.1350, 1.6207, -0.0053, -0.5782, -0.4007, 0.4676, 0.3432],
  24122. [ 0.7223, -0.2809, 1.6813, 0.0196, -0.0342, 0.1632, 0.1919, 0.1328],
  24123. [ 0.5366, -0.4327, 1.7118, -0.0477, -0.3475, 0.1408, 0.4257, 0.2003],
  24124. [-1.7881, -1.9381, 1.0119, -1.3121, -0.1923, -1.0895, 0.3048, 0.1346],
  24125. [ 0.8429, -0.1873, 1.6756, -0.1547, -0.6246, -0.4101, 0.2499, 0.1570]],
  24126. device='cuda:0', grad_fn=<AddmmBackward>)
  24127. landmarks are: tensor([[[ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  24128. 0.3700],
  24129. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  24130. 0.0325],
  24131. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  24132. 0.5701],
  24133. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  24134. 0.3161],
  24135. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  24136. 0.0532],
  24137. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  24138. 0.3546],
  24139. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  24140. 0.3238],
  24141. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  24142. 0.2071]]], device='cuda:0')
  24143. loss_train_step before backward: tensor(0.0233, device='cuda:0', grad_fn=<MseLossBackward>)
  24144. loss_train_step after backward: tensor(0.0233, device='cuda:0', grad_fn=<MseLossBackward>)
  24145. loss_train: 0.823372888378799
  24146. step: 26
  24147. running loss: 0.03166818801456919
  24148.  
  24149. Train Steps: 26/90 Loss: 0.0317 torch.Size([8, 600, 800])
  24150. torch.Size([8, 8])
  24151. tensor([[0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  24152. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  24153. [0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947],
  24154. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456],
  24155. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  24156. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  24157. [0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  24158. [0.6118, 0.4052, 0.8463, 0.3917, 0.3538, 0.3450, 0.5053, 0.5593]],
  24159. device='cuda:0', dtype=torch.float64)
  24160. predictions are: tensor([[ 7.5652e-01, -2.7539e-01, 1.5621e+00, 1.8410e-01, -5.1502e-01,
  24161. -3.3857e-01, 3.6783e-01, 2.5592e-01],
  24162. [ 7.1403e-01, -3.2540e-01, 1.6967e+00, -5.6145e-01, -5.9954e-01,
  24163. -3.0913e-01, 7.2090e-01, 7.3376e-02],
  24164. [ 8.6360e-01, -2.0367e-01, 1.3451e+00, -1.1514e+00, -1.1073e-02,
  24165. -1.2515e+00, 5.7336e-01, 1.6534e-01],
  24166. [ 7.4604e-01, -2.7205e-01, 1.5418e+00, 1.2414e-01, -3.3964e-01,
  24167. 4.4680e-01, 3.2297e-01, 3.0321e-01],
  24168. [ 5.8184e-01, -4.4765e-01, 1.8961e+00, -3.1615e-01, -2.8393e-01,
  24169. -6.9362e-01, 1.0925e+00, 1.8052e-01],
  24170. [-1.9204e+00, -2.0319e+00, 8.3474e-01, -1.2677e+00, -4.0795e-01,
  24171. -1.1218e+00, 1.0736e-01, 1.9626e-01],
  24172. [ 5.2281e-01, -4.1657e-01, 1.1166e+00, -1.1776e+00, -5.2418e-01,
  24173. -6.1399e-01, 5.6810e-01, 2.8002e-01],
  24174. [ 7.1040e-01, -2.8060e-01, 1.4571e+00, -4.6101e-01, -5.9290e-01,
  24175. -4.6358e-01, -8.6606e-04, 2.7863e-01]], device='cuda:0',
  24176. grad_fn=<AddmmBackward>)
  24177. landmarks are: tensor([[[ 5.9013e-01, -4.1570e-01, 1.7557e+00, 1.9292e-01, -5.4226e-01,
  24178. -5.9230e-01, 3.5843e-01, 1.6982e-01],
  24179. [ 6.0710e-01, -4.1186e-01, 1.7788e+00, -5.1532e-01, -6.0000e-01,
  24180. -5.6921e-01, 6.5857e-01, -6.7050e-02],
  24181. [ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  24182. -1.5777e+00, 6.0099e-01, -9.2270e-04],
  24183. [ 5.4428e-01, -3.8399e-01, 1.7095e+00, 6.2048e-02, -3.9792e-01,
  24184. 1.9292e-01, 1.6218e-01, 2.3412e-01],
  24185. [ 6.2236e-01, -4.3453e-01, 1.9404e+00, -2.9207e-01, -3.1709e-01,
  24186. -8.7714e-01, 1.0655e+00, 2.1421e-01],
  24187. [-2.2859e+00, -2.2859e+00, 8.5162e-01, -1.3112e+00, -4.3256e-01,
  24188. -1.2851e+00, 7.5520e-02, 2.9299e-01],
  24189. [ 5.7296e-01, -4.5619e-01, 1.2195e+00, -1.2440e+00, -5.4966e-01,
  24190. -7.7109e-01, 5.7045e-01, 1.7788e-01],
  24191. [ 5.3990e-01, -4.1424e-01, 1.6229e+00, -4.7683e-01, -6.5196e-01,
  24192. -6.9238e-01, 4.8058e-02, 2.9724e-01]]], device='cuda:0')
  24193. loss_train_step before backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  24194. loss_train_step after backward: tensor(0.0186, device='cuda:0', grad_fn=<MseLossBackward>)
  24195. loss_train: 0.8419636627659202
  24196. step: 27
  24197. running loss: 0.031183839361700747
  24198. Train Steps: 27/90 Loss: 0.0312 torch.Size([8, 600, 800])
  24199. torch.Size([8, 8])
  24200. tensor([[0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  24201. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  24202. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  24203. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  24204. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  24205. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  24206. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  24207. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656]],
  24208. device='cuda:0', dtype=torch.float64)
  24209. predictions are: tensor([[ 0.6225, -0.3881, 1.5662, -0.0781, -0.2772, 0.1189, 0.2225, 0.0775],
  24210. [ 0.9844, -0.1379, 1.7062, -0.6037, -0.4731, 0.3303, 0.7703, 0.1002],
  24211. [ 0.7208, -0.3073, 1.5178, 0.1953, -0.3616, -0.4154, 0.4075, 0.4878],
  24212. [ 0.6547, -0.3556, 1.4913, 0.1435, -0.2581, -0.0428, 0.4009, 0.1827],
  24213. [ 0.3554, -0.5601, 1.6440, -0.4274, -0.5485, -0.4182, 0.5138, 0.2277],
  24214. [ 0.4400, -0.5040, 1.6787, -0.3374, -0.5218, -0.4229, 0.8214, 0.1786],
  24215. [ 0.3061, -0.5993, 1.7038, -0.4087, -0.4780, -0.3626, 0.3291, 0.2741],
  24216. [ 0.5325, -0.4226, 1.4472, -0.5124, -0.4933, -0.2613, 0.2442, 0.2672]],
  24217. device='cuda:0', grad_fn=<AddmmBackward>)
  24218. landmarks are: tensor([[[ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  24219. 0.0467],
  24220. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  24221. 0.1005],
  24222. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  24223. 0.4624],
  24224. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  24225. 0.2237],
  24226. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  24227. 0.2314],
  24228. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  24229. 0.1499],
  24230. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  24231. 0.3087],
  24232. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  24233. 0.3265]]], device='cuda:0')
  24234. loss_train_step before backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  24235. loss_train_step after backward: tensor(0.0205, device='cuda:0', grad_fn=<MseLossBackward>)
  24236. loss_train: 0.8624861231073737
  24237. step: 28
  24238. running loss: 0.030803075825263346
  24239. Train Steps: 28/90 Loss: 0.0308 torch.Size([8, 600, 800])
  24240. torch.Size([8, 8])
  24241. tensor([[0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  24242. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  24243. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  24244. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  24245. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  24246. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  24247. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  24248. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217]],
  24249. device='cuda:0', dtype=torch.float64)
  24250. predictions are: tensor([[ 0.1548, -0.6666, 1.0475, -1.1813, -0.3556, -1.3011, 0.2236, 0.2432],
  24251. [ 0.7615, -0.3281, 1.7192, 0.2027, -0.5713, -0.0331, 0.7117, 0.0804],
  24252. [ 0.5163, -0.4591, 1.4358, -1.4274, -0.3775, -1.1807, 0.6925, 0.0060],
  24253. [ 0.6276, -0.3860, 1.7572, -0.2639, -0.3414, 0.2167, 0.4277, 0.1755],
  24254. [ 0.3829, -0.5351, 1.7428, -0.1622, -0.5477, -0.1566, 0.4544, 0.1677],
  24255. [ 0.5205, -0.4734, 1.5797, 0.3457, -0.2694, 0.0125, 0.0688, 0.0827],
  24256. [ 0.3644, -0.5406, 1.6827, -0.2990, -0.5216, -0.1021, 0.4127, 0.3489],
  24257. [ 0.4920, -0.4392, 1.0327, -1.2483, -0.3211, -1.2385, 0.4642, 0.4751]],
  24258. device='cuda:0', grad_fn=<AddmmBackward>)
  24259. landmarks are: tensor([[[ 5.6518e-01, -3.8584e-01, 1.0975e+00, -1.1312e+00, -3.4018e-01,
  24260. -1.4006e+00, 1.7945e-01, 3.4688e-01],
  24261. [ 6.1484e-01, -4.1301e-01, 1.6864e+00, 1.6982e-01, -5.3072e-01,
  24262. -1.1501e-01, 6.1247e-01, 8.5142e-02],
  24263. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  24264. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  24265. [ 5.4990e-01, -4.2249e-01, 1.8018e+00, -2.9207e-01, -3.0554e-01,
  24266. 5.4350e-02, 4.0462e-01, 2.6990e-01],
  24267. [ 5.8655e-01, -3.9731e-01, 1.8423e+00, -6.8822e-02, -5.1917e-01,
  24268. -2.3048e-01, 4.1617e-01, 1.1594e-01],
  24269. [ 5.1928e-01, -4.6990e-01, 1.5767e+00, 4.0077e-01, -2.4203e-01,
  24270. 7.7444e-02, 1.1776e-01, -6.1038e-02],
  24271. [ 5.7003e-01, -4.0316e-01, 1.7961e+00, -1.9969e-01, -5.2494e-01,
  24272. -2.1509e-01, 3.8152e-01, 3.1609e-01],
  24273. [ 5.6871e-01, -4.0878e-01, 1.0397e+00, -1.1466e+00, -3.1132e-01,
  24274. -1.1928e+00, 4.6813e-01, 5.8553e-01]]], device='cuda:0')
  24275. loss_train_step before backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  24276. loss_train_step after backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  24277. loss_train: 0.872529580257833
  24278. step: 29
  24279. running loss: 0.030087226905442518
  24280.  
  24281. Train Steps: 29/90 Loss: 0.0301 torch.Size([8, 600, 800])
  24282. torch.Size([8, 8])
  24283. tensor([[0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  24284. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  24285. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  24286. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  24287. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  24288. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  24289. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  24290. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901]],
  24291. device='cuda:0', dtype=torch.float64)
  24292. predictions are: tensor([[ 0.5629, -0.4008, 1.1536, -0.9999, -0.5741, -0.8104, 0.1382, 0.2250],
  24293. [ 0.6017, -0.3874, 1.4440, -1.0393, -0.1726, -1.3285, 0.5830, 0.1753],
  24294. [ 0.9206, -0.2273, 1.5587, 0.5413, -0.6123, 0.1463, 0.4333, 0.0461],
  24295. [ 0.4372, -0.4923, 1.6003, -1.1577, 0.0245, -1.0948, 1.0326, 0.1909],
  24296. [ 0.4308, -0.4589, 1.1894, -0.9453, -0.4832, -0.9390, 0.0674, 0.2499],
  24297. [ 0.9319, -0.1536, 1.6204, -0.4210, -0.6550, 0.0903, 0.3071, 0.1912],
  24298. [-1.7346, -1.9065, 1.4397, -1.1808, 0.0347, -1.2153, 0.9088, 0.3061],
  24299. [ 0.4637, -0.4995, 1.7508, -0.1255, -0.5554, -0.0794, 0.1084, 0.0721]],
  24300. device='cuda:0', grad_fn=<AddmmBackward>)
  24301. landmarks are: tensor([[[ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  24302. 0.3237],
  24303. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  24304. 0.0851],
  24305. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  24306. -0.1385],
  24307. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  24308. 0.2142],
  24309. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  24310. 0.3700],
  24311. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  24312. 0.2776],
  24313. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  24314. 0.3371],
  24315. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  24316. -0.0220]]], device='cuda:0')
  24317. loss_train_step before backward: tensor(0.0269, device='cuda:0', grad_fn=<MseLossBackward>)
  24318. loss_train_step after backward: tensor(0.0269, device='cuda:0', grad_fn=<MseLossBackward>)
  24319. loss_train: 0.8993881745263934
  24320. step: 30
  24321. running loss: 0.029979605817546447
  24322. Train Steps: 30/90 Loss: 0.0300 torch.Size([8, 600, 800])
  24323. torch.Size([8, 8])
  24324. tensor([[0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  24325. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  24326. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  24327. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  24328. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  24329. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  24330. [0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  24331. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136]],
  24332. device='cuda:0', dtype=torch.float64)
  24333. predictions are: tensor([[ 0.5029, -0.4627, 1.8340, -1.0026, -0.1339, -1.6149, 0.6156, 0.0087],
  24334. [ 0.5740, -0.4009, 1.7582, -0.1699, -0.1234, -0.0320, 0.4125, 0.2843],
  24335. [ 0.6356, -0.3398, 1.7359, -0.1383, -0.2639, 0.2198, 0.3052, 0.1666],
  24336. [ 0.3308, -0.5629, 0.8794, -1.2483, -0.5392, -1.3448, 0.4178, 0.3191],
  24337. [ 0.4581, -0.5044, 1.5836, -0.5473, -0.7216, -0.5668, 0.2383, 0.0167],
  24338. [ 0.6568, -0.3957, 1.7078, 0.0030, -0.3137, 0.0374, 0.8280, 0.2264],
  24339. [ 0.3297, -0.5640, 1.5501, -0.0372, -0.3852, -0.0481, 0.0236, 0.2139],
  24340. [ 0.3091, -0.5670, 1.4527, -0.6382, -0.6001, -0.0085, 0.4038, 0.2477]],
  24341. device='cuda:0', grad_fn=<AddmmBackward>)
  24342. landmarks are: tensor([[[ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  24343. 0.0051],
  24344. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  24345. 0.3007],
  24346. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  24347. 0.0682],
  24348. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  24349. 0.2391],
  24350. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  24351. 0.0021],
  24352. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  24353. 0.1982],
  24354. [ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  24355. 0.1530],
  24356. [ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  24357. 0.0862]]], device='cuda:0')
  24358. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  24359. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  24360. loss_train: 0.9131455309689045
  24361. step: 31
  24362. running loss: 0.02945630745060982
  24363. Train Steps: 31/90 Loss: 0.0295 torch.Size([8, 600, 800])
  24364. torch.Size([8, 8])
  24365. tensor([[0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  24366. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  24367. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  24368. [0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  24369. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  24370. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  24371. [0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  24372. [0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771]],
  24373. device='cuda:0', dtype=torch.float64)
  24374. predictions are: tensor([[ 6.5724e-01, -3.3551e-01, 1.7339e+00, -1.7214e-01, -5.4087e-01,
  24375. -5.7657e-01, -7.2407e-04, 3.0961e-01],
  24376. [ 6.4453e-01, -3.8119e-01, 1.4042e+00, -9.6262e-01, -4.7842e-01,
  24377. -6.2890e-01, 3.6548e-01, 2.1259e-01],
  24378. [ 5.3622e-01, -4.3840e-01, 1.4795e+00, -8.7511e-01, -5.5252e-01,
  24379. -4.6950e-01, 5.1470e-01, 2.1833e-01],
  24380. [ 7.7063e-01, -3.1686e-01, 1.7194e+00, 3.5740e-01, -4.2742e-01,
  24381. -1.5771e-02, 7.1987e-01, 9.3308e-02],
  24382. [-9.5819e-01, -1.3890e+00, 1.2376e+00, -9.8477e-01, -3.6917e-01,
  24383. -1.1233e+00, 1.0399e-01, 3.1658e-01],
  24384. [ 2.9942e-01, -5.8920e-01, 1.5002e+00, -1.1685e+00, -1.3334e-01,
  24385. -1.4075e+00, 5.3227e-01, 5.6465e-02],
  24386. [ 5.8947e-01, -4.2299e-01, 1.2521e+00, -1.2410e+00, -3.8749e-01,
  24387. -1.2859e+00, 3.7489e-01, 5.9306e-02],
  24388. [ 6.0614e-01, -4.2630e-01, 1.8852e+00, -1.1434e-01, -4.4070e-01,
  24389. 1.6359e-01, 5.1914e-01, 5.1127e-02]], device='cuda:0',
  24390. grad_fn=<AddmmBackward>)
  24391. landmarks are: tensor([[[ 5.4544e-01, -4.0531e-01, 1.6633e+00, -1.7660e-01, -6.0577e-01,
  24392. -5.9230e-01, 1.5773e-01, 4.3570e-01],
  24393. [ 5.9601e-01, -3.8879e-01, 1.4840e+00, -1.0095e+00, -6.1155e-01,
  24394. -6.2309e-01, 4.7968e-01, 3.4688e-01],
  24395. [ 5.9319e-01, -3.9615e-01, 1.4554e+00, -9.2333e-01, -6.4042e-01,
  24396. -4.9222e-01, 4.9122e-01, 1.1594e-01],
  24397. [ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  24398. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  24399. [-2.2859e+00, -2.2859e+00, 1.2303e+00, -7.8476e-01, -4.2102e-01,
  24400. -1.1158e+00, 2.2564e-01, 3.7768e-01],
  24401. [ 6.0577e-01, -3.8922e-01, 1.4208e+00, -1.0927e+00, -1.8430e-01,
  24402. -1.4237e+00, 6.1538e-01, -3.6992e-02],
  24403. [ 5.7067e-01, -4.1886e-01, 1.2707e+00, -1.2467e+00, -4.0947e-01,
  24404. -1.3082e+00, 3.7575e-01, 9.2841e-02],
  24405. [ 6.0716e-01, -4.2471e-01, 1.8711e+00, -8.4219e-02, -5.3072e-01,
  24406. 1.0054e-01, 6.7707e-01, -8.2079e-02]]], device='cuda:0')
  24407. loss_train_step before backward: tensor(0.0478, device='cuda:0', grad_fn=<MseLossBackward>)
  24408. loss_train_step after backward: tensor(0.0478, device='cuda:0', grad_fn=<MseLossBackward>)
  24409. loss_train: 0.9609342403709888
  24410. step: 32
  24411. running loss: 0.0300291950115934
  24412. Train Steps: 32/90 Loss: 0.0300 torch.Size([8, 600, 800])
  24413. torch.Size([8, 8])
  24414. tensor([[0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  24415. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  24416. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  24417. [0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771],
  24418. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  24419. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  24420. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  24421. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494]],
  24422. device='cuda:0', dtype=torch.float64)
  24423. predictions are: tensor([[ 0.5655, -0.4276, 1.7582, -0.6235, -0.6276, -0.6743, 0.5222, 0.1137],
  24424. [ 0.6222, -0.3659, 1.6961, 0.1163, -0.4128, -0.2092, 0.3120, 0.3234],
  24425. [ 0.3312, -0.5525, 1.7061, -0.5412, -0.6122, -0.6128, 0.1507, 0.2349],
  24426. [ 0.4998, -0.4658, 1.7805, -0.3142, -0.5496, -0.0170, 0.4519, 0.0428],
  24427. [ 0.2381, -0.6250, 1.6805, -0.2034, -0.1010, -0.1950, -0.0042, 0.2027],
  24428. [ 0.6927, -0.3407, 1.6134, -0.0583, -0.2813, 0.0023, 0.7085, 0.1154],
  24429. [ 0.3413, -0.5539, 1.7100, -0.2173, -0.0598, -0.2415, -0.0140, 0.1867],
  24430. [ 0.9364, -0.1751, 1.8455, -0.3379, -0.5334, -0.3309, 0.9051, 0.1270]],
  24431. device='cuda:0', grad_fn=<AddmmBackward>)
  24432. landmarks are: tensor([[[ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  24433. 0.0697],
  24434. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  24435. 0.3007],
  24436. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  24437. 0.1852],
  24438. [ 0.6072, -0.4247, 1.8711, -0.0842, -0.5307, 0.1005, 0.6771,
  24439. -0.0821],
  24440. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  24441. 0.3392],
  24442. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  24443. 0.1004],
  24444. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  24445. 0.3806],
  24446. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  24447. 0.2516]]], device='cuda:0')
  24448. loss_train_step before backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  24449. loss_train_step after backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  24450. loss_train: 0.9831647351384163
  24451. step: 33
  24452. running loss: 0.02979287076177019
  24453.  
  24454. Train Steps: 33/90 Loss: 0.0298 torch.Size([8, 600, 800])
  24455. torch.Size([8, 8])
  24456. tensor([[0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  24457. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  24458. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  24459. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  24460. [0.6268, 0.4102, 0.8938, 0.3667, 0.4025, 0.2833, 0.6275, 0.5183],
  24461. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  24462. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  24463. [0.6075, 0.4000, 0.8513, 0.5183, 0.4510, 0.5329, 0.5180, 0.5280]],
  24464. device='cuda:0', dtype=torch.float64)
  24465. predictions are: tensor([[ 0.5627, -0.4001, 1.8025, -0.3814, -0.5554, -0.0953, 0.4415, 0.3466],
  24466. [ 0.5360, -0.4458, 1.7127, 0.1136, -0.3603, 0.2607, 0.8678, 0.2304],
  24467. [ 0.6083, -0.3793, 1.3611, -1.2816, -0.2590, -1.5712, 0.4258, 0.0313],
  24468. [ 0.1714, -0.6622, 1.6124, 0.1800, -0.4743, -0.0086, 0.1030, 0.1615],
  24469. [ 0.3095, -0.5768, 1.9215, -0.7524, -0.3930, -1.1578, 0.5276, 0.1364],
  24470. [ 0.6881, -0.3396, 1.8548, -0.0897, -0.3718, 0.2349, 0.6835, 0.0806],
  24471. [ 0.4803, -0.4402, 1.0330, -1.1984, -0.4795, -1.2689, 0.0921, 0.2523],
  24472. [ 0.4115, -0.4979, 1.7126, 0.0244, -0.1545, 0.0139, -0.0112, 0.0896]],
  24473. device='cuda:0', grad_fn=<AddmmBackward>)
  24474. landmarks are: tensor([[[ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  24475. 0.5085],
  24476. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  24477. 0.3371],
  24478. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  24479. 0.1005],
  24480. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  24481. -0.1061],
  24482. [ 0.6092, -0.3913, 1.8423, -0.5923, -0.4268, -0.9772, 0.6125,
  24483. 0.1082],
  24484. [ 0.5990, -0.4256, 1.7499, -0.0380, -0.3979, 0.3315, 0.6529,
  24485. 0.1159],
  24486. [ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  24487. 0.2776],
  24488. [ 0.5202, -0.4382, 1.6460, 0.1082, -0.2029, 0.1754, 0.1067,
  24489. 0.1530]]], device='cuda:0')
  24490. loss_train_step before backward: tensor(0.0109, device='cuda:0', grad_fn=<MseLossBackward>)
  24491. loss_train_step after backward: tensor(0.0109, device='cuda:0', grad_fn=<MseLossBackward>)
  24492. loss_train: 0.994059644639492
  24493. step: 34
  24494. running loss: 0.029237048371749765
  24495. Train Steps: 34/90 Loss: 0.0292 torch.Size([8, 600, 800])
  24496. torch.Size([8, 8])
  24497. tensor([[0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  24498. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  24499. [0.6201, 0.4102, 0.7288, 0.2417, 0.4150, 0.2383, 0.6100, 0.5500],
  24500. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  24501. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  24502. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  24503. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  24504. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447]],
  24505. device='cuda:0', dtype=torch.float64)
  24506. predictions are: tensor([[ 0.5234, -0.4664, 1.8526, -0.3534, -0.4182, -0.0822, 0.6591, 0.2142],
  24507. [ 0.4352, -0.4940, 1.8282, -0.9907, -0.0305, -1.4398, 0.5311, 0.0966],
  24508. [ 0.8282, -0.2346, 1.2444, -1.2653, -0.4695, -1.2162, 0.1952, 0.1267],
  24509. [ 0.4458, -0.5179, 1.8325, 0.1580, -0.5393, -0.1276, 0.4210, 0.1183],
  24510. [ 0.3377, -0.5294, 1.3695, -1.2153, -0.4092, -1.1784, 0.1472, 0.2982],
  24511. [ 0.3720, -0.5473, 1.8003, 0.0639, -0.3505, 0.3625, 0.4583, 0.2098],
  24512. [ 0.4163, -0.5423, 1.5022, 0.1460, -0.4588, -0.0288, 0.5502, 0.1593],
  24513. [ 0.4728, -0.4942, 1.9267, -0.1118, -0.4895, -0.0021, 0.5690, 0.1152]],
  24514. device='cuda:0', grad_fn=<AddmmBackward>)
  24515. landmarks are: tensor([[[ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  24516. 0.2249],
  24517. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  24518. 0.2356],
  24519. [ 0.5784, -0.3913, 1.0801, -1.1697, -0.3691, -1.1851, 0.5316,
  24520. 0.2545],
  24521. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  24522. 0.1608],
  24523. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  24524. 0.3315],
  24525. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  24526. 0.3157],
  24527. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  24528. 0.1928],
  24529. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  24530. 0.2302]]], device='cuda:0')
  24531. loss_train_step before backward: tensor(0.0352, device='cuda:0', grad_fn=<MseLossBackward>)
  24532. loss_train_step after backward: tensor(0.0352, device='cuda:0', grad_fn=<MseLossBackward>)
  24533. loss_train: 1.0292295143008232
  24534. step: 35
  24535. running loss: 0.029406557551452092
  24536. Train Steps: 35/90 Loss: 0.0294 torch.Size([8, 600, 800])
  24537. torch.Size([8, 8])
  24538. tensor([[0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  24539. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  24540. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  24541. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  24542. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  24543. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  24544. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  24545. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661]],
  24546. device='cuda:0', dtype=torch.float64)
  24547. predictions are: tensor([[ 0.6034, -0.4226, 1.7620, 0.0535, -0.4684, -0.2611, 0.4431, 0.1771],
  24548. [ 0.3709, -0.5737, 1.6665, 0.0294, -0.3556, -0.0046, 0.5314, 0.1333],
  24549. [ 0.6214, -0.4068, 1.9044, -0.2927, -0.4045, -0.1387, 0.9449, 0.1900],
  24550. [ 0.4604, -0.4612, 1.8500, -0.3535, -0.5022, -0.5301, 0.0546, 0.1342],
  24551. [ 0.7181, -0.2917, 1.3510, -1.4534, -0.4692, -0.9523, 0.3789, 0.0521],
  24552. [ 0.6420, -0.3510, 1.8920, -0.1968, -0.3205, -0.5772, 0.5890, 0.1643],
  24553. [ 0.5143, -0.4038, 1.8072, -0.4124, -0.4635, -0.6016, 0.2431, 0.3779],
  24554. [ 0.3334, -0.5918, 1.6142, 0.2640, -0.4179, -0.0050, 0.4461, 0.1309]],
  24555. device='cuda:0', grad_fn=<AddmmBackward>)
  24556. landmarks are: tensor([[[ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  24557. 0.0291],
  24558. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  24559. 0.0697],
  24560. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  24561. 0.2516],
  24562. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  24563. 0.1824],
  24564. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  24565. -0.0108],
  24566. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  24567. 0.1661],
  24568. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  24569. 0.3777],
  24570. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  24571. -0.1331]]], device='cuda:0')
  24572. loss_train_step before backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  24573. loss_train_step after backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  24574. loss_train: 1.044245726428926
  24575. step: 36
  24576. running loss: 0.029006825734136835
  24577. Train Steps: 36/90 Loss: 0.0290 torch.Size([8, 600, 800])
  24578. torch.Size([8, 8])
  24579. tensor([[0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  24580. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  24581. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426],
  24582. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  24583. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  24584. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  24585. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  24586. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533]],
  24587. device='cuda:0', dtype=torch.float64)
  24588. predictions are: tensor([[ 0.6509, -0.3897, 1.9019, -0.1008, -0.3962, -0.0111, 1.1013, 0.1596],
  24589. [ 0.8432, -0.2382, 1.8771, -0.3779, -0.3931, 0.3015, 0.7711, 0.0823],
  24590. [ 0.4317, -0.4885, 1.8653, -0.3814, -0.5239, -0.7898, 0.4372, 0.1703],
  24591. [ 0.5510, -0.3753, 1.7102, -0.2932, -0.5679, -0.6029, 0.1613, 0.2940],
  24592. [ 0.6017, -0.4021, 1.8899, 0.1966, -0.5129, -0.6484, 0.6649, -0.0689],
  24593. [ 0.0397, -0.6923, 1.1594, -0.9537, -0.5354, -1.0902, 0.1489, 0.3543],
  24594. [ 0.4427, -0.4832, 1.5935, -0.3385, -0.4276, -0.2279, 0.1961, 0.2921],
  24595. [ 0.6207, -0.3919, 1.8145, -0.1962, -0.0353, 0.1292, 0.5811, 0.2452]],
  24596. device='cuda:0', grad_fn=<AddmmBackward>)
  24597. landmarks are: tensor([[[ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  24598. 0.2302],
  24599. [ 0.5886, -0.4253, 1.8654, -0.3460, -0.5480, 0.3623, 0.6587,
  24600. 0.1005],
  24601. [ 0.5788, -0.4135, 1.8214, -0.2408, -0.6039, -0.7854, 0.4115,
  24602. 0.2203],
  24603. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  24604. 0.2468],
  24605. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  24606. -0.0957],
  24607. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  24608. 0.3931],
  24609. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  24610. 0.3265],
  24611. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  24612. 0.2699]]], device='cuda:0')
  24613. loss_train_step before backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  24614. loss_train_step after backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  24615. loss_train: 1.0570316752418876
  24616. step: 37
  24617. running loss: 0.02856842365518615
  24618.  
  24619. Train Steps: 37/90 Loss: 0.0286 torch.Size([8, 600, 800])
  24620. torch.Size([8, 8])
  24621. tensor([[0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  24622. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  24623. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  24624. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  24625. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  24626. [0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  24627. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  24628. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517]],
  24629. device='cuda:0', dtype=torch.float64)
  24630. predictions are: tensor([[ 0.4441, -0.4830, 1.6680, -1.0800, -0.2465, -1.0681, 0.7556, 0.2798],
  24631. [ 0.1950, -0.6115, 1.0745, -1.2398, -0.6409, -0.9222, 0.2341, 0.2288],
  24632. [ 0.6605, -0.4018, 2.1028, -0.1091, -0.3462, -0.7841, 0.9333, 0.0228],
  24633. [ 0.7723, -0.3271, 1.7699, 0.2168, -0.3638, 0.3681, 0.7759, 0.0680],
  24634. [ 0.7062, -0.3003, 1.1744, -1.1470, -0.4890, -0.9774, 0.3316, 0.2041],
  24635. [ 0.5624, -0.4178, 1.6652, 0.5979, -0.2604, -0.0412, 0.2334, 0.3466],
  24636. [ 0.0958, -0.7478, 1.8266, -0.7130, -0.0486, -0.9561, 0.8954, 0.2009],
  24637. [ 0.1288, -0.6920, 1.6375, -0.5932, -0.7722, -0.3912, 0.4008, 0.1899]],
  24638. device='cuda:0', grad_fn=<AddmmBackward>)
  24639. landmarks are: tensor([[[ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  24640. 0.3157],
  24641. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  24642. 0.2853],
  24643. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  24644. 0.2142],
  24645. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  24646. 0.1982],
  24647. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  24648. 0.2468],
  24649. [ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  24650. 0.4470],
  24651. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  24652. 0.2730],
  24653. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  24654. 0.2622]]], device='cuda:0')
  24655. loss_train_step before backward: tensor(0.0323, device='cuda:0', grad_fn=<MseLossBackward>)
  24656. loss_train_step after backward: tensor(0.0323, device='cuda:0', grad_fn=<MseLossBackward>)
  24657. loss_train: 1.089333820156753
  24658. step: 38
  24659. running loss: 0.028666679477809293
  24660. Train Steps: 38/90 Loss: 0.0287 torch.Size([8, 600, 800])
  24661. torch.Size([8, 8])
  24662. tensor([[0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  24663. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  24664. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  24665. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  24666. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083],
  24667. [0.6087, 0.3951, 0.8387, 0.5833, 0.4188, 0.4933, 0.5146, 0.4830],
  24668. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  24669. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980]],
  24670. device='cuda:0', dtype=torch.float64)
  24671. predictions are: tensor([[ 8.8443e-01, -1.9540e-01, 1.8931e+00, 8.7475e-02, -4.4813e-01,
  24672. 1.6257e-03, 6.1814e-01, -9.2434e-03],
  24673. [ 5.0552e-01, -3.8126e-01, 1.2175e+00, -1.0401e+00, -1.1707e-01,
  24674. -1.3590e+00, 5.7183e-01, 4.3613e-01],
  24675. [ 8.3590e-01, -2.1532e-01, 1.6410e+00, 2.7475e-01, -4.1388e-01,
  24676. -1.0416e-01, 7.4442e-01, 4.3882e-01],
  24677. [ 7.6310e-01, -2.6186e-01, 1.6897e+00, -2.8506e-01, -4.8278e-01,
  24678. -1.4364e-01, 4.4101e-01, 2.6590e-01],
  24679. [ 8.4191e-01, -2.4302e-01, 1.9611e+00, -4.4580e-01, -6.0415e-01,
  24680. -6.3684e-01, 6.8879e-01, 9.6068e-03],
  24681. [ 8.2173e-01, -2.3409e-01, 1.7656e+00, 4.0293e-01, -3.2369e-01,
  24682. 5.4397e-02, 5.1337e-01, 2.0862e-02],
  24683. [-2.3548e+00, -2.3337e+00, 1.3308e+00, -7.7752e-01, -6.2998e-01,
  24684. -7.0770e-01, 5.5572e-01, 2.3119e-01],
  24685. [ 8.9218e-01, -1.8210e-01, 1.3559e+00, -9.9058e-01, -5.4404e-01,
  24686. -8.9048e-01, 3.4451e-01, 9.2592e-03]], device='cuda:0',
  24687. grad_fn=<AddmmBackward>)
  24688. landmarks are: tensor([[[ 0.5326, -0.4390, 1.7557, 0.0851, -0.5192, -0.0919, 0.3180,
  24689. 0.0620],
  24690. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  24691. 0.3931],
  24692. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  24693. 0.5401],
  24694. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  24695. 0.3265],
  24696. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  24697. 0.0620],
  24698. [ 0.5258, -0.4610, 1.5882, 0.4085, -0.3517, -0.0072, 0.0910,
  24699. -0.0550],
  24700. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  24701. 0.1133],
  24702. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  24703. 0.0141]]], device='cuda:0')
  24704. loss_train_step before backward: tensor(0.0324, device='cuda:0', grad_fn=<MseLossBackward>)
  24705. loss_train_step after backward: tensor(0.0324, device='cuda:0', grad_fn=<MseLossBackward>)
  24706. loss_train: 1.1217780141159892
  24707. step: 39
  24708. running loss: 0.028763538823486902
  24709. Train Steps: 39/90 Loss: 0.0288 torch.Size([8, 600, 800])
  24710. torch.Size([8, 8])
  24711. tensor([[0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  24712. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  24713. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  24714. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  24715. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  24716. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  24717. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  24718. [0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748]],
  24719. device='cuda:0', dtype=torch.float64)
  24720. predictions are: tensor([[ 0.6440, -0.3332, 1.7672, -0.0498, -0.3202, 0.0893, 0.1455, 0.0761],
  24721. [ 0.5725, -0.4177, 1.4867, 0.1828, -0.4769, -0.0204, 1.0719, 0.2339],
  24722. [ 0.5976, -0.4119, 1.8482, -0.3967, -0.5806, -0.0978, 0.7626, 0.1046],
  24723. [ 0.4039, -0.4856, 1.5727, -0.4861, -0.6485, -0.5054, 0.4126, 0.3674],
  24724. [ 0.8189, -0.2302, 1.6996, 0.4369, -0.4249, -0.1943, 0.2815, 0.3349],
  24725. [ 0.6293, -0.3363, 1.3477, -1.3669, -0.4102, -1.0134, 0.5384, 0.2066],
  24726. [ 0.5771, -0.4255, 1.9855, -0.3066, -0.2413, -0.5252, 1.0077, 0.2510],
  24727. [ 0.0591, -0.7700, 1.8177, 0.0866, -0.3968, -0.5449, 0.8709, 0.1763]],
  24728. device='cuda:0', grad_fn=<AddmmBackward>)
  24729. landmarks are: tensor([[[ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  24730. 0.4032],
  24731. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  24732. 0.3478],
  24733. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  24734. 0.0985],
  24735. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  24736. 0.5491],
  24737. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  24738. 0.4624],
  24739. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  24740. 0.2776],
  24741. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  24742. 0.4600],
  24743. [ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  24744. 0.3692]]], device='cuda:0')
  24745. loss_train_step before backward: tensor(0.0169, device='cuda:0', grad_fn=<MseLossBackward>)
  24746. loss_train_step after backward: tensor(0.0169, device='cuda:0', grad_fn=<MseLossBackward>)
  24747. loss_train: 1.1386554995551705
  24748. step: 40
  24749. running loss: 0.028466387488879263
  24750. Train Steps: 40/90 Loss: 0.0285 torch.Size([8, 600, 800])
  24751. torch.Size([8, 8])
  24752. tensor([[0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  24753. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  24754. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  24755. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  24756. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  24757. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  24758. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  24759. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133]],
  24760. device='cuda:0', dtype=torch.float64)
  24761. predictions are: tensor([[ 0.6078, -0.3606, 1.5451, -0.5208, -0.7137, -0.4924, 0.4499, 0.2869],
  24762. [ 0.7464, -0.3133, 1.7544, 0.2531, -0.5698, -0.1807, 1.0396, 0.2625],
  24763. [ 0.3502, -0.5323, 1.8783, -0.4356, -0.3516, -1.3380, 0.7168, 0.1584],
  24764. [ 0.4409, -0.4870, 1.5813, -0.2868, -0.5962, -0.1480, 0.2479, 0.2000],
  24765. [ 0.5728, -0.4096, 1.6914, -0.2556, -0.5003, 0.0082, 0.4210, 0.1230],
  24766. [ 0.3514, -0.5419, 1.7136, 0.0634, -0.1271, -0.0333, 0.4373, 0.2821],
  24767. [ 0.8080, -0.2471, 1.7488, -0.1996, -0.3355, 0.0799, 0.5897, 0.2356],
  24768. [ 0.6162, -0.4141, 1.7027, 0.1096, -0.3821, 0.1523, 1.0530, 0.2057]],
  24769. device='cuda:0', grad_fn=<AddmmBackward>)
  24770. landmarks are: tensor([[[ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  24771. 0.2365],
  24772. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  24773. 0.1608],
  24774. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  24775. -0.0529],
  24776. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  24777. 0.0502],
  24778. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  24779. 0.0231],
  24780. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  24781. 0.3392],
  24782. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  24783. 0.2699],
  24784. [ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  24785. 0.0852]]], device='cuda:0')
  24786. loss_train_step before backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  24787. loss_train_step after backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  24788. loss_train: 1.1536407247185707
  24789. step: 41
  24790. running loss: 0.028137578651672455
  24791.  
  24792. Train Steps: 41/90 Loss: 0.0281 torch.Size([8, 600, 800])
  24793. torch.Size([8, 8])
  24794. tensor([[0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  24795. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  24796. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  24797. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  24798. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  24799. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  24800. [0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  24801. [0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567]],
  24802. device='cuda:0', dtype=torch.float64)
  24803. predictions are: tensor([[ 0.8460, -0.2558, 1.8253, 0.0117, -0.2213, -0.0403, 0.4005, 0.2357],
  24804. [ 0.7772, -0.2915, 1.8138, 0.0177, -0.2384, 0.2574, 0.7008, 0.2388],
  24805. [ 0.4894, -0.4668, 1.1931, -1.0988, -0.6886, -0.7637, 0.4019, 0.1059],
  24806. [ 0.4321, -0.5275, 1.7577, 0.3191, -0.4827, -0.1046, 0.5689, 0.3247],
  24807. [ 0.0895, -0.7132, 1.6919, 0.1463, -0.7607, -0.6208, 0.4622, 0.2670],
  24808. [ 0.5809, -0.4362, 1.8019, 0.0882, -0.4585, 0.2636, 1.0704, 0.2819],
  24809. [ 0.4095, -0.5098, 1.3689, -1.2173, -0.2903, -1.4032, 0.7033, 0.1959],
  24810. [ 0.7698, -0.3002, 1.7510, 0.2490, -0.5625, 0.0499, 0.6418, 0.3161]],
  24811. device='cuda:0', grad_fn=<AddmmBackward>)
  24812. landmarks are: tensor([[[ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  24813. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  24814. [ 5.7090e-01, -3.9330e-01, 1.7961e+00, -2.2633e-02, -1.9007e-01,
  24815. 3.9307e-01, 6.1824e-01, 2.0831e-01],
  24816. [ 5.0092e-01, -4.3333e-01, 1.1090e+00, -1.1158e+00, -6.9815e-01,
  24817. -7.3087e-01, 2.6170e-01, 6.2199e-02],
  24818. [ 5.8834e-01, -3.5935e-01, 1.7557e+00, 2.5450e-01, -4.1524e-01,
  24819. -6.1124e-02, 3.3533e-01, 3.0069e-01],
  24820. [ 5.6966e-01, -4.5138e-01, 1.7420e+00, 2.6720e-01, -6.0553e-01,
  24821. -6.3118e-01, 3.4489e-01, 2.0578e-01],
  24822. [ 6.2072e-01, -4.2731e-01, 1.7557e+00, 2.3557e-02, -4.3256e-01,
  24823. 3.6228e-01, 1.0033e+00, 3.1574e-01],
  24824. [ 6.1577e-01, -4.2249e-01, 1.3307e+00, -1.3253e+00, -1.9244e-01,
  24825. -1.3252e+00, 6.7213e-01, 1.7271e-01],
  24826. [ 5.7696e-01, -3.9176e-01, 1.7961e+00, 1.5443e-01, -5.4804e-01,
  24827. 1.4673e-01, 4.4503e-01, 2.8530e-01]]], device='cuda:0')
  24828. loss_train_step before backward: tensor(0.0151, device='cuda:0', grad_fn=<MseLossBackward>)
  24829. loss_train_step after backward: tensor(0.0151, device='cuda:0', grad_fn=<MseLossBackward>)
  24830. loss_train: 1.168755921535194
  24831. step: 42
  24832. running loss: 0.027827521941314142
  24833. Train Steps: 42/90 Loss: 0.0278 torch.Size([8, 600, 800])
  24834. torch.Size([8, 8])
  24835. tensor([[ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  24836. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496],
  24837. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  24838. [0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947],
  24839. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  24840. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  24841. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  24842. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578]],
  24843. device='cuda:0', dtype=torch.float64)
  24844. predictions are: tensor([[-2.3789, -2.3153, 1.4070, -1.0507, -0.0678, -1.0513, 0.8482, 0.3953],
  24845. [ 0.8099, -0.2315, 1.6563, -0.7828, -0.4231, -0.8245, 0.5477, 0.2148],
  24846. [ 0.8783, -0.2303, 1.5719, 0.3158, -0.5748, 0.1391, 0.9184, 0.1658],
  24847. [ 0.7176, -0.2993, 1.4880, -0.9552, -0.0990, -1.3317, 0.5871, 0.2044],
  24848. [ 0.6668, -0.3495, 1.7761, 0.3125, -0.7050, -0.3645, 0.2513, 0.0879],
  24849. [ 0.7174, -0.3138, 1.5611, -0.6533, -0.6790, -0.3239, 0.7629, 0.2343],
  24850. [ 0.6578, -0.3283, 1.6729, 0.4010, -0.5496, 0.0428, 0.5500, 0.2054],
  24851. [ 0.7935, -0.2433, 0.9686, -1.1348, -0.4325, -1.1478, 0.3664, 0.3375]],
  24852. device='cuda:0', grad_fn=<AddmmBackward>)
  24853. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 1.7210e+00, -9.7721e-01, 1.8522e-01,
  24854. -1.3698e+00, 7.9859e-01, 3.1039e-01],
  24855. [ 5.7904e-01, -4.0308e-01, 1.6915e+00, -9.5640e-01, -4.1518e-01,
  24856. -1.1063e+00, 4.4251e-01, 2.5281e-01],
  24857. [ 6.1907e-01, -4.2971e-01, 1.4612e+00, 2.3911e-01, -4.9607e-01,
  24858. 3.1255e-02, 1.1166e+00, 1.7680e-01],
  24859. [ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  24860. -1.5777e+00, 6.0099e-01, -9.2270e-04],
  24861. [ 5.3788e-01, -4.3580e-01, 1.7326e+00, 1.8522e-01, -6.0577e-01,
  24862. -5.4611e-01, 6.8408e-02, -3.0981e-02],
  24863. [ 5.6966e-01, -4.5379e-01, 1.5308e+00, -8.7027e-01, -6.5720e-01,
  24864. -3.6388e-01, 5.7392e-01, 1.5759e-01],
  24865. [ 6.1149e-01, -3.7244e-01, 1.7557e+00, 3.4688e-01, -4.4411e-01,
  24866. -1.0731e-01, 4.9122e-01, 2.3911e-01],
  24867. [ 5.2315e-01, -4.1886e-01, 9.3580e-01, -1.4006e+00, -3.9215e-01,
  24868. -1.3698e+00, 2.5553e-01, 2.9064e-01]]], device='cuda:0')
  24869. loss_train_step before backward: tensor(0.0226, device='cuda:0', grad_fn=<MseLossBackward>)
  24870. loss_train_step after backward: tensor(0.0226, device='cuda:0', grad_fn=<MseLossBackward>)
  24871. loss_train: 1.1913132583722472
  24872. step: 43
  24873. running loss: 0.027704959497029006
  24874. Train Steps: 43/90 Loss: 0.0277 torch.Size([8, 600, 800])
  24875. torch.Size([8, 8])
  24876. tensor([[0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  24877. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  24878. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  24879. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  24880. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  24881. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  24882. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  24883. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383]],
  24884. device='cuda:0', dtype=torch.float64)
  24885. predictions are: tensor([[ 0.7687, -0.3415, 1.8001, -0.9061, 0.0913, -1.0675, 1.0970, 0.1657],
  24886. [ 0.6264, -0.3643, 1.4945, 0.0356, -0.5496, -0.5861, 0.2921, 0.4837],
  24887. [ 0.4643, -0.4759, 1.1842, -1.0252, -0.4246, -1.0295, 0.3400, 0.2287],
  24888. [ 0.8361, -0.2656, 1.6420, -0.5933, -0.7136, -0.2909, 0.6242, 0.2097],
  24889. [ 0.8740, -0.2414, 1.6095, 0.5303, -0.4926, 0.1541, 0.4730, 0.3609],
  24890. [ 0.6245, -0.4205, 1.4561, -1.2001, -0.3846, -1.1205, 0.6975, 0.0619],
  24891. [ 1.0365, -0.1871, 1.9594, 0.1347, -0.6793, -0.2144, 0.7839, 0.0429],
  24892. [-2.2615, -2.2909, 1.0155, -0.9692, -0.4837, -1.0926, 0.3438, 0.3451]],
  24893. device='cuda:0', grad_fn=<AddmmBackward>)
  24894. landmarks are: tensor([[[ 6.2072e-01, -3.9360e-01, 1.7788e+00, -1.1235e+00, 1.4480e-01,
  24895. -1.0850e+00, 1.1459e+00, 1.9818e-01],
  24896. [ 6.0687e-01, -3.3095e-01, 1.3742e+00, -1.4927e-01, -5.3649e-01,
  24897. -9.5412e-01, 2.8843e-01, 5.0705e-01],
  24898. [ 5.7460e-01, -4.1527e-01, 1.0917e+00, -1.1620e+00, -4.0370e-01,
  24899. -1.3082e+00, 3.2339e-01, 3.2671e-01],
  24900. [ 5.7794e-01, -4.2748e-01, 1.5894e+00, -8.3617e-01, -6.5774e-01,
  24901. -5.1532e-01, 5.6051e-01, 2.0062e-01],
  24902. [ 6.1339e-01, -3.9099e-01, 1.4497e+00, 3.5458e-01, -3.5173e-01,
  24903. -9.1917e-02, 3.2956e-01, 5.2394e-01],
  24904. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  24905. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  24906. [ 6.3718e-01, -4.1286e-01, 1.8942e+00, -7.6520e-02, -6.1732e-01,
  24907. -4.7683e-01, 6.9989e-01, 3.2524e-02],
  24908. [-2.2859e+00, -2.2859e+00, 1.0712e+00, -1.2085e+00, -3.8060e-01,
  24909. -1.3929e+00, 7.5520e-02, 2.0062e-01]]], device='cuda:0')
  24910. loss_train_step before backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  24911. loss_train_step after backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  24912. loss_train: 1.2166265537962317
  24913. step: 44
  24914. running loss: 0.027650603495368905
  24915.  
  24916. Train Steps: 44/90 Loss: 0.0277 torch.Size([8, 600, 800])
  24917. torch.Size([8, 8])
  24918. tensor([[0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  24919. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  24920. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  24921. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  24922. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  24923. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  24924. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  24925. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695]],
  24926. device='cuda:0', dtype=torch.float64)
  24927. predictions are: tensor([[ 0.3303, -0.6281, 1.9273, -0.1490, -0.3484, -0.8306, 1.1438, 0.2584],
  24928. [ 0.4734, -0.4978, 1.7926, -0.0348, -0.6413, -0.0802, 0.6553, 0.2107],
  24929. [ 0.5969, -0.3857, 1.6875, -0.2029, -0.6595, -0.4201, 0.2257, 0.2553],
  24930. [ 0.5582, -0.4341, 1.7493, 0.0950, -0.6047, -0.2364, 0.6304, 0.2153],
  24931. [ 0.9523, -0.1903, 1.3590, -1.0891, -0.0964, -1.3481, 0.5336, 0.0817],
  24932. [ 0.5434, -0.4403, 1.5534, 0.2962, -0.5464, -0.3564, 0.3453, 0.4208],
  24933. [ 0.6677, -0.3801, 1.7239, -0.2702, -0.4015, 0.3340, 0.7229, 0.3309],
  24934. [ 0.0454, -0.7430, 0.8856, -1.2511, -0.3786, -1.2249, 0.1690, 0.3114]],
  24935. device='cuda:0', grad_fn=<AddmmBackward>)
  24936. landmarks are: tensor([[[ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  24937. 0.3692],
  24938. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  24939. 0.3084],
  24940. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  24941. 0.2468],
  24942. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  24943. 0.2545],
  24944. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  24945. -0.0168],
  24946. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  24947. 0.4778],
  24948. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  24949. 0.4701],
  24950. [ 0.5544, -0.4133, 0.8145, -1.2082, -0.4268, -1.3544, 0.1221,
  24951. 0.3446]]], device='cuda:0')
  24952. loss_train_step before backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  24953. loss_train_step after backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  24954. loss_train: 1.2349761677905917
  24955. step: 45
  24956. running loss: 0.027443914839790928
  24957. Train Steps: 45/90 Loss: 0.0274 torch.Size([8, 600, 800])
  24958. torch.Size([8, 8])
  24959. tensor([[0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  24960. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  24961. [0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  24962. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  24963. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  24964. [0.6229, 0.4066, 0.7612, 0.2967, 0.4250, 0.2167, 0.5925, 0.5350],
  24965. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  24966. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383]],
  24967. device='cuda:0', dtype=torch.float64)
  24968. predictions are: tensor([[ 0.9098, -0.2486, 1.7183, 0.3586, -0.4905, -0.0874, 0.6515, 0.0615],
  24969. [ 0.8520, -0.2772, 1.7976, -0.0532, -0.5135, -0.2319, 0.7554, 0.2187],
  24970. [ 0.7001, -0.3704, 1.6785, 0.3245, -0.5234, -0.0619, 0.8263, 0.1866],
  24971. [ 0.9059, -0.2046, 1.4341, -1.0454, -0.3405, -1.1364, 0.4722, 0.2305],
  24972. [ 0.4765, -0.4984, 1.7903, -0.3978, -0.5214, 0.2342, 0.6698, 0.2583],
  24973. [ 0.7447, -0.3002, 1.2680, -1.0002, -0.2925, -1.2363, 0.4049, 0.2539],
  24974. [ 0.6188, -0.3739, 1.7510, -0.1212, -0.6343, -0.6131, 0.1172, 0.2812],
  24975. [-1.8595, -2.0222, 1.0496, -1.0688, -0.3478, -1.2907, 0.3034, 0.3780]],
  24976. device='cuda:0', grad_fn=<AddmmBackward>)
  24977. landmarks are: tensor([[[ 6.3949e-01, -4.2132e-01, 1.7037e+00, 3.6228e-01, -4.3256e-01,
  24978. -1.0731e-01, 6.5602e-01, -4.8817e-03],
  24979. [ 6.0754e-01, -4.5138e-01, 1.8032e+00, -8.2167e-02, -5.0606e-01,
  24980. -2.0228e-01, 6.2076e-01, 1.7788e-01],
  24981. [ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  24982. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  24983. [ 5.7962e-01, -3.8776e-01, 1.3688e+00, -1.0542e+00, -4.0947e-01,
  24984. -1.1312e+00, 5.8938e-01, 1.9292e-01],
  24985. [ 5.8857e-01, -4.2525e-01, 1.8654e+00, -3.4596e-01, -5.4804e-01,
  24986. 3.6228e-01, 6.5866e-01, 1.0054e-01],
  24987. [ 5.9107e-01, -4.0805e-01, 1.2303e+00, -9.1563e-01, -3.2286e-01,
  24988. -1.2851e+00, 4.5081e-01, 1.8522e-01],
  24989. [ 5.4434e-01, -3.9938e-01, 1.7499e+00, -1.2271e-01, -6.1732e-01,
  24990. -5.7691e-01, 4.8756e-03, 2.0706e-01],
  24991. [-2.2859e+00, -2.2859e+00, 1.0712e+00, -1.2085e+00, -3.8060e-01,
  24992. -1.3929e+00, 7.5520e-02, 2.0062e-01]]], device='cuda:0')
  24993. loss_train_step before backward: tensor(0.0147, device='cuda:0', grad_fn=<MseLossBackward>)
  24994. loss_train_step after backward: tensor(0.0147, device='cuda:0', grad_fn=<MseLossBackward>)
  24995. loss_train: 1.2496287617832422
  24996. step: 46
  24997. running loss: 0.027165842647461788
  24998. Train Steps: 46/90 Loss: 0.0272 torch.Size([8, 600, 800])
  24999. torch.Size([8, 8])
  25000. tensor([[0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  25001. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  25002. [0.6357, 0.4097, 0.9038, 0.3883, 0.4213, 0.2950, 0.6686, 0.5390],
  25003. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  25004. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  25005. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  25006. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  25007. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585]],
  25008. device='cuda:0', dtype=torch.float64)
  25009. predictions are: tensor([[ 0.6078, -0.4097, 1.7259, -0.0724, -0.5862, -0.7533, 0.3447, 0.1366],
  25010. [ 0.5774, -0.4651, 1.8405, -0.4214, -0.6620, -0.7016, 0.6259, 0.1238],
  25011. [ 0.5436, -0.4845, 1.7181, -0.5656, -0.4144, -0.8562, 0.7794, 0.1202],
  25012. [ 0.5757, -0.4130, 1.6117, 0.2724, -0.5682, -0.5975, 0.3891, 0.3914],
  25013. [ 0.5848, -0.4938, 1.6619, -1.2172, 0.1144, -1.1763, 1.1502, 0.1497],
  25014. [ 0.5044, -0.4762, 1.2517, -0.6019, -0.6974, -0.6827, 0.2724, 0.4284],
  25015. [ 0.3666, -0.5354, 1.0874, -0.8050, -0.0549, -1.2401, 0.2733, 0.4696],
  25016. [-0.0309, -0.8409, 1.6236, -0.3864, -0.3763, 0.3611, 0.4533, 0.2188]],
  25017. device='cuda:0', grad_fn=<AddmmBackward>)
  25018. landmarks are: tensor([[[ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  25019. 0.1852],
  25020. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  25021. 0.1390],
  25022. [ 0.6504, -0.3936, 1.8885, -0.4922, -0.3402, -0.9233, 0.8022,
  25023. 0.2035],
  25024. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  25025. 0.5612],
  25026. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  25027. 0.1982],
  25028. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  25029. 0.4470],
  25030. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  25031. 0.5624],
  25032. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  25033. 0.2936]]], device='cuda:0')
  25034. loss_train_step before backward: tensor(0.0190, device='cuda:0', grad_fn=<MseLossBackward>)
  25035. loss_train_step after backward: tensor(0.0190, device='cuda:0', grad_fn=<MseLossBackward>)
  25036. loss_train: 1.2686103787273169
  25037. step: 47
  25038. running loss: 0.026991710185687592
  25039. Train Steps: 47/90 Loss: 0.0270 torch.Size([8, 600, 800])
  25040. torch.Size([8, 8])
  25041. tensor([[0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  25042. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  25043. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  25044. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  25045. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  25046. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  25047. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  25048. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567]],
  25049. device='cuda:0', dtype=torch.float64)
  25050. predictions are: tensor([[ 0.7934, -0.2449, 1.5154, 0.1089, -0.4596, -0.0577, 0.1022, 0.1616],
  25051. [ 0.7675, -0.2803, 1.3185, -0.8539, -0.6104, -0.9508, 0.4776, 0.2612],
  25052. [ 0.7659, -0.2658, 1.7689, -0.0246, -0.5172, -0.0341, 0.4878, 0.2810],
  25053. [-1.6360, -1.8705, 1.5813, -0.9753, 0.1505, -1.2824, 1.0845, 0.4963],
  25054. [ 0.7661, -0.2863, 1.3170, -0.9580, -0.6673, -0.7572, 0.3504, 0.1004],
  25055. [ 1.1099, -0.0842, 1.4959, -0.8644, -0.0398, -1.5079, 0.7408, 0.0879],
  25056. [ 0.8245, -0.2819, 1.6245, 0.2629, -0.2925, 0.0168, 0.4868, 0.1323],
  25057. [-1.3622, -1.6601, 1.1851, -0.9392, -0.4514, -1.1801, 0.2310, 0.3086]],
  25058. device='cuda:0', grad_fn=<AddmmBackward>)
  25059. landmarks are: tensor([[[ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  25060. 0.1530],
  25061. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  25062. 0.1931],
  25063. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  25064. 0.2776],
  25065. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  25066. 0.5188],
  25067. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  25068. 0.0412],
  25069. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  25070. 0.1020],
  25071. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  25072. 0.0942],
  25073. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  25074. 0.2853]]], device='cuda:0')
  25075. loss_train_step before backward: tensor(0.0482, device='cuda:0', grad_fn=<MseLossBackward>)
  25076. loss_train_step after backward: tensor(0.0482, device='cuda:0', grad_fn=<MseLossBackward>)
  25077. loss_train: 1.3167862426489592
  25078. step: 48
  25079. running loss: 0.027433046721853316
  25080.  
  25081. Train Steps: 48/90 Loss: 0.0274 torch.Size([8, 600, 800])
  25082. torch.Size([8, 8])
  25083. tensor([[0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  25084. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  25085. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  25086. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  25087. [0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  25088. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  25089. [0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297],
  25090. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297]],
  25091. device='cuda:0', dtype=torch.float64)
  25092. predictions are: tensor([[ 0.6029, -0.4274, 1.6532, -0.8771, -0.5784, -0.8858, 0.4872, 0.2820],
  25093. [ 0.3579, -0.5499, 1.8201, -0.1189, -0.1082, -0.1930, 0.1005, 0.1570],
  25094. [ 0.2582, -0.6223, 1.5448, -0.6216, -0.5208, -0.6415, 0.1641, 0.4178],
  25095. [ 0.4707, -0.5316, 1.7071, -0.0668, -0.2033, -0.1684, 0.5052, 0.3034],
  25096. [ 0.5893, -0.4368, 1.6961, 0.2884, -0.4750, -0.2678, 0.7490, 0.2008],
  25097. [ 0.4832, -0.4854, 1.1430, -1.1649, -0.5456, -0.9242, 0.1531, 0.1965],
  25098. [ 0.5110, -0.4910, 1.6933, 0.1101, -0.4684, -0.2975, 0.7455, 0.2333],
  25099. [ 0.6602, -0.4004, 1.7785, 0.1148, -0.5072, -0.3808, 0.7389, 0.2826]],
  25100. device='cuda:0', grad_fn=<AddmmBackward>)
  25101. landmarks are: tensor([[[ 5.6801e-01, -4.3934e-01, 1.5920e+00, -6.6715e-01, -6.4527e-01,
  25102. -5.4566e-01, 5.1492e-01, 1.7534e-01],
  25103. [ 5.5155e-01, -4.2249e-01, 1.7788e+00, -5.3426e-02, -2.0162e-01,
  25104. 1.9292e-01, 1.5683e-01, 6.8210e-02],
  25105. [ 5.3672e-01, -4.2941e-01, 1.5709e+00, -4.9992e-01, -6.6928e-01,
  25106. -3.0747e-01, 2.4546e-01, 3.5585e-01],
  25107. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  25108. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  25109. [ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  25110. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  25111. [ 5.3031e-01, -4.3841e-01, 1.0975e+00, -1.0542e+00, -6.9238e-01,
  25112. -6.6159e-01, 1.5477e-01, 4.4164e-02],
  25113. [ 6.2072e-01, -4.4656e-01, 1.7326e+00, 1.6212e-01, -5.4804e-01,
  25114. -1.0731e-01, 9.7040e-01, 1.6077e-01],
  25115. [ 6.5201e-01, -4.0323e-01, 1.8076e+00, 1.8522e-01, -5.7113e-01,
  25116. -1.3811e-01, 7.8762e-01, 1.6077e-01]]], device='cuda:0')
  25117. loss_train_step before backward: tensor(0.0196, device='cuda:0', grad_fn=<MseLossBackward>)
  25118. loss_train_step after backward: tensor(0.0196, device='cuda:0', grad_fn=<MseLossBackward>)
  25119. loss_train: 1.336402228102088
  25120. step: 49
  25121. running loss: 0.027273514859226286
  25122. Train Steps: 49/90 Loss: 0.0273 torch.Size([8, 600, 800])
  25123. torch.Size([8, 8])
  25124. tensor([[0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  25125. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  25126. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  25127. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  25128. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  25129. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  25130. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  25131. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700]],
  25132. device='cuda:0', dtype=torch.float64)
  25133. predictions are: tensor([[ 0.4697, -0.4949, 1.2264, -1.1615, -0.3115, -1.3537, 0.3968, 0.1538],
  25134. [ 0.4581, -0.5103, 1.2444, -1.2177, -0.2020, -1.4147, 0.4720, 0.1634],
  25135. [ 0.7304, -0.3405, 1.2307, -0.9687, -0.2543, -1.3712, 0.4215, 0.2137],
  25136. [ 0.5282, -0.5000, 1.8005, 0.1556, -0.2945, -0.0716, 0.3245, 0.3234],
  25137. [-0.5072, -1.1353, 0.9631, -1.1802, -0.3185, -1.3331, 0.3396, 0.2513],
  25138. [ 0.3824, -0.5971, 1.8023, 0.2948, -0.4119, 0.2892, 1.0153, 0.3397],
  25139. [ 0.5125, -0.4644, 1.8052, -0.4985, -0.6533, -0.4799, 0.4674, 0.3349],
  25140. [ 0.4898, -0.4892, 1.6309, -0.3511, -0.6462, -0.5951, 0.1274, 0.1258]],
  25141. device='cuda:0', grad_fn=<AddmmBackward>)
  25142. landmarks are: tensor([[[ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  25143. 0.0774],
  25144. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  25145. 0.1082],
  25146. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  25147. 0.1449],
  25148. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  25149. 0.3700],
  25150. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  25151. 0.1013],
  25152. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  25153. 0.3371],
  25154. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  25155. 0.3392],
  25156. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  25157. -0.1151]]], device='cuda:0')
  25158. loss_train_step before backward: tensor(0.0342, device='cuda:0', grad_fn=<MseLossBackward>)
  25159. loss_train_step after backward: tensor(0.0342, device='cuda:0', grad_fn=<MseLossBackward>)
  25160. loss_train: 1.370650378987193
  25161. step: 50
  25162. running loss: 0.027413007579743864
  25163. Train Steps: 50/90 Loss: 0.0274 torch.Size([8, 600, 800])
  25164. torch.Size([8, 8])
  25165. tensor([[0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  25166. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  25167. [0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  25168. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  25169. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  25170. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  25171. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  25172. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072]],
  25173. device='cuda:0', dtype=torch.float64)
  25174. predictions are: tensor([[ 0.5260, -0.4512, 1.5853, -0.1327, -0.3905, 0.0258, 0.3438, 0.2133],
  25175. [ 0.7047, -0.3586, 1.7669, -0.6288, -0.3302, -0.8932, 0.9293, 0.2138],
  25176. [ 0.6988, -0.2873, 1.4754, -0.5759, -0.5988, -0.5795, 0.3050, 0.4355],
  25177. [ 0.7808, -0.3050, 1.6218, 0.2099, -0.4843, -0.3894, 0.3224, 0.0286],
  25178. [ 0.6624, -0.3391, 1.5512, -0.4366, -0.5093, -0.2878, 0.2257, 0.2136],
  25179. [ 0.5930, -0.4043, 1.6772, -0.0725, -0.2312, -0.2132, 0.0442, -0.0188],
  25180. [ 0.5222, -0.4644, 1.6615, -0.3672, -0.5627, -0.3673, 0.6173, 0.2334],
  25181. [-1.8953, -2.0281, 1.5608, -1.1411, 0.3558, -1.4730, 1.0002, 0.4625]],
  25182. device='cuda:0', grad_fn=<AddmmBackward>)
  25183. landmarks are: tensor([[[ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  25184. 0.3047],
  25185. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  25186. 0.2676],
  25187. [ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  25188. 0.5239],
  25189. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  25190. 0.0919],
  25191. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  25192. 0.2468],
  25193. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  25194. -0.0099],
  25195. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  25196. 0.0985],
  25197. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  25198. 0.5188]]], device='cuda:0')
  25199. loss_train_step before backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  25200. loss_train_step after backward: tensor(0.0200, device='cuda:0', grad_fn=<MseLossBackward>)
  25201. loss_train: 1.3906042091548443
  25202. step: 51
  25203. running loss: 0.027266749199114593
  25204. Train Steps: 51/90 Loss: 0.0273 torch.Size([8, 600, 800])
  25205. torch.Size([8, 8])
  25206. tensor([[0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  25207. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  25208. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  25209. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  25210. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  25211. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  25212. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  25213. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676]],
  25214. device='cuda:0', dtype=torch.float64)
  25215. predictions are: tensor([[ 0.4308, -0.5393, 1.9275, -0.0703, -0.3942, -0.2634, 0.1682, 0.1026],
  25216. [ 0.3524, -0.5766, 1.8549, -0.2104, -0.5534, -0.6176, 0.5192, 0.3368],
  25217. [ 0.3679, -0.5808, 1.7765, -0.1534, -0.5801, 0.0536, 0.4781, 0.1789],
  25218. [ 0.4266, -0.5153, 1.0804, -1.1756, -0.2470, -1.4130, 0.3684, 0.2618],
  25219. [ 0.5300, -0.4728, 1.1145, -1.2576, -0.2983, -1.2850, 0.6322, 0.2698],
  25220. [ 0.2888, -0.6171, 1.1986, -1.1513, -0.3956, -1.0440, 0.6077, 0.2181],
  25221. [ 0.6086, -0.4195, 1.2452, -0.9810, -0.4951, -1.0781, 0.2751, 0.0469],
  25222. [ 0.2659, -0.6734, 1.8575, 0.0737, -0.0717, -0.0615, 0.3565, 0.3574]],
  25223. device='cuda:0', grad_fn=<AddmmBackward>)
  25224. landmarks are: tensor([[[ 5.6634e-01, -3.9546e-01, 1.7788e+00, -2.3818e-01, -4.0370e-01,
  25225. -2.6898e-01, 8.2802e-02, -2.1963e-02],
  25226. [ 5.8799e-01, -3.8868e-01, 1.8423e+00, -3.3056e-01, -6.2309e-01,
  25227. -5.2302e-01, 4.0462e-01, 1.5443e-01],
  25228. [ 4.9740e-01, -4.4819e-01, 1.6633e+00, -3.3056e-01, -6.1732e-01,
  25229. 1.3133e-01, 2.9255e-01, 8.0947e-03],
  25230. [ 5.8505e-01, -3.9246e-01, 1.0513e+00, -1.3467e+00, -3.5173e-01,
  25231. -1.2620e+00, 4.7390e-01, 1.5443e-01],
  25232. [ 5.7841e-01, -4.0847e-01, 1.0859e+00, -1.3929e+00, -4.0370e-01,
  25233. -1.1158e+00, 5.6051e-01, 2.4681e-01],
  25234. [ 5.8909e-01, -3.9369e-01, 1.1494e+00, -1.2390e+00, -5.0762e-01,
  25235. -9.6952e-01, 4.7968e-01, 1.3903e-01],
  25236. [ 4.9971e-01, -4.4465e-01, 1.1610e+00, -9.7721e-01, -6.0577e-01,
  25237. -1.0311e+00, 1.4038e-01, -1.0312e-01],
  25238. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  25239. 4.6189e-04, 2.9049e-01, 3.3573e-01]]], device='cuda:0')
  25240. loss_train_step before backward: tensor(0.0164, device='cuda:0', grad_fn=<MseLossBackward>)
  25241. loss_train_step after backward: tensor(0.0164, device='cuda:0', grad_fn=<MseLossBackward>)
  25242. loss_train: 1.4069728069007397
  25243. step: 52
  25244. running loss: 0.027057169363475762
  25245.  
  25246. Train Steps: 52/90 Loss: 0.0271 torch.Size([8, 600, 800])
  25247. torch.Size([8, 8])
  25248. tensor([[0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  25249. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  25250. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  25251. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  25252. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  25253. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  25254. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  25255. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466]],
  25256. device='cuda:0', dtype=torch.float64)
  25257. predictions are: tensor([[ 0.6663, -0.3088, 1.6004, 0.0154, -0.4911, -0.6876, 0.0623, 0.3197],
  25258. [ 0.8698, -0.2878, 1.8808, -0.0299, -0.4834, -0.4837, 0.6643, 0.0741],
  25259. [ 0.7847, -0.2747, 1.7890, -0.5887, -0.5645, -0.3924, 0.5472, 0.3043],
  25260. [ 0.5769, -0.4142, 1.6525, -0.7106, -0.5385, 0.0847, 0.6281, 0.2195],
  25261. [-2.3713, -2.3257, 1.1043, -1.3198, -0.1935, -1.3207, 0.1519, 0.2115],
  25262. [ 0.7094, -0.3830, 1.8119, -0.5825, -0.2013, -0.9141, 0.9488, 0.0407],
  25263. [ 0.3497, -0.5628, 0.9207, -1.2847, -0.1244, -1.5964, 0.2215, 0.2328],
  25264. [ 0.5139, -0.4596, 1.3448, -0.5620, -0.5908, -0.3688, 0.0872, 0.2178]],
  25265. device='cuda:0', grad_fn=<AddmmBackward>)
  25266. landmarks are: tensor([[[ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  25267. 0.4393],
  25268. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  25269. 0.0325],
  25270. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  25271. 0.3315],
  25272. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  25273. 0.2083],
  25274. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  25275. 0.2930],
  25276. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  25277. 0.1821],
  25278. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  25279. 0.2699],
  25280. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  25281. 0.2386]]], device='cuda:0')
  25282. loss_train_step before backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  25283. loss_train_step after backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  25284. loss_train: 1.4172964449971914
  25285. step: 53
  25286. running loss: 0.026741442358437575
  25287. Train Steps: 53/90 Loss: 0.0267 torch.Size([8, 600, 800])
  25288. torch.Size([8, 8])
  25289. tensor([[0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  25290. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  25291. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  25292. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  25293. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  25294. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  25295. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  25296. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317]],
  25297. device='cuda:0', dtype=torch.float64)
  25298. predictions are: tensor([[ 0.5588, -0.4190, 1.8389, -0.3034, -0.4850, 0.2965, 0.6388, 0.2382],
  25299. [ 0.5971, -0.3907, 1.5570, -0.6910, -0.6359, -0.7238, 0.2675, 0.2644],
  25300. [ 0.5777, -0.4140, 1.4146, -1.0344, -0.2636, -1.2908, 0.4869, 0.0262],
  25301. [ 0.3478, -0.5392, 0.8901, -1.1096, -0.2750, -1.3271, 0.4063, 0.2873],
  25302. [ 0.6769, -0.3749, 1.8106, -0.0091, -0.1602, 0.2302, 0.5604, 0.2009],
  25303. [ 0.6794, -0.3695, 1.8073, -0.6632, -0.4131, -0.8047, 0.6484, 0.1249],
  25304. [-1.6592, -1.8379, 1.3722, -0.7628, -0.4710, -1.0075, -0.0038, 0.1739],
  25305. [ 0.3202, -0.5807, 1.1559, -1.1361, -0.2836, -1.1998, 0.3835, 0.2031]],
  25306. device='cuda:0', grad_fn=<AddmmBackward>)
  25307. landmarks are: tensor([[[ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  25308. 0.1852],
  25309. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  25310. 0.3315],
  25311. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  25312. 0.1195],
  25313. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  25314. 0.2622],
  25315. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  25316. 0.2237],
  25317. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  25318. 0.1390],
  25319. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  25320. 0.2837],
  25321. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  25322. 0.1698]]], device='cuda:0')
  25323. loss_train_step before backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  25324. loss_train_step after backward: tensor(0.0165, device='cuda:0', grad_fn=<MseLossBackward>)
  25325. loss_train: 1.4337830413132906
  25326. step: 54
  25327. running loss: 0.026551537802097975
  25328. Train Steps: 54/90 Loss: 0.0266 torch.Size([8, 600, 800])
  25329. torch.Size([8, 8])
  25330. tensor([[0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  25331. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791],
  25332. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  25333. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  25334. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  25335. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  25336. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  25337. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167]],
  25338. device='cuda:0', dtype=torch.float64)
  25339. predictions are: tensor([[ 0.5739, -0.4075, 1.0099, -1.2497, -0.4887, -1.0567, 0.4248, 0.2145],
  25340. [ 0.6474, -0.3825, 1.8956, 0.0107, -0.5090, 0.2286, 0.5319, 0.0127],
  25341. [-2.0089, -2.0760, 1.3973, -1.0495, -0.2714, -1.0593, 0.1613, 0.2091],
  25342. [ 0.5967, -0.3914, 1.8916, -0.0790, -0.5793, 0.0853, 0.3931, 0.1261],
  25343. [ 0.6433, -0.3461, 0.9987, -1.1937, -0.3592, -1.3822, 0.1790, 0.2450],
  25344. [ 0.6662, -0.3432, 1.2133, -1.2991, -0.4466, -1.1694, 0.4190, 0.0401],
  25345. [ 0.4311, -0.5357, 1.9630, -0.0693, -0.5812, -0.0296, 0.7530, 0.2171],
  25346. [ 0.4983, -0.3966, 1.1779, -0.7674, -0.0606, -1.3045, 0.2264, 0.4292]],
  25347. device='cuda:0', grad_fn=<AddmmBackward>)
  25348. landmarks are: tensor([[[ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  25349. 0.2930],
  25350. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  25351. -0.0731],
  25352. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  25353. 0.3007],
  25354. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  25355. 0.1525],
  25356. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  25357. 0.3007],
  25358. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  25359. 0.0213],
  25360. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  25361. 0.2516],
  25362. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  25363. 0.5624]]], device='cuda:0')
  25364. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  25365. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  25366. loss_train: 1.4424332054331899
  25367. step: 55
  25368. running loss: 0.026226058280603454
  25369. Train Steps: 55/90 Loss: 0.0262 torch.Size([8, 600, 800])
  25370. torch.Size([8, 8])
  25371. tensor([[0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  25372. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  25373. [0.6346, 0.4086, 0.7938, 0.5500, 0.3962, 0.4867, 0.7343, 0.5702],
  25374. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175],
  25375. [0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  25376. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  25377. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495],
  25378. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995]],
  25379. device='cuda:0', dtype=torch.float64)
  25380. predictions are: tensor([[ 0.4872, -0.4469, 1.7565, -0.5619, -0.4863, 0.3109, 0.5125, 0.2862],
  25381. [-1.7611, -1.9040, 0.9830, -1.3490, -0.3156, -1.5371, 0.0834, 0.3199],
  25382. [ 0.5838, -0.4097, 1.6127, 0.1440, -0.5238, -0.0731, 0.8983, 0.3705],
  25383. [ 0.5559, -0.3909, 1.0559, -1.3005, -0.4127, -1.4387, 0.2621, 0.0786],
  25384. [ 0.6276, -0.3755, 1.8506, 0.0234, -0.3498, 0.1800, 0.3969, 0.1361],
  25385. [ 0.4281, -0.5543, 1.8947, 0.0836, -0.3881, 0.0256, 0.3248, 0.0540],
  25386. [ 0.5170, -0.4141, 1.1629, -1.0955, -0.6339, -0.8938, 0.1307, 0.2361],
  25387. [ 0.7367, -0.3005, 1.2420, -1.3779, -0.4522, -1.2652, 0.4379, 0.0683]],
  25388. device='cuda:0', grad_fn=<AddmmBackward>)
  25389. landmarks are: tensor([[[ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  25390. 0.2966],
  25391. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  25392. 0.2699],
  25393. [ 0.6454, -0.3984, 1.3804, 0.2545, -0.4557, -0.0380, 1.1057,
  25394. 0.3478],
  25395. [ 0.5465, -0.4214, 0.9300, -1.2620, -0.3921, -1.3852, 0.2062,
  25396. 0.1043],
  25397. [ 0.5614, -0.4586, 1.7587, 0.0641, -0.2998, 0.1712, 0.4958,
  25398. 0.1170],
  25399. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  25400. -0.0168],
  25401. [ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  25402. 0.2522],
  25403. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  25404. 0.0213]]], device='cuda:0')
  25405. loss_train_step before backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  25406. loss_train_step after backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  25407. loss_train: 1.4570275181904435
  25408. step: 56
  25409. running loss: 0.026018348539115062
  25410.  
  25411. Train Steps: 56/90 Loss: 0.0260 torch.Size([8, 600, 800])
  25412. torch.Size([8, 8])
  25413. tensor([[0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  25414. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  25415. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  25416. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  25417. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  25418. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  25419. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  25420. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904]],
  25421. device='cuda:0', dtype=torch.float64)
  25422. predictions are: tensor([[ 0.4687, -0.4761, 1.3885, -0.9022, -0.7235, -0.3510, 0.5231, 0.1867],
  25423. [ 0.5900, -0.4263, 1.4820, -1.0055, -0.6282, -0.5480, 0.8535, 0.1611],
  25424. [ 0.5019, -0.4647, 1.1006, -1.1980, -0.0975, -1.5659, 0.3672, 0.0922],
  25425. [ 0.2821, -0.6068, 1.6277, -0.0317, -0.0875, 0.1353, -0.0203, 0.2949],
  25426. [ 0.4712, -0.5273, 1.7103, -0.5717, -0.4082, -0.7752, 0.8000, 0.1014],
  25427. [ 0.3002, -0.5729, 1.6020, -0.7157, -0.7064, -0.2938, 0.3533, 0.2870],
  25428. [ 0.1574, -0.6228, 1.4466, -0.3927, -0.6264, -0.6890, 0.0769, 0.4375],
  25429. [ 0.1880, -0.6467, 1.4838, -1.2031, -0.1930, -1.1545, 0.4361, 0.0573]],
  25430. device='cuda:0', grad_fn=<AddmmBackward>)
  25431. landmarks are: tensor([[[ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  25432. 0.1159],
  25433. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  25434. 0.1608],
  25435. [ 0.5999, -0.4236, 1.2880, -1.4083, -0.0630, -1.6393, 0.4584,
  25436. -0.0208],
  25437. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  25438. 0.3806],
  25439. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  25440. 0.1821],
  25441. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  25442. 0.3392],
  25443. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  25444. 0.3238],
  25445. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  25446. -0.0209]]], device='cuda:0')
  25447. loss_train_step before backward: tensor(0.0224, device='cuda:0', grad_fn=<MseLossBackward>)
  25448. loss_train_step after backward: tensor(0.0224, device='cuda:0', grad_fn=<MseLossBackward>)
  25449. loss_train: 1.4794276067987084
  25450. step: 57
  25451. running loss: 0.02595487029471418
  25452. Train Steps: 57/90 Loss: 0.0260 torch.Size([8, 600, 800])
  25453. torch.Size([8, 8])
  25454. tensor([[0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  25455. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  25456. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  25457. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  25458. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  25459. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  25460. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  25461. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400]],
  25462. device='cuda:0', dtype=torch.float64)
  25463. predictions are: tensor([[ 0.5395, -0.4694, 1.7540, -0.6162, -0.3841, -0.6810, 0.9446, 0.2789],
  25464. [ 0.5050, -0.4520, 1.3034, -1.0162, -0.6673, -0.7612, 0.3418, 0.0111],
  25465. [ 0.4511, -0.4448, 1.5851, -0.2066, -0.5379, -0.8791, 0.2361, 0.2449],
  25466. [ 0.3331, -0.6058, 1.6994, -0.1982, -0.0322, 0.0858, 0.1891, 0.1661],
  25467. [ 0.4013, -0.5315, 1.5514, -0.8512, -0.5781, 0.1099, 0.5527, 0.2199],
  25468. [ 0.5276, -0.4425, 1.3316, -1.2870, -0.3980, -1.1945, 0.4547, 0.0442],
  25469. [ 0.3599, -0.5380, 1.4635, -0.6173, -0.6199, -0.5927, 0.3554, 0.4287],
  25470. [ 0.3724, -0.5610, 1.7453, -0.5381, -0.5880, -0.0687, 0.4760, 0.2247]],
  25471. device='cuda:0', grad_fn=<AddmmBackward>)
  25472. landmarks are: tensor([[[ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  25473. 0.2890],
  25474. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  25475. 0.0942],
  25476. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  25477. 0.3778],
  25478. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  25479. 0.2622],
  25480. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  25481. 0.2083],
  25482. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  25483. 0.1929],
  25484. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  25485. 0.5491],
  25486. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  25487. 0.2083]]], device='cuda:0')
  25488. loss_train_step before backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  25489. loss_train_step after backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  25490. loss_train: 1.491361235268414
  25491. step: 58
  25492. running loss: 0.02571312474600714
  25493. Train Steps: 58/90 Loss: 0.0257 torch.Size([8, 600, 800])
  25494. torch.Size([8, 8])
  25495. tensor([[ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  25496. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  25497. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  25498. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  25499. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  25500. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  25501. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  25502. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117]],
  25503. device='cuda:0', dtype=torch.float64)
  25504. predictions are: tensor([[-1.0428, -1.4417, 1.1209, -1.3021, -0.3286, -1.2498, 0.1953, 0.2366],
  25505. [-0.5951, -1.1337, 0.8469, -1.3820, -0.3139, -1.3906, 0.1110, 0.3584],
  25506. [ 0.7358, -0.2749, 1.8279, -0.0705, -0.3832, 0.1568, 0.2909, 0.1203],
  25507. [ 0.6467, -0.3631, 1.2392, -1.4253, -0.4089, -1.1979, 0.4387, 0.0469],
  25508. [ 0.7252, -0.3748, 1.8057, 0.2314, -0.5462, -0.1135, 0.6252, 0.0910],
  25509. [ 0.7185, -0.2933, 1.6671, -0.7556, -0.6140, -0.6193, 0.4088, 0.1966],
  25510. [ 0.6939, -0.3297, 1.2181, -1.2268, -0.5244, -0.8829, 0.6186, 0.3606],
  25511. [ 0.6410, -0.4152, 1.8992, -0.1185, -0.5496, 0.0964, 0.7300, 0.1463]],
  25512. device='cuda:0', grad_fn=<AddmmBackward>)
  25513. landmarks are: tensor([[[-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  25514. 0.3084],
  25515. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  25516. 0.3700],
  25517. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  25518. 0.1439],
  25519. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  25520. 0.0438],
  25521. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  25522. 0.0291],
  25523. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  25524. 0.1698],
  25525. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  25526. 0.3777],
  25527. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  25528. 0.0774]]], device='cuda:0')
  25529. loss_train_step before backward: tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward>)
  25530. loss_train_step after backward: tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward>)
  25531. loss_train: 1.5618963139131665
  25532. step: 59
  25533. running loss: 0.026472818879884178
  25534. Train Steps: 59/90 Loss: 0.0265 torch.Size([8, 600, 800])
  25535. torch.Size([8, 8])
  25536. tensor([[0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  25537. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  25538. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  25539. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  25540. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  25541. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  25542. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  25543. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631]],
  25544. device='cuda:0', dtype=torch.float64)
  25545. predictions are: tensor([[ 0.6830, -0.3160, 1.5683, -0.4438, -0.5378, -0.1399, 0.1804, 0.0487],
  25546. [ 0.6534, -0.3342, 1.1585, -1.1978, -0.4531, -0.9316, 0.6637, 0.5017],
  25547. [ 0.7875, -0.2731, 1.6926, -0.7453, -0.5681, 0.1508, 0.7731, 0.1326],
  25548. [ 0.4850, -0.4299, 1.6709, -0.0909, -0.1282, -0.1104, 0.3001, 0.3511],
  25549. [ 0.7053, -0.2990, 1.6272, 0.0098, -0.5108, -0.6850, 0.4937, 0.1394],
  25550. [ 0.7281, -0.3108, 1.7384, -0.3913, -0.5842, -0.4616, 0.5438, -0.0194],
  25551. [-2.2420, -2.2402, 1.1993, -1.3444, -0.4029, -1.2837, 0.1392, 0.1897],
  25552. [ 0.4973, -0.4148, 1.5378, -0.5538, -0.5770, -0.0541, 0.4557, 0.2367]],
  25553. device='cuda:0', grad_fn=<AddmmBackward>)
  25554. landmarks are: tensor([[[ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  25555. 0.0502],
  25556. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  25557. 0.5701],
  25558. [ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  25559. 0.1159],
  25560. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  25561. 0.4171],
  25562. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  25563. 0.1698],
  25564. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  25565. 0.0467],
  25566. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  25567. 0.2853],
  25568. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  25569. 0.3148]]], device='cuda:0')
  25570. loss_train_step before backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  25571. loss_train_step after backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  25572. loss_train: 1.5718588447198272
  25573. step: 60
  25574. running loss: 0.026197647411997118
  25575.  
  25576. Train Steps: 60/90 Loss: 0.0262 torch.Size([8, 600, 800])
  25577. torch.Size([8, 8])
  25578. tensor([[ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  25579. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  25580. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  25581. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  25582. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  25583. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  25584. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  25585. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090]],
  25586. device='cuda:0', dtype=torch.float64)
  25587. predictions are: tensor([[-0.9843, -1.3892, 1.0133, -1.2959, -0.4340, -1.2826, 0.1560, 0.2911],
  25588. [-0.4680, -1.0566, 1.4186, -0.9007, -0.7730, -0.6571, 0.1447, 0.1514],
  25589. [ 0.9725, -0.1446, 1.7648, -0.3390, -0.6778, -0.0703, 0.5688, 0.0236],
  25590. [-1.6986, -1.8749, 0.8447, -1.3785, -0.2807, -1.4518, 0.1705, 0.4223],
  25591. [ 0.9834, -0.1479, 1.6662, -0.1350, -0.1114, 0.1979, 0.4884, 0.2888],
  25592. [ 1.0038, -0.0991, 1.7135, -0.3682, -0.5607, 0.4052, 0.5918, 0.2180],
  25593. [ 0.6469, -0.3788, 1.8183, -0.9520, -0.1124, -1.1401, 0.9596, 0.2261],
  25594. [ 1.1452, -0.0534, 1.6800, -0.5457, -0.5165, -0.8915, 0.6578, 0.0302]],
  25595. device='cuda:0', grad_fn=<AddmmBackward>)
  25596. landmarks are: tensor([[[-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  25597. 0.3084],
  25598. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  25599. 0.0893],
  25600. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  25601. -0.0400],
  25602. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  25603. 0.3623],
  25604. [ 0.5598, -0.4273, 1.7152, -0.1227, -0.0065, 0.1917, 0.5143,
  25605. 0.2853],
  25606. [ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  25607. 0.1852],
  25608. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  25609. 0.2142],
  25610. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  25611. 0.0652]]], device='cuda:0')
  25612. loss_train_step before backward: tensor(0.1461, device='cuda:0', grad_fn=<MseLossBackward>)
  25613. loss_train_step after backward: tensor(0.1461, device='cuda:0', grad_fn=<MseLossBackward>)
  25614. loss_train: 1.7179200714454055
  25615. step: 61
  25616. running loss: 0.028162624122055828
  25617. Train Steps: 61/90 Loss: 0.0282 torch.Size([8, 600, 800])
  25618. torch.Size([8, 8])
  25619. tensor([[0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  25620. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  25621. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290],
  25622. [0.6226, 0.4103, 0.8575, 0.3450, 0.4388, 0.2067, 0.5787, 0.5383],
  25623. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  25624. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  25625. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  25626. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389]],
  25627. device='cuda:0', dtype=torch.float64)
  25628. predictions are: tensor([[ 0.4069, -0.4887, 1.5738, -0.8161, -0.4371, -0.9213, 0.2029, 0.1648],
  25629. [ 0.6786, -0.3535, 1.4581, 0.0995, -0.4370, 0.0541, 0.8146, 0.2342],
  25630. [ 0.4607, -0.4850, 1.5293, -0.9322, -0.6656, -0.2563, 0.6008, 0.1711],
  25631. [ 0.8734, -0.1844, 1.6444, -0.8083, -0.2172, -1.0457, 0.3793, 0.2408],
  25632. [-2.2036, -2.2297, 1.0053, -1.3418, -0.4457, -1.3178, 0.0063, 0.2084],
  25633. [ 0.6053, -0.4024, 1.7200, -0.1428, -0.5565, -0.3159, 0.4685, 0.1977],
  25634. [ 0.6157, -0.4194, 1.7860, -0.4878, -0.5991, -0.3522, 0.7102, 0.1331],
  25635. [ 0.4235, -0.4903, 1.1394, -1.3845, -0.5097, -0.8972, 0.5451, 0.3152]],
  25636. device='cuda:0', grad_fn=<AddmmBackward>)
  25637. landmarks are: tensor([[[ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  25638. 0.1494],
  25639. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  25640. 0.2356],
  25641. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  25642. 0.1576],
  25643. [ 0.5898, -0.3908, 1.6748, -0.6924, -0.2594, -1.3313, 0.3873,
  25644. 0.2006],
  25645. [-2.2859, -2.2859, 1.0712, -1.2085, -0.3806, -1.3929, 0.0755,
  25646. 0.2006],
  25647. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  25648. 0.1082],
  25649. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  25650. 0.0697],
  25651. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  25652. 0.2032]]], device='cuda:0')
  25653. loss_train_step before backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  25654. loss_train_step after backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  25655. loss_train: 1.7292997566983104
  25656. step: 62
  25657. running loss: 0.027891931559650168
  25658. Train Steps: 62/90 Loss: 0.0279 torch.Size([8, 600, 800])
  25659. torch.Size([8, 8])
  25660. tensor([[0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  25661. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  25662. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  25663. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  25664. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  25665. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  25666. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  25667. [0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366]],
  25668. device='cuda:0', dtype=torch.float64)
  25669. predictions are: tensor([[ 0.4144, -0.4975, 1.6276, -0.0421, -0.2300, 0.1761, 0.1585, 0.3201],
  25670. [ 0.0341, -0.7305, 1.5266, -0.5993, -0.6648, -0.6568, 0.3565, 0.5090],
  25671. [ 0.5211, -0.4751, 1.5493, -1.3137, -0.4079, -1.2031, 0.6441, 0.0187],
  25672. [ 0.1711, -0.6814, 1.3945, -1.2608, -0.5439, -1.0559, 0.4239, 0.1091],
  25673. [ 0.6617, -0.3810, 1.2957, -1.4371, -0.2348, -1.3179, 0.5682, 0.2448],
  25674. [ 0.4271, -0.5189, 1.6395, -0.2360, -0.3430, 0.0163, 0.2549, 0.3236],
  25675. [ 0.4806, -0.5065, 1.6840, 0.0585, -0.6031, -0.1559, 0.5047, 0.0424],
  25676. [ 0.3668, -0.6003, 1.7427, -0.1002, -0.6017, -0.3306, 0.8768, 0.1167]],
  25677. device='cuda:0', grad_fn=<AddmmBackward>)
  25678. landmarks are: tensor([[[ 5.4475e-01, -3.8383e-01, 1.7037e+00, 1.7752e-01, -1.4965e-01,
  25679. 1.4673e-01, 1.1283e-01, 2.4313e-01],
  25680. [ 5.8942e-01, -3.5027e-01, 1.6402e+00, -3.6135e-01, -5.8268e-01,
  25681. -7.9246e-01, 3.2379e-01, 3.2379e-01],
  25682. [ 6.1316e-01, -4.1224e-01, 1.5478e+00, -1.0619e+00, -2.7090e-01,
  25683. -1.4314e+00, 5.5000e-01, -5.8318e-02],
  25684. [ 5.8851e-01, -4.4288e-01, 1.4266e+00, -9.9261e-01, -4.3834e-01,
  25685. -1.2313e+00, 4.2276e-01, 1.1948e-01],
  25686. [ 5.9076e-01, -3.8322e-01, 1.3804e+00, -1.2543e+00, -1.2695e-01,
  25687. -1.4671e+00, 5.7206e-01, 2.2371e-01],
  25688. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  25689. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  25690. [ 6.3355e-01, -4.1617e-01, 1.7499e+00, 3.0839e-01, -4.9607e-01,
  25691. -2.4588e-01, 6.5236e-01, -1.0225e-02],
  25692. [ 6.2730e-01, -4.2490e-01, 1.7095e+00, 1.1594e-01, -5.4804e-01,
  25693. -4.3064e-01, 1.0910e+00, 1.9283e-01]]], device='cuda:0')
  25694. loss_train_step before backward: tensor(0.0269, device='cuda:0', grad_fn=<MseLossBackward>)
  25695. loss_train_step after backward: tensor(0.0269, device='cuda:0', grad_fn=<MseLossBackward>)
  25696. loss_train: 1.7561887232586741
  25697. step: 63
  25698. running loss: 0.027876011480296416
  25699. Train Steps: 63/90 Loss: 0.0279 torch.Size([8, 600, 800])
  25700. torch.Size([8, 8])
  25701. tensor([[0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  25702. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  25703. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  25704. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  25705. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  25706. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  25707. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  25708. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475]],
  25709. device='cuda:0', dtype=torch.float64)
  25710. predictions are: tensor([[ 0.6315, -0.3615, 1.5528, -0.9199, -0.7058, -0.4619, 0.3850, 0.2241],
  25711. [ 0.3478, -0.5686, 1.4856, -0.6887, -0.6811, -0.5351, 0.2528, 0.0194],
  25712. [ 0.2640, -0.5953, 1.5867, 0.0825, -0.2929, -0.1107, 0.1025, 0.2531],
  25713. [ 0.5650, -0.4369, 1.6092, 0.0533, -0.3942, 0.1878, 1.0112, 0.3344],
  25714. [-0.0204, -0.8140, 1.8506, -0.5604, -0.4599, -0.8181, 0.6399, 0.2778],
  25715. [ 0.4338, -0.5079, 1.4570, -1.0512, -0.5840, -1.0056, 0.5227, 0.0549],
  25716. [ 0.4230, -0.5198, 1.8174, -0.6804, -0.5331, -0.5642, 0.7121, 0.2244],
  25717. [ 0.4962, -0.4371, 1.6423, 0.0260, -0.1258, -0.0331, 0.1809, 0.2964]],
  25718. device='cuda:0', grad_fn=<AddmmBackward>)
  25719. landmarks are: tensor([[[ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  25720. 0.2930],
  25721. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  25722. 0.0021],
  25723. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  25724. 0.2048],
  25725. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  25726. 0.3905],
  25727. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  25728. 0.1005],
  25729. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  25730. 0.1080],
  25731. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  25732. 0.1544],
  25733. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  25734. 0.2431]]], device='cuda:0')
  25735. loss_train_step before backward: tensor(0.0206, device='cuda:0', grad_fn=<MseLossBackward>)
  25736. loss_train_step after backward: tensor(0.0206, device='cuda:0', grad_fn=<MseLossBackward>)
  25737. loss_train: 1.7767991842702031
  25738. step: 64
  25739. running loss: 0.027762487254221924
  25740.  
  25741. Train Steps: 64/90 Loss: 0.0278 torch.Size([8, 600, 800])
  25742. torch.Size([8, 8])
  25743. tensor([[0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  25744. [0.6203, 0.4056, 0.8942, 0.4086, 0.3643, 0.3617, 0.5917, 0.5482],
  25745. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  25746. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  25747. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  25748. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  25749. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496],
  25750. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631]],
  25751. device='cuda:0', dtype=torch.float64)
  25752. predictions are: tensor([[ 0.4024, -0.5408, 1.8413, -0.2530, -0.4907, -0.0938, 0.6912, 0.0739],
  25753. [ 0.2597, -0.6268, 1.7614, -0.5272, -0.5981, -0.6706, 0.5482, 0.1919],
  25754. [ 0.5895, -0.4250, 1.6090, -0.0598, -0.2045, -0.0404, 0.6184, 0.3056],
  25755. [ 0.3920, -0.5026, 1.5573, -0.3926, -0.6188, -0.8363, 0.1831, 0.3305],
  25756. [ 0.3983, -0.5696, 1.7242, 0.0177, -0.4467, -0.0459, 0.4527, 0.1228],
  25757. [ 0.2151, -0.6292, 1.6645, -0.2897, -0.3916, -0.1674, 0.1652, 0.1324],
  25758. [ 0.7846, -0.2886, 1.6542, -1.0929, -0.3467, -1.0930, 0.6925, 0.1557],
  25759. [ 0.0871, -0.7089, 1.5407, -0.4913, -0.5601, -0.1321, 0.4519, 0.3129]],
  25760. device='cuda:0', grad_fn=<AddmmBackward>)
  25761. landmarks are: tensor([[[ 6.0751e-01, -4.1586e-01, 1.8654e+00, -1.4580e-01, -5.2494e-01,
  25762. 1.5858e-02, 6.3595e-01, -4.9015e-02],
  25763. [ 5.7910e-01, -4.1270e-01, 1.8442e+00, -3.9854e-01, -6.0306e-01,
  25764. -6.1538e-01, 4.4726e-01, 2.4636e-01],
  25765. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  25766. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  25767. [ 5.6969e-01, -4.1132e-01, 1.7499e+00, -2.7667e-01, -6.4042e-01,
  25768. -7.1547e-01, 1.5756e-01, 4.0319e-01],
  25769. [ 5.7829e-01, -4.3634e-01, 1.7724e+00, 4.3211e-02, -5.1531e-01,
  25770. 8.7136e-02, 4.8401e-01, 6.6263e-02],
  25771. [ 5.7079e-01, -4.0747e-01, 1.7961e+00, -2.3048e-01, -4.2102e-01,
  25772. -9.9615e-02, 1.2187e-01, 8.9251e-02],
  25773. [ 5.7904e-01, -4.0308e-01, 1.6915e+00, -9.5640e-01, -4.1518e-01,
  25774. -1.1063e+00, 4.4251e-01, 2.5281e-01],
  25775. [ 5.0266e-01, -4.2895e-01, 1.5478e+00, -4.2294e-01, -6.3464e-01,
  25776. -3.0331e-02, 3.2234e-01, 3.1483e-01]]], device='cuda:0')
  25777. loss_train_step before backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  25778. loss_train_step after backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  25779. loss_train: 1.7951224902644753
  25780. step: 65
  25781. running loss: 0.02761726908099193
  25782. Train Steps: 65/90 Loss: 0.0276 torch.Size([8, 600, 800])
  25783. torch.Size([8, 8])
  25784. tensor([[0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  25785. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  25786. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  25787. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  25788. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  25789. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  25790. [0.6202, 0.4064, 0.7879, 0.2179, 0.4567, 0.1725, 0.5955, 0.5478],
  25791. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263]],
  25792. device='cuda:0', dtype=torch.float64)
  25793. predictions are: tensor([[ 4.6338e-01, -5.2227e-01, 1.7455e+00, 1.4470e-01, -4.0361e-01,
  25794. -9.9533e-03, 5.7737e-01, 2.0882e-01],
  25795. [ 5.8856e-01, -4.1358e-01, 1.8907e+00, -1.4242e-01, -1.5540e-03,
  25796. -1.9423e-01, 5.4205e-01, 3.0218e-01],
  25797. [ 1.7223e-02, -7.4201e-01, 9.9789e-01, -9.9806e-01, -6.9489e-01,
  25798. -9.9325e-01, 1.8740e-01, 3.3484e-01],
  25799. [ 5.7928e-01, -4.4168e-01, 1.8534e+00, -2.0523e-01, -4.6537e-01,
  25800. 1.8911e-01, 5.8318e-01, 4.3507e-02],
  25801. [ 2.2809e-01, -6.4014e-01, 1.8076e+00, -2.9703e-01, -4.9680e-01,
  25802. -3.3525e-01, 1.6166e-01, 8.1175e-02],
  25803. [ 5.3848e-01, -4.6859e-01, 1.8441e+00, -2.2687e-01, -6.5880e-01,
  25804. -4.8382e-01, 6.1689e-01, 7.4508e-02],
  25805. [ 5.3224e-01, -4.6670e-01, 1.2817e+00, -1.2365e+00, -2.9876e-01,
  25806. -1.5286e+00, 5.0515e-01, 2.2926e-01],
  25807. [ 1.9818e-01, -6.9324e-01, 1.7965e+00, -2.1564e-01, -5.4197e-01,
  25808. 4.7281e-02, 5.9085e-01, 1.7062e-01]], device='cuda:0',
  25809. grad_fn=<AddmmBackward>)
  25810. landmarks are: tensor([[[ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  25811. 0.0711],
  25812. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  25813. 0.2776],
  25814. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  25815. 0.3315],
  25816. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  25817. -0.0322],
  25818. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  25819. -0.0220],
  25820. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  25821. 0.0467],
  25822. [ 0.5787, -0.4086, 1.3535, -1.2794, -0.1764, -1.4891, 0.4645,
  25823. 0.2442],
  25824. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  25825. 0.1449]]], device='cuda:0')
  25826. loss_train_step before backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  25827. loss_train_step after backward: tensor(0.0180, device='cuda:0', grad_fn=<MseLossBackward>)
  25828. loss_train: 1.813149274326861
  25829. step: 66
  25830. running loss: 0.027471958701922136
  25831. Train Steps: 66/90 Loss: 0.0275 torch.Size([8, 600, 800])
  25832. torch.Size([8, 8])
  25833. tensor([[0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  25834. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  25835. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  25836. [0.6128, 0.4116, 0.8450, 0.4583, 0.3675, 0.4867, 0.5337, 0.5446],
  25837. [0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  25838. [0.6317, 0.4038, 0.8287, 0.5900, 0.3800, 0.4717, 0.6295, 0.4986],
  25839. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  25840. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586]],
  25841. device='cuda:0', dtype=torch.float64)
  25842. predictions are: tensor([[ 0.6237, -0.3526, 1.4897, -0.8053, -0.2185, -1.1974, 0.4056, 0.2007],
  25843. [ 0.5143, -0.4223, 1.6992, -0.3952, -0.7517, -0.3259, 0.4469, 0.1026],
  25844. [-2.5826, -2.4747, 1.1780, -1.1872, -0.4906, -1.2475, 0.2174, 0.1164],
  25845. [ 0.4828, -0.4180, 1.6138, -0.1066, -0.5749, -0.0056, 0.3014, 0.1830],
  25846. [ 0.1862, -0.6344, 1.5743, -1.1071, -0.3166, -1.1941, 0.6868, 0.2255],
  25847. [ 0.8689, -0.2395, 1.6244, 0.4121, -0.6324, 0.0112, 0.6183, 0.0872],
  25848. [ 0.6781, -0.3274, 1.6930, 0.1251, -0.3152, 0.2715, 0.3076, 0.0937],
  25849. [ 0.8013, -0.2742, 1.6472, -1.0357, 0.1264, -1.3641, 0.7931, 0.2533]],
  25850. device='cuda:0', grad_fn=<AddmmBackward>)
  25851. landmarks are: tensor([[[ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  25852. 0.2083],
  25853. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  25854. 0.0236],
  25855. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  25856. 0.0231],
  25857. [ 0.5444, -0.3846, 1.6171, -0.1689, -0.5885, -0.0380, 0.1791,
  25858. 0.2296],
  25859. [ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  25860. 0.1621],
  25861. [ 0.6320, -0.4206, 1.5420, 0.4393, -0.5307, -0.1073, 0.6216,
  25862. 0.0171],
  25863. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  25864. 0.0082],
  25865. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  25866. 0.2944]]], device='cuda:0')
  25867. loss_train_step before backward: tensor(0.0157, device='cuda:0', grad_fn=<MseLossBackward>)
  25868. loss_train_step after backward: tensor(0.0157, device='cuda:0', grad_fn=<MseLossBackward>)
  25869. loss_train: 1.8288374664261937
  25870. step: 67
  25871. running loss: 0.027296081588450653
  25872. Train Steps: 67/90 Loss: 0.0273 torch.Size([8, 600, 800])
  25873. torch.Size([8, 8])
  25874. tensor([[0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  25875. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  25876. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  25877. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  25878. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  25879. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  25880. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  25881. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742]],
  25882. device='cuda:0', dtype=torch.float64)
  25883. predictions are: tensor([[ 0.3651, -0.5206, 1.6997, 0.1684, -0.4600, -0.2442, 0.4703, 0.4270],
  25884. [ 0.7231, -0.3273, 1.6843, 0.2476, -0.3617, 0.2596, 0.3580, 0.2787],
  25885. [ 0.2887, -0.6014, 1.3200, -1.1043, -0.6701, -0.5464, 0.3305, 0.1842],
  25886. [ 0.5762, -0.4481, 1.7215, -0.9292, -0.2008, -1.3391, 0.6507, 0.1040],
  25887. [ 0.5290, -0.4668, 1.7715, -0.5002, -0.5998, -0.8600, 0.4262, 0.1119],
  25888. [ 0.3244, -0.6056, 1.7703, -0.1491, -0.4256, 0.0223, 0.7856, 0.1435],
  25889. [ 0.4005, -0.5445, 1.8250, -0.1427, -0.1946, 0.0466, 0.0948, 0.0051],
  25890. [ 0.4814, -0.5089, 1.8568, 0.1708, -0.5595, -0.5359, 0.4954, -0.0020]],
  25891. device='cuda:0', grad_fn=<AddmmBackward>)
  25892. landmarks are: tensor([[[ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  25893. 0.3084],
  25894. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  25895. 0.3007],
  25896. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  25897. 0.2237],
  25898. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  25899. 0.0953],
  25900. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  25901. 0.1005],
  25902. [ 0.6257, -0.4273, 1.8365, -0.0688, -0.4672, -0.0611, 1.1715,
  25903. 0.1608],
  25904. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  25905. -0.0099],
  25906. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  25907. -0.0957]]], device='cuda:0')
  25908. loss_train_step before backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  25909. loss_train_step after backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  25910. loss_train: 1.8417663387954235
  25911. step: 68
  25912. running loss: 0.027084799099932697
  25913.  
  25914. Train Steps: 68/90 Loss: 0.0271 torch.Size([8, 600, 800])
  25915. torch.Size([8, 8])
  25916. tensor([[0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  25917. [0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  25918. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  25919. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  25920. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  25921. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  25922. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  25923. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983]],
  25924. device='cuda:0', dtype=torch.float64)
  25925. predictions are: tensor([[ 0.7885, -0.2755, 1.8507, -0.0734, -0.4111, 0.0235, 0.3560, 0.0462],
  25926. [ 0.7404, -0.3294, 1.7126, 0.2041, -0.3258, 0.0337, 0.6419, -0.0222],
  25927. [ 0.9415, -0.2172, 1.7814, -0.6563, -0.5288, -0.5494, 0.6929, 0.0388],
  25928. [ 0.4125, -0.5422, 1.9219, -0.7111, -0.3666, -0.8003, 0.6918, 0.0999],
  25929. [ 0.6063, -0.3980, 1.7486, 0.0841, -0.4291, -0.2599, 0.1080, 0.2190],
  25930. [ 0.3537, -0.5790, 1.9364, -0.1108, -0.2992, -0.2235, 0.9382, 0.2877],
  25931. [-1.0781, -1.4772, 1.3764, -0.8284, -0.6005, -0.8796, -0.0899, 0.0682],
  25932. [ 0.6193, -0.3623, 1.5289, 0.2866, -0.4413, -0.5597, 0.1839, 0.4190]],
  25933. device='cuda:0', grad_fn=<AddmmBackward>)
  25934. landmarks are: tensor([[[ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  25935. 0.2237],
  25936. [ 0.6010, -0.4321, 1.6517, 0.2160, -0.4210, 0.0774, 0.6356,
  25937. 0.0313],
  25938. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  25939. 0.1080],
  25940. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  25941. 0.1390],
  25942. [ 0.5452, -0.4067, 1.7557, 0.0543, -0.4961, -0.3306, 0.1323,
  25943. 0.4306],
  25944. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  25945. 0.4386],
  25946. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  25947. 0.3220],
  25948. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  25949. 0.4778]]], device='cuda:0')
  25950. loss_train_step before backward: tensor(0.0728, device='cuda:0', grad_fn=<MseLossBackward>)
  25951. loss_train_step after backward: tensor(0.0728, device='cuda:0', grad_fn=<MseLossBackward>)
  25952. loss_train: 1.9145381338894367
  25953. step: 69
  25954. running loss: 0.027746929476658504
  25955. Train Steps: 69/90 Loss: 0.0277 torch.Size([8, 600, 800])
  25956. torch.Size([8, 8])
  25957. tensor([[0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  25958. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  25959. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  25960. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  25961. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  25962. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  25963. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250],
  25964. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200]],
  25965. device='cuda:0', dtype=torch.float64)
  25966. predictions are: tensor([[-0.1347, -0.8905, 1.3869, -1.0465, -0.3008, -1.1903, 0.5167, 0.1891],
  25967. [ 0.5789, -0.4325, 1.7945, 0.1725, -0.3334, 0.1157, 0.6113, 0.0700],
  25968. [ 0.1578, -0.6654, 1.5865, -0.2879, -0.4701, -0.9997, 0.2556, 0.2780],
  25969. [ 0.3835, -0.5182, 1.2272, -0.7243, -0.6110, -0.6875, 0.1796, 0.2398],
  25970. [ 0.6624, -0.3772, 2.0066, -0.3205, -0.2315, -1.2892, 0.5583, 0.0233],
  25971. [ 1.0005, -0.1530, 1.7703, 0.2153, -0.3215, -0.0169, 0.2178, 0.0890],
  25972. [ 0.5081, -0.4877, 1.9618, -0.1362, -0.5452, -0.0896, 0.5822, 0.0863],
  25973. [ 0.6206, -0.3973, 1.8513, 0.1067, -0.3296, 0.4381, 0.6588, 0.0824]],
  25974. device='cuda:0', grad_fn=<AddmmBackward>)
  25975. landmarks are: tensor([[[ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  25976. 0.1698],
  25977. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  25978. 0.1627],
  25979. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  25980. 0.3928],
  25981. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  25982. 0.3694],
  25983. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  25984. -0.0529],
  25985. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  25986. 0.1854],
  25987. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  25988. 0.1390],
  25989. [ 0.5990, -0.4256, 1.7499, -0.0380, -0.3979, 0.3315, 0.6529,
  25990. 0.1159]]], device='cuda:0')
  25991. loss_train_step before backward: tensor(0.0296, device='cuda:0', grad_fn=<MseLossBackward>)
  25992. loss_train_step after backward: tensor(0.0296, device='cuda:0', grad_fn=<MseLossBackward>)
  25993. loss_train: 1.9441209603101015
  25994. step: 70
  25995. running loss: 0.027773156575858594
  25996. Train Steps: 70/90 Loss: 0.0278 torch.Size([8, 600, 800])
  25997. torch.Size([8, 8])
  25998. tensor([[0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  25999. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  26000. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  26001. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  26002. [0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  26003. [0.6161, 0.4024, 0.8662, 0.4683, 0.4935, 0.5364, 0.6063, 0.5567],
  26004. [0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  26005. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617]],
  26006. device='cuda:0', dtype=torch.float64)
  26007. predictions are: tensor([[ 0.6819, -0.3631, 1.7929, 0.0338, -0.1769, -0.1166, 0.2615, 0.2761],
  26008. [ 0.2571, -0.6269, 1.4967, -0.7880, -0.6286, -0.9278, 0.4804, 0.0170],
  26009. [ 0.1597, -0.7106, 1.8510, -0.6569, -0.5832, -0.9929, 0.5346, 0.0192],
  26010. [ 0.6173, -0.4197, 1.6777, 0.3250, -0.4016, 0.1249, 0.7606, 0.0746],
  26011. [ 0.7167, -0.3175, 1.7641, -0.0079, -0.6089, -0.2013, 0.5217, 0.2568],
  26012. [ 0.8350, -0.2456, 1.8566, -0.0243, -0.0949, -0.0249, 0.4935, 0.2472],
  26013. [ 0.5563, -0.4414, 1.8026, 0.2169, -0.5440, -0.1765, 0.2853, 0.0218],
  26014. [ 0.5862, -0.4149, 1.7682, -0.0044, -0.1104, -0.1928, 0.2206, 0.2828]],
  26015. device='cuda:0', grad_fn=<AddmmBackward>)
  26016. landmarks are: tensor([[[ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  26017. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  26018. [ 5.4769e-01, -4.4126e-01, 1.3688e+00, -8.7714e-01, -6.1155e-01,
  26019. -8.7714e-01, 4.1039e-01, 4.6651e-02],
  26020. [ 5.7991e-01, -4.3295e-01, 1.7210e+00, -7.6936e-01, -5.7113e-01,
  26021. -8.7714e-01, 3.9885e-01, 7.7444e-02],
  26022. [ 6.0425e-01, -4.2731e-01, 1.7198e+00, 2.1845e-01, -3.4783e-01,
  26023. 1.1492e-01, 8.0616e-01, 1.1755e-01],
  26024. [ 5.7633e-01, -3.9630e-01, 1.7788e+00, -7.6520e-02, -6.5196e-01,
  26025. -8.4219e-02, 4.6236e-01, 2.7760e-01],
  26026. [ 5.5978e-01, -4.2731e-01, 1.7152e+00, -1.2271e-01, -6.4698e-03,
  26027. 1.9169e-01, 5.1432e-01, 2.8530e-01],
  26028. [ 5.3262e-01, -4.3895e-01, 1.7557e+00, 8.5142e-02, -5.1917e-01,
  26029. -9.1917e-02, 3.1801e-01, 6.2048e-02],
  26030. [ 5.4319e-01, -4.3880e-01, 1.7557e+00, -3.0331e-02, -9.1917e-02,
  26031. -1.1501e-01, 2.6993e-01, 3.0867e-01]]], device='cuda:0')
  26032. loss_train_step before backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  26033. loss_train_step after backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  26034. loss_train: 1.9570787139236927
  26035. step: 71
  26036. running loss: 0.027564488928502714
  26037. Train Steps: 71/90 Loss: 0.0276 torch.Size([8, 600, 800])
  26038. torch.Size([8, 8])
  26039. tensor([[0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  26040. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  26041. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  26042. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  26043. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  26044. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  26045. [0.6197, 0.3986, 0.8800, 0.4617, 0.4188, 0.4783, 0.5687, 0.5550],
  26046. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183]],
  26047. device='cuda:0', dtype=torch.float64)
  26048. predictions are: tensor([[ 0.2929, -0.6306, 1.3494, -1.0974, -0.2760, -1.2471, 0.5076, 0.1783],
  26049. [ 0.5876, -0.4227, 1.8131, -0.3082, -0.5716, 0.0681, 0.6366, 0.1759],
  26050. [ 0.4308, -0.4823, 1.2201, -0.8724, -0.5480, -0.7434, 0.4204, 0.2808],
  26051. [ 0.5981, -0.4646, 1.8456, 0.3831, -0.3125, 0.1098, 0.6071, -0.0576],
  26052. [ 0.3022, -0.6097, 1.5507, -0.6316, -0.4949, -1.1007, 0.2263, 0.1064],
  26053. [ 0.7622, -0.3001, 1.7877, -0.3726, -0.3335, -1.0181, 0.2477, 0.1684],
  26054. [ 0.6255, -0.4040, 1.8410, 0.0971, -0.3022, 0.0756, 0.4581, 0.1748],
  26055. [ 0.5553, -0.4920, 1.8473, 0.2026, -0.5247, -0.4048, 0.5851, 0.1129]],
  26056. device='cuda:0', grad_fn=<AddmmBackward>)
  26057. landmarks are: tensor([[[ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  26058. 0.0438],
  26059. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  26060. 0.2545],
  26061. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  26062. 0.3007],
  26063. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  26064. 0.0159],
  26065. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  26066. -0.0220],
  26067. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  26068. 0.1494],
  26069. [ 0.5763, -0.4450, 1.7788, -0.1535, -0.3517, -0.0765, 0.3411,
  26070. 0.2776],
  26071. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  26072. 0.1082]]], device='cuda:0')
  26073. loss_train_step before backward: tensor(0.0202, device='cuda:0', grad_fn=<MseLossBackward>)
  26074. loss_train_step after backward: tensor(0.0202, device='cuda:0', grad_fn=<MseLossBackward>)
  26075. loss_train: 1.9772933050990105
  26076. step: 72
  26077. running loss: 0.027462407015264034
  26078.  
  26079. Train Steps: 72/90 Loss: 0.0275 torch.Size([8, 600, 800])
  26080. torch.Size([8, 8])
  26081. tensor([[0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  26082. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  26083. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  26084. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  26085. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  26086. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  26087. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431],
  26088. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598]],
  26089. device='cuda:0', dtype=torch.float64)
  26090. predictions are: tensor([[ 6.5583e-01, -3.7811e-01, 1.2696e+00, -7.9125e-01, -4.5153e-01,
  26091. -8.8227e-01, 6.5653e-01, 3.0809e-01],
  26092. [ 9.5700e-01, -1.8838e-01, 2.0054e+00, -3.3127e-02, -6.0763e-01,
  26093. -4.2334e-01, 6.2569e-01, 8.3709e-02],
  26094. [ 9.3682e-01, -2.0342e-01, 1.6857e+00, -6.1299e-01, -6.7221e-01,
  26095. -5.1084e-01, 4.4851e-01, 6.2466e-02],
  26096. [ 2.5737e-01, -6.2742e-01, 1.3201e+00, -9.9313e-01, -2.6889e-01,
  26097. -1.3625e+00, 3.5545e-01, 1.6475e-01],
  26098. [-1.3298e+00, -1.6522e+00, 1.0108e+00, -9.3262e-01, -3.8892e-01,
  26099. -1.2307e+00, 3.4897e-01, 3.3487e-01],
  26100. [ 3.9808e-01, -5.5571e-01, 1.6143e+00, -7.6801e-01, -4.6551e-01,
  26101. -1.0459e+00, 3.7800e-01, 6.5839e-02],
  26102. [ 6.9094e-01, -3.6286e-01, 1.8962e+00, 1.8539e-01, -2.5873e-01,
  26103. 7.2056e-02, 2.3904e-01, 1.9110e-02],
  26104. [ 6.2867e-01, -4.1586e-01, 1.7483e+00, 5.4881e-01, -1.1541e-01,
  26105. -1.4957e-03, 4.3051e-01, 1.5835e-01]], device='cuda:0',
  26106. grad_fn=<AddmmBackward>)
  26107. landmarks are: tensor([[[ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  26108. 0.3700],
  26109. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  26110. 0.1544],
  26111. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  26112. 0.2776],
  26113. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  26114. 0.1343],
  26115. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  26116. 0.4543],
  26117. [ 0.5798, -0.4156, 1.3977, -1.0388, -0.4672, -1.1004, 0.3469,
  26118. 0.1082],
  26119. [ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  26120. 0.2228],
  26121. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  26122. 0.2997]]], device='cuda:0')
  26123. loss_train_step before backward: tensor(0.0512, device='cuda:0', grad_fn=<MseLossBackward>)
  26124. loss_train_step after backward: tensor(0.0512, device='cuda:0', grad_fn=<MseLossBackward>)
  26125. loss_train: 2.028471328318119
  26126. step: 73
  26127. running loss: 0.02778727847011122
  26128. Train Steps: 73/90 Loss: 0.0278 torch.Size([8, 600, 800])
  26129. torch.Size([8, 8])
  26130. tensor([[0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  26131. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  26132. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  26133. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  26134. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  26135. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  26136. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  26137. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142]],
  26138. device='cuda:0', dtype=torch.float64)
  26139. predictions are: tensor([[ 0.6416, -0.3906, 1.7688, -0.7565, -0.0875, -1.1663, 0.7043, 0.1075],
  26140. [ 0.7966, -0.2625, 1.7855, 0.4262, -0.6310, -0.1006, 0.5265, 0.2256],
  26141. [-1.6472, -1.8579, 1.0097, -1.0127, -0.2529, -1.2835, 0.3738, 0.4171],
  26142. [ 0.6535, -0.3692, 1.6415, -0.3841, -0.6620, -0.6364, 0.3850, 0.0625],
  26143. [ 0.6294, -0.3894, 1.0214, -1.1424, -0.4673, -1.1836, 0.2044, 0.2154],
  26144. [ 0.6398, -0.3967, 1.7436, 0.1655, -0.4967, 0.0448, 0.2775, 0.0594],
  26145. [ 0.5993, -0.4317, 1.8031, -0.9034, 0.0458, -1.0696, 0.9169, 0.1342],
  26146. [ 0.7419, -0.3240, 1.7888, 0.0059, -0.5461, 0.0415, 0.1476, 0.0034]],
  26147. device='cuda:0', grad_fn=<AddmmBackward>)
  26148. landmarks are: tensor([[[ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  26149. 0.2356],
  26150. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  26151. 0.3084],
  26152. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  26153. 0.3623],
  26154. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  26155. 0.1621],
  26156. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  26157. 0.2906],
  26158. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  26159. 0.1854],
  26160. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  26161. 0.1982],
  26162. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  26163. 0.0893]]], device='cuda:0')
  26164. loss_train_step before backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  26165. loss_train_step after backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  26166. loss_train: 2.056894328445196
  26167. step: 74
  26168. running loss: 0.027795869303313462
  26169. Train Steps: 74/90 Loss: 0.0278 torch.Size([8, 600, 800])
  26170. torch.Size([8, 8])
  26171. tensor([[0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  26172. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  26173. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  26174. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  26175. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  26176. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  26177. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  26178. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471]],
  26179. device='cuda:0', dtype=torch.float64)
  26180. predictions are: tensor([[ 6.8721e-01, -3.6603e-01, 1.6273e+00, -9.3910e-01, -2.3020e-01,
  26181. -1.0608e+00, 8.1830e-01, 2.8156e-01],
  26182. [ 2.6261e-01, -6.6006e-01, 1.7028e+00, 6.9278e-02, -5.0285e-01,
  26183. 6.1316e-02, 9.1670e-01, 9.0216e-02],
  26184. [ 7.8071e-02, -7.5531e-01, 9.7520e-01, -1.1406e+00, -3.2744e-01,
  26185. -1.3896e+00, 1.0609e-01, 2.5919e-01],
  26186. [ 6.7547e-01, -3.5546e-01, 1.7788e+00, -4.9031e-02, -5.2201e-01,
  26187. -2.5553e-01, 2.1430e-01, 1.6061e-01],
  26188. [ 9.4422e-01, -1.8775e-01, 1.4252e+00, -7.5169e-01, -5.3062e-01,
  26189. -8.7556e-01, -3.1819e-02, 1.9832e-01],
  26190. [ 4.0847e-01, -5.7434e-01, 1.6866e+00, 2.0950e-01, -4.9814e-01,
  26191. 1.7580e-03, 7.6417e-01, 9.1559e-02],
  26192. [ 6.3641e-01, -3.8298e-01, 1.7680e+00, -2.8971e-01, -5.1222e-01,
  26193. -7.0556e-01, 4.5485e-01, 2.9442e-01],
  26194. [ 4.7471e-01, -4.8755e-01, 1.7431e+00, -2.4426e-01, -4.8224e-01,
  26195. -3.1786e-01, 1.0535e-01, 1.8711e-01]], device='cuda:0',
  26196. grad_fn=<AddmmBackward>)
  26197. landmarks are: tensor([[[ 6.1742e-01, -3.9842e-01, 1.5975e+00, -9.9214e-01, -3.6328e-01,
  26198. -9.9261e-01, 8.2047e-01, 2.0505e-01],
  26199. [ 6.2730e-01, -4.3934e-01, 1.6402e+00, 1.3133e-01, -5.0762e-01,
  26200. 4.6651e-02, 1.1532e+00, 1.7146e-01],
  26201. [ 5.5912e-01, -3.9900e-01, 9.0115e-01, -1.2313e+00, -3.9792e-01,
  26202. -1.3852e+00, 8.0445e-02, 2.0706e-01],
  26203. [ 5.5289e-01, -3.8106e-01, 1.7788e+00, -3.8029e-02, -5.3072e-01,
  26204. -2.0739e-01, 7.2734e-02, 2.6568e-01],
  26205. [ 5.4825e-01, -4.1045e-01, 1.4208e+00, -8.0015e-01, -6.0000e-01,
  26206. -9.0023e-01, 5.1142e-02, 3.2204e-01],
  26207. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  26208. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  26209. [ 6.0162e-01, -3.6328e-01, 1.7152e+00, -2.2279e-01, -6.1155e-01,
  26210. -6.3849e-01, 5.0277e-01, 2.6990e-01],
  26211. [ 5.4405e-01, -3.9969e-01, 1.7326e+00, -2.2279e-01, -4.4411e-01,
  26212. -2.9207e-01, 2.9551e-02, 2.4088e-01]]], device='cuda:0')
  26213. loss_train_step before backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  26214. loss_train_step after backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  26215. loss_train: 2.0743119940161705
  26216. step: 75
  26217. running loss: 0.02765749325354894
  26218.  
  26219. Train Steps: 75/90 Loss: 0.0277 torch.Size([8, 600, 800])
  26220. torch.Size([8, 8])
  26221. tensor([[0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  26222. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  26223. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  26224. [0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  26225. [0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385],
  26226. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  26227. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  26228. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892]],
  26229. device='cuda:0', dtype=torch.float64)
  26230. predictions are: tensor([[ 0.8649, -0.2485, 1.7574, -0.6191, -0.2934, -1.1843, 0.4251, 0.1032],
  26231. [ 0.4361, -0.5190, 1.6486, -0.2521, -0.3616, -0.0664, 0.2143, 0.2285],
  26232. [ 0.3731, -0.5932, 1.5713, 0.0356, -0.5071, -0.1149, 0.5145, 0.1103],
  26233. [ 0.4553, -0.4569, 1.2745, -0.7047, -0.4934, -0.8180, 0.3275, 0.3119],
  26234. [ 0.7047, -0.3546, 1.3248, -1.2568, -0.2380, -1.1344, 0.7567, 0.2289],
  26235. [ 0.6938, -0.3485, 1.6413, -0.0666, -0.5683, -0.3663, 0.4046, 0.1990],
  26236. [-0.3272, -1.0349, 1.8241, -0.5274, -0.2300, -0.9745, 0.7401, 0.2870],
  26237. [ 0.7128, -0.3070, 1.5699, -0.2741, -0.6330, -0.5391, 0.0100, 0.2550]],
  26238. device='cuda:0', grad_fn=<AddmmBackward>)
  26239. landmarks are: tensor([[[ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  26240. -0.0529],
  26241. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  26242. 0.3057],
  26243. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  26244. 0.1979],
  26245. [ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  26246. 0.3469],
  26247. [ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  26248. 0.2012],
  26249. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  26250. 0.2545],
  26251. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  26252. 0.2890],
  26253. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  26254. 0.4357]]], device='cuda:0')
  26255. loss_train_step before backward: tensor(0.0945, device='cuda:0', grad_fn=<MseLossBackward>)
  26256. loss_train_step after backward: tensor(0.0945, device='cuda:0', grad_fn=<MseLossBackward>)
  26257. loss_train: 2.168797843158245
  26258. step: 76
  26259. running loss: 0.028536813725766382
  26260. Train Steps: 76/90 Loss: 0.0285 torch.Size([8, 600, 800])
  26261. torch.Size([8, 8])
  26262. tensor([[0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  26263. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  26264. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  26265. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  26266. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  26267. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  26268. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  26269. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100]],
  26270. device='cuda:0', dtype=torch.float64)
  26271. predictions are: tensor([[ 0.5790, -0.4246, 1.7650, -0.0211, -0.2898, 0.0674, 0.4351, 0.2170],
  26272. [ 0.7075, -0.3480, 1.0163, -1.1494, -0.3797, -1.5016, 0.1140, 0.3749],
  26273. [ 0.5688, -0.4119, 1.2305, -0.8478, -0.4889, -1.1087, 0.3657, 0.4492],
  26274. [ 0.5267, -0.4787, 1.4408, -0.9947, -0.4450, -1.2665, 0.3767, 0.1211],
  26275. [ 0.5472, -0.4517, 1.7947, -0.1033, -0.2681, 0.1028, 0.4809, 0.2489],
  26276. [ 0.4713, -0.5011, 1.2762, -1.1014, -0.4127, -1.2061, 0.4065, 0.3346],
  26277. [ 0.3543, -0.5869, 1.7987, -0.0647, -0.3814, 0.2580, 0.5179, 0.1634],
  26278. [ 0.3446, -0.6577, 1.8439, -0.3129, -0.6954, -0.6245, 0.6689, 0.0432]],
  26279. device='cuda:0', grad_fn=<AddmmBackward>)
  26280. landmarks are: tensor([[[ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  26281. 0.1236],
  26282. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  26283. 0.3007],
  26284. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  26285. 0.5624],
  26286. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  26287. 0.2043],
  26288. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  26289. 0.1082],
  26290. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  26291. 0.3315],
  26292. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  26293. 0.0928],
  26294. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  26295. 0.0697]]], device='cuda:0')
  26296. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  26297. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  26298. loss_train: 2.1782545149326324
  26299. step: 77
  26300. running loss: 0.028289019674449772
  26301. Train Steps: 77/90 Loss: 0.0283 torch.Size([8, 600, 800])
  26302. torch.Size([8, 8])
  26303. tensor([[0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  26304. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  26305. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  26306. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  26307. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  26308. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  26309. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  26310. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083]],
  26311. device='cuda:0', dtype=torch.float64)
  26312. predictions are: tensor([[ 0.7530, -0.2939, 1.4046, -1.0338, -0.3590, -1.0755, 0.5026, 0.1979],
  26313. [ 0.4401, -0.4800, 1.5502, -0.4485, -0.5286, -0.7753, 0.2494, 0.2087],
  26314. [ 0.6913, -0.3143, 1.2940, -0.9489, -0.3650, -1.0523, 0.4405, 0.3707],
  26315. [ 0.7265, -0.2805, 1.2429, -1.0236, -0.4281, -0.9581, 0.4826, 0.3433],
  26316. [-1.5196, -1.7774, 1.3053, -0.7442, -0.5791, -0.8100, 0.3340, 0.2008],
  26317. [ 0.4117, -0.5339, 1.6772, -0.1784, -0.2167, 0.0569, 0.6415, 0.2582],
  26318. [ 0.5965, -0.3613, 1.5313, -0.4395, -0.3732, -1.0792, 0.1596, 0.1984],
  26319. [ 0.6020, -0.4144, 1.7071, -0.4450, -0.5114, -0.7503, 0.4338, 0.1238]],
  26320. device='cuda:0', grad_fn=<AddmmBackward>)
  26321. landmarks are: tensor([[[ 5.7898e-01, -4.0793e-01, 1.5929e+00, -1.0630e+00, -4.7294e-01,
  26322. -1.0725e+00, 4.1374e-01, 8.0707e-02],
  26323. [ 5.3926e-01, -4.2941e-01, 1.6575e+00, -4.0754e-01, -6.6351e-01,
  26324. -6.3079e-01, 3.2956e-01, 8.5142e-02],
  26325. [ 5.8747e-01, -3.8876e-01, 1.3111e+00, -8.8483e-01, -4.6143e-01,
  26326. -9.8491e-01, 5.2009e-01, 2.6220e-01],
  26327. [ 5.9766e-01, -3.7916e-01, 1.2995e+00, -1.0311e+00, -5.1917e-01,
  26328. -8.3865e-01, 5.8360e-01, 2.1601e-01],
  26329. [-2.2859e+00, -2.2859e+00, 1.5478e+00, -8.3095e-01, -6.2887e-01,
  26330. -7.2317e-01, 1.1982e-01, 1.1330e-01],
  26331. [ 6.0087e-01, -4.1347e-01, 1.7651e+00, -1.0433e-01, -1.3233e-01,
  26332. 1.9292e-01, 5.6051e-01, 2.2371e-01],
  26333. [ 5.4850e-01, -4.2094e-01, 1.6691e+00, -4.1524e-01, -5.2494e-01,
  26334. -1.1081e+00, 7.2521e-02, 2.0831e-03],
  26335. [ 5.8072e-01, -4.3780e-01, 1.8249e+00, -4.6913e-01, -6.2887e-01,
  26336. -6.3849e-01, 4.1039e-01, 6.2048e-02]]], device='cuda:0')
  26337. loss_train_step before backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  26338. loss_train_step after backward: tensor(0.0242, device='cuda:0', grad_fn=<MseLossBackward>)
  26339. loss_train: 2.202410016208887
  26340. step: 78
  26341. running loss: 0.028236025848831885
  26342. Train Steps: 78/90 Loss: 0.0282 torch.Size([8, 600, 800])
  26343. torch.Size([8, 8])
  26344. tensor([[0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  26345. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  26346. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  26347. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  26348. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  26349. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  26350. [0.6203, 0.4021, 0.8780, 0.5031, 0.3667, 0.3882, 0.5842, 0.5405],
  26351. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700]],
  26352. device='cuda:0', dtype=torch.float64)
  26353. predictions are: tensor([[ 0.6716, -0.3651, 1.6848, 0.1993, -0.4682, -0.3016, 0.3698, 0.0878],
  26354. [ 1.1126, -0.0634, 1.0590, -1.5005, -0.3099, -1.4083, 0.3902, 0.3436],
  26355. [ 0.4396, -0.4931, 1.6367, -0.1527, -0.2727, -0.1796, 0.3804, 0.3029],
  26356. [ 0.4806, -0.5013, 1.7506, -0.7712, -0.5522, -0.3615, 0.7104, 0.2110],
  26357. [ 0.7517, -0.3017, 1.6676, 0.0399, -0.4713, 0.0236, 0.7962, 0.3514],
  26358. [-1.4892, -1.7884, 1.1316, -1.2032, -0.4816, -1.2419, 0.0669, 0.3637],
  26359. [ 0.8437, -0.2534, 1.7568, -0.0860, -0.5708, -0.6748, 0.2525, 0.1682],
  26360. [ 0.6160, -0.3820, 1.7347, -0.3169, -0.5240, -0.3235, 0.1420, 0.2635]],
  26361. device='cuda:0', grad_fn=<AddmmBackward>)
  26362. landmarks are: tensor([[[ 6.3949e-01, -4.2132e-01, 1.7037e+00, 3.6228e-01, -4.3256e-01,
  26363. -1.0731e-01, 6.5602e-01, -4.8817e-03],
  26364. [ 5.8614e-01, -3.9292e-01, 1.0570e+00, -1.4314e+00, -3.2864e-01,
  26365. -1.1235e+00, 6.1824e-01, 1.8522e-01],
  26366. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  26367. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  26368. [ 6.1083e-01, -4.2731e-01, 1.8711e+00, -6.6159e-01, -5.7691e-01,
  26369. -1.9969e-01, 9.1557e-01, 1.5543e-01],
  26370. [ 6.3554e-01, -4.0805e-01, 1.6113e+00, 1.8522e-01, -4.7298e-01,
  26371. 1.4673e-01, 9.9965e-01, 3.9055e-01],
  26372. [-2.2859e+00, -2.2859e+00, 1.2030e+00, -1.0288e+00, -4.9607e-01,
  26373. -1.1081e+00, 8.1293e-02, 3.1609e-01],
  26374. [ 5.7910e-01, -4.2887e-01, 1.7694e+00, 3.7905e-02, -5.9233e-01,
  26375. -4.9270e-01, 4.1265e-01, 2.1070e-01],
  26376. [ 5.3684e-01, -4.4057e-01, 1.7730e+00, -1.7660e-01, -5.2494e-01,
  26377. -5.3426e-02, 2.3141e-01, 3.4688e-01]]], device='cuda:0')
  26378. loss_train_step before backward: tensor(0.0364, device='cuda:0', grad_fn=<MseLossBackward>)
  26379. loss_train_step after backward: tensor(0.0364, device='cuda:0', grad_fn=<MseLossBackward>)
  26380. loss_train: 2.2388419173657894
  26381. step: 79
  26382. running loss: 0.02833977110589607
  26383.  
  26384. Train Steps: 79/90 Loss: 0.0283 torch.Size([8, 600, 800])
  26385. torch.Size([8, 8])
  26386. tensor([[0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  26387. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  26388. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  26389. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  26390. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  26391. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  26392. [0.6199, 0.4093, 0.7913, 0.2533, 0.4288, 0.2467, 0.5975, 0.5700],
  26393. [0.6148, 0.4076, 0.8666, 0.4820, 0.4138, 0.5067, 0.5250, 0.5767]],
  26394. device='cuda:0', dtype=torch.float64)
  26395. predictions are: tensor([[ 0.4967, -0.4445, 1.6899, -0.5683, -0.6099, -0.5226, 0.4112, 0.2618],
  26396. [ 0.5527, -0.3992, 1.2878, -0.9653, -0.5312, -0.8909, 0.4131, 0.3071],
  26397. [ 0.5773, -0.3801, 1.1588, -1.2760, -0.3543, -1.0148, 0.4385, 0.3473],
  26398. [ 0.3141, -0.5629, 1.6904, -0.2649, -0.3561, -1.0912, 0.3390, 0.2800],
  26399. [ 0.3397, -0.5448, 1.3303, -1.0739, -0.2484, -1.2535, 0.4785, 0.2336],
  26400. [ 0.5512, -0.4214, 1.4524, -1.0067, -0.4021, -1.0468, 0.4744, 0.1392],
  26401. [ 0.3694, -0.5477, 1.2548, -1.1035, -0.3461, -1.0229, 0.5109, 0.2759],
  26402. [-0.1604, -0.9095, 1.6600, 0.0585, -0.4307, -0.0445, 0.3925, 0.2854]],
  26403. device='cuda:0', grad_fn=<AddmmBackward>)
  26404. landmarks are: tensor([[[ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  26405. 0.3392],
  26406. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  26407. 0.3392],
  26408. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  26409. 0.2776],
  26410. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  26411. 0.1929],
  26412. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  26413. 0.2549],
  26414. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  26415. 0.0807],
  26416. [ 0.5771, -0.3955, 1.3688, -1.1158, -0.3055, -1.1466, 0.4739,
  26417. 0.3469],
  26418. [ 0.5539, -0.4031, 1.7168, -0.0594, -0.3748, 0.0543, 0.1390,
  26419. 0.3777]]], device='cuda:0')
  26420. loss_train_step before backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  26421. loss_train_step after backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  26422. loss_train: 2.260784700512886
  26423. step: 80
  26424. running loss: 0.028259808756411077
  26425. Train Steps: 80/90 Loss: 0.0283 torch.Size([8, 600, 800])
  26426. torch.Size([8, 8])
  26427. tensor([[0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  26428. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  26429. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  26430. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  26431. [0.6127, 0.4066, 0.8550, 0.5567, 0.4662, 0.5141, 0.5070, 0.5412],
  26432. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  26433. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  26434. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507]],
  26435. device='cuda:0', dtype=torch.float64)
  26436. predictions are: tensor([[ 0.5515, -0.4324, 1.2522, -1.1974, -0.5468, -0.9399, 0.5127, 0.2591],
  26437. [ 0.2839, -0.6032, 1.8354, 0.1435, -0.2102, 0.1414, 0.4120, 0.2700],
  26438. [ 0.4407, -0.4859, 0.9970, -1.3051, -0.5360, -1.1848, 0.2556, 0.2368],
  26439. [ 0.4679, -0.5184, 1.8603, -0.3844, -0.6523, -0.8006, 0.4449, 0.1568],
  26440. [ 0.4220, -0.5166, 1.7469, 0.3429, -0.2708, 0.0341, 0.1857, 0.3391],
  26441. [ 0.7520, -0.3054, 1.1945, -0.9319, -0.6896, -0.7861, 0.1203, 0.2432],
  26442. [-0.0073, -0.8187, 1.6968, -1.1910, 0.0458, -1.4126, 1.0480, 0.3479],
  26443. [ 0.5477, -0.4101, 1.0520, -1.3807, -0.5342, -1.2166, 0.3435, 0.2966]],
  26444. device='cuda:0', grad_fn=<AddmmBackward>)
  26445. landmarks are: tensor([[[ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  26446. 0.1390],
  26447. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  26448. 0.0862],
  26449. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  26450. 0.0712],
  26451. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  26452. 0.1005],
  26453. [ 0.5443, -0.4079, 1.6633, 0.2853, -0.1325, 0.0888, 0.0558,
  26454. 0.2138],
  26455. [ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  26456. 0.1710],
  26457. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  26458. 0.2142],
  26459. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  26460. 0.2576]]], device='cuda:0')
  26461. loss_train_step before backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  26462. loss_train_step after backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  26463. loss_train: 2.281465532258153
  26464. step: 81
  26465. running loss: 0.028166241138989544
  26466. Train Steps: 81/90 Loss: 0.0282 torch.Size([8, 600, 800])
  26467. torch.Size([8, 8])
  26468. tensor([[0.6111, 0.4033, 0.8300, 0.3267, 0.3588, 0.3333, 0.5444, 0.5637],
  26469. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  26470. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  26471. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  26472. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  26473. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  26474. [0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  26475. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400]],
  26476. device='cuda:0', dtype=torch.float64)
  26477. predictions are: tensor([[ 0.7174, -0.3203, 1.5432, -0.7647, -0.5346, -0.9745, 0.1499, 0.2596],
  26478. [ 0.5553, -0.4361, 1.7861, 0.0788, -0.2853, 0.0368, 0.4463, 0.1984],
  26479. [ 0.7145, -0.2997, 0.9637, -1.2829, -0.4113, -1.4868, 0.1665, 0.3214],
  26480. [ 0.6634, -0.3140, 1.5424, -0.6475, -0.5232, -0.0573, 0.4547, 0.2503],
  26481. [ 0.4377, -0.4985, 1.2757, -1.2660, -0.3435, -1.3296, 0.5275, 0.3440],
  26482. [ 0.3779, -0.5464, 1.6157, -0.4544, -0.6177, -0.5650, 0.2407, 0.2846],
  26483. [ 0.2344, -0.6762, 1.8225, -0.0604, -0.4420, 0.0151, 0.8304, 0.2047],
  26484. [ 0.3008, -0.5890, 1.6560, -0.6949, -0.5658, -0.1531, 0.5472, 0.2596]],
  26485. device='cuda:0', grad_fn=<AddmmBackward>)
  26486. landmarks are: tensor([[[ 0.5366, -0.4232, 1.5478, -0.7771, -0.6289, -0.7463, 0.2288,
  26487. 0.3177],
  26488. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  26489. 0.0390],
  26490. [ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  26491. 0.2776],
  26492. [ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  26493. 0.0862],
  26494. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  26495. 0.3315],
  26496. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  26497. 0.3559],
  26498. [ 0.5944, -0.4490, 1.8643, -0.0659, -0.5147, 0.1235, 0.7684,
  26499. 0.1004],
  26500. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  26501. 0.2083]]], device='cuda:0')
  26502. loss_train_step before backward: tensor(0.0148, device='cuda:0', grad_fn=<MseLossBackward>)
  26503. loss_train_step after backward: tensor(0.0148, device='cuda:0', grad_fn=<MseLossBackward>)
  26504. loss_train: 2.2963146083056927
  26505. step: 82
  26506. running loss: 0.02800383668665479
  26507. Train Steps: 82/90 Loss: 0.0280 torch.Size([8, 600, 800])
  26508. torch.Size([8, 8])
  26509. tensor([[0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  26510. [0.6163, 0.4006, 0.8788, 0.4683, 0.3663, 0.4883, 0.5887, 0.5017],
  26511. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  26512. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  26513. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  26514. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  26515. [0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  26516. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274]],
  26517. device='cuda:0', dtype=torch.float64)
  26518. predictions are: tensor([[ 0.1430, -0.7105, 1.6730, -1.2270, 0.1805, -1.4558, 0.9720, 0.2920],
  26519. [ 0.5546, -0.4364, 1.8704, -0.0628, -0.5260, 0.0190, 0.3254, 0.1272],
  26520. [-0.0603, -0.8157, 0.9096, -1.3470, -0.3919, -1.3662, 0.3169, 0.2475],
  26521. [ 0.4587, -0.4335, 1.3221, -0.6188, -0.6190, -0.6014, 0.0964, 0.4070],
  26522. [ 0.5745, -0.3822, 1.0003, -1.0263, -0.6209, -0.8339, 0.3180, 0.3165],
  26523. [ 1.1199, -0.0309, 1.5450, -0.9909, -0.6218, -0.6417, 0.3637, 0.2202],
  26524. [ 0.3321, -0.5572, 1.5391, -0.7018, -0.6428, -0.4123, 0.2566, 0.1486],
  26525. [ 0.4968, -0.4762, 1.9318, 0.1283, -0.5195, -0.2110, 0.7342, 0.2339]],
  26526. device='cuda:0', grad_fn=<AddmmBackward>)
  26527. landmarks are: tensor([[[ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  26528. 0.2142],
  26529. [ 0.5609, -0.4354, 1.7730, -0.1227, -0.5942, -0.0303, 0.4335,
  26530. 0.0313],
  26531. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  26532. 0.1013],
  26533. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  26534. 0.4036],
  26535. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  26536. 0.3854],
  26537. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  26538. 0.2776],
  26539. [ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  26540. 0.0351],
  26541. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  26542. 0.1499]]], device='cuda:0')
  26543. loss_train_step before backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  26544. loss_train_step after backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  26545. loss_train: 2.3214387968182564
  26546. step: 83
  26547. running loss: 0.02796914213034044
  26548.  
  26549. Train Steps: 83/90 Loss: 0.0280 torch.Size([8, 600, 800])
  26550. torch.Size([8, 8])
  26551. tensor([[ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  26552. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  26553. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  26554. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  26555. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  26556. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  26557. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  26558. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748]],
  26559. device='cuda:0', dtype=torch.float64)
  26560. predictions are: tensor([[-2.2269, -2.2273, 1.1713, -1.1375, -0.4127, -1.0421, 0.1625, 0.2478],
  26561. [ 0.6665, -0.2975, 1.0809, -1.5144, -0.3767, -1.2959, 0.3798, 0.1838],
  26562. [ 0.8967, -0.1623, 1.6080, 0.1411, -0.5546, -0.2800, 0.2731, 0.0371],
  26563. [ 0.8213, -0.1644, 1.3793, -0.6185, -0.5996, -0.8791, -0.0651, 0.3671],
  26564. [ 0.6198, -0.3447, 1.5878, -1.1289, -0.0898, -1.0752, 0.8322, 0.2534],
  26565. [ 0.5938, -0.3939, 1.7633, -0.2117, -0.4702, 0.2779, 0.6836, 0.1326],
  26566. [ 0.6316, -0.3298, 1.6066, -0.6564, -0.6365, -0.0327, 0.4298, 0.2297],
  26567. [ 0.6697, -0.3118, 1.7474, -0.2772, -0.3892, -0.8977, 0.6521, 0.3015]],
  26568. device='cuda:0', grad_fn=<AddmmBackward>)
  26569. landmarks are: tensor([[[-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  26570. 0.3007],
  26571. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  26572. 0.0438],
  26573. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  26574. -0.0102],
  26575. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  26576. 0.4374],
  26577. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  26578. 0.2730],
  26579. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  26580. 0.1554],
  26581. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  26582. 0.2545],
  26583. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  26584. 0.3692]]], device='cuda:0')
  26585. loss_train_step before backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  26586. loss_train_step after backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  26587. loss_train: 2.342796679586172
  26588. step: 84
  26589. running loss: 0.027890436661740143
  26590. Train Steps: 84/90 Loss: 0.0279 torch.Size([8, 600, 800])
  26591. torch.Size([8, 8])
  26592. tensor([[0.6199, 0.4093, 0.7913, 0.2533, 0.4288, 0.2467, 0.5975, 0.5700],
  26593. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  26594. [0.6180, 0.4064, 0.7200, 0.2467, 0.4275, 0.2367, 0.5963, 0.6217],
  26595. [0.6275, 0.4157, 0.8337, 0.5800, 0.3763, 0.4200, 0.5547, 0.6125],
  26596. [0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  26597. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  26598. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578],
  26599. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366]],
  26600. device='cuda:0', dtype=torch.float64)
  26601. predictions are: tensor([[ 0.6604, -0.3537, 1.5051, -1.2975, -0.3695, -0.9548, 0.5446, 0.1394],
  26602. [ 0.1555, -0.6838, 1.0384, -1.4719, -0.4375, -1.2605, 0.3670, 0.1280],
  26603. [ 0.3765, -0.5204, 1.1939, -1.3233, -0.3674, -1.1210, 0.4890, 0.3674],
  26604. [ 0.7508, -0.2881, 1.7318, 0.2697, -0.5587, -0.2539, 0.3189, 0.3947],
  26605. [ 0.6070, -0.3943, 1.2620, -1.0188, -0.6195, -0.6756, 0.1259, 0.1423],
  26606. [ 0.6287, -0.3404, 1.9525, 0.1932, -0.5037, -0.1270, 0.3228, 0.3000],
  26607. [ 0.2278, -0.6186, 1.0869, -1.5289, -0.4159, -1.2903, 0.3593, 0.1703],
  26608. [ 0.2406, -0.6494, 1.6878, 0.1533, -0.4699, 0.1824, 0.8549, 0.1438]],
  26609. device='cuda:0', grad_fn=<AddmmBackward>)
  26610. landmarks are: tensor([[[ 0.5771, -0.3955, 1.3688, -1.1158, -0.3055, -1.1466, 0.4739,
  26611. 0.3469],
  26612. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  26613. 0.1013],
  26614. [ 0.5687, -0.4088, 1.0397, -1.1466, -0.3113, -1.1928, 0.4681,
  26615. 0.5855],
  26616. [ 0.6124, -0.3658, 1.5651, 0.3931, -0.5480, -0.3460, 0.2761,
  26617. 0.5431],
  26618. [ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  26619. 0.1710],
  26620. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  26621. 0.3084],
  26622. [ 0.5232, -0.4189, 0.9358, -1.4006, -0.3921, -1.3698, 0.2555,
  26623. 0.2906],
  26624. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  26625. 0.1928]]], device='cuda:0')
  26626. loss_train_step before backward: tensor(0.0225, device='cuda:0', grad_fn=<MseLossBackward>)
  26627. loss_train_step after backward: tensor(0.0225, device='cuda:0', grad_fn=<MseLossBackward>)
  26628. loss_train: 2.365304049104452
  26629. step: 85
  26630. running loss: 0.02782710646005238
  26631. Train Steps: 85/90 Loss: 0.0278 torch.Size([8, 600, 800])
  26632. torch.Size([8, 8])
  26633. tensor([[0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  26634. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  26635. [0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  26636. [0.6135, 0.4115, 0.8838, 0.4667, 0.4288, 0.6050, 0.5778, 0.5097],
  26637. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  26638. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  26639. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  26640. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505]],
  26641. device='cuda:0', dtype=torch.float64)
  26642. predictions are: tensor([[ 0.4752, -0.4915, 1.7250, -0.1743, -0.5882, -0.1805, 0.7140, 0.1793],
  26643. [ 0.5620, -0.3887, 1.4668, -1.3343, -0.3144, -1.1160, 0.8748, 0.2578],
  26644. [ 0.6195, -0.3832, 1.7568, -0.3389, -0.4534, 0.3030, 0.6783, 0.1351],
  26645. [ 0.3791, -0.4708, 1.6688, -0.3477, -0.2809, 0.3300, 0.3379, 0.1553],
  26646. [ 0.5733, -0.3845, 1.6611, 0.1772, -0.4800, -0.0565, 0.3584, 0.3798],
  26647. [ 0.5504, -0.4220, 1.6632, -0.1711, -0.4728, -0.0582, 0.2567, 0.2242],
  26648. [ 0.5528, -0.4051, 0.8821, -1.4736, -0.3661, -1.5189, 0.3338, 0.2473],
  26649. [ 0.6205, -0.3280, 1.5286, -0.6112, -0.6699, -0.7295, 0.0736, 0.2279]],
  26650. device='cuda:0', grad_fn=<AddmmBackward>)
  26651. landmarks are: tensor([[[ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  26652. 0.0774],
  26653. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  26654. 0.2944],
  26655. [ 0.5934, -0.4276, 1.8192, -0.1458, -0.4499, 0.3777, 0.6702,
  26656. 0.1082],
  26657. [ 0.5477, -0.3851, 1.7961, -0.1304, -0.3055, 0.5085, 0.3830,
  26658. 0.0682],
  26659. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  26660. 0.3007],
  26661. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  26662. 0.2035],
  26663. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  26664. 0.1253],
  26665. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  26666. 0.2567]]], device='cuda:0')
  26667. loss_train_step before backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  26668. loss_train_step after backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  26669. loss_train: 2.374746444635093
  26670. step: 86
  26671. running loss: 0.027613330751570853
  26672. Train Steps: 86/90 Loss: 0.0276 torch.Size([8, 600, 800])
  26673. torch.Size([8, 8])
  26674. tensor([[0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  26675. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  26676. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  26677. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  26678. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  26679. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  26680. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  26681. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356]],
  26682. device='cuda:0', dtype=torch.float64)
  26683. predictions are: tensor([[ 0.3664, -0.5092, 1.3370, -1.0725, -0.5688, -0.9993, 0.1131, 0.0623],
  26684. [ 0.6189, -0.3521, 1.7721, -0.1010, -0.5002, -0.3470, 0.6110, 0.1564],
  26685. [ 0.2863, -0.5541, 1.6003, -0.9776, -0.1182, -1.1446, 0.6046, 0.1507],
  26686. [ 0.2970, -0.5251, 0.9866, -1.2467, -0.2565, -1.2284, 0.3042, 0.3866],
  26687. [ 0.7506, -0.2783, 1.5889, -0.8261, -0.6352, 0.0359, 0.5611, 0.2387],
  26688. [ 0.5821, -0.3698, 1.6028, 0.0332, -0.5533, -0.3493, 0.1958, 0.3500],
  26689. [ 0.2462, -0.6476, 1.4856, 0.0648, -0.5149, 0.1151, 0.7020, 0.1618],
  26690. [ 0.6343, -0.3339, 1.3000, -1.2645, -0.3201, -1.0795, 0.7160, 0.1657]],
  26691. device='cuda:0', grad_fn=<AddmmBackward>)
  26692. landmarks are: tensor([[[ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  26693. -0.0220],
  26694. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  26695. 0.1661],
  26696. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  26697. 0.1501],
  26698. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  26699. 0.3931],
  26700. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  26701. 0.2083],
  26702. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  26703. 0.3392],
  26704. [ 0.6289, -0.4393, 1.3977, 0.3777, -0.5134, -0.0457, 1.0984,
  26705. 0.1821],
  26706. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  26707. 0.1879]]], device='cuda:0')
  26708. loss_train_step before backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  26709. loss_train_step after backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  26710. loss_train: 2.3958609933033586
  26711. step: 87
  26712. running loss: 0.027538632106935156
  26713.  
  26714. Train Steps: 87/90 Loss: 0.0275 torch.Size([8, 600, 800])
  26715. torch.Size([8, 8])
  26716. tensor([[0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  26717. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  26718. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  26719. [0.6260, 0.4153, 0.9000, 0.4533, 0.4025, 0.2633, 0.6223, 0.4967],
  26720. [0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  26721. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  26722. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  26723. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356]],
  26724. device='cuda:0', dtype=torch.float64)
  26725. predictions are: tensor([[ 0.3245, -0.5463, 1.6416, 0.1805, -0.5145, -0.1114, 0.1358, 0.1085],
  26726. [ 0.4553, -0.4918, 1.4523, 0.0928, -0.5212, 0.1824, 0.9054, 0.2236],
  26727. [ 0.5183, -0.4307, 1.6151, -0.0479, -0.1344, 0.1879, 0.0953, 0.3011],
  26728. [ 0.4604, -0.4627, 1.8237, -0.4227, -0.4729, -0.9072, 0.5547, 0.1219],
  26729. [ 0.5760, -0.3800, 1.4301, -0.8783, -0.5904, -0.7605, 0.3787, 0.2626],
  26730. [ 0.4793, -0.4195, 1.2977, -1.1489, -0.4808, -0.8817, 0.4595, 0.2736],
  26731. [ 0.5724, -0.3816, 1.1668, -1.3779, -0.2650, -1.3689, 0.5275, 0.1317],
  26732. [ 0.6453, -0.3177, 1.3266, -1.2657, -0.3371, -1.0873, 0.7413, 0.1793]],
  26733. device='cuda:0', grad_fn=<AddmmBackward>)
  26734. landmarks are: tensor([[[ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  26735. -0.0370],
  26736. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  26737. 0.1928],
  26738. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  26739. 0.2237],
  26740. [ 0.6055, -0.3676, 1.8711, -0.1920, -0.4268, -1.0696, 0.5887,
  26741. 0.0081],
  26742. [ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  26743. 0.3087],
  26744. [ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  26745. 0.2622],
  26746. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  26747. 0.1005],
  26748. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  26749. 0.1879]]], device='cuda:0')
  26750. loss_train_step before backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  26751. loss_train_step after backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  26752. loss_train: 2.4076440930366516
  26753. step: 88
  26754. running loss: 0.027359591966325588
  26755. Train Steps: 88/90 Loss: 0.0274 torch.Size([8, 600, 800])
  26756. torch.Size([8, 8])
  26757. tensor([[0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  26758. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  26759. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  26760. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  26761. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  26762. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  26763. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  26764. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142]],
  26765. device='cuda:0', dtype=torch.float64)
  26766. predictions are: tensor([[ 0.8967, -0.1894, 1.6235, -0.5461, -0.5360, -0.7694, 0.4593, 0.1840],
  26767. [ 0.7258, -0.2661, 1.1216, -1.2929, -0.1953, -1.4731, 0.5593, 0.1530],
  26768. [ 0.6065, -0.3242, 1.6106, -0.5376, -0.5609, -0.3627, 0.5166, 0.2849],
  26769. [ 0.7895, -0.2600, 1.5678, 0.1344, -0.4056, -0.0342, 0.4855, 0.2049],
  26770. [ 0.5367, -0.4251, 1.5836, 0.1638, -0.4319, -0.0222, 0.6117, 0.1143],
  26771. [ 0.9586, -0.0897, 1.6710, -0.7051, -0.5443, -0.4784, 0.5907, 0.1210],
  26772. [ 0.7902, -0.2370, 1.5886, -0.1792, -0.1250, 0.1207, 0.3287, 0.1890],
  26773. [-1.6931, -1.8893, 1.3705, -0.9159, -0.5961, -0.7617, 0.1850, 0.1535]],
  26774. device='cuda:0', grad_fn=<AddmmBackward>)
  26775. landmarks are: tensor([[[ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  26776. 0.1005],
  26777. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  26778. 0.1005],
  26779. [ 0.6009, -0.3710, 1.7961, -0.4691, -0.6289, -0.3075, 0.5605,
  26780. 0.1929],
  26781. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  26782. 0.1979],
  26783. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  26784. 0.0697],
  26785. [ 0.6077, -0.3965, 1.8480, -0.6539, -0.6231, -0.4537, 0.6216,
  26786. -0.0220],
  26787. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  26788. 0.2622],
  26789. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  26790. 0.0893]]], device='cuda:0')
  26791. loss_train_step before backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  26792. loss_train_step after backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  26793. loss_train: 2.4311892818659544
  26794. step: 89
  26795. running loss: 0.02731673350411185
  26796. Train Steps: 89/90 Loss: 0.0273 torch.Size([8, 600, 800])
  26797. torch.Size([8, 8])
  26798. tensor([[0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  26799. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  26800. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  26801. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  26802. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  26803. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  26804. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  26805. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650]],
  26806. device='cuda:0', dtype=torch.float64)
  26807. predictions are: tensor([[ 0.5705, -0.3882, 1.6861, -0.0167, -0.5071, -0.7305, 0.5165, 0.0700],
  26808. [ 0.6534, -0.3226, 1.5963, -0.2239, -0.1139, 0.3164, 0.3441, 0.1890],
  26809. [ 0.5489, -0.3968, 1.0934, -1.3142, -0.5016, -1.0165, 0.5338, 0.1896],
  26810. [ 0.3663, -0.4814, 1.4985, -0.4219, -0.5752, -0.7880, 0.2258, 0.3580],
  26811. [ 0.4916, -0.5086, 1.8622, -0.3967, -0.3204, -0.9278, 0.9234, 0.0578],
  26812. [ 0.3684, -0.5708, 1.8041, -0.3877, -0.3142, -0.5238, 0.8517, 0.3063],
  26813. [ 0.8468, -0.2431, 1.6189, -0.1766, -0.1639, 0.3228, 0.4935, 0.1421],
  26814. [ 0.5632, -0.3607, 1.5821, -0.5251, -0.6298, -0.4061, 0.1537, 0.2595]],
  26815. device='cuda:0', grad_fn=<AddmmBackward>)
  26816. landmarks are: tensor([[[ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  26817. 0.0081],
  26818. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  26819. 0.3007],
  26820. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  26821. 0.2032],
  26822. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  26823. 0.3238],
  26824. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  26825. 0.2142],
  26826. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  26827. 0.4600],
  26828. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  26829. 0.2237],
  26830. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  26831. 0.3238]]], device='cuda:0')
  26832. loss_train_step before backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  26833. loss_train_step after backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  26834. loss_train: 2.443223439157009
  26835. step: 90
  26836. running loss: 0.027146927101744545
  26837. Valid Steps: 10/10 Loss: nan 6.5902
  26838. --------------------------------------------------
  26839. Epoch: 7 Train Loss: 0.0271 Valid Loss: nan
  26840. --------------------------------------------------
  26841. size of train loader is: 90
  26842. torch.Size([8, 600, 800])
  26843. torch.Size([8, 8])
  26844. tensor([[0.6199, 0.4112, 0.8475, 0.3717, 0.3550, 0.4350, 0.6063, 0.6083],
  26845. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  26846. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  26847. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  26848. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  26849. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  26850. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  26851. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150]],
  26852. device='cuda:0', dtype=torch.float64)
  26853. predictions are: tensor([[ 0.7039, -0.2916, 1.6499, -0.5477, -0.5646, -0.1249, 0.4112, 0.3280],
  26854. [ 0.8252, -0.2680, 1.5895, 0.4821, -0.4184, 0.0452, 0.6871, -0.0390],
  26855. [ 0.7905, -0.2879, 1.7602, -0.0484, -0.4769, -0.2194, 0.5950, 0.1834],
  26856. [ 0.7472, -0.2969, 1.6772, -0.1715, -0.5247, -0.3710, 0.4660, 0.2601],
  26857. [ 0.8241, -0.2370, 1.0809, -1.1172, -0.4864, -1.0178, 0.3043, 0.0526],
  26858. [ 0.7743, -0.2381, 1.6707, -0.4007, -0.5739, -0.3339, 0.3342, 0.2430],
  26859. [-1.4220, -1.7229, 1.8686, -0.8128, 0.0823, -1.1515, 0.7699, 0.2080],
  26860. [ 0.5649, -0.4012, 1.3509, -1.1256, -0.2297, -1.2799, 0.5118, 0.0663]],
  26861. device='cuda:0', grad_fn=<AddmmBackward>)
  26862. landmarks are: tensor([[[ 0.5774, -0.3868, 1.6286, -0.5692, -0.6462, -0.2767, 0.5143,
  26863. 0.5239],
  26864. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  26865. -0.1492],
  26866. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  26867. 0.2314],
  26868. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  26869. 0.2853],
  26870. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  26871. 0.0802],
  26872. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  26873. 0.3238],
  26874. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  26875. 0.3478],
  26876. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  26877. 0.0928]]], device='cuda:0')
  26878. loss_train_step before backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  26879.  
  26880. loss_train_step after backward: tensor(0.0307, device='cuda:0', grad_fn=<MseLossBackward>)
  26881. loss_train: 0.030708475038409233
  26882. step: 1
  26883. running loss: 0.030708475038409233
  26884. Train Steps: 1/90 Loss: 0.0307 torch.Size([8, 600, 800])
  26885. torch.Size([8, 8])
  26886. tensor([[0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  26887. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  26888. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  26889. [0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  26890. [0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  26891. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050],
  26892. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  26893. [0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207]],
  26894. device='cuda:0', dtype=torch.float64)
  26895. predictions are: tensor([[ 0.7814, -0.3283, 1.7350, 0.3717, -0.6610, -0.2527, 0.6901, 0.0986],
  26896. [ 0.4466, -0.4523, 1.5270, -0.9148, -0.1701, -1.3227, 0.4904, 0.1241],
  26897. [ 0.5207, -0.4192, 1.7305, 0.0228, -0.3488, 0.1860, 0.1492, 0.2329],
  26898. [ 0.1713, -0.6661, 1.9103, -0.2153, -0.4411, -0.7909, 0.6483, 0.1719],
  26899. [ 0.6538, -0.4094, 1.7988, -0.7230, -0.2640, -0.6816, 1.0283, 0.1449],
  26900. [ 0.6401, -0.3794, 1.7304, 0.2279, -0.2252, 0.2746, 0.4670, 0.1517],
  26901. [ 0.6683, -0.3525, 1.0400, -1.2745, -0.3444, -1.4572, 0.2691, 0.1660],
  26902. [ 0.5483, -0.4067, 1.2148, -0.8755, -0.6606, -0.2426, 0.4862, 0.2548]],
  26903. device='cuda:0', grad_fn=<AddmmBackward>)
  26904. landmarks are: tensor([[[ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  26905. -0.1278],
  26906. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  26907. 0.2083],
  26908. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  26909. 0.4032],
  26910. [ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  26911. 0.1608],
  26912. [ 0.6224, -0.4105, 1.9173, -0.7771, -0.1030, -0.7308, 1.1532,
  26913. 0.1875],
  26914. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  26915. 0.0467],
  26916. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  26917. 0.1253],
  26918. [ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  26919. 0.1193]]], device='cuda:0')
  26920. loss_train_step before backward: tensor(0.0126, device='cuda:0', grad_fn=<MseLossBackward>)
  26921. loss_train_step after backward: tensor(0.0126, device='cuda:0', grad_fn=<MseLossBackward>)
  26922. loss_train: 0.043306597508490086
  26923. step: 2
  26924. running loss: 0.021653298754245043
  26925. Train Steps: 2/90 Loss: 0.0217 torch.Size([8, 600, 800])
  26926. torch.Size([8, 8])
  26927. tensor([[0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  26928. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  26929. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  26930. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  26931. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200],
  26932. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  26933. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  26934. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274]],
  26935. device='cuda:0', dtype=torch.float64)
  26936. predictions are: tensor([[ 0.5350, -0.4089, 1.6639, -0.7590, -0.2530, -1.2740, 0.3201, 0.0325],
  26937. [ 0.6042, -0.3893, 1.6976, -0.0241, -0.5590, 0.0529, 0.2902, 0.2995],
  26938. [ 0.5105, -0.4591, 1.2283, -1.1165, -0.2299, -1.4138, 0.3845, 0.1057],
  26939. [ 0.5441, -0.4624, 1.8066, -0.1762, -0.5450, -0.5049, 0.5332, 0.1960],
  26940. [ 0.2679, -0.5802, 1.7151, -0.9117, -0.2376, -1.0972, 0.5032, 0.1522],
  26941. [ 0.6417, -0.3980, 1.3725, 0.3973, -0.4975, 0.1530, 0.8924, 0.2196],
  26942. [ 0.7965, -0.3336, 1.8087, -0.2137, -0.5701, 0.3298, 0.9831, 0.1608],
  26943. [ 0.3200, -0.5568, 1.6624, -0.7711, -0.0910, -1.2281, 0.5951, 0.1513]],
  26944. device='cuda:0', grad_fn=<AddmmBackward>)
  26945. landmarks are: tensor([[[ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  26946. -0.0368],
  26947. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  26948. 0.3161],
  26949. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  26950. 0.1005],
  26951. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  26952. 0.1005],
  26953. [ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  26954. 0.1159],
  26955. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  26956. 0.1928],
  26957. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  26958. 0.1715],
  26959. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  26960. 0.1501]]], device='cuda:0')
  26961. loss_train_step before backward: tensor(0.0125, device='cuda:0', grad_fn=<MseLossBackward>)
  26962. loss_train_step after backward: tensor(0.0125, device='cuda:0', grad_fn=<MseLossBackward>)
  26963. loss_train: 0.055825852788984776
  26964. step: 3
  26965. running loss: 0.01860861759632826
  26966. Train Steps: 3/90 Loss: 0.0186 torch.Size([8, 600, 800])
  26967. torch.Size([8, 8])
  26968. tensor([[0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  26969. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  26970. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  26971. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  26972. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  26973. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  26974. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  26975. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133]],
  26976. device='cuda:0', dtype=torch.float64)
  26977. predictions are: tensor([[ 0.5987, -0.4661, 1.6236, -0.9908, -0.4434, -1.1789, 0.7196, 0.0251],
  26978. [ 0.5112, -0.4525, 1.0903, -0.8345, -0.6445, -0.8166, 0.3535, 0.3133],
  26979. [ 0.5388, -0.4309, 1.4379, -0.4941, -0.6618, -0.5530, 0.2934, 0.3137],
  26980. [ 0.7562, -0.3317, 1.7788, -0.3304, -0.7112, -0.4528, 0.5880, 0.0941],
  26981. [ 0.3007, -0.6169, 1.8800, 0.0517, -0.2237, 0.4643, 0.7065, 0.1734],
  26982. [ 0.7015, -0.3517, 1.8053, 0.2233, 0.0085, 0.0399, 0.4138, 0.1027],
  26983. [ 0.3611, -0.5971, 1.8793, 0.2300, -0.4435, -0.2307, 0.6075, 0.0287],
  26984. [ 0.8464, -0.2693, 1.6988, -0.9977, -0.0583, -1.6439, 0.7758, 0.0953]],
  26985. device='cuda:0', grad_fn=<AddmmBackward>)
  26986. landmarks are: tensor([[[ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  26987. -0.0220],
  26988. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  26989. 0.3315],
  26990. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  26991. 0.3417],
  26992. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  26993. 0.0236],
  26994. [ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  26995. 0.1929],
  26996. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  26997. 0.0532],
  26998. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  26999. 0.0313],
  27000. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  27001. 0.0851]]], device='cuda:0')
  27002. loss_train_step before backward: tensor(0.0153, device='cuda:0', grad_fn=<MseLossBackward>)
  27003. loss_train_step after backward: tensor(0.0153, device='cuda:0', grad_fn=<MseLossBackward>)
  27004. loss_train: 0.07109592575579882
  27005. step: 4
  27006. running loss: 0.017773981438949704
  27007. Train Steps: 4/90 Loss: 0.0178 torch.Size([8, 600, 800])
  27008. torch.Size([8, 8])
  27009. tensor([[0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  27010. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  27011. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  27012. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  27013. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  27014. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  27015. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  27016. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717]],
  27017. device='cuda:0', dtype=torch.float64)
  27018. predictions are: tensor([[ 0.7477, -0.3178, 1.2301, -0.7151, -0.6086, -0.7426, 0.3208, 0.1037],
  27019. [-1.8269, -1.9756, 1.2389, -1.0472, -0.3977, -1.2951, 0.2191, 0.1287],
  27020. [ 1.0299, -0.0680, 1.6474, -0.3865, -0.0985, -1.2672, 0.6018, 0.2814],
  27021. [ 0.8511, -0.2321, 1.9707, -0.4202, -0.4431, -1.0457, 0.6645, 0.0311],
  27022. [ 1.0978, -0.1226, 1.8701, 0.1610, -0.4615, 0.1962, 0.8286, 0.0466],
  27023. [-1.8291, -1.9821, 1.4092, -1.0083, -0.3946, -1.1683, 0.3364, 0.0987],
  27024. [ 0.9370, -0.1767, 1.8685, 0.0554, -0.0661, 0.2181, 0.7632, 0.1283],
  27025. [ 1.0451, -0.1336, 1.0969, -0.9064, -0.4676, -1.1103, 0.4340, 0.2015]],
  27026. device='cuda:0', grad_fn=<AddmmBackward>)
  27027. landmarks are: tensor([[[ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  27028. 0.1710],
  27029. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  27030. 0.3238],
  27031. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  27032. 0.5882],
  27033. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  27034. 0.2139],
  27035. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  27036. 0.0688],
  27037. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  27038. 0.2853],
  27039. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  27040. 0.3007],
  27041. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  27042. 0.3546]]], device='cuda:0')
  27043. loss_train_step before backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  27044. loss_train_step after backward: tensor(0.0528, device='cuda:0', grad_fn=<MseLossBackward>)
  27045. loss_train: 0.12389781419187784
  27046. step: 5
  27047. running loss: 0.02477956283837557
  27048.  
  27049. Train Steps: 5/90 Loss: 0.0248 torch.Size([8, 600, 800])
  27050. torch.Size([8, 8])
  27051. tensor([[0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  27052. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  27053. [0.6276, 0.4120, 0.8738, 0.3133, 0.4225, 0.2217, 0.6203, 0.4892],
  27054. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  27055. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  27056. [0.6250, 0.4146, 0.8838, 0.3933, 0.3588, 0.4283, 0.6162, 0.5367],
  27057. [0.6129, 0.4069, 0.8750, 0.5067, 0.3875, 0.4233, 0.5235, 0.5881],
  27058. [0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947]],
  27059. device='cuda:0', dtype=torch.float64)
  27060. predictions are: tensor([[ 0.4496, -0.4924, 1.7601, 0.0577, -0.3639, -0.1169, 0.4771, 0.1180],
  27061. [ 0.6491, -0.3763, 1.2254, -0.8365, -0.5457, -0.9526, 0.2617, 0.0583],
  27062. [ 0.7002, -0.3444, 1.8390, -0.6355, -0.3098, -1.3207, 0.7930, 0.0159],
  27063. [ 0.8954, -0.2209, 1.8416, -0.0108, -0.3952, 0.1701, 0.6371, 0.1106],
  27064. [-2.1383, -2.1947, 1.1317, -1.1560, -0.4116, -1.2603, 0.1670, 0.1438],
  27065. [ 0.7399, -0.3151, 1.7280, -0.3167, -0.5821, -0.4310, 0.7327, 0.2390],
  27066. [ 0.7173, -0.3291, 1.7100, 0.2690, -0.4947, -0.3467, 0.2674, 0.3007],
  27067. [ 0.7036, -0.3440, 1.5613, -1.0072, 0.0162, -1.4975, 0.7395, 0.0891]],
  27068. device='cuda:0', grad_fn=<AddmmBackward>)
  27069. landmarks are: tensor([[[ 5.7460e-01, -3.6231e-01, 1.7961e+00, -1.1501e-01, -3.6905e-01,
  27070. -3.8029e-02, 2.2079e-01, 1.4394e-01],
  27071. [ 5.2194e-01, -4.5504e-01, 1.1415e+00, -9.1962e-01, -6.4042e-01,
  27072. -9.3872e-01, 1.8562e-01, 1.4106e-02],
  27073. [ 6.1282e-01, -3.8283e-01, 1.7499e+00, -8.3865e-01, -3.3441e-01,
  27074. -1.2620e+00, 5.7925e-01, -2.6256e-02],
  27075. [ 5.7113e-01, -3.7875e-01, 1.8249e+00, -1.7660e-01, -4.6721e-01,
  27076. 2.1601e-01, 3.6246e-01, 7.4222e-02],
  27077. [-2.2859e+00, -2.2859e+00, 1.0513e+00, -1.2851e+00, -4.4411e-01,
  27078. -1.2313e+00, 2.2057e-01, 1.0729e-01],
  27079. [ 6.0092e-01, -3.7098e-01, 1.7961e+00, -4.6913e-01, -6.2887e-01,
  27080. -3.0747e-01, 5.6051e-01, 1.9292e-01],
  27081. [ 5.4515e-01, -4.0670e-01, 1.7557e+00, 5.4350e-02, -4.9607e-01,
  27082. -3.3056e-01, 1.3228e-01, 4.3063e-01],
  27083. [ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  27084. -1.5777e+00, 6.0099e-01, -9.2270e-04]]], device='cuda:0')
  27085. loss_train_step before backward: tensor(0.0142, device='cuda:0', grad_fn=<MseLossBackward>)
  27086. loss_train_step after backward: tensor(0.0142, device='cuda:0', grad_fn=<MseLossBackward>)
  27087. loss_train: 0.13813432399183512
  27088. step: 6
  27089. running loss: 0.02302238733197252
  27090. Train Steps: 6/90 Loss: 0.0230 torch.Size([8, 600, 800])
  27091. torch.Size([8, 8])
  27092. tensor([[0.6234, 0.4023, 0.8888, 0.4633, 0.3975, 0.5767, 0.6400, 0.5183],
  27093. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  27094. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  27095. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  27096. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  27097. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  27098. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  27099. [0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366]],
  27100. device='cuda:0', dtype=torch.float64)
  27101. predictions are: tensor([[ 0.5177, -0.5142, 1.8768, -0.0287, -0.3660, 0.3563, 0.6098, 0.1759],
  27102. [ 0.6169, -0.4642, 1.7793, 0.2798, -0.4347, 0.0232, 0.5844, 0.0657],
  27103. [ 0.5446, -0.4551, 1.5762, -0.3746, -0.5773, -0.6849, 0.3518, 0.4858],
  27104. [ 0.5052, -0.5054, 1.2804, -1.1753, -0.3175, -1.4387, 0.2268, 0.0866],
  27105. [ 0.4783, -0.5226, 1.5799, -1.2029, -0.2695, -1.2095, 0.7283, 0.0610],
  27106. [ 0.5183, -0.5346, 1.5911, -0.9976, -0.3980, -1.1554, 0.4931, 0.0675],
  27107. [ 0.4365, -0.5086, 1.7467, -0.3318, -0.5918, -0.4954, 0.2639, 0.3172],
  27108. [ 0.5277, -0.5272, 1.8241, 0.2649, -0.4634, -0.5806, 0.9055, 0.0354]],
  27109. device='cuda:0', grad_fn=<AddmmBackward>)
  27110. landmarks are: tensor([[[ 5.9336e-01, -4.2756e-01, 1.8192e+00, -1.4580e-01, -4.4988e-01,
  27111. 3.7768e-01, 6.7021e-01, 1.0824e-01],
  27112. [ 5.9082e-01, -4.3664e-01, 1.7557e+00, 1.3903e-01, -5.1917e-01,
  27113. 1.3133e-01, 6.5289e-01, 2.3557e-02],
  27114. [ 5.4376e-01, -4.2055e-01, 1.5189e+00, -4.5373e-01, -6.1155e-01,
  27115. -6.2309e-01, 4.3649e-01, 5.4914e-01],
  27116. [ 5.5978e-01, -4.2008e-01, 1.1898e+00, -1.3005e+00, -3.8060e-01,
  27117. -1.3313e+00, 3.8730e-01, 7.7444e-02],
  27118. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  27119. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  27120. [ 6.0421e-01, -4.2248e-01, 1.5420e+00, -1.2082e+00, -4.7298e-01,
  27121. -1.0311e+00, 6.3800e-01, -2.1963e-02],
  27122. [ 5.7569e-01, -3.9169e-01, 1.7095e+00, -4.7683e-01, -6.3464e-01,
  27123. -4.2294e-01, 3.9307e-01, 3.2379e-01],
  27124. [ 6.2730e-01, -4.2490e-01, 1.7095e+00, 1.1594e-01, -5.4804e-01,
  27125. -4.3064e-01, 1.0910e+00, 1.9283e-01]]], device='cuda:0')
  27126. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  27127. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  27128. loss_train: 0.14870771393179893
  27129. step: 7
  27130. running loss: 0.021243959133114134
  27131. Train Steps: 7/90 Loss: 0.0212 torch.Size([8, 600, 800])
  27132. torch.Size([8, 8])
  27133. tensor([[0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  27134. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  27135. [0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874],
  27136. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991],
  27137. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  27138. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  27139. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  27140. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633]],
  27141. device='cuda:0', dtype=torch.float64)
  27142. predictions are: tensor([[ 0.5176, -0.4837, 1.0740, -1.1601, -0.4477, -1.2307, 0.2159, 0.1664],
  27143. [ 0.6377, -0.4477, 1.5012, -1.2757, -0.1299, -1.4302, 0.5491, -0.0120],
  27144. [ 0.5548, -0.4542, 1.6038, 0.3398, -0.4500, 0.0341, 0.0801, 0.2882],
  27145. [-0.2789, -1.0308, 1.9276, -0.5532, -0.2452, -0.9053, 1.0819, 0.2952],
  27146. [ 0.6326, -0.4496, 1.7682, 0.0528, -0.6594, -0.1615, 0.5851, 0.0823],
  27147. [ 0.3568, -0.5675, 1.6265, -1.0354, -0.0946, -1.2957, 0.5937, 0.0173],
  27148. [ 0.4348, -0.5392, 1.7455, -0.7572, -0.4726, -0.8393, 0.7825, 0.1674],
  27149. [ 0.4264, -0.4988, 1.6926, 0.0959, -0.7095, -0.5125, 0.3129, 0.2892]],
  27150. device='cuda:0', grad_fn=<AddmmBackward>)
  27151. landmarks are: tensor([[[ 5.8505e-01, -3.9246e-01, 1.0513e+00, -1.3467e+00, -3.5173e-01,
  27152. -1.2620e+00, 4.7390e-01, 1.5443e-01],
  27153. [ 6.1264e-01, -4.0570e-01, 1.4439e+00, -1.3159e+00, -1.1501e-01,
  27154. -1.5777e+00, 5.5366e-01, -5.2974e-02],
  27155. [ 5.4527e-01, -4.0908e-01, 1.7499e+00, 1.3903e-01, -2.9400e-01,
  27156. -9.9615e-02, 1.2997e-01, 4.2725e-01],
  27157. [ 6.4871e-01, -3.7916e-01, 1.9346e+00, -6.5389e-01, -1.2079e-01,
  27158. -7.8476e-01, 1.0143e+00, 4.8139e-01],
  27159. [ 6.0754e-01, -4.5138e-01, 1.8032e+00, -8.2167e-02, -5.0606e-01,
  27160. -2.0228e-01, 6.2076e-01, 1.7788e-01],
  27161. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  27162. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  27163. [ 6.0260e-01, -4.0323e-01, 1.7326e+00, -7.7706e-01, -3.6905e-01,
  27164. -8.6174e-01, 9.7040e-01, 3.0505e-01],
  27165. [ 5.9024e-01, -3.4927e-01, 1.7961e+00, -7.2363e-03, -5.9423e-01,
  27166. -5.6151e-01, 3.1801e-01, 3.1609e-01]]], device='cuda:0')
  27167. loss_train_step before backward: tensor(0.0322, device='cuda:0', grad_fn=<MseLossBackward>)
  27168. loss_train_step after backward: tensor(0.0322, device='cuda:0', grad_fn=<MseLossBackward>)
  27169. loss_train: 0.18095311149954796
  27170. step: 8
  27171. running loss: 0.022619138937443495
  27172.  
  27173. Train Steps: 8/90 Loss: 0.0226 torch.Size([8, 600, 800])
  27174. torch.Size([8, 8])
  27175. tensor([[0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  27176. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  27177. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  27178. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695],
  27179. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  27180. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  27181. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  27182. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500]],
  27183. device='cuda:0', dtype=torch.float64)
  27184. predictions are: tensor([[ 0.3702, -0.6153, 1.9485, 0.0180, -0.6251, -0.1912, 0.5284, 0.1265],
  27185. [ 0.3924, -0.5669, 1.9019, 0.1812, -0.2794, 0.3535, 0.4786, 0.1891],
  27186. [ 0.4712, -0.5183, 1.9494, -0.0167, -0.5042, -0.3461, 0.3179, 0.1923],
  27187. [ 0.0712, -0.7806, 1.0954, -1.0432, -0.4323, -1.4276, 0.1083, 0.2082],
  27188. [ 0.5518, -0.4915, 1.3219, -1.1241, -0.4176, -1.2363, 0.5847, 0.1265],
  27189. [ 0.8444, -0.3112, 1.2868, -1.1265, -0.3504, -1.2792, 0.7130, 0.1989],
  27190. [ 0.5735, -0.4880, 1.4809, -1.0457, -0.1821, -1.5007, 0.5285, 0.0796],
  27191. [ 0.3346, -0.6325, 1.4708, -0.8016, -0.6968, -0.4213, 0.6137, 0.1977]],
  27192. device='cuda:0', grad_fn=<AddmmBackward>)
  27193. landmarks are: tensor([[[ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  27194. 0.0727],
  27195. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  27196. 0.0412],
  27197. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  27198. 0.3087],
  27199. [ 0.5544, -0.4133, 0.8145, -1.2082, -0.4268, -1.3544, 0.1221,
  27200. 0.3446],
  27201. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  27202. 0.2058],
  27203. [ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  27204. 0.1852],
  27205. [ 0.5761, -0.4070, 1.2452, -1.2541, -0.1725, -1.4835, 0.4511,
  27206. 0.1545],
  27207. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  27208. 0.2545]]], device='cuda:0')
  27209. loss_train_step before backward: tensor(0.0257, device='cuda:0', grad_fn=<MseLossBackward>)
  27210. loss_train_step after backward: tensor(0.0257, device='cuda:0', grad_fn=<MseLossBackward>)
  27211. loss_train: 0.2066050637513399
  27212. step: 9
  27213. running loss: 0.022956118194593325
  27214. Train Steps: 9/90 Loss: 0.0230 torch.Size([8, 600, 800])
  27215. torch.Size([8, 8])
  27216. tensor([[0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  27217. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  27218. [0.6202, 0.4066, 0.8746, 0.3376, 0.3717, 0.3090, 0.5842, 0.5165],
  27219. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  27220. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272],
  27221. [0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  27222. [0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  27223. [0.6186, 0.4013, 0.8191, 0.3188, 0.4279, 0.2060, 0.5767, 0.5411]],
  27224. device='cuda:0', dtype=torch.float64)
  27225. predictions are: tensor([[ 0.2651, -0.6157, 1.2570, -1.0635, -0.5154, -0.8834, 0.6192, 0.2747],
  27226. [ 0.5491, -0.4932, 1.5250, 0.1891, -0.4677, 0.1058, 0.6565, 0.1900],
  27227. [ 0.3616, -0.5737, 1.6377, -0.7714, -0.6248, -0.9259, 0.4174, 0.1688],
  27228. [ 0.2940, -0.6039, 1.6172, -1.1136, -0.1859, -1.2848, 0.6837, 0.0900],
  27229. [ 0.3842, -0.5400, 1.5422, -0.7308, -0.4851, -1.1094, 0.1827, 0.2126],
  27230. [ 0.5567, -0.4578, 1.6566, -0.1017, -0.2839, 0.2518, 0.5364, 0.2497],
  27231. [ 0.4010, -0.5515, 1.8669, -0.6154, -0.2421, -1.3174, 0.5998, 0.1543],
  27232. [ 0.3493, -0.5728, 1.4240, -0.8848, -0.3612, -1.3296, 0.3260, 0.1651]],
  27233. device='cuda:0', grad_fn=<AddmmBackward>)
  27234. landmarks are: tensor([[[ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  27235. 0.2160],
  27236. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  27237. 0.1176],
  27238. [ 0.5787, -0.4077, 1.7537, -0.7263, -0.5692, -0.8586, 0.4126,
  27239. 0.1000],
  27240. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  27241. -0.0209],
  27242. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  27243. 0.1494],
  27244. [ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  27245. 0.1236],
  27246. [ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  27247. 0.0171],
  27248. [ 0.5713, -0.4321, 1.4975, -0.8134, -0.3094, -1.3345, 0.3779,
  27249. 0.2134]]], device='cuda:0')
  27250. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  27251. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  27252. loss_train: 0.22040296904742718
  27253. step: 10
  27254. running loss: 0.02204029690474272
  27255. Train Steps: 10/90 Loss: 0.0220 torch.Size([8, 600, 800])
  27256. torch.Size([8, 8])
  27257. tensor([[0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  27258. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  27259. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  27260. [0.6264, 0.3972, 0.8853, 0.4771, 0.3853, 0.4511, 0.6293, 0.5334],
  27261. [0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  27262. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  27263. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  27264. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117]],
  27265. device='cuda:0', dtype=torch.float64)
  27266. predictions are: tensor([[ 0.5814, -0.4430, 1.4538, -1.1155, -0.4904, -1.2293, 0.2936, -0.0107],
  27267. [-1.1313, -1.5455, 1.3149, -1.3389, -0.4164, -1.0452, 0.6576, 0.2857],
  27268. [ 0.7803, -0.3256, 1.7643, -0.2083, -0.5666, -0.6007, 0.4089, 0.1928],
  27269. [ 0.7986, -0.3300, 1.8533, -0.2059, -0.5074, -0.3374, 0.7314, 0.1213],
  27270. [ 0.5316, -0.4786, 1.6618, -0.5652, -0.6384, -0.3324, 0.4430, 0.1096],
  27271. [ 0.5207, -0.4637, 1.5275, -0.6416, -0.4408, -1.1248, 0.3544, 0.2698],
  27272. [ 0.5309, -0.4870, 1.8894, -0.3099, -0.1636, -0.0802, 0.3456, 0.0679],
  27273. [ 0.7446, -0.3162, 1.5247, 0.2188, -0.4249, -0.1904, 0.4876, 0.4739]],
  27274. device='cuda:0', grad_fn=<AddmmBackward>)
  27275. landmarks are: tensor([[[ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  27276. -0.0220],
  27277. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  27278. 0.3315],
  27279. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  27280. 0.1082],
  27281. [ 0.6075, -0.4514, 1.8032, -0.0822, -0.5061, -0.2023, 0.6208,
  27282. 0.1779],
  27283. [ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  27284. 0.0840],
  27285. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  27286. 0.3928],
  27287. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  27288. 0.0051],
  27289. [ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  27290. 0.5393]]], device='cuda:0')
  27291. loss_train_step before backward: tensor(0.0416, device='cuda:0', grad_fn=<MseLossBackward>)
  27292. loss_train_step after backward: tensor(0.0416, device='cuda:0', grad_fn=<MseLossBackward>)
  27293. loss_train: 0.26203702203929424
  27294. step: 11
  27295. running loss: 0.023821547458117657
  27296. Train Steps: 11/90 Loss: 0.0238 torch.Size([8, 600, 800])
  27297. torch.Size([8, 8])
  27298. tensor([[0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  27299. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  27300. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  27301. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  27302. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  27303. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  27304. [0.6127, 0.4119, 0.8650, 0.5300, 0.4512, 0.5250, 0.5260, 0.5461],
  27305. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892]],
  27306. device='cuda:0', dtype=torch.float64)
  27307. predictions are: tensor([[ 0.6080, -0.3856, 1.7336, -0.8982, -0.5061, -1.2318, 0.4152, 0.1341],
  27308. [ 0.4990, -0.4607, 1.6878, -0.4426, -0.1015, 0.0150, 0.4344, 0.2551],
  27309. [ 0.6212, -0.4318, 1.8470, -0.4213, -0.5903, -0.3445, 0.9861, 0.1653],
  27310. [ 0.5750, -0.4459, 1.7188, -0.4567, -0.6006, -0.5663, 0.4482, 0.2204],
  27311. [ 0.3180, -0.5996, 1.5562, 0.1008, -0.2646, -0.2010, 0.1075, 0.1433],
  27312. [ 0.6339, -0.4288, 1.7481, -0.3449, -0.6115, -0.3539, 0.6958, 0.1332],
  27313. [ 0.5634, -0.4427, 1.6698, -0.0794, -0.2126, -0.0684, 0.2679, 0.2849],
  27314. [ 0.5064, -0.4542, 1.6120, -0.4523, -0.6879, -0.7564, 0.0842, 0.3415]],
  27315. device='cuda:0', grad_fn=<AddmmBackward>)
  27316. landmarks are: tensor([[[ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  27317. 0.2139],
  27318. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  27319. 0.3007],
  27320. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  27321. 0.2516],
  27322. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  27323. 0.2314],
  27324. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  27325. -0.0610],
  27326. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  27327. 0.0774],
  27328. [ 0.5443, -0.3831, 1.7095, 0.1621, -0.2016, 0.1390, 0.1437,
  27329. 0.2364],
  27330. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  27331. 0.4357]]], device='cuda:0')
  27332. loss_train_step before backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  27333. loss_train_step after backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  27334. loss_train: 0.2831164803355932
  27335. step: 12
  27336. running loss: 0.0235930400279661
  27337.  
  27338. Train Steps: 12/90 Loss: 0.0236 torch.Size([8, 600, 800])
  27339. torch.Size([8, 8])
  27340. tensor([[0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  27341. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  27342. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  27343. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  27344. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  27345. [0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  27346. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  27347. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600]],
  27348. device='cuda:0', dtype=torch.float64)
  27349. predictions are: tensor([[ 0.6903, -0.3651, 1.6474, -0.8374, -0.6341, -0.9663, 0.3582, 0.1343],
  27350. [ 0.7031, -0.3525, 1.8754, -0.3281, -0.5801, -0.0378, 0.9083, 0.2030],
  27351. [ 0.4434, -0.4866, 1.6338, -0.1192, -0.5832, -0.6506, 0.1753, 0.3616],
  27352. [ 0.3422, -0.5627, 1.6275, 0.1652, -0.3122, -0.0549, 0.3189, 0.1649],
  27353. [ 0.5406, -0.4587, 1.6440, -0.0238, -0.5029, -0.2293, 0.4639, 0.0663],
  27354. [ 0.3885, -0.5420, 1.1723, -1.5524, -0.3675, -1.4431, 0.3967, 0.1097],
  27355. [ 0.6008, -0.3660, 1.6981, -0.7082, -0.4588, -0.9460, 0.3118, 0.4068],
  27356. [ 0.5218, -0.4222, 1.7080, -0.3800, -0.1079, 0.0906, 0.3519, 0.2555]],
  27357. device='cuda:0', grad_fn=<AddmmBackward>)
  27358. landmarks are: tensor([[[ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  27359. 0.1963],
  27360. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  27361. 0.2302],
  27362. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  27363. 0.3392],
  27364. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  27365. 0.2237],
  27366. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  27367. 0.0697],
  27368. [ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  27369. 0.0438],
  27370. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  27371. 0.3928],
  27372. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  27373. 0.3007]]], device='cuda:0')
  27374. loss_train_step before backward: tensor(0.0163, device='cuda:0', grad_fn=<MseLossBackward>)
  27375. loss_train_step after backward: tensor(0.0163, device='cuda:0', grad_fn=<MseLossBackward>)
  27376. loss_train: 0.29939468391239643
  27377. step: 13
  27378. running loss: 0.02303036030095357
  27379. Train Steps: 13/90 Loss: 0.0230 torch.Size([8, 600, 800])
  27380. torch.Size([8, 8])
  27381. tensor([[0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  27382. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  27383. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  27384. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  27385. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  27386. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  27387. [0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  27388. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600]],
  27389. device='cuda:0', dtype=torch.float64)
  27390. predictions are: tensor([[ 0.5391, -0.4051, 1.3651, -0.6155, -0.6337, -0.3972, 0.0932, 0.1569],
  27391. [ 0.8467, -0.2399, 1.5689, -0.7761, -0.5896, -0.9227, 0.5025, 0.1898],
  27392. [ 0.7796, -0.2896, 1.7108, -0.0121, -0.4627, -0.1891, 0.6232, 0.0323],
  27393. [ 0.7671, -0.2283, 1.6868, -0.3612, -0.5792, -0.8732, 0.2958, 0.2853],
  27394. [ 0.6036, -0.3718, 1.7765, -0.1932, -0.1691, -0.1180, 0.2454, 0.3723],
  27395. [-2.3431, -2.3347, 0.9550, -1.3480, -0.4412, -1.4053, 0.1967, 0.3362],
  27396. [ 0.7980, -0.2530, 1.7662, -0.1792, -0.2901, 0.0418, 0.4128, 0.0634],
  27397. [ 0.7255, -0.2844, 1.7484, 0.0438, -0.4412, 0.1162, 0.4451, 0.2396]],
  27398. device='cuda:0', grad_fn=<AddmmBackward>)
  27399. landmarks are: tensor([[[ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  27400. 0.1552],
  27401. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  27402. 0.1621],
  27403. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  27404. 0.0697],
  27405. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  27406. 0.3778],
  27407. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  27408. 0.4171],
  27409. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  27410. 0.4543],
  27411. [ 0.5614, -0.4586, 1.7587, 0.0641, -0.2998, 0.1712, 0.4958,
  27412. 0.1170],
  27413. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  27414. 0.3007]]], device='cuda:0')
  27415. loss_train_step before backward: tensor(0.0169, device='cuda:0', grad_fn=<MseLossBackward>)
  27416. loss_train_step after backward: tensor(0.0169, device='cuda:0', grad_fn=<MseLossBackward>)
  27417. loss_train: 0.3162560146301985
  27418. step: 14
  27419. running loss: 0.022589715330728462
  27420. Train Steps: 14/90 Loss: 0.0226 torch.Size([8, 600, 800])
  27421. torch.Size([8, 8])
  27422. tensor([[ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  27423. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  27424. [0.6113, 0.4088, 0.6859, 0.2208, 0.4363, 0.1700, 0.5188, 0.5533],
  27425. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  27426. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  27427. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  27428. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  27429. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672]],
  27430. device='cuda:0', dtype=torch.float64)
  27431. predictions are: tensor([[-1.8744, -2.0117, 0.9690, -1.2382, -0.4163, -1.3135, 0.1242, 0.3034],
  27432. [ 0.5949, -0.3956, 1.3967, -1.1633, -0.2750, -1.1070, 0.7447, 0.1486],
  27433. [ 0.5934, -0.3800, 0.9055, -1.2207, -0.3371, -1.3213, 0.0684, 0.2919],
  27434. [ 0.4608, -0.4651, 1.8125, 0.0842, -0.1831, 0.1602, 0.2000, 0.3755],
  27435. [ 0.6010, -0.3735, 1.6042, -0.6678, -0.7322, -0.2244, 0.4141, 0.2086],
  27436. [ 0.7164, -0.2757, 1.4874, -0.8664, -0.1305, -1.1824, 0.3852, 0.1847],
  27437. [ 0.8126, -0.2737, 1.7947, -0.4520, -0.7088, -0.3828, 0.3791, 0.0978],
  27438. [ 0.6742, -0.3727, 1.8206, 0.3258, -0.6526, -0.1677, 0.5933, 0.0655]],
  27439. device='cuda:0', grad_fn=<AddmmBackward>)
  27440. landmarks are: tensor([[[-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  27441. 0.3604],
  27442. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  27443. 0.1917],
  27444. [ 0.5377, -0.3978, 0.8824, -1.2663, -0.2709, -1.5007, 0.1102,
  27445. 0.2699],
  27446. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  27447. 0.4171],
  27448. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  27449. 0.2391],
  27450. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  27451. 0.2083],
  27452. [ 0.5783, -0.4216, 1.6847, -0.5078, -0.6732, -0.5377, 0.4752,
  27453. 0.0839],
  27454. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  27455. -0.1278]]], device='cuda:0')
  27456. loss_train_step before backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  27457. loss_train_step after backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  27458. loss_train: 0.32841287832707167
  27459. step: 15
  27460. running loss: 0.021894191888471446
  27461. Train Steps: 15/90 Loss: 0.0219 torch.Size([8, 600, 800])
  27462. torch.Size([8, 8])
  27463. tensor([[0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  27464. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  27465. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  27466. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  27467. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  27468. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  27469. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  27470. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367]],
  27471. device='cuda:0', dtype=torch.float64)
  27472. predictions are: tensor([[ 0.6738, -0.3040, 1.6709, -0.5974, -0.5665, -0.4662, 0.4484, 0.4006],
  27473. [ 0.6564, -0.3728, 1.6862, 0.2819, -0.4988, -0.4484, 0.4865, 0.1666],
  27474. [ 0.4000, -0.5246, 1.2383, -1.0922, -0.6371, -0.8293, 0.3081, 0.1241],
  27475. [ 0.6967, -0.3275, 1.8110, -0.0835, -0.4345, -0.0513, 0.5109, 0.1657],
  27476. [ 0.5529, -0.3873, 1.5040, -0.7385, -0.5744, -0.7136, 0.4337, 0.3210],
  27477. [ 0.6056, -0.3954, 1.7734, -0.2286, -0.3551, 0.1743, 0.3885, 0.1289],
  27478. [ 0.3163, -0.5174, 1.6173, -0.2200, -0.4569, -0.3970, -0.0269, 0.4105],
  27479. [ 0.4139, -0.4945, 1.7536, -0.1140, -0.1944, 0.3604, 0.4320, 0.2440]],
  27480. device='cuda:0', grad_fn=<AddmmBackward>)
  27481. landmarks are: tensor([[[ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  27482. 0.3315],
  27483. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  27484. 0.0291],
  27485. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  27486. 0.0412],
  27487. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  27488. 0.1313],
  27489. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  27490. 0.2083],
  27491. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  27492. -0.0322],
  27493. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  27494. 0.4145],
  27495. [ 0.5598, -0.4032, 1.8249, -0.1304, -0.3806, 0.4470, 0.6067,
  27496. 0.1929]]], device='cuda:0')
  27497. loss_train_step before backward: tensor(0.0115, device='cuda:0', grad_fn=<MseLossBackward>)
  27498. loss_train_step after backward: tensor(0.0115, device='cuda:0', grad_fn=<MseLossBackward>)
  27499. loss_train: 0.3399082263931632
  27500. step: 16
  27501. running loss: 0.0212442641495727
  27502.  
  27503. Train Steps: 16/90 Loss: 0.0212 torch.Size([8, 600, 800])
  27504. torch.Size([8, 8])
  27505. tensor([[0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  27506. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  27507. [0.6289, 0.4032, 0.8419, 0.5446, 0.4075, 0.5017, 0.6312, 0.5117],
  27508. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  27509. [0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  27510. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  27511. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  27512. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533]],
  27513. device='cuda:0', dtype=torch.float64)
  27514. predictions are: tensor([[ 0.7029, -0.2821, 1.0760, -1.2492, -0.3319, -1.2570, 0.1479, 0.1191],
  27515. [ 0.7587, -0.2442, 1.6849, -0.0106, -0.3610, 0.4631, 0.6869, 0.2252],
  27516. [ 0.5850, -0.3844, 1.6199, 0.0817, -0.3890, 0.0821, 0.4641, 0.0563],
  27517. [ 0.7050, -0.2352, 1.3946, -0.2707, -0.4803, -0.7746, 0.0691, 0.4567],
  27518. [ 0.6798, -0.3020, 1.7941, 0.0049, -0.3509, -0.4692, 0.7393, 0.2167],
  27519. [ 0.6755, -0.2483, 1.5387, -0.4930, -0.5451, -0.6314, 0.1540, 0.3930],
  27520. [ 0.6301, -0.3319, 1.7693, -0.2778, -0.5249, -0.2802, 0.2878, 0.1862],
  27521. [-2.3278, -2.2892, 1.3048, -0.9943, -0.5037, -0.9370, 0.2053, 0.2479]],
  27522. device='cuda:0', grad_fn=<AddmmBackward>)
  27523. landmarks are: tensor([[[ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  27524. 0.1449],
  27525. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  27526. 0.3371],
  27527. [ 0.6189, -0.4238, 1.6026, 0.2295, -0.4037, 0.0313, 0.6298,
  27528. 0.0774],
  27529. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  27530. 0.5071],
  27531. [ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  27532. 0.3692],
  27533. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  27534. 0.3238],
  27535. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  27536. 0.2314],
  27537. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  27538. 0.2699]]], device='cuda:0')
  27539. loss_train_step before backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  27540. loss_train_step after backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  27541. loss_train: 0.3556927992030978
  27542. step: 17
  27543. running loss: 0.020923105835476342
  27544. Train Steps: 17/90 Loss: 0.0209 torch.Size([8, 600, 800])
  27545. torch.Size([8, 8])
  27546. tensor([[0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  27547. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  27548. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  27549. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  27550. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  27551. [0.6203, 0.4096, 0.8862, 0.4267, 0.3538, 0.4117, 0.6025, 0.5650],
  27552. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  27553. [0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117]],
  27554. device='cuda:0', dtype=torch.float64)
  27555. predictions are: tensor([[ 0.6595, -0.3308, 1.7053, 0.3498, -0.4550, -0.0557, 0.7336, 0.1286],
  27556. [ 0.5503, -0.4199, 1.9664, -0.1062, -0.2386, -0.7404, 0.8984, 0.3366],
  27557. [ 0.4786, -0.4499, 1.0389, -1.3838, -0.2911, -0.9671, 0.3889, 0.2742],
  27558. [ 0.3249, -0.5281, 0.7924, -1.2884, -0.4708, -0.9557, 0.1264, 0.1307],
  27559. [ 0.3706, -0.5244, 1.7032, -0.2031, -0.5283, -0.3190, 0.2407, 0.3382],
  27560. [ 0.5839, -0.3540, 1.7904, -0.3297, -0.4904, -0.1844, 0.3168, 0.3530],
  27561. [ 0.2467, -0.5829, 1.6835, -0.3035, -0.5309, -0.5152, 0.2587, 0.3660],
  27562. [ 0.6686, -0.3094, 1.7843, -0.1293, -0.5499, -0.2107, 0.1485, 0.0952]],
  27563. device='cuda:0', grad_fn=<AddmmBackward>)
  27564. landmarks are: tensor([[[ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  27565. 0.2516],
  27566. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  27567. 0.3692],
  27568. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  27569. 0.2622],
  27570. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  27571. 0.0862],
  27572. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  27573. 0.2853],
  27574. [ 0.5790, -0.3940, 1.8076, -0.3152, -0.6520, -0.3844, 0.4970,
  27575. 0.3238],
  27576. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  27577. 0.2699],
  27578. [ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  27579. 0.0774]]], device='cuda:0')
  27580. loss_train_step before backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  27581. loss_train_step after backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  27582. loss_train: 0.3708633789792657
  27583. step: 18
  27584. running loss: 0.020603521054403648
  27585. Train Steps: 18/90 Loss: 0.0206 torch.Size([8, 600, 800])
  27586. torch.Size([8, 8])
  27587. tensor([[0.6236, 0.3977, 0.8985, 0.4806, 0.3835, 0.5216, 0.6613, 0.5166],
  27588. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  27589. [0.6196, 0.4068, 0.7645, 0.2234, 0.4575, 0.1737, 0.5926, 0.5284],
  27590. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  27591. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  27592. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  27593. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  27594. [0.6202, 0.4054, 0.8892, 0.4428, 0.3642, 0.3249, 0.5840, 0.5426]],
  27595. device='cuda:0', dtype=torch.float64)
  27596. predictions are: tensor([[ 0.3771, -0.5383, 1.7638, -0.0992, -0.5666, 0.2643, 0.5956, 0.2325],
  27597. [ 0.7077, -0.2939, 1.6108, -1.1808, 0.1599, -1.2673, 0.9221, 0.3429],
  27598. [ 0.5240, -0.3895, 1.0684, -1.2673, -0.2932, -1.2565, 0.1783, 0.2553],
  27599. [ 0.3992, -0.4817, 1.6507, 0.1151, -0.2505, 0.2378, 0.2202, 0.2257],
  27600. [ 0.4623, -0.4594, 1.6011, 0.3008, -0.5909, 0.1249, 0.5551, 0.2070],
  27601. [ 0.6439, -0.3487, 1.6420, 0.2801, -0.6249, -0.1156, 0.3183, 0.2343],
  27602. [ 0.3152, -0.5551, 1.8351, -0.2781, -0.6664, -0.0461, 0.4377, 0.0753],
  27603. [ 0.6804, -0.2900, 1.7184, -0.2531, -0.6444, -0.5595, 0.2237, 0.3050]],
  27604. device='cuda:0', grad_fn=<AddmmBackward>)
  27605. landmarks are: tensor([[[ 5.9436e-01, -4.4897e-01, 1.8643e+00, -6.5918e-02, -5.1472e-01,
  27606. 1.2348e-01, 7.6842e-01, 1.0043e-01],
  27607. [ 6.3718e-01, -3.5749e-01, 1.6633e+00, -1.2082e+00, 2.1986e-01,
  27608. -1.2467e+00, 1.1313e+00, 3.0505e-01],
  27609. [ 5.7610e-01, -4.0701e-01, 1.2452e+00, -1.2541e+00, -1.7255e-01,
  27610. -1.4835e+00, 4.5107e-01, 1.5453e-01],
  27611. [ 5.7864e-01, -4.1409e-01, 1.7037e+00, 1.5443e-01, -1.8624e-01,
  27612. 7.3556e-02, 4.3926e-01, 8.5142e-02],
  27613. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  27614. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  27615. [ 5.7864e-01, -4.4627e-01, 1.6655e+00, 2.2157e-01, -5.1146e-01,
  27616. -2.6752e-01, 4.2362e-01, 2.0749e-01],
  27617. [ 6.0716e-01, -4.2055e-01, 1.8711e+00, -2.5358e-01, -6.1155e-01,
  27618. -1.3041e-01, 6.8119e-01, -6.7050e-02],
  27619. [ 5.7875e-01, -4.1347e-01, 1.8214e+00, -2.4075e-01, -6.0389e-01,
  27620. -7.8543e-01, 4.1155e-01, 2.2033e-01]]], device='cuda:0')
  27621. loss_train_step before backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  27622. loss_train_step after backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  27623. loss_train: 0.3869306379929185
  27624. step: 19
  27625. running loss: 0.020364770420679922
  27626. Train Steps: 19/90 Loss: 0.0204 torch.Size([8, 600, 800])
  27627. torch.Size([8, 8])
  27628. tensor([[0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  27629. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  27630. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  27631. [0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  27632. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367],
  27633. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  27634. [0.6332, 0.4128, 0.9200, 0.3517, 0.4400, 0.3833, 0.7461, 0.5494],
  27635. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196]],
  27636. device='cuda:0', dtype=torch.float64)
  27637. predictions are: tensor([[ 0.4445, -0.4425, 1.4694, -0.9243, -0.4568, -0.9045, 0.4037, 0.1216],
  27638. [ 0.5492, -0.4187, 1.6414, 0.1282, -0.3174, 0.0859, 0.3000, 0.2823],
  27639. [ 0.4324, -0.4828, 1.6951, 0.0454, -0.1453, 0.1048, 0.2725, 0.0768],
  27640. [ 0.2279, -0.6074, 1.3656, -0.6036, -0.7623, -0.1955, 0.3766, 0.1503],
  27641. [ 0.1854, -0.5919, 1.6488, -0.8114, -0.3160, -1.0299, 0.6023, 0.2372],
  27642. [ 0.5083, -0.4121, 1.3570, -0.8879, -0.4907, -0.6800, 0.4704, 0.3468],
  27643. [ 0.5510, -0.4482, 1.7670, -0.4521, -0.4118, -0.3523, 1.0814, 0.2116],
  27644. [ 0.7426, -0.2122, 1.5960, 0.2323, -0.3715, -0.8716, 0.3507, 0.4529]],
  27645. device='cuda:0', grad_fn=<AddmmBackward>)
  27646. landmarks are: tensor([[[ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  27647. 0.0851],
  27648. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  27649. 0.3700],
  27650. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  27651. -0.0039],
  27652. [ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  27653. 0.0351],
  27654. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  27655. 0.1929],
  27656. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  27657. 0.3392],
  27658. [ 0.6388, -0.3792, 1.9635, -0.6616, -0.2536, -0.5153, 1.1605,
  27659. 0.2516],
  27660. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  27661. 0.5762]]], device='cuda:0')
  27662. loss_train_step before backward: tensor(0.0167, device='cuda:0', grad_fn=<MseLossBackward>)
  27663. loss_train_step after backward: tensor(0.0167, device='cuda:0', grad_fn=<MseLossBackward>)
  27664. loss_train: 0.40361075196415186
  27665. step: 20
  27666. running loss: 0.020180537598207593
  27667.  
  27668. Train Steps: 20/90 Loss: 0.0202 torch.Size([8, 600, 800])
  27669. torch.Size([8, 8])
  27670. tensor([[0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  27671. [ nan, nan, 0.8850, 0.2817, 0.5112, 0.2183, 0.7184, 0.5436],
  27672. [0.6162, 0.4134, 0.6700, 0.2467, 0.3962, 0.2533, 0.5737, 0.5467],
  27673. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103],
  27674. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  27675. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  27676. [0.6145, 0.4008, 0.8750, 0.5383, 0.3975, 0.4650, 0.5563, 0.5533],
  27677. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973]],
  27678. device='cuda:0', dtype=torch.float64)
  27679. predictions are: tensor([[ 0.3955, -0.4749, 1.3898, -0.9947, -0.2276, -1.1466, 0.4303, 0.2292],
  27680. [-0.9126, -1.3647, 1.7853, -1.0556, 0.1312, -1.1487, 1.0912, 0.3533],
  27681. [ 0.5603, -0.3804, 0.8494, -1.0202, -0.4774, -1.0772, 0.3581, 0.2918],
  27682. [ 0.5956, -0.3725, 1.5091, -0.6703, -0.6470, -0.3083, 0.4570, 0.1711],
  27683. [ 0.4852, -0.4004, 1.4856, -0.3499, -0.6665, -0.7114, 0.0906, 0.3698],
  27684. [ 0.6508, -0.3468, 1.8328, -0.0150, -0.5481, 0.1108, 0.3329, 0.1858],
  27685. [ 0.6672, -0.3458, 1.7533, 0.3656, -0.3711, 0.0669, 0.4311, 0.2554],
  27686. [ 0.7912, -0.3052, 1.8702, 0.3306, -0.6130, -0.0232, 0.8078, -0.0553]],
  27687. device='cuda:0', grad_fn=<AddmmBackward>)
  27688. landmarks are: tensor([[[ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  27689. 0.2549],
  27690. [-2.2859, -2.2859, 1.8018, -0.9849, 0.0755, -1.2774, 1.0326,
  27691. 0.2249],
  27692. [ 0.5603, -0.3764, 0.8088, -1.1466, -0.4557, -1.1158, 0.3642,
  27693. 0.2391],
  27694. [ 0.5886, -0.3784, 1.4554, -0.9079, -0.6577, -0.4845, 0.3440,
  27695. 0.0712],
  27696. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  27697. 0.4374],
  27698. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  27699. 0.3469],
  27700. [ 0.5526, -0.4347, 1.7557, 0.2006, -0.4499, -0.1381, 0.2834,
  27701. 0.2699],
  27702. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  27703. 0.0111]]], device='cuda:0')
  27704. loss_train_step before backward: tensor(0.0536, device='cuda:0', grad_fn=<MseLossBackward>)
  27705. loss_train_step after backward: tensor(0.0536, device='cuda:0', grad_fn=<MseLossBackward>)
  27706. loss_train: 0.45722213480621576
  27707. step: 21
  27708. running loss: 0.021772482609819798
  27709. Train Steps: 21/90 Loss: 0.0218 torch.Size([8, 600, 800])
  27710. torch.Size([8, 8])
  27711. tensor([[0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  27712. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  27713. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  27714. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  27715. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  27716. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  27717. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  27718. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690]],
  27719. device='cuda:0', dtype=torch.float64)
  27720. predictions are: tensor([[ 0.4032, -0.5113, 1.7258, -0.0226, -0.2910, -0.1014, 0.5768, 0.1624],
  27721. [ 0.6011, -0.3635, 1.2942, -1.0630, -0.6989, -0.7143, 0.5331, 0.1748],
  27722. [ 0.5156, -0.4315, 1.7901, -0.0675, -0.0420, -0.1152, 0.4514, 0.2772],
  27723. [ 0.4480, -0.4534, 1.7835, -0.2277, -0.3825, 0.1414, 0.4593, 0.3638],
  27724. [ 0.6085, -0.3451, 1.7743, 0.1849, -0.5596, -0.3062, 0.3344, 0.4080],
  27725. [ 0.6167, -0.3827, 1.8204, 0.0671, -0.5119, -0.2906, 0.4843, -0.0131],
  27726. [ 0.6249, -0.3598, 1.8184, -0.1034, -0.5868, -0.1451, 0.3213, 0.2177],
  27727. [ 0.6213, -0.3791, 1.5676, 0.2199, -0.4263, 0.1815, 1.0220, 0.3422]],
  27728. device='cuda:0', grad_fn=<AddmmBackward>)
  27729. landmarks are: tensor([[[ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  27730. 0.1474],
  27731. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  27732. 0.2237],
  27733. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  27734. 0.2853],
  27735. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  27736. 0.4701],
  27737. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  27738. 0.3161],
  27739. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  27740. 0.0313],
  27741. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  27742. 0.3469],
  27743. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  27744. 0.3425]]], device='cuda:0')
  27745. loss_train_step before backward: tensor(0.0053, device='cuda:0', grad_fn=<MseLossBackward>)
  27746. loss_train_step after backward: tensor(0.0053, device='cuda:0', grad_fn=<MseLossBackward>)
  27747. loss_train: 0.46247611194849014
  27748. step: 22
  27749. running loss: 0.021021641452204098
  27750. Train Steps: 22/90 Loss: 0.0210 torch.Size([8, 600, 800])
  27751. torch.Size([8, 8])
  27752. tensor([[0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  27753. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  27754. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  27755. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  27756. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  27757. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  27758. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  27759. [0.6182, 0.3967, 0.8263, 0.3065, 0.3526, 0.4161, 0.6192, 0.5290]],
  27760. device='cuda:0', dtype=torch.float64)
  27761. predictions are: tensor([[ 0.4703, -0.4666, 1.7351, -1.2481, 0.1270, -1.5093, 1.1119, 0.2799],
  27762. [ 0.5133, -0.4259, 0.8617, -1.3169, -0.4766, -1.3048, 0.2593, 0.1520],
  27763. [ 0.2934, -0.5855, 1.6849, 0.3353, -0.5495, 0.0145, 0.3481, 0.2117],
  27764. [ 0.6970, -0.3230, 1.6839, 0.4214, -0.3112, 0.0768, 0.3962, 0.3051],
  27765. [ 0.5945, -0.3530, 1.7217, 0.2182, -0.2332, 0.1234, 0.2404, 0.2736],
  27766. [ 0.4804, -0.4319, 1.8376, -0.0268, -0.4507, -0.0504, 0.3362, 0.2036],
  27767. [ 0.5193, -0.4420, 1.8981, 0.0182, -0.6593, -0.2885, 0.9374, 0.2386],
  27768. [ 0.4919, -0.4813, 1.6119, -0.7349, -0.7653, -0.3712, 0.6983, 0.1223]],
  27769. device='cuda:0', grad_fn=<AddmmBackward>)
  27770. landmarks are: tensor([[[ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  27771. 0.2142],
  27772. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  27773. 0.1013],
  27774. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  27775. -0.1061],
  27776. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  27777. 0.2853],
  27778. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  27779. 0.2431],
  27780. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  27781. 0.1439],
  27782. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  27783. 0.1499],
  27784. [ 0.5697, -0.4538, 1.5308, -0.8703, -0.6572, -0.3639, 0.5739,
  27785. 0.1576]]], device='cuda:0')
  27786. loss_train_step before backward: tensor(0.0083, device='cuda:0', grad_fn=<MseLossBackward>)
  27787. loss_train_step after backward: tensor(0.0083, device='cuda:0', grad_fn=<MseLossBackward>)
  27788. loss_train: 0.4708037283271551
  27789. step: 23
  27790. running loss: 0.02046972731857196
  27791. Train Steps: 23/90 Loss: 0.0205 torch.Size([8, 600, 800])
  27792. torch.Size([8, 8])
  27793. tensor([[0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  27794. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  27795. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  27796. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  27797. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  27798. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  27799. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  27800. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450]],
  27801. device='cuda:0', dtype=torch.float64)
  27802. predictions are: tensor([[ 0.3197, -0.5203, 1.6434, -1.0400, -0.1443, -1.1808, 0.6363, 0.1232],
  27803. [ 0.2566, -0.6155, 1.8100, -0.6931, -0.4654, -0.6712, 0.7653, 0.2250],
  27804. [ 0.5813, -0.4408, 1.7087, 0.2765, -0.6172, -0.2340, 0.6644, 0.1122],
  27805. [ 0.4842, -0.4296, 1.1465, -0.9483, -0.4555, -1.0081, 0.4722, 0.4620],
  27806. [ 0.5570, -0.3612, 1.5991, -0.3948, -0.5087, -1.0276, 0.1089, 0.1086],
  27807. [ 0.5946, -0.3962, 1.6840, -0.0339, -0.1180, 0.3206, 0.4458, 0.3277],
  27808. [ 0.5608, -0.4686, 1.8304, -0.0690, -0.4417, -0.6189, 1.0276, 0.1999],
  27809. [ 0.3944, -0.5490, 1.7384, -0.1617, -0.3495, 0.2295, 0.4583, 0.2216]],
  27810. device='cuda:0', grad_fn=<AddmmBackward>)
  27811. landmarks are: tensor([[[ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  27812. -0.0209],
  27813. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  27814. 0.1390],
  27815. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  27816. 0.0291],
  27817. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  27818. 0.5624],
  27819. [ 0.5485, -0.4209, 1.6691, -0.4152, -0.5249, -1.1081, 0.0725,
  27820. 0.0021],
  27821. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  27822. 0.2237],
  27823. [ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  27824. 0.1982],
  27825. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  27826. 0.2314]]], device='cuda:0')
  27827. loss_train_step before backward: tensor(0.0093, device='cuda:0', grad_fn=<MseLossBackward>)
  27828. loss_train_step after backward: tensor(0.0093, device='cuda:0', grad_fn=<MseLossBackward>)
  27829. loss_train: 0.4800864914432168
  27830. step: 24
  27831. running loss: 0.020003603810134035
  27832.  
  27833. Train Steps: 24/90 Loss: 0.0200 torch.Size([8, 600, 800])
  27834. torch.Size([8, 8])
  27835. tensor([[0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  27836. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  27837. [0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915],
  27838. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  27839. [0.6200, 0.4070, 0.8938, 0.4183, 0.3538, 0.4567, 0.6175, 0.5400],
  27840. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  27841. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103],
  27842. [0.6107, 0.4050, 0.8700, 0.4850, 0.4470, 0.4848, 0.5043, 0.5431]],
  27843. device='cuda:0', dtype=torch.float64)
  27844. predictions are: tensor([[ 0.2778, -0.6069, 1.9192, -0.2346, -0.2136, -0.9693, 1.0890, 0.4038],
  27845. [ 0.6852, -0.3778, 1.5858, 0.2068, -0.3921, -0.0105, 1.0698, 0.2575],
  27846. [ 0.4798, -0.4860, 1.8392, -0.2396, -0.4881, -0.8281, 0.6195, 0.1020],
  27847. [ 0.6741, -0.3266, 1.7744, -0.3613, -0.5465, -0.4756, 0.5234, 0.2343],
  27848. [ 0.3450, -0.5909, 1.8070, -0.4339, -0.5138, -0.2004, 0.6149, 0.1366],
  27849. [ 0.2770, -0.5442, 1.5616, -0.4305, -0.5066, -0.8888, 0.0636, 0.2526],
  27850. [ 0.6650, -0.3418, 1.4621, -0.8721, -0.5571, -0.4428, 0.4900, 0.1761],
  27851. [ 0.5881, -0.3967, 1.6592, -0.0824, -0.1299, 0.0190, 0.0928, 0.1560]],
  27852. device='cuda:0', grad_fn=<AddmmBackward>)
  27853. landmarks are: tensor([[[ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  27854. 0.3692],
  27855. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  27856. 0.3745],
  27857. [ 0.6148, -0.3918, 1.8942, -0.1920, -0.5423, -0.8002, 0.6414,
  27858. -0.0156],
  27859. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  27860. 0.1544],
  27861. [ 0.5778, -0.4061, 1.8423, -0.3537, -0.6520, -0.1766, 0.5663,
  27862. 0.2083],
  27863. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  27864. 0.2116],
  27865. [ 0.5886, -0.3784, 1.4554, -0.9079, -0.6577, -0.4845, 0.3440,
  27866. 0.0712],
  27867. [ 0.5351, -0.4153, 1.7326, -0.0457, -0.2214, -0.0466, 0.0434,
  27868. 0.2228]]], device='cuda:0')
  27869. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  27870. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  27871. loss_train: 0.49067305121570826
  27872. step: 25
  27873. running loss: 0.01962692204862833
  27874. Train Steps: 25/90 Loss: 0.0196 torch.Size([8, 600, 800])
  27875. torch.Size([8, 8])
  27876. tensor([[0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  27877. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  27878. [0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  27879. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  27880. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  27881. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  27882. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  27883. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285]],
  27884. device='cuda:0', dtype=torch.float64)
  27885. predictions are: tensor([[ 0.6417, -0.3648, 1.6992, -0.2418, -0.0921, -0.0855, 0.3235, 0.2546],
  27886. [ 0.6611, -0.3901, 1.7823, -0.1001, -0.4637, 0.1033, 1.0566, 0.1444],
  27887. [ 0.7788, -0.2877, 1.6923, -0.0969, -0.2912, -0.0103, 0.4486, 0.0481],
  27888. [ 0.7775, -0.2282, 1.7290, -0.1277, -0.6033, -0.6896, 0.4119, 0.3582],
  27889. [ 0.5787, -0.3499, 1.5670, 0.1464, -0.5430, -0.6805, 0.3149, 0.4437],
  27890. [ 0.7507, -0.3013, 1.6025, -0.4169, -0.5600, -0.2327, 0.2022, 0.0216],
  27891. [-1.5653, -1.8225, 1.9168, -1.0289, -0.1499, -1.0868, 1.0415, 0.2593],
  27892. [ 0.8505, -0.2690, 1.6382, 0.1561, -0.4971, -0.1405, 0.8296, 0.0649]],
  27893. device='cuda:0', grad_fn=<AddmmBackward>)
  27894. landmarks are: tensor([[[ 5.5052e-01, -4.2071e-01, 1.7095e+00, -5.3426e-02, -5.0936e-02,
  27895. 1.0502e-01, 3.8730e-01, 3.0069e-01],
  27896. [ 6.4212e-01, -3.6953e-01, 1.7788e+00, 2.3557e-02, -4.8453e-01,
  27897. 1.5443e-01, 1.1971e+00, 2.1955e-01],
  27898. [ 5.6143e-01, -4.5860e-01, 1.7587e+00, 6.4079e-02, -2.9982e-01,
  27899. 1.7122e-01, 4.9584e-01, 1.1701e-01],
  27900. [ 5.9024e-01, -3.4927e-01, 1.7961e+00, -7.2363e-03, -5.9423e-01,
  27901. -5.6151e-01, 3.1801e-01, 3.1609e-01],
  27902. [ 6.0554e-01, -3.3934e-01, 1.6575e+00, 2.5450e-01, -5.9423e-01,
  27903. -5.4611e-01, 2.9492e-01, 4.7775e-01],
  27904. [ 5.2448e-01, -4.3610e-01, 1.5940e+00, -2.9207e-01, -5.4804e-01,
  27905. -9.1917e-02, 2.4319e-01, 5.0176e-02],
  27906. [-2.2859e+00, -2.2859e+00, 1.8423e+00, -9.6952e-01, -1.3233e-01,
  27907. -8.4634e-01, 1.1349e+00, 2.6764e-01],
  27908. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  27909. 4.6189e-04, 7.6203e-01, 1.5543e-01]]], device='cuda:0')
  27910. loss_train_step before backward: tensor(0.0227, device='cuda:0', grad_fn=<MseLossBackward>)
  27911. loss_train_step after backward: tensor(0.0227, device='cuda:0', grad_fn=<MseLossBackward>)
  27912. loss_train: 0.5133614921942353
  27913. step: 26
  27914. running loss: 0.019744672776701357
  27915. Train Steps: 26/90 Loss: 0.0197 torch.Size([8, 600, 800])
  27916. torch.Size([8, 8])
  27917. tensor([[0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  27918. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  27919. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  27920. [0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  27921. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  27922. [0.6289, 0.4081, 0.8720, 0.3487, 0.3900, 0.3183, 0.6703, 0.5376],
  27923. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  27924. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967]],
  27925. device='cuda:0', dtype=torch.float64)
  27926. predictions are: tensor([[ 0.4348, -0.5345, 1.8946, -0.7295, -0.4771, -0.7699, 0.7855, 0.1025],
  27927. [ 0.5123, -0.4724, 1.6877, -0.4641, -0.6370, -0.5252, 0.5698, 0.2832],
  27928. [ 0.5497, -0.4999, 1.5042, 0.1221, -0.5073, -0.1399, 0.8437, 0.0930],
  27929. [ 0.3297, -0.5854, 1.5203, 0.3082, -0.4449, -0.1237, 0.4385, 0.4445],
  27930. [ 0.6769, -0.3657, 1.7477, -0.1668, -0.0879, 0.0667, 0.3535, 0.1672],
  27931. [ 0.7711, -0.3086, 1.7944, -0.5775, -0.4388, -0.8960, 0.9241, 0.1388],
  27932. [ 0.2592, -0.5935, 1.7154, -0.2854, -0.5463, -0.3459, 0.0919, 0.3221],
  27933. [ 0.2919, -0.5843, 1.6723, -1.1340, -0.0278, -1.4489, 0.6213, 0.0186]],
  27934. device='cuda:0', grad_fn=<AddmmBackward>)
  27935. landmarks are: tensor([[[ 6.0779e-01, -4.0570e-01, 1.8134e+00, -7.3087e-01, -4.4988e-01,
  27936. -7.3857e-01, 6.2979e-01, 1.3903e-01],
  27937. [ 5.7610e-01, -3.9661e-01, 1.6171e+00, -4.8453e-01, -6.3464e-01,
  27938. -4.6913e-01, 4.7390e-01, 2.9299e-01],
  27939. [ 6.2895e-01, -4.3934e-01, 1.3977e+00, 3.7768e-01, -5.1339e-01,
  27940. -4.5727e-02, 1.0984e+00, 1.8214e-01],
  27941. [ 6.1184e-01, -3.9831e-01, 1.5824e+00, 3.4688e-01, -4.2679e-01,
  27942. -6.8822e-02, 3.4688e-01, 5.3934e-01],
  27943. [ 5.5381e-01, -4.1386e-01, 1.7557e+00, -1.8430e-01, -4.5897e-02,
  27944. 1.2417e-01, 4.2194e-01, 2.8530e-01],
  27945. [ 6.1907e-01, -4.0082e-01, 1.7420e+00, -6.7528e-01, -4.8453e-01,
  27946. -8.1555e-01, 8.1006e-01, 1.9744e-01],
  27947. [ 5.5525e-01, -3.9923e-01, 1.7557e+00, -2.6898e-01, -4.9030e-01,
  27948. -2.6898e-01, 5.4227e-02, 4.1446e-01],
  27949. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  27950. -1.5161e+00, 5.8660e-01, 8.0947e-03]]], device='cuda:0')
  27951. loss_train_step before backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  27952. loss_train_step after backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  27953. loss_train: 0.5262837493792176
  27954. step: 27
  27955. running loss: 0.019491990717748802
  27956. Train Steps: 27/90 Loss: 0.0195 torch.Size([8, 600, 800])
  27957. torch.Size([8, 8])
  27958. tensor([[0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  27959. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  27960. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  27961. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  27962. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  27963. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  27964. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  27965. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869]],
  27966. device='cuda:0', dtype=torch.float64)
  27967. predictions are: tensor([[ 5.9047e-01, -4.3015e-01, 1.2829e+00, -8.2089e-01, -6.3280e-01,
  27968. -8.4250e-01, 3.8176e-01, -1.2932e-03],
  27969. [ 4.8052e-01, -4.9887e-01, 1.3317e+00, -1.0921e+00, -2.2815e-01,
  27970. -1.4085e+00, 6.0268e-01, 1.1726e-01],
  27971. [ 3.5900e-01, -5.5937e-01, 1.1690e+00, -1.2250e+00, -3.4386e-01,
  27972. -1.1243e+00, 8.3362e-01, 2.8056e-01],
  27973. [ 5.8892e-01, -4.3297e-01, 1.7712e+00, 4.5259e-01, -3.8018e-01,
  27974. 1.1718e-01, 3.4146e-01, 2.2360e-01],
  27975. [-5.7707e-02, -8.8170e-01, 1.5893e+00, -9.8783e-01, -4.7708e-01,
  27976. -9.3724e-01, 8.6913e-01, 4.6581e-02],
  27977. [ 6.0177e-01, -4.4187e-01, 1.8321e+00, 1.1511e-01, -1.2282e-01,
  27978. 4.9209e-02, 3.9132e-01, 3.2597e-01],
  27979. [ 3.7568e-01, -5.4407e-01, 1.9095e+00, -1.6609e-01, -6.2486e-01,
  27980. -3.4410e-01, 4.6614e-01, 3.1886e-01],
  27981. [ 8.9065e-01, -2.2668e-01, 1.8704e+00, -6.2750e-01, -2.4321e-01,
  27982. -1.2563e+00, 6.0711e-01, 7.1932e-02]], device='cuda:0',
  27983. grad_fn=<AddmmBackward>)
  27984. landmarks are: tensor([[[ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  27985. 0.0141],
  27986. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  27987. 0.1005],
  27988. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  27989. 0.2083],
  27990. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  27991. 0.2048],
  27992. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  27993. -0.0220],
  27994. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  27995. 0.3087],
  27996. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  27997. 0.1852],
  27998. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  27999. -0.0368]]], device='cuda:0')
  28000. loss_train_step before backward: tensor(0.0293, device='cuda:0', grad_fn=<MseLossBackward>)
  28001. loss_train_step after backward: tensor(0.0293, device='cuda:0', grad_fn=<MseLossBackward>)
  28002. loss_train: 0.5556024992838502
  28003. step: 28
  28004. running loss: 0.019842946402994648
  28005.  
  28006. Train Steps: 28/90 Loss: 0.0198 torch.Size([8, 600, 800])
  28007. torch.Size([8, 8])
  28008. tensor([[0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  28009. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  28010. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  28011. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  28012. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  28013. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  28014. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  28015. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507]],
  28016. device='cuda:0', dtype=torch.float64)
  28017. predictions are: tensor([[ 0.9783, -0.1393, 1.6980, -0.1290, -0.5966, -0.2572, 0.4469, 0.3263],
  28018. [ 1.0109, -0.1533, 1.7835, 0.1568, -0.2468, 0.1617, 0.6071, 0.1030],
  28019. [ 1.0725, -0.1292, 1.8002, -0.4632, -0.6134, -0.8617, 0.7768, 0.0539],
  28020. [ 1.0948, -0.0996, 1.6784, 0.3902, -0.3171, -0.0440, 0.3689, 0.1001],
  28021. [-2.1774, -2.1930, 1.7331, -1.1181, 0.0143, -1.2074, 0.8685, 0.2866],
  28022. [-2.1275, -2.1613, 0.9271, -1.1838, -0.4288, -1.2942, 0.1119, 0.3530],
  28023. [ 1.1153, -0.1008, 1.8017, 0.0431, -0.3620, 0.0071, 0.4366, -0.0337],
  28024. [ 0.8060, -0.2648, 1.0662, -1.2371, -0.4700, -1.2497, 0.5248, 0.1688]],
  28025. device='cuda:0', grad_fn=<AddmmBackward>)
  28026. landmarks are: tensor([[[ 5.5924e-01, -3.9561e-01, 1.5543e+00, -2.4557e-01, -5.8845e-01,
  28027. -1.6890e-01, 1.3922e-01, 3.9681e-01],
  28028. [ 5.4496e-01, -4.7305e-01, 1.7420e+00, 1.3720e-01, -1.9186e-01,
  28029. 2.6139e-01, 4.9757e-01, 7.6435e-02],
  28030. [ 5.7771e-01, -4.4157e-01, 1.7044e+00, -5.8275e-01, -5.9618e-01,
  28031. -8.3610e-01, 4.8621e-01, 1.9626e-01],
  28032. [ 5.1928e-01, -4.6990e-01, 1.5767e+00, 4.0077e-01, -2.4203e-01,
  28033. 7.7444e-02, 1.1776e-01, -6.1038e-02],
  28034. [-2.2859e+00, -2.2859e+00, 1.7557e+00, -1.1466e+00, 8.7067e-02,
  28035. -1.0773e+00, 1.1239e+00, 2.7833e-01],
  28036. [-2.2859e+00, -2.2859e+00, 8.0331e-01, -1.1250e+00, -3.8637e-01,
  28037. -1.3082e+00, 1.1262e-01, 4.5430e-01],
  28038. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  28039. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  28040. [ 5.1853e-01, -4.2517e-01, 9.6467e-01, -1.2928e+00, -4.7875e-01,
  28041. -1.2390e+00, 2.6170e-01, 2.5757e-01]]], device='cuda:0')
  28042. loss_train_step before backward: tensor(0.0428, device='cuda:0', grad_fn=<MseLossBackward>)
  28043. loss_train_step after backward: tensor(0.0428, device='cuda:0', grad_fn=<MseLossBackward>)
  28044. loss_train: 0.5983591759577394
  28045. step: 29
  28046. running loss: 0.020633075033025496
  28047. Train Steps: 29/90 Loss: 0.0206 torch.Size([8, 600, 800])
  28048. torch.Size([8, 8])
  28049. tensor([[0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  28050. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  28051. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  28052. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  28053. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  28054. [0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  28055. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  28056. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679]],
  28057. device='cuda:0', dtype=torch.float64)
  28058. predictions are: tensor([[ 0.5075, -0.5088, 1.7788, -0.1351, -0.1265, -0.0524, 0.2179, 0.0959],
  28059. [-0.2226, -0.9488, 1.6794, -1.3423, 0.1735, -1.5009, 1.0534, 0.2728],
  28060. [ 0.4128, -0.5544, 1.1306, -1.1477, -0.6543, -0.7419, 0.3301, 0.0285],
  28061. [ 0.5527, -0.3928, 1.7188, -0.1665, -0.5780, -0.7781, 0.2299, 0.3728],
  28062. [ 0.6418, -0.4208, 1.8075, 0.0507, -0.4922, 0.0938, 0.3359, 0.1123],
  28063. [ 0.7886, -0.3359, 1.8696, -0.5041, -0.4656, -0.9213, 0.8079, 0.0993],
  28064. [ 0.9940, -0.1880, 1.8234, 0.1831, -0.6006, -0.5426, 0.5605, 0.0328],
  28065. [ 0.3124, -0.6318, 1.6706, 0.0678, -0.3578, 0.2999, 0.9073, 0.3424]],
  28066. device='cuda:0', grad_fn=<AddmmBackward>)
  28067. landmarks are: tensor([[[ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  28068. -0.0039],
  28069. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  28070. 0.2142],
  28071. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  28072. 0.0622],
  28073. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  28074. 0.3778],
  28075. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  28076. 0.0663],
  28077. [ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  28078. 0.0539],
  28079. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  28080. -0.0957],
  28081. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  28082. 0.3371]]], device='cuda:0')
  28083. loss_train_step before backward: tensor(0.0240, device='cuda:0', grad_fn=<MseLossBackward>)
  28084. loss_train_step after backward: tensor(0.0240, device='cuda:0', grad_fn=<MseLossBackward>)
  28085. loss_train: 0.6223869854584336
  28086. step: 30
  28087. running loss: 0.020746232848614453
  28088. Train Steps: 30/90 Loss: 0.0207 torch.Size([8, 600, 800])
  28089. torch.Size([8, 8])
  28090. tensor([[0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  28091. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  28092. [0.6339, 0.4081, 0.8425, 0.5417, 0.3850, 0.4833, 0.7335, 0.5760],
  28093. [0.6226, 0.4103, 0.8575, 0.3450, 0.4388, 0.2067, 0.5787, 0.5383],
  28094. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  28095. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  28096. [0.6163, 0.4006, 0.8788, 0.4683, 0.3663, 0.4883, 0.5887, 0.5017],
  28097. [0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220]],
  28098. device='cuda:0', dtype=torch.float64)
  28099. predictions are: tensor([[ 0.5228, -0.4469, 1.4481, -1.1311, -0.2062, -1.3879, 0.5930, 0.1343],
  28100. [ 0.7055, -0.3875, 1.8804, -0.0432, -0.2867, 0.0243, 0.3167, 0.0265],
  28101. [ 0.6936, -0.4046, 1.7164, 0.3293, -0.4862, -0.0240, 1.1612, 0.2557],
  28102. [ 0.7628, -0.2640, 1.8340, -0.6504, -0.2326, -1.2022, 0.4564, 0.2166],
  28103. [-0.6807, -1.2229, 1.4377, -0.8805, -0.5891, -0.6684, 0.4366, 0.2792],
  28104. [ 0.5615, -0.4705, 1.7807, 0.2131, -0.3258, 0.1174, 0.3444, 0.0610],
  28105. [ 0.6153, -0.4303, 1.8371, -0.0601, -0.5939, -0.0201, 0.5271, 0.1234],
  28106. [ 0.4692, -0.5014, 1.0312, -1.2795, -0.2998, -1.5233, 0.2746, 0.1054]],
  28107. device='cuda:0', grad_fn=<AddmmBackward>)
  28108. landmarks are: tensor([[[ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  28109. 0.1850],
  28110. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  28111. 0.0051],
  28112. [ 0.6421, -0.4008, 1.6055, 0.2160, -0.5076, -0.0534, 1.1020,
  28113. 0.3745],
  28114. [ 0.5898, -0.3908, 1.6748, -0.6924, -0.2594, -1.3313, 0.3873,
  28115. 0.2006],
  28116. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  28117. 0.3469],
  28118. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  28119. 0.0467],
  28120. [ 0.5609, -0.4354, 1.7730, -0.1227, -0.5942, -0.0303, 0.4335,
  28121. 0.0313],
  28122. [ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  28123. 0.1253]]], device='cuda:0')
  28124. loss_train_step before backward: tensor(0.0424, device='cuda:0', grad_fn=<MseLossBackward>)
  28125. loss_train_step after backward: tensor(0.0424, device='cuda:0', grad_fn=<MseLossBackward>)
  28126. loss_train: 0.6647640662267804
  28127. step: 31
  28128. running loss: 0.021444002136347756
  28129. Train Steps: 31/90 Loss: 0.0214 torch.Size([8, 600, 800])
  28130. torch.Size([8, 8])
  28131. tensor([[0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  28132. [0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  28133. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  28134. [0.6264, 0.4055, 0.8425, 0.2767, 0.4425, 0.2767, 0.7050, 0.5586],
  28135. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  28136. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  28137. [0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  28138. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467]],
  28139. device='cuda:0', dtype=torch.float64)
  28140. predictions are: tensor([[ 0.4506, -0.5275, 1.7686, -0.2940, -0.5330, -0.4536, 0.3733, 0.2598],
  28141. [ 0.5407, -0.5005, 1.7940, 0.1318, -0.0543, 0.2764, 0.6289, 0.1438],
  28142. [ 0.3794, -0.5269, 1.5145, -0.7211, -0.1765, -1.1368, 0.3719, 0.3084],
  28143. [ 0.4169, -0.5643, 1.6879, -0.9827, -0.1545, -1.1282, 0.9710, 0.1931],
  28144. [ 0.3583, -0.5941, 1.9093, -0.4784, -0.4752, -0.8796, 0.5574, 0.1085],
  28145. [ 0.6627, -0.3939, 1.6628, -0.2187, -0.5922, -0.3117, 0.2554, 0.1885],
  28146. [ 0.7224, -0.3879, 1.3228, -1.0733, -0.4802, -1.0500, 0.5118, -0.1316],
  28147. [ 0.6318, -0.4254, 1.6359, -0.5419, -0.6135, -0.3646, 0.5188, 0.1461]],
  28148. device='cuda:0', grad_fn=<AddmmBackward>)
  28149. landmarks are: tensor([[[ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  28150. 0.3238],
  28151. [ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  28152. 0.1236],
  28153. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  28154. 0.4008],
  28155. [ 0.6075, -0.4129, 1.6055, -1.0080, -0.2420, -1.0080, 0.9704,
  28156. 0.2944],
  28157. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  28158. 0.2442],
  28159. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  28160. 0.3559],
  28161. [ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  28162. -0.0108],
  28163. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  28164. 0.2391]]], device='cuda:0')
  28165. loss_train_step before backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  28166. loss_train_step after backward: tensor(0.0130, device='cuda:0', grad_fn=<MseLossBackward>)
  28167. loss_train: 0.6778084067627788
  28168. step: 32
  28169. running loss: 0.021181512711336836
  28170.  
  28171. Train Steps: 32/90 Loss: 0.0212 torch.Size([8, 600, 800])
  28172. torch.Size([8, 8])
  28173. tensor([[0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  28174. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  28175. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  28176. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  28177. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  28178. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  28179. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  28180. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196]],
  28181. device='cuda:0', dtype=torch.float64)
  28182. predictions are: tensor([[ 0.7188, -0.3367, 1.8920, -0.6707, -0.4313, -1.0907, 0.6629, 0.0770],
  28183. [ 0.6263, -0.4435, 1.7797, 0.0100, -0.4408, -0.1267, 0.4634, -0.0449],
  28184. [ 0.7959, -0.2640, 1.6776, 0.2334, -0.4097, -0.1032, 0.5011, 0.1118],
  28185. [ 0.5462, -0.4585, 1.5470, -1.0173, -0.4050, -1.0583, 0.4912, -0.0234],
  28186. [ 0.5802, -0.4418, 0.9874, -1.2851, -0.3965, -1.1792, 0.4044, 0.1651],
  28187. [ 0.6268, -0.4222, 1.7376, -0.0928, -0.1368, 0.0947, 0.3983, 0.1281],
  28188. [-2.0925, -2.1734, 1.2965, -0.9992, -0.5074, -0.9629, 0.3409, 0.2234],
  28189. [ 0.7433, -0.2898, 1.7182, -0.0200, -0.2876, -0.9544, 0.3056, 0.4590]],
  28190. device='cuda:0', grad_fn=<AddmmBackward>)
  28191. landmarks are: tensor([[[ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  28192. 0.1544],
  28193. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  28194. 0.0313],
  28195. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  28196. 0.2391],
  28197. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  28198. 0.0807],
  28199. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  28200. 0.2576],
  28201. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  28202. 0.2622],
  28203. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  28204. 0.2699],
  28205. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  28206. 0.5762]]], device='cuda:0')
  28207. loss_train_step before backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  28208. loss_train_step after backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  28209. loss_train: 0.6841176045127213
  28210. step: 33
  28211. running loss: 0.020730836500385492
  28212. Train Steps: 33/90 Loss: 0.0207 torch.Size([8, 600, 800])
  28213. torch.Size([8, 8])
  28214. tensor([[0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  28215. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  28216. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  28217. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  28218. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  28219. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  28220. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  28221. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019]],
  28222. device='cuda:0', dtype=torch.float64)
  28223. predictions are: tensor([[ 0.6255, -0.3592, 1.6984, -0.2594, -0.6196, -0.3773, 0.0322, 0.2342],
  28224. [-1.9203, -2.0523, 1.4849, -1.2326, 0.1044, -1.1637, 0.8986, 0.2863],
  28225. [ 0.6367, -0.3641, 1.5570, -1.0202, -0.1333, -1.3515, 0.3457, 0.0102],
  28226. [ 0.5406, -0.4691, 1.7121, -0.8162, -0.1013, -0.9956, 0.8345, 0.1929],
  28227. [ 0.6415, -0.4127, 1.3976, 0.2055, -0.5793, 0.0214, 0.5662, 0.1494],
  28228. [ 0.6824, -0.3714, 1.7048, 0.0315, -0.4587, 0.4051, 0.4384, 0.1293],
  28229. [ 0.6387, -0.3973, 1.3418, -1.1451, -0.2160, -1.4084, 0.4027, 0.0928],
  28230. [ 0.6806, -0.3924, 1.7546, -0.0103, -0.6495, -0.3794, 0.3367, 0.0941]],
  28231. device='cuda:0', grad_fn=<AddmmBackward>)
  28232. landmarks are: tensor([[[ 6.0722e-01, -3.2394e-01, 1.8423e+00, -3.5366e-01, -4.9607e-01,
  28233. -3.9215e-01, 2.0831e-01, 1.8522e-01],
  28234. [-2.2859e+00, -2.2859e+00, 1.6517e+00, -1.2620e+00, 2.1409e-01,
  28235. -1.1928e+00, 1.1166e+00, 2.4627e-01],
  28236. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  28237. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  28238. [ 6.4048e-01, -3.6712e-01, 1.8249e+00, -1.0080e+00, 1.7783e-02,
  28239. -9.6182e-01, 1.1422e+00, 2.7299e-01],
  28240. [ 6.2895e-01, -4.3934e-01, 1.3977e+00, 3.7768e-01, -5.1339e-01,
  28241. -4.5727e-02, 1.0984e+00, 1.8214e-01],
  28242. [ 5.9902e-01, -4.2556e-01, 1.7499e+00, -3.8029e-02, -3.9792e-01,
  28243. 3.3149e-01, 6.5289e-01, 1.1594e-01],
  28244. [ 6.0918e-01, -4.1432e-01, 1.4901e+00, -1.2467e+00, -1.2079e-01,
  28245. -1.4006e+00, 6.5866e-01, 1.4673e-01],
  28246. [ 6.3718e-01, -4.1286e-01, 1.8942e+00, -7.6520e-02, -6.1732e-01,
  28247. -4.7683e-01, 6.9989e-01, 3.2524e-02]]], device='cuda:0')
  28248. loss_train_step before backward: tensor(0.0209, device='cuda:0', grad_fn=<MseLossBackward>)
  28249. loss_train_step after backward: tensor(0.0209, device='cuda:0', grad_fn=<MseLossBackward>)
  28250. loss_train: 0.7050670147873461
  28251. step: 34
  28252. running loss: 0.020737265140804297
  28253. Train Steps: 34/90 Loss: 0.0207 torch.Size([8, 600, 800])
  28254. torch.Size([8, 8])
  28255. tensor([[0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  28256. [0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103],
  28257. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  28258. [0.6093, 0.3990, 0.8400, 0.4333, 0.3688, 0.4633, 0.5560, 0.5656],
  28259. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  28260. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  28261. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  28262. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167]],
  28263. device='cuda:0', dtype=torch.float64)
  28264. predictions are: tensor([[ 0.4029, -0.5921, 1.6903, 0.1829, -0.3016, 0.2530, 0.2826, 0.0848],
  28265. [ 0.5061, -0.4869, 1.8188, -0.2548, -0.6397, -0.0794, 0.3478, 0.0932],
  28266. [ 0.5058, -0.5134, 1.2198, -1.2538, -0.3336, -1.4177, 0.3494, 0.0629],
  28267. [ 0.5262, -0.4614, 1.6594, -0.1469, -0.6424, -0.1302, 0.2515, 0.2958],
  28268. [ 0.5180, -0.4978, 1.7588, 0.0278, -0.3378, 0.0622, 0.4041, 0.2559],
  28269. [ 0.5641, -0.4334, 1.6918, -0.9860, -0.2200, -1.3162, 0.6009, -0.0315],
  28270. [ 0.4836, -0.5410, 1.7605, -1.1247, 0.1414, -1.2232, 1.1395, 0.1591],
  28271. [ 0.5724, -0.4363, 1.2401, -0.8151, -0.4982, -0.9966, 0.3776, 0.4530]],
  28272. device='cuda:0', grad_fn=<AddmmBackward>)
  28273. landmarks are: tensor([[[ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  28274. 0.0082],
  28275. [ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  28276. 0.0712],
  28277. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  28278. 0.1082],
  28279. [ 0.5283, -0.4429, 1.5940, -0.2844, -0.5827, -0.1458, 0.2823,
  28280. 0.3267],
  28281. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  28282. 0.3084],
  28283. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  28284. -0.0209],
  28285. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  28286. 0.2142],
  28287. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  28288. 0.5624]]], device='cuda:0')
  28289. loss_train_step before backward: tensor(0.0056, device='cuda:0', grad_fn=<MseLossBackward>)
  28290. loss_train_step after backward: tensor(0.0056, device='cuda:0', grad_fn=<MseLossBackward>)
  28291. loss_train: 0.7106758425943553
  28292. step: 35
  28293. running loss: 0.020305024074124437
  28294. Train Steps: 35/90 Loss: 0.0203 torch.Size([8, 600, 800])
  28295. torch.Size([8, 8])
  28296. tensor([[0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  28297. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  28298. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  28299. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  28300. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  28301. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  28302. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  28303. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578]],
  28304. device='cuda:0', dtype=torch.float64)
  28305. predictions are: tensor([[ 0.7175, -0.3182, 1.5601, -1.1531, -0.1840, -1.2262, 0.5677, -0.0161],
  28306. [ 0.7583, -0.3484, 1.7435, 0.2148, -0.4061, 0.0851, 0.4845, -0.0334],
  28307. [ 0.7261, -0.2570, 1.2147, -0.6802, -0.0970, -1.2256, 0.2552, 0.4634],
  28308. [-1.5970, -1.8209, 0.9663, -1.2563, -0.2124, -1.3566, 0.3545, 0.4310],
  28309. [ 0.6751, -0.3353, 1.3610, -1.0378, -0.1904, -1.4201, 0.3632, 0.0626],
  28310. [ 0.9350, -0.1898, 1.9036, -0.2485, -0.6079, -0.5402, 0.5454, 0.1273],
  28311. [ 0.9440, -0.1748, 1.8448, 0.0834, -0.4474, 0.3213, 0.6020, 0.1024],
  28312. [-1.9158, -2.0474, 1.1735, -1.1139, -0.5103, -1.0042, 0.2081, 0.2710]],
  28313. device='cuda:0', grad_fn=<AddmmBackward>)
  28314. landmarks are: tensor([[[ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  28315. -0.0369],
  28316. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  28317. 0.0159],
  28318. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  28319. 0.5624],
  28320. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  28321. 0.3623],
  28322. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  28323. -0.0168],
  28324. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  28325. 0.1005],
  28326. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  28327. 0.1390],
  28328. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  28329. 0.2905]]], device='cuda:0')
  28330. loss_train_step before backward: tensor(0.0280, device='cuda:0', grad_fn=<MseLossBackward>)
  28331. loss_train_step after backward: tensor(0.0280, device='cuda:0', grad_fn=<MseLossBackward>)
  28332. loss_train: 0.7386775049380958
  28333. step: 36
  28334. running loss: 0.02051881958161377
  28335.  
  28336. Train Steps: 36/90 Loss: 0.0205 torch.Size([8, 600, 800])
  28337. torch.Size([8, 8])
  28338. tensor([[0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  28339. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  28340. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  28341. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  28342. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  28343. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  28344. [0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  28345. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679]],
  28346. device='cuda:0', dtype=torch.float64)
  28347. predictions are: tensor([[ 0.7026, -0.3475, 1.7143, -0.5126, -0.6330, -0.2998, 0.4079, 0.1759],
  28348. [ 0.4452, -0.4884, 1.7904, -0.2999, -0.4580, -0.4563, 0.1168, 0.2451],
  28349. [ 0.8208, -0.2664, 1.4383, -1.0448, -0.6861, -0.8196, 0.1715, 0.0891],
  28350. [ 0.6975, -0.3649, 1.3709, 0.1070, -0.4919, -0.1339, 0.7419, 0.1754],
  28351. [ 0.6489, -0.3556, 1.5818, 0.2273, -0.1254, -0.3050, 0.1784, 0.2450],
  28352. [ 0.7435, -0.3313, 1.8172, -0.2670, -0.4164, -0.4652, 0.8118, 0.1959],
  28353. [ 0.4413, -0.4983, 1.7393, -0.3508, -0.1120, -0.1085, 0.3081, 0.1528],
  28354. [-1.9452, -2.0874, 1.6159, -1.3266, 0.2288, -1.4092, 1.0428, 0.2691]],
  28355. device='cuda:0', grad_fn=<AddmmBackward>)
  28356. landmarks are: tensor([[[ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  28357. 0.2083],
  28358. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  28359. 0.3087],
  28360. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  28361. 0.2776],
  28362. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  28363. 0.1928],
  28364. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  28365. 0.2997],
  28366. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  28367. 0.4386],
  28368. [ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  28369. 0.2930],
  28370. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  28371. 0.3371]]], device='cuda:0')
  28372. loss_train_step before backward: tensor(0.0191, device='cuda:0', grad_fn=<MseLossBackward>)
  28373. loss_train_step after backward: tensor(0.0191, device='cuda:0', grad_fn=<MseLossBackward>)
  28374. loss_train: 0.7578194118104875
  28375. step: 37
  28376. running loss: 0.02048160572460777
  28377. Train Steps: 37/90 Loss: 0.0205 torch.Size([8, 600, 800])
  28378. torch.Size([8, 8])
  28379. tensor([[ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  28380. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  28381. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  28382. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  28383. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  28384. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  28385. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  28386. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000]],
  28387. device='cuda:0', dtype=torch.float64)
  28388. predictions are: tensor([[-2.1001, -2.2408, 1.2620, -1.2134, -0.3332, -1.1288, 0.4092, 0.1548],
  28389. [ 0.6518, -0.3524, 1.6998, -0.3598, -0.2870, 0.3224, 0.6301, 0.1420],
  28390. [ 0.7167, -0.2884, 1.6898, -0.2260, -0.4900, -0.6974, 0.2223, 0.3375],
  28391. [ 0.6266, -0.3632, 1.8030, -0.1496, -0.3881, -1.0460, 0.4562, 0.1622],
  28392. [ 0.4956, -0.4900, 1.2467, -1.3024, -0.3474, -1.1994, 0.6318, 0.1830],
  28393. [ 0.4585, -0.5079, 1.7557, -0.2600, -0.0559, 0.1161, 0.5975, 0.2690],
  28394. [ 0.6890, -0.3344, 1.5034, -0.6130, -0.4778, -1.0306, 0.1694, 0.3261],
  28395. [ 0.6072, -0.4055, 1.6764, -0.5149, -0.5742, -0.4923, 0.5001, 0.1026]],
  28396. device='cuda:0', grad_fn=<AddmmBackward>)
  28397. landmarks are: tensor([[[-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  28398. 0.1005],
  28399. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  28400. 0.0772],
  28401. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  28402. 0.4357],
  28403. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  28404. 0.1852],
  28405. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  28406. 0.2032],
  28407. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  28408. 0.2699],
  28409. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  28410. 0.4374],
  28411. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  28412. 0.0236]]], device='cuda:0')
  28413. loss_train_step before backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  28414. loss_train_step after backward: tensor(0.0116, device='cuda:0', grad_fn=<MseLossBackward>)
  28415. loss_train: 0.7694539255462587
  28416. step: 38
  28417. running loss: 0.020248787514375227
  28418. Train Steps: 38/90 Loss: 0.0202 torch.Size([8, 600, 800])
  28419. torch.Size([8, 8])
  28420. tensor([[0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  28421. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  28422. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  28423. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  28424. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  28425. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  28426. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  28427. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209]],
  28428. device='cuda:0', dtype=torch.float64)
  28429. predictions are: tensor([[ 0.3345, -0.5815, 1.6559, -0.2002, -0.0839, -0.0443, 0.3847, 0.3240],
  28430. [ 0.6685, -0.3828, 1.5534, -1.0486, -0.4268, -0.9877, 0.7333, 0.1445],
  28431. [ 0.6851, -0.3588, 1.4897, -1.1548, -0.4079, -1.0997, 0.4530, 0.0514],
  28432. [ 0.4126, -0.5595, 1.6417, -0.2154, -0.5463, -0.0265, 0.4602, 0.1108],
  28433. [ 0.5710, -0.4018, 1.6016, -0.0976, -0.4236, -0.0688, 0.2664, 0.2464],
  28434. [ 0.6039, -0.3627, 1.6929, -0.2127, -0.5257, -0.8801, 0.3550, 0.1962],
  28435. [-1.8773, -2.0152, 1.4880, -1.3270, 0.1654, -1.2752, 0.8369, 0.2394],
  28436. [ 0.5513, -0.3570, 1.5899, -0.3356, -0.2179, -1.0885, 0.2876, 0.5012]],
  28437. device='cuda:0', grad_fn=<AddmmBackward>)
  28438. landmarks are: tensor([[[ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  28439. 0.3087],
  28440. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  28441. 0.1931],
  28442. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  28443. 0.0851],
  28444. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  28445. -0.0534],
  28446. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  28447. 0.2589],
  28448. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  28449. 0.1852],
  28450. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  28451. 0.3104],
  28452. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  28453. 0.5822]]], device='cuda:0')
  28454. loss_train_step before backward: tensor(0.0153, device='cuda:0', grad_fn=<MseLossBackward>)
  28455. loss_train_step after backward: tensor(0.0153, device='cuda:0', grad_fn=<MseLossBackward>)
  28456. loss_train: 0.7847062242217362
  28457. step: 39
  28458. running loss: 0.020120672415941954
  28459. Train Steps: 39/90 Loss: 0.0201 torch.Size([8, 600, 800])
  28460. torch.Size([8, 8])
  28461. tensor([[0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  28462. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  28463. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  28464. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  28465. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  28466. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  28467. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  28468. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510]],
  28469. device='cuda:0', dtype=torch.float64)
  28470. predictions are: tensor([[ 0.7944, -0.2597, 1.6941, -0.7817, -0.3957, -1.1214, 0.3668, 0.0797],
  28471. [-1.2229, -1.5579, 1.2096, -0.8862, -0.5949, -0.8335, 0.0194, 0.3173],
  28472. [-1.9269, -2.0668, 1.0180, -1.3759, -0.3612, -1.2341, 0.1503, 0.2716],
  28473. [ 0.6871, -0.2951, 1.6941, 0.2017, -0.4402, -0.3049, 0.2864, 0.4204],
  28474. [ 0.6057, -0.3936, 1.8279, -0.9332, 0.0218, -1.2719, 0.9551, 0.2071],
  28475. [ 0.9779, -0.1799, 1.6772, 0.0201, -0.3361, 0.4483, 0.8435, 0.2974],
  28476. [ 0.6400, -0.3831, 1.8871, -0.6828, -0.3191, -0.5734, 0.8844, 0.1991],
  28477. [ 0.7648, -0.2619, 1.6307, 0.0055, -0.3844, -0.1027, 0.1083, 0.2771]],
  28478. device='cuda:0', grad_fn=<AddmmBackward>)
  28479. landmarks are: tensor([[[ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  28480. -0.0957],
  28481. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  28482. 0.2837],
  28483. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  28484. 0.1373],
  28485. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  28486. 0.3084],
  28487. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  28488. 0.2142],
  28489. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  28490. 0.3157],
  28491. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  28492. 0.2676],
  28493. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  28494. 0.2589]]], device='cuda:0')
  28495. loss_train_step before backward: tensor(0.0405, device='cuda:0', grad_fn=<MseLossBackward>)
  28496. loss_train_step after backward: tensor(0.0405, device='cuda:0', grad_fn=<MseLossBackward>)
  28497. loss_train: 0.8252143119461834
  28498. step: 40
  28499. running loss: 0.020630357798654585
  28500.  
  28501. Train Steps: 40/90 Loss: 0.0206 torch.Size([8, 600, 800])
  28502. torch.Size([8, 8])
  28503. tensor([[0.6109, 0.4041, 0.6975, 0.3167, 0.3513, 0.3383, 0.5153, 0.5319],
  28504. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  28505. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  28506. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750],
  28507. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  28508. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  28509. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  28510. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240]],
  28511. device='cuda:0', dtype=torch.float64)
  28512. predictions are: tensor([[ 0.2722, -0.6165, 1.1779, -0.8024, -0.6699, -0.6848, 0.0763, 0.2715],
  28513. [ 0.2924, -0.6367, 1.3922, -1.1740, -0.2910, -1.2150, 0.6039, 0.1700],
  28514. [ 0.3281, -0.5799, 1.9128, 0.0207, -0.1557, 0.4681, 0.6649, 0.3074],
  28515. [ 0.3481, -0.5868, 1.1737, -1.0323, -0.5273, -0.8910, 0.5458, 0.4523],
  28516. [ 0.2317, -0.6822, 1.8328, 0.0113, -0.2837, 0.2063, 0.6388, 0.2003],
  28517. [ 0.4696, -0.4915, 1.5757, -1.0361, -0.2425, -1.3144, 0.4999, 0.2187],
  28518. [ 0.2441, -0.6215, 1.0434, -1.0948, -0.4172, -1.3396, -0.0088, 0.3534],
  28519. [ 0.6824, -0.3667, 1.7853, -0.9849, -0.1111, -1.4141, 0.6500, 0.1578]],
  28520. device='cuda:0', grad_fn=<AddmmBackward>)
  28521. landmarks are: tensor([[[ 0.5359, -0.4193, 0.9358, -0.8232, -0.6635, -0.7232, 0.0943,
  28522. 0.1710],
  28523. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  28524. 0.1575],
  28525. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  28526. 0.2083],
  28527. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  28528. 0.3700],
  28529. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  28530. 0.1474],
  28531. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  28532. 0.2549],
  28533. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  28534. 0.2747],
  28535. [ 0.6088, -0.4015, 1.6113, -1.0696, -0.0861, -1.4545, 0.6051,
  28536. 0.1343]]], device='cuda:0')
  28537. loss_train_step before backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  28538. loss_train_step after backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  28539. loss_train: 0.843462482560426
  28540. step: 41
  28541. running loss: 0.02057225567220551
  28542. Train Steps: 41/90 Loss: 0.0206 torch.Size([8, 600, 800])
  28543. torch.Size([8, 8])
  28544. tensor([[0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  28545. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  28546. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  28547. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  28548. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  28549. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  28550. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  28551. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882]],
  28552. device='cuda:0', dtype=torch.float64)
  28553. predictions are: tensor([[ 0.4012, -0.5602, 1.1020, -1.4905, -0.3912, -1.1780, 0.3697, 0.3340],
  28554. [ 0.3519, -0.6377, 1.8958, -0.1771, -0.4805, -0.0822, 0.7601, 0.2015],
  28555. [ 0.7661, -0.3157, 1.7028, -0.8933, -0.5319, -0.5710, 0.5506, 0.2958],
  28556. [ 0.3787, -0.5236, 1.8381, 0.0948, -0.3877, -0.3379, 0.4612, 0.4892],
  28557. [ 0.3725, -0.5542, 0.9727, -1.3297, -0.2899, -1.4031, 0.1775, 0.5426],
  28558. [ 0.1261, -0.7136, 1.7445, 0.1966, -0.3572, -0.2723, 0.2821, 0.1150],
  28559. [ 0.5290, -0.4819, 1.8134, 0.0249, -0.4198, 0.0279, 0.8776, 0.1686],
  28560. [ 0.4397, -0.5016, 1.8540, -0.5343, -0.5032, -0.5813, 0.1569, 0.1158]],
  28561. device='cuda:0', grad_fn=<AddmmBackward>)
  28562. landmarks are: tensor([[[ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  28563. 0.2853],
  28564. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  28565. 0.0774],
  28566. [ 0.5814, -0.4003, 1.6575, -0.8694, -0.6289, -0.5692, 0.5374,
  28567. 0.2622],
  28568. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  28569. 0.3084],
  28570. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  28571. 0.3808],
  28572. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  28573. -0.0370],
  28574. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  28575. 0.1385],
  28576. [ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  28577. -0.0310]]], device='cuda:0')
  28578. loss_train_step before backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  28579. loss_train_step after backward: tensor(0.0174, device='cuda:0', grad_fn=<MseLossBackward>)
  28580. loss_train: 0.860898629296571
  28581. step: 42
  28582. running loss: 0.02049758641182312
  28583. Train Steps: 42/90 Loss: 0.0205 torch.Size([8, 600, 800])
  28584. torch.Size([8, 8])
  28585. tensor([[ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  28586. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  28587. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578],
  28588. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  28589. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617],
  28590. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  28591. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  28592. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175]],
  28593. device='cuda:0', dtype=torch.float64)
  28594. predictions are: tensor([[-1.6744, -1.8164, 1.6428, -1.1464, 0.1531, -1.0890, 1.0504, 0.3297],
  28595. [ 0.6633, -0.3424, 1.5168, -1.0733, -0.2207, -1.2959, 0.5642, 0.1678],
  28596. [-2.1848, -2.1812, 1.1882, -1.0478, -0.5552, -0.9504, 0.1036, 0.2840],
  28597. [ 0.5811, -0.4098, 1.1966, -1.0334, -0.6815, -0.6616, 0.3493, 0.1752],
  28598. [ 0.7715, -0.2316, 1.6568, 0.3646, -0.2515, 0.0227, 0.3323, 0.3487],
  28599. [ 0.6553, -0.3458, 1.7052, 0.3154, -0.5779, -0.2111, 0.3768, 0.2283],
  28600. [ 0.7520, -0.3007, 1.2283, -1.2327, -0.4260, -1.1571, 0.4222, 0.2272],
  28601. [ 0.6980, -0.3132, 1.0704, -1.2022, -0.4169, -1.3390, 0.2616, 0.2387]],
  28602. device='cuda:0', grad_fn=<AddmmBackward>)
  28603. landmarks are: tensor([[[-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  28604. 0.2463],
  28605. [ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  28606. -0.0370],
  28607. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  28608. 0.2905],
  28609. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  28610. 0.0622],
  28611. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  28612. 0.3084],
  28613. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  28614. 0.1544],
  28615. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  28616. 0.0213],
  28617. [ 0.5465, -0.4214, 0.9300, -1.2620, -0.3921, -1.3852, 0.2062,
  28618. 0.1043]]], device='cuda:0')
  28619. loss_train_step before backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  28620. loss_train_step after backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  28621. loss_train: 0.8787088342942297
  28622. step: 43
  28623. running loss: 0.02043508916963325
  28624. Train Steps: 43/90 Loss: 0.0204 torch.Size([8, 600, 800])
  28625. torch.Size([8, 8])
  28626. tensor([[0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  28627. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  28628. [0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  28629. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  28630. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  28631. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  28632. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  28633. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852]],
  28634. device='cuda:0', dtype=torch.float64)
  28635. predictions are: tensor([[ 0.0593, -0.7209, 1.4025, -0.7395, -0.5557, -1.0149, -0.0363, 0.1739],
  28636. [ 0.2105, -0.6398, 0.9159, -0.9487, -0.5745, -1.0085, 0.1048, 0.4227],
  28637. [ 0.5317, -0.4285, 1.8629, -0.3572, -0.4762, 0.0316, 0.7137, 0.3804],
  28638. [ 0.4177, -0.4962, 1.5345, -0.5597, -0.5811, -0.9179, 0.0925, 0.3951],
  28639. [ 0.6118, -0.4042, 1.9377, -0.8004, -0.4052, -0.8034, 0.7940, 0.1437],
  28640. [ 0.0240, -0.7626, 1.1786, -1.3303, -0.2676, -1.4906, 0.2640, 0.2023],
  28641. [ 0.5820, -0.4623, 1.8527, 0.0597, -0.4232, 0.3058, 1.2145, 0.1657],
  28642. [ 0.2763, -0.6095, 1.8244, 0.0415, -0.1050, -0.0060, 0.3189, 0.3642]],
  28643. device='cuda:0', grad_fn=<AddmmBackward>)
  28644. landmarks are: tensor([[[ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  28645. 0.2138],
  28646. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  28647. 0.4103],
  28648. [ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  28649. 0.5085],
  28650. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  28651. 0.4374],
  28652. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  28653. 0.1390],
  28654. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  28655. 0.1343],
  28656. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  28657. 0.2196],
  28658. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  28659. 0.4171]]], device='cuda:0')
  28660. loss_train_step before backward: tensor(0.0223, device='cuda:0', grad_fn=<MseLossBackward>)
  28661. loss_train_step after backward: tensor(0.0223, device='cuda:0', grad_fn=<MseLossBackward>)
  28662. loss_train: 0.9010163084603846
  28663. step: 44
  28664. running loss: 0.02047764337409965
  28665.  
  28666. Train Steps: 44/90 Loss: 0.0205 torch.Size([8, 600, 800])
  28667. torch.Size([8, 8])
  28668. tensor([[0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  28669. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  28670. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528],
  28671. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  28672. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  28673. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  28674. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  28675. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483]],
  28676. device='cuda:0', dtype=torch.float64)
  28677. predictions are: tensor([[ 0.8081, -0.2567, 1.7158, -0.0621, -0.3863, 0.1884, 0.6553, 0.2262],
  28678. [ 0.3466, -0.5509, 0.7081, -1.3252, -0.4496, -1.2155, 0.2184, 0.2836],
  28679. [-2.5157, -2.3895, 1.8121, -0.7981, -0.1205, -0.9275, 0.9323, 0.2574],
  28680. [ 0.4411, -0.4603, 1.7228, -0.2251, -0.3915, -0.2788, 0.1090, 0.1176],
  28681. [ 0.5141, -0.4182, 1.6298, -0.8154, -0.5195, -0.9728, 0.3624, 0.1820],
  28682. [ 0.7026, -0.3435, 1.6917, -0.4188, -0.5994, -0.5678, 0.6849, 0.2348],
  28683. [ 0.5526, -0.4045, 1.6131, -0.0275, -0.4721, 0.1363, 0.4688, 0.2287],
  28684. [ 0.6117, -0.3064, 1.5351, -0.2352, -0.5716, -0.6021, 0.0366, 0.4231]],
  28685. device='cuda:0', grad_fn=<AddmmBackward>)
  28686. landmarks are: tensor([[[ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  28687. 0.1236],
  28688. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  28689. 0.0712],
  28690. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  28691. 0.2676],
  28692. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  28693. -0.0220],
  28694. [ 0.5799, -0.4329, 1.7210, -0.7694, -0.5711, -0.8771, 0.3988,
  28695. 0.0774],
  28696. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  28697. 0.0697],
  28698. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  28699. 0.0688],
  28700. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  28701. 0.2468]]], device='cuda:0')
  28702. loss_train_step before backward: tensor(0.0107, device='cuda:0', grad_fn=<MseLossBackward>)
  28703. loss_train_step after backward: tensor(0.0107, device='cuda:0', grad_fn=<MseLossBackward>)
  28704. loss_train: 0.9117077724076807
  28705. step: 45
  28706. running loss: 0.020260172720170683
  28707. Train Steps: 45/90 Loss: 0.0203 torch.Size([8, 600, 800])
  28708. torch.Size([8, 8])
  28709. tensor([[0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  28710. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  28711. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  28712. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  28713. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  28714. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  28715. [0.6131, 0.4037, 0.6907, 0.2819, 0.3688, 0.2700, 0.5217, 0.5680],
  28716. [0.6082, 0.4042, 0.6975, 0.1917, 0.4100, 0.1983, 0.5502, 0.5578]],
  28717. device='cuda:0', dtype=torch.float64)
  28718. predictions are: tensor([[ 0.3473, -0.5753, 1.5471, -1.2589, -0.0220, -1.4570, 0.6313, 0.0374],
  28719. [ 0.3961, -0.5188, 1.5376, -1.2642, -0.3802, -1.0928, 0.6439, 0.0683],
  28720. [ 0.5461, -0.3509, 1.9025, 0.1118, -0.6093, -0.2064, 0.1833, 0.4084],
  28721. [ 0.5049, -0.4197, 1.1840, -1.0966, -0.3444, -1.0405, 0.4707, 0.5814],
  28722. [ 0.3431, -0.6076, 1.5917, 0.3166, -0.5506, 0.0278, 0.8716, 0.1111],
  28723. [ 0.4011, -0.5269, 1.8692, -0.4701, -0.7028, -0.4832, 0.3813, 0.0916],
  28724. [-0.0361, -0.7732, 0.9775, -0.9902, -0.5846, -0.9177, 0.0684, 0.3048],
  28725. [ 0.1723, -0.6870, 0.9510, -1.2858, -0.4434, -1.2211, 0.2540, 0.2577]],
  28726. device='cuda:0', grad_fn=<AddmmBackward>)
  28727. landmarks are: tensor([[[ 6.1241e-01, -4.0100e-01, 1.4381e+00, -1.3544e+00, -5.7275e-02,
  28728. -1.5546e+00, 5.5732e-01, -3.6943e-02],
  28729. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  28730. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  28731. [ 6.1207e-01, -3.1378e-01, 1.8423e+00, 8.1601e-03, -6.4619e-01,
  28732. -3.0747e-01, 3.4688e-01, 3.6228e-01],
  28733. [ 5.7460e-01, -4.0208e-01, 1.0801e+00, -1.1312e+00, -3.2286e-01,
  28734. -1.1081e+00, 4.8034e-01, 6.0842e-01],
  28735. [ 6.2895e-01, -4.3934e-01, 1.3977e+00, 3.7768e-01, -5.1339e-01,
  28736. -4.5727e-02, 1.0984e+00, 1.8214e-01],
  28737. [ 5.7829e-01, -4.2163e-01, 1.6847e+00, -5.0778e-01, -6.7321e-01,
  28738. -5.3774e-01, 4.7523e-01, 8.3916e-02],
  28739. [ 5.4590e-01, -4.2148e-01, 9.0432e-01, -9.8382e-01, -5.8268e-01,
  28740. -1.0388e+00, 1.2363e-01, 3.3782e-01],
  28741. [ 5.2315e-01, -4.1886e-01, 9.3580e-01, -1.4006e+00, -3.9215e-01,
  28742. -1.3698e+00, 2.5553e-01, 2.9064e-01]]], device='cuda:0')
  28743. loss_train_step before backward: tensor(0.0213, device='cuda:0', grad_fn=<MseLossBackward>)
  28744. loss_train_step after backward: tensor(0.0213, device='cuda:0', grad_fn=<MseLossBackward>)
  28745. loss_train: 0.9329804559238255
  28746. step: 46
  28747. running loss: 0.020282183824430988
  28748. Train Steps: 46/90 Loss: 0.0203 torch.Size([8, 600, 800])
  28749. torch.Size([8, 8])
  28750. tensor([[0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  28751. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  28752. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  28753. [0.6246, 0.4028, 0.8738, 0.4867, 0.4088, 0.5667, 0.6362, 0.5200],
  28754. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  28755. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  28756. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  28757. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609]],
  28758. device='cuda:0', dtype=torch.float64)
  28759. predictions are: tensor([[ 3.4157e-01, -5.4580e-01, 1.7160e+00, -9.9776e-02, -5.3122e-01,
  28760. 1.0598e-01, 4.4080e-01, 7.4866e-02],
  28761. [ 4.5865e-01, -4.6616e-01, 1.6395e+00, -8.6564e-01, -4.8457e-01,
  28762. -8.4187e-01, 6.6704e-01, 2.8578e-01],
  28763. [ 9.5002e-02, -7.0816e-01, 1.8023e+00, -5.4315e-01, -6.0169e-01,
  28764. -1.0344e+00, 3.4626e-01, 5.6686e-02],
  28765. [ 4.0714e-01, -5.0531e-01, 1.6999e+00, -8.3630e-02, -4.9261e-01,
  28766. 3.0629e-01, 5.2600e-01, 1.3596e-01],
  28767. [ 7.4241e-01, -3.0988e-01, 1.2474e+00, -1.2521e+00, -2.4741e-01,
  28768. -1.4120e+00, 4.0297e-01, 2.0329e-01],
  28769. [ 4.5643e-01, -4.0569e-01, 1.1043e+00, -6.4953e-01, -7.8430e-01,
  28770. -5.2145e-01, -1.3662e-03, 4.6987e-01],
  28771. [ 4.2579e-01, -5.1258e-01, 1.6009e+00, 2.2429e-01, -5.5763e-01,
  28772. -8.9889e-02, 2.6553e-01, 1.4516e-01],
  28773. [ 1.9168e-01, -6.7445e-01, 1.6228e+00, -1.1956e+00, 1.8815e-01,
  28774. -1.3783e+00, 1.0478e+00, 3.1273e-01]], device='cuda:0',
  28775. grad_fn=<AddmmBackward>)
  28776. landmarks are: tensor([[[ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  28777. -0.0881],
  28778. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  28779. 0.3050],
  28780. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  28781. -0.0049],
  28782. [ 0.5990, -0.4256, 1.7499, -0.0380, -0.3979, 0.3315, 0.6529,
  28783. 0.1159],
  28784. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  28785. 0.2237],
  28786. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  28787. 0.4036],
  28788. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  28789. 0.1979],
  28790. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  28791. 0.3050]]], device='cuda:0')
  28792. loss_train_step before backward: tensor(0.0230, device='cuda:0', grad_fn=<MseLossBackward>)
  28793. loss_train_step after backward: tensor(0.0230, device='cuda:0', grad_fn=<MseLossBackward>)
  28794. loss_train: 0.9559376635588706
  28795. step: 47
  28796. running loss: 0.02033909922465682
  28797. Train Steps: 47/90 Loss: 0.0203 torch.Size([8, 600, 800])
  28798. torch.Size([8, 8])
  28799. tensor([[0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  28800. [0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567],
  28801. [0.6185, 0.4079, 0.8838, 0.4617, 0.4838, 0.5650, 0.6175, 0.5850],
  28802. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  28803. [0.6339, 0.4102, 0.8588, 0.3133, 0.4425, 0.2117, 0.6417, 0.5089],
  28804. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  28805. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  28806. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389]],
  28807. device='cuda:0', dtype=torch.float64)
  28808. predictions are: tensor([[ 0.0754, -0.6728, 1.4005, -0.7200, -0.4994, -1.1253, 0.1119, 0.0342],
  28809. [ 0.7075, -0.3032, 1.7789, 0.2578, -0.6072, 0.0754, 0.5373, 0.2307],
  28810. [ 0.4886, -0.4103, 1.7513, -0.1235, -0.1657, 0.1917, 0.4897, 0.3107],
  28811. [ 0.6213, -0.3726, 1.1898, -1.2564, -0.3196, -1.3608, 0.4322, 0.1022],
  28812. [ 0.7552, -0.2970, 1.6800, -0.7415, -0.2835, -1.2006, 0.7921, 0.0721],
  28813. [-2.7242, -2.5366, 0.9469, -1.2379, -0.4670, -1.2380, 0.2041, 0.1697],
  28814. [ 0.4366, -0.4563, 0.9809, -0.8987, -0.6418, -0.8829, 0.1738, 0.2443],
  28815. [ 0.6094, -0.3594, 1.1859, -1.1509, -0.5651, -0.9896, 0.5455, 0.2325]],
  28816. device='cuda:0', grad_fn=<AddmmBackward>)
  28817. landmarks are: tensor([[[ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  28818. 0.0111],
  28819. [ 0.5770, -0.3918, 1.7961, 0.1544, -0.5480, 0.1467, 0.4450,
  28820. 0.2853],
  28821. [ 0.5707, -0.4017, 1.7961, -0.1535, -0.0515, 0.3238, 0.5663,
  28822. 0.4162],
  28823. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  28824. 0.1082],
  28825. [ 0.6421, -0.3912, 1.6806, -0.8386, -0.2420, -1.3082, 0.6780,
  28826. 0.0646],
  28827. [-2.2859, -2.2859, 0.7222, -1.4930, -0.3921, -1.3698, 0.1404,
  28828. 0.1343],
  28829. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  28830. 0.2476],
  28831. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  28832. 0.2032]]], device='cuda:0')
  28833. loss_train_step before backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  28834. loss_train_step after backward: tensor(0.0158, device='cuda:0', grad_fn=<MseLossBackward>)
  28835. loss_train: 0.9717486617155373
  28836. step: 48
  28837. running loss: 0.02024476378574036
  28838.  
  28839. Train Steps: 48/90 Loss: 0.0202 torch.Size([8, 600, 800])
  28840. torch.Size([8, 8])
  28841. tensor([[0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  28842. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  28843. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  28844. [0.6296, 0.4060, 0.9100, 0.3267, 0.4726, 0.3367, 0.7446, 0.5355],
  28845. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  28846. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501],
  28847. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  28848. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883]],
  28849. device='cuda:0', dtype=torch.float64)
  28850. predictions are: tensor([[ 0.5644, -0.4089, 1.3489, -1.0632, -0.3554, -1.2604, 0.3068, 0.0804],
  28851. [ 0.4687, -0.4830, 1.2589, -1.1416, -0.2557, -1.2853, 0.4649, 0.1626],
  28852. [ 0.4234, -0.5423, 1.6914, 0.3361, -0.5816, -0.0057, 0.5142, -0.0243],
  28853. [ 0.4425, -0.5201, 1.8059, -0.6999, -0.2962, -0.6888, 1.0130, 0.1350],
  28854. [ 0.2810, -0.5907, 1.3972, -1.1654, -0.4216, -0.9874, 0.6505, 0.1130],
  28855. [ 0.6097, -0.3620, 1.3889, -1.0538, -0.3057, -1.2302, 0.3695, 0.1679],
  28856. [ 0.5667, -0.4004, 1.3944, -0.9263, -0.5386, -0.9340, 0.3893, 0.2306],
  28857. [-0.0884, -0.7821, 1.0243, -0.7315, -0.6894, -0.8069, 0.1109, 0.4189]],
  28858. device='cuda:0', grad_fn=<AddmmBackward>)
  28859. landmarks are: tensor([[[ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  28860. 0.0928],
  28861. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  28862. 0.2083],
  28863. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  28864. 0.0697],
  28865. [ 0.6224, -0.4105, 1.9173, -0.7771, -0.1030, -0.7308, 1.1532,
  28866. 0.1875],
  28867. [ 0.6141, -0.4153, 1.4208, -1.2697, -0.2940, -1.0234, 0.8644,
  28868. 0.1715],
  28869. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  28870. 0.2549],
  28871. [ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  28872. 0.2622],
  28873. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  28874. 0.4316]]], device='cuda:0')
  28875. loss_train_step before backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  28876. loss_train_step after backward: tensor(0.0207, device='cuda:0', grad_fn=<MseLossBackward>)
  28877. loss_train: 0.9924390469677746
  28878. step: 49
  28879. running loss: 0.020253858101383155
  28880. Train Steps: 49/90 Loss: 0.0203 torch.Size([8, 600, 800])
  28881. torch.Size([8, 8])
  28882. tensor([[0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  28883. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  28884. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  28885. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  28886. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778],
  28887. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  28888. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  28889. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843]],
  28890. device='cuda:0', dtype=torch.float64)
  28891. predictions are: tensor([[ 0.3356, -0.6246, 1.6195, 0.2512, -0.6513, -0.3454, 0.5973, 0.0688],
  28892. [ 0.6370, -0.3359, 1.3365, -1.0085, -0.1253, -1.4134, 0.3820, 0.2478],
  28893. [ 0.4861, -0.4302, 1.6799, -0.2698, -0.5321, -0.0616, 0.5071, 0.2307],
  28894. [ 0.3765, -0.4768, 1.6450, -0.1350, -0.4039, -0.1223, 0.2556, 0.1823],
  28895. [ 0.5536, -0.4313, 0.9053, -1.4331, -0.4854, -1.2592, 0.2617, 0.0754],
  28896. [ 0.6161, -0.3597, 1.4798, -1.0293, -0.3282, -1.1504, 0.4840, 0.1977],
  28897. [ 0.4582, -0.4561, 1.7081, -0.8268, -0.5026, -0.7563, 0.6979, 0.2014],
  28898. [ 0.6078, -0.3919, 1.8090, -0.2198, -0.5793, -0.0794, 0.6614, 0.0188]],
  28899. device='cuda:0', grad_fn=<AddmmBackward>)
  28900. landmarks are: tensor([[[ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  28901. -0.1278],
  28902. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  28903. 0.2083],
  28904. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  28905. 0.1775],
  28906. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  28907. 0.1439],
  28908. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  28909. -0.0791],
  28910. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  28911. 0.2043],
  28912. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  28913. 0.1390],
  28914. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  28915. -0.0490]]], device='cuda:0')
  28916. loss_train_step before backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  28917. loss_train_step after backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  28918. loss_train: 1.0023726033978164
  28919. step: 50
  28920. running loss: 0.02004745206795633
  28921. Train Steps: 50/90 Loss: 0.0200 torch.Size([8, 600, 800])
  28922. torch.Size([8, 8])
  28923. tensor([[0.6205, 0.4004, 0.8938, 0.4883, 0.3663, 0.5000, 0.6357, 0.4947],
  28924. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  28925. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  28926. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  28927. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  28928. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  28929. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  28930. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817]],
  28931. device='cuda:0', dtype=torch.float64)
  28932. predictions are: tensor([[ 0.7533, -0.3049, 1.7014, -0.1500, -0.6275, -0.0598, 0.6284, -0.0155],
  28933. [ 0.7431, -0.2644, 1.7102, -0.3314, -0.3599, 0.0643, 0.5581, 0.1520],
  28934. [ 0.8763, -0.1319, 1.6137, -0.1098, -0.3940, -1.0488, 0.3424, 0.4068],
  28935. [ 0.5484, -0.3760, 1.6466, -0.0710, -0.1373, 0.0032, 0.3874, 0.1075],
  28936. [-2.5872, -2.4539, 0.9287, -1.3730, -0.5087, -1.2914, 0.1816, 0.1541],
  28937. [ 0.5824, -0.4260, 1.6279, 0.0228, -0.3571, -0.1051, 0.5001, -0.1236],
  28938. [ 0.7043, -0.3324, 1.7657, -0.3025, -0.6113, -0.6340, 0.7717, 0.0398],
  28939. [ 0.6638, -0.2967, 1.3242, -1.0323, -0.3195, -1.1665, 0.3938, 0.3216]],
  28940. device='cuda:0', grad_fn=<AddmmBackward>)
  28941. landmarks are: tensor([[[ 5.8031e-01, -4.3672e-01, 1.8423e+00, -3.0331e-02, -5.9423e-01,
  28942. 2.3557e-02, 6.5034e-01, -9.2270e-04],
  28943. [ 5.9602e-01, -4.1016e-01, 1.8018e+00, -1.6120e-01, -3.3441e-01,
  28944. 1.1594e-01, 5.4896e-01, 2.3141e-01],
  28945. [ 6.1386e-01, -3.2163e-01, 1.8134e+00, 3.1255e-02, -3.8637e-01,
  28946. -1.0157e+00, 2.1441e-01, 5.7619e-01],
  28947. [ 5.5635e-01, -3.8422e-01, 1.7268e+00, 1.0054e-01, -2.4997e-02,
  28948. 3.2255e-01, 2.6581e-01, 8.6245e-02],
  28949. [-2.2859e+00, -2.2859e+00, 1.0361e+00, -1.2021e+00, -4.2102e-01,
  28950. -1.3390e+00, 8.7067e-02, 3.2379e-01],
  28951. [ 5.8643e-01, -4.6898e-01, 1.7268e+00, 1.4673e-01, -2.9400e-01,
  28952. 8.1601e-03, 4.7968e-01, 1.5858e-02],
  28953. [ 6.2038e-01, -4.3356e-01, 1.8654e+00, -6.8822e-02, -6.0577e-01,
  28954. -5.2302e-01, 6.5034e-01, 4.7170e-02],
  28955. [ 5.9636e-01, -3.3795e-01, 1.4785e+00, -8.3865e-01, -2.4203e-01,
  28956. -1.0619e+00, 3.2379e-01, 4.0077e-01]]], device='cuda:0')
  28957. loss_train_step before backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  28958. loss_train_step after backward: tensor(0.0161, device='cuda:0', grad_fn=<MseLossBackward>)
  28959. loss_train: 1.0185070815496147
  28960. step: 51
  28961. running loss: 0.01997072708920813
  28962. Train Steps: 51/90 Loss: 0.0200 torch.Size([8, 600, 800])
  28963. torch.Size([8, 8])
  28964. tensor([[0.6142, 0.4127, 0.7575, 0.3067, 0.3438, 0.4383, 0.5778, 0.5207],
  28965. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  28966. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367],
  28967. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  28968. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467],
  28969. [0.6236, 0.4081, 0.8575, 0.3000, 0.3713, 0.3033, 0.5550, 0.5633],
  28970. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  28971. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426]],
  28972. device='cuda:0', dtype=torch.float64)
  28973. predictions are: tensor([[ 0.5031, -0.4425, 1.2040, -0.7772, -0.5495, -0.3063, 0.4339, 0.1906],
  28974. [ 0.3934, -0.5387, 1.4250, -0.7125, -0.5673, -0.3420, 0.6277, 0.2145],
  28975. [ 0.7193, -0.3086, 1.8446, -0.8237, -0.1610, -1.2996, 0.7239, 0.0600],
  28976. [ 0.5397, -0.4609, 1.6552, -0.6620, -0.5809, -0.4994, 0.7042, 0.1421],
  28977. [ 0.8671, -0.2594, 1.1405, -1.1521, -0.4197, -1.0268, 0.5970, 0.0799],
  28978. [ 0.6018, -0.3752, 1.6716, -0.6814, -0.4735, -0.9963, 0.3710, 0.0484],
  28979. [ 0.2039, -0.6625, 1.6431, -0.2761, -0.5604, -0.3393, 0.3029, 0.1686],
  28980. [ 0.6398, -0.3982, 1.2430, -1.0984, -0.1309, -1.4904, 0.4661, 0.0773]],
  28981. device='cuda:0', grad_fn=<AddmmBackward>)
  28982. landmarks are: tensor([[[ 0.5509, -0.3798, 1.2129, -0.8694, -0.6982, -0.2613, 0.3830,
  28983. 0.1193],
  28984. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  28985. 0.2776],
  28986. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  28987. 0.1929],
  28988. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  28989. 0.2006],
  28990. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  28991. 0.2391],
  28992. [ 0.5944, -0.4008, 1.6748, -0.9002, -0.5711, -0.8848, 0.2776,
  28993. 0.3161],
  28994. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  28995. 0.3559],
  28996. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  28997. 0.2203]]], device='cuda:0')
  28998. loss_train_step before backward: tensor(0.0147, device='cuda:0', grad_fn=<MseLossBackward>)
  28999. loss_train_step after backward: tensor(0.0147, device='cuda:0', grad_fn=<MseLossBackward>)
  29000. loss_train: 1.0332335312850773
  29001. step: 52
  29002. running loss: 0.019869875601636104
  29003.  
  29004. Train Steps: 52/90 Loss: 0.0199 torch.Size([8, 600, 800])
  29005. torch.Size([8, 8])
  29006. tensor([[0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  29007. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  29008. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  29009. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  29010. [0.6201, 0.4017, 0.8871, 0.4621, 0.3517, 0.4675, 0.5999, 0.5106],
  29011. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  29012. [0.6113, 0.4104, 0.8650, 0.4250, 0.3925, 0.5967, 0.5787, 0.5116],
  29013. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433]],
  29014. device='cuda:0', dtype=torch.float64)
  29015. predictions are: tensor([[ 7.2992e-01, -3.0336e-01, 1.6313e+00, -1.1895e+00, -1.6060e-01,
  29016. -1.5407e+00, 7.1356e-01, -1.1083e-04],
  29017. [ 8.3763e-01, -2.4081e-01, 9.4407e-01, -1.0714e+00, -6.1049e-01,
  29018. -1.1304e+00, 3.6978e-01, 2.8219e-01],
  29019. [ 5.3184e-01, -4.5070e-01, 1.7964e+00, -2.1034e-01, -4.5707e-01,
  29020. 1.3236e-01, 5.4005e-01, 1.0987e-02],
  29021. [ 4.1670e-01, -5.2252e-01, 1.7129e+00, -1.5120e-01, -3.7215e-01,
  29022. 7.9002e-02, 4.5440e-01, 2.4114e-01],
  29023. [ 6.4734e-01, -3.8203e-01, 1.7813e+00, -1.8053e-01, -6.0651e-01,
  29024. -2.4972e-01, 4.8176e-01, 1.4656e-01],
  29025. [ 8.4762e-01, -2.9559e-01, 1.6944e+00, -8.0337e-01, -6.5135e-01,
  29026. -8.4902e-01, 8.1033e-01, -2.9006e-02],
  29027. [ 5.1166e-01, -4.3294e-01, 1.7072e+00, -3.1367e-01, -4.1504e-01,
  29028. 2.0122e-01, 4.7451e-01, 1.6525e-01],
  29029. [ 5.3567e-01, -4.6310e-01, 1.7171e+00, 1.5583e-01, 6.1324e-03,
  29030. -2.4901e-01, 2.7454e-01, 2.4279e-01]], device='cuda:0',
  29031. grad_fn=<AddmmBackward>)
  29032. landmarks are: tensor([[[ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  29033. -0.0209],
  29034. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  29035. 0.3315],
  29036. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  29037. -0.0322],
  29038. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  29039. 0.3047],
  29040. [ 0.5783, -0.4306, 1.8114, -0.1515, -0.6617, -0.1268, 0.4851,
  29041. 0.0727],
  29042. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  29043. -0.0220],
  29044. [ 0.5376, -0.3903, 1.7095, -0.3229, -0.4730, 0.4701, 0.3871,
  29045. 0.0772],
  29046. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  29047. 0.2237]]], device='cuda:0')
  29048. loss_train_step before backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  29049. loss_train_step after backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  29050. loss_train: 1.0451941271312535
  29051. step: 53
  29052. running loss: 0.019720643908136857
  29053. Train Steps: 53/90 Loss: 0.0197 torch.Size([8, 600, 800])
  29054. torch.Size([8, 8])
  29055. tensor([[0.6157, 0.3956, 0.8323, 0.4138, 0.3479, 0.4431, 0.5914, 0.5131],
  29056. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  29057. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  29058. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  29059. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  29060. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  29061. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402],
  29062. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938]],
  29063. device='cuda:0', dtype=torch.float64)
  29064. predictions are: tensor([[ 0.6368, -0.3853, 1.6120, -0.5413, -0.6199, -0.2305, 0.5398, 0.0600],
  29065. [ 0.5209, -0.4816, 1.6451, 0.1398, -0.3906, -0.1227, 0.5984, 0.0783],
  29066. [ 0.9131, -0.1735, 1.7377, -0.3481, -0.4845, -0.1768, 0.5186, 0.2881],
  29067. [ 0.6196, -0.3521, 1.8370, -0.8313, -0.1900, -1.2255, 0.7835, 0.2021],
  29068. [ 0.6076, -0.3732, 1.5815, -0.3898, -0.5213, -0.1574, 0.3139, 0.2048],
  29069. [ 0.6049, -0.3922, 1.6878, 0.0123, -0.1104, 0.0630, 0.2517, 0.1497],
  29070. [ 0.7485, -0.2795, 1.5738, -0.0625, -0.4706, -0.1227, 0.3277, 0.2029],
  29071. [ 0.6269, -0.3977, 1.9121, -0.6803, -0.4985, -1.1353, 0.7050, -0.0465]],
  29072. device='cuda:0', grad_fn=<AddmmBackward>)
  29073. landmarks are: tensor([[[ 0.5581, -0.4586, 1.5586, -0.3747, -0.6792, -0.2391, 0.4455,
  29074. 0.0840],
  29075. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  29076. 0.2091],
  29077. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  29078. 0.3161],
  29079. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  29080. 0.1554],
  29081. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  29082. 0.3265],
  29083. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  29084. 0.2634],
  29085. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  29086. 0.2093],
  29087. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  29088. -0.0049]]], device='cuda:0')
  29089. loss_train_step before backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  29090. loss_train_step after backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  29091. loss_train: 1.0568622411228716
  29092. step: 54
  29093. running loss: 0.019571522983756882
  29094. Train Steps: 54/90 Loss: 0.0196 torch.Size([8, 600, 800])
  29095. torch.Size([8, 8])
  29096. tensor([[0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  29097. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  29098. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  29099. [0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  29100. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  29101. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  29102. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  29103. [0.6203, 0.4076, 0.8611, 0.2878, 0.4050, 0.2554, 0.5907, 0.5496]],
  29104. device='cuda:0', dtype=torch.float64)
  29105. predictions are: tensor([[ 0.7829, -0.3401, 1.8872, -0.0882, -0.5316, -0.3178, 0.9825, 0.0237],
  29106. [ 0.7225, -0.2570, 1.2862, -0.5971, -0.6629, -0.5322, 0.2681, 0.3659],
  29107. [ 0.7286, -0.3055, 1.2713, -1.2098, -0.2073, -1.4156, 0.5210, 0.1292],
  29108. [ 0.6605, -0.3209, 1.4038, -0.7051, -0.5712, -0.9730, 0.0354, 0.1156],
  29109. [ 0.8193, -0.2439, 1.8907, 0.0371, -0.3015, 0.2836, 0.6148, 0.1104],
  29110. [ 0.8284, -0.2746, 1.8211, 0.1799, -0.3628, 0.1998, 0.5393, -0.0055],
  29111. [-1.1938, -1.5406, 1.1514, -1.2486, -0.3078, -1.3804, 0.1980, 0.1326],
  29112. [ 0.6440, -0.3563, 1.7050, -0.9408, -0.3089, -0.9373, 0.5627, 0.1509]],
  29113. device='cuda:0', grad_fn=<AddmmBackward>)
  29114. landmarks are: tensor([[[ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  29115. 0.1715],
  29116. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  29117. 0.4036],
  29118. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  29119. 0.2203],
  29120. [ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  29121. 0.2138],
  29122. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  29123. 0.1390],
  29124. [ 0.5778, -0.4389, 1.7107, 0.1192, -0.3921, 0.0815, 0.4741,
  29125. 0.0711],
  29126. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  29127. 0.0231],
  29128. [ 0.5790, -0.4031, 1.6915, -0.9564, -0.4152, -1.1063, 0.4425,
  29129. 0.2528]]], device='cuda:0')
  29130. loss_train_step before backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  29131. loss_train_step after backward: tensor(0.0374, device='cuda:0', grad_fn=<MseLossBackward>)
  29132. loss_train: 1.0942944386042655
  29133. step: 55
  29134. running loss: 0.019896262520077555
  29135. Train Steps: 55/90 Loss: 0.0199 torch.Size([8, 600, 800])
  29136. torch.Size([8, 8])
  29137. tensor([[0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  29138. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  29139. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  29140. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  29141. [0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  29142. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090],
  29143. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  29144. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133]],
  29145. device='cuda:0', dtype=torch.float64)
  29146. predictions are: tensor([[ 0.5863, -0.4174, 1.1850, -1.1955, -0.2477, -1.3069, 0.3485, 0.1124],
  29147. [ 0.7275, -0.3032, 1.7512, -0.7057, -0.5881, -0.3120, 0.4027, 0.2238],
  29148. [ 0.7115, -0.3709, 1.8298, -0.0473, -0.5467, -0.2742, 0.4645, 0.0810],
  29149. [ 0.7314, -0.3769, 1.9074, -0.1583, -0.5646, -0.3302, 0.7126, 0.0212],
  29150. [ 0.6423, -0.3575, 0.8832, -1.2260, -0.3278, -1.3196, 0.0393, 0.2563],
  29151. [ 0.6789, -0.3773, 1.8181, -0.6685, -0.3828, -0.8828, 0.6894, 0.0553],
  29152. [ 0.6784, -0.3066, 1.7560, -0.0381, -0.5392, -0.4158, 0.2583, 0.3503],
  29153. [ 0.5078, -0.5002, 1.7740, -0.0045, -0.3177, 0.4120, 0.7222, 0.1060]],
  29154. device='cuda:0', grad_fn=<AddmmBackward>)
  29155. landmarks are: tensor([[[ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  29156. 0.1449],
  29157. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  29158. 0.3392],
  29159. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  29160. 0.1082],
  29161. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  29162. 0.0325],
  29163. [ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  29164. 0.2747],
  29165. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  29166. 0.0652],
  29167. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  29168. 0.3161],
  29169. [ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  29170. 0.0852]]], device='cuda:0')
  29171. loss_train_step before backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  29172. loss_train_step after backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  29173. loss_train: 1.1001434274949133
  29174. step: 56
  29175. running loss: 0.01964541834812345
  29176.  
  29177. Train Steps: 56/90 Loss: 0.0196 torch.Size([8, 600, 800])
  29178. torch.Size([8, 8])
  29179. tensor([[ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  29180. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  29181. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  29182. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  29183. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  29184. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  29185. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  29186. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852]],
  29187. device='cuda:0', dtype=torch.float64)
  29188. predictions are: tensor([[-1.6910, -1.8692, 1.1434, -1.2963, -0.3648, -1.2930, 0.1842, 0.1635],
  29189. [ 0.7451, -0.2723, 1.7204, 0.1904, -0.3997, 0.1187, 0.1519, 0.1289],
  29190. [ 0.6097, -0.3337, 1.2839, -1.0808, -0.0696, -1.4428, 0.3928, 0.2679],
  29191. [ 0.7237, -0.3450, 1.7572, 0.1803, -0.5939, -0.1386, 0.5070, 0.0829],
  29192. [ 0.8000, -0.2632, 1.5401, -0.9677, -0.5274, -0.9060, 0.6557, 0.0595],
  29193. [ 0.5654, -0.4025, 1.4035, -1.1105, -0.3297, -1.2302, 0.4009, 0.1177],
  29194. [ 0.8601, -0.2298, 1.8324, 0.2251, -0.6189, -0.1713, 0.7841, 0.0564],
  29195. [ 0.7536, -0.2819, 1.8000, -0.0206, -0.2430, 0.1234, 0.2688, 0.2988]],
  29196. device='cuda:0', grad_fn=<AddmmBackward>)
  29197. landmarks are: tensor([[[-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  29198. 0.0231],
  29199. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  29200. 0.2048],
  29201. [ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  29202. 0.2160],
  29203. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  29204. 0.2075],
  29205. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  29206. 0.1080],
  29207. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  29208. 0.0928],
  29209. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  29210. 0.1608],
  29211. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  29212. 0.4171]]], device='cuda:0')
  29213. loss_train_step before backward: tensor(0.0204, device='cuda:0', grad_fn=<MseLossBackward>)
  29214. loss_train_step after backward: tensor(0.0204, device='cuda:0', grad_fn=<MseLossBackward>)
  29215. loss_train: 1.1205182750709355
  29216. step: 57
  29217. running loss: 0.019658215352121675
  29218. Train Steps: 57/90 Loss: 0.0197 torch.Size([8, 600, 800])
  29219. torch.Size([8, 8])
  29220. tensor([[0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  29221. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  29222. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  29223. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  29224. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  29225. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  29226. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  29227. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150]],
  29228. device='cuda:0', dtype=torch.float64)
  29229. predictions are: tensor([[ 0.7240, -0.3128, 1.8758, -0.1588, -0.5622, -0.1100, 0.3184, 0.3145],
  29230. [ 0.6164, -0.3884, 0.9456, -1.0949, -0.4927, -1.2268, 0.0999, 0.0704],
  29231. [ 0.5727, -0.4196, 1.4462, -0.6541, -0.6380, -0.7790, 0.2244, 0.1123],
  29232. [ 0.7500, -0.3441, 1.8785, -0.1390, -0.5367, 0.1114, 0.7222, 0.2040],
  29233. [ 0.3065, -0.6051, 1.9755, -0.6526, 0.0485, -1.1576, 0.8616, 0.2635],
  29234. [ 0.5309, -0.4451, 1.2675, -1.0254, -0.4772, -1.0516, 0.3530, 0.2737],
  29235. [ 0.7435, -0.3372, 1.7588, -0.5859, -0.5617, -0.5718, 0.6055, 0.1405],
  29236. [ 0.4607, -0.4934, 1.8087, 0.0506, -0.2326, 0.4321, 0.3402, 0.1789]],
  29237. device='cuda:0', grad_fn=<AddmmBackward>)
  29238. landmarks are: tensor([[[ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  29239. 0.3161],
  29240. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  29241. 0.0862],
  29242. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  29243. 0.0942],
  29244. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  29245. 0.1715],
  29246. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  29247. 0.2142],
  29248. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  29249. 0.2032],
  29250. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  29251. 0.1080],
  29252. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  29253. 0.0928]]], device='cuda:0')
  29254. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  29255. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  29256. loss_train: 1.134296880569309
  29257. step: 58
  29258. running loss: 0.01955684276843636
  29259. Train Steps: 58/90 Loss: 0.0196 torch.Size([8, 600, 800])
  29260. torch.Size([8, 8])
  29261. tensor([[0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  29262. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  29263. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791],
  29264. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  29265. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  29266. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  29267. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  29268. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778]],
  29269. device='cuda:0', dtype=torch.float64)
  29270. predictions are: tensor([[ 0.6055, -0.4108, 1.7864, 0.0511, -0.3500, -0.0902, 0.1680, 0.2737],
  29271. [ 0.7388, -0.3232, 1.8136, -0.4222, -0.5589, -0.1588, 0.5349, 0.2467],
  29272. [ 0.7091, -0.3533, 1.8356, -0.0353, -0.3907, 0.1420, 0.4466, 0.0463],
  29273. [ 0.5975, -0.3956, 1.4275, -0.8469, -0.5958, -0.3813, 0.4986, 0.3251],
  29274. [ 0.5958, -0.3976, 1.8374, -0.2642, -0.5575, -0.5204, 0.3262, 0.2197],
  29275. [ 0.6485, -0.3895, 1.7882, -0.4670, -0.5247, -0.8635, 0.3813, 0.1579],
  29276. [ 0.4192, -0.5455, 1.6479, 0.2483, -0.4039, -0.3421, 0.7505, 0.3025],
  29277. [ 0.4611, -0.4840, 1.1231, -1.3008, -0.3819, -1.3606, 0.1314, 0.0664]],
  29278. device='cuda:0', grad_fn=<AddmmBackward>)
  29279. landmarks are: tensor([[[ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  29280. 0.3777],
  29281. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  29282. 0.2083],
  29283. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  29284. -0.0731],
  29285. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  29286. 0.2776],
  29287. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  29288. 0.1544],
  29289. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  29290. 0.1005],
  29291. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  29292. 0.3692],
  29293. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  29294. -0.0791]]], device='cuda:0')
  29295. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  29296. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  29297. loss_train: 1.1419263114221394
  29298. step: 59
  29299. running loss: 0.01935468324444304
  29300. Train Steps: 59/90 Loss: 0.0194 torch.Size([8, 600, 800])
  29301. torch.Size([8, 8])
  29302. tensor([[0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  29303. [0.6222, 0.3957, 0.8838, 0.5017, 0.3937, 0.4600, 0.5900, 0.5017],
  29304. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  29305. [0.6168, 0.4029, 0.8523, 0.3417, 0.3588, 0.5000, 0.6125, 0.5400],
  29306. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  29307. [0.6053, 0.4035, 0.6897, 0.1916, 0.4000, 0.2117, 0.5440, 0.5168],
  29308. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  29309. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317]],
  29310. device='cuda:0', dtype=torch.float64)
  29311. predictions are: tensor([[ 0.7460, -0.2874, 1.7264, 0.2952, -0.3615, 0.0596, 0.1324, 0.1865],
  29312. [ 0.6967, -0.3833, 1.8552, 0.0737, -0.5081, -0.1024, 0.4197, 0.0161],
  29313. [-1.7460, -1.9138, 1.3348, -0.9356, -0.5931, -0.9858, 0.2740, 0.2554],
  29314. [ 0.8198, -0.2550, 1.6915, -0.6744, -0.5717, 0.0033, 0.7498, 0.2701],
  29315. [ 0.5167, -0.4165, 1.8108, -0.7367, -0.2093, -1.3022, 0.3991, 0.0950],
  29316. [ 0.5604, -0.4277, 0.9121, -1.2715, -0.3794, -1.3098, 0.3249, 0.1936],
  29317. [ 0.7529, -0.2951, 1.8136, 0.2724, -0.5670, -0.5399, 0.4457, 0.1687],
  29318. [ 0.4675, -0.4694, 1.3008, -1.0542, -0.3341, -1.1477, 0.4661, 0.2529]],
  29319. device='cuda:0', grad_fn=<AddmmBackward>)
  29320. landmarks are: tensor([[[ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  29321. 0.2048],
  29322. [ 0.5879, -0.4583, 1.7961, 0.0313, -0.4672, -0.1612, 0.4393,
  29323. 0.0313],
  29324. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  29325. 0.2699],
  29326. [ 0.5631, -0.4249, 1.6509, -0.7078, -0.6289, 0.0236, 0.5432,
  29327. 0.2083],
  29328. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  29329. -0.0368],
  29330. [ 0.5102, -0.4223, 0.8999, -1.4011, -0.4383, -1.3082, 0.2267,
  29331. 0.1013],
  29332. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  29333. 0.1698],
  29334. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  29335. 0.1698]]], device='cuda:0')
  29336. loss_train_step before backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  29337. loss_train_step after backward: tensor(0.0150, device='cuda:0', grad_fn=<MseLossBackward>)
  29338. loss_train: 1.156885642092675
  29339. step: 60
  29340. running loss: 0.01928142736821125
  29341.  
  29342. Train Steps: 60/90 Loss: 0.0193 torch.Size([8, 600, 800])
  29343. torch.Size([8, 8])
  29344. tensor([[0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  29345. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  29346. [0.6357, 0.4159, 0.8788, 0.5583, 0.3638, 0.4433, 0.6488, 0.5297],
  29347. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  29348. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  29349. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  29350. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  29351. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413]],
  29352. device='cuda:0', dtype=torch.float64)
  29353. predictions are: tensor([[ 0.3795, -0.5493, 1.2779, -1.1011, -0.6506, -0.7793, 0.3970, 0.1421],
  29354. [ 0.4603, -0.4661, 1.3833, -0.7593, -0.6260, -0.9102, -0.0130, 0.1901],
  29355. [ 0.6507, -0.3994, 1.7494, 0.2472, -0.6366, -0.2860, 0.6668, 0.0906],
  29356. [ 0.6627, -0.3054, 1.7199, -0.0872, -0.2746, -0.9652, 0.2201, 0.4598],
  29357. [ 0.6057, -0.4007, 1.7335, -0.2720, -0.6664, -0.7356, 0.3688, 0.2675],
  29358. [ 0.3530, -0.5622, 1.7161, -0.2440, -0.1596, 0.1293, 0.3165, 0.1964],
  29359. [ 0.3366, -0.5876, 1.3808, -0.9403, -0.6362, -0.8249, 0.4522, 0.1936],
  29360. [ 0.4302, -0.5576, 1.7444, -1.1820, 0.1793, -1.0450, 1.0431, 0.2124]],
  29361. device='cuda:0', grad_fn=<AddmmBackward>)
  29362. landmarks are: tensor([[[ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  29363. 0.2545],
  29364. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  29365. 0.2776],
  29366. [ 0.6504, -0.3647, 1.7730, 0.2930, -0.6058, -0.2382, 0.7109,
  29367. 0.1608],
  29368. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  29369. 0.5822],
  29370. [ 0.6016, -0.3633, 1.7152, -0.2228, -0.6115, -0.6385, 0.5028,
  29371. 0.2699],
  29372. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  29373. 0.2853],
  29374. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  29375. 0.1931],
  29376. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  29377. 0.2142]]], device='cuda:0')
  29378. loss_train_step before backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  29379. loss_train_step after backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  29380. loss_train: 1.1654705270193517
  29381. step: 61
  29382. running loss: 0.019106074213431995
  29383. Train Steps: 61/90 Loss: 0.0191 torch.Size([8, 600, 800])
  29384. torch.Size([8, 8])
  29385. tensor([[ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  29386. [0.6090, 0.4045, 0.7250, 0.2100, 0.4075, 0.2300, 0.5476, 0.5663],
  29387. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  29388. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  29389. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  29390. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  29391. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  29392. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367]],
  29393. device='cuda:0', dtype=torch.float64)
  29394. predictions are: tensor([[-2.1501, -2.1734, 1.3345, -0.8381, -0.5983, -0.9237, 0.1402, 0.2465],
  29395. [ 0.4663, -0.4732, 1.1043, -1.1138, -0.4635, -1.1531, 0.1945, 0.2410],
  29396. [-1.5817, -1.7912, 0.9501, -1.3078, -0.3975, -1.2940, 0.0970, 0.2340],
  29397. [ 0.9681, -0.1215, 1.7032, 0.3756, -0.5523, -0.0942, 0.4063, 0.1481],
  29398. [ 0.9483, -0.1109, 1.8560, 0.1420, -0.6529, -0.2599, 0.2922, 0.3571],
  29399. [ 0.8209, -0.2577, 1.7611, -1.0484, 0.1209, -0.9930, 1.0093, 0.2220],
  29400. [ 0.9207, -0.2333, 1.6936, 0.2770, -0.5535, -0.0371, 0.5384, 0.0420],
  29401. [ 0.7437, -0.2797, 1.4979, -0.9594, -0.3998, -1.1038, 0.4923, 0.1269]],
  29402. device='cuda:0', grad_fn=<AddmmBackward>)
  29403. landmarks are: tensor([[[-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  29404. 0.2837],
  29405. [ 0.5269, -0.4176, 1.0628, -1.3159, -0.4037, -1.2236, 0.2432,
  29406. 0.3297],
  29407. [-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  29408. 0.2930],
  29409. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  29410. 0.2391],
  29411. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  29412. 0.3623],
  29413. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  29414. 0.2142],
  29415. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  29416. 0.0697],
  29417. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  29418. 0.1929]]], device='cuda:0')
  29419. loss_train_step before backward: tensor(0.0272, device='cuda:0', grad_fn=<MseLossBackward>)
  29420. loss_train_step after backward: tensor(0.0272, device='cuda:0', grad_fn=<MseLossBackward>)
  29421. loss_train: 1.192680740263313
  29422. step: 62
  29423. running loss: 0.019236786133279244
  29424. Train Steps: 62/90 Loss: 0.0192 torch.Size([8, 600, 800])
  29425. torch.Size([8, 8])
  29426. tensor([[0.6289, 0.4024, 0.9088, 0.4567, 0.3937, 0.5633, 0.7058, 0.5609],
  29427. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  29428. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  29429. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  29430. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378],
  29431. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  29432. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  29433. [0.6339, 0.4112, 0.8838, 0.5067, 0.4000, 0.5433, 0.7549, 0.5378]],
  29434. device='cuda:0', dtype=torch.float64)
  29435. predictions are: tensor([[ 0.6573, -0.3446, 1.6966, -0.2443, -0.5200, 0.1686, 0.5751, 0.2832],
  29436. [ 0.6415, -0.3198, 1.6393, -0.4346, -0.4965, -0.9133, 0.0875, 0.4190],
  29437. [ 0.4149, -0.5455, 1.8838, -0.2986, -0.3281, -0.9900, 0.6586, 0.1507],
  29438. [ 0.6257, -0.3637, 1.6404, 0.1075, -0.6028, -0.1368, 0.3381, 0.1363],
  29439. [ 0.5099, -0.4514, 1.6478, -1.0770, 0.0905, -1.2842, 0.7178, 0.1467],
  29440. [ 0.6812, -0.3321, 1.5995, 0.0378, -0.5077, 0.1190, 0.6594, 0.2596],
  29441. [-2.2269, -2.2209, 1.0822, -1.1340, -0.4991, -1.3651, -0.0889, 0.1406],
  29442. [ 0.5776, -0.4028, 1.6504, -0.0414, -0.5256, 0.1455, 0.5969, 0.2451]],
  29443. device='cuda:0', grad_fn=<AddmmBackward>)
  29444. landmarks are: tensor([[[ 0.6191, -0.4273, 1.9115, -0.1766, -0.4672, 0.3161, 0.9741,
  29445. 0.3050],
  29446. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  29447. 0.3928],
  29448. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  29449. 0.2142],
  29450. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  29451. 0.1385],
  29452. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  29453. 0.1982],
  29454. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  29455. 0.2249],
  29456. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  29457. 0.2183],
  29458. [ 0.6421, -0.3864, 1.7961, 0.0543, -0.4383, 0.2237, 1.2007,
  29459. 0.1982]]], device='cuda:0')
  29460. loss_train_step before backward: tensor(0.0305, device='cuda:0', grad_fn=<MseLossBackward>)
  29461. loss_train_step after backward: tensor(0.0305, device='cuda:0', grad_fn=<MseLossBackward>)
  29462. loss_train: 1.2231627046130598
  29463. step: 63
  29464. running loss: 0.019415281025604123
  29465. Train Steps: 63/90 Loss: 0.0194 torch.Size([8, 600, 800])
  29466. torch.Size([8, 8])
  29467. tensor([[0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  29468. [0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373],
  29469. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575],
  29470. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  29471. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  29472. [ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  29473. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  29474. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550]],
  29475. device='cuda:0', dtype=torch.float64)
  29476. predictions are: tensor([[ 0.6864, -0.2961, 1.5186, -0.5382, -0.5293, -0.7114, 0.4208, 0.5046],
  29477. [ 0.9863, -0.1553, 1.5130, 0.3829, -0.4618, -0.3696, 0.4101, 0.2275],
  29478. [ 0.8880, -0.2267, 1.6710, -0.8084, -0.3837, -0.4435, 1.0219, 0.2616],
  29479. [-2.2763, -2.2673, 1.3555, -0.8581, -0.5137, -0.9928, 0.1230, 0.2752],
  29480. [ 0.7329, -0.2929, 1.7610, -0.4323, -0.5493, -0.6349, 0.1989, 0.0026],
  29481. [-1.8182, -1.9563, 0.9659, -1.3406, -0.3299, -1.3894, 0.0819, 0.2440],
  29482. [ 0.8465, -0.2613, 1.7509, 0.2371, -0.4888, -0.1813, 0.6480, 0.0601],
  29483. [ 0.8349, -0.2106, 1.8088, -0.2125, -0.3730, 0.0472, 0.5546, 0.3162]],
  29484. device='cuda:0', grad_fn=<AddmmBackward>)
  29485. landmarks are: tensor([[[ 5.4376e-01, -4.2055e-01, 1.5189e+00, -4.5373e-01, -6.1155e-01,
  29486. -6.2309e-01, 4.3649e-01, 5.4914e-01],
  29487. [ 5.6801e-01, -4.5619e-01, 1.5697e+00, 4.9469e-01, -4.9038e-01,
  29488. -1.5026e-01, 3.5357e-01, 1.9563e-01],
  29489. [ 6.1577e-01, -4.2490e-01, 1.8654e+00, -9.0023e-01, -3.2286e-01,
  29490. -3.5366e-01, 9.6675e-01, 2.8902e-01],
  29491. [-2.2859e+00, -2.2859e+00, 1.4006e+00, -8.1049e-01, -6.1155e-01,
  29492. -8.2325e-01, 4.1889e-02, 2.8371e-01],
  29493. [ 5.5953e-01, -3.9877e-01, 1.7672e+00, -4.4604e-01, -5.5381e-01,
  29494. -5.3841e-01, 8.2802e-02, -3.0981e-02],
  29495. [-2.2859e+00, -2.2859e+00, 8.5162e-01, -1.3112e+00, -4.3256e-01,
  29496. -1.2851e+00, 7.5520e-02, 2.9299e-01],
  29497. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  29498. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  29499. [ 5.9677e-01, -3.7252e-01, 1.8423e+00, -1.3811e-01, -4.0370e-01,
  29500. 1.8522e-01, 6.0092e-01, 2.7760e-01]]], device='cuda:0')
  29501. loss_train_step before backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  29502. loss_train_step after backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  29503. loss_train: 1.2426480515860021
  29504. step: 64
  29505. running loss: 0.019416375806031283
  29506.  
  29507. Train Steps: 64/90 Loss: 0.0194 torch.Size([8, 600, 800])
  29508. torch.Size([8, 8])
  29509. tensor([[0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  29510. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  29511. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  29512. [0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  29513. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  29514. [0.6339, 0.4102, 0.8588, 0.3133, 0.4425, 0.2117, 0.6417, 0.5089],
  29515. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  29516. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350]],
  29517. device='cuda:0', dtype=torch.float64)
  29518. predictions are: tensor([[ 0.5682, -0.3837, 1.6764, -0.2138, -0.3883, -0.8902, 0.3701, 0.5147],
  29519. [ 0.2831, -0.6369, 1.5697, -1.2638, 0.0999, -1.3712, 0.9089, 0.2294],
  29520. [ 0.2783, -0.6375, 1.5955, -0.1216, -0.4374, 0.1521, 0.4283, 0.2186],
  29521. [ 0.4816, -0.4981, 1.7127, -0.2116, -0.7235, -0.0632, 0.5347, 0.3418],
  29522. [ 0.4290, -0.5700, 1.5273, 0.2132, -0.5799, -0.1178, 0.4299, 0.1792],
  29523. [ 0.5207, -0.4917, 1.6541, -0.9631, -0.3377, -1.1652, 0.7063, 0.0927],
  29524. [ 0.2865, -0.5891, 1.4471, -0.9866, -0.2524, -1.2922, 0.3699, 0.2180],
  29525. [ 0.1956, -0.6708, 1.3196, -1.2192, -0.3199, -1.2378, 0.4614, 0.2082]],
  29526. device='cuda:0', grad_fn=<AddmmBackward>)
  29527. landmarks are: tensor([[[ 6.1742e-01, -3.1175e-01, 1.6402e+00, -2.0739e-01, -1.9584e-01,
  29528. -1.0927e+00, 2.2674e-01, 5.8220e-01],
  29529. [ 6.5036e-01, -3.8397e-01, 1.5940e+00, -1.1312e+00, 2.1409e-01,
  29530. -1.5315e+00, 8.2052e-01, 2.9436e-01],
  29531. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  29532. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  29533. [ 5.7633e-01, -3.9630e-01, 1.7788e+00, -7.6520e-02, -6.5196e-01,
  29534. -8.4219e-02, 4.6236e-01, 2.7760e-01],
  29535. [ 5.8915e-01, -4.5504e-01, 1.5132e+00, 3.5458e-01, -3.6905e-01,
  29536. -1.5350e-01, 3.8152e-01, 1.4673e-01],
  29537. [ 6.4212e-01, -3.9120e-01, 1.6806e+00, -8.3865e-01, -2.4203e-01,
  29538. -1.3082e+00, 6.7795e-01, 6.4585e-02],
  29539. [ 5.9107e-01, -3.8879e-01, 1.4727e+00, -9.5412e-01, -9.1917e-02,
  29540. -1.4930e+00, 3.9885e-01, 2.0831e-01],
  29541. [ 5.7679e-01, -4.0308e-01, 1.3838e+00, -1.1527e+00, -2.1876e-01,
  29542. -1.4216e+00, 4.3790e-01, 1.8502e-01]]], device='cuda:0')
  29543. loss_train_step before backward: tensor(0.0199, device='cuda:0', grad_fn=<MseLossBackward>)
  29544. loss_train_step after backward: tensor(0.0199, device='cuda:0', grad_fn=<MseLossBackward>)
  29545. loss_train: 1.2625863901339471
  29546. step: 65
  29547. running loss: 0.019424406002060725
  29548. Train Steps: 65/90 Loss: 0.0194 torch.Size([8, 600, 800])
  29549. torch.Size([8, 8])
  29550. tensor([[0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  29551. [0.6267, 0.4080, 0.8438, 0.2633, 0.4763, 0.1800, 0.6259, 0.5240],
  29552. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  29553. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  29554. [0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  29555. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  29556. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  29557. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700]],
  29558. device='cuda:0', dtype=torch.float64)
  29559. predictions are: tensor([[ 0.5621, -0.4321, 1.7724, -0.4772, -0.5423, -0.1147, 0.8050, 0.2694],
  29560. [ 0.5308, -0.4434, 1.6116, -1.1489, -0.1159, -1.5357, 0.5198, 0.1760],
  29561. [ 0.5708, -0.3927, 1.7551, -0.3971, -0.4772, 0.0762, 0.3674, 0.0970],
  29562. [ 0.3569, -0.5271, 1.7537, -0.2564, -0.2742, 0.1578, 0.5440, 0.2621],
  29563. [ 0.5001, -0.4712, 1.6459, 0.1250, -0.5059, -0.5100, 0.7173, 0.2668],
  29564. [ 0.5423, -0.4400, 1.6106, 0.2562, -0.5150, -0.2214, 0.4051, 0.1300],
  29565. [ 0.4982, -0.4699, 1.4092, 0.0876, -0.4595, -0.2477, 0.7810, 0.3380],
  29566. [-2.5799, -2.5101, 0.9946, -1.3201, -0.3054, -1.6528, 0.1075, 0.3432]],
  29567. device='cuda:0', grad_fn=<AddmmBackward>)
  29568. landmarks are: tensor([[[ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  29569. 0.1715],
  29570. [ 0.6088, -0.4015, 1.6113, -1.0696, -0.0861, -1.4545, 0.6051,
  29571. 0.1343],
  29572. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  29573. -0.0322],
  29574. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  29575. 0.0928],
  29576. [ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  29577. 0.2516],
  29578. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  29579. -0.1385],
  29580. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  29581. 0.1928],
  29582. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  29583. 0.3469]]], device='cuda:0')
  29584. loss_train_step before backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  29585. loss_train_step after backward: tensor(0.0219, device='cuda:0', grad_fn=<MseLossBackward>)
  29586. loss_train: 1.2844528066925704
  29587. step: 66
  29588. running loss: 0.019461406162008643
  29589. Train Steps: 66/90 Loss: 0.0195 torch.Size([8, 600, 800])
  29590. torch.Size([8, 8])
  29591. tensor([[0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  29592. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  29593. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  29594. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  29595. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  29596. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  29597. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  29598. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583]],
  29599. device='cuda:0', dtype=torch.float64)
  29600. predictions are: tensor([[ 0.6355, -0.3365, 1.7837, 0.2189, -0.3321, -0.7855, 0.6329, 0.4986],
  29601. [ 0.6189, -0.3985, 1.1583, -1.1676, -0.5172, -0.9246, 0.6778, 0.2728],
  29602. [ 0.4296, -0.5356, 1.8003, -0.0223, -0.1546, 0.1135, 0.4732, 0.0954],
  29603. [ 0.2051, -0.6368, 1.1759, -1.1390, -0.3122, -1.3071, 0.3184, 0.2113],
  29604. [ 0.2515, -0.6269, 1.0781, -1.1108, -0.3976, -1.3259, 0.3161, 0.0738],
  29605. [-2.5323, -2.4686, 1.0653, -1.2045, -0.4495, -1.2806, 0.2355, 0.2090],
  29606. [ 0.6640, -0.3917, 1.4862, -1.1260, -0.1107, -1.3607, 0.8365, 0.1686],
  29607. [ 0.4217, -0.5376, 1.9231, -0.1483, -0.5415, -0.2629, 0.6584, 0.2839]],
  29608. device='cuda:0', grad_fn=<AddmmBackward>)
  29609. landmarks are: tensor([[[ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  29610. 0.5762],
  29611. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  29612. 0.3007],
  29613. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  29614. -0.0039],
  29615. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  29616. 0.1343],
  29617. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  29618. -0.0580],
  29619. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  29620. 0.1073],
  29621. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  29622. 0.1467],
  29623. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  29624. 0.2930]]], device='cuda:0')
  29625. loss_train_step before backward: tensor(0.0230, device='cuda:0', grad_fn=<MseLossBackward>)
  29626. loss_train_step after backward: tensor(0.0230, device='cuda:0', grad_fn=<MseLossBackward>)
  29627. loss_train: 1.3074766951613128
  29628. step: 67
  29629. running loss: 0.019514577539721085
  29630. Train Steps: 67/90 Loss: 0.0195 torch.Size([8, 600, 800])
  29631. torch.Size([8, 8])
  29632. tensor([[0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  29633. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  29634. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  29635. [ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  29636. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  29637. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  29638. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  29639. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748]],
  29640. device='cuda:0', dtype=torch.float64)
  29641. predictions are: tensor([[ 0.7521, -0.2619, 1.6282, -0.0429, -0.5543, -0.5445, 0.4366, 0.3235],
  29642. [-2.1303, -2.1780, 1.7012, -1.1529, 0.1408, -1.2760, 0.8930, 0.4179],
  29643. [ 0.7358, -0.3000, 1.6929, 0.0419, -0.5112, -0.0552, 0.5920, 0.1726],
  29644. [-1.7605, -1.9247, 0.9663, -1.3456, -0.4302, -1.4783, 0.0266, 0.2209],
  29645. [ 0.7053, -0.2838, 1.5613, 0.1993, -0.0641, -0.2609, 0.4373, 0.3980],
  29646. [ 0.5957, -0.3948, 1.7999, -0.4406, -0.5199, -0.3977, 0.4966, 0.2283],
  29647. [ 0.6119, -0.3963, 1.6988, -0.1708, -0.3118, 0.0706, 0.3834, -0.0591],
  29648. [ 0.6916, -0.3560, 1.5536, 0.0555, -0.4908, -0.3907, 1.0764, 0.2408]],
  29649. device='cuda:0', grad_fn=<AddmmBackward>)
  29650. landmarks are: tensor([[[ 5.7771e-01, -3.9153e-01, 1.7961e+00, 1.6982e-01, -5.1917e-01,
  29651. -5.3072e-01, 2.1409e-01, 3.3918e-01],
  29652. [-2.2859e+00, -2.2859e+00, 1.8018e+00, -9.0023e-01, 1.9099e-01,
  29653. -1.2467e+00, 1.1057e+00, 3.7986e-01],
  29654. [ 5.6028e-01, -4.3195e-01, 1.7788e+00, 1.7752e-01, -5.5381e-01,
  29655. -6.1124e-02, 4.7968e-01, 1.5443e-01],
  29656. [-2.2859e+00, -2.2859e+00, 1.0712e+00, -1.2085e+00, -3.8060e-01,
  29657. -1.3929e+00, 7.5520e-02, 2.0062e-01],
  29658. [ 5.9590e-01, -3.5789e-01, 1.6055e+00, 3.6228e-01, -5.7275e-02,
  29659. -2.0739e-01, 3.1224e-01, 4.5466e-01],
  29660. [ 5.8320e-01, -4.2309e-01, 1.8423e+00, -3.6135e-01, -5.2494e-01,
  29661. -3.1517e-01, 3.0647e-01, 2.9299e-01],
  29662. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  29663. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  29664. [ 6.4212e-01, -3.6471e-01, 1.5940e+00, 3.0839e-01, -5.1917e-01,
  29665. -3.6905e-01, 1.1057e+00, 3.6917e-01]]], device='cuda:0')
  29666. loss_train_step before backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  29667. loss_train_step after backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  29668. loss_train: 1.325725748669356
  29669. step: 68
  29670. running loss: 0.019495966892196414
  29671.  
  29672. Train Steps: 68/90 Loss: 0.0195 torch.Size([8, 600, 800])
  29673. torch.Size([8, 8])
  29674. tensor([[0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  29675. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  29676. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  29677. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  29678. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  29679. [0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  29680. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  29681. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833]],
  29682. device='cuda:0', dtype=torch.float64)
  29683. predictions are: tensor([[ 0.5283, -0.5369, 1.9181, -0.6369, -0.4015, -0.9028, 0.8409, -0.0470],
  29684. [ 0.2845, -0.6451, 1.9472, -0.3014, -0.4665, -0.3839, 0.4376, 0.1284],
  29685. [ 0.5186, -0.4488, 1.4861, -0.1716, -0.4262, -0.8543, 0.4471, 0.4673],
  29686. [ 0.3839, -0.5428, 1.3026, -1.1962, -0.0284, -1.3630, 0.4675, 0.3162],
  29687. [ 0.1748, -0.7349, 1.7817, -0.0084, -0.4737, -0.1699, 0.6443, 0.3722],
  29688. [ 0.4493, -0.5394, 1.7518, 0.1026, -0.4578, -0.4625, 0.4444, 0.3099],
  29689. [ 0.4751, -0.5104, 1.9062, -0.2140, -0.2256, 0.3614, 0.8055, 0.2947],
  29690. [ 0.3398, -0.6077, 0.9313, -1.0825, -0.4828, -0.9722, 0.4175, 0.3324]],
  29691. device='cuda:0', grad_fn=<AddmmBackward>)
  29692. landmarks are: tensor([[[ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  29693. 0.0539],
  29694. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  29695. 0.1852],
  29696. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  29697. 0.5071],
  29698. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  29699. 0.3854],
  29700. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  29701. 0.5239],
  29702. [ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  29703. 0.3392],
  29704. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  29705. 0.4701],
  29706. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  29707. 0.4085]]], device='cuda:0')
  29708. loss_train_step before backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  29709. loss_train_step after backward: tensor(0.0231, device='cuda:0', grad_fn=<MseLossBackward>)
  29710. loss_train: 1.3488060417585075
  29711. step: 69
  29712. running loss: 0.01954791364867402
  29713. Train Steps: 69/90 Loss: 0.0195 torch.Size([8, 600, 800])
  29714. torch.Size([8, 8])
  29715. tensor([[0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  29716. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  29717. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  29718. [0.6030, 0.3969, 0.7988, 0.3917, 0.3450, 0.3667, 0.5266, 0.4700],
  29719. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  29720. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  29721. [0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  29722. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072]],
  29723. device='cuda:0', dtype=torch.float64)
  29724. predictions are: tensor([[ 0.7772, -0.2527, 1.6278, 0.0698, -0.3793, -0.1506, 0.2176, 0.2853],
  29725. [-1.7345, -1.9180, 1.5621, -1.2114, 0.2351, -1.2765, 1.1004, 0.4288],
  29726. [ 0.8021, -0.2626, 1.6834, 0.2813, -0.5456, -0.5102, 0.6018, 0.0368],
  29727. [ 0.8277, -0.2241, 1.4681, -0.4764, -0.6223, -0.5843, 0.2276, 0.0560],
  29728. [-1.8877, -2.0528, 1.1652, -1.0918, -0.5150, -1.0408, 0.1515, 0.2189],
  29729. [ 0.8518, -0.1916, 1.7081, -0.0081, -0.2950, 0.3841, 0.5503, 0.2017],
  29730. [ 0.8578, -0.2372, 1.6706, 0.0083, -0.5515, -0.4213, 0.4641, 0.1731],
  29731. [-0.7118, -1.2511, 1.4998, -1.1039, 0.2474, -1.1877, 1.1366, 0.5582]],
  29732. device='cuda:0', grad_fn=<AddmmBackward>)
  29733. landmarks are: tensor([[[ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  29734. 0.2589],
  29735. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  29736. 0.3371],
  29737. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  29738. -0.0957],
  29739. [ 0.4992, -0.4525, 1.4035, -0.4768, -0.6924, -0.5923, 0.1465,
  29740. -0.1151],
  29741. [-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  29742. 0.1253],
  29743. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  29744. 0.0412],
  29745. [ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  29746. 0.1082],
  29747. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  29748. 0.5188]]], device='cuda:0')
  29749. loss_train_step before backward: tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward>)
  29750. loss_train_step after backward: tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward>)
  29751. loss_train: 1.429237652104348
  29752. step: 70
  29753. running loss: 0.020417680744347827
  29754. Train Steps: 70/90 Loss: 0.0204 torch.Size([8, 600, 800])
  29755. torch.Size([8, 8])
  29756. tensor([[0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  29757. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  29758. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  29759. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  29760. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  29761. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  29762. [0.6231, 0.3973, 0.8650, 0.3950, 0.3625, 0.3183, 0.5837, 0.5167],
  29763. [0.6296, 0.4045, 0.9138, 0.4100, 0.4232, 0.4242, 0.7422, 0.5297]],
  29764. device='cuda:0', dtype=torch.float64)
  29765. predictions are: tensor([[ 0.4453, -0.4955, 1.0256, -1.3659, -0.3497, -1.3072, 0.4431, 0.1319],
  29766. [ 0.5297, -0.4232, 1.5883, -0.5915, -0.5403, -0.8735, 0.1991, 0.1346],
  29767. [ 0.4946, -0.4857, 1.7351, -0.2698, -0.5069, -0.1672, 0.6268, 0.2527],
  29768. [-2.8201, -2.6383, 1.6262, -0.9551, 0.1732, -1.2972, 0.9966, 0.4400],
  29769. [ 0.3718, -0.5021, 1.6190, 0.1805, -0.0066, 0.1725, 0.3168, 0.2959],
  29770. [ 0.3578, -0.5493, 1.6804, -0.0961, -0.4836, -0.3701, 0.3286, 0.1494],
  29771. [ 0.4327, -0.5074, 1.5830, -0.3938, -0.5189, -0.8052, 0.3056, 0.2072],
  29772. [ 0.6953, -0.3807, 1.7009, -0.3156, -0.4463, -0.3204, 0.8906, 0.2495]],
  29773. device='cuda:0', grad_fn=<AddmmBackward>)
  29774. landmarks are: tensor([[[ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  29775. 0.0213],
  29776. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  29777. -0.0340],
  29778. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  29779. 0.0985],
  29780. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  29781. 0.3799],
  29782. [ 0.5564, -0.3842, 1.7268, 0.1005, -0.0250, 0.3225, 0.2658,
  29783. 0.0862],
  29784. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  29785. 0.0467],
  29786. [ 0.5924, -0.4507, 1.7095, -0.4614, -0.6115, -0.8156, 0.4104,
  29787. 0.1005],
  29788. [ 0.6224, -0.4177, 1.9346, -0.3921, -0.3314, -0.3264, 1.1422,
  29789. 0.1608]]], device='cuda:0')
  29790. loss_train_step before backward: tensor(0.0187, device='cuda:0', grad_fn=<MseLossBackward>)
  29791. loss_train_step after backward: tensor(0.0187, device='cuda:0', grad_fn=<MseLossBackward>)
  29792. loss_train: 1.4479092578403652
  29793. step: 71
  29794. running loss: 0.020393088138596693
  29795. Train Steps: 71/90 Loss: 0.0204 torch.Size([8, 600, 800])
  29796. torch.Size([8, 8])
  29797. tensor([[0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  29798. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  29799. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  29800. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  29801. [0.6182, 0.3930, 0.8841, 0.3892, 0.3556, 0.4967, 0.6222, 0.5279],
  29802. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  29803. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  29804. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667]],
  29805. device='cuda:0', dtype=torch.float64)
  29806. predictions are: tensor([[ 0.4783, -0.4974, 1.6404, -0.4530, -0.5869, -0.5150, 0.2844, 0.1453],
  29807. [ 0.3782, -0.5538, 0.8784, -0.8781, -0.4522, -1.1484, 0.3703, 0.4597],
  29808. [ 0.4230, -0.5561, 2.0172, -0.3372, -0.3733, -0.6211, 0.8404, 0.1709],
  29809. [ 0.3973, -0.5338, 1.6760, -0.0551, -0.4016, -0.2625, 0.2399, 0.4082],
  29810. [ 0.4056, -0.5981, 1.8446, -0.3088, -0.4308, -0.1141, 0.7484, 0.1713],
  29811. [ 0.4678, -0.5262, 1.4584, -0.9175, -0.4248, -1.0008, 0.6792, 0.2188],
  29812. [ 0.0892, -0.7973, 1.9030, 0.0130, -0.0089, -0.0517, 0.2399, 0.0862],
  29813. [ 0.2341, -0.6479, 1.8795, -0.4693, -0.4716, -0.5444, 0.6646, 0.3986]],
  29814. device='cuda:0', grad_fn=<AddmmBackward>)
  29815. landmarks are: tensor([[[ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  29816. 0.2365],
  29817. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  29818. 0.4085],
  29819. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  29820. 0.1544],
  29821. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  29822. 0.3968],
  29823. [ 0.5697, -0.4706, 1.7976, -0.4884, -0.6433, 0.0081, 0.5878,
  29824. 0.1525],
  29825. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  29826. 0.1931],
  29827. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  29828. 0.0051],
  29829. [ 0.6040, -0.3614, 1.7672, -0.7001, -0.6404, -0.3768, 0.5778,
  29830. 0.3315]]], device='cuda:0')
  29831. loss_train_step before backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  29832. loss_train_step after backward: tensor(0.0253, device='cuda:0', grad_fn=<MseLossBackward>)
  29833. loss_train: 1.4732359643094242
  29834. step: 72
  29835. running loss: 0.02046161061540867
  29836.  
  29837. Train Steps: 72/90 Loss: 0.0205 torch.Size([8, 600, 800])
  29838. torch.Size([8, 8])
  29839. tensor([[0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  29840. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  29841. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  29842. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  29843. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  29844. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  29845. [0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  29846. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550]],
  29847. device='cuda:0', dtype=torch.float64)
  29848. predictions are: tensor([[ 0.2125, -0.6521, 1.6035, -0.3375, -0.4940, -1.0512, 0.1700, 0.4392],
  29849. [ 0.4755, -0.4858, 1.6933, -0.1396, -0.4665, -0.1380, 0.0999, 0.3121],
  29850. [ 0.2651, -0.6861, 1.6333, 0.4201, -0.4264, 0.0603, 0.8666, 0.2789],
  29851. [ 0.2776, -0.6162, 1.7169, -1.3630, 0.0578, -1.5248, 0.7481, 0.0741],
  29852. [ 0.3534, -0.6021, 1.8435, 0.1591, -0.1584, 0.1252, 0.5831, 0.2369],
  29853. [ 0.5017, -0.5179, 1.9070, -0.4184, -0.5838, -0.5517, 0.5219, -0.0068],
  29854. [ 0.4388, -0.5183, 1.0337, -1.3808, -0.4962, -1.1296, 0.3308, 0.2330],
  29855. [ 0.4061, -0.5370, 1.5350, -0.8161, -0.6444, -0.3295, 0.4475, 0.3008]],
  29856. device='cuda:0', grad_fn=<AddmmBackward>)
  29857. landmarks are: tensor([[[ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  29858. 0.3928],
  29859. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  29860. 0.3265],
  29861. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  29862. 0.1768],
  29863. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  29864. -0.0369],
  29865. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  29866. 0.1474],
  29867. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  29868. -0.0670],
  29869. [ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  29870. 0.2699],
  29871. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  29872. 0.2776]]], device='cuda:0')
  29873. loss_train_step before backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  29874. loss_train_step after backward: tensor(0.0192, device='cuda:0', grad_fn=<MseLossBackward>)
  29875. loss_train: 1.4924231390468776
  29876. step: 73
  29877. running loss: 0.020444152589683254
  29878. Train Steps: 73/90 Loss: 0.0204 torch.Size([8, 600, 800])
  29879. torch.Size([8, 8])
  29880. tensor([[0.6171, 0.4127, 0.8900, 0.4800, 0.4325, 0.5783, 0.5769, 0.5090],
  29881. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  29882. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  29883. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  29884. [0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  29885. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  29886. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  29887. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817]],
  29888. device='cuda:0', dtype=torch.float64)
  29889. predictions are: tensor([[ 0.4990, -0.3994, 1.8878, 0.1543, -0.1967, 0.2972, 0.2611, 0.1317],
  29890. [-2.5539, -2.4791, 1.3508, -0.8933, -0.3324, -1.1283, 0.5128, 0.2438],
  29891. [ 0.5593, -0.4488, 1.0732, -1.2685, -0.3754, -1.2378, 0.5518, 0.1295],
  29892. [ 0.4449, -0.4705, 1.3463, -0.9438, -0.6151, -0.6301, 0.4881, 0.1498],
  29893. [ 0.4011, -0.5055, 1.4918, -0.5525, -0.5540, -0.9145, 0.3074, 0.2244],
  29894. [ 0.5259, -0.4571, 1.8694, -0.2454, -0.5995, -0.1364, 0.5221, 0.1358],
  29895. [ 0.4467, -0.4976, 1.9176, 0.1158, -0.4520, 0.0610, 0.3982, 0.1398],
  29896. [ 0.4622, -0.4492, 1.5167, -0.7024, -0.1878, -1.1792, 0.4206, 0.3888]],
  29897. device='cuda:0', grad_fn=<AddmmBackward>)
  29898. landmarks are: tensor([[[ 0.5645, -0.3797, 1.8249, -0.0688, -0.2882, 0.3854, 0.3789,
  29899. 0.0652],
  29900. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  29901. 0.3007],
  29902. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  29903. 0.2468],
  29904. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  29905. 0.2237],
  29906. [ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  29907. 0.3087],
  29908. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  29909. 0.2083],
  29910. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  29911. 0.2237],
  29912. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  29913. 0.4008]]], device='cuda:0')
  29914. loss_train_step before backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  29915. loss_train_step after backward: tensor(0.0119, device='cuda:0', grad_fn=<MseLossBackward>)
  29916. loss_train: 1.5043019359000027
  29917. step: 74
  29918. running loss: 0.020328404539189226
  29919. Train Steps: 74/90 Loss: 0.0203 torch.Size([8, 600, 800])
  29920. torch.Size([8, 8])
  29921. tensor([[0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  29922. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882],
  29923. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  29924. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  29925. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  29926. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  29927. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  29928. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980]],
  29929. device='cuda:0', dtype=torch.float64)
  29930. predictions are: tensor([[ 0.7385, -0.2766, 1.7929, -0.4707, -0.3836, -0.8503, 0.2929, 0.5421],
  29931. [ 0.4394, -0.5178, 1.7771, 0.1945, -0.5874, -0.4860, 0.1179, 0.1616],
  29932. [ 0.5185, -0.4564, 1.5172, -0.9465, -0.5366, -0.9257, 0.4488, 0.1289],
  29933. [ 0.4509, -0.5212, 1.7735, -0.5872, -0.6069, -0.7674, 0.4284, 0.1717],
  29934. [ 0.3056, -0.6098, 1.1797, -1.4743, -0.5555, -1.1407, 0.5208, 0.0257],
  29935. [ 0.5038, -0.4859, 1.7634, 0.1764, -0.2746, 0.2542, 0.7511, 0.2093],
  29936. [-0.1378, -0.8732, 0.9934, -1.3726, -0.4818, -1.0837, 0.5299, 0.3079],
  29937. [ 0.3289, -0.6140, 1.8338, 0.0409, -0.2576, 0.1750, 0.2668, 0.0221]],
  29938. device='cuda:0', grad_fn=<AddmmBackward>)
  29939. landmarks are: tensor([[[ 6.0075e-01, -3.2925e-01, 1.7037e+00, -5.4611e-01, -4.1524e-01,
  29940. -8.3095e-01, 3.2339e-01, 3.9283e-01],
  29941. [ 5.3788e-01, -4.3580e-01, 1.7326e+00, 1.8522e-01, -6.0577e-01,
  29942. -5.4611e-01, 6.8408e-02, -3.0981e-02],
  29943. [ 5.7806e-01, -4.1286e-01, 1.4142e+00, -9.0574e-01, -5.1146e-01,
  29944. -9.9373e-01, 4.6205e-01, 1.0799e-01],
  29945. [ 5.7771e-01, -4.4157e-01, 1.7044e+00, -5.8275e-01, -5.9618e-01,
  29946. -8.3610e-01, 4.8621e-01, 1.9626e-01],
  29947. [ 5.6184e-01, -3.8945e-01, 1.2129e+00, -1.4853e+00, -5.1339e-01,
  29948. -1.0619e+00, 3.3778e-01, 7.7228e-02],
  29949. [ 6.0425e-01, -4.2731e-01, 1.6920e+00, 1.8595e-01, -2.7171e-01,
  29950. 1.4059e-01, 7.9965e-01, 1.0043e-01],
  29951. [ 6.1155e-01, -3.9238e-01, 1.0109e+00, -1.3005e+00, -4.3834e-01,
  29952. -1.0619e+00, 5.2009e-01, 3.1609e-01],
  29953. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  29954. 6.2048e-02, 1.8356e-01, 1.4106e-02]]], device='cuda:0')
  29955. loss_train_step before backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  29956. loss_train_step after backward: tensor(0.0201, device='cuda:0', grad_fn=<MseLossBackward>)
  29957. loss_train: 1.5244338628835976
  29958. step: 75
  29959. running loss: 0.020325784838447967
  29960. Train Steps: 75/90 Loss: 0.0203 torch.Size([8, 600, 800])
  29961. torch.Size([8, 8])
  29962. tensor([[ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  29963. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  29964. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  29965. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  29966. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  29967. [0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  29968. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  29969. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517]],
  29970. device='cuda:0', dtype=torch.float64)
  29971. predictions are: tensor([[-2.2324, -2.2225, 1.6292, -1.1904, 0.0917, -1.4040, 1.1599, 0.2829],
  29972. [ 0.7922, -0.2702, 1.3739, 0.1742, -0.5550, -0.2331, 0.7177, 0.3121],
  29973. [ 0.7121, -0.2939, 0.9677, -1.1365, -0.5669, -1.3134, 0.0549, 0.2373],
  29974. [ 0.8527, -0.2089, 1.8690, -0.2207, -0.6001, 0.2241, 0.3038, -0.0493],
  29975. [ 0.7100, -0.3023, 1.7268, 0.1583, -0.4271, 0.0640, 0.1201, 0.0194],
  29976. [ 0.7107, -0.2707, 1.5645, -0.6021, -0.6825, 0.0030, 0.3742, 0.1236],
  29977. [-2.0439, -2.0895, 1.1987, -1.0126, -0.5981, -1.1250, 0.1630, 0.2282],
  29978. [ 0.7303, -0.3029, 1.7606, -0.0840, -0.2595, -0.0316, 0.2301, 0.1367]],
  29979. device='cuda:0', grad_fn=<AddmmBackward>)
  29980. landmarks are: tensor([[[-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  29981. 0.2463],
  29982. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  29983. 0.3585],
  29984. [ 0.5448, -0.3859, 0.9242, -1.1466, -0.4152, -1.3005, 0.1910,
  29985. 0.2776],
  29986. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  29987. -0.0322],
  29988. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  29989. 0.0467],
  29990. [ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  29991. 0.0862],
  29992. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  29993. 0.3161],
  29994. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  29995. 0.2622]]], device='cuda:0')
  29996. loss_train_step before backward: tensor(0.0172, device='cuda:0', grad_fn=<MseLossBackward>)
  29997. loss_train_step after backward: tensor(0.0172, device='cuda:0', grad_fn=<MseLossBackward>)
  29998. loss_train: 1.5416146223433316
  29999. step: 76
  30000. running loss: 0.020284402925570152
  30001.  
  30002. Train Steps: 76/90 Loss: 0.0203 torch.Size([8, 600, 800])
  30003. torch.Size([8, 8])
  30004. tensor([[0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  30005. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  30006. [0.6101, 0.3977, 0.8550, 0.5667, 0.3862, 0.4417, 0.5128, 0.4869],
  30007. [0.6286, 0.4055, 0.9000, 0.4717, 0.3763, 0.4683, 0.7018, 0.5494],
  30008. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  30009. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  30010. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  30011. [0.6206, 0.4001, 0.8900, 0.3933, 0.3588, 0.3567, 0.5837, 0.5083]],
  30012. device='cuda:0', dtype=torch.float64)
  30013. predictions are: tensor([[-0.0093, -0.8159, 1.5997, -0.9410, -0.6810, -0.3697, 0.5364, 0.1780],
  30014. [ 0.4972, -0.5001, 1.7852, -0.1670, -0.4175, 0.0122, 0.3248, 0.1241],
  30015. [ 0.5981, -0.3969, 1.6569, 0.3041, -0.4702, -0.2394, 0.2030, 0.0229],
  30016. [ 0.5747, -0.4492, 1.8774, -0.2422, -0.5260, -0.1429, 1.0017, 0.2354],
  30017. [ 0.7515, -0.2731, 1.0945, -0.9634, -0.6238, -1.0175, 0.1457, 0.3325],
  30018. [ 0.5947, -0.4267, 1.8414, -0.3665, -0.3415, 0.1742, 0.4117, 0.1350],
  30019. [ 0.6684, -0.3270, 1.7121, 0.1320, -0.5190, -0.3264, 0.3048, 0.4452],
  30020. [ 0.4449, -0.5292, 1.8183, -0.6192, -0.6611, -0.6690, 0.3456, 0.0433]],
  30021. device='cuda:0', grad_fn=<AddmmBackward>)
  30022. landmarks are: tensor([[[ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  30023. 0.2391],
  30024. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  30025. 0.2035],
  30026. [ 0.5320, -0.4488, 1.6633, 0.3315, -0.5018, -0.2459, 0.0828,
  30027. -0.0370],
  30028. [ 0.6174, -0.4129, 1.8711, -0.1073, -0.5480, -0.1227, 0.9558,
  30029. 0.2516],
  30030. [ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  30031. 0.3931],
  30032. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  30033. 0.2545],
  30034. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  30035. 0.3084],
  30036. [ 0.5807, -0.4378, 1.8249, -0.4691, -0.6289, -0.6385, 0.4104,
  30037. 0.0620]]], device='cuda:0')
  30038. loss_train_step before backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  30039. loss_train_step after backward: tensor(0.0129, device='cuda:0', grad_fn=<MseLossBackward>)
  30040. loss_train: 1.5544648678041995
  30041. step: 77
  30042. running loss: 0.020187855426028564
  30043. Train Steps: 77/90 Loss: 0.0202 torch.Size([8, 600, 800])
  30044. torch.Size([8, 8])
  30045. tensor([[ nan, nan, 0.7268, 0.2333, 0.4125, 0.1933, 0.5112, 0.5383],
  30046. [0.6137, 0.4038, 0.8563, 0.4050, 0.3813, 0.2550, 0.5106, 0.4954],
  30047. [0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  30048. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  30049. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  30050. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  30051. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133],
  30052. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901]],
  30053. device='cuda:0', dtype=torch.float64)
  30054. predictions are: tensor([[-1.9846, -2.0517, 1.0544, -1.1034, -0.4659, -1.2181, 0.2361, 0.2311],
  30055. [ 0.6813, -0.3112, 1.6636, -0.3705, -0.5481, -0.9216, 0.0807, 0.0184],
  30056. [ 0.8089, -0.2280, 1.1881, -0.7429, -0.6169, -0.8958, 0.1599, 0.2940],
  30057. [-1.8478, -1.9572, 0.9084, -1.2993, -0.4090, -1.2715, 0.3189, 0.2186],
  30058. [ 0.6891, -0.3126, 1.0502, -1.2537, -0.5350, -0.9494, 0.4252, 0.2086],
  30059. [ 0.7851, -0.2646, 1.7832, 0.0043, -0.2070, 0.1093, 0.2041, 0.1600],
  30060. [ 0.7233, -0.3370, 1.8567, 0.0620, -0.4575, 0.3413, 0.8358, 0.1053],
  30061. [ 0.7289, -0.2822, 1.9100, -0.5723, -0.6314, -0.3930, 0.5902, 0.0267]],
  30062. device='cuda:0', grad_fn=<AddmmBackward>)
  30063. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 1.0712e+00, -1.2085e+00, -3.8060e-01,
  30064. -1.3929e+00, 7.5520e-02, 2.0062e-01],
  30065. [ 5.4850e-01, -4.2094e-01, 1.6691e+00, -4.1524e-01, -5.2494e-01,
  30066. -1.1081e+00, 7.2521e-02, 2.0831e-03],
  30067. [ 5.5484e-01, -3.9360e-01, 1.1634e+00, -8.1049e-01, -5.1917e-01,
  30068. -1.0696e+00, 2.3718e-01, 3.9307e-01],
  30069. [-2.2859e+00, -2.2859e+00, 7.2217e-01, -1.4930e+00, -3.9215e-01,
  30070. -1.3698e+00, 1.4038e-01, 1.3434e-01],
  30071. [ 5.3557e-01, -4.2171e-01, 1.0339e+00, -1.4776e+00, -5.0762e-01,
  30072. -1.1081e+00, 4.2194e-01, 2.8530e-01],
  30073. [ 5.3585e-01, -4.3703e-01, 1.7095e+00, -3.0331e-02, -8.0370e-02,
  30074. -3.8029e-02, 1.0439e-01, 3.3918e-01],
  30075. [ 5.9931e-01, -4.3453e-01, 1.7587e+00, 6.4079e-02, -3.9175e-01,
  30076. 2.0479e-01, 7.8274e-01, 8.5217e-02],
  30077. [ 6.0774e-01, -3.9646e-01, 1.8480e+00, -6.5389e-01, -6.2309e-01,
  30078. -4.5373e-01, 6.2155e-01, -2.1963e-02]]], device='cuda:0')
  30079. loss_train_step before backward: tensor(0.0198, device='cuda:0', grad_fn=<MseLossBackward>)
  30080. loss_train_step after backward: tensor(0.0198, device='cuda:0', grad_fn=<MseLossBackward>)
  30081. loss_train: 1.5742266257293522
  30082. step: 78
  30083. running loss: 0.020182392637555797
  30084. Train Steps: 78/90 Loss: 0.0202 torch.Size([8, 600, 800])
  30085. torch.Size([8, 8])
  30086. tensor([[0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  30087. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  30088. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  30089. [0.6286, 0.4040, 0.8696, 0.3047, 0.3924, 0.2887, 0.6300, 0.5367],
  30090. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808],
  30091. [0.6304, 0.4029, 0.8413, 0.5217, 0.4125, 0.5617, 0.7089, 0.5679],
  30092. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  30093. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250]],
  30094. device='cuda:0', dtype=torch.float64)
  30095. predictions are: tensor([[ 0.3673, -0.5634, 1.6359, -0.6539, -0.6386, -0.7926, 0.4197, 0.1037],
  30096. [ 0.7273, -0.2814, 1.7136, -0.3755, -0.6066, -0.4177, 0.0784, 0.1788],
  30097. [ 0.4522, -0.4597, 1.3317, -0.7944, -0.7027, -0.8624, -0.1578, 0.1287],
  30098. [ 0.5168, -0.4615, 1.5470, -0.9493, -0.4533, -0.9150, 0.5691, 0.2001],
  30099. [ 0.4989, -0.4498, 1.5476, -0.3193, -0.5839, -0.1889, 0.1756, 0.3494],
  30100. [ 0.5740, -0.4453, 1.6434, 0.0708, -0.4044, 0.3415, 0.9822, 0.2546],
  30101. [ 0.4685, -0.5086, 1.6151, 0.0564, -0.3354, 0.2027, 0.7280, 0.0913],
  30102. [ 0.3415, -0.5573, 1.7585, -0.8527, -0.4933, -0.7010, 0.5609, 0.1285]],
  30103. device='cuda:0', grad_fn=<AddmmBackward>)
  30104. landmarks are: tensor([[[ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  30105. 0.1963],
  30106. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  30107. 0.1852],
  30108. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  30109. 0.3220],
  30110. [ 0.6174, -0.4201, 1.7309, -0.8784, -0.4735, -0.9524, 0.6242,
  30111. 0.1931],
  30112. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  30113. 0.3968],
  30114. [ 0.6257, -0.4249, 1.5998, 0.1236, -0.3806, 0.3084, 0.9887,
  30115. 0.3371],
  30116. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  30117. 0.1004],
  30118. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  30119. 0.1390]]], device='cuda:0')
  30120. loss_train_step before backward: tensor(0.0083, device='cuda:0', grad_fn=<MseLossBackward>)
  30121. loss_train_step after backward: tensor(0.0083, device='cuda:0', grad_fn=<MseLossBackward>)
  30122. loss_train: 1.5825061020441353
  30123. step: 79
  30124. running loss: 0.020031722810685257
  30125. Train Steps: 79/90 Loss: 0.0200 torch.Size([8, 600, 800])
  30126. torch.Size([8, 8])
  30127. tensor([[0.6201, 0.4102, 0.7288, 0.2417, 0.4150, 0.2383, 0.6100, 0.5500],
  30128. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  30129. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  30130. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  30131. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  30132. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  30133. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  30134. [0.6099, 0.4030, 0.8638, 0.5117, 0.4983, 0.4965, 0.5086, 0.5388]],
  30135. device='cuda:0', dtype=torch.float64)
  30136. predictions are: tensor([[ 0.6953, -0.3039, 1.0919, -1.2795, -0.5539, -1.2303, 0.4363, 0.1660],
  30137. [ 0.6522, -0.3437, 1.6727, -0.4270, -0.6701, -0.1970, 0.1418, -0.0034],
  30138. [ 0.4385, -0.5066, 1.6041, 0.0371, -0.4771, 0.1611, 1.0337, 0.2570],
  30139. [ 0.6591, -0.3570, 1.7664, -0.3257, -0.6140, -0.1533, 0.2319, 0.1825],
  30140. [-1.6271, -1.8176, 1.2880, -1.0241, -0.5292, -1.1064, 0.1217, 0.2967],
  30141. [ 0.5874, -0.4156, 1.6548, 0.0828, -0.4626, 0.0553, 0.7523, 0.0670],
  30142. [ 0.7439, -0.2793, 1.7456, 0.1186, -0.5632, 0.0915, 0.3984, 0.1757],
  30143. [ 0.5422, -0.4143, 1.7436, -0.1030, -0.1236, -0.1744, 0.0474, 0.1065]],
  30144. device='cuda:0', grad_fn=<AddmmBackward>)
  30145. landmarks are: tensor([[[ 0.5784, -0.3913, 1.0801, -1.1697, -0.3691, -1.1851, 0.5316,
  30146. 0.2545],
  30147. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  30148. 0.0502],
  30149. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  30150. 0.3425],
  30151. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  30152. 0.3469],
  30153. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  30154. 0.3777],
  30155. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  30156. 0.1176],
  30157. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  30158. 0.3007],
  30159. [ 0.5309, -0.4246, 1.7037, 0.0774, 0.0158, 0.0075, 0.0635,
  30160. 0.2026]]], device='cuda:0')
  30161. loss_train_step before backward: tensor(0.0213, device='cuda:0', grad_fn=<MseLossBackward>)
  30162. loss_train_step after backward: tensor(0.0213, device='cuda:0', grad_fn=<MseLossBackward>)
  30163. loss_train: 1.603833228815347
  30164. step: 80
  30165. running loss: 0.020047915360191838
  30166.  
  30167. Train Steps: 80/90 Loss: 0.0200 torch.Size([8, 600, 800])
  30168. torch.Size([8, 8])
  30169. tensor([[0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  30170. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  30171. [0.6201, 0.4036, 0.8596, 0.3850, 0.3492, 0.3785, 0.5978, 0.5131],
  30172. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575],
  30173. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  30174. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  30175. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  30176. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208]],
  30177. device='cuda:0', dtype=torch.float64)
  30178. predictions are: tensor([[ 0.3734, -0.5190, 1.1472, -0.9185, -0.5289, -0.9328, 0.3290, 0.5005],
  30179. [ 0.1556, -0.7042, 1.3313, -1.2112, -0.4058, -0.9651, 0.7235, 0.1515],
  30180. [ 0.7030, -0.3688, 1.7134, -0.4899, -0.7348, -0.4037, 0.3331, 0.0598],
  30181. [ 0.4604, -0.5118, 1.8374, -0.4674, -0.5123, -0.5352, 0.8484, 0.2562],
  30182. [ 0.7388, -0.3145, 1.3714, -1.0121, -0.5813, -1.0120, 0.1488, 0.0172],
  30183. [ 0.5941, -0.3950, 1.7309, -0.0935, -0.3420, 0.1457, 0.3144, 0.1970],
  30184. [ 0.5540, -0.4376, 1.6098, 0.0253, -0.2959, 0.2028, 0.3435, 0.1415],
  30185. [ 0.2762, -0.6084, 1.4040, -0.9958, -0.4741, -1.0922, 0.3900, 0.0834]],
  30186. device='cuda:0', grad_fn=<AddmmBackward>)
  30187. landmarks are: tensor([[[ 5.6307e-01, -4.1286e-01, 1.2129e+00, -9.2333e-01, -4.1524e-01,
  30188. -1.0311e+00, 4.5658e-01, 5.6243e-01],
  30189. [ 6.1413e-01, -4.1527e-01, 1.4208e+00, -1.2697e+00, -2.9400e-01,
  30190. -1.0234e+00, 8.6439e-01, 1.7146e-01],
  30191. [ 5.7829e-01, -4.2163e-01, 1.6847e+00, -5.0778e-01, -6.7321e-01,
  30192. -5.3774e-01, 4.7523e-01, 8.3916e-02],
  30193. [ 6.1248e-01, -4.1527e-01, 1.8885e+00, -5.4611e-01, -5.1339e-01,
  30194. -6.5389e-01, 9.8137e-01, 2.8902e-01],
  30195. [ 5.7985e-01, -4.1555e-01, 1.3977e+00, -1.0388e+00, -4.6721e-01,
  30196. -1.1004e+00, 3.4688e-01, 1.0824e-01],
  30197. [ 5.6374e-01, -4.1432e-01, 1.7519e+00, -7.8656e-02, -3.0554e-01,
  30198. -1.4935e-02, 3.7575e-01, 3.0839e-01],
  30199. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  30200. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  30201. [ 5.8851e-01, -4.4288e-01, 1.4266e+00, -9.9261e-01, -4.3834e-01,
  30202. -1.2313e+00, 4.2276e-01, 1.1948e-01]]], device='cuda:0')
  30203. loss_train_step before backward: tensor(0.0144, device='cuda:0', grad_fn=<MseLossBackward>)
  30204. loss_train_step after backward: tensor(0.0144, device='cuda:0', grad_fn=<MseLossBackward>)
  30205. loss_train: 1.6182256652973592
  30206. step: 81
  30207. running loss: 0.01997809463330073
  30208. Train Steps: 81/90 Loss: 0.0200 torch.Size([8, 600, 800])
  30209. torch.Size([8, 8])
  30210. tensor([[0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  30211. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  30212. [0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  30213. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  30214. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  30215. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  30216. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  30217. [0.6293, 0.4097, 0.8800, 0.2517, 0.5262, 0.2600, 0.7430, 0.5378]],
  30218. device='cuda:0', dtype=torch.float64)
  30219. predictions are: tensor([[ 0.2903, -0.5904, 1.3713, -1.2827, -0.1585, -1.3888, 0.3519, 0.0815],
  30220. [ 0.3774, -0.5230, 1.1499, -0.9511, -0.7478, -0.5249, 0.2670, 0.2296],
  30221. [ 0.6424, -0.3445, 1.6242, -0.1800, -0.6430, 0.0166, 0.1866, 0.3549],
  30222. [ 0.3907, -0.5244, 1.1680, -1.1063, -0.3419, -1.1686, 0.3648, 0.2469],
  30223. [ 0.7197, -0.3552, 1.6134, 0.0642, -0.4562, 0.1645, 0.5280, 0.1403],
  30224. [ 0.5325, -0.4282, 1.7349, -0.4375, -0.4583, -1.1334, 0.2133, 0.0699],
  30225. [ 0.4556, -0.5406, 1.7986, -0.2391, -0.6904, 0.2913, 0.8318, 0.1297],
  30226. [ 0.4897, -0.4823, 1.6821, -1.0455, 0.0482, -1.0562, 0.9698, 0.2569]],
  30227. device='cuda:0', grad_fn=<AddmmBackward>)
  30228. landmarks are: tensor([[[ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  30229. -0.0369],
  30230. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  30231. 0.2545],
  30232. [ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  30233. 0.3161],
  30234. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  30235. 0.2083],
  30236. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  30237. 0.1627],
  30238. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  30239. -0.0529],
  30240. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  30241. 0.1715],
  30242. [ 0.6207, -0.3936, 1.7788, -1.1235, 0.1448, -1.0850, 1.1459,
  30243. 0.1982]]], device='cuda:0')
  30244. loss_train_step before backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  30245. loss_train_step after backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  30246. loss_train: 1.6365177757106721
  30247. step: 82
  30248. running loss: 0.019957533850130146
  30249. Train Steps: 82/90 Loss: 0.0200 torch.Size([8, 600, 800])
  30250. torch.Size([8, 8])
  30251. tensor([[0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  30252. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  30253. [0.6230, 0.4113, 0.7213, 0.1983, 0.4325, 0.2367, 0.6262, 0.5400],
  30254. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  30255. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  30256. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  30257. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  30258. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933]],
  30259. device='cuda:0', dtype=torch.float64)
  30260. predictions are: tensor([[ 0.8619, -0.2506, 1.5938, 0.1987, -0.4249, 0.2109, 0.7913, 0.0299],
  30261. [ 0.8644, -0.2650, 1.7133, -0.0653, -0.5711, -0.0539, 0.4279, -0.0110],
  30262. [ 0.7838, -0.2591, 1.1059, -1.2509, -0.3135, -1.1064, 0.5907, 0.2126],
  30263. [ 0.8056, -0.2161, 1.6969, 0.2063, -0.5404, -0.2532, 0.2598, 0.3049],
  30264. [-2.0843, -2.1210, 1.6906, -1.1510, 0.0211, -1.1015, 0.7819, 0.1954],
  30265. [ 0.7208, -0.2959, 1.2570, -1.1981, -0.3980, -0.8894, 0.5388, 0.1905],
  30266. [ 0.8011, -0.2003, 1.7396, -0.2197, -0.6043, -0.5010, 0.2048, 0.3001],
  30267. [-1.8934, -1.9678, 0.8566, -1.1885, -0.4570, -1.1944, 0.0053, 0.2951]],
  30268. device='cuda:0', grad_fn=<AddmmBackward>)
  30269. landmarks are: tensor([[[ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  30270. 0.1176],
  30271. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  30272. -0.0534],
  30273. [ 0.5917, -0.3861, 1.0455, -1.3698, -0.2882, -1.1928, 0.6067,
  30274. 0.2083],
  30275. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  30276. 0.3084],
  30277. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  30278. 0.2783],
  30279. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  30280. 0.2776],
  30281. [ 0.6058, -0.3216, 1.8423, -0.2536, -0.5885, -0.6000, 0.3353,
  30282. 0.3777],
  30283. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  30284. 0.4543]]], device='cuda:0')
  30285. loss_train_step before backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  30286. loss_train_step after backward: tensor(0.0177, device='cuda:0', grad_fn=<MseLossBackward>)
  30287. loss_train: 1.654198335018009
  30288. step: 83
  30289. running loss: 0.019930100421903723
  30290. Train Steps: 83/90 Loss: 0.0199 torch.Size([8, 600, 800])
  30291. torch.Size([8, 8])
  30292. tensor([[0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  30293. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  30294. [0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  30295. [0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  30296. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  30297. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  30298. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  30299. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266]],
  30300. device='cuda:0', dtype=torch.float64)
  30301. predictions are: tensor([[ 0.5667, -0.4106, 1.5669, 0.2542, -0.3283, -0.3381, 0.2532, 0.4962],
  30302. [ 0.4737, -0.5161, 1.7973, -0.2878, -0.4420, 0.0469, 1.0790, 0.2255],
  30303. [ 0.5542, -0.4182, 1.7720, -0.4122, -0.4295, 0.0192, 0.5208, 0.1936],
  30304. [ 0.6322, -0.4009, 1.6925, -0.2425, -0.4987, -0.1369, 0.4719, 0.3256],
  30305. [ 0.5740, -0.4672, 1.5395, 0.3276, -0.4665, 0.0108, 0.5626, -0.0387],
  30306. [ 0.6924, -0.3483, 1.8122, -0.8088, -0.3993, -1.0986, 0.6015, 0.1548],
  30307. [ 0.6318, -0.3645, 1.6522, -0.8129, -0.5442, -0.8673, 0.1077, -0.0085],
  30308. [ 0.2982, -0.5549, 1.0625, -1.3172, -0.2534, -1.1064, 0.5091, 0.5923]],
  30309. device='cuda:0', grad_fn=<AddmmBackward>)
  30310. landmarks are: tensor([[[ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  30311. 0.4624],
  30312. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  30313. 0.2302],
  30314. [ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  30315. 0.1775],
  30316. [ 0.5763, -0.3963, 1.7788, -0.0765, -0.6520, -0.0842, 0.4624,
  30317. 0.2776],
  30318. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  30319. -0.1385],
  30320. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  30321. 0.1544],
  30322. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  30323. -0.0340],
  30324. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  30325. 0.6084]]], device='cuda:0')
  30326. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  30327. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  30328. loss_train: 1.6629118216224015
  30329. step: 84
  30330. running loss: 0.01979656930502859
  30331.  
  30332. Train Steps: 84/90 Loss: 0.0198 torch.Size([8, 600, 800])
  30333. torch.Size([8, 8])
  30334. tensor([[0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  30335. [0.6223, 0.4028, 0.8988, 0.4200, 0.3763, 0.5733, 0.6375, 0.5167],
  30336. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617],
  30337. [0.6083, 0.3957, 0.8638, 0.4950, 0.4363, 0.5083, 0.5346, 0.4980],
  30338. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  30339. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  30340. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  30341. [0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915]],
  30342. device='cuda:0', dtype=torch.float64)
  30343. predictions are: tensor([[ 0.6178, -0.4126, 1.6719, -0.2266, -0.2874, 0.0123, 0.7712, 0.1822],
  30344. [ 0.6737, -0.3681, 1.8302, -0.4825, -0.5582, 0.3299, 0.8426, 0.1744],
  30345. [ 0.4683, -0.4485, 1.6903, 0.0651, -0.5430, -0.3624, 0.4358, 0.4397],
  30346. [ 0.4677, -0.5152, 1.6872, -0.1683, -0.3159, 0.0394, 0.3376, 0.0098],
  30347. [ 0.4362, -0.4553, 1.5300, 0.2041, -0.3977, -0.2993, 0.3835, 0.5141],
  30348. [ 0.7591, -0.2939, 1.3000, -1.4181, -0.0185, -1.6864, 0.5949, 0.1079],
  30349. [ 0.4794, -0.4698, 1.6591, -0.1646, -0.1904, -0.1011, 0.2546, 0.4571],
  30350. [ 0.5885, -0.4134, 1.8501, -0.3274, -0.6333, -0.8266, 0.6597, 0.0587]],
  30351. device='cuda:0', grad_fn=<AddmmBackward>)
  30352. landmarks are: tensor([[[ 5.8284e-01, -4.6823e-01, 1.7031e+00, -4.9668e-02, -2.4581e-01,
  30353. 8.1770e-02, 6.3811e-01, 1.4745e-01],
  30354. [ 5.8857e-01, -4.2525e-01, 1.8654e+00, -3.4596e-01, -5.4804e-01,
  30355. 3.6228e-01, 6.5866e-01, 1.0054e-01],
  30356. [ 5.8972e-01, -3.5273e-01, 1.8018e+00, 2.5450e-01, -5.3072e-01,
  30357. -3.2286e-01, 3.1224e-01, 3.0839e-01],
  30358. [ 5.2379e-01, -4.5797e-01, 1.7037e+00, 4.6189e-04, -2.7090e-01,
  30359. 6.2048e-02, 1.8356e-01, 1.4106e-02],
  30360. [ 5.8360e-01, -3.6490e-01, 1.7210e+00, 3.8537e-01, -3.9792e-01,
  30361. -2.9207e-01, 3.0647e-01, 4.4696e-01],
  30362. [ 5.9994e-01, -4.2363e-01, 1.2880e+00, -1.4083e+00, -6.3048e-02,
  30363. -1.6393e+00, 4.5840e-01, -2.0790e-02],
  30364. [ 5.5000e-01, -4.0600e-01, 1.7326e+00, 2.3557e-02, -1.5543e-01,
  30365. -2.2633e-02, 1.4385e-01, 4.1710e-01],
  30366. [ 6.1484e-01, -3.9184e-01, 1.8942e+00, -1.9199e-01, -5.4226e-01,
  30367. -8.0015e-01, 6.4140e-01, -1.5569e-02]]], device='cuda:0')
  30368. loss_train_step before backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  30369. loss_train_step after backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  30370. loss_train: 1.6722815376706421
  30371. step: 85
  30372. running loss: 0.019673900443184025
  30373. Train Steps: 85/90 Loss: 0.0197 torch.Size([8, 600, 800])
  30374. torch.Size([8, 8])
  30375. tensor([[0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  30376. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  30377. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  30378. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  30379. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  30380. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  30381. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  30382. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350]],
  30383. device='cuda:0', dtype=torch.float64)
  30384. predictions are: tensor([[ 0.5126, -0.3980, 1.1951, -0.8997, 0.0626, -1.4429, 0.3967, 0.6447],
  30385. [ 0.2296, -0.6835, 1.7541, -0.0746, -0.3331, 0.0221, 0.4547, 0.1091],
  30386. [ 0.6355, -0.3560, 1.8110, -0.0143, -0.5147, -0.2400, 0.4765, 0.4517],
  30387. [ 0.7565, -0.2948, 1.8072, -0.3907, -0.2909, 0.1811, 0.6384, 0.2877],
  30388. [ 0.8373, -0.2884, 1.7138, 0.2233, -0.4457, -0.0877, 0.8785, 0.0349],
  30389. [ 0.7473, -0.3367, 1.7696, 0.1339, -0.5059, -0.2661, 0.7932, 0.0021],
  30390. [ 0.4635, -0.4734, 1.6943, -0.5987, -0.5666, -0.5225, 0.3460, 0.1546],
  30391. [ 0.3809, -0.5535, 1.7622, -0.1957, -0.4246, -0.2758, 0.3063, 0.2153]],
  30392. device='cuda:0', grad_fn=<AddmmBackward>)
  30393. landmarks are: tensor([[[ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  30394. 0.5624],
  30395. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  30396. -0.0168],
  30397. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  30398. 0.3161],
  30399. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  30400. 0.2314],
  30401. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  30402. -0.0049],
  30403. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  30404. -0.0102],
  30405. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  30406. 0.0862],
  30407. [ 0.5513, -0.4467, 1.7095, -0.0303, -0.4788, -0.2921, 0.1692,
  30408. 0.1854]]], device='cuda:0')
  30409. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  30410. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  30411. loss_train: 1.686103314626962
  30412. step: 86
  30413. running loss: 0.019605852495662348
  30414. Train Steps: 86/90 Loss: 0.0196 torch.Size([8, 600, 800])
  30415. torch.Size([8, 8])
  30416. tensor([[0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  30417. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  30418. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  30419. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  30420. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317],
  30421. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  30422. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  30423. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550]],
  30424. device='cuda:0', dtype=torch.float64)
  30425. predictions are: tensor([[ 0.7564, -0.2589, 1.8650, -0.5441, -0.1607, -1.1702, 0.7058, 0.0304],
  30426. [ 0.8369, -0.2295, 1.6265, 0.1115, -0.1178, 0.0394, 0.4619, 0.3338],
  30427. [ 0.8468, -0.2518, 1.6333, -0.1932, -0.5100, -0.3991, 0.6418, 0.2949],
  30428. [-1.7919, -1.9164, 1.2644, -0.9980, -0.3826, -0.9792, 0.2770, 0.2354],
  30429. [ 0.7303, -0.2999, 1.2405, -1.0710, -0.2661, -1.0750, 0.7384, 0.1537],
  30430. [ 0.7327, -0.2754, 1.6966, -0.0502, -0.5937, -0.4542, 0.3500, 0.1744],
  30431. [-2.0738, -2.0970, 1.5829, -1.1729, 0.1751, -1.2038, 0.8197, 0.2315],
  30432. [ 0.7515, -0.2552, 1.3871, -0.7542, -0.4840, -0.8544, 0.2894, 0.1536]],
  30433. device='cuda:0', grad_fn=<AddmmBackward>)
  30434. landmarks are: tensor([[[ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  30435. 0.0171],
  30436. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  30437. 0.4239],
  30438. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  30439. 0.2853],
  30440. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  30441. 0.3007],
  30442. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  30443. 0.1698],
  30444. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  30445. 0.2071],
  30446. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  30447. 0.3104],
  30448. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  30449. 0.2776]]], device='cuda:0')
  30450. loss_train_step before backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  30451. loss_train_step after backward: tensor(0.0267, device='cuda:0', grad_fn=<MseLossBackward>)
  30452. loss_train: 1.7128123142756522
  30453. step: 87
  30454. running loss: 0.01968749786523738
  30455. Train Steps: 87/90 Loss: 0.0197 torch.Size([8, 600, 800])
  30456. torch.Size([8, 8])
  30457. tensor([[0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  30458. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  30459. [0.6075, 0.4007, 0.8275, 0.4917, 0.4050, 0.5100, 0.5167, 0.5280],
  30460. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  30461. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392],
  30462. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  30463. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  30464. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167]],
  30465. device='cuda:0', dtype=torch.float64)
  30466. predictions are: tensor([[ 5.6286e-01, -4.0666e-01, 1.1249e+00, -9.1667e-01, -4.4478e-01,
  30467. -9.4364e-01, 4.9949e-01, 3.6532e-01],
  30468. [ 4.0523e-01, -5.1145e-01, 1.8993e+00, 9.8369e-02, -4.8307e-01,
  30469. -4.0015e-01, 6.8296e-01, 2.3447e-01],
  30470. [ 4.5955e-01, -4.7740e-01, 1.6666e+00, -1.6434e-02, -2.6750e-01,
  30471. 5.4508e-02, 3.1240e-01, 1.9984e-01],
  30472. [ 2.8139e-01, -6.2768e-01, 2.0158e+00, -5.1398e-01, -2.0669e-01,
  30473. -1.3062e+00, 6.4697e-01, 7.9610e-03],
  30474. [ 5.3721e-01, -4.3750e-01, 1.7832e+00, 2.9688e-01, -2.3398e-01,
  30475. -1.2247e-03, 2.8872e-01, 1.9452e-01],
  30476. [ 6.6184e-01, -4.0100e-01, 1.3221e+00, -1.2418e+00, -4.3192e-01,
  30477. -9.4730e-01, 6.9494e-01, 1.1958e-01],
  30478. [ 5.3418e-01, -4.0369e-01, 1.3463e+00, -5.7753e-01, -5.9096e-01,
  30479. -5.4382e-01, 4.0242e-01, 4.7178e-01],
  30480. [ 5.9500e-01, -4.2295e-01, 1.4109e+00, -1.1970e+00, -6.6504e-02,
  30481. -1.4813e+00, 6.5024e-01, 1.0265e-01]], device='cuda:0',
  30482. grad_fn=<AddmmBackward>)
  30483. landmarks are: tensor([[[ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  30484. 0.3315],
  30485. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  30486. 0.2545],
  30487. [ 0.5200, -0.4353, 1.5363, -0.0149, -0.4152, 0.0697, 0.1005,
  30488. 0.1530],
  30489. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  30490. -0.0529],
  30491. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  30492. 0.2048],
  30493. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  30494. 0.0562],
  30495. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  30496. 0.4036],
  30497. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  30498. 0.1005]]], device='cuda:0')
  30499. loss_train_step before backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  30500. loss_train_step after backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  30501. loss_train: 1.7306391117163002
  30502. step: 88
  30503. running loss: 0.019666353542230685
  30504.  
  30505. Train Steps: 88/90 Loss: 0.0197 torch.Size([8, 600, 800])
  30506. torch.Size([8, 8])
  30507. tensor([[0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  30508. [0.6031, 0.3986, 0.7462, 0.2833, 0.3638, 0.2717, 0.5253, 0.4726],
  30509. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  30510. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  30511. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  30512. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  30513. [0.6304, 0.4024, 0.8925, 0.4800, 0.3937, 0.4817, 0.7485, 0.5297],
  30514. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038]],
  30515. device='cuda:0', dtype=torch.float64)
  30516. predictions are: tensor([[ 0.6136, -0.3292, 1.7236, 0.2335, -0.3311, 0.0264, 0.4263, 0.2954],
  30517. [ 0.6881, -0.2870, 1.2374, -1.0072, -0.4346, -1.1297, 0.2528, 0.0145],
  30518. [ 0.5846, -0.4008, 1.6797, 0.3026, -0.3951, -0.1516, 0.7463, 0.1915],
  30519. [ 0.4226, -0.4940, 1.8812, -0.1699, -0.2164, -0.4229, 0.9591, 0.3326],
  30520. [ 0.6220, -0.3374, 1.7867, 0.2923, -0.3024, -0.1980, 0.3742, 0.3229],
  30521. [-2.1704, -2.2239, 1.4709, -0.8261, -0.5161, -0.9168, 0.2164, 0.1590],
  30522. [ 0.6821, -0.3473, 1.7859, -0.0876, -0.3812, -0.1809, 0.9278, 0.1667],
  30523. [ 0.6349, -0.3336, 1.7291, -0.1699, -0.1123, -0.1446, 0.1518, 0.0453]],
  30524. device='cuda:0', grad_fn=<AddmmBackward>)
  30525. landmarks are: tensor([[[ 5.7625e-01, -3.8397e-01, 1.7268e+00, 2.6220e-01, -4.2102e-01,
  30526. 1.3133e-01, 4.2771e-01, 3.0069e-01],
  30527. [ 4.9971e-01, -4.4465e-01, 1.1610e+00, -9.7721e-01, -6.0577e-01,
  30528. -1.0311e+00, 1.4038e-01, -1.0312e-01],
  30529. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  30530. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  30531. [ 6.4542e-01, -3.7194e-01, 1.9115e+00, -1.3041e-01, -5.0762e-01,
  30532. -2.8437e-01, 1.0033e+00, 4.3864e-01],
  30533. [ 5.8834e-01, -3.5935e-01, 1.7557e+00, 2.5450e-01, -4.1524e-01,
  30534. -6.1124e-02, 3.3533e-01, 3.0069e-01],
  30535. [-2.2859e+00, -2.2859e+00, 1.5767e+00, -7.5396e-01, -6.4042e-01,
  30536. -7.3087e-01, 1.7534e-01, 8.9251e-02],
  30537. [ 6.2566e-01, -4.2731e-01, 1.8365e+00, -6.8822e-02, -4.6721e-01,
  30538. -6.1124e-02, 1.1715e+00, 1.6077e-01],
  30539. [ 5.2494e-01, -4.4734e-01, 1.7326e+00, -9.1917e-02, -2.0162e-01,
  30540. 1.5443e-01, 1.7328e-01, 4.1158e-02]]], device='cuda:0')
  30541. loss_train_step before backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  30542. loss_train_step after backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  30543. loss_train: 1.7420769152231514
  30544. step: 89
  30545. running loss: 0.019573897923855634
  30546. Train Steps: 89/90 Loss: 0.0196 torch.Size([8, 600, 800])
  30547. torch.Size([8, 8])
  30548. tensor([[0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  30549. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  30550. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  30551. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  30552. [0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  30553. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  30554. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  30555. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006]],
  30556. device='cuda:0', dtype=torch.float64)
  30557. predictions are: tensor([[ 0.4671, -0.5049, 1.8774, -0.1466, -0.0864, -0.0608, 0.2093, 0.0941],
  30558. [ 0.5628, -0.4053, 0.9370, -1.2464, -0.2642, -1.3898, 0.2510, 0.3911],
  30559. [ 0.7089, -0.3867, 1.8857, -0.3630, -0.5566, -0.5843, 0.7402, 0.1295],
  30560. [ 0.5594, -0.4493, 1.9432, -0.0785, -0.3768, 0.2006, 1.0250, 0.2871],
  30561. [ 0.0606, -0.7394, 1.5011, -0.7235, -0.4577, -1.0457, 0.0626, 0.1358],
  30562. [ 0.7851, -0.2815, 1.9567, -0.1113, -0.4422, 0.0439, 0.6305, 0.0925],
  30563. [ 0.4946, -0.4309, 1.6859, 0.3787, -0.4591, -0.5892, 0.3183, 0.4996],
  30564. [ 0.5189, -0.5028, 1.7568, 0.4543, -0.5045, -0.1441, 0.6245, 0.0330]],
  30565. device='cuda:0', grad_fn=<AddmmBackward>)
  30566. landmarks are: tensor([[[ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  30567. 0.0051],
  30568. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  30569. 0.3808],
  30570. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  30571. 0.0697],
  30572. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  30573. 0.2035],
  30574. [ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  30575. 0.2138],
  30576. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  30577. 0.1313],
  30578. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  30579. 0.4778],
  30580. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  30581. 0.0261]]], device='cuda:0')
  30582. loss_train_step before backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  30583. loss_train_step after backward: tensor(0.0123, device='cuda:0', grad_fn=<MseLossBackward>)
  30584. loss_train: 1.7543703555129468
  30585. step: 90
  30586. running loss: 0.019493003950143854
  30587. Valid Steps: 10/10 Loss: nan 3.8413
  30588. --------------------------------------------------
  30589. Epoch: 8 Train Loss: 0.0195 Valid Loss: nan
  30590. --------------------------------------------------
  30591. size of train loader is: 90
  30592. torch.Size([8, 600, 800])
  30593. torch.Size([8, 8])
  30594. tensor([[0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  30595. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  30596. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  30597. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  30598. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  30599. [0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  30600. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  30601. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495]],
  30602. device='cuda:0', dtype=torch.float64)
  30603. predictions are: tensor([[ 0.6140, -0.3871, 1.6023, -0.7491, -0.5414, -0.3933, 0.5851, 0.2746],
  30604. [ 0.5138, -0.4631, 1.5303, -0.9427, -0.4560, -1.2151, 0.2397, 0.0554],
  30605. [ 0.4892, -0.4673, 1.4873, -0.7423, -0.5505, -0.9114, 0.4542, 0.1094],
  30606. [ 0.6205, -0.3850, 1.7838, -0.1074, -0.5529, -0.0047, 0.3428, 0.1468],
  30607. [ 0.6016, -0.4252, 1.7565, 0.4326, -0.3560, -0.1970, 0.4493, 0.1951],
  30608. [ 0.7335, -0.3303, 1.8009, 0.5891, -0.5046, -0.0271, 0.7923, 0.1182],
  30609. [-0.4382, -1.0592, 1.7135, -1.0684, 0.3674, -1.3955, 0.8355, 0.2889],
  30610. [ 0.4659, -0.4597, 1.1708, -0.8018, -0.5448, -0.9428, 0.1353, 0.3279]],
  30611. device='cuda:0', grad_fn=<AddmmBackward>)
  30612. landmarks are: tensor([[[ 5.7991e-01, -4.0985e-01, 1.5651e+00, -1.0465e+00, -5.8845e-01,
  30613. -3.0747e-01, 6.4134e-01, 1.3903e-01],
  30614. [ 5.7985e-01, -4.1555e-01, 1.3977e+00, -1.0388e+00, -4.6721e-01,
  30615. -1.1004e+00, 3.4688e-01, 1.0824e-01],
  30616. [ 5.4769e-01, -4.4126e-01, 1.3688e+00, -8.7714e-01, -6.1155e-01,
  30617. -8.7714e-01, 4.1039e-01, 4.6651e-02],
  30618. [ 4.9740e-01, -4.4819e-01, 1.6633e+00, -3.3056e-01, -6.1732e-01,
  30619. 1.3133e-01, 2.9255e-01, 8.0947e-03],
  30620. [ 5.7800e-01, -4.5651e-01, 1.6221e+00, 2.5323e-01, -3.7281e-01,
  30621. -1.7182e-01, 4.3570e-01, 2.0910e-01],
  30622. [ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  30623. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  30624. [ 6.4871e-01, -3.7916e-01, 1.6344e+00, -1.0850e+00, 2.6592e-01,
  30625. -1.5397e+00, 8.0590e-01, 2.7299e-01],
  30626. [ 5.4417e-01, -3.8545e-01, 1.0224e+00, -9.5412e-01, -6.1155e-01,
  30627. -9.2333e-01, 1.7452e-01, 2.5215e-01]]], device='cuda:0')
  30628. loss_train_step before backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  30629. loss_train_step after backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  30630. loss_train: 0.035023126751184464
  30631. step: 1
  30632. running loss: 0.035023126751184464
  30633. Train Steps: 1/90 Loss: 0.0350 torch.Size([8, 600, 800])
  30634. torch.Size([8, 8])
  30635. tensor([[ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  30636. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  30637. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  30638. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  30639. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  30640. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683],
  30641. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  30642. [0.6289, 0.4081, 0.8720, 0.3487, 0.3900, 0.3183, 0.6703, 0.5376]],
  30643. device='cuda:0', dtype=torch.float64)
  30644. predictions are: tensor([[-1.5893, -1.8049, 1.6660, -0.9662, 0.1232, -1.2444, 0.7696, 0.2287],
  30645. [ 0.6649, -0.2618, 1.4795, -0.3987, -0.1274, -1.2144, 0.1891, 0.4023],
  30646. [ 0.8279, -0.1916, 1.8551, -0.5088, -0.6687, -0.4753, 0.5482, -0.0837],
  30647. [ 0.6262, -0.3445, 1.6581, 0.1843, -0.3398, 0.0883, 0.3233, 0.1184],
  30648. [-2.2111, -2.2507, 0.9937, -1.0590, -0.2451, -1.3357, 0.2370, 0.3124],
  30649. [ 0.7010, -0.3028, 1.0150, -1.1334, -0.4862, -1.0880, 0.4025, 0.2193],
  30650. [ 0.6674, -0.3327, 1.6469, 0.4851, -0.5619, 0.0573, 0.2066, 0.0539],
  30651. [ 0.6414, -0.3664, 1.7301, -0.4614, -0.4897, -0.7804, 0.7746, 0.1199]],
  30652. device='cuda:0', grad_fn=<AddmmBackward>)
  30653. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 1.7210e+00, -9.7721e-01, 1.8522e-01,
  30654. -1.3698e+00, 7.9859e-01, 3.1039e-01],
  30655. [ 6.2367e-01, -2.9831e-01, 1.3919e+00, -4.6913e-01, -4.5727e-02,
  30656. -1.2313e+00, 2.4525e-01, 5.8821e-01],
  30657. [ 6.0774e-01, -3.9646e-01, 1.8480e+00, -6.5389e-01, -6.2309e-01,
  30658. -4.5373e-01, 6.2155e-01, -2.1963e-02],
  30659. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  30660. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  30661. [-2.2859e+00, -2.2859e+00, 7.1062e-01, -1.4468e+00, -2.8822e-01,
  30662. -1.4237e+00, 2.4296e-01, 3.6228e-01],
  30663. [ 5.7182e-01, -3.9053e-01, 1.0053e+00, -1.3305e+00, -4.6143e-01,
  30664. -1.1235e+00, 4.4503e-01, 3.3918e-01],
  30665. [ 5.0785e-01, -4.7144e-01, 1.6575e+00, 2.2371e-01, -4.9607e-01,
  30666. 7.7444e-02, 1.4655e-01, -1.0613e-01],
  30667. [ 6.1907e-01, -4.0082e-01, 1.7420e+00, -6.7528e-01, -4.8453e-01,
  30668. -8.1555e-01, 8.1006e-01, 1.9744e-01]]], device='cuda:0')
  30669. loss_train_step before backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  30670. loss_train_step after backward: tensor(0.0246, device='cuda:0', grad_fn=<MseLossBackward>)
  30671. loss_train: 0.05961088836193085
  30672. step: 2
  30673. running loss: 0.029805444180965424
  30674.  
  30675. Train Steps: 2/90 Loss: 0.0298 torch.Size([8, 600, 800])
  30676. torch.Size([8, 8])
  30677. tensor([[0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  30678. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  30679. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  30680. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  30681. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  30682. [0.6141, 0.4038, 0.8650, 0.4833, 0.4839, 0.5176, 0.5787, 0.5600],
  30683. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  30684. [0.6113, 0.4006, 0.8700, 0.5350, 0.3638, 0.3767, 0.5097, 0.4882]],
  30685. device='cuda:0', dtype=torch.float64)
  30686. predictions are: tensor([[ 0.3977, -0.5190, 1.6397, 0.2275, -0.4261, 0.0427, 0.1332, 0.2363],
  30687. [ 0.5997, -0.4350, 1.6313, 0.4328, -0.5913, -0.0857, 0.5645, -0.0069],
  30688. [ 0.7061, -0.3038, 1.7128, -0.8875, -0.1318, -1.3337, 0.5031, 0.0823],
  30689. [ 0.4596, -0.4776, 1.4336, -1.1474, -0.1885, -1.2794, 0.5792, 0.2321],
  30690. [ 0.5913, -0.3999, 1.4971, -0.7091, -0.7462, -0.3909, 0.3259, 0.3171],
  30691. [ 0.2882, -0.5980, 1.6730, -0.0155, -0.1775, 0.0260, 0.2027, 0.3243],
  30692. [ 0.4600, -0.5590, 1.9039, -0.2497, -0.3810, -0.9030, 1.0014, 0.1673],
  30693. [ 0.2536, -0.6194, 1.6788, 0.1859, -0.7088, -0.5439, 0.0605, 0.0532]],
  30694. device='cuda:0', grad_fn=<AddmmBackward>)
  30695. landmarks are: tensor([[[ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  30696. 0.2522],
  30697. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  30698. -0.0049],
  30699. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  30700. 0.0051],
  30701. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  30702. 0.2083],
  30703. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  30704. 0.2391],
  30705. [ 0.5505, -0.4207, 1.7095, -0.0534, -0.0509, 0.1050, 0.3873,
  30706. 0.3007],
  30707. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  30708. 0.2142],
  30709. [ 0.5379, -0.4358, 1.7326, 0.1852, -0.6058, -0.5461, 0.0684,
  30710. -0.0310]]], device='cuda:0')
  30711. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  30712. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  30713. loss_train: 0.06913623213768005
  30714. step: 3
  30715. running loss: 0.023045410712560017
  30716. Train Steps: 3/90 Loss: 0.0230 torch.Size([8, 600, 800])
  30717. torch.Size([8, 8])
  30718. tensor([[0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  30719. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  30720. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456],
  30721. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  30722. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  30723. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  30724. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  30725. [0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103]],
  30726. device='cuda:0', dtype=torch.float64)
  30727. predictions are: tensor([[ 0.7372, -0.2586, 1.7167, 0.3747, -0.4748, -0.1449, 0.4796, 0.0674],
  30728. [ 0.8608, -0.2171, 1.2050, -1.0956, -0.1502, -1.5177, 0.4047, 0.2153],
  30729. [ 0.5684, -0.3655, 1.4035, -0.4764, -0.7140, -0.4578, 0.2291, 0.2330],
  30730. [-1.4736, -1.7437, 1.6607, -1.0372, 0.2038, -1.3720, 0.9044, 0.2716],
  30731. [-2.0843, -2.1717, 1.3421, -0.6876, -0.6274, -0.8590, 0.1328, 0.2106],
  30732. [ 0.6394, -0.3625, 1.4053, -0.7157, -0.6669, -0.7526, 0.3336, 0.1017],
  30733. [ 0.7157, -0.3242, 1.5919, 0.4262, -0.4433, -0.1878, 0.3655, 0.0658],
  30734. [ 0.7816, -0.2302, 1.8276, -0.3053, -0.6136, -0.1140, 0.3521, 0.0361]],
  30735. device='cuda:0', grad_fn=<AddmmBackward>)
  30736. landmarks are: tensor([[[ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  30737. 0.2391],
  30738. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  30739. 0.2006],
  30740. [ 0.5444, -0.3852, 1.3786, -0.5409, -0.6924, -0.4229, 0.1791,
  30741. 0.2341],
  30742. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  30743. 0.3104],
  30744. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  30745. 0.2837],
  30746. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  30747. 0.0942],
  30748. [ 0.5891, -0.4550, 1.5132, 0.3546, -0.3691, -0.1535, 0.3815,
  30749. 0.1467],
  30750. [ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  30751. 0.0712]]], device='cuda:0')
  30752. loss_train_step before backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  30753. loss_train_step after backward: tensor(0.0222, device='cuda:0', grad_fn=<MseLossBackward>)
  30754. loss_train: 0.0913512222468853
  30755. step: 4
  30756. running loss: 0.022837805561721325
  30757. Train Steps: 4/90 Loss: 0.0228 torch.Size([8, 600, 800])
  30758. torch.Size([8, 8])
  30759. tensor([[0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  30760. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  30761. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  30762. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  30763. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  30764. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  30765. [0.6332, 0.4128, 0.9200, 0.3517, 0.4400, 0.3833, 0.7461, 0.5494],
  30766. [0.6182, 0.3998, 0.8793, 0.4191, 0.3552, 0.4285, 0.6038, 0.5312]],
  30767. device='cuda:0', dtype=torch.float64)
  30768. predictions are: tensor([[ 0.3963, -0.5111, 1.5654, -0.2544, -0.6555, -0.8049, -0.0029, 0.2036],
  30769. [ 0.6896, -0.3829, 1.4768, -0.9736, -0.0825, -1.4334, 0.5826, 0.1867],
  30770. [ 0.5362, -0.5103, 1.6700, 0.3681, -0.4911, -0.0497, 0.4941, 0.1507],
  30771. [ 0.2169, -0.6776, 1.1213, -0.8193, -0.6600, -0.8720, 0.0790, 0.0277],
  30772. [ 0.5976, -0.4572, 1.3894, -1.2061, -0.0525, -1.4916, 0.4835, 0.0843],
  30773. [ 0.4290, -0.4816, 1.7752, -0.1858, -0.6380, -0.3565, 0.2010, 0.2168],
  30774. [ 0.3762, -0.6093, 1.8550, -0.4568, -0.4097, -0.4039, 1.0037, 0.2467],
  30775. [ 0.5470, -0.4521, 1.7105, -0.2674, -0.6784, -0.2623, 0.4499, 0.1900]],
  30776. device='cuda:0', grad_fn=<AddmmBackward>)
  30777. landmarks are: tensor([[[ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  30778. 0.2116],
  30779. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  30780. 0.0851],
  30781. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  30782. 0.1979],
  30783. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  30784. 0.0141],
  30785. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  30786. -0.0530],
  30787. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  30788. 0.1852],
  30789. [ 0.6388, -0.3792, 1.9635, -0.6616, -0.2536, -0.5153, 1.1605,
  30790. 0.2516],
  30791. [ 0.5697, -0.4393, 1.7754, -0.3503, -0.6453, -0.3067, 0.5028,
  30792. 0.1677]]], device='cuda:0')
  30793. loss_train_step before backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  30794. loss_train_step after backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  30795. loss_train: 0.10337931476533413
  30796. step: 5
  30797. running loss: 0.020675862953066827
  30798. Train Steps: 5/90 Loss: 0.0207 torch.Size([8, 600, 800])
  30799. torch.Size([8, 8])
  30800. tensor([[0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  30801. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  30802. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695],
  30803. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  30804. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  30805. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098],
  30806. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  30807. [0.6209, 0.3920, 0.8650, 0.5367, 0.4400, 0.5067, 0.6025, 0.4950]],
  30808. device='cuda:0', dtype=torch.float64)
  30809. predictions are: tensor([[ 0.5466, -0.4835, 1.6164, -0.6194, -0.7410, -0.6682, 0.3838, 0.1722],
  30810. [ 0.4471, -0.5391, 1.2867, -0.9394, -0.5697, -1.0218, 0.1520, 0.2237],
  30811. [ 0.1865, -0.6866, 0.8140, -1.0698, -0.4618, -1.3994, -0.0308, 0.2866],
  30812. [ 0.4823, -0.4738, 1.8417, -0.0641, -0.4494, 0.1759, 0.4307, 0.3456],
  30813. [ 0.5742, -0.4413, 1.7019, -0.8798, -0.3884, -1.1352, 0.6841, 0.1134],
  30814. [ 0.5016, -0.4895, 1.7512, 0.0568, -0.5928, 0.0645, 0.3931, 0.1011],
  30815. [ 0.5847, -0.4574, 1.7197, -0.7646, -0.0677, -1.3968, 0.8645, 0.1314],
  30816. [ 0.3921, -0.5961, 1.7098, 0.3133, -0.3360, 0.0101, 0.3127, -0.0480]],
  30817. device='cuda:0', grad_fn=<AddmmBackward>)
  30818. landmarks are: tensor([[[ 5.6801e-01, -4.3934e-01, 1.5920e+00, -6.6715e-01, -6.4527e-01,
  30819. -5.4566e-01, 5.1492e-01, 1.7534e-01],
  30820. [ 5.3204e-01, -4.1886e-01, 1.3053e+00, -1.0773e+00, -5.7113e-01,
  30821. -9.8491e-01, 2.2674e-01, 3.2370e-01],
  30822. [ 5.5445e-01, -4.1332e-01, 8.1455e-01, -1.2082e+00, -4.2679e-01,
  30823. -1.3544e+00, 1.2208e-01, 3.4458e-01],
  30824. [ 5.7719e-01, -3.9130e-01, 1.8480e+00, -2.4588e-01, -4.3256e-01,
  30825. 1.9292e-01, 5.3741e-01, 4.7005e-01],
  30826. [ 6.0837e-01, -4.0762e-01, 1.6806e+00, -9.6182e-01, -2.9977e-01,
  30827. -9.6952e-01, 6.3557e-01, 1.4673e-01],
  30828. [ 5.4660e-01, -4.7064e-01, 1.7198e+00, -9.0292e-02, -5.7125e-01,
  30829. 1.2613e-01, 4.7328e-01, 6.8827e-02],
  30830. [ 6.5201e-01, -3.9120e-01, 1.7095e+00, -9.0793e-01, -2.8406e-02,
  30831. -1.3621e+00, 8.0956e-01, 2.3558e-01],
  30832. [ 5.8199e-01, -4.7544e-01, 1.7095e+00, 1.9292e-01, -2.5358e-01,
  30833. 5.4350e-02, 4.9700e-01, 4.6189e-04]]], device='cuda:0')
  30834. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  30835. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  30836. loss_train: 0.11402785126119852
  30837. step: 6
  30838. running loss: 0.01900464187686642
  30839.  
  30840. Train Steps: 6/90 Loss: 0.0190 torch.Size([8, 600, 800])
  30841. torch.Size([8, 8])
  30842. tensor([[0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  30843. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  30844. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  30845. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  30846. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  30847. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  30848. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  30849. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268]],
  30850. device='cuda:0', dtype=torch.float64)
  30851. predictions are: tensor([[ 0.5891, -0.3890, 1.6729, 0.2073, -0.4570, -0.8302, 0.3594, 0.4329],
  30852. [ 0.4704, -0.4707, 1.7011, -0.0808, -0.2426, -0.0565, 0.0563, 0.1839],
  30853. [ 0.4041, -0.5540, 1.0145, -1.2279, -0.3703, -1.4565, 0.2284, -0.0221],
  30854. [ 0.5034, -0.4659, 1.5339, -0.5810, -0.6889, -0.4715, 0.2772, 0.1573],
  30855. [ 0.5466, -0.4884, 1.7959, -0.1409, -0.5534, -0.4282, 0.8416, 0.0456],
  30856. [ 0.6808, -0.3508, 1.6525, -0.6522, -0.6313, -0.4027, 0.3507, 0.0792],
  30857. [-2.1821, -2.2742, 1.3833, -0.8228, -0.5880, -1.0219, 0.2936, 0.2045],
  30858. [ 0.6380, -0.4148, 1.7247, -0.0332, -0.2073, 0.0171, 0.6617, 0.0978]],
  30859. device='cuda:0', grad_fn=<AddmmBackward>)
  30860. landmarks are: tensor([[[ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  30861. 0.5612],
  30862. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  30863. 0.4032],
  30864. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  30865. -0.0580],
  30866. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  30867. 0.2365],
  30868. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  30869. 0.1715],
  30870. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  30871. 0.0802],
  30872. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  30873. 0.2699],
  30874. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  30875. 0.1474]]], device='cuda:0')
  30876. loss_train_step before backward: tensor(0.0065, device='cuda:0', grad_fn=<MseLossBackward>)
  30877. loss_train_step after backward: tensor(0.0065, device='cuda:0', grad_fn=<MseLossBackward>)
  30878. loss_train: 0.12055541574954987
  30879. step: 7
  30880. running loss: 0.017222202249935696
  30881. Train Steps: 7/90 Loss: 0.0172 torch.Size([8, 600, 800])
  30882. torch.Size([8, 8])
  30883. tensor([[0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  30884. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  30885. [0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  30886. [0.6135, 0.3994, 0.7913, 0.3050, 0.3625, 0.3050, 0.5837, 0.5050],
  30887. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  30888. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  30889. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  30890. [0.6198, 0.4130, 0.8762, 0.4117, 0.3650, 0.4900, 0.5707, 0.5103]],
  30891. device='cuda:0', dtype=torch.float64)
  30892. predictions are: tensor([[ 0.6121, -0.4770, 1.8885, 0.0605, -0.6429, -0.2336, 0.6899, 0.0278],
  30893. [ 0.7454, -0.3639, 1.0604, -1.3949, -0.4047, -1.2772, 0.4862, 0.2483],
  30894. [ 0.2872, -0.6198, 1.6279, -0.3692, -0.5507, -0.2969, 0.1379, 0.3256],
  30895. [ 0.3327, -0.6100, 1.4320, -0.9929, -0.6452, -0.9560, 0.4174, 0.0762],
  30896. [ 0.7374, -0.3535, 1.6367, 0.2674, -0.6135, -0.4852, 0.2430, 0.1632],
  30897. [ 0.5788, -0.5004, 1.6847, 0.2857, -0.3745, -0.2482, 0.4787, 0.2059],
  30898. [ 0.5147, -0.4656, 1.8758, -0.2675, -0.1389, 0.0108, 0.3955, 0.3097],
  30899. [ 0.5872, -0.4207, 1.8811, -0.4503, -0.5698, -0.2127, 0.3556, 0.0867]],
  30900. device='cuda:0', grad_fn=<AddmmBackward>)
  30901. landmarks are: tensor([[[ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  30902. 0.0111],
  30903. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  30904. 0.2468],
  30905. [ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  30906. 0.3265],
  30907. [ 0.5477, -0.4413, 1.3688, -0.8771, -0.6115, -0.8771, 0.4104,
  30908. 0.0467],
  30909. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  30910. 0.1982],
  30911. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  30912. 0.1313],
  30913. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  30914. 0.2699],
  30915. [ 0.5771, -0.3784, 1.7614, -0.3844, -0.6000, -0.0226, 0.3501,
  30916. 0.0712]]], device='cuda:0')
  30917. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  30918. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  30919. loss_train: 0.1300251130014658
  30920. step: 8
  30921. running loss: 0.016253139125183225
  30922. Train Steps: 8/90 Loss: 0.0163 torch.Size([8, 600, 800])
  30923. torch.Size([8, 8])
  30924. tensor([[0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  30925. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  30926. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  30927. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  30928. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  30929. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841],
  30930. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  30931. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320]],
  30932. device='cuda:0', dtype=torch.float64)
  30933. predictions are: tensor([[ 0.5256, -0.4524, 1.7984, 0.1450, -0.4289, -0.0788, 0.2589, 0.3393],
  30934. [ 0.4977, -0.4804, 1.3995, -1.0820, -0.5870, -1.0135, 0.3227, 0.1081],
  30935. [ 0.6630, -0.3975, 1.3779, -1.1074, -0.6264, -1.1621, 0.1380, -0.0220],
  30936. [ 0.5724, -0.4312, 1.7310, -0.1963, -0.0846, -0.1130, 0.1525, 0.2617],
  30937. [ 0.7592, -0.3167, 1.5519, 0.1764, -0.6423, -0.4017, 0.1510, 0.1811],
  30938. [ 0.4704, -0.5583, 1.8519, -0.4481, -0.4448, -0.6366, 0.9631, 0.3323],
  30939. [ 0.4849, -0.5122, 1.7827, -0.0995, -0.3785, 0.1170, 0.3145, 0.1204],
  30940. [ 0.3807, -0.6192, 1.7006, 0.0377, -0.5237, 0.0271, 0.9367, 0.1956]],
  30941. device='cuda:0', grad_fn=<AddmmBackward>)
  30942. landmarks are: tensor([[[ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  30943. 0.3007],
  30944. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  30945. 0.1080],
  30946. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  30947. -0.0220],
  30948. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  30949. 0.3392],
  30950. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  30951. 0.1982],
  30952. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  30953. 0.4119],
  30954. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  30955. 0.0390],
  30956. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  30957. 0.1715]]], device='cuda:0')
  30958. loss_train_step before backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  30959. loss_train_step after backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  30960. loss_train: 0.14171226508915424
  30961. step: 9
  30962. running loss: 0.015745807232128248
  30963. Train Steps: 9/90 Loss: 0.0157 torch.Size([8, 600, 800])
  30964. torch.Size([8, 8])
  30965. tensor([[0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  30966. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  30967. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402],
  30968. [0.6100, 0.4071, 0.7601, 0.3444, 0.3400, 0.4117, 0.5625, 0.5617],
  30969. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  30970. [0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  30971. [0.6118, 0.4052, 0.8463, 0.3917, 0.3538, 0.3450, 0.5053, 0.5593],
  30972. [0.6317, 0.4038, 0.8287, 0.5900, 0.3800, 0.4717, 0.6295, 0.4986]],
  30973. device='cuda:0', dtype=torch.float64)
  30974. predictions are: tensor([[ 0.5621, -0.4350, 1.8083, -0.7072, -0.6060, -0.3735, 0.3713, 0.1477],
  30975. [-0.2548, -0.9666, 0.9694, -1.2713, -0.2514, -1.5026, 0.2285, 0.4129],
  30976. [ 0.5501, -0.4866, 1.7867, 0.1286, -0.3355, -0.1685, 0.5161, 0.1942],
  30977. [ 0.5518, -0.4300, 1.3952, -0.7849, -0.7246, -0.3439, 0.2739, 0.2838],
  30978. [ 0.6204, -0.4182, 1.1728, -1.2457, -0.4112, -1.0753, 0.5919, 0.3851],
  30979. [ 0.7153, -0.3850, 1.8950, 0.1854, -0.4805, -0.2747, 0.6471, -0.0912],
  30980. [ 0.5189, -0.4356, 1.7161, -0.5475, -0.5983, -0.7178, -0.0889, 0.2347],
  30981. [ 0.6597, -0.4147, 1.7465, 0.3388, -0.5111, -0.1052, 0.6238, 0.0331]],
  30982. device='cuda:0', grad_fn=<AddmmBackward>)
  30983. landmarks are: tensor([[[ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  30984. 0.0802],
  30985. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  30986. 0.3700],
  30987. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  30988. 0.2091],
  30989. [ 0.5318, -0.4056, 1.2249, -0.6949, -0.7155, -0.3844, 0.3122,
  30990. 0.3084],
  30991. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  30992. 0.3854],
  30993. [ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  30994. -0.0102],
  30995. [ 0.5399, -0.4142, 1.6229, -0.4768, -0.6520, -0.6924, 0.0481,
  30996. 0.2972],
  30997. [ 0.6320, -0.4206, 1.5420, 0.4393, -0.5307, -0.1073, 0.6216,
  30998. 0.0171]]], device='cuda:0')
  30999. loss_train_step before backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  31000. loss_train_step after backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  31001. loss_train: 0.16252397932112217
  31002. step: 10
  31003. running loss: 0.016252397932112216
  31004.  
  31005. Train Steps: 10/90 Loss: 0.0163 torch.Size([8, 600, 800])
  31006. torch.Size([8, 8])
  31007. tensor([[0.6257, 0.4060, 0.8300, 0.2333, 0.4688, 0.2583, 0.7050, 0.5633],
  31008. [0.6022, 0.3994, 0.8025, 0.3350, 0.3350, 0.4400, 0.5565, 0.5025],
  31009. [0.6289, 0.4081, 0.8720, 0.3487, 0.3900, 0.3183, 0.6703, 0.5376],
  31010. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  31011. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  31012. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  31013. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  31014. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717]],
  31015. device='cuda:0', dtype=torch.float64)
  31016. predictions are: tensor([[ 0.4952, -0.5065, 1.6989, -1.0779, -0.1564, -1.1010, 0.9690, 0.3485],
  31017. [ 0.2338, -0.6378, 1.5139, -0.6089, -0.7161, -0.2372, 0.2462, 0.1252],
  31018. [ 0.4851, -0.5297, 1.8211, -0.5048, -0.4673, -0.7272, 0.9266, 0.2146],
  31019. [ 0.4475, -0.4619, 1.8858, -0.2298, -0.6026, -0.3046, 0.2469, 0.2047],
  31020. [ 0.6366, -0.3988, 1.3170, -1.0641, -0.1947, -1.3048, 0.4453, 0.1899],
  31021. [ 0.4931, -0.4868, 1.0749, -1.0042, -0.5348, -0.9385, 0.0530, 0.0562],
  31022. [ 0.4666, -0.4832, 1.4160, -1.0601, -0.1922, -1.2653, 0.4001, 0.2308],
  31023. [ 0.6729, -0.3513, 0.8831, -1.0201, -0.5309, -0.9789, 0.1976, 0.2888]],
  31024. device='cuda:0', grad_fn=<AddmmBackward>)
  31025. landmarks are: tensor([[[ 0.6042, -0.4105, 1.5478, -1.2082, -0.1208, -1.0927, 0.9704,
  31026. 0.3157],
  31027. [ 0.4956, -0.4413, 1.4208, -0.7386, -0.7386, -0.2536, 0.2843,
  31028. 0.0351],
  31029. [ 0.6191, -0.4008, 1.7420, -0.6753, -0.4845, -0.8156, 0.8101,
  31030. 0.1974],
  31031. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  31032. 0.1852],
  31033. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  31034. 0.2083],
  31035. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  31036. 0.0802],
  31037. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  31038. 0.1850],
  31039. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  31040. 0.3546]]], device='cuda:0')
  31041. loss_train_step before backward: tensor(0.0092, device='cuda:0', grad_fn=<MseLossBackward>)
  31042. loss_train_step after backward: tensor(0.0092, device='cuda:0', grad_fn=<MseLossBackward>)
  31043. loss_train: 0.1717460323125124
  31044. step: 11
  31045. running loss: 0.015613275664773855
  31046. Train Steps: 11/90 Loss: 0.0156 torch.Size([8, 600, 800])
  31047. torch.Size([8, 8])
  31048. tensor([[ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  31049. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  31050. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  31051. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  31052. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  31053. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  31054. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  31055. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455]],
  31056. device='cuda:0', dtype=torch.float64)
  31057. predictions are: tensor([[-2.1810, -2.2031, 0.8995, -1.0844, -0.4663, -1.2910, 0.0934, 0.3814],
  31058. [ 0.4687, -0.4924, 1.8094, -0.1270, -0.4819, 0.2563, 0.5449, 0.1873],
  31059. [ 0.4851, -0.4925, 1.7876, -0.3265, -0.6856, -0.1683, 0.4772, 0.1175],
  31060. [ 0.7273, -0.2978, 0.9829, -1.2828, -0.4788, -1.0173, 0.3975, 0.2628],
  31061. [ 0.4733, -0.5219, 1.8115, -0.5131, -0.3404, -0.8316, 0.9798, 0.1113],
  31062. [ 0.9110, -0.2001, 1.4314, -1.2082, -0.0286, -1.5178, 0.5554, 0.0304],
  31063. [ 0.4506, -0.4711, 1.7314, 0.1099, -0.3668, -0.0410, 0.1666, 0.2598],
  31064. [ 0.4830, -0.4528, 1.1680, -0.8904, -0.5668, -0.7985, 0.3129, 0.1844]],
  31065. device='cuda:0', grad_fn=<AddmmBackward>)
  31066. landmarks are: tensor([[[-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  31067. 0.4543],
  31068. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  31069. 0.1449],
  31070. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  31071. -0.0099],
  31072. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  31073. 0.2853],
  31074. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  31075. 0.1821],
  31076. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  31077. -0.0369],
  31078. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  31079. 0.2589],
  31080. [ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  31081. 0.2335]]], device='cuda:0')
  31082. loss_train_step before backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  31083. loss_train_step after backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  31084. loss_train: 0.18051145039498806
  31085. step: 12
  31086. running loss: 0.015042620866249004
  31087. Train Steps: 12/90 Loss: 0.0150 torch.Size([8, 600, 800])
  31088. torch.Size([8, 8])
  31089. tensor([[0.6193, 0.4034, 0.7757, 0.2347, 0.3733, 0.2919, 0.5930, 0.4926],
  31090. [0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  31091. [0.6296, 0.4045, 0.9138, 0.4100, 0.4232, 0.4242, 0.7422, 0.5297],
  31092. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  31093. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  31094. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  31095. [0.6286, 0.4060, 0.9188, 0.4333, 0.3675, 0.4167, 0.7034, 0.5528],
  31096. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567]],
  31097. device='cuda:0', dtype=torch.float64)
  31098. predictions are: tensor([[ 0.5929, -0.3831, 1.1603, -1.3763, -0.5561, -0.9755, 0.1903, 0.0160],
  31099. [ 0.5210, -0.4703, 1.7357, -0.5514, -0.6131, -0.5008, 0.5070, 0.1872],
  31100. [ 0.7239, -0.3509, 1.8028, -0.5375, -0.4470, -0.3079, 0.8961, 0.2300],
  31101. [ 0.6579, -0.3626, 1.6936, 0.0632, -0.4777, 0.0678, 0.5938, 0.2176],
  31102. [ 0.5153, -0.4594, 1.7896, -0.2423, -0.6064, -0.4672, 0.4889, 0.1511],
  31103. [ 0.6139, -0.3908, 1.5405, 0.1031, -0.4729, -0.2208, 0.2265, 0.2722],
  31104. [ 0.6588, -0.3622, 1.8513, -0.3756, -0.4461, -0.3094, 0.7993, 0.3618],
  31105. [ 0.6246, -0.3740, 1.5466, 0.2366, -0.1276, 0.0130, 0.1270, 0.3720]],
  31106. device='cuda:0', grad_fn=<AddmmBackward>)
  31107. landmarks are: tensor([[[ 0.5746, -0.4225, 1.2968, -1.2019, -0.5615, -0.9374, 0.4533,
  31108. -0.0108],
  31109. [ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  31110. 0.0697],
  31111. [ 0.6224, -0.4177, 1.9346, -0.3921, -0.3314, -0.3264, 1.1422,
  31112. 0.1608],
  31113. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  31114. 0.1385],
  31115. [ 0.6372, -0.4129, 1.8942, -0.0765, -0.6173, -0.4768, 0.6999,
  31116. 0.0325],
  31117. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  31118. 0.2075],
  31119. [ 0.6174, -0.4105, 1.9577, -0.2844, -0.5885, -0.3614, 0.9631,
  31120. 0.2676],
  31121. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  31122. 0.2853]]], device='cuda:0')
  31123. loss_train_step before backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  31124. loss_train_step after backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  31125. loss_train: 0.19325176812708378
  31126. step: 13
  31127. running loss: 0.01486552062516029
  31128. Train Steps: 13/90 Loss: 0.0149 torch.Size([8, 600, 800])
  31129. torch.Size([8, 8])
  31130. tensor([[0.6249, 0.4138, 0.9038, 0.4517, 0.3862, 0.4917, 0.6138, 0.5333],
  31131. [0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  31132. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  31133. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  31134. [0.6350, 0.4144, 0.9250, 0.4100, 0.4125, 0.3750, 0.7129, 0.5945],
  31135. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  31136. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  31137. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933]],
  31138. device='cuda:0', dtype=torch.float64)
  31139. predictions are: tensor([[ 0.6185, -0.3156, 1.8265, -0.3126, -0.4726, 0.0292, 0.3994, 0.2266],
  31140. [ 0.5336, -0.3887, 0.9285, -1.1986, -0.5366, -0.9300, 0.0476, 0.2809],
  31141. [ 0.6409, -0.3765, 1.4790, 0.1583, -0.4156, -0.0975, 0.8417, 0.2170],
  31142. [ 0.4891, -0.4365, 1.8433, -0.1204, -0.5106, -0.2830, 0.4545, 0.1341],
  31143. [ 0.7050, -0.3099, 1.9224, -0.4509, -0.2300, -0.5580, 0.9066, 0.3912],
  31144. [ 0.6713, -0.3561, 1.7889, 0.0174, -0.5189, -0.1541, 0.5659, 0.0518],
  31145. [ 0.6875, -0.3242, 1.5716, 0.2427, -0.3745, 0.0493, 0.6705, 0.1036],
  31146. [-1.9622, -2.0539, 1.0842, -1.0704, -0.5110, -1.1750, -0.0437, 0.3613]],
  31147. device='cuda:0', grad_fn=<AddmmBackward>)
  31148. landmarks are: tensor([[[ 0.6003, -0.3747, 1.8885, -0.1997, -0.5018, -0.0149, 0.5490,
  31149. 0.1775],
  31150. [ 0.5049, -0.4428, 0.8692, -0.9581, -0.6693, -0.8386, 0.0897,
  31151. 0.2589],
  31152. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  31153. 0.2356],
  31154. [ 0.6096, -0.4046, 1.8249, -0.0072, -0.6115, -0.3537, 0.6182,
  31155. 0.0928],
  31156. [ 0.6471, -0.3719, 1.9866, -0.3921, -0.3806, -0.5538, 1.0070,
  31157. 0.4600],
  31158. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  31159. 0.0111],
  31160. [ 0.6569, -0.3960, 1.5651, 0.4162, -0.4614, 0.0774, 0.7438,
  31161. 0.1447],
  31162. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  31163. 0.4543]]], device='cuda:0')
  31164. loss_train_step before backward: tensor(0.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  31165. loss_train_step after backward: tensor(0.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  31166. loss_train: 0.20368763711303473
  31167. step: 14
  31168. running loss: 0.014549116936645337
  31169.  
  31170. Train Steps: 14/90 Loss: 0.0145 torch.Size([8, 600, 800])
  31171. torch.Size([8, 8])
  31172. tensor([[0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  31173. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  31174. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  31175. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  31176. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  31177. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  31178. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  31179. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064]],
  31180. device='cuda:0', dtype=torch.float64)
  31181. predictions are: tensor([[ 0.5511, -0.4068, 1.7669, -0.1467, -0.6737, -0.4046, 0.2705, 0.1262],
  31182. [ 0.6452, -0.3602, 1.3157, -1.0661, -0.3160, -1.2657, 0.7119, 0.1955],
  31183. [ 0.4112, -0.5618, 1.8742, -0.2422, -0.5652, 0.0540, 1.0783, 0.2086],
  31184. [ 0.6926, -0.3282, 1.0094, -1.2379, -0.4402, -1.1454, 0.4859, 0.2555],
  31185. [ 0.5699, -0.3966, 1.7770, -0.0380, -0.3195, 0.3987, 0.6858, 0.2068],
  31186. [ 0.6017, -0.3589, 1.3299, -1.0885, -0.2723, -1.3584, 0.3951, 0.2467],
  31187. [ 0.4981, -0.4629, 1.3449, -0.8999, -0.6521, -0.7340, 0.4934, 0.2876],
  31188. [ 0.5636, -0.4064, 1.6784, 0.0822, -0.1191, 0.0233, 0.1590, 0.1523]],
  31189. device='cuda:0', grad_fn=<AddmmBackward>)
  31190. landmarks are: tensor([[[ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  31191. 0.0774],
  31192. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  31193. 0.1917],
  31194. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  31195. 0.1715],
  31196. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  31197. 0.2468],
  31198. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  31199. 0.0928],
  31200. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  31201. 0.1850],
  31202. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  31203. 0.1931],
  31204. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  31205. 0.0532]]], device='cuda:0')
  31206. loss_train_step before backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  31207. loss_train_step after backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  31208. loss_train: 0.20982471108436584
  31209. step: 15
  31210. running loss: 0.013988314072291057
  31211. Train Steps: 15/90 Loss: 0.0140 torch.Size([8, 600, 800])
  31212. torch.Size([8, 8])
  31213. tensor([[0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  31214. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  31215. [0.6261, 0.4131, 0.8938, 0.3550, 0.4000, 0.2683, 0.6188, 0.5283],
  31216. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  31217. [0.6314, 0.4050, 0.8227, 0.5431, 0.4150, 0.5517, 0.7121, 0.5690],
  31218. [0.6092, 0.4001, 0.8638, 0.4867, 0.4288, 0.5367, 0.5484, 0.5064],
  31219. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  31220. [0.6161, 0.4055, 0.8675, 0.3867, 0.3713, 0.4033, 0.5195, 0.5162]],
  31221. device='cuda:0', dtype=torch.float64)
  31222. predictions are: tensor([[ 0.6932, -0.3002, 0.9223, -1.2076, -0.4446, -1.2456, 0.4461, 0.3540],
  31223. [ 0.7345, -0.2983, 1.7527, -0.1153, -0.1353, 0.1659, 0.6014, 0.3645],
  31224. [ 0.7010, -0.3145, 1.8317, -0.7354, -0.5536, -1.0791, 0.7113, 0.1254],
  31225. [ 0.5710, -0.4561, 1.6580, 0.2129, -0.4870, -0.0747, 0.8136, 0.0383],
  31226. [ 0.5815, -0.4396, 1.5620, 0.1961, -0.4041, 0.2234, 1.1959, 0.3494],
  31227. [ 0.4783, -0.4605, 1.6568, -0.0696, -0.3142, 0.1620, 0.2832, 0.1092],
  31228. [ 0.4819, -0.4050, 1.6976, -0.2870, -0.5468, -0.2685, 0.1350, 0.3684],
  31229. [ 0.4149, -0.4674, 1.7142, -0.4944, -0.6656, -0.4889, 0.2146, 0.0351]],
  31230. device='cuda:0', grad_fn=<AddmmBackward>)
  31231. landmarks are: tensor([[[ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  31232. 0.2622],
  31233. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  31234. 0.2237],
  31235. [ 0.6062, -0.3778, 1.8423, -0.6462, -0.4383, -1.0465, 0.5721,
  31236. 0.1544],
  31237. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  31238. 0.0697],
  31239. [ 0.6306, -0.4153, 1.5141, 0.2224, -0.3691, 0.2622, 1.0033,
  31240. 0.3425],
  31241. [ 0.5278, -0.4377, 1.7037, -0.0380, -0.3055, 0.1929, 0.2473,
  31242. 0.0532],
  31243. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  31244. 0.4145],
  31245. [ 0.5598, -0.4129, 1.7210, -0.4999, -0.5711, -0.4229, 0.1136,
  31246. 0.0983]]], device='cuda:0')
  31247. loss_train_step before backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  31248. loss_train_step after backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  31249. loss_train: 0.21596113871783018
  31250. step: 16
  31251. running loss: 0.013497571169864386
  31252. Train Steps: 16/90 Loss: 0.0135 torch.Size([8, 600, 800])
  31253. torch.Size([8, 8])
  31254. tensor([[ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  31255. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  31256. [0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  31257. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  31258. [0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  31259. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301],
  31260. [0.6274, 0.4003, 0.8638, 0.5967, 0.3688, 0.4900, 0.6108, 0.4661],
  31261. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114]],
  31262. device='cuda:0', dtype=torch.float64)
  31263. predictions are: tensor([[-1.4391e+00, -1.7195e+00, 1.6965e+00, -8.3241e-01, -7.4165e-03,
  31264. -1.2388e+00, 9.2158e-01, 4.8889e-01],
  31265. [ 6.7004e-01, -2.8881e-01, 1.7075e+00, -1.5896e-01, -6.4548e-01,
  31266. -2.0172e-01, 4.7335e-01, 2.4208e-01],
  31267. [ 5.9918e-01, -3.3162e-01, 1.6278e+00, -2.1823e-01, -2.4393e-01,
  31268. 1.9002e-01, 4.4332e-01, 2.2739e-01],
  31269. [ 6.2093e-01, -3.1903e-01, 1.6007e+00, -6.1591e-01, -6.5189e-01,
  31270. -1.0654e-01, 3.2741e-01, 1.7108e-01],
  31271. [ 6.0972e-01, -3.6531e-01, 1.7034e+00, 2.6776e-03, -4.8217e-01,
  31272. -6.0080e-01, 8.8999e-01, 2.6616e-01],
  31273. [ 5.8475e-01, -4.0440e-01, 1.6300e+00, -1.0673e-01, -3.9924e-01,
  31274. -6.8137e-02, 7.1257e-01, 1.2286e-01],
  31275. [ 7.6503e-01, -2.8282e-01, 1.5378e+00, 3.3768e-01, -5.7958e-01,
  31276. -9.7698e-02, 6.3861e-01, 9.1715e-04],
  31277. [ 5.7975e-01, -3.8051e-01, 1.5980e+00, 9.9984e-03, -2.3316e-01,
  31278. 1.7962e-01, 4.1097e-01, 9.1926e-02]], device='cuda:0',
  31279. grad_fn=<AddmmBackward>)
  31280. landmarks are: tensor([[[-2.2859, -2.2859, 1.8192, -0.8540, 0.1448, -0.9849, 1.0143,
  31281. 0.4867],
  31282. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  31283. 0.3084],
  31284. [ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  31285. 0.1236],
  31286. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  31287. 0.2776],
  31288. [ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  31289. 0.3692],
  31290. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  31291. 0.1627],
  31292. [ 0.6120, -0.4371, 1.7037, 0.4701, -0.5827, -0.0226, 0.5354,
  31293. -0.1331],
  31294. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  31295. 0.0764]]], device='cuda:0')
  31296. loss_train_step before backward: tensor(0.0266, device='cuda:0', grad_fn=<MseLossBackward>)
  31297. loss_train_step after backward: tensor(0.0266, device='cuda:0', grad_fn=<MseLossBackward>)
  31298. loss_train: 0.24258825462311506
  31299. step: 17
  31300. running loss: 0.014269897330771475
  31301. Train Steps: 17/90 Loss: 0.0143 torch.Size([8, 600, 800])
  31302. torch.Size([8, 8])
  31303. tensor([[0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  31304. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  31305. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  31306. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  31307. [0.6246, 0.4008, 0.8757, 0.5088, 0.4101, 0.5392, 0.6644, 0.5133],
  31308. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  31309. [0.6090, 0.4045, 0.7250, 0.2100, 0.4075, 0.2300, 0.5476, 0.5663],
  31310. [0.6236, 0.4081, 0.8575, 0.3000, 0.3713, 0.3033, 0.5550, 0.5633]],
  31311. device='cuda:0', dtype=torch.float64)
  31312. predictions are: tensor([[ 0.7508, -0.2604, 1.7657, -0.0488, -0.5387, -0.0755, 0.5828, 0.2377],
  31313. [-1.1455, -1.5244, 1.9091, -0.5219, -0.2446, -1.0815, 0.7982, 0.3013],
  31314. [ 0.7796, -0.2696, 1.9089, -0.1851, -0.3437, -0.8657, 1.0811, 0.2547],
  31315. [ 0.5238, -0.3978, 1.2088, -0.5805, -0.6452, -0.2787, 0.2464, 0.2178],
  31316. [ 0.7354, -0.3332, 1.7281, 0.0586, -0.3375, 0.3449, 0.9514, 0.0944],
  31317. [ 0.6988, -0.3625, 1.6217, 0.1694, -0.3268, 0.1545, 0.4640, 0.0219],
  31318. [ 0.4548, -0.4465, 0.9776, -1.3111, -0.4202, -1.1218, 0.3172, 0.2431],
  31319. [ 0.5979, -0.3529, 1.5608, -0.8263, -0.5420, -0.7747, 0.3924, 0.1048]],
  31320. device='cuda:0', grad_fn=<AddmmBackward>)
  31321. landmarks are: tensor([[[ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  31322. 0.3084],
  31323. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  31324. 0.2890],
  31325. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  31326. 0.3692],
  31327. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  31328. 0.2386],
  31329. [ 0.5993, -0.4345, 1.7587, 0.0641, -0.3917, 0.2048, 0.7827,
  31330. 0.0852],
  31331. [ 0.5767, -0.4396, 1.6782, 0.1905, -0.3844, 0.0308, 0.4588,
  31332. 0.0855],
  31333. [ 0.5269, -0.4176, 1.0628, -1.3159, -0.4037, -1.2236, 0.2432,
  31334. 0.3297],
  31335. [ 0.5944, -0.4008, 1.6748, -0.9002, -0.5711, -0.8848, 0.2776,
  31336. 0.3161]]], device='cuda:0')
  31337. loss_train_step before backward: tensor(0.0362, device='cuda:0', grad_fn=<MseLossBackward>)
  31338. loss_train_step after backward: tensor(0.0362, device='cuda:0', grad_fn=<MseLossBackward>)
  31339. loss_train: 0.2787413029000163
  31340. step: 18
  31341. running loss: 0.015485627938889794
  31342.  
  31343. Train Steps: 18/90 Loss: 0.0155 torch.Size([8, 600, 800])
  31344. torch.Size([8, 8])
  31345. tensor([[0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  31346. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  31347. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  31348. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  31349. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  31350. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  31351. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  31352. [0.6189, 0.4033, 0.8650, 0.5267, 0.4487, 0.5150, 0.5925, 0.5050]],
  31353. device='cuda:0', dtype=torch.float64)
  31354. predictions are: tensor([[ 0.5391, -0.4250, 1.5793, -0.5507, -0.5772, -0.7345, 0.5866, 0.2346],
  31355. [ 0.6453, -0.3269, 1.6569, -0.9600, -0.3731, -0.8979, 0.7733, 0.1688],
  31356. [ 0.6124, -0.4489, 1.7579, 0.1917, -0.4467, 0.1514, 0.9555, 0.0758],
  31357. [ 0.4832, -0.4268, 1.5981, -0.4180, -0.6525, -0.4576, 0.0383, 0.2399],
  31358. [ 0.6428, -0.4099, 1.9707, -0.5950, -0.3578, -0.4111, 1.2218, 0.2484],
  31359. [ 0.4976, -0.4160, 0.9908, -1.2584, -0.3256, -1.3835, 0.4925, 0.2604],
  31360. [ 0.6152, -0.4093, 1.6455, 0.1106, -0.3446, 0.0551, 0.3082, 0.1433],
  31361. [ 0.5605, -0.4519, 1.6999, 0.1790, -0.2418, 0.2339, 0.5199, 0.1525]],
  31362. device='cuda:0', grad_fn=<AddmmBackward>)
  31363. landmarks are: tensor([[[ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  31364. 0.1621],
  31365. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  31366. 0.1467],
  31367. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  31368. 0.0851],
  31369. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  31370. 0.2567],
  31371. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  31372. 0.2676],
  31373. [ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  31374. 0.3161],
  31375. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  31376. 0.1854],
  31377. [ 0.5726, -0.4230, 1.7095, 0.1467, -0.2132, 0.0928, 0.4508,
  31378. 0.0467]]], device='cuda:0')
  31379. loss_train_step before backward: tensor(0.0069, device='cuda:0', grad_fn=<MseLossBackward>)
  31380. loss_train_step after backward: tensor(0.0069, device='cuda:0', grad_fn=<MseLossBackward>)
  31381. loss_train: 0.2856500316411257
  31382. step: 19
  31383. running loss: 0.015034212191638193
  31384. Train Steps: 19/90 Loss: 0.0150 torch.Size([8, 600, 800])
  31385. torch.Size([8, 8])
  31386. tensor([[0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  31387. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  31388. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  31389. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  31390. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778],
  31391. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  31392. [0.6118, 0.4052, 0.8463, 0.3917, 0.3538, 0.3450, 0.5053, 0.5593],
  31393. [0.6215, 0.4119, 0.7688, 0.2300, 0.4200, 0.2283, 0.5925, 0.5317]],
  31394. device='cuda:0', dtype=torch.float64)
  31395. predictions are: tensor([[ 0.6642, -0.3373, 1.6242, -0.4397, -0.5543, -0.7999, 0.5567, 0.2802],
  31396. [ 0.3577, -0.5237, 1.7865, 0.0304, -0.3552, -0.8476, 0.5982, 0.5128],
  31397. [ 0.7060, -0.3369, 1.3578, -1.1410, -0.2806, -1.2913, 0.6984, 0.0911],
  31398. [ 0.4874, -0.5204, 1.7267, 0.1068, -0.1824, 0.2917, 0.4077, 0.1674],
  31399. [ 0.6098, -0.4015, 1.1021, -1.3660, -0.4870, -1.1326, 0.5583, -0.0315],
  31400. [ 0.5276, -0.4831, 1.8539, -0.0930, -0.3060, 0.1485, 0.5581, 0.2284],
  31401. [ 0.2133, -0.6280, 1.6494, -0.4383, -0.6503, -0.4903, 0.2719, 0.2101],
  31402. [ 0.6117, -0.4047, 1.2955, -1.1935, -0.3856, -0.9915, 0.8060, 0.1934]],
  31403. device='cuda:0', grad_fn=<AddmmBackward>)
  31404. landmarks are: tensor([[[ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  31405. 0.3928],
  31406. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  31407. 0.5762],
  31408. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  31409. 0.1855],
  31410. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  31411. 0.2634],
  31412. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  31413. -0.0791],
  31414. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  31415. 0.3057],
  31416. [ 0.5399, -0.4142, 1.6229, -0.4768, -0.6520, -0.6924, 0.0481,
  31417. 0.2972],
  31418. [ 0.5849, -0.3836, 1.2649, -1.2236, -0.3460, -1.2313, 0.4508,
  31419. 0.1698]]], device='cuda:0')
  31420. loss_train_step before backward: tensor(0.0265, device='cuda:0', grad_fn=<MseLossBackward>)
  31421. loss_train_step after backward: tensor(0.0265, device='cuda:0', grad_fn=<MseLossBackward>)
  31422. loss_train: 0.31217335909605026
  31423. step: 20
  31424. running loss: 0.015608667954802513
  31425. Train Steps: 20/90 Loss: 0.0156 torch.Size([8, 600, 800])
  31426. torch.Size([8, 8])
  31427. tensor([[0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  31428. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  31429. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  31430. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  31431. [0.6227, 0.4083, 0.8938, 0.4800, 0.3800, 0.2950, 0.5737, 0.5350],
  31432. [ nan, nan, 0.7240, 0.2722, 0.3900, 0.2567, 0.5168, 0.5933],
  31433. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667],
  31434. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933]],
  31435. device='cuda:0', dtype=torch.float64)
  31436. predictions are: tensor([[ 0.8436, -0.2661, 1.7293, 0.3506, -0.4195, -0.0204, 0.8849, -0.0659],
  31437. [ 0.7133, -0.2538, 1.7154, -0.3090, -0.4786, -0.2038, 0.2791, 0.3428],
  31438. [ 0.8705, -0.2223, 1.6207, -0.7515, -0.6418, -0.4919, 0.7847, 0.1622],
  31439. [ 0.7293, -0.2986, 1.6384, -0.3508, -0.5085, -0.0364, 0.4600, 0.0077],
  31440. [ 0.8734, -0.1393, 1.8251, -0.0868, -0.4825, -0.8209, 0.6283, 0.1497],
  31441. [-2.1821, -2.1859, 1.0531, -1.0705, -0.4182, -1.0759, 0.1864, 0.3801],
  31442. [-1.7686, -1.9233, 1.2301, -1.1572, -0.3819, -0.9255, 0.5486, 0.3583],
  31443. [ 0.7109, -0.2645, 1.6211, 0.3448, -0.0315, -0.1749, 0.4552, 0.3760]],
  31444. device='cuda:0', grad_fn=<AddmmBackward>)
  31445. landmarks are: tensor([[[ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  31446. -0.0049],
  31447. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  31448. 0.4145],
  31449. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  31450. 0.1753],
  31451. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  31452. 0.0502],
  31453. [ 0.5901, -0.4000, 1.8423, -0.0688, -0.5307, -0.9233, 0.3642,
  31454. 0.1852],
  31455. [-2.2859, -2.2859, 1.0580, -1.0288, -0.4845, -1.1004, 0.1011,
  31456. 0.4543],
  31457. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  31458. 0.3315],
  31459. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  31460. 0.4547]]], device='cuda:0')
  31461. loss_train_step before backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  31462. loss_train_step after backward: tensor(0.0208, device='cuda:0', grad_fn=<MseLossBackward>)
  31463. loss_train: 0.33298695273697376
  31464. step: 21
  31465. running loss: 0.015856521558903512
  31466. Train Steps: 21/90 Loss: 0.0159 torch.Size([8, 600, 800])
  31467. torch.Size([8, 8])
  31468. tensor([[0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  31469. [0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  31470. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  31471. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  31472. [0.6165, 0.4106, 0.7575, 0.1733, 0.3838, 0.2650, 0.5680, 0.5116],
  31473. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  31474. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  31475. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433]],
  31476. device='cuda:0', dtype=torch.float64)
  31477. predictions are: tensor([[ 0.5701, -0.3610, 1.1925, -0.5998, -0.3476, -1.1460, 0.3494, 0.4502],
  31478. [ 0.5325, -0.4449, 1.5287, -0.8693, -0.5007, -0.7125, 0.5934, 0.2793],
  31479. [ 0.4868, -0.4511, 1.6993, 0.1740, -0.1953, 0.0165, 0.2025, 0.3025],
  31480. [ 0.3532, -0.5528, 1.6190, -0.0188, -0.5111, 0.0868, 0.3957, 0.1781],
  31481. [ 0.5768, -0.4132, 1.2803, -1.2153, -0.5702, -1.0083, 0.5767, -0.0181],
  31482. [-2.8392, -2.6520, 0.9217, -1.1096, -0.4011, -1.2152, 0.2435, 0.3523],
  31483. [ 0.8260, -0.2496, 1.7667, -1.0595, 0.0952, -1.3712, 1.0684, 0.1354],
  31484. [ 0.4822, -0.4867, 1.8582, 0.0209, -0.5483, 0.1714, 0.6321, 0.0669]],
  31485. device='cuda:0', grad_fn=<AddmmBackward>)
  31486. landmarks are: tensor([[[ 0.6077, -0.3226, 0.9993, -0.6462, -0.2651, -1.3082, 0.2946,
  31487. 0.5401],
  31488. [ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  31489. 0.3392],
  31490. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  31491. 0.4239],
  31492. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  31493. 0.2386],
  31494. [ 0.5618, -0.3895, 1.2129, -1.4853, -0.5134, -1.0619, 0.3378,
  31495. 0.0772],
  31496. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  31497. 0.4543],
  31498. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  31499. 0.2142],
  31500. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  31501. 0.2237]]], device='cuda:0')
  31502. loss_train_step before backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  31503. loss_train_step after backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  31504. loss_train: 0.3522569965571165
  31505. step: 22
  31506. running loss: 0.016011681661687115
  31507.  
  31508. Train Steps: 22/90 Loss: 0.0160 torch.Size([8, 600, 800])
  31509. torch.Size([8, 8])
  31510. tensor([[0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  31511. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  31512. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  31513. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517],
  31514. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  31515. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  31516. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  31517. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207]],
  31518. device='cuda:0', dtype=torch.float64)
  31519. predictions are: tensor([[ 0.4190, -0.5163, 1.2306, -1.3445, -0.2406, -1.4644, 0.4430, 0.0780],
  31520. [-2.6366, -2.5332, 1.1538, -1.0783, -0.4702, -1.0118, 0.2247, 0.2517],
  31521. [ 0.5058, -0.4009, 1.6188, 0.4193, -0.4515, -0.2694, 0.3354, 0.4193],
  31522. [ 0.4812, -0.4535, 1.7116, -0.0511, -0.2676, 0.2715, 0.4280, 0.3389],
  31523. [ 0.3823, -0.4933, 1.4640, -1.0505, -0.2502, -1.2271, 0.5584, 0.2454],
  31524. [ 0.5660, -0.4228, 1.7460, -0.1628, -0.4159, 0.1009, 0.4308, 0.1760],
  31525. [ 0.6304, -0.3654, 1.6921, 0.3137, -0.4992, 0.1335, 0.4860, 0.2379],
  31526. [ 0.4978, -0.4602, 1.4664, -1.0301, -0.3268, -1.2302, 0.7269, 0.1300]],
  31527. device='cuda:0', grad_fn=<AddmmBackward>)
  31528. landmarks are: tensor([[[ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  31529. -0.0248],
  31530. [-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  31531. 0.1253],
  31532. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  31533. 0.4470],
  31534. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  31535. 0.2622],
  31536. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  31537. 0.2083],
  31538. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  31539. 0.2545],
  31540. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  31541. 0.3007],
  31542. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  31543. 0.1193]]], device='cuda:0')
  31544. loss_train_step before backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  31545. loss_train_step after backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  31546. loss_train: 0.36108022555708885
  31547. step: 23
  31548. running loss: 0.01569914024161256
  31549. Train Steps: 23/90 Loss: 0.0157 torch.Size([8, 600, 800])
  31550. torch.Size([8, 8])
  31551. tensor([[0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  31552. [0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  31553. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  31554. [0.6176, 0.4017, 0.8788, 0.5100, 0.4075, 0.5250, 0.5913, 0.5033],
  31555. [0.6260, 0.4120, 0.8013, 0.2350, 0.4888, 0.1533, 0.6281, 0.4895],
  31556. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  31557. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478],
  31558. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208]],
  31559. device='cuda:0', dtype=torch.float64)
  31560. predictions are: tensor([[ 5.3397e-01, -4.4429e-01, 1.6449e+00, 3.7041e-01, -4.7376e-01,
  31561. -5.6033e-01, 1.8569e-01, 5.2465e-01],
  31562. [ 4.3509e-01, -5.2979e-01, 1.8832e+00, -7.4444e-01, -4.3511e-01,
  31563. -6.0733e-01, 6.5849e-01, 1.9896e-01],
  31564. [ 6.8811e-01, -3.3548e-01, 9.0652e-01, -1.1236e+00, -4.8432e-01,
  31565. -1.0859e+00, 2.8385e-01, 3.4144e-01],
  31566. [ 2.5779e-01, -7.2311e-01, 1.8132e+00, 1.1183e-01, -3.2180e-01,
  31567. 2.0947e-01, 4.4570e-01, 1.2317e-01],
  31568. [ 1.6847e-01, -7.1877e-01, 1.4626e+00, -1.2881e+00, 1.9532e-02,
  31569. -1.5018e+00, 6.9486e-01, 1.8900e-01],
  31570. [ 5.0582e-01, -4.5344e-01, 1.3273e+00, -6.3100e-01, -6.1505e-01,
  31571. -5.4265e-01, 1.8403e-01, 2.8166e-01],
  31572. [-1.5590e-03, -8.3832e-01, 1.8570e+00, -6.9928e-01, -4.9101e-01,
  31573. -7.3952e-01, 5.2433e-01, 3.0981e-01],
  31574. [ 6.4362e-01, -3.8651e-01, 1.5309e+00, -1.0483e+00, -3.1909e-01,
  31575. -1.2067e+00, 4.5029e-01, 1.2443e-01]], device='cuda:0',
  31576. grad_fn=<AddmmBackward>)
  31577. landmarks are: tensor([[[ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  31578. 0.4778],
  31579. [ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  31580. 0.1390],
  31581. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  31582. 0.3546],
  31583. [ 0.5668, -0.4306, 1.7730, 0.0697, -0.4037, 0.1390, 0.4450,
  31584. 0.0390],
  31585. [ 0.6053, -0.3830, 1.4150, -1.2005, -0.0284, -1.5777, 0.6154,
  31586. -0.0250],
  31587. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  31588. 0.3198],
  31589. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  31590. 0.2442],
  31591. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  31592. 0.1195]]], device='cuda:0')
  31593. loss_train_step before backward: tensor(0.0212, device='cuda:0', grad_fn=<MseLossBackward>)
  31594. loss_train_step after backward: tensor(0.0212, device='cuda:0', grad_fn=<MseLossBackward>)
  31595. loss_train: 0.38229384645819664
  31596. step: 24
  31597. running loss: 0.015928910269091528
  31598. Train Steps: 24/90 Loss: 0.0159 torch.Size([8, 600, 800])
  31599. torch.Size([8, 8])
  31600. tensor([[0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  31601. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  31602. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  31603. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  31604. [0.6175, 0.4013, 0.8900, 0.4500, 0.4375, 0.5850, 0.6175, 0.5383],
  31605. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  31606. [0.6336, 0.4086, 0.8900, 0.3950, 0.3900, 0.2950, 0.6504, 0.5066],
  31607. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717]],
  31608. device='cuda:0', dtype=torch.float64)
  31609. predictions are: tensor([[ 0.5587, -0.4226, 1.6160, -0.5043, -0.5054, -1.1615, 0.1804, 0.3907],
  31610. [ 0.5253, -0.4484, 1.8616, 0.1801, -0.5132, -0.3568, 0.1869, 0.3852],
  31611. [ 0.4857, -0.4937, 1.0900, -1.4514, -0.3567, -1.3147, 0.4973, 0.2626],
  31612. [ 0.3560, -0.5321, 1.2411, -0.6366, -0.6568, -0.6283, 0.1718, 0.4453],
  31613. [ 0.4202, -0.5697, 1.8400, -0.1959, -0.2509, 0.3437, 0.5042, 0.1765],
  31614. [ 0.6044, -0.4654, 1.8214, -0.0966, -0.1333, 0.1111, 0.4976, 0.2188],
  31615. [ 0.5153, -0.4811, 1.9231, -0.4981, -0.4574, -1.0707, 0.7030, 0.0785],
  31616. [ 0.4016, -0.6046, 1.7845, -0.0465, -0.3021, -0.1544, 0.2956, 0.2958]],
  31617. device='cuda:0', grad_fn=<AddmmBackward>)
  31618. landmarks are: tensor([[[ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  31619. 0.3928],
  31620. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  31621. 0.3161],
  31622. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  31623. 0.2468],
  31624. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  31625. 0.4036],
  31626. [ 0.5664, -0.4321, 1.8249, -0.2074, -0.2651, 0.4162, 0.5663,
  31627. 0.2006],
  31628. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  31629. 0.2237],
  31630. [ 0.6405, -0.3984, 1.8249, -0.4614, -0.4845, -0.9233, 0.7182,
  31631. 0.0539],
  31632. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  31633. 0.3546]]], device='cuda:0')
  31634. loss_train_step before backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  31635. loss_train_step after backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  31636. loss_train: 0.38968273205682635
  31637. step: 25
  31638. running loss: 0.015587309282273054
  31639. Train Steps: 25/90 Loss: 0.0156 torch.Size([8, 600, 800])
  31640. torch.Size([8, 8])
  31641. tensor([[0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  31642. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  31643. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  31644. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  31645. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  31646. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  31647. [0.6263, 0.4030, 0.9000, 0.4767, 0.3800, 0.5167, 0.6415, 0.4771],
  31648. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290]],
  31649. device='cuda:0', dtype=torch.float64)
  31650. predictions are: tensor([[ 0.1355, -0.7047, 1.0245, -1.2254, -0.2885, -1.5247, 0.0463, 0.1693],
  31651. [ 0.5920, -0.4166, 1.6155, -1.0675, 0.1942, -1.4872, 0.6072, 0.3212],
  31652. [ 0.5402, -0.4191, 1.1201, -1.1080, -0.5136, -0.9845, 0.2833, 0.4162],
  31653. [ 0.3849, -0.5270, 1.8260, -0.2820, -0.6391, -0.4763, 0.2228, 0.3612],
  31654. [ 0.4151, -0.5447, 1.8440, 0.0276, -0.4044, 0.1932, 0.3751, 0.2620],
  31655. [ 0.3779, -0.5567, 1.8440, 0.0828, -0.5188, -0.7754, 0.3708, 0.2907],
  31656. [ 0.4404, -0.5536, 1.8745, -0.0533, -0.5073, 0.0109, 0.4361, 0.1189],
  31657. [ 0.6545, -0.3770, 1.2548, -1.1872, -0.2788, -1.2400, 0.5030, 0.2161]],
  31658. device='cuda:0', grad_fn=<AddmmBackward>)
  31659. landmarks are: tensor([[[ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  31660. 0.0261],
  31661. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  31662. 0.2944],
  31663. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  31664. 0.3546],
  31665. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  31666. 0.1544],
  31667. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  31668. 0.1390],
  31669. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  31670. 0.0081],
  31671. [ 0.6072, -0.4247, 1.8711, -0.0842, -0.5307, 0.1005, 0.6771,
  31672. -0.0821],
  31673. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  31674. 0.1575]]], device='cuda:0')
  31675. loss_train_step before backward: tensor(0.0168, device='cuda:0', grad_fn=<MseLossBackward>)
  31676. loss_train_step after backward: tensor(0.0168, device='cuda:0', grad_fn=<MseLossBackward>)
  31677. loss_train: 0.4064830797724426
  31678. step: 26
  31679. running loss: 0.015633964606632408
  31680.  
  31681. Train Steps: 26/90 Loss: 0.0156 torch.Size([8, 600, 800])
  31682. torch.Size([8, 8])
  31683. tensor([[0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  31684. [0.6069, 0.3975, 0.8625, 0.5083, 0.4388, 0.5483, 0.5650, 0.4967],
  31685. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  31686. [0.6265, 0.4091, 0.8950, 0.3533, 0.3600, 0.3967, 0.6295, 0.4901],
  31687. [0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  31688. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  31689. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  31690. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617]],
  31691. device='cuda:0', dtype=torch.float64)
  31692. predictions are: tensor([[ 4.7468e-01, -4.2405e-01, 1.7528e+00, -2.6740e-01, -3.7613e-01,
  31693. -1.1936e+00, 2.4123e-01, 2.4698e-01],
  31694. [ 7.2586e-01, -3.2563e-01, 1.5593e+00, 8.7796e-02, -1.8891e-01,
  31695. 8.3703e-02, 2.8491e-02, 2.2675e-01],
  31696. [ 5.2334e-01, -4.4256e-01, 1.7059e+00, -2.4735e-01, -4.9585e-01,
  31697. -5.1626e-01, 2.3367e-01, 1.9561e-01],
  31698. [ 6.6523e-01, -3.2866e-01, 1.7513e+00, -6.5725e-01, -5.1157e-01,
  31699. -6.0597e-01, 5.1856e-01, 2.0810e-01],
  31700. [ 7.9341e-01, -2.9291e-01, 1.7165e+00, -1.9395e-01, -4.3940e-01,
  31701. -2.4226e-03, 4.1576e-01, 2.1084e-01],
  31702. [ 4.6099e-01, -4.5544e-01, 1.2891e+00, -1.0755e+00, -5.3392e-01,
  31703. -7.8686e-01, 2.7304e-01, 1.8630e-01],
  31704. [ 3.8093e-01, -5.4834e-01, 1.8468e+00, -3.5344e-01, -2.1268e-01,
  31705. -1.0234e+00, 6.6850e-01, 4.1560e-01],
  31706. [-2.5304e+00, -2.3983e+00, 9.7836e-01, -1.2369e+00, -2.7478e-01,
  31707. -1.2620e+00, 2.4886e-01, 3.5089e-01]], device='cuda:0',
  31708. grad_fn=<AddmmBackward>)
  31709. landmarks are: tensor([[[ 0.6116, -0.3898, 1.8654, -0.1997, -0.4788, -1.1081, 0.4367,
  31710. -0.0637],
  31711. [ 0.5174, -0.4497, 1.6979, 0.0620, -0.2594, 0.2468, 0.3238,
  31712. 0.0082],
  31713. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  31714. 0.0467],
  31715. [ 0.6077, -0.3965, 1.8480, -0.6539, -0.6231, -0.4537, 0.6216,
  31716. -0.0220],
  31717. [ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  31718. 0.1449],
  31719. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  31720. 0.0412],
  31721. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  31722. 0.2142],
  31723. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  31724. 0.3084]]], device='cuda:0')
  31725. loss_train_step before backward: tensor(0.0215, device='cuda:0', grad_fn=<MseLossBackward>)
  31726. loss_train_step after backward: tensor(0.0215, device='cuda:0', grad_fn=<MseLossBackward>)
  31727. loss_train: 0.427944693248719
  31728. step: 27
  31729. running loss: 0.015849803453656258
  31730. Train Steps: 27/90 Loss: 0.0158 torch.Size([8, 600, 800])
  31731. torch.Size([8, 8])
  31732. tensor([[0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  31733. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  31734. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  31735. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  31736. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  31737. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  31738. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  31739. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575]],
  31740. device='cuda:0', dtype=torch.float64)
  31741. predictions are: tensor([[ 0.4570, -0.5229, 1.7586, -0.0554, -0.5715, -0.5387, 0.2527, 0.4641],
  31742. [ 0.6345, -0.3882, 1.7560, 0.2261, -0.4069, -0.0963, 0.2293, 0.2826],
  31743. [ 0.6074, -0.4412, 1.6149, 0.2421, -0.3680, -0.4795, 0.1157, 0.2424],
  31744. [ 0.6530, -0.3447, 1.7055, 0.0860, -0.1344, -0.2192, -0.1011, 0.2670],
  31745. [ 0.4935, -0.5104, 1.8558, -0.0979, -0.4405, -0.0116, 0.3747, 0.1274],
  31746. [ 0.2789, -0.6232, 1.3619, -1.4057, -0.5798, -1.1723, 0.3074, 0.1082],
  31747. [ 0.5152, -0.4956, 1.8940, -0.1752, -0.4296, -0.0322, 0.8230, 0.2762],
  31748. [ 0.9435, -0.1969, 1.7871, -0.7499, -0.3294, -0.5972, 0.8296, 0.2128]],
  31749. device='cuda:0', grad_fn=<AddmmBackward>)
  31750. landmarks are: tensor([[[ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  31751. 0.5239],
  31752. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  31753. 0.3007],
  31754. [ 0.5891, -0.4550, 1.5132, 0.3546, -0.3691, -0.1535, 0.3815,
  31755. 0.1467],
  31756. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  31757. 0.2431],
  31758. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  31759. 0.1236],
  31760. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  31761. 0.0620],
  31762. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  31763. 0.2035],
  31764. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  31765. 0.2890]]], device='cuda:0')
  31766. loss_train_step before backward: tensor(0.0249, device='cuda:0', grad_fn=<MseLossBackward>)
  31767. loss_train_step after backward: tensor(0.0249, device='cuda:0', grad_fn=<MseLossBackward>)
  31768. loss_train: 0.4528018026612699
  31769. step: 28
  31770. running loss: 0.01617149295218821
  31771. Train Steps: 28/90 Loss: 0.0162 torch.Size([8, 600, 800])
  31772. torch.Size([8, 8])
  31773. tensor([[0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  31774. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  31775. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  31776. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  31777. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  31778. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  31779. [0.6100, 0.4016, 0.8600, 0.5067, 0.4612, 0.5233, 0.5086, 0.5519],
  31780. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300]],
  31781. device='cuda:0', dtype=torch.float64)
  31782. predictions are: tensor([[ 0.7551, -0.2866, 1.7308, -0.2989, -0.4932, 0.0477, 0.4730, 0.0802],
  31783. [-2.5839, -2.4586, 1.5701, -1.1338, 0.0178, -1.2622, 0.7895, 0.2292],
  31784. [ 0.4940, -0.4422, 1.4511, -1.0838, -0.1897, -1.4387, 0.3430, 0.1239],
  31785. [ 0.6857, -0.3570, 1.8496, -0.0496, -0.4596, 0.0302, 0.8218, 0.1607],
  31786. [ 0.3040, -0.5759, 1.3551, -0.7724, -0.6065, -0.6449, 0.2698, 0.4399],
  31787. [ 0.7371, -0.2424, 1.7519, 0.0958, -0.6039, -0.7225, 0.1211, 0.2988],
  31788. [ 0.6786, -0.3373, 1.6232, 0.1325, -0.1826, -0.1288, -0.1010, 0.1699],
  31789. [ 0.4422, -0.4763, 1.2160, -1.1084, -0.4471, -1.0021, 0.4260, 0.1637]],
  31790. device='cuda:0', grad_fn=<AddmmBackward>)
  31791. landmarks are: tensor([[[ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  31792. 0.1852],
  31793. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  31794. 0.2783],
  31795. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  31796. 0.2083],
  31797. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  31798. 0.2035],
  31799. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  31800. 0.5624],
  31801. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  31802. 0.3161],
  31803. [ 0.5318, -0.4310, 1.6864, 0.0543, -0.1554, 0.1313, 0.0635,
  31804. 0.2634],
  31805. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  31806. 0.1621]]], device='cuda:0')
  31807. loss_train_step before backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  31808. loss_train_step after backward: tensor(0.0203, device='cuda:0', grad_fn=<MseLossBackward>)
  31809. loss_train: 0.47314505791291595
  31810. step: 29
  31811. running loss: 0.01631534682458331
  31812. Train Steps: 29/90 Loss: 0.0163 torch.Size([8, 600, 800])
  31813. torch.Size([8, 8])
  31814. tensor([[0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  31815. [0.6280, 0.4055, 0.8600, 0.5317, 0.3800, 0.4700, 0.6275, 0.5133],
  31816. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  31817. [0.6179, 0.3961, 0.8347, 0.6020, 0.3887, 0.4624, 0.5714, 0.5373],
  31818. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  31819. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  31820. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  31821. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913]],
  31822. device='cuda:0', dtype=torch.float64)
  31823. predictions are: tensor([[ 0.6479, -0.3862, 1.7959, -0.6655, -0.4468, 0.0505, 0.8091, 0.0969],
  31824. [ 0.6897, -0.3558, 1.7876, 0.1890, -0.4869, -0.1190, 0.6193, 0.0967],
  31825. [ 0.6158, -0.3547, 1.7291, 0.0648, -0.5078, -0.6661, 0.3796, 0.2100],
  31826. [ 0.7697, -0.3150, 1.5880, 0.3262, -0.4156, -0.3101, 0.4204, 0.1966],
  31827. [-2.2058, -2.1965, 1.4134, -1.0115, -0.5480, -0.8214, 0.3142, 0.1668],
  31828. [ 0.5060, -0.3896, 1.7413, -0.3907, -0.4397, -0.3701, 0.1312, 0.3688],
  31829. [ 0.6487, -0.3205, 1.4211, -0.8362, -0.5193, -0.9339, 0.0720, 0.2005],
  31830. [ 0.5592, -0.4004, 1.3866, -1.2150, -0.0363, -1.5537, 0.4363, 0.0868]],
  31831. device='cuda:0', grad_fn=<AddmmBackward>)
  31832. landmarks are: tensor([[[ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  31833. 0.1159],
  31834. [ 0.6148, -0.4130, 1.6864, 0.1698, -0.5307, -0.1150, 0.6125,
  31835. 0.0851],
  31836. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  31837. 0.2058],
  31838. [ 0.5680, -0.4562, 1.5697, 0.4947, -0.4904, -0.1503, 0.3536,
  31839. 0.1956],
  31840. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  31841. 0.0893],
  31842. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  31843. 0.4145],
  31844. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  31845. 0.3220],
  31846. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  31847. -0.0168]]], device='cuda:0')
  31848. loss_train_step before backward: tensor(0.0082, device='cuda:0', grad_fn=<MseLossBackward>)
  31849. loss_train_step after backward: tensor(0.0082, device='cuda:0', grad_fn=<MseLossBackward>)
  31850. loss_train: 0.48136191023513675
  31851. step: 30
  31852. running loss: 0.016045397007837893
  31853.  
  31854. Train Steps: 30/90 Loss: 0.0160 torch.Size([8, 600, 800])
  31855. torch.Size([8, 8])
  31856. tensor([[0.6214, 0.4175, 0.7300, 0.2883, 0.4338, 0.2167, 0.5698, 0.5773],
  31857. [0.6200, 0.4049, 0.8638, 0.5617, 0.4125, 0.5100, 0.6013, 0.5317],
  31858. [0.6268, 0.4029, 0.8500, 0.2683, 0.3937, 0.3500, 0.6860, 0.5297],
  31859. [0.6136, 0.4060, 0.8025, 0.3217, 0.3650, 0.3000, 0.5060, 0.5646],
  31860. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495],
  31861. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  31862. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  31863. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459]],
  31864. device='cuda:0', dtype=torch.float64)
  31865. predictions are: tensor([[ 0.5437, -0.4190, 1.2397, -0.9936, -0.2858, -1.3147, 0.3011, 0.3873],
  31866. [ 0.4616, -0.5160, 1.8487, 0.2746, -0.3216, 0.0470, 0.4399, 0.0933],
  31867. [ 0.7601, -0.3446, 1.7578, -1.0177, -0.4505, -0.7159, 0.8616, 0.0667],
  31868. [ 0.6262, -0.3732, 1.5641, -0.8014, -0.5630, -0.9078, 0.0116, 0.1624],
  31869. [ 0.4152, -0.5154, 1.2256, -1.0323, -0.5391, -0.9245, 0.1490, 0.2274],
  31870. [ 0.7800, -0.3039, 1.8411, -0.6873, -0.4801, -0.6690, 0.4628, 0.2354],
  31871. [ 0.6368, -0.4049, 1.9289, 0.1807, -0.4706, -0.0622, 0.4105, 0.1088],
  31872. [ 0.6706, -0.3962, 1.6757, 0.2004, -0.4664, -0.1117, 0.8264, 0.1407]],
  31873. device='cuda:0', grad_fn=<AddmmBackward>)
  31874. landmarks are: tensor([[[ 0.5841, -0.3574, 1.0859, -0.9541, -0.2824, -1.2851, 0.3460,
  31875. 0.3808],
  31876. [ 0.5776, -0.4159, 1.7037, 0.3084, -0.3806, 0.0697, 0.4912,
  31877. 0.1698],
  31878. [ 0.6092, -0.4249, 1.6402, -1.0465, -0.4672, -0.6693, 0.8827,
  31879. 0.1608],
  31880. [ 0.5483, -0.4105, 1.4208, -0.8002, -0.6000, -0.9002, 0.0511,
  31881. 0.3220],
  31882. [ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  31883. 0.2522],
  31884. [ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  31885. 0.3315],
  31886. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  31887. 0.1544],
  31888. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  31889. 0.2356]]], device='cuda:0')
  31890. loss_train_step before backward: tensor(0.0089, device='cuda:0', grad_fn=<MseLossBackward>)
  31891. loss_train_step after backward: tensor(0.0089, device='cuda:0', grad_fn=<MseLossBackward>)
  31892. loss_train: 0.49028233671560884
  31893. step: 31
  31894. running loss: 0.015815559248890606
  31895. Train Steps: 31/90 Loss: 0.0158 torch.Size([8, 600, 800])
  31896. torch.Size([8, 8])
  31897. tensor([[0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200],
  31898. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  31899. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  31900. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  31901. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  31902. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  31903. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  31904. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767]],
  31905. device='cuda:0', dtype=torch.float64)
  31906. predictions are: tensor([[ 0.5666, -0.4195, 1.8396, -1.0422, -0.1928, -1.2118, 0.5643, 0.1019],
  31907. [ 0.6211, -0.3755, 1.3698, -0.6980, -0.6557, -0.4697, 0.1725, 0.2209],
  31908. [ 0.5803, -0.4509, 1.9152, -0.6383, -0.3041, -0.8855, 0.8861, 0.0336],
  31909. [ 0.7501, -0.3202, 1.8613, -0.1640, -0.4751, 0.0098, 0.5408, 0.0257],
  31910. [ 0.6964, -0.3375, 1.5899, 0.3226, -0.3722, -0.0324, 0.4169, 0.4082],
  31911. [ 0.4888, -0.4642, 1.5771, -0.5611, -0.5993, -0.5054, 0.4021, 0.4605],
  31912. [ 0.7757, -0.3521, 1.8301, 0.2087, -0.5843, -0.1622, 0.5861, 0.0187],
  31913. [ 0.6856, -0.3810, 1.8420, -0.0025, -0.4428, -0.0025, 0.2644, 0.1522]],
  31914. device='cuda:0', grad_fn=<AddmmBackward>)
  31915. landmarks are: tensor([[[ 0.6089, -0.3948, 1.7383, -0.8617, -0.2536, -1.2390, 0.6009,
  31916. 0.1159],
  31917. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  31918. 0.3417],
  31919. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  31920. 0.1821],
  31921. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  31922. 0.1525],
  31923. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  31924. 0.5239],
  31925. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  31926. 0.5491],
  31927. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  31928. 0.0291],
  31929. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  31930. 0.3777]]], device='cuda:0')
  31931. loss_train_step before backward: tensor(0.0072, device='cuda:0', grad_fn=<MseLossBackward>)
  31932. loss_train_step after backward: tensor(0.0072, device='cuda:0', grad_fn=<MseLossBackward>)
  31933. loss_train: 0.49751824559643865
  31934. step: 32
  31935. running loss: 0.015547445174888708
  31936. Train Steps: 32/90 Loss: 0.0155 torch.Size([8, 600, 800])
  31937. torch.Size([8, 8])
  31938. tensor([[0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  31939. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  31940. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  31941. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  31942. [0.6357, 0.4118, 0.8400, 0.2500, 0.5413, 0.1633, 0.6725, 0.5586],
  31943. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  31944. [0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  31945. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209]],
  31946. device='cuda:0', dtype=torch.float64)
  31947. predictions are: tensor([[ 0.7685, -0.2554, 1.8790, -0.0951, -0.5094, 0.1064, 0.3453, 0.0740],
  31948. [ 0.2122, -0.6466, 1.1111, -1.1771, -0.4408, -1.2101, 0.1642, 0.2664],
  31949. [ 0.5185, -0.4993, 1.5777, -1.2015, -0.3875, -1.1538, 0.6529, 0.0108],
  31950. [ 0.6000, -0.4405, 1.6702, 0.3551, -0.3816, 0.2087, 0.2137, -0.0261],
  31951. [ 0.5316, -0.4604, 1.7136, -1.2135, 0.0900, -1.4193, 0.7995, 0.1499],
  31952. [ 0.7085, -0.3692, 1.4491, 0.1493, -0.6077, 0.0302, 0.9614, 0.2498],
  31953. [ 0.6815, -0.3494, 1.7495, -0.4778, -0.7476, -0.3255, 0.4961, 0.2621],
  31954. [ 0.6221, -0.3105, 1.7768, -0.2247, -0.3396, -0.9656, 0.3741, 0.4538]],
  31955. device='cuda:0', grad_fn=<AddmmBackward>)
  31956. landmarks are: tensor([[[ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  31957. 0.1439],
  31958. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  31959. 0.3469],
  31960. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  31961. 0.1193],
  31962. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  31963. -0.0610],
  31964. [ 0.6504, -0.3840, 1.5940, -1.1312, 0.2141, -1.5315, 0.8205,
  31965. 0.2944],
  31966. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  31967. 0.3585],
  31968. [ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  31969. 0.2930],
  31970. [ 0.6174, -0.3118, 1.6402, -0.2074, -0.1958, -1.0927, 0.2267,
  31971. 0.5822]]], device='cuda:0')
  31972. loss_train_step before backward: tensor(0.0149, device='cuda:0', grad_fn=<MseLossBackward>)
  31973. loss_train_step after backward: tensor(0.0149, device='cuda:0', grad_fn=<MseLossBackward>)
  31974. loss_train: 0.5123806581832469
  31975. step: 33
  31976. running loss: 0.01552668661161354
  31977. Train Steps: 33/90 Loss: 0.0155 torch.Size([8, 600, 800])
  31978. torch.Size([8, 8])
  31979. tensor([[0.6042, 0.3990, 0.6831, 0.2875, 0.3500, 0.3133, 0.5143, 0.5510],
  31980. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  31981. [0.6236, 0.4081, 0.8575, 0.3000, 0.3713, 0.3033, 0.5550, 0.5633],
  31982. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  31983. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  31984. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  31985. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  31986. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350]],
  31987. device='cuda:0', dtype=torch.float64)
  31988. predictions are: tensor([[ 0.6101, -0.3861, 1.0465, -1.0171, -0.5287, -0.9288, 0.1636, 0.3035],
  31989. [ 0.7595, -0.3106, 1.5950, 0.3544, -0.4964, -0.0664, 0.8690, 0.1603],
  31990. [ 0.5309, -0.4411, 1.7549, -0.7236, -0.5169, -0.8883, 0.3679, 0.1458],
  31991. [ 0.7765, -0.3054, 1.7333, 0.3088, -0.3553, 0.1623, 0.7348, 0.0983],
  31992. [ 0.6907, -0.3104, 1.9679, -0.2774, -0.5666, -0.0387, 0.7282, 0.2893],
  31993. [ 0.5866, -0.3977, 1.7523, 0.0307, -0.5445, -0.1638, 0.2781, 0.1210],
  31994. [ 0.5182, -0.4533, 1.4693, -0.9037, -0.5433, -0.7623, 0.4990, 0.2418],
  31995. [ 0.3984, -0.5048, 1.4839, -1.1185, -0.1541, -1.3903, 0.4739, 0.2252]],
  31996. device='cuda:0', grad_fn=<AddmmBackward>)
  31997. landmarks are: tensor([[[ 0.5049, -0.4428, 0.8692, -0.9581, -0.6693, -0.8386, 0.0897,
  31998. 0.2589],
  31999. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  32000. 0.2356],
  32001. [ 0.5944, -0.4008, 1.6748, -0.9002, -0.5711, -0.8848, 0.2776,
  32002. 0.3161],
  32003. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  32004. 0.1176],
  32005. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  32006. 0.3161],
  32007. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  32008. -0.1181],
  32009. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  32010. 0.1931],
  32011. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  32012. 0.1850]]], device='cuda:0')
  32013. loss_train_step before backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  32014. loss_train_step after backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  32015. loss_train: 0.5212206044234335
  32016. step: 34
  32017. running loss: 0.01533001777715981
  32018.  
  32019. Train Steps: 34/90 Loss: 0.0153 torch.Size([8, 600, 800])
  32020. torch.Size([8, 8])
  32021. tensor([[0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  32022. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  32023. [0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  32024. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  32025. [0.6226, 0.4103, 0.8575, 0.3450, 0.4388, 0.2067, 0.5787, 0.5383],
  32026. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  32027. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  32028. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719]],
  32029. device='cuda:0', dtype=torch.float64)
  32030. predictions are: tensor([[ 0.7662, -0.2341, 1.5781, -0.2909, -0.6309, -0.7669, 0.4134, 0.3638],
  32031. [-1.5719, -1.7703, 1.2770, -0.8794, -0.4331, -1.0268, 0.3747, 0.3496],
  32032. [ 0.7161, -0.3501, 1.6823, 0.1277, -0.5211, -0.0683, 0.6721, 0.1472],
  32033. [ 0.6450, -0.3428, 1.7448, 0.0048, -0.3701, 0.0794, 0.4939, 0.2061],
  32034. [ 0.6709, -0.3055, 1.6780, -0.6860, -0.2785, -1.2521, 0.4511, 0.2015],
  32035. [ 0.6167, -0.3962, 1.6691, 0.1726, -0.2480, 0.1969, 0.6600, 0.0819],
  32036. [ 0.7405, -0.2789, 1.8078, 0.0298, -0.4354, 0.2576, 0.7490, 0.0836],
  32037. [ 0.5992, -0.3914, 1.5422, -0.4336, -0.6631, -0.2964, 0.3682, 0.2405]],
  32038. device='cuda:0', grad_fn=<AddmmBackward>)
  32039. landmarks are: tensor([[[ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  32040. 0.3238],
  32041. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  32042. 0.3777],
  32043. [ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  32044. 0.2237],
  32045. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  32046. 0.3084],
  32047. [ 0.5898, -0.3908, 1.6748, -0.6924, -0.2594, -1.3313, 0.3873,
  32048. 0.2006],
  32049. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  32050. 0.0942],
  32051. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  32052. 0.1390],
  32053. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  32054. 0.3559]]], device='cuda:0')
  32055. loss_train_step before backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  32056. loss_train_step after backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  32057. loss_train: 0.5407532160170376
  32058. step: 35
  32059. running loss: 0.015450091886201075
  32060. Train Steps: 35/90 Loss: 0.0155 torch.Size([8, 600, 800])
  32061. torch.Size([8, 8])
  32062. tensor([[0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  32063. [0.6034, 0.4011, 0.7350, 0.2533, 0.3438, 0.3367, 0.5516, 0.5084],
  32064. [0.6273, 0.4100, 0.7137, 0.2133, 0.4000, 0.2650, 0.6075, 0.5633],
  32065. [ nan, nan, 0.7192, 0.2346, 0.4037, 0.2050, 0.5138, 0.5650],
  32066. [0.6286, 0.4097, 0.8107, 0.2414, 0.4425, 0.2483, 0.6745, 0.5385],
  32067. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  32068. [0.6219, 0.3934, 0.8688, 0.5267, 0.4313, 0.4967, 0.5988, 0.4983],
  32069. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283]],
  32070. device='cuda:0', dtype=torch.float64)
  32071. predictions are: tensor([[ 0.5688, -0.4102, 1.3362, -1.0214, -0.2337, -1.2387, 0.5933, 0.2205],
  32072. [ 0.5588, -0.4107, 1.1360, -0.9133, -0.6114, -0.6363, 0.2814, 0.1120],
  32073. [ 0.4255, -0.4792, 1.0315, -1.0336, -0.4536, -1.0128, 0.4469, 0.3514],
  32074. [-2.0111, -2.0337, 1.0375, -1.0228, -0.4102, -1.0963, 0.2566, 0.2898],
  32075. [ 0.5824, -0.3836, 1.4738, -0.8859, -0.2546, -1.1444, 0.8461, 0.2488],
  32076. [ 0.6641, -0.3520, 1.6249, -0.4234, -0.6472, -0.4652, 0.5174, 0.2492],
  32077. [ 0.7156, -0.3546, 1.7393, 0.3704, -0.3914, 0.1171, 0.5668, -0.0235],
  32078. [ 0.6197, -0.3639, 1.9170, -0.2692, -0.5723, -0.3346, 0.6970, 0.2217]],
  32079. device='cuda:0', grad_fn=<AddmmBackward>)
  32080. landmarks are: tensor([[[ 0.6158, -0.4225, 1.3307, -1.3253, -0.1924, -1.3252, 0.6721,
  32081. 0.1727],
  32082. [ 0.5009, -0.4333, 1.1090, -1.1158, -0.6982, -0.7309, 0.2617,
  32083. 0.0622],
  32084. [ 0.6115, -0.3924, 1.0109, -1.3005, -0.4383, -1.0619, 0.5201,
  32085. 0.3161],
  32086. [-2.2859, -2.2859, 1.0361, -1.2021, -0.4210, -1.3390, 0.0871,
  32087. 0.3238],
  32088. [ 0.6174, -0.3936, 1.4586, -1.1709, -0.2420, -1.1389, 0.8296,
  32089. 0.2012],
  32090. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  32091. 0.1753],
  32092. [ 0.5864, -0.4690, 1.7268, 0.1467, -0.2940, 0.0082, 0.4797,
  32093. 0.0159],
  32094. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  32095. 0.1544]]], device='cuda:0')
  32096. loss_train_step before backward: tensor(0.0145, device='cuda:0', grad_fn=<MseLossBackward>)
  32097. loss_train_step after backward: tensor(0.0145, device='cuda:0', grad_fn=<MseLossBackward>)
  32098. loss_train: 0.5552862132899463
  32099. step: 36
  32100. running loss: 0.015424617035831843
  32101. Train Steps: 36/90 Loss: 0.0154 torch.Size([8, 600, 800])
  32102. torch.Size([8, 8])
  32103. tensor([[0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  32104. [0.6336, 0.4191, 0.8938, 0.5167, 0.3937, 0.3517, 0.7343, 0.5748],
  32105. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  32106. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  32107. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  32108. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  32109. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  32110. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183]],
  32111. device='cuda:0', dtype=torch.float64)
  32112. predictions are: tensor([[ 0.6712, -0.3344, 0.8852, -0.8259, -0.5781, -0.8849, 0.2836, 0.4461],
  32113. [ 0.6448, -0.3840, 1.7873, 0.1943, -0.3306, -0.5015, 0.9702, 0.3116],
  32114. [ 0.6883, -0.3586, 1.1804, -1.1055, -0.3317, -1.3468, 0.3378, 0.1692],
  32115. [ 0.6501, -0.3811, 1.7949, 0.0383, -0.4651, 0.4288, 0.6228, 0.0843],
  32116. [ 0.5457, -0.4620, 1.6727, -0.5455, -0.5818, -0.7265, 0.4503, 0.1704],
  32117. [ 0.5400, -0.4457, 1.6360, -0.1206, -0.5851, -0.3272, 0.2805, 0.3501],
  32118. [ 0.6369, -0.3821, 1.8384, -0.0908, -0.4472, 0.3384, 1.0631, 0.2493],
  32119. [ 0.4643, -0.4946, 1.4443, -0.9013, -0.4899, -0.8918, 0.3928, 0.1161]],
  32120. device='cuda:0', grad_fn=<AddmmBackward>)
  32121. landmarks are: tensor([[[ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  32122. 0.4085],
  32123. [ 0.6405, -0.3503, 1.8423, 0.1005, -0.4672, -0.6616, 1.1057,
  32124. 0.3692],
  32125. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  32126. 0.1449],
  32127. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  32128. 0.1236],
  32129. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  32130. 0.1963],
  32131. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  32132. 0.2853],
  32133. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  32134. 0.2035],
  32135. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  32136. 0.1080]]], device='cuda:0')
  32137. loss_train_step before backward: tensor(0.0055, device='cuda:0', grad_fn=<MseLossBackward>)
  32138. loss_train_step after backward: tensor(0.0055, device='cuda:0', grad_fn=<MseLossBackward>)
  32139. loss_train: 0.5607698620297015
  32140. step: 37
  32141. running loss: 0.015155942217018959
  32142. Train Steps: 37/90 Loss: 0.0152 torch.Size([8, 600, 800])
  32143. torch.Size([8, 8])
  32144. tensor([[0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  32145. [0.6256, 0.4199, 0.8638, 0.5800, 0.3987, 0.4383, 0.5600, 0.5950],
  32146. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  32147. [0.6275, 0.4081, 0.8063, 0.2017, 0.4825, 0.1583, 0.6156, 0.4869],
  32148. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  32149. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  32150. [0.6308, 0.3990, 0.8688, 0.5183, 0.3950, 0.4983, 0.6388, 0.5133],
  32151. [0.6127, 0.4115, 0.7163, 0.2883, 0.3625, 0.2950, 0.5327, 0.5495]],
  32152. device='cuda:0', dtype=torch.float64)
  32153. predictions are: tensor([[ 0.5668, -0.4175, 1.6320, 0.0660, -0.1801, -0.0683, 0.3313, 0.2419],
  32154. [ 0.5908, -0.3833, 1.6107, 0.3380, -0.5683, -0.2802, 0.4929, 0.5329],
  32155. [ 0.4183, -0.5385, 1.5019, 0.3227, -0.3926, 0.0037, 0.3500, 0.1237],
  32156. [ 0.6590, -0.4055, 1.4546, -1.4122, -0.1601, -1.6383, 0.7569, 0.0479],
  32157. [ 0.5319, -0.4480, 1.6853, -0.0332, -0.2487, -0.0303, 0.4169, 0.3119],
  32158. [ 0.5453, -0.4142, 1.7662, -0.3417, -0.5738, 0.2874, 0.7600, 0.2159],
  32159. [ 0.5614, -0.4496, 1.7109, 0.0886, -0.5932, -0.0110, 0.9051, 0.1374],
  32160. [ 0.5893, -0.4026, 1.0282, -1.0175, -0.7196, -0.9125, 0.2854, 0.3452]],
  32161. device='cuda:0', grad_fn=<AddmmBackward>)
  32162. landmarks are: tensor([[[ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  32163. 0.1544],
  32164. [ 0.6038, -0.3464, 1.7037, 0.3931, -0.4441, -0.2613, 0.3007,
  32165. 0.4624],
  32166. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  32167. -0.0610],
  32168. [ 0.6124, -0.4010, 1.4381, -1.3544, -0.0573, -1.5546, 0.5573,
  32169. -0.0369],
  32170. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  32171. 0.3392],
  32172. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  32173. 0.0851],
  32174. [ 0.6275, -0.4430, 1.7268, 0.1082, -0.4614, 0.0159, 0.6644,
  32175. 0.0851],
  32176. [ 0.5442, -0.3855, 1.0224, -0.9541, -0.6115, -0.9233, 0.1745,
  32177. 0.2522]]], device='cuda:0')
  32178. loss_train_step before backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  32179. loss_train_step after backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  32180. loss_train: 0.5724910940043628
  32181. step: 38
  32182. running loss: 0.01506555510537797
  32183.  
  32184. Train Steps: 38/90 Loss: 0.0151 torch.Size([8, 600, 800])
  32185. torch.Size([8, 8])
  32186. tensor([[0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  32187. [0.6274, 0.4117, 0.8100, 0.5801, 0.4000, 0.4583, 0.5582, 0.6118],
  32188. [0.6193, 0.4050, 0.7313, 0.2433, 0.4075, 0.2117, 0.5649, 0.5656],
  32189. [0.6226, 0.4125, 0.8800, 0.4900, 0.4512, 0.5600, 0.6275, 0.5517],
  32190. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  32191. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  32192. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  32193. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290]],
  32194. device='cuda:0', dtype=torch.float64)
  32195. predictions are: tensor([[ 0.5787, -0.4111, 1.6932, 0.0974, -0.2177, 0.0952, 0.3047, 0.1366],
  32196. [ 0.3868, -0.5064, 1.4697, 0.3451, -0.5825, -0.1846, 0.5391, 0.5011],
  32197. [ 0.5121, -0.4486, 1.0925, -1.1847, -0.4936, -1.2274, 0.4309, 0.2811],
  32198. [ 0.5534, -0.3974, 1.7306, -0.0548, -0.2913, 0.2534, 0.6129, 0.3512],
  32199. [ 0.6356, -0.4325, 1.4172, -1.2141, -0.2466, -1.5455, 0.7136, 0.1865],
  32200. [ 0.6097, -0.4405, 1.6402, 0.2651, -0.5443, -0.1034, 0.6511, 0.1993],
  32201. [ 0.5489, -0.4402, 1.6364, -0.2779, -0.5507, 0.0573, 0.3002, 0.0735],
  32202. [ 0.5650, -0.4668, 1.2234, -1.2461, -0.3808, -1.2864, 0.7092, 0.1740]],
  32203. device='cuda:0', grad_fn=<AddmmBackward>)
  32204. landmarks are: tensor([[[ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  32205. 0.0532],
  32206. [ 0.6121, -0.3844, 1.4556, 0.3936, -0.4383, -0.1689, 0.2925,
  32207. 0.5401],
  32208. [ 0.5746, -0.4153, 1.0917, -1.1620, -0.4037, -1.3082, 0.3234,
  32209. 0.3267],
  32210. [ 0.5897, -0.3804, 1.7788, -0.0226, -0.2016, 0.3007, 0.6125,
  32211. 0.2622],
  32212. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  32213. 0.1467],
  32214. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  32215. 0.1979],
  32216. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  32217. 0.0231],
  32218. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  32219. 0.1575]]], device='cuda:0')
  32220. loss_train_step before backward: tensor(0.0072, device='cuda:0', grad_fn=<MseLossBackward>)
  32221. loss_train_step after backward: tensor(0.0072, device='cuda:0', grad_fn=<MseLossBackward>)
  32222. loss_train: 0.5796950873918831
  32223. step: 39
  32224. running loss: 0.014863976599791875
  32225. Train Steps: 39/90 Loss: 0.0149 torch.Size([8, 600, 800])
  32226. torch.Size([8, 8])
  32227. tensor([[0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  32228. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  32229. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  32230. [0.6110, 0.3984, 0.8750, 0.4933, 0.4625, 0.4950, 0.5578, 0.5676],
  32231. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  32232. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  32233. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  32234. [0.6203, 0.4078, 0.8800, 0.5083, 0.3900, 0.5000, 0.6100, 0.5583]],
  32235. device='cuda:0', dtype=torch.float64)
  32236. predictions are: tensor([[ 0.4518, -0.5226, 1.5759, 0.0545, -0.5464, -0.0713, 0.5453, 0.1484],
  32237. [ 0.5803, -0.3962, 1.6064, -0.1914, -0.6144, -0.1679, 0.5165, 0.2878],
  32238. [ 0.5458, -0.4359, 1.6392, -0.9572, -0.1208, -1.4111, 0.6136, 0.1508],
  32239. [ 0.5890, -0.4114, 1.5700, -0.1026, -0.1931, 0.0397, 0.3496, 0.4049],
  32240. [ 0.5104, -0.4378, 1.5383, -0.0344, -0.4701, -0.0894, 0.2003, 0.3153],
  32241. [ 0.5813, -0.4163, 1.6899, -0.3295, -0.5267, -1.1116, 0.5762, 0.1261],
  32242. [ 0.4640, -0.5030, 1.4995, 0.0286, -0.2245, 0.1700, 0.5783, 0.2438],
  32243. [ 0.5282, -0.4285, 1.5917, -0.0356, -0.4829, 0.0265, 0.5645, 0.2748]],
  32244. device='cuda:0', grad_fn=<AddmmBackward>)
  32245. landmarks are: tensor([[[ 5.7725e-01, -4.3156e-01, 1.7399e+00, 1.2871e-01, -5.1531e-01,
  32246. -8.1749e-02, 4.3131e-01, 9.1941e-02],
  32247. [ 5.8655e-01, -3.9731e-01, 1.8423e+00, -6.8822e-02, -5.1917e-01,
  32248. -2.3048e-01, 4.1617e-01, 1.1594e-01],
  32249. [ 6.0520e-01, -3.6628e-01, 1.7845e+00, -8.1555e-01, -8.0370e-02,
  32250. -1.4237e+00, 5.8660e-01, 5.0889e-03],
  32251. [ 5.3637e-01, -4.4573e-01, 1.7557e+00, -7.2363e-03, -1.4965e-01,
  32252. 4.6189e-04, 2.9049e-01, 3.3573e-01],
  32253. [ 5.3343e-01, -4.2517e-01, 1.7499e+00, -2.2633e-02, -3.9792e-01,
  32254. -1.9199e-01, 5.5769e-02, 2.5891e-01],
  32255. [ 6.1161e-01, -3.8976e-01, 1.8654e+00, -1.9969e-01, -4.7875e-01,
  32256. -1.1081e+00, 4.3668e-01, -6.3661e-02],
  32257. [ 5.5484e-01, -4.6823e-01, 1.7309e+00, 9.6578e-02, -1.3942e-01,
  32258. 1.7573e-01, 5.0451e-01, 9.4188e-02],
  32259. [ 5.7939e-01, -4.0231e-01, 1.7788e+00, 6.2048e-02, -4.8453e-01,
  32260. 2.3557e-02, 5.3164e-01, 2.9299e-01]]], device='cuda:0')
  32261. loss_train_step before backward: tensor(0.0105, device='cuda:0', grad_fn=<MseLossBackward>)
  32262. loss_train_step after backward: tensor(0.0105, device='cuda:0', grad_fn=<MseLossBackward>)
  32263. loss_train: 0.5902246865443885
  32264. step: 40
  32265. running loss: 0.014755617163609713
  32266. Train Steps: 40/90 Loss: 0.0148 torch.Size([8, 600, 800])
  32267. torch.Size([8, 8])
  32268. tensor([[0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  32269. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778],
  32270. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456],
  32271. [ nan, nan, 0.6935, 0.1930, 0.4150, 0.2250, 0.5450, 0.5650],
  32272. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  32273. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  32274. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  32275. [0.6203, 0.4073, 0.8189, 0.2398, 0.4400, 0.2054, 0.5929, 0.5501]],
  32276. device='cuda:0', dtype=torch.float64)
  32277. predictions are: tensor([[ 0.6170, -0.4152, 1.4426, -0.9766, -0.4147, -0.9239, 0.6348, 0.1055],
  32278. [ 0.6492, -0.3891, 1.0826, -1.1782, -0.4910, -1.1525, 0.3329, -0.0206],
  32279. [ 0.5339, -0.4025, 1.6845, 0.1729, -0.3956, 0.3507, 0.3930, 0.1802],
  32280. [-1.7459, -1.8893, 1.0771, -1.0959, -0.2213, -1.1079, 0.4450, 0.2548],
  32281. [ 0.4224, -0.4749, 1.6062, -0.3164, -0.6632, -0.3488, 0.2345, 0.2554],
  32282. [ 0.5959, -0.3686, 1.0819, -0.8909, -0.2060, -1.2524, 0.4956, 0.3669],
  32283. [ 0.4865, -0.4776, 1.0770, -1.1057, -0.3190, -1.2749, 0.5400, 0.2507],
  32284. [ 0.5668, -0.4227, 1.4136, -0.9592, -0.2372, -1.2127, 0.6334, 0.2023]],
  32285. device='cuda:0', grad_fn=<AddmmBackward>)
  32286. landmarks are: tensor([[[ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  32287. 0.1929],
  32288. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  32289. -0.0791],
  32290. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  32291. 0.2341],
  32292. [-2.2859, -2.2859, 0.9175, -1.3947, -0.3691, -1.2467, 0.2314,
  32293. 0.3238],
  32294. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  32295. 0.4348],
  32296. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  32297. 0.3931],
  32298. [ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  32299. 0.3161],
  32300. [ 0.5792, -0.4048, 1.4965, -1.1781, -0.2534, -1.3371, 0.4528,
  32301. 0.2549]]], device='cuda:0')
  32302. loss_train_step before backward: tensor(0.0225, device='cuda:0', grad_fn=<MseLossBackward>)
  32303. loss_train_step after backward: tensor(0.0225, device='cuda:0', grad_fn=<MseLossBackward>)
  32304. loss_train: 0.6126899658702314
  32305. step: 41
  32306. running loss: 0.014943657704151986
  32307. Train Steps: 41/90 Loss: 0.0149 torch.Size([8, 600, 800])
  32308. torch.Size([8, 8])
  32309. tensor([[0.6200, 0.4098, 0.8237, 0.2917, 0.4012, 0.2967, 0.6000, 0.5683],
  32310. [0.6125, 0.4010, 0.8650, 0.4567, 0.3663, 0.3900, 0.5600, 0.5567],
  32311. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  32312. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  32313. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208],
  32314. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  32315. [0.6204, 0.4110, 0.7913, 0.2667, 0.4062, 0.2500, 0.6225, 0.5367],
  32316. [0.6197, 0.3930, 0.8793, 0.4736, 0.4152, 0.5464, 0.6308, 0.5235]],
  32317. device='cuda:0', dtype=torch.float64)
  32318. predictions are: tensor([[ 0.7854, -0.2991, 1.3389, -0.9233, -0.3140, -0.9295, 0.4933, 0.3211],
  32319. [ 0.4851, -0.4815, 1.5754, -0.1447, -0.5025, -0.4698, 0.2705, 0.3721],
  32320. [ 0.4202, -0.5532, 1.6440, -0.7332, -0.4721, -0.9302, 0.4453, 0.0863],
  32321. [ 0.5706, -0.4244, 1.7125, -0.0341, -0.3242, 0.3171, 0.8492, 0.1820],
  32322. [ 0.4740, -0.5121, 1.3715, -1.0159, -0.2918, -1.2467, 0.4170, 0.1064],
  32323. [ 0.6055, -0.4053, 1.6585, 0.0100, -0.4876, -0.3127, 0.2278, 0.2346],
  32324. [ 0.6458, -0.3923, 1.3370, -1.0757, -0.2966, -1.1584, 0.5205, 0.1678],
  32325. [ 0.4434, -0.5174, 1.6545, -0.0345, -0.2625, 0.2169, 0.5201, 0.1693]],
  32326. device='cuda:0', grad_fn=<AddmmBackward>)
  32327. landmarks are: tensor([[[ 0.5778, -0.3930, 1.5189, -0.9387, -0.4326, -0.9156, 0.4855,
  32328. 0.3392],
  32329. [ 0.5432, -0.4336, 1.7095, -0.1766, -0.5942, -0.4845, 0.3007,
  32330. 0.2853],
  32331. [ 0.5799, -0.4329, 1.7210, -0.7694, -0.5711, -0.8771, 0.3988,
  32332. 0.0774],
  32333. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  32334. 0.1554],
  32335. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  32336. 0.1195],
  32337. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  32338. 0.3854],
  32339. [ 0.5796, -0.3878, 1.3688, -1.0542, -0.4095, -1.1312, 0.5894,
  32340. 0.1929],
  32341. [ 0.5762, -0.4706, 1.7754, -0.0984, -0.3680, 0.2380, 0.6277,
  32342. 0.1322]]], device='cuda:0')
  32343. loss_train_step before backward: tensor(0.0071, device='cuda:0', grad_fn=<MseLossBackward>)
  32344. loss_train_step after backward: tensor(0.0071, device='cuda:0', grad_fn=<MseLossBackward>)
  32345. loss_train: 0.6198296854272485
  32346. step: 42
  32347. running loss: 0.014757849653029726
  32348.  
  32349. Train Steps: 42/90 Loss: 0.0148 torch.Size([8, 600, 800])
  32350. torch.Size([8, 8])
  32351. tensor([[0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  32352. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  32353. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  32354. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  32355. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  32356. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  32357. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  32358. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700]],
  32359. device='cuda:0', dtype=torch.float64)
  32360. predictions are: tensor([[ 0.6620, -0.3627, 0.8645, -0.8953, -0.4624, -1.0615, 0.2567, 0.4448],
  32361. [ 0.5483, -0.4709, 1.3646, -0.9783, -0.4312, -0.9092, 0.4041, 0.2567],
  32362. [ 0.4148, -0.5180, 1.6699, -0.6309, -0.4510, -0.0706, 0.5017, 0.2699],
  32363. [ 0.6890, -0.3866, 1.6303, 0.5067, -0.3901, -0.0298, 0.3656, -0.0725],
  32364. [ 0.2361, -0.6919, 2.0030, -0.9078, 0.1716, -1.4575, 1.0266, 0.2301],
  32365. [ 0.6916, -0.4029, 1.8254, 0.1274, -0.4539, -0.1698, 0.5178, -0.0051],
  32366. [ 0.3982, -0.5432, 1.5778, -0.5003, -0.5175, -0.3889, 0.1091, 0.2928],
  32367. [ 0.6824, -0.3615, 1.3945, -0.8919, -0.4078, -0.7204, 0.3479, 0.2505]],
  32368. device='cuda:0', grad_fn=<AddmmBackward>)
  32369. landmarks are: tensor([[[ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  32370. 0.4085],
  32371. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  32372. 0.1931],
  32373. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  32374. 0.2545],
  32375. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  32376. -0.1385],
  32377. [ 0.6108, -0.4201, 1.8711, -0.7848, -0.0053, -1.2236, 1.0362,
  32378. 0.2142],
  32379. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  32380. 0.0111],
  32381. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  32382. 0.3559],
  32383. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  32384. 0.3469]]], device='cuda:0')
  32385. loss_train_step before backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  32386. loss_train_step after backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  32387. loss_train: 0.632617355324328
  32388. step: 43
  32389. running loss: 0.014712031519170417
  32390. Train Steps: 43/90 Loss: 0.0147 torch.Size([8, 600, 800])
  32391. torch.Size([8, 8])
  32392. tensor([[0.6357, 0.4139, 0.8450, 0.5883, 0.3775, 0.4950, 0.6488, 0.5297],
  32393. [0.6211, 0.4069, 0.8750, 0.5117, 0.4150, 0.4900, 0.5875, 0.5167],
  32394. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  32395. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  32396. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  32397. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  32398. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833],
  32399. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393]],
  32400. device='cuda:0', dtype=torch.float64)
  32401. predictions are: tensor([[ 0.3379, -0.5900, 1.6437, 0.3095, -0.4413, -0.1503, 0.5774, 0.1200],
  32402. [ 0.3663, -0.5576, 1.8159, -0.0059, -0.3329, -0.1042, 0.3667, 0.1079],
  32403. [ 0.6056, -0.3637, 1.8744, -0.2903, -0.3508, 0.0614, 0.2247, 0.1056],
  32404. [ 0.6311, -0.4130, 1.2440, -1.1452, -0.4054, -1.1107, 0.4740, 0.3398],
  32405. [ 0.5598, -0.4292, 1.7782, -0.1508, -0.1658, -0.0379, 0.0746, -0.0257],
  32406. [ 0.6271, -0.3747, 1.7128, -0.3489, -0.4974, -0.8574, 0.3628, 0.2517],
  32407. [ 0.6131, -0.4009, 0.8760, -0.9219, -0.4928, -1.0583, 0.2549, 0.4428],
  32408. [ 0.4163, -0.5562, 1.5630, -0.9899, -0.1836, -1.1978, 0.7956, 0.2543]],
  32409. device='cuda:0', grad_fn=<AddmmBackward>)
  32410. landmarks are: tensor([[[ 6.5036e-01, -3.7434e-01, 1.6171e+00, 4.3156e-01, -5.4226e-01,
  32411. 4.6189e-04, 7.1085e-01, 1.6077e-01],
  32412. [ 5.8279e-01, -4.0662e-01, 1.7557e+00, 7.7444e-02, -3.6905e-01,
  32413. -2.2633e-02, 4.2771e-01, 1.0054e-01],
  32414. [ 5.7113e-01, -3.7875e-01, 1.8249e+00, -1.7660e-01, -4.6721e-01,
  32415. 2.1601e-01, 3.6246e-01, 7.4222e-02],
  32416. [ 5.9151e-01, -3.6821e-01, 1.2187e+00, -1.2313e+00, -4.3256e-01,
  32417. -9.5412e-01, 5.7783e-01, 3.7768e-01],
  32418. [ 5.2494e-01, -4.4734e-01, 1.7326e+00, -9.1917e-02, -2.0162e-01,
  32419. 1.5443e-01, 1.7328e-01, 4.1158e-02],
  32420. [ 6.0162e-01, -3.6328e-01, 1.7152e+00, -2.2279e-01, -6.1155e-01,
  32421. -6.3849e-01, 5.0277e-01, 2.6990e-01],
  32422. [ 5.6143e-01, -4.0805e-01, 7.7413e-01, -8.8483e-01, -5.4226e-01,
  32423. -9.1563e-01, 3.5843e-01, 4.0847e-01],
  32424. [ 6.1742e-01, -3.9842e-01, 1.5975e+00, -9.9214e-01, -3.6328e-01,
  32425. -9.9261e-01, 8.2047e-01, 2.0505e-01]]], device='cuda:0')
  32426. loss_train_step before backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  32427. loss_train_step after backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  32428. loss_train: 0.6447693314403296
  32429. step: 44
  32430. running loss: 0.014653848441825672
  32431. Train Steps: 44/90 Loss: 0.0147 torch.Size([8, 600, 800])
  32432. torch.Size([8, 8])
  32433. tensor([[0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  32434. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  32435. [0.6186, 0.4154, 0.6825, 0.2633, 0.4150, 0.2300, 0.5713, 0.5517],
  32436. [0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  32437. [0.6257, 0.4024, 0.8612, 0.5352, 0.4361, 0.5253, 0.6680, 0.5166],
  32438. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  32439. [0.6268, 0.4061, 0.8350, 0.2433, 0.4575, 0.2283, 0.6350, 0.5300],
  32440. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550]],
  32441. device='cuda:0', dtype=torch.float64)
  32442. predictions are: tensor([[ 0.6149, -0.3487, 1.7814, -0.2349, -0.4272, 0.1006, 0.3636, 0.1894],
  32443. [-2.3590, -2.3096, 1.0946, -1.1491, -0.4777, -1.3035, 0.0823, 0.1859],
  32444. [ 0.5637, -0.4276, 0.9312, -1.0148, -0.4159, -1.2547, 0.2622, 0.2948],
  32445. [ 0.5444, -0.4137, 1.1649, -0.9891, -0.6327, -0.5801, 0.3558, 0.2762],
  32446. [ 0.5295, -0.4331, 1.6803, 0.1782, -0.3518, 0.1204, 0.6046, 0.0747],
  32447. [ 0.5971, -0.4446, 1.7483, -0.9914, -0.0197, -1.3498, 0.8464, 0.0536],
  32448. [ 0.6495, -0.3742, 1.5860, -1.0997, -0.2983, -1.3387, 0.5325, 0.0691],
  32449. [ 0.3837, -0.5090, 1.7551, -0.1794, -0.0704, -0.0786, 0.2862, 0.2237]],
  32450. device='cuda:0', grad_fn=<AddmmBackward>)
  32451. landmarks are: tensor([[[ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  32452. 0.3161],
  32453. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  32454. 0.1373],
  32455. [ 0.5713, -0.3671, 0.8665, -1.0696, -0.3691, -1.2236, 0.3527,
  32456. 0.2622],
  32457. [ 0.5747, -0.3886, 1.1494, -1.0388, -0.6000, -0.5846, 0.5952,
  32458. 0.3546],
  32459. [ 0.6042, -0.4273, 1.6920, 0.1860, -0.2717, 0.1406, 0.7997,
  32460. 0.1004],
  32461. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  32462. 0.1821],
  32463. [ 0.6093, -0.4104, 1.5709, -1.1620, -0.1727, -1.2313, 0.6471,
  32464. 0.1621],
  32465. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  32466. 0.2776]]], device='cuda:0')
  32467. loss_train_step before backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  32468. loss_train_step after backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  32469. loss_train: 0.652790330350399
  32470. step: 45
  32471. running loss: 0.014506451785564423
  32472. Train Steps: 45/90 Loss: 0.0145 torch.Size([8, 600, 800])
  32473. torch.Size([8, 8])
  32474. tensor([[0.6201, 0.4055, 0.7717, 0.1919, 0.4250, 0.2079, 0.5871, 0.5044],
  32475. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  32476. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  32477. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  32478. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  32479. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  32480. [0.6284, 0.4093, 0.8900, 0.4700, 0.3650, 0.3850, 0.6212, 0.5167],
  32481. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500]],
  32482. device='cuda:0', dtype=torch.float64)
  32483. predictions are: tensor([[ 0.4966, -0.4927, 1.2699, -1.3492, -0.2894, -1.4053, 0.3474, 0.0317],
  32484. [ 0.7391, -0.3165, 1.2395, -1.1042, -0.4034, -1.0465, 0.4538, 0.3428],
  32485. [ 0.3934, -0.5337, 1.5320, -1.0319, -0.4831, -0.3558, 0.4587, 0.2339],
  32486. [ 0.6288, -0.3821, 1.3381, -1.0664, -0.5571, -0.4490, 0.3945, 0.2473],
  32487. [ 0.5720, -0.4417, 1.6718, 0.1874, -0.2753, -0.1033, 0.4886, 0.1259],
  32488. [ 0.5163, -0.4307, 1.8413, 0.3058, -0.3082, -0.0951, 0.2531, 0.2563],
  32489. [ 0.4386, -0.5311, 1.9441, -0.1007, -0.5351, -0.5640, 0.4021, 0.0828],
  32490. [ 0.6740, -0.3230, 1.7757, 0.1000, -0.4700, -0.4806, 0.4102, 0.2311]],
  32491. device='cuda:0', grad_fn=<AddmmBackward>)
  32492. landmarks are: tensor([[[ 0.5785, -0.4129, 1.2785, -1.3996, -0.3227, -1.3259, 0.4258,
  32493. 0.0438],
  32494. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  32495. 0.3777],
  32496. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  32497. 0.1390],
  32498. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  32499. 0.2545],
  32500. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  32501. 0.0697],
  32502. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  32503. 0.3007],
  32504. [ 0.6164, -0.3956, 1.8249, -0.1150, -0.6000, -0.5076, 0.5836,
  32505. 0.1005],
  32506. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  32507. 0.2545]]], device='cuda:0')
  32508. loss_train_step before backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  32509. loss_train_step after backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  32510. loss_train: 0.6602126411162317
  32511. step: 46
  32512. running loss: 0.01435244871991808
  32513.  
  32514. Train Steps: 46/90 Loss: 0.0144 torch.Size([8, 600, 800])
  32515. torch.Size([8, 8])
  32516. tensor([[0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  32517. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  32518. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  32519. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  32520. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  32521. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  32522. [0.6260, 0.4106, 0.8025, 0.2583, 0.4550, 0.1867, 0.6281, 0.4869],
  32523. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550]],
  32524. device='cuda:0', dtype=torch.float64)
  32525. predictions are: tensor([[ 0.3742, -0.5066, 1.7244, 0.3687, -0.0828, -0.2045, 0.3595, 0.3976],
  32526. [ 0.5415, -0.4194, 1.6979, -0.4614, -0.7064, -0.5221, -0.0144, 0.2012],
  32527. [ 0.8284, -0.2728, 0.9806, -1.3618, -0.4925, -1.1502, 0.3888, 0.2431],
  32528. [ 0.6283, -0.4036, 2.0047, -0.3204, -0.6244, -0.0814, 0.6591, -0.0324],
  32529. [ 0.4902, -0.4794, 0.9705, -1.2138, -0.4393, -1.3999, 0.1626, 0.1567],
  32530. [ 0.3520, -0.5710, 1.1238, -1.1896, -0.5240, -0.9904, 0.5083, 0.3460],
  32531. [ 0.6551, -0.3947, 1.5409, -1.1691, -0.2441, -1.3841, 0.6094, -0.0491],
  32532. [ 0.4091, -0.5144, 1.8871, -0.2143, -0.0562, -0.0024, 0.4478, 0.2442]],
  32533. device='cuda:0', grad_fn=<AddmmBackward>)
  32534. landmarks are: tensor([[[ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  32535. 0.4547],
  32536. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  32537. 0.2567],
  32538. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  32539. 0.2576],
  32540. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  32541. -0.0670],
  32542. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  32543. 0.2071],
  32544. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  32545. 0.3854],
  32546. [ 0.6058, -0.3892, 1.4208, -1.0927, -0.1843, -1.4237, 0.6154,
  32547. -0.0370],
  32548. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  32549. 0.2776]]], device='cuda:0')
  32550. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  32551. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  32552. loss_train: 0.66893858788535
  32553. step: 47
  32554. running loss: 0.014232735912454254
  32555. Train Steps: 47/90 Loss: 0.0142 torch.Size([8, 600, 800])
  32556. torch.Size([8, 8])
  32557. tensor([[0.6346, 0.4165, 0.9138, 0.3983, 0.3875, 0.4317, 0.7469, 0.5471],
  32558. [0.6226, 0.4098, 0.8912, 0.4100, 0.4025, 0.2383, 0.5763, 0.5367],
  32559. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290],
  32560. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  32561. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  32562. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617],
  32563. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  32564. [0.6188, 0.4099, 0.7400, 0.2433, 0.3962, 0.2750, 0.6162, 0.5467]],
  32565. device='cuda:0', dtype=torch.float64)
  32566. predictions are: tensor([[ 0.4051, -0.5136, 1.8833, -0.4045, -0.3325, -0.2155, 0.8739, 0.2710],
  32567. [ 0.6273, -0.3338, 1.7346, -0.3649, -0.3575, -1.0852, 0.2452, 0.2073],
  32568. [ 0.7074, -0.3350, 1.1613, -1.3132, -0.2587, -1.1944, 0.5886, 0.1082],
  32569. [ 0.5802, -0.3619, 1.6835, -0.1829, -0.4105, -0.0615, -0.0204, 0.1170],
  32570. [ 0.7498, -0.3204, 1.7780, 0.1821, -0.5136, -0.1024, 0.6707, 0.1807],
  32571. [-2.0482, -2.0954, 1.0732, -1.2049, -0.3920, -1.2881, 0.1151, 0.2374],
  32572. [ 0.6764, -0.3235, 1.8600, -0.5183, -0.5283, -0.4335, 0.4900, 0.1452],
  32573. [ 0.7032, -0.3257, 1.0644, -1.2792, -0.4724, -0.9075, 0.4405, 0.1871]],
  32574. device='cuda:0', grad_fn=<AddmmBackward>)
  32575. landmarks are: tensor([[[ 0.6454, -0.3623, 1.9346, -0.4460, -0.4961, -0.2921, 1.1642,
  32576. 0.2409],
  32577. [ 0.5900, -0.3932, 1.8307, -0.3921, -0.4268, -1.1851, 0.3758,
  32578. 0.1929],
  32579. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  32580. 0.1575],
  32581. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  32582. 0.0893],
  32583. [ 0.6520, -0.4032, 1.8076, 0.1852, -0.5711, -0.1381, 0.7876,
  32584. 0.1608],
  32585. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  32586. 0.3084],
  32587. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  32588. 0.1544],
  32589. [ 0.5725, -0.3926, 1.1321, -1.1620, -0.4557, -1.0157, 0.5605,
  32590. 0.2391]]], device='cuda:0')
  32591. loss_train_step before backward: tensor(0.0102, device='cuda:0', grad_fn=<MseLossBackward>)
  32592. loss_train_step after backward: tensor(0.0102, device='cuda:0', grad_fn=<MseLossBackward>)
  32593. loss_train: 0.6791246416978538
  32594. step: 48
  32595. running loss: 0.014148430035371954
  32596. Train Steps: 48/90 Loss: 0.0141 torch.Size([8, 600, 800])
  32597. torch.Size([8, 8])
  32598. tensor([[0.6296, 0.4076, 0.8400, 0.5583, 0.3700, 0.4367, 0.6876, 0.5494],
  32599. [0.6200, 0.3978, 0.8900, 0.4550, 0.3775, 0.5200, 0.6150, 0.5367],
  32600. [0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874],
  32601. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  32602. [0.6120, 0.4014, 0.6863, 0.2817, 0.3700, 0.2783, 0.5513, 0.5667],
  32603. [0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  32604. [0.6302, 0.4007, 0.8850, 0.5500, 0.3613, 0.4517, 0.6335, 0.5012],
  32605. [0.6124, 0.4069, 0.8314, 0.5001, 0.3738, 0.4650, 0.5167, 0.5402]],
  32606. device='cuda:0', dtype=torch.float64)
  32607. predictions are: tensor([[ 0.6016, -0.4220, 1.7538, 0.1703, -0.5186, -0.2837, 0.8657, 0.1236],
  32608. [ 0.4566, -0.5206, 1.9691, -0.3438, -0.5333, 0.1213, 0.4083, 0.1729],
  32609. [ 0.6168, -0.3684, 1.7965, 0.0535, -0.2900, -0.0179, 0.1753, 0.3332],
  32610. [ 0.4819, -0.4374, 1.2815, -1.2242, -0.1292, -1.3188, 0.3799, 0.3378],
  32611. [ 0.5563, -0.3974, 1.0200, -1.2427, -0.5874, -0.9715, 0.2051, 0.2670],
  32612. [ 0.6416, -0.3941, 1.8055, -0.1221, -0.4340, -0.1021, 0.5248, 0.1909],
  32613. [ 0.6706, -0.4074, 1.8877, 0.1244, -0.5731, -0.2325, 0.6664, 0.0643],
  32614. [ 0.6742, -0.3256, 1.6654, -0.1106, -0.4677, -0.1163, 0.1835, 0.2330]],
  32615. device='cuda:0', grad_fn=<AddmmBackward>)
  32616. landmarks are: tensor([[[ 0.6224, -0.4032, 1.5940, 0.2930, -0.5769, -0.2690, 0.8900,
  32617. 0.2516],
  32618. [ 0.5776, -0.4484, 1.8249, -0.1843, -0.5423, 0.1159, 0.5547,
  32619. 0.1929],
  32620. [ 0.5453, -0.4091, 1.7499, 0.1390, -0.2940, -0.0996, 0.1300,
  32621. 0.4272],
  32622. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  32623. 0.3854],
  32624. [ 0.5410, -0.4321, 0.8838, -0.9849, -0.5769, -1.0003, 0.2603,
  32625. 0.3315],
  32626. [ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  32627. 0.2237],
  32628. [ 0.6249, -0.4352, 1.8018, 0.2545, -0.6173, -0.1997, 0.6401,
  32629. 0.0291],
  32630. [ 0.5425, -0.4067, 1.5543, 0.0241, -0.5596, -0.1381, 0.1005,
  32631. 0.2093]]], device='cuda:0')
  32632. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  32633. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  32634. loss_train: 0.6867347755469382
  32635. step: 49
  32636. running loss: 0.01401499541932527
  32637. Train Steps: 49/90 Loss: 0.0140 torch.Size([8, 600, 800])
  32638. torch.Size([8, 8])
  32639. tensor([[0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  32640. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  32641. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  32642. [0.6333, 0.4037, 0.8638, 0.5733, 0.4012, 0.4717, 0.6369, 0.4938],
  32643. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  32644. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283],
  32645. [0.6190, 0.4135, 0.8000, 0.4883, 0.3566, 0.3647, 0.5613, 0.5900],
  32646. [ nan, nan, 0.7512, 0.2117, 0.4288, 0.2000, 0.5600, 0.5617]],
  32647. device='cuda:0', dtype=torch.float64)
  32648. predictions are: tensor([[ 0.5894, -0.3801, 1.6447, 0.1531, -0.4084, 0.0639, 0.3153, 0.1972],
  32649. [ 0.6713, -0.3791, 1.7616, 0.0157, -0.3227, 0.1243, 0.4278, 0.0049],
  32650. [ 0.6451, -0.3785, 1.8642, -0.5306, -0.5431, -0.1355, 0.8136, 0.2384],
  32651. [ 0.7246, -0.3287, 1.7098, 0.2364, -0.4094, -0.0973, 0.7035, 0.0385],
  32652. [ 0.7551, -0.2297, 1.7543, -0.4982, -0.5698, -0.4273, 0.2666, 0.2370],
  32653. [ 0.6142, -0.3619, 1.7747, 0.0742, -0.4392, -0.0329, 0.5170, 0.2477],
  32654. [ 0.6024, -0.3271, 1.5167, -0.2986, -0.5872, -0.5988, 0.2826, 0.4324],
  32655. [-2.1414, -2.1944, 1.1244, -1.3578, -0.3550, -1.3435, 0.2133, 0.2454]],
  32656. device='cuda:0', grad_fn=<AddmmBackward>)
  32657. landmarks are: tensor([[[ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  32658. -0.1061],
  32659. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  32660. -0.0168],
  32661. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  32662. 0.0985],
  32663. [ 0.6395, -0.4213, 1.7037, 0.3623, -0.4326, -0.1073, 0.6560,
  32664. -0.0049],
  32665. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  32666. 0.1852],
  32667. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  32668. 0.1544],
  32669. [ 0.5732, -0.3761, 1.4092, -0.0303, -0.6388, -0.6012, 0.3065,
  32670. 0.4393],
  32671. [-2.2859, -2.2859, 1.1841, -1.3082, -0.3055, -1.3621, 0.3007,
  32672. 0.3084]]], device='cuda:0')
  32673. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  32674. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  32675. loss_train: 0.6954759764485061
  32676. step: 50
  32677. running loss: 0.013909519528970122
  32678.  
  32679. Train Steps: 50/90 Loss: 0.0139 torch.Size([8, 600, 800])
  32680. torch.Size([8, 8])
  32681. tensor([[ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  32682. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  32683. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  32684. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  32685. [0.6208, 0.4082, 0.8538, 0.3067, 0.3588, 0.3717, 0.6112, 0.5517],
  32686. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  32687. [0.6259, 0.4133, 0.8200, 0.2317, 0.5025, 0.1533, 0.6250, 0.4947],
  32688. [0.6128, 0.4115, 0.7934, 0.3778, 0.3450, 0.4033, 0.5337, 0.5456]],
  32689. device='cuda:0', dtype=torch.float64)
  32690. predictions are: tensor([[-2.0417, -2.1145, 0.9707, -1.2916, -0.5134, -1.1903, 0.1369, 0.1892],
  32691. [ 0.6440, -0.3374, 1.2099, -1.0695, -0.4862, -0.8650, 0.6079, 0.3799],
  32692. [ 0.6411, -0.3589, 1.8196, -0.0150, -0.5245, 0.0290, 0.5910, 0.1434],
  32693. [ 0.5620, -0.3825, 1.6482, -0.7810, -0.0810, -1.1873, 0.6928, 0.2009],
  32694. [ 0.5983, -0.3833, 1.6245, -0.7267, -0.6526, -0.4460, 0.5589, 0.2570],
  32695. [ 0.3943, -0.4981, 1.0297, -1.1695, -0.4064, -1.2838, 0.2265, 0.0506],
  32696. [ 0.5851, -0.3882, 1.4568, -1.1265, -0.0250, -1.3781, 0.6049, 0.1001],
  32697. [ 0.5941, -0.3497, 1.4244, -0.4968, -0.6755, -0.3567, 0.3419, 0.2971]],
  32698. device='cuda:0', grad_fn=<AddmmBackward>)
  32699. landmarks are: tensor([[[-2.2859e+00, -2.2859e+00, 1.0513e+00, -1.2851e+00, -4.4411e-01,
  32700. -1.2313e+00, 2.2057e-01, 1.0729e-01],
  32701. [ 5.9151e-01, -3.6821e-01, 1.2187e+00, -1.2313e+00, -4.3256e-01,
  32702. -9.5412e-01, 5.7783e-01, 3.7768e-01],
  32703. [ 5.6801e-01, -4.4175e-01, 1.8365e+00, -7.4042e-02, -4.9414e-01,
  32704. -2.2653e-02, 5.0451e-01, 1.5252e-01],
  32705. [ 6.5365e-01, -3.7194e-01, 1.6979e+00, -8.6174e-01, -1.6859e-02,
  32706. -1.3621e+00, 6.9257e-01, 1.5008e-01],
  32707. [ 5.8135e-01, -4.0031e-01, 1.6575e+00, -8.6944e-01, -6.2887e-01,
  32708. -5.6921e-01, 5.3741e-01, 2.6220e-01],
  32709. [ 5.1085e-01, -4.3164e-01, 1.1436e+00, -1.3467e+00, -3.8637e-01,
  32710. -1.4160e+00, 1.2393e-01, -5.8033e-02],
  32711. [ 6.0514e-01, -3.7714e-01, 1.5016e+00, -1.2159e+00, 3.5104e-02,
  32712. -1.5777e+00, 6.0099e-01, -9.2270e-04],
  32713. [ 5.4440e-01, -3.8522e-01, 1.3786e+00, -5.4087e-01, -6.9238e-01,
  32714. -4.2294e-01, 1.7915e-01, 2.3412e-01]]], device='cuda:0')
  32715. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  32716. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  32717. loss_train: 0.7030893294140697
  32718. step: 51
  32719. running loss: 0.013786065282628816
  32720. Train Steps: 51/90 Loss: 0.0138 torch.Size([8, 600, 800])
  32721. torch.Size([8, 8])
  32722. tensor([[0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  32723. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  32724. [0.6159, 0.4085, 0.6900, 0.2283, 0.4088, 0.1950, 0.5123, 0.5397],
  32725. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  32726. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  32727. [0.6364, 0.4144, 0.8625, 0.3083, 0.4913, 0.2000, 0.6448, 0.5274],
  32728. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  32729. [0.6275, 0.4024, 0.7722, 0.2080, 0.4392, 0.2234, 0.6435, 0.5290]],
  32730. device='cuda:0', dtype=torch.float64)
  32731. predictions are: tensor([[ 0.6494, -0.3643, 1.7888, -0.1043, -0.6878, -0.2725, 0.3839, 0.0475],
  32732. [ 0.5098, -0.4389, 1.2404, -1.0108, -0.3349, -1.3609, 0.3059, 0.1627],
  32733. [ 0.3660, -0.5140, 0.8387, -1.1964, -0.4575, -1.3360, 0.0789, 0.2320],
  32734. [ 0.6436, -0.3578, 1.8885, -0.4588, -0.6509, -0.4069, 0.5721, 0.1984],
  32735. [ 0.5306, -0.4581, 1.7036, 0.0555, -0.3979, 0.1843, 0.7566, 0.2434],
  32736. [ 0.4884, -0.4214, 1.6386, -0.8014, -0.1471, -1.2295, 0.6100, 0.2176],
  32737. [ 0.5705, -0.3704, 1.7832, -0.1546, -0.3066, 0.3843, 0.5200, 0.3995],
  32738. [ 0.5586, -0.4240, 1.1823, -1.2662, -0.3523, -1.1681, 0.6554, 0.1749]],
  32739. device='cuda:0', grad_fn=<AddmmBackward>)
  32740. landmarks are: tensor([[[ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  32741. 0.0467],
  32742. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  32743. 0.1855],
  32744. [ 0.5591, -0.3990, 0.9012, -1.2313, -0.3979, -1.3852, 0.0804,
  32745. 0.2071],
  32746. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  32747. 0.1544],
  32748. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  32749. 0.1982],
  32750. [ 0.6537, -0.3719, 1.6979, -0.8617, -0.0169, -1.3621, 0.6926,
  32751. 0.1501],
  32752. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  32753. 0.4316],
  32754. [ 0.6125, -0.4273, 1.2807, -1.3253, -0.2574, -1.2542, 0.6864,
  32755. 0.1575]]], device='cuda:0')
  32756. loss_train_step before backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  32757. loss_train_step after backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  32758. loss_train: 0.7088540904223919
  32759. step: 52
  32760. running loss: 0.013631809431199845
  32761. Train Steps: 52/90 Loss: 0.0136 torch.Size([8, 600, 800])
  32762. torch.Size([8, 8])
  32763. tensor([[0.6197, 0.4091, 0.8800, 0.4783, 0.3538, 0.4767, 0.5950, 0.5550],
  32764. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  32765. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  32766. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  32767. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  32768. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  32769. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  32770. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750]],
  32771. device='cuda:0', dtype=torch.float64)
  32772. predictions are: tensor([[ 0.6867, -0.3530, 1.8893, -0.0427, -0.6081, -0.0703, 0.5564, 0.2224],
  32773. [ 0.6031, -0.4232, 1.8380, -0.0181, -0.3122, 0.0297, 0.3452, 0.1512],
  32774. [ 0.5968, -0.4435, 1.6900, 0.2695, -0.5246, -0.3441, 1.0880, 0.1359],
  32775. [ 0.5225, -0.4026, 1.1519, -1.2220, -0.3218, -1.0692, 0.5546, 0.5218],
  32776. [ 0.4358, -0.4869, 1.6258, -1.2949, -0.0756, -1.2650, 0.5801, -0.0843],
  32777. [ 0.5571, -0.4031, 1.5258, -0.5435, -0.6655, -0.8282, 0.1144, 0.2918],
  32778. [ 0.5077, -0.4292, 1.0523, -0.9469, -0.5805, -0.9220, 0.1200, 0.1878],
  32779. [ 0.4917, -0.4569, 1.0927, -1.1920, -0.5139, -0.9124, 0.5999, 0.2974]],
  32780. device='cuda:0', grad_fn=<AddmmBackward>)
  32781. landmarks are: tensor([[[ 0.5763, -0.3963, 1.7788, -0.0765, -0.6520, -0.0842, 0.4624,
  32782. 0.2776],
  32783. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  32784. 0.3546],
  32785. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  32786. 0.3692],
  32787. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  32788. 0.6084],
  32789. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  32790. -0.0369],
  32791. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  32792. 0.4374],
  32793. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  32794. 0.2476],
  32795. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  32796. 0.3700]]], device='cuda:0')
  32797. loss_train_step before backward: tensor(0.0067, device='cuda:0', grad_fn=<MseLossBackward>)
  32798. loss_train_step after backward: tensor(0.0067, device='cuda:0', grad_fn=<MseLossBackward>)
  32799. loss_train: 0.7155375052243471
  32800. step: 53
  32801. running loss: 0.013500707645742398
  32802. Train Steps: 53/90 Loss: 0.0135 torch.Size([8, 600, 800])
  32803. torch.Size([8, 8])
  32804. tensor([[0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  32805. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  32806. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  32807. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  32808. [0.6236, 0.4081, 0.8575, 0.3000, 0.3713, 0.3033, 0.5550, 0.5633],
  32809. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695],
  32810. [0.6163, 0.4114, 0.7650, 0.2017, 0.3763, 0.2867, 0.5631, 0.5071],
  32811. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567]],
  32812. device='cuda:0', dtype=torch.float64)
  32813. predictions are: tensor([[ 0.6952, -0.2909, 1.5572, -0.7564, -0.6099, -0.5721, 0.5670, 0.2324],
  32814. [ 1.0167, -0.1225, 1.6744, 0.3887, -0.4468, 0.1252, 0.6714, 0.2086],
  32815. [-1.5770, -1.8032, 1.3967, -0.9103, -0.6525, -0.7907, 0.2326, 0.1734],
  32816. [ 0.7683, -0.2966, 1.9082, -0.1257, -0.2844, -0.8902, 1.1414, 0.2348],
  32817. [ 0.6591, -0.3276, 1.5648, -0.8208, -0.4872, -0.8877, 0.3777, 0.1544],
  32818. [ 0.7440, -0.2497, 0.8397, -1.2438, -0.3175, -1.3303, 0.1661, 0.2908],
  32819. [ 0.8056, -0.2475, 1.1913, -1.2971, -0.4608, -0.9584, 0.5213, 0.0536],
  32820. [-1.8084, -1.9542, 1.1200, -1.2545, -0.4184, -1.0982, 0.2681, 0.2478]],
  32821. device='cuda:0', grad_fn=<AddmmBackward>)
  32822. landmarks are: tensor([[[ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  32823. 0.2083],
  32824. [ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  32825. 0.3315],
  32826. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  32827. 0.0893],
  32828. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  32829. 0.3692],
  32830. [ 0.5944, -0.4008, 1.6748, -0.9002, -0.5711, -0.8848, 0.2776,
  32831. 0.3161],
  32832. [ 0.5544, -0.4133, 0.8145, -1.2082, -0.4268, -1.3544, 0.1221,
  32833. 0.3446],
  32834. [ 0.5606, -0.3856, 1.2476, -1.3544, -0.5480, -0.9618, 0.3152,
  32835. 0.0562],
  32836. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  32837. 0.2853]]], device='cuda:0')
  32838. loss_train_step before backward: tensor(0.0291, device='cuda:0', grad_fn=<MseLossBackward>)
  32839. loss_train_step after backward: tensor(0.0291, device='cuda:0', grad_fn=<MseLossBackward>)
  32840. loss_train: 0.7446684222668409
  32841. step: 54
  32842. running loss: 0.013790155967904462
  32843.  
  32844. Train Steps: 54/90 Loss: 0.0138 torch.Size([8, 600, 800])
  32845. torch.Size([8, 8])
  32846. tensor([[0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  32847. [0.6176, 0.4030, 0.8850, 0.4850, 0.3688, 0.4050, 0.5312, 0.5783],
  32848. [0.6192, 0.3980, 0.7078, 0.2750, 0.4250, 0.2100, 0.5450, 0.5783],
  32849. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  32850. [0.6137, 0.4035, 0.8850, 0.4417, 0.3900, 0.4283, 0.5449, 0.5617],
  32851. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  32852. [0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954],
  32853. [0.6162, 0.4014, 0.8800, 0.5333, 0.3750, 0.4817, 0.5988, 0.5283]],
  32854. device='cuda:0', dtype=torch.float64)
  32855. predictions are: tensor([[ 7.3151e-01, -3.2304e-01, 1.8139e+00, -4.3675e-01, -6.3154e-01,
  32856. -1.5793e-01, 7.0981e-01, 2.7233e-01],
  32857. [ 7.2082e-01, -3.2855e-01, 1.7849e+00, 1.5959e-03, -5.5553e-01,
  32858. -3.2249e-01, 3.4367e-01, 2.8201e-01],
  32859. [-1.0985e+00, -1.4875e+00, 1.0323e+00, -1.1355e+00, -2.6686e-01,
  32860. -1.3477e+00, 3.6026e-01, 3.8651e-01],
  32861. [ 7.9492e-01, -3.2222e-01, 1.8341e+00, 2.6112e-01, -5.6936e-01,
  32862. -1.4523e-01, 8.4170e-01, 6.2565e-02],
  32863. [ 7.0293e-01, -3.1763e-01, 1.8348e+00, -1.5597e-01, -4.7494e-01,
  32864. -2.8655e-01, 4.0996e-01, 2.7960e-01],
  32865. [ 5.9462e-01, -3.7201e-01, 8.9894e-01, -1.3596e+00, -4.7997e-01,
  32866. -1.1826e+00, 4.1370e-01, 1.1764e-01],
  32867. [ 5.3425e-01, -4.5420e-01, 1.7221e+00, -1.7401e-01, -5.0341e-01,
  32868. -2.0689e-02, 3.2310e-01, 3.1694e-02],
  32869. [ 5.7662e-01, -4.1861e-01, 1.7637e+00, 2.6550e-01, -4.6343e-01,
  32870. -2.3559e-02, 5.5708e-01, 2.2800e-01]], device='cuda:0',
  32871. grad_fn=<AddmmBackward>)
  32872. landmarks are: tensor([[[ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  32873. 0.2083],
  32874. [ 0.5667, -0.4246, 1.8018, -0.0457, -0.5827, -0.4152, 0.1679,
  32875. 0.3854],
  32876. [ 0.5742, -0.4474, 0.9834, -1.0159, -0.3229, -1.3159, 0.2314,
  32877. 0.3854],
  32878. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  32879. 0.0111],
  32880. [ 0.5488, -0.4221, 1.8018, -0.2459, -0.4845, -0.3075, 0.2309,
  32881. 0.3087],
  32882. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  32883. 0.0862],
  32884. [ 0.5227, -0.4615, 1.6575, -0.1304, -0.5076, -0.0149, 0.1815,
  32885. 0.0021],
  32886. [ 0.5603, -0.4319, 1.7788, 0.1775, -0.5538, -0.0611, 0.4797,
  32887. 0.1544]]], device='cuda:0')
  32888. loss_train_step before backward: tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward>)
  32889. loss_train_step after backward: tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward>)
  32890. loss_train: 0.8122478108853102
  32891. step: 55
  32892. running loss: 0.01476814201609655
  32893. Train Steps: 55/90 Loss: 0.0148 torch.Size([8, 600, 800])
  32894. torch.Size([8, 8])
  32895. tensor([[0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  32896. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  32897. [0.6197, 0.3986, 0.8800, 0.4617, 0.4188, 0.4783, 0.5687, 0.5550],
  32898. [0.6198, 0.4076, 0.7945, 0.2453, 0.4475, 0.1871, 0.5897, 0.5350],
  32899. [0.6205, 0.4016, 0.8350, 0.2717, 0.3987, 0.2550, 0.5787, 0.5133],
  32900. [0.6227, 0.4193, 0.8838, 0.4933, 0.3663, 0.3733, 0.5637, 0.5633],
  32901. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  32902. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983]],
  32903. device='cuda:0', dtype=torch.float64)
  32904. predictions are: tensor([[ 0.6733, -0.3537, 1.3374, -1.3534, -0.3475, -1.1263, 0.9403, 0.1226],
  32905. [ 0.4557, -0.5294, 1.6551, -0.3730, -0.5073, 0.0383, 0.2753, 0.0239],
  32906. [ 0.4782, -0.5015, 1.6879, -0.2401, -0.4075, -0.0528, 0.4632, 0.2047],
  32907. [ 0.5682, -0.3980, 1.3429, -1.2565, -0.1921, -1.4071, 0.6248, 0.1764],
  32908. [ 0.6195, -0.3795, 1.5597, -1.1509, -0.4353, -1.0833, 0.5308, 0.0891],
  32909. [ 0.5529, -0.4028, 1.6849, -0.0855, -0.6844, -0.5984, 0.4197, 0.4058],
  32910. [ 0.5639, -0.4079, 1.6461, 0.3015, -0.4696, -0.1384, 0.3921, 0.3661],
  32911. [ 0.4199, -0.5031, 1.5452, 0.2457, -0.6153, -0.5789, 0.3617, 0.4921]],
  32912. device='cuda:0', grad_fn=<AddmmBackward>)
  32913. landmarks are: tensor([[[ 0.6141, -0.4153, 1.4208, -1.2697, -0.2940, -1.0234, 0.8644,
  32914. 0.1715],
  32915. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  32916. 0.0231],
  32917. [ 0.5763, -0.4450, 1.7788, -0.1535, -0.3517, -0.0765, 0.3411,
  32918. 0.2776],
  32919. [ 0.5768, -0.4031, 1.3838, -1.1527, -0.2188, -1.4216, 0.4379,
  32920. 0.1850],
  32921. [ 0.5800, -0.4312, 1.5709, -1.0311, -0.4441, -1.1081, 0.3873,
  32922. 0.0851],
  32923. [ 0.5902, -0.3493, 1.7961, -0.0072, -0.5942, -0.5615, 0.3180,
  32924. 0.3161],
  32925. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  32926. 0.3007],
  32927. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  32928. 0.4778]]], device='cuda:0')
  32929. loss_train_step before backward: tensor(0.0060, device='cuda:0', grad_fn=<MseLossBackward>)
  32930. loss_train_step after backward: tensor(0.0060, device='cuda:0', grad_fn=<MseLossBackward>)
  32931. loss_train: 0.8182361843064427
  32932. step: 56
  32933. running loss: 0.01461136043404362
  32934. Train Steps: 56/90 Loss: 0.0146 torch.Size([8, 600, 800])
  32935. torch.Size([8, 8])
  32936. tensor([[0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  32937. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  32938. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  32939. [0.6246, 0.4126, 0.8850, 0.4833, 0.4200, 0.5350, 0.6112, 0.5250],
  32940. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  32941. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  32942. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  32943. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817]],
  32944. device='cuda:0', dtype=torch.float64)
  32945. predictions are: tensor([[ 0.5556, -0.4120, 1.6844, -0.5043, -0.7045, -0.3261, 0.6481, 0.2448],
  32946. [ 0.5690, -0.3721, 1.1256, -1.0251, -0.6030, -1.0134, 0.4253, 0.1987],
  32947. [-2.3533, -2.3378, 1.6712, -0.8950, 0.0409, -1.2024, 1.0081, 0.3700],
  32948. [ 0.5131, -0.4205, 1.6990, -0.0872, -0.4344, 0.0332, 0.6334, 0.1912],
  32949. [ 0.4841, -0.4213, 1.5142, -0.6901, -0.7282, -0.4796, 0.3208, 0.1235],
  32950. [ 0.6184, -0.3216, 1.5878, -0.5615, -0.4717, -0.9574, 0.4515, 0.4288],
  32951. [ 0.4499, -0.4935, 1.6163, -0.1788, -0.1629, -0.1551, 0.3060, 0.1087],
  32952. [ 0.5053, -0.4721, 1.4499, 0.3496, -0.3156, -0.0978, 0.2096, 0.0571]],
  32953. device='cuda:0', grad_fn=<AddmmBackward>)
  32954. landmarks are: tensor([[[ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  32955. 0.2083],
  32956. [ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  32957. 0.2335],
  32958. [-2.2859, -2.2859, 1.8192, -0.8540, 0.1448, -0.9849, 1.0143,
  32959. 0.4867],
  32960. [ 0.5991, -0.3803, 1.8018, -0.0534, -0.3460, 0.1852, 0.5374,
  32961. 0.1390],
  32962. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  32963. 0.0802],
  32964. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  32965. 0.3928],
  32966. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  32967. -0.0039],
  32968. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  32969. -0.0610]]], device='cuda:0')
  32970. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  32971. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  32972. loss_train: 0.8277576519176364
  32973. step: 57
  32974. running loss: 0.014522064068730463
  32975. Train Steps: 57/90 Loss: 0.0145 torch.Size([8, 600, 800])
  32976. torch.Size([8, 8])
  32977. tensor([[0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  32978. [0.6199, 0.4071, 0.7600, 0.2117, 0.4037, 0.2767, 0.6138, 0.5550],
  32979. [0.6200, 0.3998, 0.8850, 0.3950, 0.3500, 0.4650, 0.6138, 0.5400],
  32980. [0.6307, 0.4029, 0.8650, 0.5200, 0.3763, 0.4017, 0.7311, 0.5366],
  32981. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  32982. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  32983. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  32984. [0.6206, 0.4123, 0.7175, 0.2400, 0.3887, 0.2933, 0.6225, 0.5750]],
  32985. device='cuda:0', dtype=torch.float64)
  32986. predictions are: tensor([[ 0.3653, -0.5301, 1.4886, -0.5390, -0.5928, 0.0507, 0.2721, 0.2364],
  32987. [ 0.5125, -0.4335, 1.2703, -1.2746, -0.3055, -1.0842, 0.5741, 0.3149],
  32988. [ 0.4835, -0.5004, 1.7939, -0.4004, -0.6551, -0.2711, 0.3656, 0.2429],
  32989. [ 0.5630, -0.4785, 1.7487, 0.2648, -0.5154, -0.5629, 0.8131, 0.0676],
  32990. [ 0.5086, -0.5020, 1.8854, -0.2616, -0.4566, -0.1313, 0.9231, 0.2956],
  32991. [ 0.6456, -0.3688, 1.2962, -1.1110, -0.1280, -1.6545, 0.3240, 0.0716],
  32992. [ 0.6136, -0.3784, 1.8307, 0.0766, -0.5950, -0.2757, 0.2350, 0.2931],
  32993. [ 0.6073, -0.3740, 1.0229, -1.0454, -0.4761, -1.0501, 0.4470, 0.4177]],
  32994. device='cuda:0', grad_fn=<AddmmBackward>)
  32995. landmarks are: tensor([[[ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  32996. 0.0862],
  32997. [ 0.5775, -0.4054, 1.2245, -1.3082, -0.4210, -1.0080, 0.5490,
  32998. 0.2776],
  32999. [ 0.5778, -0.4393, 1.8018, -0.4614, -0.6693, -0.1381, 0.5490,
  33000. 0.2083],
  33001. [ 0.6273, -0.4249, 1.7095, 0.1159, -0.5480, -0.4306, 1.0910,
  33002. 0.1928],
  33003. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  33004. 0.2249],
  33005. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  33006. 0.1005],
  33007. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  33008. 0.3084],
  33009. [ 0.5805, -0.3818, 1.0282, -1.1774, -0.4903, -0.9310, 0.5894,
  33010. 0.3700]]], device='cuda:0')
  33011. loss_train_step before backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  33012. loss_train_step after backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  33013. loss_train: 0.8395349802449346
  33014. step: 58
  33015. running loss: 0.014474741038705769
  33016.  
  33017. Train Steps: 58/90 Loss: 0.0145 torch.Size([8, 600, 800])
  33018. torch.Size([8, 8])
  33019. tensor([[0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567],
  33020. [0.6133, 0.4066, 0.6787, 0.2617, 0.3800, 0.2433, 0.5147, 0.5358],
  33021. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  33022. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  33023. [0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  33024. [0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  33025. [0.6151, 0.4125, 0.8738, 0.4417, 0.3575, 0.3783, 0.5138, 0.5483],
  33026. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808]],
  33027. device='cuda:0', dtype=torch.float64)
  33028. predictions are: tensor([[ 0.4477, -0.5367, 1.7819, 0.2281, -0.5142, 0.0859, 0.5084, 0.3027],
  33029. [ 0.6758, -0.3454, 0.9215, -1.0019, -0.4842, -1.2423, 0.1739, 0.2234],
  33030. [ 0.5677, -0.3958, 1.6321, -0.6215, -0.5877, -0.8491, 0.4111, 0.2329],
  33031. [ 0.5721, -0.4261, 1.8749, -0.1511, -0.4139, 0.1686, 0.4451, 0.1869],
  33032. [ 0.5606, -0.4834, 1.8408, -0.0444, -0.3999, 0.0658, 0.7831, 0.1033],
  33033. [ 0.5758, -0.4490, 1.2640, -1.3102, -0.1981, -1.5140, 0.5301, 0.1225],
  33034. [ 0.4960, -0.4478, 1.6744, -0.1980, -0.6295, -0.6053, 0.1823, 0.3388],
  33035. [ 0.3174, -0.5879, 1.6093, -0.2038, -0.5482, -0.2282, 0.3039, 0.4434]],
  33036. device='cuda:0', grad_fn=<AddmmBackward>)
  33037. landmarks are: tensor([[[ 0.5770, -0.3918, 1.7961, 0.1544, -0.5480, 0.1467, 0.4450,
  33038. 0.2853],
  33039. [ 0.5470, -0.4081, 0.8492, -1.0773, -0.5307, -1.1620, 0.0912,
  33040. 0.1890],
  33041. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  33042. 0.2237],
  33043. [ 0.5711, -0.3788, 1.8249, -0.1766, -0.4672, 0.2160, 0.3625,
  33044. 0.0742],
  33045. [ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  33046. -0.0881],
  33047. [ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  33048. 0.1082],
  33049. [ 0.5551, -0.3807, 1.7499, -0.2459, -0.6346, -0.5384, 0.0871,
  33050. 0.2468],
  33051. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  33052. 0.3968]]], device='cuda:0')
  33053. loss_train_step before backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  33054. loss_train_step after backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  33055. loss_train: 0.8468739879317582
  33056. step: 59
  33057. running loss: 0.01435379640562302
  33058. Train Steps: 59/90 Loss: 0.0144 torch.Size([8, 600, 800])
  33059. torch.Size([8, 8])
  33060. tensor([[0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  33061. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  33062. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  33063. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  33064. [0.6264, 0.4035, 0.8888, 0.4883, 0.4050, 0.5217, 0.6361, 0.4791],
  33065. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  33066. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167],
  33067. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000]],
  33068. device='cuda:0', dtype=torch.float64)
  33069. predictions are: tensor([[ 0.5716, -0.4683, 1.6745, 0.2683, -0.6068, -0.3342, 0.6065, 0.1156],
  33070. [ 0.6136, -0.3583, 1.5699, -0.5214, -0.5876, -0.8559, 0.1447, 0.3616],
  33071. [ 0.3707, -0.5752, 1.5958, -0.3524, -0.5343, -0.1191, 0.1477, 0.1774],
  33072. [ 0.6514, -0.3415, 1.3220, -0.9513, -0.3702, -1.1556, 0.1929, 0.4177],
  33073. [ 0.5917, -0.4493, 1.7983, -0.0735, -0.4208, 0.0744, 0.7328, 0.0889],
  33074. [ 0.4227, -0.5170, 1.7463, 0.0612, -0.0829, 0.3032, 0.4088, 0.2015],
  33075. [ 0.4966, -0.4800, 1.8956, -0.3544, -0.4724, -0.7064, 0.7027, 0.3024],
  33076. [ 0.4521, -0.4958, 1.6725, -0.5166, -0.7062, -0.4615, 0.4067, 0.1989]],
  33077. device='cuda:0', grad_fn=<AddmmBackward>)
  33078. landmarks are: tensor([[[ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  33079. -0.1278],
  33080. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  33081. 0.2837],
  33082. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  33083. 0.0502],
  33084. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  33085. 0.3700],
  33086. [ 0.6074, -0.4223, 1.8192, -0.0303, -0.4152, 0.1236, 0.6524,
  33087. -0.0731],
  33088. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  33089. 0.0592],
  33090. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  33091. 0.1005],
  33092. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  33093. 0.0236]]], device='cuda:0')
  33094. loss_train_step before backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  33095. loss_train_step after backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  33096. loss_train: 0.8542463732883334
  33097. step: 60
  33098. running loss: 0.014237439554805557
  33099. Train Steps: 60/90 Loss: 0.0142 torch.Size([8, 600, 800])
  33100. torch.Size([8, 8])
  33101. tensor([[0.6193, 0.4108, 0.7438, 0.2700, 0.3650, 0.3683, 0.6238, 0.5717],
  33102. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  33103. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  33104. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  33105. [0.6350, 0.4043, 0.8738, 0.5650, 0.3850, 0.4750, 0.6401, 0.4950],
  33106. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  33107. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  33108. [0.6267, 0.4094, 0.8712, 0.3083, 0.4400, 0.2267, 0.6250, 0.5200]],
  33109. device='cuda:0', dtype=torch.float64)
  33110. predictions are: tensor([[ 0.4369, -0.4964, 1.1146, -1.0326, -0.6546, -0.4766, 0.3411, 0.4066],
  33111. [ 0.6392, -0.3629, 1.1748, -1.1745, -0.2520, -1.3513, 0.2541, 0.2668],
  33112. [ 0.3895, -0.5462, 1.7361, -0.3636, -0.5520, 0.3711, 0.4176, 0.3004],
  33113. [ 0.4097, -0.5550, 1.7841, 0.0594, -0.5848, -0.4577, 0.3989, 0.0598],
  33114. [ 0.4349, -0.5610, 1.6784, 0.2591, -0.5321, 0.0387, 0.3806, 0.0563],
  33115. [ 0.5784, -0.4637, 1.9492, -0.3301, -0.2924, -0.8105, 0.9900, 0.2359],
  33116. [ 0.6130, -0.4002, 1.7304, -0.6834, -0.4741, -1.0336, 0.3487, 0.0620],
  33117. [ 0.6742, -0.3106, 1.7169, -0.9077, -0.2364, -1.1439, 0.4729, 0.2411]],
  33118. device='cuda:0', grad_fn=<AddmmBackward>)
  33119. landmarks are: tensor([[[ 5.7471e-01, -3.8861e-01, 1.1494e+00, -1.0388e+00, -6.0000e-01,
  33120. -5.8460e-01, 5.9515e-01, 3.5458e-01],
  33121. [ 5.7841e-01, -4.1532e-01, 1.2972e+00, -1.2541e+00, -2.2647e-01,
  33122. -1.4553e+00, 4.7413e-01, 2.2033e-01],
  33123. [ 5.6143e-01, -4.0323e-01, 1.7961e+00, -3.8445e-01, -5.7113e-01,
  33124. 2.7760e-01, 5.9515e-01, 1.8522e-01],
  33125. [ 6.2730e-01, -4.1045e-01, 1.8480e+00, 1.0824e-01, -5.5381e-01,
  33126. -5.0762e-01, 6.4140e-01, -4.8817e-03],
  33127. [ 6.4706e-01, -4.1832e-01, 1.7499e+00, 3.2379e-01, -5.0762e-01,
  33128. -9.1917e-02, 6.7064e-01, 4.6189e-04],
  33129. [ 6.2236e-01, -4.3453e-01, 1.9404e+00, -2.9207e-01, -3.1709e-01,
  33130. -8.7714e-01, 1.0655e+00, 2.1421e-01],
  33131. [ 6.1339e-01, -4.2179e-01, 1.7268e+00, -6.1540e-01, -4.7298e-01,
  33132. -1.0850e+00, 5.4635e-01, -9.5723e-02],
  33133. [ 6.0889e-01, -3.9477e-01, 1.7383e+00, -8.6174e-01, -2.5358e-01,
  33134. -1.2390e+00, 6.0092e-01, 1.1594e-01]]], device='cuda:0')
  33135. loss_train_step before backward: tensor(0.0121, device='cuda:0', grad_fn=<MseLossBackward>)
  33136. loss_train_step after backward: tensor(0.0121, device='cuda:0', grad_fn=<MseLossBackward>)
  33137. loss_train: 0.8663500072434545
  33138. step: 61
  33139. running loss: 0.014202459135138597
  33140. Train Steps: 61/90 Loss: 0.0142 torch.Size([8, 600, 800])
  33141. torch.Size([8, 8])
  33142. tensor([[0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466],
  33143. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  33144. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  33145. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991],
  33146. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  33147. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  33148. [0.6275, 0.4024, 0.8600, 0.2283, 0.5350, 0.1800, 0.7074, 0.5413],
  33149. [0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874]],
  33150. device='cuda:0', dtype=torch.float64)
  33151. predictions are: tensor([[ 0.3651, -0.5405, 1.6259, -0.0620, -0.5820, 0.0492, 0.1450, 0.1149],
  33152. [-1.0391, -1.4939, 0.8902, -1.3470, -0.2780, -1.4584, 0.2304, 0.4114],
  33153. [ 0.5111, -0.4410, 1.7324, -0.5073, -0.7363, 0.0249, 0.4958, 0.1436],
  33154. [ 0.6049, -0.4107, 1.9642, -0.5052, -0.2794, -0.8110, 1.0207, 0.2991],
  33155. [ 0.5173, -0.4620, 1.6767, 0.4512, -0.4031, 0.0677, 0.3231, 0.0606],
  33156. [ 0.4464, -0.4915, 1.8005, -0.0707, -0.6219, -0.0269, 0.3503, 0.0424],
  33157. [ 0.9084, -0.1551, 1.7199, -1.1509, 0.0133, -1.4654, 0.9196, 0.0301],
  33158. [ 0.5109, -0.4292, 1.6963, 0.2100, -0.4320, -0.0112, -0.0428, 0.2638]],
  33159. device='cuda:0', grad_fn=<AddmmBackward>)
  33160. landmarks are: tensor([[[ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  33161. 0.2386],
  33162. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  33163. 0.3623],
  33164. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  33165. 0.2545],
  33166. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  33167. 0.4814],
  33168. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  33169. 0.2237],
  33170. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  33171. 0.1525],
  33172. [ 0.6125, -0.4273, 1.6864, -1.2313, 0.1852, -1.4545, 0.9814,
  33173. 0.2142],
  33174. [ 0.5453, -0.4091, 1.7499, 0.1390, -0.2940, -0.0996, 0.1300,
  33175. 0.4272]]], device='cuda:0')
  33176. loss_train_step before backward: tensor(0.0454, device='cuda:0', grad_fn=<MseLossBackward>)
  33177. loss_train_step after backward: tensor(0.0454, device='cuda:0', grad_fn=<MseLossBackward>)
  33178. loss_train: 0.9117817068472505
  33179. step: 62
  33180. running loss: 0.014706156562052427
  33181.  
  33182. Train Steps: 62/90 Loss: 0.0147 torch.Size([8, 600, 800])
  33183. torch.Size([8, 8])
  33184. tensor([[0.6183, 0.4076, 0.8838, 0.4517, 0.3813, 0.4483, 0.5775, 0.5633],
  33185. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  33186. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  33187. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400],
  33188. [ nan, nan, 0.8463, 0.2550, 0.5850, 0.2133, 0.7129, 0.6072],
  33189. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  33190. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667],
  33191. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167]],
  33192. device='cuda:0', dtype=torch.float64)
  33193. predictions are: tensor([[ 0.3876, -0.5186, 1.7843, -0.1677, -0.5246, -0.2142, 0.2486, 0.2402],
  33194. [ 0.5521, -0.4131, 1.4844, -0.9581, -0.3242, -1.1722, 0.6436, 0.1172],
  33195. [ 0.4796, -0.4917, 1.7374, -0.0860, -0.2325, 0.0316, 0.0268, -0.1138],
  33196. [ 0.5655, -0.4131, 1.6269, -0.6418, -0.6632, -0.6151, 0.5047, 0.1447],
  33197. [-2.0073, -2.1644, 1.5982, -0.9444, 0.2918, -1.1021, 1.0624, 0.3503],
  33198. [ 0.5611, -0.4074, 1.8383, -0.2921, -0.6295, -0.2790, 0.4994, -0.0903],
  33199. [ 0.4352, -0.4581, 1.0209, -0.8541, -0.6522, -0.8294, 0.1052, 0.2289],
  33200. [ 0.6101, -0.3655, 1.4231, -0.7075, -0.6191, -0.5375, 0.3774, 0.4063]],
  33201. device='cuda:0', grad_fn=<AddmmBackward>)
  33202. landmarks are: tensor([[[ 0.5700, -0.4032, 1.7961, -0.1997, -0.5249, -0.2151, 0.3815,
  33203. 0.3161],
  33204. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  33205. 0.1879],
  33206. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  33207. -0.0099],
  33208. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  33209. 0.2083],
  33210. [-2.2859, -2.2859, 1.6229, -1.1081, 0.4162, -1.3005, 1.0070,
  33211. 0.5188],
  33212. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  33213. -0.0400],
  33214. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  33215. 0.3315],
  33216. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  33217. 0.5624]]], device='cuda:0')
  33218. loss_train_step before backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  33219. loss_train_step after backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  33220. loss_train: 0.9208882143720984
  33221. step: 63
  33222. running loss: 0.014617273244001562
  33223. Train Steps: 63/90 Loss: 0.0146 torch.Size([8, 600, 800])
  33224. torch.Size([8, 8])
  33225. tensor([[0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  33226. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  33227. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533],
  33228. [0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  33229. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  33230. [0.6271, 0.4005, 0.8450, 0.6067, 0.3850, 0.4983, 0.6069, 0.4649],
  33231. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817],
  33232. [0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600]],
  33233. device='cuda:0', dtype=torch.float64)
  33234. predictions are: tensor([[ 5.7482e-01, -4.2917e-01, 1.6042e+00, 2.2142e-01, -3.1746e-01,
  33235. 1.4282e-01, 2.6080e-01, 1.7529e-02],
  33236. [ 6.0468e-01, -3.6197e-01, 1.5752e+00, -8.6071e-01, -7.0272e-01,
  33237. -5.9898e-01, 3.5001e-01, 2.9250e-01],
  33238. [-1.7935e+00, -2.0138e+00, 1.3754e+00, -1.0052e+00, -5.5799e-01,
  33239. -9.4388e-01, 3.6216e-01, 2.2459e-01],
  33240. [ 5.5556e-01, -3.8595e-01, 1.7956e+00, -1.1016e-01, -5.4520e-01,
  33241. -1.9756e-01, 1.6915e-01, 1.7724e-01],
  33242. [ 6.3051e-01, -3.9541e-01, 1.8195e+00, -1.0585e+00, -4.3913e-02,
  33243. -1.2640e+00, 9.3094e-01, -8.6043e-04],
  33244. [ 6.1835e-01, -3.9714e-01, 1.6594e+00, 3.2765e-01, -5.4559e-01,
  33245. 2.5476e-02, 5.1325e-01, -1.0676e-01],
  33246. [ 5.3566e-01, -3.9626e-01, 1.4632e+00, -9.3724e-01, -2.8451e-01,
  33247. -1.0030e+00, 3.8548e-01, 3.7415e-01],
  33248. [ 6.2579e-01, -3.6221e-01, 1.8387e+00, 1.5004e-01, -4.5995e-01,
  33249. 4.2121e-03, 3.9129e-01, 2.0803e-01]], device='cuda:0',
  33250. grad_fn=<AddmmBackward>)
  33251. landmarks are: tensor([[[ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  33252. -0.0911],
  33253. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  33254. 0.3315],
  33255. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  33256. 0.2699],
  33257. [ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  33258. 0.2657],
  33259. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  33260. 0.1821],
  33261. [ 0.6105, -0.4360, 1.6171, 0.5162, -0.5076, 0.0159, 0.5171,
  33262. -0.1385],
  33263. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  33264. 0.4008],
  33265. [ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  33266. 0.3007]]], device='cuda:0')
  33267. loss_train_step before backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  33268. loss_train_step after backward: tensor(0.0095, device='cuda:0', grad_fn=<MseLossBackward>)
  33269. loss_train: 0.9303545439615846
  33270. step: 64
  33271. running loss: 0.014536789749399759
  33272. Train Steps: 64/90 Loss: 0.0145 torch.Size([8, 600, 800])
  33273. torch.Size([8, 8])
  33274. tensor([[0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  33275. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  33276. [0.6250, 0.3993, 0.9138, 0.4333, 0.3763, 0.5217, 0.6995, 0.5320],
  33277. [0.6111, 0.3995, 0.8788, 0.4567, 0.3813, 0.4833, 0.5450, 0.5700],
  33278. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  33279. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  33280. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  33281. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285]],
  33282. device='cuda:0', dtype=torch.float64)
  33283. predictions are: tensor([[ 0.5780, -0.3837, 1.8008, -0.3853, -0.6711, -0.5892, 0.4198, 0.1675],
  33284. [ 0.3405, -0.5710, 1.7168, -0.1329, -0.2891, -0.0377, 0.1252, 0.1673],
  33285. [ 0.5260, -0.4815, 1.9134, -0.3315, -0.5640, 0.0606, 0.8162, 0.1185],
  33286. [ 0.5334, -0.4503, 1.7712, -0.2396, -0.5370, -0.1090, 0.2359, 0.1811],
  33287. [ 0.4991, -0.4842, 1.6608, 0.3424, -0.2535, -0.0699, 0.4387, 0.1371],
  33288. [ 0.7833, -0.1901, 1.4691, -0.5761, -0.1424, -1.3454, 0.1815, 0.5077],
  33289. [ 0.6020, -0.3899, 1.8731, -0.2790, -0.4664, 0.2550, 0.5829, 0.0653],
  33290. [ 0.7122, -0.3456, 1.8752, -0.1186, -0.4541, 0.2055, 0.8527, 0.0780]],
  33291. device='cuda:0', grad_fn=<AddmmBackward>)
  33292. landmarks are: tensor([[[ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  33293. 0.1544],
  33294. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  33295. 0.3238],
  33296. [ 0.6010, -0.4417, 1.9346, -0.2844, -0.5480, 0.1236, 0.9448,
  33297. 0.1715],
  33298. [ 0.5368, -0.4406, 1.7730, -0.1766, -0.5249, -0.0534, 0.2314,
  33299. 0.3469],
  33300. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  33301. 0.2237],
  33302. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  33303. 0.5882],
  33304. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  33305. 0.0851],
  33306. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  33307. 0.1554]]], device='cuda:0')
  33308. loss_train_step before backward: tensor(0.0056, device='cuda:0', grad_fn=<MseLossBackward>)
  33309. loss_train_step after backward: tensor(0.0056, device='cuda:0', grad_fn=<MseLossBackward>)
  33310. loss_train: 0.9359597829170525
  33311. step: 65
  33312. running loss: 0.014399381275646961
  33313. Train Steps: 65/90 Loss: 0.0144 torch.Size([8, 600, 800])
  33314. torch.Size([8, 8])
  33315. tensor([[0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  33316. [0.6199, 0.4093, 0.7913, 0.2533, 0.4288, 0.2467, 0.5975, 0.5700],
  33317. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  33318. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  33319. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  33320. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  33321. [0.6064, 0.3953, 0.8738, 0.4417, 0.3663, 0.4683, 0.5511, 0.5416],
  33322. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913]],
  33323. device='cuda:0', dtype=torch.float64)
  33324. predictions are: tensor([[ 0.5275, -0.4615, 1.7064, -0.4898, -0.5600, -0.7662, 0.4385, 0.1653],
  33325. [ 0.6013, -0.4050, 1.4063, -1.1010, -0.3349, -0.9689, 0.5350, 0.2417],
  33326. [ 0.7457, -0.3026, 1.4962, -0.7248, -0.5378, -0.3920, 0.5202, 0.4871],
  33327. [ 0.6284, -0.3964, 1.7495, -0.9078, -0.1837, -1.2448, 0.6356, 0.0381],
  33328. [ 0.6329, -0.3909, 1.8370, 0.0075, -0.5290, -0.1658, 0.4625, 0.3722],
  33329. [ 0.4794, -0.4647, 1.0918, -1.3628, -0.4908, -1.0768, 0.3367, 0.2329],
  33330. [ 0.5490, -0.4589, 1.8760, -0.1951, -0.5087, -0.0391, 0.3459, 0.0651],
  33331. [ 0.5781, -0.4790, 1.8421, 0.1577, -0.2619, 0.1640, 0.4385, -0.0967]],
  33332. device='cuda:0', grad_fn=<AddmmBackward>)
  33333. landmarks are: tensor([[[ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  33334. 0.1621],
  33335. [ 0.5771, -0.3955, 1.3688, -1.1158, -0.3055, -1.1466, 0.4739,
  33336. 0.3469],
  33337. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  33338. 0.5624],
  33339. [ 0.6126, -0.4161, 1.6344, -0.9541, -0.2247, -1.3467, 0.6339,
  33340. 0.0953],
  33341. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  33342. 0.5239],
  33343. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  33344. 0.2853],
  33345. [ 0.5149, -0.4603, 1.7499, -0.2459, -0.5942, -0.1227, 0.2596,
  33346. 0.2155],
  33347. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  33348. -0.0168]]], device='cuda:0')
  33349. loss_train_step before backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  33350. loss_train_step after backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  33351. loss_train: 0.9422118063084781
  33352. step: 66
  33353. running loss: 0.014275936459219365
  33354.  
  33355. Train Steps: 66/90 Loss: 0.0143 torch.Size([8, 600, 800])
  33356. torch.Size([8, 8])
  33357. tensor([[0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  33358. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575],
  33359. [0.6371, 0.4092, 0.8337, 0.5850, 0.3950, 0.5117, 0.6559, 0.5262],
  33360. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  33361. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  33362. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  33363. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  33364. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400]],
  33365. device='cuda:0', dtype=torch.float64)
  33366. predictions are: tensor([[ 0.5496, -0.4349, 1.7507, -0.4072, -0.6231, -0.4261, 0.2851, 0.0239],
  33367. [-2.2059, -2.2517, 1.9492, -0.6269, -0.1311, -1.0656, 0.8054, 0.3096],
  33368. [ 0.7202, -0.2978, 1.6103, 0.3138, -0.4298, 0.0925, 0.7170, 0.0483],
  33369. [ 0.4686, -0.4632, 1.3834, -0.9696, -0.6548, -0.4049, 0.5023, 0.1962],
  33370. [ 0.5204, -0.4374, 1.2730, -1.2612, -0.2085, -1.4333, 0.2908, 0.1288],
  33371. [ 0.7266, -0.2690, 1.8107, -0.2156, -0.3568, 0.3110, 0.4842, 0.3369],
  33372. [ 0.6644, -0.3100, 1.8463, 0.0909, -0.5299, -0.1275, 0.2842, 0.2648],
  33373. [ 0.6698, -0.3349, 1.6451, -0.0235, -0.1953, 0.1273, 0.3835, 0.2099]],
  33374. device='cuda:0', grad_fn=<AddmmBackward>)
  33375. landmarks are: tensor([[[ 5.6692e-01, -4.7937e-01, 1.7499e+00, -3.3826e-01, -6.7506e-01,
  33376. -4.2294e-01, 4.9700e-01, -6.1124e-02],
  33377. [-2.2859e+00, -2.2859e+00, 1.9115e+00, -5.3841e-01, -1.7852e-01,
  33378. -1.0773e+00, 8.2783e-01, 2.8902e-01],
  33379. [ 6.5695e-01, -3.9601e-01, 1.5651e+00, 4.1617e-01, -4.6143e-01,
  33380. 7.7444e-02, 7.4375e-01, 1.4474e-01],
  33381. [ 5.7633e-01, -4.1470e-01, 1.3226e+00, -1.0619e+00, -6.6351e-01,
  33382. -4.1524e-01, 5.3741e-01, 2.5450e-01],
  33383. [ 5.7956e-01, -4.3510e-01, 1.3342e+00, -1.3159e+00, -2.1894e-01,
  33384. -1.4853e+00, 4.0462e-01, 1.0054e-01],
  33385. [ 5.7719e-01, -3.9130e-01, 1.8480e+00, -2.4588e-01, -4.3256e-01,
  33386. 1.9292e-01, 5.3741e-01, 4.7005e-01],
  33387. [ 5.8793e-01, -3.5912e-01, 1.8018e+00, 1.2363e-01, -5.5958e-01,
  33388. -1.6120e-01, 3.4688e-01, 3.1609e-01],
  33389. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  33390. 1.0824e-01, 5.2587e-01, 2.0831e-01]]], device='cuda:0')
  33391. loss_train_step before backward: tensor(0.0051, device='cuda:0', grad_fn=<MseLossBackward>)
  33392. loss_train_step after backward: tensor(0.0051, device='cuda:0', grad_fn=<MseLossBackward>)
  33393. loss_train: 0.9472914161160588
  33394. step: 67
  33395. running loss: 0.01413867785247849
  33396. Train Steps: 67/90 Loss: 0.0141 torch.Size([8, 600, 800])
  33397. torch.Size([8, 8])
  33398. tensor([[0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  33399. [0.6212, 0.4033, 0.8938, 0.4167, 0.3813, 0.4267, 0.5613, 0.5583],
  33400. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  33401. [0.6131, 0.4064, 0.8638, 0.5200, 0.4788, 0.4783, 0.5258, 0.5867],
  33402. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  33403. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  33404. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  33405. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351]],
  33406. device='cuda:0', dtype=torch.float64)
  33407. predictions are: tensor([[ 0.6238, -0.3564, 1.6074, -1.0028, -0.3612, -1.0364, 0.5066, 0.2033],
  33408. [ 0.4492, -0.5054, 1.8988, -0.3947, -0.5929, -0.2613, 0.4276, 0.2535],
  33409. [ 0.4352, -0.4504, 1.6065, -0.7117, -0.6445, -0.7353, 0.2741, 0.2579],
  33410. [ 0.5791, -0.3839, 1.6990, 0.0284, -0.1213, 0.0138, 0.2417, 0.3851],
  33411. [ 0.6664, -0.3126, 1.7192, 0.2874, -0.3526, 0.0089, 0.3909, 0.3248],
  33412. [ 0.5155, -0.5051, 1.7634, 0.0443, -0.3976, 0.1064, 0.4973, -0.0456],
  33413. [ 0.6025, -0.4032, 1.5351, -1.0168, -0.3299, -0.9217, 0.9194, 0.3174],
  33414. [ 0.5629, -0.4255, 1.3034, -1.1134, -0.3056, -1.3572, 0.3460, 0.2011]],
  33415. device='cuda:0', grad_fn=<AddmmBackward>)
  33416. landmarks are: tensor([[[ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  33417. 0.2043],
  33418. [ 0.5832, -0.4231, 1.8423, -0.3614, -0.5249, -0.3152, 0.3065,
  33419. 0.2930],
  33420. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  33421. 0.2237],
  33422. [ 0.5462, -0.4090, 1.7037, 0.1159, -0.0746, -0.0765, 0.1427,
  33423. 0.4239],
  33424. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  33425. 0.3161],
  33426. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  33427. -0.0168],
  33428. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  33429. 0.2050],
  33430. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  33431. 0.1855]]], device='cuda:0')
  33432. loss_train_step before backward: tensor(0.0051, device='cuda:0', grad_fn=<MseLossBackward>)
  33433. loss_train_step after backward: tensor(0.0051, device='cuda:0', grad_fn=<MseLossBackward>)
  33434. loss_train: 0.9523771712556481
  33435. step: 68
  33436. running loss: 0.014005546636112472
  33437. Train Steps: 68/90 Loss: 0.0140 torch.Size([8, 600, 800])
  33438. torch.Size([8, 8])
  33439. tensor([[0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  33440. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  33441. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  33442. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  33443. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  33444. [0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  33445. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  33446. [0.6250, 0.3961, 0.8672, 0.4929, 0.4199, 0.4972, 0.6312, 0.5301]],
  33447. device='cuda:0', dtype=torch.float64)
  33448. predictions are: tensor([[ 0.5940, -0.3932, 1.7485, -0.6328, -0.6519, -0.2000, 0.3192, 0.1487],
  33449. [ 0.5559, -0.3739, 1.8155, -0.1258, -0.5492, -0.6956, 0.2571, 0.4124],
  33450. [ 0.3322, -0.5662, 1.3762, -1.2519, -0.3556, -1.0895, 0.3842, 0.3540],
  33451. [ 0.5320, -0.3999, 1.7015, -0.6836, -0.5756, -0.6865, 0.1819, 0.2674],
  33452. [ 0.4998, -0.4898, 1.5446, 0.2641, -0.4719, -0.0665, 1.0350, 0.3207],
  33453. [ 0.6239, -0.4223, 1.8720, -1.0206, 0.0367, -1.1793, 0.8825, 0.1049],
  33454. [ 0.5348, -0.4411, 0.8810, -1.2536, -0.4768, -1.1120, 0.1583, 0.3431],
  33455. [ 0.6846, -0.3897, 1.8536, 0.0126, -0.2834, 0.1039, 0.6548, 0.1332]],
  33456. device='cuda:0', grad_fn=<AddmmBackward>)
  33457. landmarks are: tensor([[[ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  33458. 0.0802],
  33459. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  33460. 0.3778],
  33461. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  33462. 0.3315],
  33463. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  33464. 0.2237],
  33465. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  33466. 0.3745],
  33467. [ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  33468. 0.1821],
  33469. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  33470. 0.3852],
  33471. [ 0.6010, -0.4562, 1.7198, -0.0090, -0.3464, 0.0108, 0.6294,
  33472. 0.1627]]], device='cuda:0')
  33473. loss_train_step before backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  33474. loss_train_step after backward: tensor(0.0058, device='cuda:0', grad_fn=<MseLossBackward>)
  33475. loss_train: 0.9581651668995619
  33476. step: 69
  33477. running loss: 0.013886451694196549
  33478. Train Steps: 69/90 Loss: 0.0139 torch.Size([8, 600, 800])
  33479. torch.Size([8, 8])
  33480. tensor([[0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  33481. [0.6145, 0.4007, 0.8775, 0.4533, 0.4562, 0.5533, 0.6088, 0.5533],
  33482. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  33483. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  33484. [0.6284, 0.4127, 0.8538, 0.5867, 0.4363, 0.5083, 0.6038, 0.5433],
  33485. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  33486. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  33487. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896]],
  33488. device='cuda:0', dtype=torch.float64)
  33489. predictions are: tensor([[ 0.3494, -0.5370, 1.2136, -1.3041, -0.4782, -0.9355, 0.5158, 0.2729],
  33490. [ 0.8429, -0.2129, 1.8653, -0.2707, -0.1902, 0.2714, 0.5865, 0.2691],
  33491. [ 0.6540, -0.3671, 1.8191, 0.0418, -0.4627, -0.0966, 0.4293, 0.1704],
  33492. [-2.2697, -2.2630, 1.3518, -1.1985, -0.3079, -1.3828, 0.2759, 0.2044],
  33493. [ 0.6816, -0.3238, 1.6917, 0.3073, -0.2383, 0.0343, 0.5112, 0.2740],
  33494. [ 0.5939, -0.3918, 1.9143, -0.0183, -0.5544, -0.5055, 0.6066, 0.0947],
  33495. [ 0.7189, -0.3206, 1.6926, 0.0616, -0.3304, -0.0278, 0.7087, 0.2288],
  33496. [ 0.7295, -0.2626, 1.5060, -0.6643, -0.5875, -0.8475, 0.1134, 0.5077]],
  33497. device='cuda:0', grad_fn=<AddmmBackward>)
  33498. landmarks are: tensor([[[ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  33499. 0.1390],
  33500. [ 0.5526, -0.4351, 1.7672, -0.1920, -0.1785, 0.2699, 0.5259,
  33501. 0.2699],
  33502. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  33503. 0.0919],
  33504. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  33505. 0.0231],
  33506. [ 0.6166, -0.3795, 1.6575, 0.4239, -0.2709, 0.0620, 0.5028,
  33507. 0.2237],
  33508. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  33509. -0.0049],
  33510. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  33511. 0.0697],
  33512. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  33513. 0.4374]]], device='cuda:0')
  33514. loss_train_step before backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  33515. loss_train_step after backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  33516. loss_train: 0.9678890649229288
  33517. step: 70
  33518. running loss: 0.013826986641756125
  33519.  
  33520. Train Steps: 70/90 Loss: 0.0138 torch.Size([8, 600, 800])
  33521. torch.Size([8, 8])
  33522. tensor([[0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  33523. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  33524. [0.6361, 0.4076, 0.8862, 0.5350, 0.3713, 0.4650, 0.6654, 0.5297],
  33525. [0.6161, 0.4076, 0.8900, 0.4667, 0.4125, 0.5917, 0.6262, 0.5367],
  33526. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  33527. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  33528. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  33529. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567]],
  33530. device='cuda:0', dtype=torch.float64)
  33531. predictions are: tensor([[ 0.8417, -0.2317, 1.7029, 0.0056, -0.2438, -0.0576, 0.3418, 0.2024],
  33532. [ 0.8047, -0.2616, 1.6958, 0.0687, -0.2768, -0.1067, 0.3044, 0.2138],
  33533. [ 0.9906, -0.1865, 1.8446, 0.1755, -0.5234, -0.1499, 0.9876, 0.1798],
  33534. [ 0.9552, -0.1518, 1.8578, -0.1127, -0.2964, 0.4549, 0.7682, 0.1948],
  33535. [ 0.7645, -0.2472, 1.7689, -0.1310, -0.5927, -0.5891, 0.2263, 0.2930],
  33536. [-1.9544, -2.0844, 1.3214, -1.0800, -0.4260, -1.0365, 0.2664, 0.2658],
  33537. [-1.9802, -2.0483, 1.3216, -0.8993, -0.3252, -1.1174, 0.3076, 0.4552],
  33538. [ 0.7517, -0.2976, 1.0570, -1.4151, -0.4750, -1.1065, 0.4526, 0.2947]],
  33539. device='cuda:0', grad_fn=<AddmmBackward>)
  33540. landmarks are: tensor([[[ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  33541. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  33542. [ 5.4348e-01, -4.5974e-01, 1.6575e+00, 1.5858e-02, -3.2286e-01,
  33543. -1.1501e-01, 1.8767e-01, 1.8544e-01],
  33544. [ 6.5201e-01, -4.0323e-01, 1.8076e+00, 1.8522e-01, -5.7113e-01,
  33545. -1.3811e-01, 7.8762e-01, 1.6077e-01],
  33546. [ 5.5978e-01, -4.0323e-01, 1.8249e+00, -1.3041e-01, -3.8060e-01,
  33547. 4.4696e-01, 6.0670e-01, 1.9292e-01],
  33548. [ 5.4434e-01, -3.9938e-01, 1.7499e+00, -1.2271e-01, -6.1732e-01,
  33549. -5.7691e-01, 4.8756e-03, 2.0706e-01],
  33550. [-2.2859e+00, -2.2859e+00, 1.2820e+00, -1.0801e+00, -5.8845e-01,
  33551. -1.0234e+00, 2.1409e-01, 1.0054e-01],
  33552. [-2.2859e+00, -2.2859e+00, 1.2303e+00, -7.8476e-01, -4.2102e-01,
  33553. -1.1158e+00, 2.2564e-01, 3.7768e-01],
  33554. [ 5.3557e-01, -4.2171e-01, 1.0339e+00, -1.4776e+00, -5.0762e-01,
  33555. -1.1081e+00, 4.2194e-01, 2.8530e-01]]], device='cuda:0')
  33556. loss_train_step before backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  33557. loss_train_step after backward: tensor(0.0211, device='cuda:0', grad_fn=<MseLossBackward>)
  33558. loss_train: 0.9890259634703398
  33559. step: 71
  33560. running loss: 0.013929943147469575
  33561. Train Steps: 71/90 Loss: 0.0139 torch.Size([8, 600, 800])
  33562. torch.Size([8, 8])
  33563. tensor([[0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  33564. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194],
  33565. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  33566. [0.6200, 0.4039, 0.8880, 0.4799, 0.3625, 0.4285, 0.5866, 0.5148],
  33567. [0.6164, 0.4102, 0.8850, 0.4867, 0.4213, 0.5983, 0.5609, 0.5038],
  33568. [0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  33569. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483],
  33570. [ nan, nan, 0.9088, 0.3783, 0.4562, 0.2617, 0.6741, 0.5575]],
  33571. device='cuda:0', dtype=torch.float64)
  33572. predictions are: tensor([[ 0.7189, -0.2970, 1.5169, -1.1217, -0.1463, -1.2613, 0.6161, 0.1181],
  33573. [-1.8552, -1.9676, 1.3940, -0.8310, -0.5719, -0.8433, 0.2184, 0.2288],
  33574. [ 0.9510, -0.1599, 1.5640, 0.3152, -0.3457, 0.1025, 0.5300, 0.3758],
  33575. [ 0.7031, -0.3321, 1.7282, -0.0901, -0.5328, -0.3028, 0.4581, 0.1999],
  33576. [ 0.9493, -0.1386, 1.6505, -0.0565, -0.2638, 0.3398, 0.5135, 0.2446],
  33577. [ 0.6160, -0.3527, 1.2463, -0.4025, -0.5617, -0.2948, 0.1490, 0.2339],
  33578. [ 0.8022, -0.2647, 1.6993, -0.3240, -0.4886, -0.0780, 0.6073, 0.2791],
  33579. [-1.9800, -2.0272, 1.8216, -0.6188, -0.1633, -1.1645, 0.7517, 0.3891]],
  33580. device='cuda:0', grad_fn=<AddmmBackward>)
  33581. landmarks are: tensor([[[ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  33582. -0.0209],
  33583. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  33584. 0.1133],
  33585. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  33586. 0.3161],
  33587. [ 0.5781, -0.4205, 1.8159, -0.0691, -0.6116, -0.3069, 0.4236,
  33588. 0.0919],
  33589. [ 0.5614, -0.3912, 1.8018, -0.0380, -0.3402, 0.4778, 0.3049,
  33590. 0.0412],
  33591. [ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  33592. 0.1552],
  33593. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  33594. 0.2468],
  33595. [-2.2859, -2.2859, 1.9115, -0.5384, -0.1785, -1.0773, 0.8278,
  33596. 0.2890]]], device='cuda:0')
  33597. loss_train_step before backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  33598. loss_train_step after backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  33599. loss_train: 1.010474806651473
  33600. step: 72
  33601. running loss: 0.014034372314603792
  33602. Train Steps: 72/90 Loss: 0.0140 torch.Size([8, 600, 800])
  33603. torch.Size([8, 8])
  33604. tensor([[0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  33605. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  33606. [0.6266, 0.4101, 0.8350, 0.2333, 0.3950, 0.2950, 0.6264, 0.4921],
  33607. [0.6147, 0.4026, 0.6600, 0.2467, 0.4088, 0.2150, 0.5489, 0.5773],
  33608. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  33609. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  33610. [0.6262, 0.4163, 0.8850, 0.5183, 0.3763, 0.4150, 0.6025, 0.5500],
  33611. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047]],
  33612. device='cuda:0', dtype=torch.float64)
  33613. predictions are: tensor([[ 0.3368, -0.5989, 1.3968, -1.2855, -0.2685, -1.2013, 0.8332, 0.1484],
  33614. [ 0.6560, -0.3918, 1.6908, 0.3211, -0.5529, -0.0343, 0.5810, 0.3675],
  33615. [ 0.6294, -0.4085, 1.5747, -1.2638, -0.4456, -0.9089, 0.5935, 0.0504],
  33616. [ 0.3532, -0.5393, 0.8963, -1.2529, -0.4193, -1.2993, 0.1756, 0.4006],
  33617. [ 0.4367, -0.4870, 1.7705, -0.0473, -0.0324, 0.0032, 0.1528, 0.2683],
  33618. [ 0.6308, -0.4134, 1.8200, 0.1440, -0.5066, -0.0720, 0.4684, 0.0920],
  33619. [ 0.4497, -0.4605, 1.8136, 0.0541, -0.5289, -0.4077, 0.5499, 0.3112],
  33620. [ 0.4315, -0.4607, 1.4753, -0.1712, -0.5194, -0.8658, 0.3211, 0.5433]],
  33621. device='cuda:0', grad_fn=<AddmmBackward>)
  33622. landmarks are: tensor([[[ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  33623. 0.1917],
  33624. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  33625. 0.5316],
  33626. [ 0.6081, -0.3918, 1.5709, -1.2082, -0.4614, -0.9233, 0.6072,
  33627. -0.0129],
  33628. [ 0.5532, -0.4264, 0.7626, -1.1466, -0.3979, -1.2928, 0.2494,
  33629. 0.3808],
  33630. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  33631. 0.3806],
  33632. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  33633. 0.0919],
  33634. [ 0.6066, -0.3632, 1.8018, 0.1082, -0.5480, -0.3691, 0.4970,
  33635. 0.2545],
  33636. [ 0.6069, -0.3309, 1.3742, -0.1493, -0.5365, -0.9541, 0.2884,
  33637. 0.5071]]], device='cuda:0')
  33638. loss_train_step before backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  33639. loss_train_step after backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  33640. loss_train: 1.0177430603653193
  33641. step: 73
  33642. running loss: 0.01394168575842903
  33643. Train Steps: 73/90 Loss: 0.0139 torch.Size([8, 600, 800])
  33644. torch.Size([8, 8])
  33645. tensor([[0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  33646. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  33647. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378],
  33648. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  33649. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  33650. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  33651. [0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  33652. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500]],
  33653. device='cuda:0', dtype=torch.float64)
  33654. predictions are: tensor([[ 0.6748, -0.3631, 1.6707, -0.1981, -0.4835, 0.0423, 0.1712, 0.0683],
  33655. [-2.2875, -2.2457, 1.4929, -0.7364, -0.6461, -0.9071, 0.2137, 0.1640],
  33656. [ 0.6945, -0.3782, 1.8052, -0.0300, -0.4562, -0.6526, 0.8941, 0.2610],
  33657. [ 0.8142, -0.2674, 1.6115, 0.0434, -0.3279, 0.1068, 0.7172, 0.3199],
  33658. [-1.7700, -1.8789, 1.6584, -0.8913, 0.1248, -1.2807, 0.8153, 0.4383],
  33659. [ 0.5807, -0.4324, 0.8782, -1.2439, -0.5315, -1.1515, 0.2223, 0.1654],
  33660. [ 0.8077, -0.2522, 1.6139, 0.1851, -0.2085, 0.1892, 0.3838, 0.1822],
  33661. [ 0.6567, -0.3555, 1.2165, -1.0069, -0.6257, -0.7862, 0.3077, 0.2937]],
  33662. device='cuda:0', grad_fn=<AddmmBackward>)
  33663. landmarks are: tensor([[[ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  33664. 0.0231],
  33665. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  33666. 0.0893],
  33667. [ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  33668. 0.1982],
  33669. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  33670. 0.1982],
  33671. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  33672. 0.3799],
  33673. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  33674. 0.0862],
  33675. [ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  33676. 0.0764],
  33677. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  33678. 0.2545]]], device='cuda:0')
  33679. loss_train_step before backward: tensor(0.0173, device='cuda:0', grad_fn=<MseLossBackward>)
  33680. loss_train_step after backward: tensor(0.0173, device='cuda:0', grad_fn=<MseLossBackward>)
  33681. loss_train: 1.0350117646157742
  33682. step: 74
  33683. running loss: 0.013986645467780731
  33684.  
  33685. Train Steps: 74/90 Loss: 0.0140 torch.Size([8, 600, 800])
  33686. torch.Size([8, 8])
  33687. tensor([[0.6223, 0.4171, 0.8750, 0.5500, 0.4050, 0.4817, 0.5675, 0.5600],
  33688. [0.6293, 0.3982, 0.8700, 0.5300, 0.3763, 0.4717, 0.7050, 0.5297],
  33689. [0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  33690. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283],
  33691. [0.6130, 0.4072, 0.8550, 0.4567, 0.3638, 0.3667, 0.5290, 0.5892],
  33692. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  33693. [0.6147, 0.4107, 0.8137, 0.3333, 0.3750, 0.2683, 0.5006, 0.5412],
  33694. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767]],
  33695. device='cuda:0', dtype=torch.float64)
  33696. predictions are: tensor([[ 0.5489, -0.4094, 1.6848, 0.0984, -0.4474, -0.0212, 0.4780, 0.3581],
  33697. [ 0.3928, -0.5698, 1.6149, -0.0116, -0.5300, -0.1118, 0.9159, 0.1718],
  33698. [ 0.4654, -0.4955, 1.4773, 0.1833, -0.3214, 0.1166, 0.3754, 0.1369],
  33699. [ 0.3872, -0.5270, 1.5909, -0.0495, -0.0616, -0.0460, 0.1934, 0.1892],
  33700. [ 0.4057, -0.4826, 1.6038, -0.3406, -0.6131, -0.5951, 0.2500, 0.4324],
  33701. [ 0.6082, -0.4286, 1.7353, -0.7135, -0.3392, -1.2192, 0.5991, 0.0500],
  33702. [ 0.4191, -0.5111, 1.3351, -0.8959, -0.5430, -0.9761, 0.1950, 0.1611],
  33703. [-2.9487, -2.6707, 1.2990, -0.8877, -0.3762, -1.1304, 0.2738, 0.2526]],
  33704. device='cuda:0', grad_fn=<AddmmBackward>)
  33705. landmarks are: tensor([[[ 0.5883, -0.3594, 1.7557, 0.2545, -0.4152, -0.0611, 0.3353,
  33706. 0.3007],
  33707. [ 0.6207, -0.4466, 1.7326, 0.1621, -0.5480, -0.1073, 0.9704,
  33708. 0.1608],
  33709. [ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  33710. -0.0911],
  33711. [ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  33712. 0.1544],
  33713. [ 0.5454, -0.4053, 1.6633, -0.1766, -0.6058, -0.5923, 0.1577,
  33714. 0.4357],
  33715. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  33716. -0.0529],
  33717. [ 0.5532, -0.3888, 1.4727, -0.7463, -0.5538, -1.0465, 0.0265,
  33718. 0.2138],
  33719. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  33720. 0.3777]]], device='cuda:0')
  33721. loss_train_step before backward: tensor(0.0204, device='cuda:0', grad_fn=<MseLossBackward>)
  33722. loss_train_step after backward: tensor(0.0204, device='cuda:0', grad_fn=<MseLossBackward>)
  33723. loss_train: 1.055397231131792
  33724. step: 75
  33725. running loss: 0.014071963081757228
  33726. Train Steps: 75/90 Loss: 0.0141 torch.Size([8, 600, 800])
  33727. torch.Size([8, 8])
  33728. tensor([[0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600],
  33729. [0.6273, 0.4143, 0.8750, 0.5700, 0.3987, 0.4717, 0.6013, 0.5467],
  33730. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  33731. [0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  33732. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422],
  33733. [0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  33734. [0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  33735. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817]],
  33736. device='cuda:0', dtype=torch.float64)
  33737. predictions are: tensor([[ 0.5642, -0.4334, 1.1553, -1.3390, -0.5370, -1.0926, 0.5606, 0.3162],
  33738. [ 0.4602, -0.4550, 1.6843, 0.3836, -0.4767, -0.2140, 0.6209, 0.2623],
  33739. [ 0.5543, -0.4040, 1.6614, 0.1765, -0.3040, 0.0755, 0.2942, 0.1887],
  33740. [ 0.5686, -0.4199, 1.7921, -0.1467, -0.1592, 0.0329, 0.5323, 0.2321],
  33741. [-2.2041, -2.1930, 1.2239, -0.9110, -0.5603, -1.3102, 0.1554, 0.1432],
  33742. [ 0.1707, -0.7323, 1.2666, -1.3800, -0.2301, -1.5770, 0.5435, 0.0338],
  33743. [ 0.3557, -0.5347, 1.6182, -0.3355, -0.6558, -0.1010, 0.4520, 0.2669],
  33744. [ 0.2443, -0.6425, 1.5739, 0.4655, -0.2944, -0.0588, 0.2487, 0.0846]],
  33745. device='cuda:0', grad_fn=<AddmmBackward>)
  33746. landmarks are: tensor([[[ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  33747. 0.3007],
  33748. [ 0.6115, -0.3724, 1.7557, 0.3469, -0.4441, -0.1073, 0.4912,
  33749. 0.2391],
  33750. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  33751. 0.2386],
  33752. [ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  33753. 0.2930],
  33754. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  33755. 0.2183],
  33756. [ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  33757. -0.0248],
  33758. [ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  33759. 0.3148],
  33760. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  33761. -0.0610]]], device='cuda:0')
  33762. loss_train_step before backward: tensor(0.0134, device='cuda:0', grad_fn=<MseLossBackward>)
  33763. loss_train_step after backward: tensor(0.0134, device='cuda:0', grad_fn=<MseLossBackward>)
  33764. loss_train: 1.068770982325077
  33765. step: 76
  33766. running loss: 0.014062776083224699
  33767. Train Steps: 76/90 Loss: 0.0141 torch.Size([8, 600, 800])
  33768. torch.Size([8, 8])
  33769. tensor([[0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  33770. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  33771. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350],
  33772. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  33773. [0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  33774. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583],
  33775. [0.6268, 0.4052, 0.8175, 0.2250, 0.4688, 0.1917, 0.6375, 0.5267],
  33776. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183]],
  33777. device='cuda:0', dtype=torch.float64)
  33778. predictions are: tensor([[ 5.2556e-01, -4.7396e-01, 1.8801e+00, -7.8138e-03, -6.2453e-01,
  33779. 3.7464e-02, 5.8580e-01, -1.2725e-02],
  33780. [ 4.0192e-01, -5.3662e-01, 1.7949e+00, 9.5810e-02, -6.1910e-01,
  33781. -1.8867e-01, 7.2414e-01, 2.0731e-01],
  33782. [ 3.6289e-01, -5.6181e-01, 1.6216e+00, 1.5098e-01, -3.6548e-01,
  33783. -4.9103e-02, 1.0999e-01, 1.4797e-01],
  33784. [ 3.2511e-01, -5.8615e-01, 1.7849e+00, -4.6862e-02, -6.3078e-01,
  33785. -4.6994e-01, 1.9428e-01, 1.4981e-01],
  33786. [ 5.6330e-01, -4.2058e-01, 1.7289e+00, -4.8876e-04, -2.2566e-01,
  33787. 3.5793e-01, 5.1060e-01, 1.5541e-01],
  33788. [-2.2766e+00, -2.2593e+00, 1.0513e+00, -1.0888e+00, -4.0269e-01,
  33789. -1.3363e+00, 1.0775e-01, 1.6716e-01],
  33790. [ 4.5438e-01, -5.3729e-01, 1.4152e+00, -1.1941e+00, -1.9299e-01,
  33791. -1.4076e+00, 7.0603e-01, 1.0110e-01],
  33792. [ 4.3415e-01, -4.6464e-01, 1.0296e+00, -7.9853e-01, -1.5969e-01,
  33793. -1.3360e+00, 3.0307e-01, 4.9511e-01]], device='cuda:0',
  33794. grad_fn=<AddmmBackward>)
  33795. landmarks are: tensor([[[ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  33796. -0.0490],
  33797. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  33798. 0.1499],
  33799. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  33800. 0.1854],
  33801. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  33802. 0.1824],
  33803. [ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  33804. 0.1082],
  33805. [-2.2859, -2.2859, 0.9922, -1.2021, -0.3229, -1.4314, 0.1044,
  33806. 0.2930],
  33807. [ 0.6092, -0.4143, 1.4901, -1.2467, -0.1208, -1.4006, 0.6587,
  33808. 0.1467],
  33809. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  33810. 0.5702]]], device='cuda:0')
  33811. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  33812. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  33813. loss_train: 1.0775065701454878
  33814. step: 77
  33815. running loss: 0.01399359182007127
  33816. Train Steps: 77/90 Loss: 0.0140 torch.Size([8, 600, 800])
  33817. torch.Size([8, 8])
  33818. tensor([[0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  33819. [0.6336, 0.4154, 0.8900, 0.2767, 0.4988, 0.2867, 0.7422, 0.5540],
  33820. [0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  33821. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  33822. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  33823. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  33824. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  33825. [0.6179, 0.4040, 0.7412, 0.1850, 0.3825, 0.2783, 0.5837, 0.5600]],
  33826. device='cuda:0', dtype=torch.float64)
  33827. predictions are: tensor([[ 1.8696e-01, -6.7659e-01, 1.6200e+00, 5.9537e-01, -5.5009e-01,
  33828. -5.2045e-02, 3.8511e-01, 3.9849e-01],
  33829. [ 5.6669e-01, -4.5132e-01, 1.8657e+00, -7.5506e-01, 5.8507e-02,
  33830. -1.1113e+00, 1.0879e+00, 2.1666e-01],
  33831. [ 2.5891e-01, -6.3093e-01, 8.7453e-01, -1.1247e+00, -5.1247e-01,
  33832. -1.2483e+00, 1.9881e-01, 7.4780e-02],
  33833. [ 3.3157e-01, -6.2260e-01, 1.7811e+00, -3.8282e-01, -5.5791e-01,
  33834. 1.4175e-01, 6.5250e-01, 1.2902e-01],
  33835. [ 1.8281e-01, -6.8666e-01, 1.7092e+00, 2.4061e-01, -2.2659e-01,
  33836. -6.1996e-02, 1.3360e-01, 2.7632e-01],
  33837. [ 5.4019e-01, -4.9346e-01, 1.7867e+00, -1.4107e-01, -6.5465e-01,
  33838. -4.7040e-01, 4.3645e-01, 1.0568e-03],
  33839. [ 3.5157e-01, -5.6563e-01, 1.6518e+00, -7.9254e-02, -5.3259e-01,
  33840. -8.8585e-02, 6.9966e-02, 4.8155e-02],
  33841. [ 6.5928e-01, -3.6591e-01, 1.1671e+00, -1.2855e+00, -5.0414e-01,
  33842. -1.1079e+00, 4.3803e-01, 2.8392e-01]], device='cuda:0',
  33843. grad_fn=<AddmmBackward>)
  33844. landmarks are: tensor([[[ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  33845. 0.5316],
  33846. [ 0.6405, -0.3671, 1.8249, -1.0080, 0.0178, -0.9618, 1.1422,
  33847. 0.2730],
  33848. [ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  33849. 0.0712],
  33850. [ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  33851. 0.1159],
  33852. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  33853. 0.3700],
  33854. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  33855. -0.0611],
  33856. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  33857. 0.0502],
  33858. [ 0.5680, -0.4201, 1.1379, -1.4314, -0.5192, -1.0003, 0.4104,
  33859. 0.3007]]], device='cuda:0')
  33860. loss_train_step before backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  33861. loss_train_step after backward: tensor(0.0214, device='cuda:0', grad_fn=<MseLossBackward>)
  33862. loss_train: 1.0989203732460737
  33863. step: 78
  33864. running loss: 0.014088722733924022
  33865.  
  33866. Train Steps: 78/90 Loss: 0.0141 torch.Size([8, 600, 800])
  33867. torch.Size([8, 8])
  33868. tensor([[0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  33869. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  33870. [0.6272, 0.4071, 0.8738, 0.5600, 0.3675, 0.3783, 0.5926, 0.4742],
  33871. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  33872. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  33873. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  33874. [0.6260, 0.4133, 0.8800, 0.5117, 0.3713, 0.3283, 0.6223, 0.4967],
  33875. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783]],
  33876. device='cuda:0', dtype=torch.float64)
  33877. predictions are: tensor([[ 0.3864, -0.5742, 1.8245, 0.1772, -0.4627, 0.0362, 0.2757, 0.0727],
  33878. [ 0.3755, -0.5567, 1.5371, -1.0199, -0.3176, -1.1191, 0.5130, 0.1074],
  33879. [ 0.5378, -0.4717, 1.8535, 0.2957, -0.5370, -0.3660, 0.3919, -0.0246],
  33880. [ 0.4323, -0.5277, 1.4370, -1.0060, -0.4104, -0.7326, 0.5667, 0.1857],
  33881. [ 0.3792, -0.5396, 0.9493, -1.1634, -0.2327, -1.3323, 0.2315, 0.4083],
  33882. [-2.9494, -2.7514, 1.1699, -1.0930, -0.3473, -1.1785, 0.1991, 0.1744],
  33883. [ 0.4948, -0.4716, 1.8885, 0.0686, -0.4718, -0.5718, 0.5318, 0.0908],
  33884. [ 0.4863, -0.4793, 1.0017, -0.9466, -0.5978, -0.7258, 0.2886, 0.2970]],
  33885. device='cuda:0', grad_fn=<AddmmBackward>)
  33886. landmarks are: tensor([[[ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  33887. 0.0919],
  33888. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  33889. 0.2043],
  33890. [ 0.6113, -0.4057, 1.7499, 0.3007, -0.5885, -0.5384, 0.4513,
  33891. -0.0957],
  33892. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  33893. 0.2160],
  33894. [ 0.5663, -0.4396, 0.8261, -1.1312, -0.2940, -1.3929, 0.2603,
  33895. 0.3700],
  33896. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  33897. 0.1373],
  33898. [ 0.6054, -0.3767, 1.7788, 0.0774, -0.5711, -0.7694, 0.5887,
  33899. 0.0081],
  33900. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  33901. 0.3854]]], device='cuda:0')
  33902. loss_train_step before backward: tensor(0.0227, device='cuda:0', grad_fn=<MseLossBackward>)
  33903. loss_train_step after backward: tensor(0.0227, device='cuda:0', grad_fn=<MseLossBackward>)
  33904. loss_train: 1.121607020497322
  33905. step: 79
  33906. running loss: 0.01419755722148509
  33907. Train Steps: 79/90 Loss: 0.0142 torch.Size([8, 600, 800])
  33908. torch.Size([8, 8])
  33909. tensor([[0.6236, 0.3966, 0.8850, 0.4967, 0.3638, 0.4017, 0.5850, 0.5183],
  33910. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  33911. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  33912. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  33913. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  33914. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  33915. [0.6299, 0.4008, 0.8450, 0.5350, 0.4213, 0.5000, 0.6350, 0.5100],
  33916. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164]],
  33917. device='cuda:0', dtype=torch.float64)
  33918. predictions are: tensor([[ 0.5590, -0.4708, 1.7701, -0.0477, -0.5697, -0.4099, 0.3951, 0.1113],
  33919. [ 0.2881, -0.6408, 1.7571, -0.1415, -0.1678, 0.0765, -0.0485, -0.0760],
  33920. [ 0.6762, -0.3469, 1.4456, -0.9191, -0.5233, -0.5599, 0.4077, 0.1622],
  33921. [ 0.5194, -0.5119, 1.8524, -0.1059, -0.5642, -0.4052, 0.7536, 0.1808],
  33922. [ 0.5069, -0.4797, 1.2314, -1.3000, -0.4628, -0.9837, 0.5290, 0.1718],
  33923. [ 0.5393, -0.4442, 1.7180, 0.1891, -0.5061, -0.5392, 0.3002, 0.1873],
  33924. [ 0.4009, -0.5789, 1.6085, 0.1635, -0.3419, 0.0440, 0.5460, 0.1089],
  33925. [ 0.1756, -0.6277, 1.6535, 0.0782, -0.4525, -0.8386, 0.2303, 0.5210]],
  33926. device='cuda:0', grad_fn=<AddmmBackward>)
  33927. landmarks are: tensor([[[ 0.5944, -0.4543, 1.8018, 0.0082, -0.6058, -0.4306, 0.4162,
  33928. 0.1082],
  33929. [ 0.5417, -0.4417, 1.7499, -0.1304, -0.1994, -0.0324, 0.0951,
  33930. -0.0099],
  33931. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  33932. 0.3469],
  33933. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  33934. 0.1768],
  33935. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  33936. 0.2032],
  33937. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  33938. 0.1698],
  33939. [ 0.6236, -0.4344, 1.6171, 0.1852, -0.3402, 0.0236, 0.6471,
  33940. 0.0697],
  33941. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  33942. 0.5612]]], device='cuda:0')
  33943. loss_train_step before backward: tensor(0.0109, device='cuda:0', grad_fn=<MseLossBackward>)
  33944. loss_train_step after backward: tensor(0.0109, device='cuda:0', grad_fn=<MseLossBackward>)
  33945. loss_train: 1.1325139282271266
  33946. step: 80
  33947. running loss: 0.014156424102839082
  33948. Train Steps: 80/90 Loss: 0.0142 torch.Size([8, 600, 800])
  33949. torch.Size([8, 8])
  33950. tensor([[ nan, nan, 0.8625, 0.2550, 0.5487, 0.2200, 0.7335, 0.5737],
  33951. [0.6182, 0.3982, 0.7541, 0.2379, 0.3959, 0.2792, 0.6079, 0.5389],
  33952. [0.6193, 0.4108, 0.7425, 0.2350, 0.3887, 0.2750, 0.5900, 0.5717],
  33953. [0.6184, 0.4079, 0.8350, 0.3700, 0.3675, 0.2883, 0.5312, 0.5783],
  33954. [0.6254, 0.3993, 0.8988, 0.4767, 0.3987, 0.5517, 0.6955, 0.5285],
  33955. [0.6317, 0.4038, 0.8287, 0.5900, 0.3800, 0.4717, 0.6295, 0.4986],
  33956. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  33957. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567]],
  33958. device='cuda:0', dtype=torch.float64)
  33959. predictions are: tensor([[-2.6894, -2.5739, 1.5702, -1.0534, 0.0456, -1.2679, 0.7645, 0.2454],
  33960. [ 0.4485, -0.5052, 1.2072, -1.1342, -0.5686, -0.9861, 0.4241, 0.1608],
  33961. [ 0.4587, -0.4829, 1.0750, -1.1103, -0.5859, -0.9948, 0.3502, 0.2427],
  33962. [ 0.5041, -0.4563, 1.5614, -0.5170, -0.6090, -0.8942, -0.1033, 0.2127],
  33963. [ 0.5302, -0.4635, 1.8460, -0.0276, -0.5491, 0.2861, 0.7146, 0.0353],
  33964. [ 0.5678, -0.4470, 1.5932, 0.4860, -0.6324, -0.0811, 0.4204, -0.0671],
  33965. [ 0.2759, -0.6126, 1.5074, -1.1428, 0.0767, -1.4070, 0.6163, 0.1728],
  33966. [ 0.5419, -0.3975, 1.6601, -0.1506, -0.1774, 0.0067, 0.1483, 0.1847]],
  33967. device='cuda:0', grad_fn=<AddmmBackward>)
  33968. landmarks are: tensor([[[-2.2859, -2.2859, 1.6979, -1.1081, 0.2487, -1.2697, 1.1020,
  33969. 0.3638],
  33970. [ 0.5697, -0.4466, 1.1973, -1.1871, -0.4571, -0.9965, 0.5219,
  33971. 0.2032],
  33972. [ 0.5746, -0.3882, 1.1436, -1.2005, -0.4903, -1.0157, 0.4393,
  33973. 0.3546],
  33974. [ 0.5704, -0.4019, 1.5709, -0.5769, -0.5885, -0.9541, 0.1679,
  33975. 0.3854],
  33976. [ 0.6026, -0.4417, 1.8654, -0.0842, -0.4441, 0.2622, 0.9265,
  33977. 0.1554],
  33978. [ 0.6320, -0.4206, 1.5420, 0.4393, -0.5307, -0.1073, 0.6216,
  33979. 0.0171],
  33980. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  33981. 0.2730],
  33982. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  33983. 0.2853]]], device='cuda:0')
  33984. loss_train_step before backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  33985. loss_train_step after backward: tensor(0.0195, device='cuda:0', grad_fn=<MseLossBackward>)
  33986. loss_train: 1.1520524276420474
  33987. step: 81
  33988. running loss: 0.014222869477062314
  33989. Train Steps: 81/90 Loss: 0.0142 torch.Size([8, 600, 800])
  33990. torch.Size([8, 8])
  33991. tensor([[0.6248, 0.4185, 0.8500, 0.5767, 0.4463, 0.4550, 0.5613, 0.5917],
  33992. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  33993. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  33994. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  33995. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  33996. [0.6271, 0.4081, 0.9081, 0.4894, 0.3700, 0.4283, 0.6661, 0.5274],
  33997. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  33998. [0.6164, 0.4066, 0.6625, 0.3033, 0.3775, 0.2967, 0.5725, 0.5833]],
  33999. device='cuda:0', dtype=torch.float64)
  34000. predictions are: tensor([[ 0.6217, -0.3808, 1.7538, 0.3747, -0.1461, -0.2232, 0.3396, 0.3322],
  34001. [ 0.5353, -0.4553, 1.8654, -0.2540, -0.3222, 0.1267, 0.5113, 0.1193],
  34002. [ 0.5424, -0.4752, 0.9778, -1.3349, -0.4621, -1.2054, 0.3810, -0.0704],
  34003. [ 0.5623, -0.4164, 1.7162, -0.0753, -0.5480, -0.1832, 0.1149, -0.0326],
  34004. [-2.3358, -2.3530, 1.2751, -0.9237, -0.3565, -1.1791, 0.2657, 0.3107],
  34005. [ 0.6190, -0.3997, 1.9346, -0.0340, -0.5371, -0.2918, 0.8412, 0.0862],
  34006. [ 0.6145, -0.3911, 1.7789, -0.3152, -0.5916, -0.7133, 0.2112, 0.2105],
  34007. [ 0.3885, -0.5344, 0.9275, -0.9589, -0.5050, -1.0208, 0.3161, 0.3429]],
  34008. device='cuda:0', grad_fn=<AddmmBackward>)
  34009. landmarks are: tensor([[[ 0.5999, -0.3530, 1.6402, 0.3777, -0.2247, -0.1843, 0.3065,
  34010. 0.4470],
  34011. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  34012. 0.3161],
  34013. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  34014. 0.0862],
  34015. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  34016. -0.1181],
  34017. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  34018. 0.3777],
  34019. [ 0.6108, -0.4008, 1.9088, -0.0253, -0.5769, -0.3075, 0.7905,
  34020. 0.1499],
  34021. [ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  34022. 0.4032],
  34023. [ 0.5614, -0.4080, 0.7741, -0.8848, -0.5423, -0.9156, 0.3584,
  34024. 0.4085]]], device='cuda:0')
  34025. loss_train_step before backward: tensor(0.0059, device='cuda:0', grad_fn=<MseLossBackward>)
  34026. loss_train_step after backward: tensor(0.0059, device='cuda:0', grad_fn=<MseLossBackward>)
  34027. loss_train: 1.157949673011899
  34028. step: 82
  34029. running loss: 0.014121337475754865
  34030.  
  34031. Train Steps: 82/90 Loss: 0.0141 torch.Size([8, 600, 800])
  34032. torch.Size([8, 8])
  34033. tensor([[0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413],
  34034. [0.6251, 0.4163, 0.8662, 0.4467, 0.3625, 0.3567, 0.6038, 0.5533],
  34035. [0.6185, 0.4129, 0.8900, 0.4567, 0.3937, 0.5417, 0.5734, 0.5110],
  34036. [0.6200, 0.3999, 0.8653, 0.5207, 0.4100, 0.5125, 0.5975, 0.5103],
  34037. [0.6129, 0.4114, 0.6950, 0.2467, 0.4050, 0.2133, 0.5363, 0.5550],
  34038. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  34039. [0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  34040. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138]],
  34041. device='cuda:0', dtype=torch.float64)
  34042. predictions are: tensor([[ 0.4949, -0.4959, 1.6806, -1.2023, 0.2291, -1.2822, 1.0642, 0.2773],
  34043. [ 0.5310, -0.4471, 1.7362, -0.1250, -0.6350, -0.7626, 0.4045, 0.2777],
  34044. [ 0.6785, -0.3380, 1.8746, -0.0475, -0.4372, 0.1743, 0.2674, 0.1442],
  34045. [ 0.6515, -0.4176, 1.7337, 0.2529, -0.4218, 0.0880, 0.3510, 0.0264],
  34046. [ 0.6312, -0.3546, 0.8784, -0.9879, -0.4545, -1.2742, 0.0937, 0.2359],
  34047. [ 0.6393, -0.3567, 1.4234, -0.8862, -0.6905, -0.6463, 0.3072, 0.2282],
  34048. [ 0.4639, -0.5364, 1.3209, -1.2894, -0.3382, -1.3093, 0.6672, -0.0192],
  34049. [ 0.6300, -0.3829, 1.5335, -0.3926, -0.6023, -0.6566, 0.4111, 0.4879]],
  34050. device='cuda:0', grad_fn=<AddmmBackward>)
  34051. landmarks are: tensor([[[ 6.2401e-01, -3.7675e-01, 1.6575e+00, -1.2851e+00, 2.9492e-01,
  34052. -1.2467e+00, 1.1276e+00, 2.1421e-01],
  34053. [ 6.0162e-01, -3.6328e-01, 1.7152e+00, -2.2279e-01, -6.1155e-01,
  34054. -6.3849e-01, 5.0277e-01, 2.6990e-01],
  34055. [ 5.7113e-01, -3.7875e-01, 1.8249e+00, -1.7660e-01, -4.6721e-01,
  34056. 2.1601e-01, 3.6246e-01, 7.4222e-02],
  34057. [ 5.7777e-01, -4.3888e-01, 1.7107e+00, 1.1921e-01, -3.9207e-01,
  34058. 8.1507e-02, 4.7413e-01, 7.1077e-02],
  34059. [ 5.4480e-01, -3.8591e-01, 9.2425e-01, -1.1466e+00, -4.1524e-01,
  34060. -1.3005e+00, 1.9099e-01, 2.7760e-01],
  34061. [ 5.6472e-01, -4.1286e-01, 1.4901e+00, -1.0619e+00, -6.4619e-01,
  34062. -5.8460e-01, 3.8730e-01, 2.7760e-01],
  34063. [ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  34064. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  34065. [ 5.4376e-01, -4.2055e-01, 1.5189e+00, -4.5373e-01, -6.1155e-01,
  34066. -6.2309e-01, 4.3649e-01, 5.4914e-01]]], device='cuda:0')
  34067. loss_train_step before backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  34068. loss_train_step after backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  34069. loss_train: 1.164504498243332
  34070. step: 83
  34071. running loss: 0.014030174677630505
  34072. Train Steps: 83/90 Loss: 0.0140 torch.Size([8, 600, 800])
  34073. torch.Size([8, 8])
  34074. tensor([[0.6213, 0.4001, 0.7712, 0.2117, 0.4338, 0.1800, 0.5850, 0.5183],
  34075. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  34076. [0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  34077. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  34078. [0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  34079. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767],
  34080. [0.6339, 0.4102, 0.9088, 0.4767, 0.3925, 0.5283, 0.7509, 0.5390],
  34081. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090]],
  34082. device='cuda:0', dtype=torch.float64)
  34083. predictions are: tensor([[ 0.4710, -0.5196, 1.1014, -1.3862, -0.2148, -1.5333, 0.3553, 0.0757],
  34084. [ 0.7050, -0.3146, 1.6446, -0.7035, -0.6196, -0.5095, 0.3162, 0.2193],
  34085. [ 0.7285, -0.2890, 1.6976, -0.3794, -0.5090, -0.0404, 0.3566, 0.4185],
  34086. [ 0.3456, -0.5866, 1.2864, -0.9612, -0.5184, -0.8896, 0.4405, 0.2379],
  34087. [ 0.8533, -0.2240, 1.6473, 0.3931, -0.4096, 0.0653, 0.3822, 0.2566],
  34088. [ 0.5720, -0.3857, 1.6606, -0.0632, -0.5481, -0.8728, 0.1911, 0.3357],
  34089. [ 0.6318, -0.4071, 1.8293, -0.1566, -0.4036, 0.1316, 1.0711, 0.2480],
  34090. [ 0.7790, -0.3147, 1.7108, -0.5726, -0.3795, -1.0664, 0.6091, 0.0483]],
  34091. device='cuda:0', grad_fn=<AddmmBackward>)
  34092. landmarks are: tensor([[[ 0.5838, -0.4379, 1.2764, -1.3082, -0.2824, -1.4545, 0.4162,
  34093. 0.1082],
  34094. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  34095. 0.3392],
  34096. [ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  34097. 0.5085],
  34098. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  34099. 0.1931],
  34100. [ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  34101. 0.3315],
  34102. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  34103. 0.3778],
  34104. [ 0.6421, -0.3912, 1.9115, -0.0842, -0.4730, 0.1544, 1.1824,
  34105. 0.2035],
  34106. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  34107. 0.0652]]], device='cuda:0')
  34108. loss_train_step before backward: tensor(0.0089, device='cuda:0', grad_fn=<MseLossBackward>)
  34109. loss_train_step after backward: tensor(0.0089, device='cuda:0', grad_fn=<MseLossBackward>)
  34110. loss_train: 1.173423076979816
  34111. step: 84
  34112. running loss: 0.013969322344997809
  34113. Train Steps: 84/90 Loss: 0.0140 torch.Size([8, 600, 800])
  34114. torch.Size([8, 8])
  34115. tensor([[0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  34116. [0.6229, 0.4107, 0.8137, 0.2883, 0.4750, 0.1717, 0.5813, 0.5400],
  34117. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  34118. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  34119. [0.6109, 0.4003, 0.8650, 0.4883, 0.4775, 0.4867, 0.5175, 0.5683],
  34120. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  34121. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  34122. [ nan, nan, 0.8213, 0.2700, 0.3775, 0.2817, 0.5425, 0.5533]],
  34123. device='cuda:0', dtype=torch.float64)
  34124. predictions are: tensor([[ 0.7204, -0.3026, 1.6254, 0.1875, -0.4491, -0.1383, 0.5085, 0.3773],
  34125. [ 0.5447, -0.3915, 1.5013, -1.1210, -0.1454, -1.4991, 0.5017, 0.1182],
  34126. [ 0.5424, -0.3848, 1.6505, -0.8521, -0.5953, -0.8380, 0.3130, 0.1086],
  34127. [ 0.5663, -0.3752, 0.8812, -1.0786, -0.5915, -1.0182, 0.2309, 0.2956],
  34128. [ 0.5830, -0.4065, 1.7906, -0.2180, -0.1265, -0.1026, 0.2333, 0.1712],
  34129. [ 0.7589, -0.2776, 1.6148, 0.1922, -0.3882, -0.1449, 0.5068, 0.4028],
  34130. [ 0.5904, -0.4397, 1.7383, 0.0546, -0.4931, -0.0932, 0.7224, 0.0257],
  34131. [-2.2089, -2.2824, 1.3509, -1.0788, -0.5869, -1.0564, 0.3734, 0.2143]],
  34132. device='cuda:0', grad_fn=<AddmmBackward>)
  34133. landmarks are: tensor([[[ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  34134. 0.5393],
  34135. [ 0.5911, -0.3888, 1.4727, -0.9541, -0.0919, -1.4930, 0.3988,
  34136. 0.2083],
  34137. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  34138. 0.2237],
  34139. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  34140. 0.4103],
  34141. [ 0.5359, -0.4370, 1.7095, -0.0303, -0.0804, -0.0380, 0.1044,
  34142. 0.3392],
  34143. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  34144. 0.5239],
  34145. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  34146. 0.0697],
  34147. [-2.2859, -2.2859, 1.5074, -1.0388, -0.5423, -0.9849, 0.2199,
  34148. 0.2699]]], device='cuda:0')
  34149. loss_train_step before backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  34150. loss_train_step after backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  34151. loss_train: 1.1836915975436568
  34152. step: 85
  34153. running loss: 0.01392578350051361
  34154. Train Steps: 85/90 Loss: 0.0139 torch.Size([8, 600, 800])
  34155. torch.Size([8, 8])
  34156. tensor([[0.6146, 0.4124, 0.8800, 0.4867, 0.3800, 0.4500, 0.5106, 0.5524],
  34157. [0.6199, 0.4065, 0.7598, 0.2385, 0.4317, 0.1981, 0.5933, 0.5221],
  34158. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833],
  34159. [0.6233, 0.4091, 0.8100, 0.2950, 0.3563, 0.3883, 0.6013, 0.5200],
  34160. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  34161. [0.6361, 0.4165, 0.9038, 0.5017, 0.3750, 0.3783, 0.6448, 0.5309],
  34162. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  34163. [ nan, nan, 0.7525, 0.2291, 0.3838, 0.3017, 0.6050, 0.5667]],
  34164. device='cuda:0', dtype=torch.float64)
  34165. predictions are: tensor([[ 0.7068, -0.2859, 1.7985, 0.0704, -0.5089, -0.2907, 0.1986, 0.2836],
  34166. [ 0.8525, -0.2179, 1.2044, -1.2195, -0.2814, -1.3455, 0.5076, 0.1458],
  34167. [ 0.8303, -0.2774, 1.7756, -0.0766, -0.5239, -0.1445, 0.4094, 0.0691],
  34168. [ 0.5732, -0.3968, 1.4232, -0.9013, -0.6039, -0.4955, 0.5431, 0.2011],
  34169. [ 0.6532, -0.3466, 1.7894, -0.0737, -0.2789, -0.0805, 0.4266, 0.3231],
  34170. [ 0.7064, -0.3133, 1.8737, 0.0259, -0.4378, -0.6395, 0.7381, 0.2126],
  34171. [ 0.5834, -0.3917, 1.1698, -1.2030, -0.4331, -1.0781, 0.5621, 0.4097],
  34172. [-1.9059, -2.0811, 1.1619, -1.2046, -0.4429, -1.0495, 0.4665, 0.3691]],
  34173. device='cuda:0', grad_fn=<AddmmBackward>)
  34174. landmarks are: tensor([[[ 0.5529, -0.3811, 1.7788, -0.0380, -0.5307, -0.2074, 0.0727,
  34175. 0.2657],
  34176. [ 0.5774, -0.4082, 1.2235, -1.1844, -0.2919, -1.3709, 0.4544,
  34177. 0.1256],
  34178. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  34179. -0.0534],
  34180. [ 0.5932, -0.3962, 1.4554, -0.9233, -0.6404, -0.4922, 0.4912,
  34181. 0.1159],
  34182. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  34183. 0.3084],
  34184. [ 0.6520, -0.3623, 1.8885, 0.0313, -0.5538, -0.5384, 0.6926,
  34185. 0.1661],
  34186. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  34187. 0.3777],
  34188. [-2.2859, -2.2859, 1.1898, -1.2278, -0.5134, -0.8925, 0.5085,
  34189. 0.3315]]], device='cuda:0')
  34190. loss_train_step before backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  34191. loss_train_step after backward: tensor(0.0100, device='cuda:0', grad_fn=<MseLossBackward>)
  34192. loss_train: 1.1936637787148356
  34193. step: 86
  34194. running loss: 0.013879811380405066
  34195.  
  34196. Train Steps: 86/90 Loss: 0.0139 torch.Size([8, 600, 800])
  34197. torch.Size([8, 8])
  34198. tensor([[0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  34199. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  34200. [0.6202, 0.4066, 0.8398, 0.2648, 0.3925, 0.2627, 0.5845, 0.5124],
  34201. [0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  34202. [0.6199, 0.4015, 0.8716, 0.5228, 0.3833, 0.4772, 0.5883, 0.5148],
  34203. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  34204. [0.6245, 0.4100, 0.7762, 0.2583, 0.4963, 0.1517, 0.5875, 0.5417],
  34205. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194]],
  34206. device='cuda:0', dtype=torch.float64)
  34207. predictions are: tensor([[ 0.6049, -0.3581, 1.7083, -0.1912, -0.1407, -0.0747, 0.4234, 0.3232],
  34208. [ 0.5529, -0.3694, 1.6717, -0.1886, -0.3450, -0.0744, 0.1994, 0.3777],
  34209. [ 0.5310, -0.4016, 1.4163, -1.1305, -0.4936, -1.0623, 0.4344, 0.1493],
  34210. [ 0.5927, -0.3553, 1.4686, -1.0565, -0.3416, -1.0536, 0.8740, 0.3268],
  34211. [ 0.6938, -0.3412, 1.7493, 0.0628, -0.5975, -0.1540, 0.5167, 0.1286],
  34212. [ 0.7393, -0.3116, 1.5618, 0.2102, -0.4959, -0.1859, 0.4538, 0.2352],
  34213. [ 0.6530, -0.2842, 1.1949, -1.1057, -0.1295, -1.5413, 0.4090, 0.3264],
  34214. [-2.0142, -2.1302, 1.3487, -0.9828, -0.6667, -0.8325, 0.3096, 0.2276]],
  34215. device='cuda:0', grad_fn=<AddmmBackward>)
  34216. landmarks are: tensor([[[ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  34217. 0.2853],
  34218. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  34219. 0.4032],
  34220. [ 0.5790, -0.4079, 1.5929, -1.0630, -0.4729, -1.0725, 0.4137,
  34221. 0.0807],
  34222. [ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  34223. 0.2050],
  34224. [ 0.5773, -0.4316, 1.7399, 0.1287, -0.5153, -0.0817, 0.4313,
  34225. 0.0919],
  34226. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  34227. 0.1313],
  34228. [ 0.5985, -0.3921, 1.2995, -1.0927, 0.0062, -1.5854, 0.4277,
  34229. 0.2160],
  34230. [-2.2859, -2.2859, 1.5478, -0.8309, -0.6289, -0.7232, 0.1198,
  34231. 0.1133]]], device='cuda:0')
  34232. loss_train_step before backward: tensor(0.0096, device='cuda:0', grad_fn=<MseLossBackward>)
  34233. loss_train_step after backward: tensor(0.0096, device='cuda:0', grad_fn=<MseLossBackward>)
  34234. loss_train: 1.2032914850860834
  34235. step: 87
  34236. running loss: 0.013830936610184866
  34237. Train Steps: 87/90 Loss: 0.0138 torch.Size([8, 600, 800])
  34238. torch.Size([8, 8])
  34239. tensor([[0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  34240. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  34241. [0.6068, 0.3963, 0.8650, 0.4317, 0.4037, 0.5083, 0.5253, 0.4999],
  34242. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  34243. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  34244. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  34245. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  34246. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246]],
  34247. device='cuda:0', dtype=torch.float64)
  34248. predictions are: tensor([[ 0.6805, -0.3348, 1.9624, -0.4664, -0.5938, -0.4975, 0.7282, 0.2224],
  34249. [ 0.6928, -0.3152, 1.1401, -1.1865, -0.4487, -1.0811, 0.5481, 0.2631],
  34250. [ 0.6312, -0.3960, 1.7950, -0.2478, -0.4948, 0.0599, 0.3920, 0.0744],
  34251. [ 0.6732, -0.2913, 1.1461, -1.0722, -0.3414, -1.0949, 0.5678, 0.6630],
  34252. [ 0.7776, -0.2525, 1.1160, -1.1318, -0.3865, -1.2380, 0.4634, 0.2548],
  34253. [ 0.6188, -0.3683, 1.3264, -1.0727, -0.2328, -1.4757, 0.4626, 0.1861],
  34254. [ 0.6825, -0.3208, 1.7779, 0.1908, -0.3806, 0.0440, 0.3096, 0.2934],
  34255. [-1.7795, -1.9782, 1.0829, -1.3242, -0.4301, -1.2074, 0.2961, 0.3201]],
  34256. device='cuda:0', grad_fn=<AddmmBackward>)
  34257. landmarks are: tensor([[[ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  34258. 0.1544],
  34259. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  34260. 0.2058],
  34261. [ 0.5168, -0.4556, 1.7095, -0.2921, -0.4210, 0.0620, 0.1404,
  34262. 0.0231],
  34263. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  34264. 0.6084],
  34265. [ 0.5850, -0.3925, 1.0513, -1.3467, -0.3517, -1.2620, 0.4739,
  34266. 0.1544],
  34267. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  34268. 0.1005],
  34269. [ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  34270. 0.2522],
  34271. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  34272. 0.1373]]], device='cuda:0')
  34273. loss_train_step before backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  34274. loss_train_step after backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  34275. loss_train: 1.2185192555189133
  34276. step: 88
  34277. running loss: 0.013846809721805832
  34278. Train Steps: 88/90 Loss: 0.0138 torch.Size([8, 600, 800])
  34279. torch.Size([8, 8])
  34280. tensor([[0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  34281. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  34282. [0.6305, 0.3983, 0.8950, 0.4833, 0.3688, 0.4683, 0.6375, 0.5117],
  34283. [0.6346, 0.4144, 0.9088, 0.4667, 0.3850, 0.4333, 0.7121, 0.5899],
  34284. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  34285. [0.6175, 0.4093, 0.8800, 0.4433, 0.4075, 0.4367, 0.5128, 0.4901],
  34286. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  34287. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266]],
  34288. device='cuda:0', dtype=torch.float64)
  34289. predictions are: tensor([[ 0.6163, -0.3500, 1.1294, -1.2303, -0.3170, -1.3979, 0.2945, 0.2448],
  34290. [ 0.6485, -0.4020, 1.5849, 0.4244, -0.2580, 0.0700, 0.1429, 0.1287],
  34291. [ 0.7184, -0.3741, 1.8447, -0.0733, -0.5955, -0.0847, 0.7442, 0.2117],
  34292. [ 0.6278, -0.3934, 1.9591, -0.1562, -0.4049, -0.2477, 1.0511, 0.4199],
  34293. [ 0.6740, -0.3122, 1.5357, -0.4706, -0.5488, -0.9307, 0.1926, 0.4752],
  34294. [ 0.6191, -0.4002, 1.8453, -0.2578, -0.4682, -0.1923, 0.1952, 0.1291],
  34295. [ 0.6972, -0.3326, 1.3606, -1.3241, -0.5866, -0.8800, 0.4947, 0.1693],
  34296. [ 0.6533, -0.3122, 1.0827, -1.2065, -0.3026, -1.0755, 0.5253, 0.7117]],
  34297. device='cuda:0', grad_fn=<AddmmBackward>)
  34298. landmarks are: tensor([[[ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  34299. 0.1343],
  34300. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  34301. -0.0610],
  34302. [ 0.6262, -0.4461, 1.8480, -0.0534, -0.5827, -0.1227, 0.6587,
  34303. 0.0774],
  34304. [ 0.6454, -0.3719, 1.9115, -0.1304, -0.5076, -0.2844, 1.0033,
  34305. 0.4386],
  34306. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  34307. 0.3928],
  34308. [ 0.5663, -0.3955, 1.7788, -0.2382, -0.4037, -0.2690, 0.0828,
  34309. -0.0220],
  34310. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  34311. 0.0620],
  34312. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  34313. 0.6084]]], device='cuda:0')
  34314. loss_train_step before backward: tensor(0.0050, device='cuda:0', grad_fn=<MseLossBackward>)
  34315. loss_train_step after backward: tensor(0.0050, device='cuda:0', grad_fn=<MseLossBackward>)
  34316. loss_train: 1.223516573663801
  34317. step: 89
  34318. running loss: 0.01374737723217754
  34319. Train Steps: 89/90 Loss: 0.0137 torch.Size([8, 600, 800])
  34320. torch.Size([8, 8])
  34321. tensor([[0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  34322. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  34323. [0.6198, 0.4115, 0.7762, 0.2717, 0.3713, 0.3200, 0.5837, 0.5683],
  34324. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  34325. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  34326. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  34327. [0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  34328. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413]],
  34329. device='cuda:0', dtype=torch.float64)
  34330. predictions are: tensor([[ 0.6415, -0.3877, 1.6808, -0.0775, -0.2826, 0.0688, 0.3160, 0.3622],
  34331. [ 0.6123, -0.4358, 1.6953, 0.1156, -0.4587, 0.1190, 0.5347, 0.1479],
  34332. [ 0.6549, -0.3544, 1.2989, -1.1406, -0.5752, -0.8567, 0.2800, 0.4329],
  34333. [ 0.7401, -0.3168, 1.7433, -0.5885, -0.5935, -0.5729, 0.5201, 0.0110],
  34334. [ 0.6757, -0.2947, 1.5974, -0.2606, -0.4664, -0.2819, -0.0857, 0.5438],
  34335. [ 0.6677, -0.3903, 1.5811, 0.2361, -0.5221, -0.2246, 0.3248, 0.2999],
  34336. [ 0.6235, -0.3914, 1.6939, -0.7000, -0.5345, -0.1516, 0.8339, 0.3037],
  34337. [ 0.6724, -0.3755, 1.9923, -0.5858, -0.0867, -1.1977, 0.9983, 0.3048]],
  34338. device='cuda:0', grad_fn=<AddmmBackward>)
  34339. landmarks are: tensor([[[ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  34340. 0.2391],
  34341. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  34342. 0.0236],
  34343. [ 0.5768, -0.3852, 1.2995, -1.0311, -0.5711, -0.8079, 0.4104,
  34344. 0.3392],
  34345. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  34346. -0.0670],
  34347. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  34348. 0.4145],
  34349. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  34350. 0.2075],
  34351. [ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  34352. 0.1554],
  34353. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  34354. 0.2142]]], device='cuda:0')
  34355. loss_train_step before backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  34356. loss_train_step after backward: tensor(0.0074, device='cuda:0', grad_fn=<MseLossBackward>)
  34357. loss_train: 1.230874984525144
  34358. step: 90
  34359. running loss: 0.013676388716946045
  34360.  
  34361. Valid Steps: 10/10 Loss: nan 37
  34362. --------------------------------------------------
  34363. Epoch: 9 Train Loss: 0.0137 Valid Loss: nan
  34364. --------------------------------------------------
  34365. size of train loader is: 90
  34366. torch.Size([8, 600, 800])
  34367. torch.Size([8, 8])
  34368. tensor([[0.6321, 0.4048, 0.8738, 0.5617, 0.3875, 0.4417, 0.6361, 0.4927],
  34369. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  34370. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  34371. [0.6087, 0.3976, 0.8337, 0.3867, 0.3713, 0.3117, 0.5938, 0.5300],
  34372. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  34373. [0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  34374. [0.6201, 0.4004, 0.8786, 0.5043, 0.3833, 0.5138, 0.5997, 0.5092],
  34375. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197]],
  34376. device='cuda:0', dtype=torch.float64)
  34377. predictions are: tensor([[ 0.6679, -0.4081, 1.7148, 0.2545, -0.5189, -0.2133, 0.6253, 0.0836],
  34378. [ 0.6459, -0.3418, 1.8009, -0.9554, -0.0123, -1.4325, 0.6081, 0.2512],
  34379. [ 0.5468, -0.3994, 1.2339, -0.7346, -0.6692, -0.4572, 0.1664, 0.4841],
  34380. [ 0.6728, -0.3519, 1.5303, -0.6012, -0.5453, -0.7852, 0.4589, 0.3779],
  34381. [ 0.6847, -0.3457, 1.3959, -1.0181, -0.4633, -0.9420, 0.4814, 0.2562],
  34382. [ 0.7260, -0.3154, 1.8198, -0.4252, -0.6058, -0.1752, 0.6467, 0.0982],
  34383. [ 0.5705, -0.4656, 1.7108, 0.0119, -0.4905, 0.1314, 0.3809, 0.2373],
  34384. [ 0.5818, -0.3801, 1.7161, -0.0282, -0.1464, 0.2088, 0.2626, 0.3285]],
  34385. device='cuda:0', grad_fn=<AddmmBackward>)
  34386. landmarks are: tensor([[[ 0.6335, -0.4162, 1.7499, 0.3084, -0.4961, -0.2459, 0.6524,
  34387. -0.0102],
  34388. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  34389. 0.0051],
  34390. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  34391. 0.3417],
  34392. [ 0.5255, -0.4495, 1.5651, -0.4999, -0.5711, -0.8463, 0.4566,
  34393. 0.1621],
  34394. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  34395. 0.1080],
  34396. [ 0.6072, -0.4075, 1.8942, -0.3537, -0.5423, -0.1612, 0.6277,
  34397. -0.0400],
  34398. [ 0.5783, -0.4363, 1.7724, 0.0432, -0.5153, 0.0871, 0.4840,
  34399. 0.0663],
  34400. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  34401. 0.1146]]], device='cuda:0')
  34402. loss_train_step before backward: tensor(0.0075, device='cuda:0', grad_fn=<MseLossBackward>)
  34403. loss_train_step after backward: tensor(0.0075, device='cuda:0', grad_fn=<MseLossBackward>)
  34404. loss_train: 0.0074615185149014
  34405. step: 1
  34406. running loss: 0.0074615185149014
  34407. Train Steps: 1/90 Loss: 0.0075 torch.Size([8, 600, 800])
  34408. torch.Size([8, 8])
  34409. tensor([[0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  34410. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320],
  34411. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  34412. [0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  34413. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  34414. [0.6280, 0.4101, 0.9050, 0.4533, 0.3775, 0.3217, 0.6338, 0.4915],
  34415. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329],
  34416. [0.6263, 0.4065, 0.9038, 0.4317, 0.3588, 0.4550, 0.6325, 0.5250]],
  34417. device='cuda:0', dtype=torch.float64)
  34418. predictions are: tensor([[ 0.6624, -0.3220, 1.6149, -0.7544, -0.4754, -0.6492, 0.2969, 0.4028],
  34419. [ 0.6560, -0.3936, 1.6232, 0.0781, -0.4228, 0.0890, 0.8605, 0.1984],
  34420. [ 0.6372, -0.3622, 1.6846, -0.1787, -0.1467, 0.0819, 0.0969, 0.0911],
  34421. [ 0.5155, -0.4592, 1.3896, 0.2184, -0.4286, -0.1787, 0.9320, 0.3922],
  34422. [ 0.6200, -0.3272, 1.5840, -0.5143, -0.5560, -0.8308, -0.1218, 0.2780],
  34423. [ 0.5761, -0.4320, 1.9143, -0.2647, -0.5046, -0.7932, 0.4572, 0.0386],
  34424. [ 0.6207, -0.3765, 1.6158, -0.8149, -0.6073, -0.5826, 0.3833, 0.2445],
  34425. [ 0.4286, -0.5189, 1.9060, -0.4003, -0.5482, -0.1925, 0.5965, 0.2424]],
  34426. device='cuda:0', grad_fn=<AddmmBackward>)
  34427. landmarks are: tensor([[[ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  34428. 0.3315],
  34429. [ 0.6273, -0.4393, 1.6402, 0.1313, -0.5076, 0.0467, 1.1532,
  34430. 0.1715],
  34431. [ 0.5249, -0.4473, 1.7326, -0.0919, -0.2016, 0.1544, 0.1733,
  34432. 0.0412],
  34433. [ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  34434. 0.3745],
  34435. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  34436. 0.2116],
  34437. [ 0.6148, -0.3918, 1.8942, -0.1920, -0.5423, -0.8002, 0.6414,
  34438. -0.0156],
  34439. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  34440. 0.1753],
  34441. [ 0.6070, -0.4085, 1.8885, -0.2921, -0.6289, -0.1843, 0.6356,
  34442. 0.1390]]], device='cuda:0')
  34443. loss_train_step before backward: tensor(0.0085, device='cuda:0', grad_fn=<MseLossBackward>)
  34444. loss_train_step after backward: tensor(0.0085, device='cuda:0', grad_fn=<MseLossBackward>)
  34445. loss_train: 0.015985853504389524
  34446. step: 2
  34447. running loss: 0.007992926752194762
  34448. Train Steps: 2/90 Loss: 0.0080 torch.Size([8, 600, 800])
  34449. torch.Size([8, 8])
  34450. tensor([[0.6274, 0.4087, 0.8375, 0.5700, 0.4025, 0.4800, 0.5700, 0.6117],
  34451. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  34452. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  34453. [0.6166, 0.4008, 0.8563, 0.5667, 0.4388, 0.4933, 0.5575, 0.5567],
  34454. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  34455. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  34456. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  34457. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167]],
  34458. device='cuda:0', dtype=torch.float64)
  34459. predictions are: tensor([[ 0.6501, -0.3832, 1.6167, 0.3688, -0.4298, -0.0988, 0.5013, 0.4481],
  34460. [ 0.5538, -0.4239, 1.8637, -0.2437, -0.4463, -0.1293, 0.2182, 0.0533],
  34461. [ 0.6812, -0.3732, 1.5055, -1.3821, -0.6032, -0.9587, 0.6223, -0.0342],
  34462. [ 0.5355, -0.4735, 1.7399, 0.3028, -0.2351, 0.0205, 0.4293, 0.2091],
  34463. [ 0.6038, -0.3897, 1.9341, -0.3007, -0.4164, 0.3271, 0.8311, 0.0847],
  34464. [ 0.4763, -0.4982, 1.6687, -0.5504, -0.7019, -0.4592, 0.3585, -0.0793],
  34465. [ 0.5035, -0.3993, 1.2370, -0.6837, -0.6868, -0.5294, 0.2725, 0.3857],
  34466. [ 0.6356, -0.3197, 1.2649, -0.7366, -0.0193, -1.4324, 0.3899, 0.5164]],
  34467. device='cuda:0', grad_fn=<AddmmBackward>)
  34468. landmarks are: tensor([[[ 0.6118, -0.3983, 1.5824, 0.3469, -0.4268, -0.0688, 0.3469,
  34469. 0.5393],
  34470. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  34471. 0.0893],
  34472. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  34473. 0.0620],
  34474. [ 0.5620, -0.4346, 1.6691, 0.3315, -0.2594, -0.0072, 0.2891,
  34475. 0.2853],
  34476. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  34477. 0.0851],
  34478. [ 0.5206, -0.4603, 1.4670, -0.4768, -0.6577, -0.3998, 0.1836,
  34479. 0.0021],
  34480. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  34481. 0.4036],
  34482. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  34483. 0.5624]]], device='cuda:0')
  34484. loss_train_step before backward: tensor(0.0084, device='cuda:0', grad_fn=<MseLossBackward>)
  34485. loss_train_step after backward: tensor(0.0084, device='cuda:0', grad_fn=<MseLossBackward>)
  34486. loss_train: 0.02438948256894946
  34487. step: 3
  34488. running loss: 0.008129827522983154
  34489. Train Steps: 3/90 Loss: 0.0081 torch.Size([8, 600, 800])
  34490. torch.Size([8, 8])
  34491. tensor([[0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633],
  34492. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  34493. [0.6221, 0.4107, 0.7788, 0.3033, 0.3950, 0.2817, 0.6075, 0.5517],
  34494. [0.6250, 0.4054, 0.8770, 0.4723, 0.4662, 0.5367, 0.6162, 0.5433],
  34495. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  34496. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  34497. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  34498. [ nan, nan, 0.7335, 0.2569, 0.3788, 0.2667, 0.5066, 0.5578]],
  34499. device='cuda:0', dtype=torch.float64)
  34500. predictions are: tensor([[ 5.5326e-01, -4.2534e-01, 1.0864e+00, -1.1242e+00, -2.1720e-01,
  34501. -1.4227e+00, 3.4412e-01, 1.9398e-01],
  34502. [ 4.9047e-01, -4.4277e-01, 1.7040e+00, -3.5306e-01, -6.0177e-01,
  34503. -3.8281e-01, 2.0634e-01, 6.6394e-03],
  34504. [ 4.8487e-01, -4.6687e-01, 1.4244e+00, -8.3061e-01, -4.0475e-01,
  34505. -9.4819e-01, 4.2932e-01, 2.4966e-01],
  34506. [ 6.4183e-01, -3.5516e-01, 1.7091e+00, -1.8088e-02, -1.4074e-01,
  34507. 2.4657e-01, 5.6285e-01, 1.6769e-01],
  34508. [ 6.6839e-01, -3.6778e-01, 1.8622e+00, -2.1339e-03, -5.3337e-01,
  34509. 1.3466e-01, 7.2328e-01, 5.1827e-02],
  34510. [ 5.6919e-01, -3.9543e-01, 1.7194e+00, -7.2178e-01, -3.5065e-01,
  34511. -8.3430e-01, 7.7734e-01, 2.2063e-01],
  34512. [ 6.5032e-01, -3.9691e-01, 1.7636e+00, -2.2513e-01, -6.1440e-01,
  34513. -2.3528e-01, 4.7430e-01, 3.8070e-02],
  34514. [-2.1769e+00, -2.2064e+00, 1.1524e+00, -1.1870e+00, -5.2893e-01,
  34515. -9.4108e-01, 8.8347e-02, 2.0739e-01]], device='cuda:0',
  34516. grad_fn=<AddmmBackward>)
  34517. landmarks are: tensor([[[ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  34518. 0.3161],
  34519. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  34520. 0.0862],
  34521. [ 0.5875, -0.3888, 1.3111, -0.8848, -0.4614, -0.9849, 0.5201,
  34522. 0.2622],
  34523. [ 0.6009, -0.4135, 1.7651, -0.1043, -0.1323, 0.1929, 0.5605,
  34524. 0.2237],
  34525. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  34526. 0.1313],
  34527. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  34528. 0.3050],
  34529. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  34530. -0.0099],
  34531. [-2.2859, -2.2859, 1.1020, -1.0994, -0.5365, -1.0542, 0.0542,
  34532. 0.2905]]], device='cuda:0')
  34533. loss_train_step before backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  34534. loss_train_step after backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  34535. loss_train: 0.030109287705272436
  34536. step: 4
  34537. running loss: 0.007527321926318109
  34538.  
  34539. Train Steps: 4/90 Loss: 0.0075 torch.Size([8, 600, 800])
  34540. torch.Size([8, 8])
  34541. tensor([[0.6250, 0.4116, 0.8700, 0.4850, 0.4650, 0.5567, 0.6088, 0.5183],
  34542. [0.6259, 0.4156, 0.8812, 0.3183, 0.4775, 0.1867, 0.6219, 0.4960],
  34543. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  34544. [0.6175, 0.3957, 0.8700, 0.4817, 0.4662, 0.5133, 0.5800, 0.5517],
  34545. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  34546. [0.6151, 0.4058, 0.7068, 0.2680, 0.3400, 0.4083, 0.5775, 0.5733],
  34547. [0.6097, 0.4000, 0.7325, 0.2667, 0.3450, 0.3517, 0.5284, 0.5045],
  34548. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433]],
  34549. device='cuda:0', dtype=torch.float64)
  34550. predictions are: tensor([[ 0.5593, -0.4216, 1.8539, 0.0233, -0.2211, 0.3257, 0.6745, 0.1137],
  34551. [ 0.5730, -0.4056, 1.9641, -0.6987, -0.1147, -1.4240, 0.6490, -0.0203],
  34552. [ 0.4865, -0.4275, 1.9484, 0.1791, -0.6681, -0.2434, 0.3987, 0.2926],
  34553. [ 0.6164, -0.4252, 1.7836, 0.0594, -0.1791, 0.0937, 0.4037, 0.1212],
  34554. [ 0.5586, -0.4110, 1.1464, -1.0049, -0.6523, -0.8031, 0.6228, 0.1723],
  34555. [ 0.4328, -0.5101, 1.1184, -0.9284, -0.7571, -0.4165, 0.4390, 0.2188],
  34556. [ 0.4403, -0.5205, 1.1551, -0.9474, -0.7202, -0.6720, 0.2133, -0.0217],
  34557. [ 0.5382, -0.4574, 1.7547, 0.2606, -0.0796, 0.0177, 0.1632, 0.2114]],
  34558. device='cuda:0', grad_fn=<AddmmBackward>)
  34559. landmarks are: tensor([[[ 0.6012, -0.3846, 1.7326, -0.0457, -0.1381, 0.2853, 0.5259,
  34560. 0.1082],
  34561. [ 0.6052, -0.3663, 1.7845, -0.8156, -0.0804, -1.4237, 0.5866,
  34562. 0.0051],
  34563. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  34564. 0.3623],
  34565. [ 0.5662, -0.4581, 1.7326, -0.0611, -0.1323, 0.0851, 0.3931,
  34566. 0.2622],
  34567. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  34568. 0.3007],
  34569. [ 0.5552, -0.4113, 0.9790, -1.0480, -0.7155, -0.3998, 0.3815,
  34570. 0.3623],
  34571. [ 0.5303, -0.4384, 1.0975, -1.0542, -0.6924, -0.6616, 0.1548,
  34572. 0.0442],
  34573. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  34574. 0.2237]]], device='cuda:0')
  34575. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  34576. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  34577. loss_train: 0.037714792881160975
  34578. step: 5
  34579. running loss: 0.0075429585762321946
  34580. Train Steps: 5/90 Loss: 0.0075 torch.Size([8, 600, 800])
  34581. torch.Size([8, 8])
  34582. tensor([[0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  34583. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650],
  34584. [0.6197, 0.4050, 0.7527, 0.2000, 0.4042, 0.2249, 0.5895, 0.4995],
  34585. [0.6283, 0.4283, 0.7477, 0.3542, 0.5125, 0.1917, 0.5500, 0.6167],
  34586. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  34587. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450],
  34588. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  34589. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973]],
  34590. device='cuda:0', dtype=torch.float64)
  34591. predictions are: tensor([[ 0.4132, -0.5643, 1.6594, 0.1873, -0.5100, 0.1605, 0.4882, 0.0102],
  34592. [ 0.3890, -0.5216, 1.6669, -0.0909, -0.3992, 0.1360, 0.0391, 0.1829],
  34593. [ 0.6699, -0.3643, 1.1973, -1.2907, -0.4870, -1.1349, 0.3494, -0.0741],
  34594. [ 0.5747, -0.3525, 1.1663, -0.6527, -0.0847, -1.2640, 0.1935, 0.5250],
  34595. [ 0.5285, -0.4959, 1.8223, -0.5301, -0.4036, -0.7936, 0.8845, 0.0212],
  34596. [ 0.5436, -0.4472, 1.8121, -0.1635, -0.4170, 0.2699, 0.4882, 0.1760],
  34597. [ 0.5868, -0.4045, 1.4909, -1.0393, -0.3746, -1.0620, 0.5821, 0.1467],
  34598. [ 0.5726, -0.4658, 1.8135, 0.1574, -0.6902, -0.0282, 0.5791, -0.0738]],
  34599. device='cuda:0', grad_fn=<AddmmBackward>)
  34600. landmarks are: tensor([[[ 0.6010, -0.4321, 1.6517, 0.2160, -0.4210, 0.0774, 0.6356,
  34601. 0.0313],
  34602. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  34603. 0.3238],
  34604. [ 0.5762, -0.4153, 1.1908, -1.3622, -0.4190, -1.2471, 0.4368,
  34605. 0.0213],
  34606. [ 0.6161, -0.3075, 1.1678, -0.6500, 0.0813, -1.4006, 0.2545,
  34607. 0.5624],
  34608. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  34609. 0.1821],
  34610. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  34611. 0.2314],
  34612. [ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  34613. 0.1879],
  34614. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  34615. 0.0111]]], device='cuda:0')
  34616. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  34617. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  34618. loss_train: 0.04535488644614816
  34619. step: 6
  34620. running loss: 0.0075591477410246926
  34621. Train Steps: 6/90 Loss: 0.0076 torch.Size([8, 600, 800])
  34622. torch.Size([8, 8])
  34623. tensor([[0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  34624. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344],
  34625. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  34626. [0.6072, 0.4029, 0.7037, 0.2150, 0.3912, 0.2267, 0.5516, 0.5507],
  34627. [0.6228, 0.4004, 0.8750, 0.5250, 0.3825, 0.5233, 0.6362, 0.5000],
  34628. [0.6164, 0.4076, 0.8838, 0.4117, 0.3713, 0.5550, 0.6238, 0.5350],
  34629. [0.6128, 0.4084, 0.8738, 0.4683, 0.3613, 0.3700, 0.4960, 0.5397],
  34630. [0.6118, 0.4052, 0.8463, 0.3917, 0.3538, 0.3450, 0.5053, 0.5593]],
  34631. device='cuda:0', dtype=torch.float64)
  34632. predictions are: tensor([[ 0.5229, -0.4542, 1.2582, -1.1586, -0.4608, -0.8265, 0.7056, 0.1246],
  34633. [ 0.5421, -0.4597, 1.8666, -0.0591, -0.5739, -0.4832, 0.3031, 0.0289],
  34634. [ 0.4805, -0.4632, 1.7951, -0.0926, 0.0650, 0.0324, 0.5053, 0.2165],
  34635. [ 0.5597, -0.4463, 0.9369, -1.2581, -0.4177, -1.2128, 0.3655, 0.1525],
  34636. [ 0.5571, -0.4922, 1.7682, 0.2352, -0.4721, 0.1582, 0.8246, -0.0903],
  34637. [ 0.5490, -0.4201, 1.7635, -0.2910, -0.4697, 0.3081, 0.7349, 0.2057],
  34638. [ 0.5234, -0.4357, 1.7965, -0.0241, -0.6572, -0.5234, 0.0793, 0.1230],
  34639. [ 0.4955, -0.4340, 1.6476, -0.4130, -0.6548, -0.6279, -0.0118, 0.1236]],
  34640. device='cuda:0', grad_fn=<AddmmBackward>)
  34641. landmarks are: tensor([[[ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  34642. 0.1621],
  34643. [ 0.5598, -0.4273, 1.7961, -0.1689, -0.5827, -0.5615, 0.1671,
  34644. 0.1824],
  34645. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  34646. 0.2776],
  34647. [ 0.5185, -0.4252, 0.9647, -1.2928, -0.4788, -1.2390, 0.2617,
  34648. 0.2576],
  34649. [ 0.5908, -0.4366, 1.7557, 0.1390, -0.5192, 0.1313, 0.6529,
  34650. 0.0236],
  34651. [ 0.5614, -0.4032, 1.7961, -0.3844, -0.5711, 0.2776, 0.5952,
  34652. 0.1852],
  34653. [ 0.5443, -0.3994, 1.7499, -0.1227, -0.6173, -0.5769, 0.0049,
  34654. 0.2071],
  34655. [ 0.5399, -0.4142, 1.6229, -0.4768, -0.6520, -0.6924, 0.0481,
  34656. 0.2972]]], device='cuda:0')
  34657. loss_train_step before backward: tensor(0.0054, device='cuda:0', grad_fn=<MseLossBackward>)
  34658. loss_train_step after backward: tensor(0.0054, device='cuda:0', grad_fn=<MseLossBackward>)
  34659. loss_train: 0.050726964604109526
  34660. step: 7
  34661. running loss: 0.007246709229158503
  34662. Train Steps: 7/90 Loss: 0.0072 torch.Size([8, 600, 800])
  34663. torch.Size([8, 8])
  34664. tensor([[0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  34665. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  34666. [0.6248, 0.4032, 0.7738, 0.1900, 0.4813, 0.1400, 0.5941, 0.4904],
  34667. [0.6277, 0.4118, 0.8988, 0.3833, 0.3950, 0.2650, 0.6290, 0.4938],
  34668. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  34669. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  34670. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841],
  34671. [0.6226, 0.4185, 0.8850, 0.5500, 0.3800, 0.4250, 0.5625, 0.5617]],
  34672. device='cuda:0', dtype=torch.float64)
  34673. predictions are: tensor([[ 0.5618, -0.3972, 1.6424, -0.7693, -0.2796, -1.2178, 0.3273, -0.0264],
  34674. [ 0.5328, -0.4261, 1.5671, -0.5516, -0.6503, 0.1277, 0.5681, 0.2026],
  34675. [ 0.5060, -0.4781, 1.2327, -1.2211, -0.0598, -1.4889, 0.3843, 0.0457],
  34676. [ 0.5032, -0.4759, 1.8289, -0.4374, -0.5492, -0.8765, 0.5361, -0.0238],
  34677. [ 0.4846, -0.4673, 1.5984, 0.0356, -0.1474, 0.2934, 0.0812, -0.0116],
  34678. [ 0.4216, -0.5137, 1.0399, -1.3717, -0.4076, -0.9645, 0.4648, 0.2284],
  34679. [ 0.5114, -0.4945, 1.7288, -0.2810, -0.4495, -0.4657, 1.0433, 0.2603],
  34680. [ 0.4677, -0.4175, 1.6918, 0.2672, -0.5914, -0.1755, 0.2433, 0.2968]],
  34681. device='cuda:0', grad_fn=<AddmmBackward>)
  34682. landmarks are: tensor([[[ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  34683. -0.0368],
  34684. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  34685. 0.2545],
  34686. [ 0.5999, -0.4236, 1.2880, -1.4083, -0.0630, -1.6393, 0.4584,
  34687. -0.0208],
  34688. [ 0.6135, -0.3841, 1.8654, -0.5153, -0.4614, -1.0619, 0.6195,
  34689. -0.0049],
  34690. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  34691. 0.0532],
  34692. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  34693. 0.2622],
  34694. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  34695. 0.4119],
  34696. [ 0.5897, -0.3527, 1.8018, 0.2545, -0.5307, -0.3229, 0.3122,
  34697. 0.3084]]], device='cuda:0')
  34698. loss_train_step before backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  34699. loss_train_step after backward: tensor(0.0097, device='cuda:0', grad_fn=<MseLossBackward>)
  34700. loss_train: 0.06042189570143819
  34701. step: 8
  34702. running loss: 0.007552736962679774
  34703.  
  34704. Train Steps: 8/90 Loss: 0.0076 torch.Size([8, 600, 800])
  34705. torch.Size([8, 8])
  34706. tensor([[0.6060, 0.3924, 0.8450, 0.5717, 0.4200, 0.5217, 0.5253, 0.4752],
  34707. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  34708. [0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  34709. [0.6198, 0.4105, 0.7950, 0.3267, 0.3675, 0.3767, 0.6038, 0.6167],
  34710. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  34711. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  34712. [0.6250, 0.4008, 0.8950, 0.4183, 0.3550, 0.4383, 0.6361, 0.4927],
  34713. [0.6307, 0.4029, 0.8988, 0.4817, 0.3937, 0.3500, 0.7311, 0.5378]],
  34714. device='cuda:0', dtype=torch.float64)
  34715. predictions are: tensor([[ 0.5586, -0.4238, 1.5115, 0.3208, -0.2791, 0.0410, 0.1167, -0.0283],
  34716. [ 0.5033, -0.4404, 1.2076, -0.9702, -0.4188, -0.7943, 0.3816, 0.4679],
  34717. [ 0.4406, -0.4708, 1.8064, -0.1864, -0.3350, 0.1449, 0.4002, 0.2132],
  34718. [ 0.3537, -0.5212, 1.3906, -0.8135, -0.5936, -0.4937, 0.3015, 0.4278],
  34719. [ 0.6171, -0.4108, 1.7262, -0.7019, -0.3729, -1.1624, 0.4567, -0.1241],
  34720. [ 0.6642, -0.3580, 1.7266, 0.0246, -0.3493, 0.3263, 0.7752, 0.1696],
  34721. [ 0.5559, -0.4502, 1.7533, -0.3565, -0.6303, -0.3345, 0.4073, 0.0063],
  34722. [ 0.5353, -0.4811, 1.8886, -0.0844, -0.4030, -0.6989, 0.9185, 0.0296]],
  34723. device='cuda:0', grad_fn=<AddmmBackward>)
  34724. landmarks are: tensor([[[ 0.5132, -0.4736, 1.6171, 0.3546, -0.3460, 0.1236, 0.1404,
  34725. -0.0911],
  34726. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  34727. 0.5701],
  34728. [ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  34729. 0.2776],
  34730. [ 0.5768, -0.3899, 1.3861, -0.7771, -0.5885, -0.5461, 0.5028,
  34731. 0.5624],
  34732. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  34733. -0.0957],
  34734. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  34735. 0.3157],
  34736. [ 0.6010, -0.4345, 1.8480, -0.3537, -0.6462, -0.2613, 0.6524,
  34737. -0.0099],
  34738. [ 0.6273, -0.4249, 1.8654, -0.0611, -0.4672, -0.6693, 1.0910,
  34739. 0.1982]]], device='cuda:0')
  34740. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  34741. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  34742. loss_train: 0.06914769345894456
  34743. step: 9
  34744. running loss: 0.00768307705099384
  34745. Train Steps: 9/90 Loss: 0.0077 torch.Size([8, 600, 800])
  34746. torch.Size([8, 8])
  34747. tensor([[0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  34748. [0.6179, 0.4082, 0.6688, 0.2667, 0.3588, 0.3317, 0.5750, 0.5783],
  34749. [0.6277, 0.4057, 0.8300, 0.2650, 0.4363, 0.1850, 0.6140, 0.4823],
  34750. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  34751. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  34752. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  34753. [0.6080, 0.4010, 0.8750, 0.4500, 0.4825, 0.5617, 0.5837, 0.5583],
  34754. [0.6201, 0.4116, 0.8725, 0.4733, 0.3700, 0.3217, 0.5386, 0.5767]],
  34755. device='cuda:0', dtype=torch.float64)
  34756. predictions are: tensor([[ 0.6758, -0.3886, 2.0155, -0.1198, -0.3333, -0.9112, 1.0076, 0.2153],
  34757. [ 0.4710, -0.4752, 0.8565, -1.0481, -0.6728, -0.7240, 0.1994, 0.2647],
  34758. [ 0.6471, -0.4175, 1.6222, -1.1371, -0.1707, -1.3694, 0.5561, -0.1339],
  34759. [ 0.5243, -0.4422, 1.0698, -1.1698, -0.5872, -0.7628, 0.4584, 0.1919],
  34760. [ 0.2242, -0.6373, 1.0507, -1.1499, -0.3268, -1.2658, 0.1022, 0.2798],
  34761. [ 0.6209, -0.4149, 1.9634, -0.0922, -0.5583, 0.1483, 1.0144, 0.0745],
  34762. [ 0.4827, -0.4694, 1.8218, -0.1977, -0.0812, 0.2834, 0.3023, 0.1277],
  34763. [ 0.4675, -0.4487, 1.7748, -0.0849, -0.5758, -0.7073, 0.1284, 0.2613]],
  34764. device='cuda:0', grad_fn=<AddmmBackward>)
  34765. landmarks are: tensor([[[ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  34766. 0.3692],
  34767. [ 0.5680, -0.4005, 0.8030, -1.0542, -0.6289, -0.7540, 0.3700,
  34768. 0.3854],
  34769. [ 0.6132, -0.4122, 1.5478, -1.0619, -0.2709, -1.4314, 0.5500,
  34770. -0.0583],
  34771. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  34772. 0.3007],
  34773. [ 0.5652, -0.3858, 1.0975, -1.1312, -0.3402, -1.4006, 0.1794,
  34774. 0.3469],
  34775. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  34776. 0.2302],
  34777. [ 0.5223, -0.4336, 1.7557, -0.2074, -0.0573, 0.3084, 0.4104,
  34778. 0.2930],
  34779. [ 0.5781, -0.3848, 1.7441, -0.0996, -0.5769, -0.8002, 0.2021,
  34780. 0.3778]]], device='cuda:0')
  34781. loss_train_step before backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  34782. loss_train_step after backward: tensor(0.0086, device='cuda:0', grad_fn=<MseLossBackward>)
  34783. loss_train: 0.07775980466976762
  34784. step: 10
  34785. running loss: 0.007775980466976762
  34786. Train Steps: 10/90 Loss: 0.0078 torch.Size([8, 600, 800])
  34787. torch.Size([8, 8])
  34788. tensor([[0.6263, 0.4029, 0.8900, 0.4933, 0.4075, 0.5183, 0.6406, 0.4758],
  34789. [0.6205, 0.4081, 0.8950, 0.4017, 0.3788, 0.4700, 0.5963, 0.5667],
  34790. [ nan, nan, 0.6900, 0.1917, 0.3937, 0.2367, 0.5240, 0.5246],
  34791. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  34792. [0.6201, 0.4027, 0.8029, 0.2728, 0.4042, 0.2310, 0.5980, 0.5391],
  34793. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  34794. [0.6311, 0.4008, 0.7935, 0.5746, 0.3900, 0.5033, 0.6955, 0.5366],
  34795. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402]],
  34796. device='cuda:0', dtype=torch.float64)
  34797. predictions are: tensor([[ 0.7300, -0.3389, 1.8162, -0.1014, -0.4492, 0.1221, 0.6110, -0.0020],
  34798. [ 0.7533, -0.2762, 1.7339, -0.4205, -0.6105, -0.0945, 0.4151, 0.1860],
  34799. [-1.9275, -2.0202, 1.1070, -1.3464, -0.4541, -1.1237, 0.0258, 0.1614],
  34800. [ 0.7344, -0.2898, 1.6910, 0.2567, -0.4216, 0.0965, 0.2483, 0.2432],
  34801. [ 0.7589, -0.2931, 1.4342, -1.0748, -0.3835, -1.2520, 0.3794, 0.0544],
  34802. [-1.2442, -1.5647, 1.6967, -1.2537, 0.2367, -1.2305, 0.9762, 0.3556],
  34803. [ 0.7263, -0.3257, 1.4122, 0.2276, -0.4983, -0.0615, 0.8091, 0.2047],
  34804. [ 0.6517, -0.3751, 1.6237, 0.1518, -0.4258, -0.1553, 0.3233, 0.1533]],
  34805. device='cuda:0', grad_fn=<AddmmBackward>)
  34806. landmarks are: tensor([[[ 0.6072, -0.4250, 1.8249, -0.0072, -0.4037, 0.1082, 0.6730,
  34807. -0.0881],
  34808. [ 0.5799, -0.4012, 1.8480, -0.4306, -0.5365, -0.1150, 0.4681,
  34809. 0.3315],
  34810. [-2.2859, -2.2859, 0.9012, -1.4006, -0.4672, -1.1928, 0.1342,
  34811. 0.1373],
  34812. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  34813. 0.3161],
  34814. [ 0.5785, -0.4259, 1.4228, -1.0261, -0.4190, -1.2189, 0.4763,
  34815. 0.2043],
  34816. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  34817. 0.2463],
  34818. [ 0.6289, -0.4345, 1.3794, 0.3679, -0.4845, 0.0390, 0.9265,
  34819. 0.1928],
  34820. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  34821. 0.2091]]], device='cuda:0')
  34822. loss_train_step before backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  34823. loss_train_step after backward: tensor(0.0361, device='cuda:0', grad_fn=<MseLossBackward>)
  34824. loss_train: 0.11386870825663209
  34825. step: 11
  34826. running loss: 0.010351700750602917
  34827. Train Steps: 11/90 Loss: 0.0104 torch.Size([8, 600, 800])
  34828. torch.Size([8, 8])
  34829. tensor([[0.6216, 0.4167, 0.8588, 0.5583, 0.3975, 0.5167, 0.5775, 0.5667],
  34830. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500],
  34831. [0.6143, 0.4040, 0.8237, 0.3333, 0.4075, 0.2117, 0.5137, 0.4973],
  34832. [0.6307, 0.4045, 0.8025, 0.5833, 0.3775, 0.4867, 0.6892, 0.5459],
  34833. [0.6200, 0.3993, 0.8639, 0.3687, 0.3658, 0.3139, 0.6002, 0.5374],
  34834. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  34835. [0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  34836. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483]],
  34837. device='cuda:0', dtype=torch.float64)
  34838. predictions are: tensor([[ 0.6214, -0.3683, 1.7116, 0.2403, -0.3745, 0.1278, 0.5127, 0.3513],
  34839. [ 0.5240, -0.4460, 1.2222, -1.2010, -0.5856, -0.7551, 0.4109, 0.2644],
  34840. [ 0.3942, -0.5166, 1.4681, -0.8702, -0.3608, -1.2539, 0.1577, 0.0390],
  34841. [ 0.6655, -0.3826, 1.4986, 0.1916, -0.4446, -0.0653, 1.0156, 0.2396],
  34842. [ 0.5855, -0.4402, 1.7162, -0.6379, -0.5470, -0.8691, 0.5754, 0.1821],
  34843. [ 0.3844, -0.5187, 1.5678, -0.6282, -0.6653, -0.4034, 0.3104, 0.2106],
  34844. [ 0.7308, -0.3358, 1.6167, -1.1079, 0.0411, -1.5191, 0.8376, 0.1383],
  34845. [ 0.5378, -0.4333, 1.7431, -0.5032, -0.4683, 0.0062, 0.4150, 0.2511]],
  34846. device='cuda:0', grad_fn=<AddmmBackward>)
  34847. landmarks are: tensor([[[ 0.5853, -0.3614, 1.6806, 0.2930, -0.4499, 0.1005, 0.3815,
  34848. 0.3315],
  34849. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  34850. 0.2545],
  34851. [ 0.5515, -0.4201, 1.5189, -0.7463, -0.4037, -1.3082, 0.0869,
  34852. 0.0111],
  34853. [ 0.6273, -0.4177, 1.4208, 0.4085, -0.5423, -0.0380, 0.8973,
  34854. 0.2356],
  34855. [ 0.5777, -0.4416, 1.7044, -0.5827, -0.5962, -0.8361, 0.4862,
  34856. 0.1963],
  34857. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  34858. 0.2365],
  34859. [ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  34860. 0.1020],
  34861. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  34862. 0.2468]]], device='cuda:0')
  34863. loss_train_step before backward: tensor(0.0045, device='cuda:0', grad_fn=<MseLossBackward>)
  34864. loss_train_step after backward: tensor(0.0045, device='cuda:0', grad_fn=<MseLossBackward>)
  34865. loss_train: 0.11839128797873855
  34866. step: 12
  34867. running loss: 0.009865940664894879
  34868.  
  34869. Train Steps: 12/90 Loss: 0.0099 torch.Size([8, 600, 800])
  34870. torch.Size([8, 8])
  34871. tensor([[0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300],
  34872. [0.6122, 0.4048, 0.7506, 0.3014, 0.3475, 0.3333, 0.5487, 0.5749],
  34873. [0.6263, 0.4057, 0.8800, 0.3833, 0.3650, 0.3717, 0.6375, 0.4804],
  34874. [0.6282, 0.4092, 0.8000, 0.2183, 0.4500, 0.2383, 0.6787, 0.5364],
  34875. [0.6124, 0.4075, 0.7696, 0.4153, 0.3475, 0.3767, 0.5157, 0.5427],
  34876. [0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  34877. [0.6262, 0.4052, 0.8888, 0.4700, 0.3675, 0.5117, 0.6350, 0.5233],
  34878. [ nan, nan, 0.8938, 0.2850, 0.4662, 0.3117, 0.7406, 0.5528]],
  34879. device='cuda:0', dtype=torch.float64)
  34880. predictions are: tensor([[ 0.5405, -0.4378, 1.2390, -1.2238, -0.4669, -0.9086, 0.6034, 0.2385],
  34881. [ 0.4922, -0.4575, 1.1102, -0.8623, -0.6171, -0.7878, 0.2250, 0.3683],
  34882. [ 0.6639, -0.4080, 1.8109, -0.4827, -0.5623, -0.6579, 0.6498, -0.0299],
  34883. [ 0.6907, -0.3644, 1.3608, -1.1843, -0.1819, -1.3539, 0.8125, 0.1886],
  34884. [ 0.5084, -0.4234, 1.3220, -0.4061, -0.6198, -0.5928, 0.0843, 0.2962],
  34885. [ 0.6199, -0.3647, 1.6480, 0.1301, -0.1844, 0.1268, 0.2038, 0.2411],
  34886. [ 0.6979, -0.3626, 1.8685, -0.0838, -0.4998, 0.0246, 0.6699, 0.1938],
  34887. [-1.8352, -1.9717, 1.9515, -0.8713, -0.0920, -0.9134, 1.1173, 0.3375]],
  34888. device='cuda:0', grad_fn=<AddmmBackward>)
  34889. landmarks are: tensor([[[ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  34890. 0.1621],
  34891. [ 0.5419, -0.4160, 1.1810, -0.8939, -0.6808, -0.7463, 0.2485,
  34892. 0.3694],
  34893. [ 0.6071, -0.4119, 1.7788, -0.5153, -0.6000, -0.5692, 0.6586,
  34894. -0.0670],
  34895. [ 0.6158, -0.3960, 1.4092, -1.2774, -0.2074, -1.1851, 0.8491,
  34896. 0.1917],
  34897. [ 0.5427, -0.4035, 1.2688, -0.3675, -0.6808, -0.5461, 0.0959,
  34898. 0.2206],
  34899. [ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  34900. 0.2386],
  34901. [ 0.6063, -0.4142, 1.8192, -0.1150, -0.5885, 0.0774, 0.6471,
  34902. 0.1313],
  34903. [-2.2859, -2.2859, 1.8423, -0.9695, -0.1323, -0.8463, 1.1349,
  34904. 0.2676]]], device='cuda:0')
  34905. loss_train_step before backward: tensor(0.0085, device='cuda:0', grad_fn=<MseLossBackward>)
  34906. loss_train_step after backward: tensor(0.0085, device='cuda:0', grad_fn=<MseLossBackward>)
  34907. loss_train: 0.1268529868684709
  34908. step: 13
  34909. running loss: 0.009757922066805454
  34910. Train Steps: 13/90 Loss: 0.0098 torch.Size([8, 600, 800])
  34911. torch.Size([8, 8])
  34912. tensor([[0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  34913. [0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  34914. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  34915. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  34916. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  34917. [0.6265, 0.4251, 0.7113, 0.3550, 0.4375, 0.2117, 0.5587, 0.6118],
  34918. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  34919. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611]],
  34920. device='cuda:0', dtype=torch.float64)
  34921. predictions are: tensor([[ 0.6785, -0.3535, 1.6476, -1.0522, -0.1186, -1.3418, 0.6660, 0.0418],
  34922. [ 0.7046, -0.3856, 1.7158, 0.1641, -0.4697, 0.1161, 0.5764, 0.0492],
  34923. [ 0.5759, -0.4075, 1.8268, -0.2217, -0.4446, 0.2211, 0.6357, 0.2442],
  34924. [-1.3988, -1.6600, 0.8677, -1.2617, -0.4867, -1.2016, 0.2127, 0.3967],
  34925. [-2.0198, -2.1018, 0.9475, -1.3378, -0.4070, -1.3136, 0.2460, 0.3122],
  34926. [ 0.7884, -0.2667, 1.1408, -0.7161, -0.3460, -1.2052, 0.4208, 0.4894],
  34927. [ 0.5331, -0.4345, 1.5298, -1.1118, -0.2301, -1.2077, 0.6807, 0.1989],
  34928. [ 0.6563, -0.3672, 1.7630, -0.0805, -0.3497, -0.0191, 0.3838, 0.3103]],
  34929. device='cuda:0', grad_fn=<AddmmBackward>)
  34930. landmarks are: tensor([[[ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  34931. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  34932. [ 5.7673e-01, -4.3957e-01, 1.6782e+00, 1.9046e-01, -3.8437e-01,
  34933. 3.0841e-02, 4.5876e-01, 8.5521e-02],
  34934. [ 5.7258e-01, -4.1594e-01, 1.8192e+00, -2.4588e-01, -3.4018e-01,
  34935. 1.1594e-01, 4.7968e-01, 3.1609e-01],
  34936. [-2.2859e+00, -2.2859e+00, 8.0331e-01, -1.1250e+00, -3.8637e-01,
  34937. -1.3082e+00, 1.1262e-01, 4.5430e-01],
  34938. [-2.2859e+00, -2.2859e+00, 6.7598e-01, -1.4083e+00, -3.2864e-01,
  34939. -1.4160e+00, 2.4873e-01, 3.4688e-01],
  34940. [ 6.0774e-01, -3.2256e-01, 9.9931e-01, -6.4619e-01, -2.6513e-01,
  34941. -1.3082e+00, 2.9460e-01, 5.4012e-01],
  34942. [ 5.9579e-01, -3.8176e-01, 1.5536e+00, -1.1081e+00, -2.0739e-01,
  34943. -1.3390e+00, 5.6628e-01, 2.0831e-01],
  34944. [ 5.4908e-01, -4.2902e-01, 1.7788e+00, -1.0731e-01, -2.6513e-01,
  34945. -1.0731e-01, 2.5553e-01, 3.0567e-01]]], device='cuda:0')
  34946. loss_train_step before backward: tensor(0.0278, device='cuda:0', grad_fn=<MseLossBackward>)
  34947. loss_train_step after backward: tensor(0.0278, device='cuda:0', grad_fn=<MseLossBackward>)
  34948. loss_train: 0.15469072526320815
  34949. step: 14
  34950. running loss: 0.011049337518800582
  34951. Train Steps: 14/90 Loss: 0.0110 torch.Size([8, 600, 800])
  34952. torch.Size([8, 8])
  34953. tensor([[0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  34954. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  34955. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  34956. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  34957. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  34958. [ nan, nan, 0.7225, 0.2167, 0.3987, 0.2283, 0.5427, 0.5181],
  34959. [0.6161, 0.4099, 0.8738, 0.4383, 0.3788, 0.5483, 0.5605, 0.5019],
  34960. [0.6282, 0.4029, 0.8988, 0.3000, 0.4250, 0.4183, 0.7042, 0.5575]],
  34961. device='cuda:0', dtype=torch.float64)
  34962. predictions are: tensor([[ 0.4819, -0.5002, 1.7234, -0.0345, -0.4618, -0.2502, 0.4140, 0.3121],
  34963. [ 0.5653, -0.4157, 1.7060, -0.1241, -0.2971, -0.1908, 0.3426, 0.3553],
  34964. [ 0.4675, -0.4928, 1.6902, 0.0889, -0.2267, 0.0156, 0.6133, 0.1752],
  34965. [ 0.4411, -0.5210, 1.7248, -0.1622, -0.1141, -0.0964, 0.2784, 0.0968],
  34966. [ 0.8619, -0.1851, 1.7110, 0.1010, -0.5076, -0.9692, 0.5351, 0.5752],
  34967. [-2.5459, -2.4300, 0.9579, -1.4209, -0.5373, -1.2719, 0.2063, 0.1480],
  34968. [ 0.5651, -0.4017, 1.7222, -0.3233, -0.5675, 0.1211, 0.5236, 0.2215],
  34969. [ 0.6173, -0.4305, 1.7402, -0.8352, -0.4560, -0.4488, 1.1476, 0.3046]],
  34970. device='cuda:0', grad_fn=<AddmmBackward>)
  34971. landmarks are: tensor([[[ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  34972. 0.3777],
  34973. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  34974. 0.3057],
  34975. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  34976. 0.0851],
  34977. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  34978. -0.0039],
  34979. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  34980. 0.5612],
  34981. [-2.2859, -2.2859, 1.0513, -1.2851, -0.4441, -1.2313, 0.2206,
  34982. 0.1073],
  34983. [ 0.5597, -0.3928, 1.7499, -0.2613, -0.5365, 0.2468, 0.3028,
  34984. 0.0321],
  34985. [ 0.6158, -0.4249, 1.8654, -0.9002, -0.3229, -0.3537, 0.9667,
  34986. 0.2890]]], device='cuda:0')
  34987. loss_train_step before backward: tensor(0.0121, device='cuda:0', grad_fn=<MseLossBackward>)
  34988. loss_train_step after backward: tensor(0.0121, device='cuda:0', grad_fn=<MseLossBackward>)
  34989. loss_train: 0.1667864709161222
  34990. step: 15
  34991. running loss: 0.011119098061074813
  34992. Train Steps: 15/90 Loss: 0.0111 torch.Size([8, 600, 800])
  34993. torch.Size([8, 8])
  34994. tensor([[0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  34995. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  34996. [0.6275, 0.4024, 0.8500, 0.5383, 0.3912, 0.4883, 0.6288, 0.5100],
  34997. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  34998. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  34999. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  35000. [0.6104, 0.4029, 0.8738, 0.4900, 0.4088, 0.4533, 0.5070, 0.5510],
  35001. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377]],
  35002. device='cuda:0', dtype=torch.float64)
  35003. predictions are: tensor([[ 0.4449, -0.5116, 1.8714, -0.0182, -0.5449, 0.1283, 1.1254, 0.3308],
  35004. [ 0.4398, -0.5067, 1.7343, 0.0700, -0.2354, 0.0319, 0.5108, 0.2732],
  35005. [ 0.5798, -0.4334, 1.6550, 0.1778, -0.5138, -0.1207, 0.6395, 0.2326],
  35006. [ 0.6115, -0.3747, 1.8011, -0.1351, -0.3285, -0.0546, 0.4288, 0.4305],
  35007. [ 0.4821, -0.4128, 1.7874, -0.1781, -0.4174, -0.1471, 0.2563, 0.2960],
  35008. [ 0.7083, -0.3171, 1.1143, -1.4232, -0.4142, -1.5667, 0.2975, 0.2217],
  35009. [ 0.5611, -0.3972, 1.7412, -0.0379, -0.4422, -0.2419, 0.1391, 0.3804],
  35010. [ 0.5256, -0.4907, 1.7250, 0.1376, -0.4755, -0.2529, 0.5504, 0.2964]],
  35011. device='cuda:0', grad_fn=<AddmmBackward>)
  35012. landmarks are: tensor([[[ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  35013. 0.2196],
  35014. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  35015. 0.0851],
  35016. [ 0.6125, -0.4273, 1.6402, 0.2006, -0.4788, -0.0303, 0.6182,
  35017. 0.0697],
  35018. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  35019. 0.3084],
  35020. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  35021. 0.1439],
  35022. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  35023. 0.1343],
  35024. [ 0.5334, -0.4252, 1.7499, -0.0226, -0.3979, -0.1920, 0.0558,
  35025. 0.2589],
  35026. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  35027. 0.1979]]], device='cuda:0')
  35028. loss_train_step before backward: tensor(0.0075, device='cuda:0', grad_fn=<MseLossBackward>)
  35029. loss_train_step after backward: tensor(0.0075, device='cuda:0', grad_fn=<MseLossBackward>)
  35030. loss_train: 0.17424756661057472
  35031. step: 16
  35032. running loss: 0.01089047291316092
  35033.  
  35034. Train Steps: 16/90 Loss: 0.0109 torch.Size([8, 600, 800])
  35035. torch.Size([8, 8])
  35036. tensor([[0.6350, 0.4118, 0.8363, 0.2717, 0.4850, 0.1700, 0.6441, 0.5170],
  35037. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  35038. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  35039. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  35040. [0.6201, 0.4029, 0.8776, 0.4602, 0.3683, 0.4203, 0.5938, 0.5450],
  35041. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  35042. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  35043. [0.6300, 0.4133, 0.8538, 0.2167, 0.5587, 0.2250, 0.7390, 0.5413]],
  35044. device='cuda:0', dtype=torch.float64)
  35045. predictions are: tensor([[ 0.6731, -0.3697, 1.5592, -1.0559, -0.0977, -1.3919, 0.7334, 0.1976],
  35046. [ 0.6478, -0.3031, 1.7829, -0.3219, -0.6307, -0.3326, 0.2386, 0.3660],
  35047. [ 0.4876, -0.4768, 0.8883, -1.4431, -0.3269, -1.5276, 0.1864, 0.1209],
  35048. [ 0.5578, -0.4057, 1.6874, 0.1956, -0.5940, -0.4984, 0.3570, 0.3694],
  35049. [ 0.5158, -0.4404, 1.7622, -0.1544, -0.6287, -0.2941, 0.4888, 0.3767],
  35050. [ 0.3452, -0.5299, 1.5267, -0.5571, -0.7532, -0.3578, 0.2696, 0.2688],
  35051. [ 0.6597, -0.3832, 1.6093, 0.2269, -0.3988, 0.2980, 0.7815, 0.2671],
  35052. [ 0.0781, -0.7422, 1.6755, -1.3120, 0.2650, -1.0328, 1.1781, 0.4177]],
  35053. device='cuda:0', grad_fn=<AddmmBackward>)
  35054. landmarks are: tensor([[[ 0.6471, -0.3840, 1.5767, -1.0311, -0.0457, -1.5007, 0.6889,
  35055. 0.1020],
  35056. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  35057. 0.1852],
  35058. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  35059. 0.0261],
  35060. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  35061. 0.1698],
  35062. [ 0.5785, -0.4252, 1.7676, -0.1602, -0.5845, -0.3446, 0.4566,
  35063. 0.2314],
  35064. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  35065. 0.2365],
  35066. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  35067. 0.1176],
  35068. [ 0.6240, -0.3768, 1.6575, -1.2851, 0.2949, -1.2467, 1.1276,
  35069. 0.2142]]], device='cuda:0')
  35070. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  35071. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  35072. loss_train: 0.18802320212125778
  35073. step: 17
  35074. running loss: 0.011060188360073987
  35075. Train Steps: 17/90 Loss: 0.0111 torch.Size([8, 600, 800])
  35076. torch.Size([8, 8])
  35077. tensor([[0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  35078. [0.6073, 0.3932, 0.8363, 0.5817, 0.4425, 0.5117, 0.5204, 0.4817],
  35079. [0.6168, 0.4111, 0.6517, 0.2875, 0.3688, 0.2817, 0.5228, 0.5837],
  35080. [0.6329, 0.4196, 0.9238, 0.4583, 0.4263, 0.2933, 0.7343, 0.5748],
  35081. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  35082. [0.6115, 0.4005, 0.8838, 0.3867, 0.3763, 0.4700, 0.5800, 0.5550],
  35083. [0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  35084. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467]],
  35085. device='cuda:0', dtype=torch.float64)
  35086. predictions are: tensor([[ 0.4197, -0.4912, 1.5191, -1.2403, -0.1832, -1.3755, 0.6581, 0.2036],
  35087. [ 0.4366, -0.5245, 1.5805, 0.2763, -0.2760, 0.0055, 0.1530, 0.0448],
  35088. [ 0.6062, -0.3579, 0.8087, -1.0960, -0.6512, -1.0815, 0.1575, 0.4478],
  35089. [ 0.6468, -0.3977, 1.9815, -0.2081, -0.4123, -1.0205, 1.1302, 0.3880],
  35090. [ 0.5060, -0.4523, 1.7256, -0.1588, -0.0872, -0.1265, 0.2759, 0.3836],
  35091. [ 0.4599, -0.4719, 1.7737, -0.5584, -0.6429, -0.1395, 0.4024, 0.2736],
  35092. [ 0.3906, -0.5403, 1.6324, 0.2416, -0.2583, -0.0143, 0.4181, 0.2703],
  35093. [ 0.4343, -0.5111, 1.7783, -0.1365, -0.3835, 0.0125, 0.5447, 0.2704]],
  35094. device='cuda:0', grad_fn=<AddmmBackward>)
  35095. landmarks are: tensor([[[ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  35096. 0.2083],
  35097. [ 0.5193, -0.4699, 1.5767, 0.4008, -0.2420, 0.0774, 0.1178,
  35098. -0.0610],
  35099. [ 0.5629, -0.3871, 0.7243, -0.9581, -0.5827, -0.9849, 0.1288,
  35100. 0.4103],
  35101. [ 0.6372, -0.3479, 1.9808, -0.1689, -0.3171, -0.9310, 1.1057,
  35102. 0.3692],
  35103. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  35104. 0.3087],
  35105. [ 0.5384, -0.4361, 1.7961, -0.4999, -0.5480, -0.1150, 0.3931,
  35106. 0.2776],
  35107. [ 0.5911, -0.4080, 1.6460, 0.3546, -0.2074, 0.0467, 0.4970,
  35108. 0.1852],
  35109. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  35110. 0.2391]]], device='cuda:0')
  35111. loss_train_step before backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  35112. loss_train_step after backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  35113. loss_train: 0.19375777710229158
  35114. step: 18
  35115. running loss: 0.010764320950127311
  35116. Train Steps: 18/90 Loss: 0.0108 torch.Size([8, 600, 800])
  35117. torch.Size([8, 8])
  35118. tensor([[0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  35119. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  35120. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  35121. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  35122. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332],
  35123. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  35124. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  35125. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082]],
  35126. device='cuda:0', dtype=torch.float64)
  35127. predictions are: tensor([[ 0.5465, -0.4084, 1.7556, -0.0485, -0.4730, -0.2105, 0.2575, 0.1068],
  35128. [ 0.5799, -0.3872, 1.7264, 0.1061, -0.5587, -0.7446, 0.4119, 0.3354],
  35129. [ 0.6407, -0.3606, 1.6930, -0.0809, -0.2809, -0.1557, 0.2516, 0.2782],
  35130. [ 0.3428, -0.5433, 1.7698, -0.2409, 0.0305, -0.0332, 0.5215, 0.3632],
  35131. [ 0.5239, -0.4432, 1.5371, 0.1497, -0.5197, -0.1187, 0.9927, 0.2922],
  35132. [ 0.6542, -0.3643, 1.7341, -0.0491, -0.3532, -0.0352, 0.5050, 0.3007],
  35133. [ 0.4386, -0.4446, 1.6842, -0.2906, -0.4989, -0.4463, 0.0770, 0.3000],
  35134. [ 0.5291, -0.4532, 1.7692, 0.0302, -0.3224, 0.2420, 0.4699, 0.1400]],
  35135. device='cuda:0', grad_fn=<AddmmBackward>)
  35136. landmarks are: tensor([[[ 5.3262e-01, -4.3895e-01, 1.7557e+00, 8.5142e-02, -5.1917e-01,
  35137. -9.1917e-02, 3.1801e-01, 6.2048e-02],
  35138. [ 5.9013e-01, -4.1570e-01, 1.7557e+00, 1.9292e-01, -5.4226e-01,
  35139. -5.9230e-01, 3.5843e-01, 1.6982e-01],
  35140. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  35141. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  35142. [ 5.3508e-01, -4.3212e-01, 1.7326e+00, -1.3811e-01, 4.6329e-02,
  35143. 1.0491e-01, 4.1617e-01, 2.7760e-01],
  35144. [ 6.1907e-01, -4.2971e-01, 1.4612e+00, 2.3911e-01, -4.9607e-01,
  35145. 3.1255e-02, 1.1166e+00, 1.7680e-01],
  35146. [ 5.7841e-01, -4.0878e-01, 1.7268e+00, 4.6651e-02, -3.3441e-01,
  35147. 6.9746e-02, 5.4896e-01, 2.5450e-01],
  35148. [ 5.4405e-01, -3.9969e-01, 1.7326e+00, -2.2279e-01, -4.4411e-01,
  35149. -2.9207e-01, 2.9551e-02, 2.4088e-01],
  35150. [ 5.4496e-01, -4.7064e-01, 1.7643e+00, 7.2204e-02, -3.7076e-01,
  35151. 3.2001e-01, 4.8543e-01, 6.1219e-02]]], device='cuda:0')
  35152. loss_train_step before backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  35153. loss_train_step after backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  35154. loss_train: 0.20038292463868856
  35155. step: 19
  35156. running loss: 0.010546469717825713
  35157. Train Steps: 19/90 Loss: 0.0105 torch.Size([8, 600, 800])
  35158. torch.Size([8, 8])
  35159. tensor([[0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  35160. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  35161. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  35162. [0.6189, 0.4049, 0.8888, 0.4417, 0.4213, 0.5200, 0.5988, 0.5633],
  35163. [0.6125, 0.3999, 0.8750, 0.4883, 0.4750, 0.4700, 0.5533, 0.5617],
  35164. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  35165. [0.6239, 0.4123, 0.8313, 0.2550, 0.4500, 0.2050, 0.6175, 0.5400],
  35166. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550]],
  35167. device='cuda:0', dtype=torch.float64)
  35168. predictions are: tensor([[ 6.1788e-01, -3.8531e-01, 1.8123e+00, -8.3692e-03, -5.4274e-01,
  35169. -1.6935e-01, 6.3533e-01, 1.3633e-01],
  35170. [ 6.6055e-01, -3.6350e-01, 1.0613e+00, -1.3483e+00, -4.5378e-01,
  35171. -1.2605e+00, 5.3864e-01, 2.7648e-01],
  35172. [ 5.9610e-01, -3.5126e-01, 1.2928e+00, -6.1835e-01, -7.0665e-01,
  35173. -7.1798e-01, 2.0525e-01, 3.0496e-01],
  35174. [ 4.8049e-01, -4.5639e-01, 1.7886e+00, -1.5145e-01, -3.8253e-01,
  35175. 7.3162e-02, 5.6609e-01, 2.5449e-01],
  35176. [ 5.1796e-01, -4.4070e-01, 1.7000e+00, 3.3282e-02, -6.6376e-02,
  35177. -1.6498e-01, 2.8864e-01, 3.2839e-01],
  35178. [ 3.5361e-01, -5.8107e-01, 1.7022e+00, -2.0324e-02, -9.5997e-02,
  35179. -7.1067e-02, 2.6798e-01, 6.7780e-02],
  35180. [ 5.0432e-01, -4.3011e-01, 1.5125e+00, -1.0313e+00, -1.7659e-01,
  35181. -1.4298e+00, 6.5754e-01, 1.9049e-01],
  35182. [ 3.6905e-01, -5.3715e-01, 1.7403e+00, -5.2373e-02, -1.7687e-02,
  35183. -1.7288e-03, 5.1245e-01, 2.9648e-01]], device='cuda:0',
  35184. grad_fn=<AddmmBackward>)
  35185. landmarks are: tensor([[[ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  35186. 0.1525],
  35187. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  35188. 0.2468],
  35189. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  35190. 0.3198],
  35191. [ 0.5726, -0.4159, 1.8192, -0.2459, -0.3402, 0.1159, 0.4797,
  35192. 0.3161],
  35193. [ 0.5432, -0.4388, 1.7557, -0.0303, -0.0919, -0.1150, 0.2699,
  35194. 0.3087],
  35195. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  35196. -0.0039],
  35197. [ 0.5958, -0.3818, 1.5536, -1.1081, -0.2074, -1.3390, 0.5663,
  35198. 0.2083],
  35199. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  35200. 0.2776]]], device='cuda:0')
  35201. loss_train_step before backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  35202. loss_train_step after backward: tensor(0.0057, device='cuda:0', grad_fn=<MseLossBackward>)
  35203. loss_train: 0.20609361585229635
  35204. step: 20
  35205. running loss: 0.010304680792614818
  35206.  
  35207. Train Steps: 20/90 Loss: 0.0103 torch.Size([8, 600, 800])
  35208. torch.Size([8, 8])
  35209. tensor([[0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  35210. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  35211. [0.6131, 0.4037, 0.6907, 0.2819, 0.3688, 0.2700, 0.5217, 0.5680],
  35212. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817],
  35213. [0.6200, 0.4086, 0.8414, 0.2974, 0.4117, 0.2274, 0.5869, 0.5391],
  35214. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  35215. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456],
  35216. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133]],
  35217. device='cuda:0', dtype=torch.float64)
  35218. predictions are: tensor([[ 0.4543, -0.5039, 1.7159, 0.1398, -0.3645, -0.0678, 0.5161, 0.2738],
  35219. [ 0.4250, -0.5397, 1.8740, 0.0648, -0.3627, 0.3088, 0.6891, 0.1285],
  35220. [ 0.5432, -0.4129, 0.9103, -1.0536, -0.5007, -1.0081, 0.1384, 0.3272],
  35221. [ 0.5651, -0.4690, 1.7934, -0.2742, -0.5696, -0.4388, 0.4848, 0.0175],
  35222. [ 0.6463, -0.3446, 1.6692, -0.8134, -0.2191, -1.0957, 0.4650, 0.1368],
  35223. [ 0.3467, -0.5055, 1.0952, -0.9362, -0.3407, -1.0388, 0.3832, 0.4081],
  35224. [ 0.6227, -0.3434, 1.7308, 0.1826, -0.2582, 0.2336, 0.2736, 0.2280],
  35225. [ 0.6184, -0.4156, 1.5748, -1.0515, -0.0119, -1.4673, 0.5948, 0.1301]],
  35226. device='cuda:0', grad_fn=<AddmmBackward>)
  35227. landmarks are: tensor([[[ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  35228. 0.2237],
  35229. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  35230. 0.1236],
  35231. [ 0.5459, -0.4215, 0.9043, -0.9838, -0.5827, -1.0388, 0.1236,
  35232. 0.3378],
  35233. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  35234. -0.0611],
  35235. [ 0.5776, -0.3987, 1.6005, -0.9121, -0.3844, -1.2358, 0.4247,
  35236. 0.2043],
  35237. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  35238. 0.2853],
  35239. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  35240. 0.2341],
  35241. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  35242. 0.0851]]], device='cuda:0')
  35243. loss_train_step before backward: tensor(0.0070, device='cuda:0', grad_fn=<MseLossBackward>)
  35244. loss_train_step after backward: tensor(0.0070, device='cuda:0', grad_fn=<MseLossBackward>)
  35245. loss_train: 0.21307452209293842
  35246. step: 21
  35247. running loss: 0.010146405813949448
  35248. Train Steps: 21/90 Loss: 0.0101 torch.Size([8, 600, 800])
  35249. torch.Size([8, 8])
  35250. tensor([[0.6196, 0.4090, 0.8450, 0.3900, 0.3575, 0.3933, 0.5975, 0.5583],
  35251. [0.6353, 0.4128, 0.9138, 0.3533, 0.4688, 0.3250, 0.7145, 0.5991],
  35252. [0.6198, 0.4114, 0.8263, 0.3283, 0.3550, 0.3583, 0.5813, 0.5667],
  35253. [0.6339, 0.4149, 0.8800, 0.5000, 0.3900, 0.5283, 0.7541, 0.5424],
  35254. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  35255. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  35256. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  35257. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505]],
  35258. device='cuda:0', dtype=torch.float64)
  35259. predictions are: tensor([[ 0.6394, -0.3515, 1.6325, -0.3776, -0.5088, -0.5482, 0.3714, 0.3221],
  35260. [-0.5533, -1.1389, 1.7858, -0.4646, 0.0421, -0.8907, 1.0837, 0.3898],
  35261. [ 0.6300, -0.3319, 1.5087, -0.6143, -0.5620, -0.6781, 0.2920, 0.3042],
  35262. [ 0.6850, -0.3482, 1.7831, 0.1664, -0.3374, 0.1902, 1.0232, 0.1071],
  35263. [ 0.5287, -0.4297, 1.2409, -1.1871, -0.4289, -0.8006, 0.4612, 0.2733],
  35264. [ 0.4822, -0.4647, 1.5526, 0.3464, -0.3086, 0.0092, 0.1336, -0.0019],
  35265. [ 0.5267, -0.4623, 1.7165, -0.0318, -0.0668, 0.0993, 0.1245, -0.0606],
  35266. [ 0.4854, -0.4350, 1.5649, -0.3733, -0.5061, -0.6786, -0.0152, 0.1631]],
  35267. device='cuda:0', grad_fn=<AddmmBackward>)
  35268. landmarks are: tensor([[[ 0.5761, -0.3966, 1.6171, -0.4845, -0.6346, -0.4691, 0.4739,
  35269. 0.2930],
  35270. [ 0.6487, -0.3792, 1.9346, -0.6539, -0.1208, -0.7848, 1.0143,
  35271. 0.4814],
  35272. [ 0.5768, -0.3857, 1.5305, -0.7694, -0.6462, -0.6308, 0.3988,
  35273. 0.3315],
  35274. [ 0.6421, -0.3695, 1.7788, 0.0236, -0.4845, 0.1544, 1.1971,
  35275. 0.2196],
  35276. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  35277. 0.2853],
  35278. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  35279. -0.1061],
  35280. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  35281. 0.0051],
  35282. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  35283. 0.2567]]], device='cuda:0')
  35284. loss_train_step before backward: tensor(0.0396, device='cuda:0', grad_fn=<MseLossBackward>)
  35285. loss_train_step after backward: tensor(0.0396, device='cuda:0', grad_fn=<MseLossBackward>)
  35286. loss_train: 0.2526354994624853
  35287. step: 22
  35288. running loss: 0.011483431793749332
  35289. Train Steps: 22/90 Loss: 0.0115 torch.Size([8, 600, 800])
  35290. torch.Size([8, 8])
  35291. tensor([[0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  35292. [0.6090, 0.4010, 0.7838, 0.3483, 0.3538, 0.3783, 0.5462, 0.5077],
  35293. [0.6265, 0.4088, 0.8025, 0.1850, 0.4163, 0.2500, 0.6290, 0.4947],
  35294. [0.6286, 0.4274, 0.8500, 0.4500, 0.4525, 0.2583, 0.5440, 0.6209],
  35295. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672],
  35296. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  35297. [0.6081, 0.3950, 0.8538, 0.4667, 0.3850, 0.4917, 0.5342, 0.4954],
  35298. [ nan, nan, 0.7097, 0.2346, 0.4250, 0.1850, 0.5175, 0.5583]],
  35299. device='cuda:0', dtype=torch.float64)
  35300. predictions are: tensor([[ 0.6787, -0.3309, 1.5545, -0.5017, -0.2383, -1.0141, 0.2557, 0.2843],
  35301. [ 0.6255, -0.3809, 1.3916, -0.6963, -0.5258, -0.5401, 0.1449, 0.1210],
  35302. [ 0.5222, -0.4661, 1.4427, -1.3368, -0.2490, -0.9906, 0.6824, 0.1045],
  35303. [ 0.5180, -0.3779, 1.5996, -0.1218, -0.0797, -0.9529, 0.3193, 0.5528],
  35304. [ 0.6336, -0.4351, 1.7194, 0.2918, -0.4420, -0.1731, 0.6663, 0.0219],
  35305. [ 0.5221, -0.4751, 1.8630, -0.2368, -0.4454, -0.0110, 0.6517, -0.0719],
  35306. [ 0.5000, -0.4733, 1.6916, -0.1716, -0.3797, 0.0467, 0.2077, -0.0549],
  35307. [-2.3529, -2.2758, 0.7838, -1.2784, -0.2598, -1.3029, 0.2252, 0.2022]],
  35308. device='cuda:0', grad_fn=<AddmmBackward>)
  35309. landmarks are: tensor([[[ 5.6801e-01, -4.3453e-01, 1.6864e+00, -4.3153e-01, -4.6981e-01,
  35310. -1.1241e+00, 3.5183e-01, 2.2607e-01],
  35311. [ 5.2702e-01, -4.3356e-01, 1.3342e+00, -6.7698e-01, -6.5196e-01,
  35312. -5.3841e-01, 2.3702e-01, 5.9193e-02],
  35313. [ 6.0785e-01, -3.9761e-01, 1.4208e+00, -1.4314e+00, -3.6328e-01,
  35314. -1.1312e+00, 6.1950e-01, -9.2270e-04],
  35315. [ 6.1742e-01, -3.1175e-01, 1.6402e+00, -2.0739e-01, -1.9584e-01,
  35316. -1.0927e+00, 2.2674e-01, 5.8220e-01],
  35317. [ 6.1276e-01, -4.3749e-01, 1.7788e+00, 2.6990e-01, -6.3464e-01,
  35318. -2.5358e-01, 5.4635e-01, -1.2778e-01],
  35319. [ 6.0716e-01, -4.2055e-01, 1.8711e+00, -2.5358e-01, -6.1155e-01,
  35320. -1.3041e-01, 6.8119e-01, -6.7050e-02],
  35321. [ 5.2269e-01, -4.6151e-01, 1.6575e+00, -1.3041e-01, -5.0762e-01,
  35322. -1.4935e-02, 1.8150e-01, 2.0831e-03],
  35323. [-2.2859e+00, -2.2859e+00, 9.9216e-01, -1.2021e+00, -3.2286e-01,
  35324. -1.4314e+00, 1.0439e-01, 2.9299e-01]]], device='cuda:0')
  35325. loss_train_step before backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  35326. loss_train_step after backward: tensor(0.0088, device='cuda:0', grad_fn=<MseLossBackward>)
  35327. loss_train: 0.2614791188389063
  35328. step: 23
  35329. running loss: 0.011368657340822012
  35330. Train Steps: 23/90 Loss: 0.0114 torch.Size([8, 600, 800])
  35331. torch.Size([8, 8])
  35332. tensor([[0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  35333. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869],
  35334. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  35335. [0.6154, 0.4112, 0.7037, 0.2317, 0.4238, 0.1833, 0.5350, 0.5600],
  35336. [0.6300, 0.4102, 0.9088, 0.4433, 0.4088, 0.3067, 0.6820, 0.5540],
  35337. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  35338. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  35339. [0.6189, 0.3911, 0.8800, 0.4917, 0.3713, 0.4800, 0.6038, 0.4833]],
  35340. device='cuda:0', dtype=torch.float64)
  35341. predictions are: tensor([[ 0.5986, -0.4155, 1.1743, -0.8504, -0.5632, -0.9299, 0.2082, -0.0190],
  35342. [ 0.5951, -0.3816, 1.5139, -1.1340, -0.0489, -1.3246, 0.5283, -0.0248],
  35343. [ 0.5897, -0.3812, 1.7208, 0.1187, -0.1267, 0.3652, 0.2454, 0.0767],
  35344. [ 0.5437, -0.4196, 0.9207, -1.1098, -0.2944, -1.4431, 0.1695, 0.3735],
  35345. [-0.3162, -1.0101, 1.7977, -0.1153, -0.3829, -0.8892, 0.7867, 0.1933],
  35346. [ 0.5377, -0.4063, 1.7138, -0.2150, -0.2550, 0.3595, 0.3530, 0.1509],
  35347. [ 0.4393, -0.4756, 1.4093, -0.8884, -0.4290, -0.8770, 0.4530, 0.2676],
  35348. [ 0.7966, -0.3260, 1.7673, 0.0466, -0.4888, -0.0788, 0.4975, -0.0127]],
  35349. device='cuda:0', grad_fn=<AddmmBackward>)
  35350. landmarks are: tensor([[[ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  35351. 0.0141],
  35352. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  35353. -0.0369],
  35354. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  35355. 0.0592],
  35356. [ 0.5565, -0.3864, 0.9647, -1.2159, -0.3286, -1.4391, 0.1852,
  35357. 0.3007],
  35358. [ 0.6240, -0.3912, 1.9115, -0.2382, -0.3979, -0.8694, 0.8644,
  35359. 0.2730],
  35360. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  35361. 0.2936],
  35362. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  35363. 0.1852],
  35364. [ 0.5726, -0.4795, 1.7788, -0.0149, -0.5711, -0.0688, 0.5028,
  35365. -0.0534]]], device='cuda:0')
  35366. loss_train_step before backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  35367. loss_train_step after backward: tensor(0.0251, device='cuda:0', grad_fn=<MseLossBackward>)
  35368. loss_train: 0.28657217137515545
  35369. step: 24
  35370. running loss: 0.011940507140631476
  35371.  
  35372. Train Steps: 24/90 Loss: 0.0119 torch.Size([8, 600, 800])
  35373. torch.Size([8, 8])
  35374. tensor([[0.6339, 0.4118, 0.7988, 0.5800, 0.3912, 0.4583, 0.7343, 0.5760],
  35375. [ nan, nan, 0.6469, 0.1943, 0.4025, 0.2000, 0.5125, 0.5533],
  35376. [0.6314, 0.4107, 0.8750, 0.5100, 0.3788, 0.4900, 0.7121, 0.5864],
  35377. [0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  35378. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  35379. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  35380. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083],
  35381. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575]],
  35382. device='cuda:0', dtype=torch.float64)
  35383. predictions are: tensor([[ 0.5811, -0.4193, 1.4924, 0.1970, -0.4542, -0.1588, 0.7031, 0.1884],
  35384. [-2.8906, -2.6697, 0.7015, -1.2611, -0.3438, -1.3725, 0.1311, 0.1136],
  35385. [ 0.6681, -0.3650, 1.8313, 0.0553, -0.4647, 0.0585, 0.6894, 0.1858],
  35386. [ 0.6057, -0.3989, 1.8592, -0.2476, -0.4531, 0.3330, 0.2408, -0.1263],
  35387. [ 0.4641, -0.5044, 1.3320, -1.1807, -0.1842, -1.3894, 0.2375, -0.0075],
  35388. [ 0.5326, -0.4550, 1.2745, -1.0956, -0.1449, -1.3885, 0.2040, 0.1259],
  35389. [ 0.6367, -0.3457, 1.5546, 0.2843, -0.3334, -0.0293, 0.0620, 0.3324],
  35390. [ 0.6460, -0.3894, 1.9278, -0.4953, -0.4726, -0.5593, 0.6979, 0.1154]],
  35391. device='cuda:0', grad_fn=<AddmmBackward>)
  35392. landmarks are: tensor([[[ 0.6421, -0.3840, 1.4035, 0.3931, -0.4788, -0.1689, 1.1057,
  35393. 0.3745],
  35394. [-2.2859, -2.2859, 0.7023, -1.3883, -0.4268, -1.3621, 0.0813,
  35395. 0.2699],
  35396. [ 0.6306, -0.3888, 1.7557, 0.0697, -0.5365, -0.0226, 1.0033,
  35397. 0.4226],
  35398. [ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  35399. -0.0322],
  35400. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  35401. 0.1005],
  35402. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  35403. 0.2006],
  35404. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  35405. 0.5239],
  35406. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  35407. 0.2890]]], device='cuda:0')
  35408. loss_train_step before backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  35409. loss_train_step after backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  35410. loss_train: 0.3100247588008642
  35411. step: 25
  35412. running loss: 0.012400990352034569
  35413. Train Steps: 25/90 Loss: 0.0124 torch.Size([8, 600, 800])
  35414. torch.Size([8, 8])
  35415. tensor([[ nan, nan, 0.7412, 0.2200, 0.4450, 0.1517, 0.5312, 0.4983],
  35416. [0.6162, 0.3949, 0.8838, 0.4517, 0.4250, 0.5183, 0.5837, 0.5500],
  35417. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  35418. [0.6254, 0.4076, 0.8700, 0.3267, 0.4150, 0.3083, 0.7050, 0.5609],
  35419. [0.6200, 0.4071, 0.7338, 0.1917, 0.4200, 0.2450, 0.6150, 0.5517],
  35420. [0.6038, 0.3946, 0.8413, 0.4883, 0.3563, 0.4550, 0.5266, 0.4693],
  35421. [ nan, nan, 0.8037, 0.2483, 0.3975, 0.2517, 0.5575, 0.5600],
  35422. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142]],
  35423. device='cuda:0', dtype=torch.float64)
  35424. predictions are: tensor([[-1.1408, -1.5361, 1.0224, -1.2326, -0.2584, -1.5380, 0.1721, 0.0526],
  35425. [ 0.7885, -0.2863, 1.8197, -0.1257, -0.3346, 0.1764, 0.3208, 0.1103],
  35426. [ 0.9252, -0.2396, 1.6979, 0.4724, -0.5313, -0.0838, 0.6209, -0.0663],
  35427. [ 0.8023, -0.2682, 1.7999, -0.7008, -0.3828, -0.8174, 0.7808, 0.2176],
  35428. [ 0.7457, -0.3124, 1.2050, -1.2411, -0.3297, -1.1018, 0.5817, 0.2070],
  35429. [ 0.6664, -0.3476, 1.6641, 0.0448, -0.5411, -0.1716, 0.1976, 0.0074],
  35430. [-1.9553, -2.0598, 1.1571, -0.9643, -0.3716, -1.0576, 0.3377, 0.1847],
  35431. [ 0.8637, -0.2172, 1.7630, -0.1238, -0.3981, -0.1083, 0.0655, 0.0336]],
  35432. device='cuda:0', grad_fn=<AddmmBackward>)
  35433. landmarks are: tensor([[[-2.2859, -2.2859, 1.1379, -1.2697, -0.2305, -1.5854, 0.1679,
  35434. 0.0159],
  35435. [ 0.5604, -0.4620, 1.7961, -0.1997, -0.3229, 0.1082, 0.4104,
  35436. 0.2545],
  35437. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  35438. 0.0261],
  35439. [ 0.6026, -0.4032, 1.7326, -0.7771, -0.3691, -0.8617, 0.9704,
  35440. 0.3050],
  35441. [ 0.5779, -0.4054, 1.1032, -1.4006, -0.3460, -1.1543, 0.5547,
  35442. 0.2622],
  35443. [ 0.5030, -0.4631, 1.5998, -0.0303, -0.6404, -0.1843, 0.1465,
  35444. -0.1181],
  35445. [-2.2859, -2.2859, 1.4266, -1.1389, -0.4499, -1.1235, 0.2891,
  35446. 0.3007],
  35447. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  35448. 0.0893]]], device='cuda:0')
  35449. loss_train_step before backward: tensor(0.0447, device='cuda:0', grad_fn=<MseLossBackward>)
  35450. loss_train_step after backward: tensor(0.0447, device='cuda:0', grad_fn=<MseLossBackward>)
  35451. loss_train: 0.3547267075628042
  35452. step: 26
  35453. running loss: 0.013643334906261701
  35454. Train Steps: 26/90 Loss: 0.0136 torch.Size([8, 600, 800])
  35455. torch.Size([8, 8])
  35456. tensor([[0.6364, 0.4165, 0.9088, 0.4367, 0.4075, 0.3150, 0.6448, 0.5297],
  35457. [0.6273, 0.4110, 0.8900, 0.3817, 0.4188, 0.2167, 0.5858, 0.4835],
  35458. [0.6300, 0.4013, 0.8938, 0.5350, 0.3675, 0.4600, 0.6456, 0.4973],
  35459. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  35460. [0.6169, 0.4052, 0.8742, 0.4779, 0.4288, 0.4917, 0.5763, 0.5617],
  35461. [0.6137, 0.4084, 0.8076, 0.3889, 0.3650, 0.3150, 0.5356, 0.5896],
  35462. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  35463. [0.6127, 0.4118, 0.8650, 0.5083, 0.4088, 0.5367, 0.5300, 0.5456]],
  35464. device='cuda:0', dtype=torch.float64)
  35465. predictions are: tensor([[ 0.6620, -0.3677, 1.8076, -0.3847, -0.4292, -0.8024, 0.6340, 0.0763],
  35466. [ 0.5911, -0.4249, 1.7981, -0.6270, -0.3402, -1.2767, 0.5001, -0.1651],
  35467. [ 0.5506, -0.5222, 1.7383, 0.0278, -0.5927, -0.0961, 0.7650, -0.1522],
  35468. [ 0.6720, -0.3217, 1.5277, 0.2882, -0.4061, -0.1802, 0.2474, 0.3197],
  35469. [ 0.5696, -0.4438, 1.7033, -0.2212, -0.2888, 0.0774, 0.3652, 0.1547],
  35470. [ 0.5928, -0.4065, 1.4053, -0.6018, -0.6057, -0.8218, 0.1283, 0.2768],
  35471. [ 0.4583, -0.4911, 1.6556, -0.6127, -0.3981, -0.7983, 0.3458, 0.3686],
  35472. [ 0.5000, -0.4589, 1.6152, -0.0718, -0.3428, 0.2066, 0.2578, 0.1003]],
  35473. device='cuda:0', grad_fn=<AddmmBackward>)
  35474. landmarks are: tensor([[[ 0.6537, -0.3623, 1.9115, -0.2690, -0.4037, -0.8309, 0.6926,
  35475. 0.1608],
  35476. [ 0.6117, -0.3877, 1.8249, -0.5230, -0.3517, -1.2851, 0.4200,
  35477. -0.0529],
  35478. [ 0.6240, -0.4321, 1.8423, 0.1852, -0.5885, -0.1612, 0.6962,
  35479. 0.0111],
  35480. [ 0.5836, -0.3649, 1.7210, 0.3854, -0.3979, -0.2921, 0.3065,
  35481. 0.4470],
  35482. [ 0.5637, -0.4143, 1.7519, -0.0787, -0.3055, -0.0149, 0.3758,
  35483. 0.3084],
  35484. [ 0.5485, -0.3997, 1.4445, -0.4895, -0.6000, -0.8309, 0.1878,
  35485. 0.4374],
  35486. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  35487. 0.3928],
  35488. [ 0.5443, -0.3840, 1.7095, 0.0620, -0.3979, 0.1929, 0.1622,
  35489. 0.2341]]], device='cuda:0')
  35490. loss_train_step before backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  35491. loss_train_step after backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  35492. loss_train: 0.3619840261526406
  35493. step: 27
  35494. running loss: 0.013406815783431133
  35495. Train Steps: 27/90 Loss: 0.0134 torch.Size([8, 600, 800])
  35496. torch.Size([8, 8])
  35497. tensor([[0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  35498. [0.6263, 0.4233, 0.7924, 0.4626, 0.3788, 0.2883, 0.5573, 0.6047],
  35499. [0.6153, 0.4117, 0.8688, 0.5167, 0.4895, 0.5647, 0.5524, 0.5136],
  35500. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917],
  35501. [0.6205, 0.4012, 0.8675, 0.3283, 0.3713, 0.3050, 0.5813, 0.5117],
  35502. [0.6257, 0.4167, 0.8775, 0.3433, 0.3563, 0.4133, 0.6200, 0.5667],
  35503. [0.6258, 0.4143, 0.8525, 0.2617, 0.4950, 0.1667, 0.6219, 0.4967],
  35504. [0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356]],
  35505. device='cuda:0', dtype=torch.float64)
  35506. predictions are: tensor([[ 0.5315, -0.4936, 1.6832, -0.1068, -0.3618, -0.0711, 0.2883, 0.1341],
  35507. [ 0.4543, -0.4824, 1.3927, -0.0890, -0.5153, -0.8565, 0.3237, 0.4404],
  35508. [ 0.5046, -0.4862, 1.6858, 0.0078, -0.1689, 0.1853, 0.3572, 0.0407],
  35509. [ 0.6492, -0.3580, 1.2518, -0.4897, -0.6171, -0.7439, 0.2897, 0.3618],
  35510. [ 0.4292, -0.5649, 1.7148, -0.7917, -0.5799, -0.9039, 0.4304, -0.0680],
  35511. [ 0.7026, -0.3457, 1.7546, -0.6548, -0.7039, -0.3940, 0.5502, 0.2667],
  35512. [ 0.4067, -0.5144, 1.6281, -1.1137, -0.1014, -1.4728, 0.5556, -0.0738],
  35513. [ 0.5445, -0.4663, 1.4199, -1.1006, -0.3598, -1.2067, 0.7418, 0.0817]],
  35514. device='cuda:0', grad_fn=<AddmmBackward>)
  35515. landmarks are: tensor([[[ 5.4319e-01, -4.4619e-01, 1.7557e+00, -3.8029e-02, -3.1132e-01,
  35516. -7.6520e-02, 2.1409e-01, 3.5458e-01],
  35517. [ 6.0687e-01, -3.3095e-01, 1.3742e+00, -1.4927e-01, -5.3649e-01,
  35518. -9.5412e-01, 2.8843e-01, 5.0705e-01],
  35519. [ 5.5635e-01, -3.8422e-01, 1.7268e+00, 1.0054e-01, -2.4997e-02,
  35520. 3.2255e-01, 2.6581e-01, 8.6245e-02],
  35521. [ 5.6801e-01, -3.8397e-01, 1.0756e+00, -3.2902e-01, -6.2887e-01,
  35522. -7.1547e-01, 3.3533e-01, 4.4696e-01],
  35523. [ 5.7991e-01, -4.3295e-01, 1.7210e+00, -7.6936e-01, -5.7113e-01,
  35524. -8.7714e-01, 3.9885e-01, 7.7444e-02],
  35525. [ 6.0404e-01, -3.6135e-01, 1.7672e+00, -7.0008e-01, -6.4042e-01,
  35526. -3.7675e-01, 5.7783e-01, 3.3149e-01],
  35527. [ 6.0479e-01, -3.7229e-01, 1.6517e+00, -1.0773e+00, 4.6189e-04,
  35528. -1.5161e+00, 5.8660e-01, 8.0947e-03],
  35529. [ 6.1742e-01, -4.2249e-01, 1.4975e+00, -1.1709e+00, -3.1736e-01,
  35530. -1.1806e+00, 6.5391e-01, 1.8793e-01]]], device='cuda:0')
  35531. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  35532. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  35533. loss_train: 0.36961828637868166
  35534. step: 28
  35535. running loss: 0.013200653084952916
  35536.  
  35537. Train Steps: 28/90 Loss: 0.0132 torch.Size([8, 600, 800])
  35538. torch.Size([8, 8])
  35539. tensor([[0.6154, 0.4048, 0.7100, 0.2067, 0.4338, 0.1667, 0.5413, 0.5220],
  35540. [0.6279, 0.4008, 0.8600, 0.4883, 0.4325, 0.5283, 0.7010, 0.5378],
  35541. [0.6211, 0.3993, 0.7650, 0.1933, 0.4575, 0.1550, 0.5965, 0.4895],
  35542. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  35543. [ nan, nan, 0.6512, 0.1717, 0.4100, 0.1983, 0.5253, 0.5240],
  35544. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967],
  35545. [0.6267, 0.4065, 0.8313, 0.2467, 0.4788, 0.1733, 0.6312, 0.5133],
  35546. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901]],
  35547. device='cuda:0', dtype=torch.float64)
  35548. predictions are: tensor([[ 0.4313, -0.5155, 1.1067, -1.0634, -0.3721, -1.3428, 0.2664, 0.1494],
  35549. [ 0.6846, -0.3799, 1.7791, 0.0894, -0.4743, 0.2629, 0.8621, 0.1941],
  35550. [ 0.4842, -0.4876, 1.2978, -1.2284, -0.2565, -1.3639, 0.4528, 0.0666],
  35551. [ 0.3270, -0.5922, 1.1034, -1.0974, -0.3443, -1.4218, 0.2423, 0.0650],
  35552. [-2.2664, -2.2828, 0.8286, -1.3220, -0.4161, -1.3312, 0.1259, 0.1718],
  35553. [ 0.7369, -0.3070, 1.8857, -0.0652, -0.5453, 0.3664, 0.5765, 0.3902],
  35554. [ 0.5477, -0.4333, 1.6124, -0.9366, -0.2165, -1.2759, 0.6049, 0.1203],
  35555. [ 0.4474, -0.5065, 1.5137, -0.7639, -0.6022, -0.9738, 0.1621, 0.0091]],
  35556. device='cuda:0', grad_fn=<AddmmBackward>)
  35557. landmarks are: tensor([[[ 0.5566, -0.4160, 0.9935, -1.3313, -0.2824, -1.5161, 0.2144,
  35558. 0.1253],
  35559. [ 0.6141, -0.4345, 1.6864, -0.0303, -0.2882, 0.1544, 0.9521,
  35560. 0.1982],
  35561. [ 0.5828, -0.4417, 1.2476, -1.3929, -0.1727, -1.5700, 0.4694,
  35562. -0.0248],
  35563. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  35564. 0.0261],
  35565. [-2.2859, -2.2859, 0.7222, -1.4930, -0.3921, -1.3698, 0.1404,
  35566. 0.1343],
  35567. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  35568. 0.4701],
  35569. [ 0.6085, -0.4084, 1.5536, -1.1466, -0.0746, -1.4853, 0.6298,
  35570. 0.0851],
  35571. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  35572. -0.0220]]], device='cuda:0')
  35573. loss_train_step before backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  35574. loss_train_step after backward: tensor(0.0138, device='cuda:0', grad_fn=<MseLossBackward>)
  35575. loss_train: 0.3834594888612628
  35576. step: 29
  35577. running loss: 0.013222740995215958
  35578. Train Steps: 29/90 Loss: 0.0132 torch.Size([8, 600, 800])
  35579. torch.Size([8, 8])
  35580. tensor([[0.6198, 0.3997, 0.8582, 0.5361, 0.4117, 0.5016, 0.5942, 0.5134],
  35581. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175],
  35582. [0.6173, 0.4114, 0.7325, 0.2500, 0.4213, 0.1917, 0.5338, 0.5700],
  35583. [0.6076, 0.3953, 0.8125, 0.3917, 0.3525, 0.4083, 0.5346, 0.4954],
  35584. [0.6163, 0.4006, 0.8788, 0.4683, 0.3663, 0.4883, 0.5887, 0.5017],
  35585. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  35586. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  35587. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350]],
  35588. device='cuda:0', dtype=torch.float64)
  35589. predictions are: tensor([[ 0.6854, -0.4110, 1.7386, 0.2029, -0.4442, 0.0123, 0.5923, 0.0250],
  35590. [ 0.4848, -0.4617, 1.0833, -1.2358, -0.3939, -1.4464, 0.3869, 0.0485],
  35591. [ 0.2746, -0.5979, 1.1664, -1.1019, -0.3426, -1.3615, 0.2957, 0.2825],
  35592. [ 0.5144, -0.4763, 1.6270, -0.4498, -0.6939, -0.4958, 0.4341, 0.0083],
  35593. [ 0.6393, -0.4014, 1.8480, -0.1163, -0.6229, -0.0050, 0.5811, 0.1108],
  35594. [ 0.6124, -0.3778, 1.7751, -0.0631, -0.2991, -0.0231, 0.2343, 0.2695],
  35595. [-2.0529, -2.1630, 0.8682, -1.3244, -0.3408, -1.5010, 0.1745, 0.3081],
  35596. [ 0.6295, -0.3719, 1.8619, -0.2724, -0.5806, -0.4473, 0.4335, 0.2207]],
  35597. device='cuda:0', grad_fn=<AddmmBackward>)
  35598. landmarks are: tensor([[[ 5.7673e-01, -4.3957e-01, 1.6782e+00, 1.9046e-01, -3.8437e-01,
  35599. 3.0841e-02, 4.5876e-01, 8.5521e-02],
  35600. [ 5.4648e-01, -4.2140e-01, 9.3002e-01, -1.2620e+00, -3.9215e-01,
  35601. -1.3852e+00, 2.0618e-01, 1.0428e-01],
  35602. [ 5.6518e-01, -3.8584e-01, 1.0975e+00, -1.1312e+00, -3.4018e-01,
  35603. -1.4006e+00, 1.7945e-01, 3.4688e-01],
  35604. [ 5.2061e-01, -4.6028e-01, 1.4670e+00, -4.7683e-01, -6.5774e-01,
  35605. -3.9985e-01, 1.8356e-01, 2.0831e-03],
  35606. [ 5.6091e-01, -4.3541e-01, 1.7730e+00, -1.2271e-01, -5.9423e-01,
  35607. -3.0331e-02, 4.3349e-01, 3.1255e-02],
  35608. [ 5.4908e-01, -4.1324e-01, 1.7557e+00, -9.1917e-02, -2.7090e-01,
  35609. 3.1255e-02, 6.3480e-02, 4.0319e-01],
  35610. [-2.2859e+00, -2.2859e+00, 6.7598e-01, -1.4083e+00, -3.2864e-01,
  35611. -1.4160e+00, 2.4873e-01, 3.4688e-01],
  35612. [ 6.0722e-01, -3.2394e-01, 1.8423e+00, -3.5366e-01, -4.9607e-01,
  35613. -3.9215e-01, 2.0831e-01, 1.8522e-01]]], device='cuda:0')
  35614. loss_train_step before backward: tensor(0.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  35615. loss_train_step after backward: tensor(0.0104, device='cuda:0', grad_fn=<MseLossBackward>)
  35616. loss_train: 0.3938441062346101
  35617. step: 30
  35618. running loss: 0.013128136874487002
  35619. Train Steps: 30/90 Loss: 0.0131 torch.Size([8, 600, 800])
  35620. torch.Size([8, 8])
  35621. tensor([[0.6286, 0.4034, 0.8191, 0.2414, 0.4262, 0.2393, 0.6365, 0.5356],
  35622. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  35623. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  35624. [0.6087, 0.3951, 0.8387, 0.5833, 0.4188, 0.4933, 0.5146, 0.4830],
  35625. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  35626. [0.6339, 0.4159, 0.8400, 0.5617, 0.3825, 0.4150, 0.7343, 0.5748],
  35627. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883],
  35628. [0.6176, 0.3911, 0.8738, 0.4217, 0.3488, 0.4033, 0.6025, 0.4817]],
  35629. device='cuda:0', dtype=torch.float64)
  35630. predictions are: tensor([[ 0.7876, -0.2612, 1.4754, -1.2204, -0.3086, -1.2458, 0.6964, 0.1785],
  35631. [ 0.6606, -0.3845, 1.8579, -0.6968, -0.3384, -0.8934, 0.8674, 0.1214],
  35632. [-1.1621, -1.5742, 1.4177, -0.9740, -0.6736, -0.8677, 0.1271, 0.1619],
  35633. [ 0.8018, -0.2644, 1.5804, 0.3024, -0.3906, -0.0824, 0.0951, 0.0740],
  35634. [-1.5449, -1.8026, 1.1856, -1.3089, -0.3308, -1.4579, 0.0138, 0.1254],
  35635. [ 0.8893, -0.2169, 1.6289, 0.1542, -0.5249, -0.3488, 0.8478, 0.2615],
  35636. [ 0.5511, -0.3979, 1.0464, -0.8318, -0.5398, -0.8926, 0.2521, 0.5029],
  35637. [ 0.6511, -0.3953, 1.7895, -0.4373, -0.6443, -0.5113, 0.4277, 0.0741]],
  35638. device='cuda:0', grad_fn=<AddmmBackward>)
  35639. landmarks are: tensor([[[ 0.6174, -0.4225, 1.4975, -1.1709, -0.3174, -1.1806, 0.6539,
  35640. 0.1879],
  35641. [ 0.6125, -0.4369, 1.9173, -0.5384, -0.2594, -0.8386, 0.9741,
  35642. 0.1821],
  35643. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  35644. 0.0893],
  35645. [ 0.5258, -0.4610, 1.5882, 0.4085, -0.3517, -0.0072, 0.0910,
  35646. -0.0550],
  35647. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  35648. 0.0231],
  35649. [ 0.6421, -0.3647, 1.5940, 0.3084, -0.5192, -0.3691, 1.1057,
  35650. 0.3692],
  35651. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  35652. 0.4316],
  35653. [ 0.5669, -0.4794, 1.7499, -0.3383, -0.6751, -0.4229, 0.4970,
  35654. -0.0611]]], device='cuda:0')
  35655. loss_train_step before backward: tensor(0.0529, device='cuda:0', grad_fn=<MseLossBackward>)
  35656. loss_train_step after backward: tensor(0.0529, device='cuda:0', grad_fn=<MseLossBackward>)
  35657. loss_train: 0.44675440434366465
  35658. step: 31
  35659. running loss: 0.01441143239818273
  35660. Train Steps: 31/90 Loss: 0.0144 torch.Size([8, 600, 800])
  35661. torch.Size([8, 8])
  35662. tensor([[0.6200, 0.4101, 0.8838, 0.5317, 0.3825, 0.3800, 0.5413, 0.5683],
  35663. [0.6202, 0.4053, 0.8638, 0.5283, 0.4546, 0.5108, 0.5900, 0.5133],
  35664. [0.6167, 0.4048, 0.6831, 0.3639, 0.3763, 0.3017, 0.5700, 0.5883],
  35665. [0.6197, 0.4090, 0.7825, 0.2500, 0.4200, 0.2483, 0.5988, 0.5667],
  35666. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  35667. [0.6131, 0.4037, 0.6907, 0.2819, 0.3688, 0.2700, 0.5217, 0.5680],
  35668. [0.6200, 0.3913, 0.8788, 0.5217, 0.4075, 0.5100, 0.6060, 0.4913],
  35669. [0.6185, 0.4080, 0.8625, 0.3483, 0.3788, 0.2650, 0.5320, 0.5272]],
  35670. device='cuda:0', dtype=torch.float64)
  35671. predictions are: tensor([[ 0.6828, -0.3442, 1.7467, 0.0619, -0.5904, -0.5502, 0.3114, 0.3808],
  35672. [ 0.6513, -0.3840, 1.7281, 0.0559, -0.2999, 0.0749, 0.4490, 0.1396],
  35673. [ 0.3418, -0.5646, 1.0523, -0.8296, -0.6099, -0.9134, 0.3042, 0.4728],
  35674. [ 0.4111, -0.5128, 1.3451, -1.2935, -0.4238, -1.2114, 0.4419, 0.3051],
  35675. [ 0.6906, -0.3634, 2.1027, -0.7261, -0.1946, -1.2085, 1.1692, 0.1020],
  35676. [ 0.2817, -0.5988, 0.9430, -1.1393, -0.5916, -1.0603, 0.1292, 0.2920],
  35677. [ 0.5299, -0.5242, 1.7526, 0.0204, -0.4859, 0.0421, 0.3819, -0.0368],
  35678. [ 0.6846, -0.3526, 1.7553, -0.8015, -0.5090, -1.1177, 0.3066, 0.1300]],
  35679. device='cuda:0', grad_fn=<AddmmBackward>)
  35680. landmarks are: tensor([[[ 0.5777, -0.3915, 1.7961, 0.1698, -0.5192, -0.5307, 0.2141,
  35681. 0.3392],
  35682. [ 0.5786, -0.4141, 1.7037, 0.1544, -0.1862, 0.0736, 0.4393,
  35683. 0.0851],
  35684. [ 0.5626, -0.4162, 0.8692, -0.6051, -0.5480, -0.8925, 0.3469,
  35685. 0.4316],
  35686. [ 0.5764, -0.3969, 1.3284, -1.1312, -0.3460, -1.1389, 0.4797,
  35687. 0.3315],
  35688. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  35689. 0.2142],
  35690. [ 0.5459, -0.4215, 0.9043, -0.9838, -0.5827, -1.0388, 0.1236,
  35691. 0.3378],
  35692. [ 0.5776, -0.4784, 1.7730, 0.1236, -0.4037, 0.0697, 0.5132,
  35693. -0.0168],
  35694. [ 0.5711, -0.4015, 1.6979, -0.6770, -0.5365, -1.0619, 0.1712,
  35695. 0.1494]]], device='cuda:0')
  35696. loss_train_step before backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  35697. loss_train_step after backward: tensor(0.0103, device='cuda:0', grad_fn=<MseLossBackward>)
  35698. loss_train: 0.4570535933598876
  35699. step: 32
  35700. running loss: 0.014282924792496487
  35701.  
  35702. Train Steps: 32/90 Loss: 0.0143 torch.Size([8, 600, 800])
  35703. torch.Size([8, 8])
  35704. tensor([[0.6245, 0.4115, 0.8700, 0.4883, 0.4625, 0.5517, 0.6100, 0.5217],
  35705. [0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  35706. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  35707. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  35708. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  35709. [0.6199, 0.4060, 0.8888, 0.4667, 0.3800, 0.5050, 0.6188, 0.5433],
  35710. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  35711. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783]],
  35712. device='cuda:0', dtype=torch.float64)
  35713. predictions are: tensor([[ 6.4178e-01, -3.5956e-01, 1.7213e+00, -5.5002e-03, -2.6230e-01,
  35714. 1.4525e-02, 5.9712e-01, 2.7523e-01],
  35715. [ 4.7999e-01, -4.8110e-01, 1.1534e+00, -9.4995e-01, -6.3442e-01,
  35716. -1.0915e+00, 2.5093e-01, -2.0075e-03],
  35717. [-1.9991e+00, -2.1325e+00, 1.3982e+00, -9.4794e-01, -7.2812e-01,
  35718. -9.9760e-01, 1.5390e-01, 1.4590e-01],
  35719. [ 5.6458e-01, -3.8236e-01, 1.7374e+00, -7.4091e-02, -2.8748e-01,
  35720. 1.2523e-01, 3.6424e-01, 2.4052e-01],
  35721. [ 4.8428e-01, -4.9028e-01, 1.7524e+00, -8.4647e-02, -1.1400e-01,
  35722. -2.1300e-01, 4.6986e-01, 2.6927e-01],
  35723. [ 5.5946e-01, -4.2733e-01, 1.7709e+00, -1.3355e-01, -5.6999e-01,
  35724. -1.6277e-01, 5.4718e-01, 2.3423e-01],
  35725. [ 4.1153e-01, -5.0251e-01, 1.4305e+00, -1.0455e+00, -5.0402e-01,
  35726. -1.1267e+00, 5.4868e-01, 2.4379e-01],
  35727. [ 4.6093e-01, -4.3216e-01, 1.2042e+00, -1.0118e+00, -2.2142e-01,
  35728. -1.4587e+00, 3.7473e-01, 3.7239e-01]], device='cuda:0',
  35729. grad_fn=<AddmmBackward>)
  35730. landmarks are: tensor([[[ 0.5987, -0.3852, 1.7326, -0.0303, -0.1497, 0.2622, 0.5316,
  35731. 0.1236],
  35732. [ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  35733. 0.0141],
  35734. [-2.2859, -2.2859, 1.5767, -0.7540, -0.6404, -0.7309, 0.1753,
  35735. 0.0893],
  35736. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  35737. 0.0622],
  35738. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  35739. 0.2853],
  35740. [ 0.5773, -0.4105, 1.8192, -0.1304, -0.5307, 0.0467, 0.5721,
  35741. 0.2237],
  35742. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  35743. 0.1852],
  35744. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  35745. 0.3854]]], device='cuda:0')
  35746. loss_train_step before backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  35747. loss_train_step after backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  35748. loss_train: 0.46980485040694475
  35749. step: 33
  35750. running loss: 0.014236510618392265
  35751. Train Steps: 33/90 Loss: 0.0142 torch.Size([8, 600, 800])
  35752. torch.Size([8, 8])
  35753. tensor([[0.6265, 0.4071, 0.8875, 0.3367, 0.3975, 0.3350, 0.6312, 0.5250],
  35754. [0.6148, 0.4053, 0.8750, 0.4550, 0.4850, 0.5218, 0.5863, 0.5567],
  35755. [0.6222, 0.4108, 0.8938, 0.4233, 0.3600, 0.3817, 0.5825, 0.5283],
  35756. [0.6277, 0.4029, 0.8250, 0.2433, 0.4325, 0.2100, 0.6366, 0.5207],
  35757. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  35758. [0.6112, 0.4029, 0.8638, 0.4800, 0.4875, 0.5083, 0.5763, 0.5567],
  35759. [0.6276, 0.4235, 0.8888, 0.5333, 0.3800, 0.3117, 0.5427, 0.6164],
  35760. [0.6126, 0.3954, 0.8538, 0.4983, 0.4250, 0.4700, 0.5355, 0.5350]],
  35761. device='cuda:0', dtype=torch.float64)
  35762. predictions are: tensor([[ 0.6651, -0.3525, 1.8387, -0.8408, -0.5424, -0.8504, 0.6656, 0.1439],
  35763. [ 0.4286, -0.4925, 1.7124, -0.2640, -0.1381, -0.0479, 0.2317, 0.3010],
  35764. [ 0.7453, -0.2869, 1.7095, -0.4168, -0.7020, -0.5912, 0.4953, 0.2396],
  35765. [ 0.3159, -0.6062, 1.4369, -1.2623, -0.3676, -1.3907, 0.5356, 0.0811],
  35766. [ 0.6956, -0.3403, 1.5745, 0.1918, -0.4717, 0.0982, 0.7810, 0.1632],
  35767. [ 0.3613, -0.5702, 1.7576, -0.1592, -0.1135, -0.0804, 0.3595, 0.2578],
  35768. [ 0.6153, -0.3244, 1.6121, 0.1522, -0.5642, -0.8442, 0.2849, 0.5926],
  35769. [ 0.5132, -0.4749, 1.6085, -0.0092, -0.4199, -0.1877, 0.1662, 0.1904]],
  35770. device='cuda:0', grad_fn=<AddmmBackward>)
  35771. landmarks are: tensor([[[ 0.6078, -0.4057, 1.8134, -0.7309, -0.4499, -0.7386, 0.6298,
  35772. 0.1390],
  35773. [ 0.5538, -0.4139, 1.7557, -0.1843, -0.0459, 0.1242, 0.4219,
  35774. 0.2853],
  35775. [ 0.5880, -0.3887, 1.8423, -0.3306, -0.6231, -0.5230, 0.4046,
  35776. 0.1544],
  35777. [ 0.6132, -0.4248, 1.5247, -1.1620, -0.2882, -1.3159, 0.6545,
  35778. 0.1193],
  35779. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  35780. 0.1176],
  35781. [ 0.5371, -0.4252, 1.7037, -0.0688, -0.0342, 0.0620, 0.3758,
  35782. 0.2853],
  35783. [ 0.6131, -0.3299, 1.8192, 0.1775, -0.5307, -0.8463, 0.2206,
  35784. 0.5612],
  35785. [ 0.5435, -0.4597, 1.6575, 0.0159, -0.3229, -0.1150, 0.1877,
  35786. 0.1854]]], device='cuda:0')
  35787. loss_train_step before backward: tensor(0.0096, device='cuda:0', grad_fn=<MseLossBackward>)
  35788. loss_train_step after backward: tensor(0.0096, device='cuda:0', grad_fn=<MseLossBackward>)
  35789. loss_train: 0.4794104462489486
  35790. step: 34
  35791. running loss: 0.014100307242616135
  35792. Train Steps: 34/90 Loss: 0.0141 torch.Size([8, 600, 800])
  35793. torch.Size([8, 8])
  35794. tensor([[0.6241, 0.4143, 0.8938, 0.4650, 0.4075, 0.5350, 0.6250, 0.5550],
  35795. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  35796. [0.6226, 0.4103, 0.8575, 0.3450, 0.4388, 0.2067, 0.5787, 0.5383],
  35797. [0.6064, 0.4019, 0.8650, 0.4517, 0.4037, 0.5367, 0.5703, 0.5609],
  35798. [ nan, nan, 0.8850, 0.3000, 0.5363, 0.2250, 0.7343, 0.5771],
  35799. [0.6201, 0.4050, 0.7757, 0.2234, 0.4459, 0.1798, 0.5975, 0.5426],
  35800. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  35801. [ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729]],
  35802. device='cuda:0', dtype=torch.float64)
  35803. predictions are: tensor([[ 0.7850, -0.2571, 1.8136, -0.0547, -0.3984, 0.1662, 0.5929, 0.2880],
  35804. [ 0.7754, -0.2955, 1.7141, 0.1585, -0.6337, -0.1329, 0.4963, 0.4172],
  35805. [ 0.7866, -0.2281, 1.6788, -0.6753, -0.2686, -1.2191, 0.3706, 0.1885],
  35806. [ 0.6878, -0.3163, 1.6834, -0.0576, -0.4463, 0.3079, 0.4258, 0.2013],
  35807. [-1.5394, -1.7654, 1.7289, -0.9718, 0.0645, -1.2452, 0.7936, 0.3608],
  35808. [ 0.6353, -0.3698, 1.2097, -1.1548, -0.2937, -1.3861, 0.3841, 0.0950],
  35809. [ 0.6473, -0.3535, 0.9732, -1.2908, -0.5212, -1.0675, 0.3539, 0.1694],
  35810. [-1.8065, -1.9688, 0.9073, -1.2550, -0.4676, -1.4095, -0.0827, 0.2193]],
  35811. device='cuda:0', grad_fn=<AddmmBackward>)
  35812. landmarks are: tensor([[[ 0.5968, -0.3725, 1.8423, -0.1381, -0.4037, 0.1852, 0.6009,
  35813. 0.2776],
  35814. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  35815. 0.5239],
  35816. [ 0.5898, -0.3908, 1.6748, -0.6924, -0.2594, -1.3313, 0.3873,
  35817. 0.2006],
  35818. [ 0.5151, -0.4296, 1.7095, -0.1997, -0.4210, 0.1929, 0.3484,
  35819. 0.3047],
  35820. [-2.2859, -2.2859, 1.8018, -0.9002, 0.1910, -1.2467, 1.1057,
  35821. 0.3799],
  35822. [ 0.5784, -0.4153, 1.2972, -1.2541, -0.2265, -1.4553, 0.4741,
  35823. 0.2203],
  35824. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  35825. 0.2853],
  35826. [-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  35827. 0.3604]]], device='cuda:0')
  35828. loss_train_step before backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  35829. loss_train_step after backward: tensor(0.0284, device='cuda:0', grad_fn=<MseLossBackward>)
  35830. loss_train: 0.5077718859538436
  35831. step: 35
  35832. running loss: 0.014507768170109818
  35833. Train Steps: 35/90 Loss: 0.0145 torch.Size([8, 600, 800])
  35834. torch.Size([8, 8])
  35835. tensor([[0.6102, 0.3999, 0.8750, 0.5133, 0.3825, 0.4750, 0.5637, 0.5083],
  35836. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  35837. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  35838. [0.6102, 0.4020, 0.8638, 0.3717, 0.3625, 0.5017, 0.6038, 0.5500],
  35839. [0.6161, 0.4055, 0.8675, 0.3867, 0.3713, 0.4033, 0.5195, 0.5162],
  35840. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  35841. [0.6286, 0.4078, 0.8063, 0.2267, 0.4788, 0.1533, 0.5953, 0.4913],
  35842. [0.6204, 0.4055, 0.8438, 0.5733, 0.4574, 0.4801, 0.5487, 0.5617]],
  35843. device='cuda:0', dtype=torch.float64)
  35844. predictions are: tensor([[ 0.5011, -0.4467, 1.7422, 0.0539, -0.4417, -0.0660, 0.3217, 0.0671],
  35845. [ 0.5066, -0.4254, 1.6587, 0.2854, -0.3504, 0.1462, 0.4665, 0.3451],
  35846. [ 0.6545, -0.3217, 1.6254, 0.3260, -0.5526, -0.4922, 0.4399, 0.5244],
  35847. [ 0.5252, -0.4480, 1.6938, -0.6012, -0.5887, -0.0047, 0.6975, 0.3762],
  35848. [ 0.2379, -0.6145, 1.7338, -0.5259, -0.5895, -0.5340, 0.2075, 0.1188],
  35849. [ 0.6845, -0.3041, 1.5760, -0.7952, -0.6356, -0.4136, 0.3729, 0.3453],
  35850. [ 0.4442, -0.4868, 1.3857, -1.2715, -0.0972, -1.6168, 0.4491, 0.0212],
  35851. [ 0.4995, -0.4227, 1.5819, 0.3630, -0.1269, -0.0922, 0.3253, 0.3093]],
  35852. device='cuda:0', grad_fn=<AddmmBackward>)
  35853. landmarks are: tensor([[[ 0.5326, -0.4390, 1.7557, 0.0851, -0.5192, -0.0919, 0.3180,
  35854. 0.0620],
  35855. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  35856. 0.3161],
  35857. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  35858. 0.4778],
  35859. [ 0.5324, -0.4293, 1.7037, -0.5692, -0.6115, 0.0313, 0.5028,
  35860. 0.2545],
  35861. [ 0.5598, -0.4129, 1.7210, -0.4999, -0.5711, -0.4229, 0.1136,
  35862. 0.0983],
  35863. [ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  35864. 0.2930],
  35865. [ 0.6177, -0.4022, 1.4381, -1.2390, -0.0746, -1.5777, 0.4639,
  35866. -0.0168],
  35867. [ 0.5795, -0.4129, 1.6113, 0.3623, -0.1733, -0.0684, 0.2487,
  35868. 0.3084]]], device='cuda:0')
  35869. loss_train_step before backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  35870. loss_train_step after backward: tensor(0.0061, device='cuda:0', grad_fn=<MseLossBackward>)
  35871. loss_train: 0.5138542065396905
  35872. step: 36
  35873. running loss: 0.014273727959435847
  35874.  
  35875. Train Steps: 36/90 Loss: 0.0143 torch.Size([8, 600, 800])
  35876. torch.Size([8, 8])
  35877. tensor([[0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  35878. [0.6364, 0.4154, 0.8938, 0.3717, 0.4500, 0.2583, 0.6448, 0.5285],
  35879. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  35880. [0.6205, 0.4062, 0.8337, 0.2683, 0.3675, 0.4283, 0.6338, 0.5250],
  35881. [0.6325, 0.4066, 0.8438, 0.5350, 0.3925, 0.5267, 0.7113, 0.5795],
  35882. [0.6332, 0.4118, 0.9238, 0.4267, 0.4012, 0.4733, 0.7525, 0.5436],
  35883. [0.6200, 0.4024, 0.8390, 0.3139, 0.3525, 0.3833, 0.6162, 0.5383],
  35884. [0.6125, 0.3974, 0.7725, 0.2517, 0.3538, 0.3317, 0.5887, 0.5500]],
  35885. device='cuda:0', dtype=torch.float64)
  35886. predictions are: tensor([[ 0.7667, -0.1900, 1.5827, 0.3425, -0.4211, -0.4493, 0.1190, 0.4417],
  35887. [ 0.6480, -0.3304, 1.8848, -0.5738, -0.0757, -1.2094, 0.5862, 0.2134],
  35888. [ 0.4521, -0.4451, 1.6456, -0.5933, -0.4995, -0.8002, -0.0086, 0.1792],
  35889. [ 0.3198, -0.5839, 1.5540, -0.9149, -0.5333, -0.2930, 0.5008, 0.2137],
  35890. [ 0.6390, -0.3685, 1.5938, 0.3059, -0.3143, 0.2177, 0.8638, 0.3779],
  35891. [ 0.6208, -0.3873, 1.8751, -0.2567, -0.3241, 0.0175, 0.9235, 0.2965],
  35892. [ 0.2887, -0.6082, 1.6301, -0.7104, -0.5966, -0.4797, 0.4536, 0.2508],
  35893. [ 0.2123, -0.6332, 1.2361, -1.0201, -0.5911, -0.7614, 0.2279, 0.2410]],
  35894. device='cuda:0', grad_fn=<AddmmBackward>)
  35895. landmarks are: tensor([[[ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  35896. 0.4547],
  35897. [ 0.6537, -0.3671, 1.8423, -0.5692, -0.2074, -1.0927, 0.6926,
  35898. 0.1554],
  35899. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  35900. 0.2237],
  35901. [ 0.5799, -0.4099, 1.5651, -1.0465, -0.5885, -0.3075, 0.6413,
  35902. 0.1390],
  35903. [ 0.6355, -0.4080, 1.6113, 0.1852, -0.4730, 0.1467, 0.9996,
  35904. 0.3905],
  35905. [ 0.6388, -0.3840, 1.9808, -0.3152, -0.4326, -0.0996, 1.1897,
  35906. 0.2249],
  35907. [ 0.5779, -0.4275, 1.5894, -0.8362, -0.6577, -0.5153, 0.5605,
  35908. 0.2006],
  35909. [ 0.5430, -0.4503, 1.2822, -1.1235, -0.6520, -0.7540, 0.4335,
  35910. 0.2545]]], device='cuda:0')
  35911. loss_train_step before backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  35912. loss_train_step after backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  35913. loss_train: 0.5294085452333093
  35914. step: 37
  35915. running loss: 0.01430833906035971
  35916. Train Steps: 37/90 Loss: 0.0143 torch.Size([8, 600, 800])
  35917. torch.Size([8, 8])
  35918. tensor([[0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  35919. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  35920. [0.6109, 0.4036, 0.7188, 0.1750, 0.3850, 0.2550, 0.5863, 0.5567],
  35921. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  35922. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  35923. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  35924. [0.6224, 0.3964, 0.8225, 0.5717, 0.4150, 0.4617, 0.5775, 0.5267],
  35925. [ nan, nan, 0.7648, 0.2722, 0.3962, 0.2183, 0.5060, 0.5422]],
  35926. device='cuda:0', dtype=torch.float64)
  35927. predictions are: tensor([[ 0.8430, -0.2584, 1.6744, 0.3633, -0.4802, -0.2443, 0.5070, 0.2324],
  35928. [ 0.6614, -0.2980, 1.3332, -0.9772, -0.0668, -1.1946, 0.3990, 0.4166],
  35929. [ 0.6807, -0.3319, 1.1142, -1.3562, -0.3954, -1.0487, 0.4462, 0.3111],
  35930. [ 0.4883, -0.4645, 1.4983, -1.0006, -0.5738, -0.6161, 0.4483, 0.1922],
  35931. [-2.2025, -2.2211, 1.3382, -0.9761, -0.4328, -0.9994, 0.1234, 0.2760],
  35932. [ 0.7368, -0.3126, 1.1983, -1.3563, -0.3093, -1.0961, 0.5613, 0.3036],
  35933. [ 0.7644, -0.3089, 1.6260, 0.3014, -0.3090, -0.0725, 0.5097, 0.2114],
  35934. [-2.1184, -2.1461, 1.3030, -1.0153, -0.4229, -1.1399, 0.1310, 0.2134]],
  35935. device='cuda:0', grad_fn=<AddmmBackward>)
  35936. landmarks are: tensor([[[ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  35937. 0.1982],
  35938. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  35939. 0.3854],
  35940. [ 0.5356, -0.4217, 1.0339, -1.4776, -0.5076, -1.1081, 0.4219,
  35941. 0.2853],
  35942. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  35943. 0.0412],
  35944. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  35945. 0.3161],
  35946. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  35947. 0.2468],
  35948. [ 0.5891, -0.4550, 1.5132, 0.3546, -0.3691, -0.1535, 0.3815,
  35949. 0.1467],
  35950. [-2.2859, -2.2859, 1.2469, -1.0288, -0.4557, -1.2774, 0.0511,
  35951. 0.2183]]], device='cuda:0')
  35952. loss_train_step before backward: tensor(0.0101, device='cuda:0', grad_fn=<MseLossBackward>)
  35953. loss_train_step after backward: tensor(0.0101, device='cuda:0', grad_fn=<MseLossBackward>)
  35954. loss_train: 0.5395098840817809
  35955. step: 38
  35956. running loss: 0.014197628528467919
  35957. Train Steps: 38/90 Loss: 0.0142 torch.Size([8, 600, 800])
  35958. torch.Size([8, 8])
  35959. tensor([[0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  35960. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  35961. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  35962. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  35963. [0.6193, 0.4165, 0.8838, 0.4700, 0.4150, 0.4867, 0.5427, 0.5261],
  35964. [0.6269, 0.4073, 0.8900, 0.4933, 0.3625, 0.4183, 0.6288, 0.5150],
  35965. [0.6107, 0.4013, 0.8700, 0.4650, 0.5049, 0.5176, 0.5850, 0.5550],
  35966. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679]],
  35967. device='cuda:0', dtype=torch.float64)
  35968. predictions are: tensor([[ 0.5074, -0.4429, 1.7396, -0.2308, -0.5302, 0.2456, 0.5146, 0.1426],
  35969. [ 0.4840, -0.4596, 1.6347, 0.0541, -0.1286, 0.0975, 0.1633, 0.1393],
  35970. [ 0.8040, -0.2417, 1.2190, -1.0917, -0.2926, -1.5079, 0.3536, 0.2265],
  35971. [ 0.4214, -0.4987, 1.6166, -0.2834, -0.6564, 0.0112, 0.3598, 0.2051],
  35972. [ 0.5247, -0.3758, 1.7237, -0.0731, -0.4058, -0.1434, 0.2149, 0.2700],
  35973. [ 0.5961, -0.3832, 1.7580, 0.0120, -0.6258, -0.3360, 0.6261, 0.2390],
  35974. [ 0.6072, -0.3421, 1.6672, -0.1749, -0.0391, -0.0249, 0.3669, 0.3491],
  35975. [-2.1279, -2.1510, 1.6978, -1.1259, 0.1169, -1.2127, 1.0293, 0.4119]],
  35976. device='cuda:0', grad_fn=<AddmmBackward>)
  35977. landmarks are: tensor([[[ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  35978. -0.0322],
  35979. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  35980. 0.0532],
  35981. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  35982. 0.1855],
  35983. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  35984. 0.0081],
  35985. [ 0.5746, -0.3623, 1.7961, -0.1150, -0.3691, -0.0380, 0.2208,
  35986. 0.1439],
  35987. [ 0.6096, -0.4046, 1.8249, -0.0072, -0.6115, -0.3537, 0.6182,
  35988. 0.0928],
  35989. [ 0.5351, -0.4321, 1.7326, -0.1381, 0.0463, 0.1049, 0.4162,
  35990. 0.2776],
  35991. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  35992. 0.3371]]], device='cuda:0')
  35993. loss_train_step before backward: tensor(0.0078, device='cuda:0', grad_fn=<MseLossBackward>)
  35994. loss_train_step after backward: tensor(0.0078, device='cuda:0', grad_fn=<MseLossBackward>)
  35995. loss_train: 0.5473534110933542
  35996. step: 39
  35997. running loss: 0.014034702848547544
  35998. Train Steps: 39/90 Loss: 0.0140 torch.Size([8, 600, 800])
  35999. torch.Size([8, 8])
  36000. tensor([[0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083],
  36001. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  36002. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  36003. [0.6156, 0.4125, 0.8850, 0.4833, 0.4550, 0.5817, 0.5765, 0.5084],
  36004. [0.6193, 0.4079, 0.7288, 0.2500, 0.4250, 0.2550, 0.5989, 0.6266],
  36005. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  36006. [0.6343, 0.4097, 0.9287, 0.4367, 0.4313, 0.3600, 0.7248, 0.5841],
  36007. [0.6268, 0.4094, 0.9038, 0.4300, 0.3700, 0.3483, 0.6262, 0.5167]],
  36008. device='cuda:0', dtype=torch.float64)
  36009. predictions are: tensor([[ 5.9239e-01, -4.0632e-01, 1.4173e+00, -1.3067e+00, -5.8054e-01,
  36010. -8.9081e-01, 4.0951e-01, 3.0051e-02],
  36011. [ 5.6247e-01, -3.9829e-01, 1.0312e+00, -8.5208e-01, -5.4845e-01,
  36012. -9.3977e-01, 1.0921e-01, 2.4333e-01],
  36013. [ 1.8700e-01, -6.6109e-01, 1.2660e+00, -9.8780e-01, -5.7842e-01,
  36014. -8.6583e-01, 2.8633e-01, 2.2913e-01],
  36015. [ 9.6982e-02, -6.9610e-01, 1.8964e+00, -3.7301e-02, -1.7227e-01,
  36016. 4.4360e-01, 2.9462e-01, 1.1563e-01],
  36017. [ 6.4631e-01, -3.3672e-01, 1.1264e+00, -1.1566e+00, -2.4963e-01,
  36018. -1.0645e+00, 4.9173e-01, 6.1092e-01],
  36019. [ 3.9081e-01, -4.9535e-01, 1.7839e+00, 4.0092e-01, -2.1903e-01,
  36020. -9.6561e-04, 2.6731e-01, 3.3483e-01],
  36021. [ 6.0249e-01, -4.3258e-01, 1.9517e+00, -2.0927e-01, -2.7999e-01,
  36022. -5.2175e-01, 1.0574e+00, 3.2433e-01],
  36023. [ 4.8791e-01, -4.7775e-01, 1.9963e+00, -2.2164e-01, -4.3256e-01,
  36024. -5.8975e-01, 5.4839e-01, 1.9789e-01]], device='cuda:0',
  36025. grad_fn=<AddmmBackward>)
  36026. landmarks are: tensor([[[ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  36027. 0.0620],
  36028. [ 0.5425, -0.3998, 0.9263, -0.8683, -0.6000, -1.0157, 0.0990,
  36029. 0.2476],
  36030. [ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  36031. 0.2335],
  36032. [ 0.5573, -0.3808, 1.8018, -0.0534, -0.1843, 0.4008, 0.3769,
  36033. 0.0622],
  36034. [ 0.5746, -0.4021, 1.0801, -1.1312, -0.3229, -1.1081, 0.4803,
  36035. 0.6084],
  36036. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  36037. 0.3161],
  36038. [ 0.6438, -0.3936, 2.0039, -0.2690, -0.2940, -0.6231, 1.0618,
  36039. 0.4119],
  36040. [ 0.6094, -0.3947, 1.8885, -0.2998, -0.5769, -0.6770, 0.6067,
  36041. 0.1005]]], device='cuda:0')
  36042. loss_train_step before backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  36043. loss_train_step after backward: tensor(0.0117, device='cuda:0', grad_fn=<MseLossBackward>)
  36044. loss_train: 0.5590283134952188
  36045. step: 40
  36046. running loss: 0.01397570783738047
  36047.  
  36048. Train Steps: 40/90 Loss: 0.0140 torch.Size([8, 600, 800])
  36049. torch.Size([8, 8])
  36050. tensor([[0.6178, 0.4012, 0.8900, 0.4495, 0.3891, 0.5617, 0.5972, 0.4879],
  36051. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  36052. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  36053. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  36054. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  36055. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  36056. [0.6310, 0.4017, 0.8563, 0.5800, 0.3688, 0.4750, 0.6326, 0.5006],
  36057. [0.6223, 0.3990, 0.8037, 0.2800, 0.4000, 0.2283, 0.5864, 0.5208]],
  36058. device='cuda:0', dtype=torch.float64)
  36059. predictions are: tensor([[ 0.4518, -0.4911, 1.8600, -0.2607, -0.4129, 0.5143, 0.4992, 0.0568],
  36060. [-0.3478, -1.0317, 1.0285, -1.3610, -0.1993, -1.5180, 0.1647, 0.1402],
  36061. [ 0.6369, -0.3709, 1.4022, -0.9832, -0.4957, -0.6442, 0.4793, 0.2773],
  36062. [ 0.5346, -0.3425, 1.6216, 0.1690, -0.4701, -0.3177, 0.2371, 0.5411],
  36063. [ 0.7848, -0.2854, 1.9911, -0.3355, -0.1997, -0.7153, 1.0501, 0.2050],
  36064. [ 0.3135, -0.5431, 1.6285, -0.5310, -0.5323, -0.6793, 0.0580, 0.3620],
  36065. [ 0.3326, -0.6026, 1.6768, 0.3122, -0.5380, 0.0443, 0.6050, 0.0992],
  36066. [ 0.5161, -0.4441, 1.4498, -1.1177, -0.3233, -1.1196, 0.4261, 0.2058]],
  36067. device='cuda:0', grad_fn=<AddmmBackward>)
  36068. landmarks are: tensor([[[ 0.5676, -0.4327, 1.8252, -0.2095, -0.4886, 0.3084, 0.4727,
  36069. -0.0322],
  36070. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  36071. 0.0261],
  36072. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  36073. 0.1931],
  36074. [ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  36075. 0.4547],
  36076. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  36077. 0.2142],
  36078. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  36079. 0.2837],
  36080. [ 0.6286, -0.4303, 1.6691, 0.3931, -0.5827, -0.0919, 0.6359,
  36081. 0.0261],
  36082. [ 0.5885, -0.4429, 1.4266, -0.9926, -0.4383, -1.2313, 0.4228,
  36083. 0.1195]]], device='cuda:0')
  36084. loss_train_step before backward: tensor(0.0280, device='cuda:0', grad_fn=<MseLossBackward>)
  36085. loss_train_step after backward: tensor(0.0280, device='cuda:0', grad_fn=<MseLossBackward>)
  36086. loss_train: 0.5870048655197024
  36087. step: 41
  36088. running loss: 0.014317191841943962
  36089. Train Steps: 41/90 Loss: 0.0143 torch.Size([8, 600, 800])
  36090. torch.Size([8, 8])
  36091. tensor([[0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  36092. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  36093. [0.6311, 0.3998, 0.7975, 0.5767, 0.3838, 0.4850, 0.7327, 0.5343],
  36094. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  36095. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  36096. [0.6125, 0.4076, 0.8488, 0.3883, 0.3700, 0.3683, 0.5026, 0.5505],
  36097. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  36098. [0.6250, 0.4110, 0.7238, 0.2067, 0.4263, 0.1883, 0.5625, 0.5633]],
  36099. device='cuda:0', dtype=torch.float64)
  36100. predictions are: tensor([[ 0.5652, -0.4335, 1.8033, 0.0198, -0.3656, 0.0220, 0.6305, 0.2068],
  36101. [ 0.4282, -0.5123, 1.7713, -0.2921, -0.4786, 0.0357, 0.2857, 0.0134],
  36102. [ 0.5329, -0.4882, 1.5947, 0.2187, -0.4321, 0.0283, 1.0430, 0.1789],
  36103. [ 0.7813, -0.2962, 1.0969, -1.1801, -0.4818, -1.0343, 0.2377, 0.0690],
  36104. [ 0.2271, -0.6053, 1.7303, -0.5249, -0.5412, -0.5170, 0.1491, 0.3835],
  36105. [-0.0694, -0.8135, 1.7507, -0.5003, -0.5468, -0.5444, 0.1607, 0.2659],
  36106. [ 0.7761, -0.2279, 1.7220, -0.3759, -0.4916, -0.7065, 0.3742, 0.4468],
  36107. [ 0.3328, -0.5700, 1.1195, -1.3783, -0.1821, -1.4471, 0.4467, 0.2584]],
  36108. device='cuda:0', grad_fn=<AddmmBackward>)
  36109. landmarks are: tensor([[[ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  36110. 0.2237],
  36111. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  36112. 0.0502],
  36113. [ 0.6289, -0.4393, 1.3977, 0.3777, -0.5134, -0.0457, 1.0984,
  36114. 0.1821],
  36115. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  36116. 0.0802],
  36117. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  36118. 0.4348],
  36119. [ 0.5433, -0.4032, 1.6344, -0.4922, -0.5769, -0.5846, 0.0357,
  36120. 0.2567],
  36121. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  36122. 0.3238],
  36123. [ 0.6010, -0.3875, 1.0570, -1.3313, -0.3171, -1.4160, 0.3122,
  36124. 0.3161]]], device='cuda:0')
  36125. loss_train_step before backward: tensor(0.0210, device='cuda:0', grad_fn=<MseLossBackward>)
  36126. loss_train_step after backward: tensor(0.0210, device='cuda:0', grad_fn=<MseLossBackward>)
  36127. loss_train: 0.6079580811783671
  36128. step: 42
  36129. running loss: 0.014475192409008741
  36130. Train Steps: 42/90 Loss: 0.0145 torch.Size([8, 600, 800])
  36131. torch.Size([8, 8])
  36132. tensor([[ nan, nan, 0.6859, 0.2194, 0.4150, 0.1867, 0.5153, 0.5729],
  36133. [0.6201, 0.4102, 0.7288, 0.2417, 0.4150, 0.2383, 0.6100, 0.5500],
  36134. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  36135. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  36136. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  36137. [0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  36138. [0.6224, 0.4097, 0.7438, 0.2267, 0.3850, 0.2850, 0.5988, 0.5250],
  36139. [0.6200, 0.3961, 0.8461, 0.5497, 0.4142, 0.4577, 0.5892, 0.5402]],
  36140. device='cuda:0', dtype=torch.float64)
  36141. predictions are: tensor([[-2.1093, -2.1695, 1.0704, -1.1241, -0.2829, -1.2708, 0.3400, 0.3245],
  36142. [ 0.9580, -0.1868, 1.1554, -1.1501, -0.3985, -1.0545, 0.5273, 0.2618],
  36143. [ 0.7270, -0.3383, 1.1407, -1.2378, -0.3266, -1.1439, 0.4433, 0.2077],
  36144. [ 0.6284, -0.3472, 1.6952, -0.4482, -0.5650, -0.6186, 0.1774, 0.2573],
  36145. [-2.4414, -2.3598, 1.4631, -0.6933, -0.5079, -0.7125, 0.2897, 0.2286],
  36146. [ 0.6782, -0.3799, 1.1089, -1.2278, -0.2241, -1.4500, 0.2807, 0.0738],
  36147. [ 0.7070, -0.3484, 1.2289, -1.1555, -0.4486, -0.8100, 0.5723, 0.2394],
  36148. [ 0.6015, -0.4189, 1.7105, 0.1990, -0.4040, 0.0405, 0.5011, 0.1426]],
  36149. device='cuda:0', grad_fn=<AddmmBackward>)
  36150. landmarks are: tensor([[[-2.2859, -2.2859, 0.8824, -1.2727, -0.3691, -1.4237, 0.0943,
  36151. 0.3604],
  36152. [ 0.5784, -0.3913, 1.0801, -1.1697, -0.3691, -1.1851, 0.5316,
  36153. 0.2545],
  36154. [ 0.5850, -0.3925, 1.0513, -1.3467, -0.3517, -1.2620, 0.4739,
  36155. 0.1544],
  36156. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  36157. 0.2837],
  36158. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  36159. 0.2837],
  36160. [ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  36161. 0.0261],
  36162. [ 0.5891, -0.3937, 1.1494, -1.2390, -0.5076, -0.9695, 0.4797,
  36163. 0.1390],
  36164. [ 0.5780, -0.4565, 1.6221, 0.2532, -0.3728, -0.1718, 0.4357,
  36165. 0.2091]]], device='cuda:0')
  36166. loss_train_step before backward: tensor(0.0137, device='cuda:0', grad_fn=<MseLossBackward>)
  36167. loss_train_step after backward: tensor(0.0137, device='cuda:0', grad_fn=<MseLossBackward>)
  36168. loss_train: 0.621706354431808
  36169. step: 43
  36170. running loss: 0.014458287312367629
  36171. Train Steps: 43/90 Loss: 0.0145 torch.Size([8, 600, 800])
  36172. torch.Size([8, 8])
  36173. tensor([[0.6212, 0.4171, 0.7875, 0.3633, 0.3813, 0.2933, 0.5675, 0.5700],
  36174. [0.6264, 0.4071, 0.9038, 0.3867, 0.3663, 0.3917, 0.6338, 0.5283],
  36175. [ nan, nan, 0.8888, 0.3100, 0.5262, 0.2817, 0.7145, 0.6003],
  36176. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  36177. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  36178. [ nan, nan, 0.7625, 0.2433, 0.3713, 0.2867, 0.5235, 0.5220],
  36179. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  36180. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083]],
  36181. device='cuda:0', dtype=torch.float64)
  36182. predictions are: tensor([[ 0.7925, -0.2197, 1.2258, -0.5560, -0.5129, -0.8534, 0.1539, 0.3959],
  36183. [ 0.9824, -0.1438, 1.7369, -0.4676, -0.5488, -0.3900, 0.4122, 0.0837],
  36184. [-0.5162, -1.0907, 1.6477, -0.7800, 0.1305, -1.0171, 0.9095, 0.4633],
  36185. [-2.3501, -2.3298, 1.2146, -1.0448, -0.2453, -1.2660, 0.2259, 0.1469],
  36186. [ 0.8942, -0.2418, 1.7042, -0.0787, -0.5784, -0.3624, 0.6176, 0.1548],
  36187. [-2.1278, -2.1791, 1.1879, -1.0004, -0.4103, -0.9609, 0.1842, 0.1987],
  36188. [ 0.9677, -0.1782, 1.7206, -0.1119, -0.5416, 0.0892, 0.8351, 0.1302],
  36189. [ 0.9036, -0.2227, 1.1927, -1.2856, -0.5745, -0.8649, 0.2551, 0.0385]],
  36190. device='cuda:0', grad_fn=<AddmmBackward>)
  36191. landmarks are: tensor([[[ 0.5832, -0.3593, 1.3515, -0.6077, -0.5249, -0.9310, 0.3353,
  36192. 0.3469],
  36193. [ 0.6073, -0.4058, 1.8885, -0.4999, -0.5942, -0.4768, 0.6413,
  36194. 0.1544],
  36195. [-2.2859, -2.2859, 1.8192, -0.8540, 0.1448, -0.9849, 1.0143,
  36196. 0.4867],
  36197. [-2.2859, -2.2859, 1.3400, -1.0388, -0.3055, -1.4930, 0.1157,
  36198. 0.0231],
  36199. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  36200. 0.1768],
  36201. [-2.2859, -2.2859, 1.2360, -1.1620, -0.5711, -0.9618, 0.1322,
  36202. 0.1253],
  36203. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  36204. 0.2302],
  36205. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  36206. 0.0620]]], device='cuda:0')
  36207. loss_train_step before backward: tensor(0.0917, device='cuda:0', grad_fn=<MseLossBackward>)
  36208. loss_train_step after backward: tensor(0.0917, device='cuda:0', grad_fn=<MseLossBackward>)
  36209. loss_train: 0.7134014395996928
  36210. step: 44
  36211. running loss: 0.0162136690818112
  36212.  
  36213. Train Steps: 44/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36214. torch.Size([8, 8])
  36215. tensor([[0.6037, 0.4020, 0.8300, 0.4033, 0.3575, 0.4883, 0.5647, 0.5631],
  36216. [0.6204, 0.4007, 0.7838, 0.2100, 0.4475, 0.1733, 0.5825, 0.5167],
  36217. [ nan, nan, 0.6488, 0.1817, 0.4325, 0.1867, 0.5475, 0.5733],
  36218. [0.6149, 0.4054, 0.6713, 0.2333, 0.4025, 0.2017, 0.5213, 0.5695],
  36219. [0.6293, 0.4024, 0.8750, 0.5000, 0.4012, 0.5733, 0.7121, 0.5633],
  36220. [0.6252, 0.4158, 0.8988, 0.4083, 0.3788, 0.4783, 0.6225, 0.5633],
  36221. [0.6229, 0.4086, 0.7538, 0.2600, 0.4775, 0.1617, 0.5900, 0.5383],
  36222. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412]],
  36223. device='cuda:0', dtype=torch.float64)
  36224. predictions are: tensor([[ 0.2478, -0.5887, 1.5762, -0.3955, -0.6159, -0.0235, 0.3924, 0.1690],
  36225. [ 0.5105, -0.4776, 1.2312, -1.2097, -0.2561, -1.4255, 0.4250, 0.0495],
  36226. [-2.8672, -2.7021, 0.9996, -1.1260, -0.2092, -1.3250, 0.2963, 0.3326],
  36227. [ 0.4463, -0.5024, 0.8379, -1.1694, -0.4447, -1.2806, 0.0816, 0.2743],
  36228. [ 0.4706, -0.4984, 1.7752, 0.0275, -0.4758, 0.3607, 0.8918, 0.1198],
  36229. [ 0.3932, -0.5023, 1.7916, -0.3608, -0.5850, -0.0992, 0.6404, 0.2181],
  36230. [ 0.5354, -0.4506, 1.1401, -1.1430, -0.1944, -1.4443, 0.3866, 0.1853],
  36231. [ 0.5298, -0.4138, 1.7078, -0.5646, -0.5096, -0.9205, 0.3372, 0.1251]],
  36232. device='cuda:0', grad_fn=<AddmmBackward>)
  36233. landmarks are: tensor([[[ 0.5027, -0.4289, 1.5478, -0.4229, -0.6346, -0.0303, 0.3223,
  36234. 0.3148],
  36235. [ 0.5796, -0.4351, 1.3342, -1.3159, -0.2189, -1.4853, 0.4046,
  36236. 0.1005],
  36237. [-2.2859, -2.2859, 0.7106, -1.4468, -0.2882, -1.4237, 0.2430,
  36238. 0.3623],
  36239. [ 0.5544, -0.4133, 0.8145, -1.2082, -0.4268, -1.3544, 0.1221,
  36240. 0.3446],
  36241. [ 0.6207, -0.4273, 1.7557, 0.0236, -0.4326, 0.3623, 1.0033,
  36242. 0.3157],
  36243. [ 0.6017, -0.3654, 1.8654, -0.3998, -0.5365, -0.0765, 0.5894,
  36244. 0.3161],
  36245. [ 0.5911, -0.3984, 1.1956, -1.0850, -0.0804, -1.5392, 0.4393,
  36246. 0.2006],
  36247. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  36248. 0.2139]]], device='cuda:0')
  36249. loss_train_step before backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  36250. loss_train_step after backward: tensor(0.0179, device='cuda:0', grad_fn=<MseLossBackward>)
  36251. loss_train: 0.7312849136069417
  36252. step: 45
  36253. running loss: 0.016250775857932036
  36254. Train Steps: 45/90 Loss: 0.0163 torch.Size([8, 600, 800])
  36255. torch.Size([8, 8])
  36256. tensor([[0.6109, 0.4009, 0.8725, 0.4700, 0.3550, 0.4167, 0.5650, 0.5117],
  36257. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  36258. [0.6161, 0.4040, 0.7525, 0.2133, 0.4125, 0.2067, 0.5787, 0.5117],
  36259. [0.6250, 0.4236, 0.8638, 0.3767, 0.4050, 0.3150, 0.5649, 0.5799],
  36260. [0.6198, 0.4101, 0.8838, 0.5283, 0.3763, 0.5267, 0.5913, 0.5567],
  36261. [0.6122, 0.4006, 0.8850, 0.4217, 0.4088, 0.5517, 0.6063, 0.5517],
  36262. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  36263. [0.6098, 0.3991, 0.8638, 0.4717, 0.4263, 0.4967, 0.5212, 0.5650]],
  36264. device='cuda:0', dtype=torch.float64)
  36265. predictions are: tensor([[ 0.4556, -0.5099, 1.7766, -0.1818, -0.6755, -0.4903, 0.4060, 0.0858],
  36266. [ 0.5090, -0.4585, 1.5956, 0.1512, -0.6968, -0.7298, 0.3877, 0.2242],
  36267. [ 0.5739, -0.4423, 1.0018, -1.4543, -0.4832, -1.4066, 0.4122, 0.0719],
  36268. [ 0.1892, -0.6547, 1.6334, -0.6650, -0.4261, -0.9657, 0.4471, 0.4533],
  36269. [ 0.6028, -0.4209, 1.7416, 0.1237, -0.5934, -0.0068, 0.6176, 0.2581],
  36270. [ 0.5751, -0.4199, 1.8006, -0.3498, -0.4233, 0.1760, 0.6082, 0.1663],
  36271. [ 0.5965, -0.4214, 1.7018, -0.1034, -0.2478, -0.0326, 0.2991, -0.0696],
  36272. [ 0.4331, -0.5177, 1.6583, -0.1081, -0.3108, -0.0744, 0.3485, 0.2111]],
  36273. device='cuda:0', grad_fn=<AddmmBackward>)
  36274. landmarks are: tensor([[[ 0.5356, -0.4343, 1.7441, -0.1150, -0.6462, -0.3614, 0.3238,
  36275. 0.0774],
  36276. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  36277. 0.2058],
  36278. [ 0.5598, -0.4201, 1.1898, -1.3005, -0.3806, -1.3313, 0.3873,
  36279. 0.0774],
  36280. [ 0.6008, -0.3293, 1.7037, -0.5461, -0.4152, -0.8309, 0.3234,
  36281. 0.3928],
  36282. [ 0.5770, -0.3918, 1.7961, 0.1544, -0.5480, 0.1467, 0.4450,
  36283. 0.2853],
  36284. [ 0.5417, -0.4355, 1.8018, -0.3383, -0.3979, 0.2622, 0.5143,
  36285. 0.2622],
  36286. [ 0.5249, -0.4473, 1.7326, -0.0919, -0.2016, 0.1544, 0.1733,
  36287. 0.0412],
  36288. [ 0.5308, -0.4425, 1.7037, -0.1073, -0.3171, 0.0082, 0.1217,
  36289. 0.3238]]], device='cuda:0')
  36290. loss_train_step before backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  36291. loss_train_step after backward: tensor(0.0118, device='cuda:0', grad_fn=<MseLossBackward>)
  36292. loss_train: 0.7431346783414483
  36293. step: 46
  36294. running loss: 0.016155101703074964
  36295. Train Steps: 46/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36296. torch.Size([8, 8])
  36297. tensor([[0.6150, 0.4097, 0.7468, 0.3194, 0.3825, 0.2633, 0.5463, 0.5800],
  36298. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  36299. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  36300. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  36301. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  36302. [0.6200, 0.4059, 0.8700, 0.4900, 0.4163, 0.5000, 0.6162, 0.5467],
  36303. [0.6048, 0.3987, 0.7620, 0.3861, 0.3475, 0.4167, 0.5137, 0.5466],
  36304. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702]],
  36305. device='cuda:0', dtype=torch.float64)
  36306. predictions are: tensor([[ 0.5993, -0.3803, 1.1228, -0.8423, -0.6056, -1.1385, 0.0585, 0.3099],
  36307. [ 0.6539, -0.4069, 1.4465, -1.0566, -0.4854, -1.0856, 0.7644, 0.0711],
  36308. [ 0.5155, -0.4606, 1.3688, -1.0454, -0.7240, -0.7367, 0.3963, 0.0150],
  36309. [ 0.5882, -0.4315, 1.0366, -1.3716, -0.4745, -1.2091, 0.5045, 0.1624],
  36310. [ 0.4665, -0.4729, 1.7877, -0.1115, -0.4896, -0.3687, 0.1220, 0.2028],
  36311. [ 0.4432, -0.5455, 1.8228, 0.0551, -0.3761, -0.0258, 0.6413, 0.1544],
  36312. [ 0.5897, -0.4017, 1.2351, -0.5070, -0.7453, -0.4400, 0.1918, 0.1963],
  36313. [-1.4964, -1.7881, 1.8678, -0.7517, 0.1144, -1.2951, 1.0231, 0.3557]],
  36314. device='cuda:0', grad_fn=<AddmmBackward>)
  36315. landmarks are: tensor([[[ 0.5548, -0.3936, 1.1634, -0.8105, -0.5192, -1.0696, 0.2372,
  36316. 0.3931],
  36317. [ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  36318. 0.1214],
  36319. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  36320. 0.0412],
  36321. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  36322. 0.2058],
  36323. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  36324. 0.2409],
  36325. [ 0.5776, -0.4109, 1.7326, -0.0226, -0.3633, 0.0236, 0.5605,
  36326. 0.2391],
  36327. [ 0.5076, -0.4443, 1.2337, -0.5023, -0.6808, -0.3614, 0.0866,
  36328. 0.2386],
  36329. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  36330. 0.3478]]], device='cuda:0')
  36331. loss_train_step before backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  36332. loss_train_step after backward: tensor(0.0182, device='cuda:0', grad_fn=<MseLossBackward>)
  36333. loss_train: 0.7613579174503684
  36334. step: 47
  36335. running loss: 0.016199104626603584
  36336. Train Steps: 47/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36337. torch.Size([8, 8])
  36338. tensor([[0.6202, 0.4079, 0.8025, 0.2500, 0.3763, 0.3217, 0.6125, 0.5533],
  36339. [0.6218, 0.4137, 0.7263, 0.2233, 0.4075, 0.2650, 0.6212, 0.5783],
  36340. [0.6282, 0.4034, 0.7830, 0.2080, 0.4532, 0.2080, 0.6404, 0.5323],
  36341. [0.6129, 0.3930, 0.8769, 0.5105, 0.4146, 0.5642, 0.6000, 0.5082],
  36342. [0.6226, 0.4103, 0.8575, 0.3450, 0.4388, 0.2067, 0.5787, 0.5383],
  36343. [0.6224, 0.4179, 0.8700, 0.5683, 0.4037, 0.4683, 0.5650, 0.5600],
  36344. [0.6057, 0.4011, 0.8750, 0.4267, 0.4400, 0.5800, 0.5845, 0.5585],
  36345. [0.6187, 0.4104, 0.7126, 0.2069, 0.3950, 0.2517, 0.5913, 0.5683]],
  36346. device='cuda:0', dtype=torch.float64)
  36347. predictions are: tensor([[ 0.4333, -0.5111, 1.4087, -1.0953, -0.6372, -0.8462, 0.4818, 0.1355],
  36348. [ 0.3784, -0.5491, 1.0189, -1.2366, -0.5795, -1.2066, 0.4777, 0.2933],
  36349. [ 0.6046, -0.4339, 1.2734, -1.2354, -0.3520, -1.3963, 0.5953, 0.0656],
  36350. [ 0.2975, -0.6681, 1.8023, 0.2010, -0.3973, 0.1365, 0.5395, 0.0553],
  36351. [ 0.5932, -0.3750, 1.7603, -0.6885, -0.3399, -1.3641, 0.3018, 0.1969],
  36352. [ 0.2940, -0.5934, 1.7302, 0.3709, -0.5093, -0.3573, 0.4433, 0.4143],
  36353. [ 0.3846, -0.5253, 1.8102, -0.2334, -0.3446, 0.1800, 0.4126, 0.1311],
  36354. [ 0.4028, -0.5231, 0.8992, -1.3941, -0.5818, -1.2945, 0.3011, 0.2570]],
  36355. device='cuda:0', grad_fn=<AddmmBackward>)
  36356. landmarks are: tensor([[[ 0.5788, -0.4020, 1.4208, -1.1312, -0.5480, -0.8002, 0.5432,
  36357. 0.2699],
  36358. [ 0.5863, -0.3749, 1.0686, -1.2543, -0.4037, -1.0619, 0.5836,
  36359. 0.3854],
  36360. [ 0.6158, -0.4225, 1.3307, -1.3253, -0.1924, -1.3252, 0.6721,
  36361. 0.1727],
  36362. [ 0.5450, -0.4706, 1.7643, 0.0722, -0.3708, 0.3200, 0.4854,
  36363. 0.0612],
  36364. [ 0.5898, -0.3908, 1.6748, -0.6924, -0.2594, -1.3313, 0.3873,
  36365. 0.2006],
  36366. [ 0.5891, -0.3557, 1.7326, 0.3392, -0.4210, -0.1227, 0.3238,
  36367. 0.3007],
  36368. [ 0.5115, -0.4332, 1.7557, -0.3152, -0.2536, 0.3931, 0.4139,
  36369. 0.2936],
  36370. [ 0.5718, -0.3905, 1.0053, -1.3305, -0.4614, -1.1235, 0.4450,
  36371. 0.3392]]], device='cuda:0')
  36372. loss_train_step before backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  36373. loss_train_step after backward: tensor(0.0146, device='cuda:0', grad_fn=<MseLossBackward>)
  36374. loss_train: 0.7759437253698707
  36375. step: 48
  36376. running loss: 0.016165494278538972
  36377.  
  36378. Train Steps: 48/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36379. torch.Size([8, 8])
  36380. tensor([[0.6264, 0.4069, 0.7900, 0.1650, 0.4275, 0.2267, 0.6290, 0.4947],
  36381. [0.6271, 0.4040, 0.9000, 0.3250, 0.4938, 0.2300, 0.7192, 0.5413],
  36382. [0.6275, 0.4048, 0.8488, 0.2883, 0.4463, 0.2033, 0.6321, 0.5155],
  36383. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  36384. [0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  36385. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993],
  36386. [0.6175, 0.3997, 0.6737, 0.2500, 0.4313, 0.1933, 0.5513, 0.5750],
  36387. [0.6182, 0.3930, 0.8841, 0.3892, 0.3556, 0.4967, 0.6222, 0.5279]],
  36388. device='cuda:0', dtype=torch.float64)
  36389. predictions are: tensor([[ 4.9754e-01, -5.1794e-01, 1.2568e+00, -1.4171e+00, -3.8776e-01,
  36390. -1.1685e+00, 5.8964e-01, 4.4017e-02],
  36391. [ 2.9641e-01, -6.1759e-01, 1.8639e+00, -7.7632e-01, -1.0200e-01,
  36392. -1.1415e+00, 9.5960e-01, 2.4079e-01],
  36393. [ 6.7223e-01, -3.8713e-01, 1.6328e+00, -9.0681e-01, -2.8939e-01,
  36394. -1.2221e+00, 7.3069e-01, 1.4676e-01],
  36395. [ 5.1888e-01, -4.4076e-01, 1.7888e+00, -4.8815e-01, -5.6462e-01,
  36396. -9.1237e-01, 3.5224e-01, 2.3299e-01],
  36397. [ 3.6893e-01, -5.5036e-01, 1.7233e+00, -2.2765e-01, -7.2718e-01,
  36398. -5.9332e-01, 1.3962e-01, 3.8474e-01],
  36399. [ 6.5524e-01, -3.6731e-01, 9.2200e-01, -1.1836e+00, -5.1188e-01,
  36400. -1.2763e+00, 6.7762e-02, -1.0445e-03],
  36401. [ 2.2790e-01, -6.3644e-01, 6.8836e-01, -1.2796e+00, -3.6872e-01,
  36402. -1.4031e+00, 1.8171e-01, 4.5589e-01],
  36403. [-1.6043e-02, -8.6411e-01, 1.7684e+00, -4.3701e-01, -6.8084e-01,
  36404. 4.7354e-02, 7.2844e-01, 1.9542e-01]], device='cuda:0',
  36405. grad_fn=<AddmmBackward>)
  36406. landmarks are: tensor([[[ 6.0739e-01, -4.0631e-01, 1.3630e+00, -1.5238e+00, -3.1132e-01,
  36407. -1.2390e+00, 6.1950e-01, -9.2270e-04],
  36408. [ 6.1083e-01, -4.2008e-01, 1.8711e+00, -7.8476e-01, -5.3118e-03,
  36409. -1.2236e+00, 1.0362e+00, 2.1421e-01],
  36410. [ 6.1259e-01, -4.1609e-01, 1.6344e+00, -9.5412e-01, -2.2471e-01,
  36411. -1.3467e+00, 6.3389e-01, 9.5262e-02],
  36412. [ 5.7841e-01, -4.0062e-01, 1.7911e+00, -5.7008e-01, -5.1916e-01,
  36413. -1.0331e+00, 4.1374e-01, 2.1391e-01],
  36414. [ 5.6969e-01, -4.1132e-01, 1.7499e+00, -2.7667e-01, -6.4042e-01,
  36415. -7.1547e-01, 1.5756e-01, 4.0319e-01],
  36416. [ 5.3837e-01, -4.3934e-01, 9.7621e-01, -1.1851e+00, -4.2102e-01,
  36417. -1.3852e+00, 1.7122e-01, 2.0118e-02],
  36418. [ 5.6634e-01, -4.3965e-01, 8.2610e-01, -1.1312e+00, -2.9400e-01,
  36419. -1.3929e+00, 2.6028e-01, 3.6998e-01],
  36420. [ 5.6966e-01, -4.7064e-01, 1.7976e+00, -4.8841e-01, -6.4332e-01,
  36421. 8.0865e-03, 5.8780e-01, 1.5252e-01]]], device='cuda:0')
  36422. loss_train_step before backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  36423. loss_train_step after backward: tensor(0.0183, device='cuda:0', grad_fn=<MseLossBackward>)
  36424. loss_train: 0.7942405147477984
  36425. step: 49
  36426. running loss: 0.016208990096893847
  36427. Train Steps: 49/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36428. torch.Size([8, 8])
  36429. tensor([[0.6271, 0.4024, 0.9000, 0.3517, 0.3700, 0.4517, 0.6931, 0.5285],
  36430. [0.6329, 0.4175, 0.8550, 0.2333, 0.5425, 0.2250, 0.7398, 0.5609],
  36431. [0.6058, 0.3978, 0.8287, 0.3600, 0.3400, 0.4050, 0.5529, 0.5461],
  36432. [0.6273, 0.4105, 0.8988, 0.4517, 0.3912, 0.2550, 0.5894, 0.4811],
  36433. [0.6325, 0.4165, 0.9000, 0.4617, 0.3813, 0.4900, 0.7485, 0.5447],
  36434. [0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  36435. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  36436. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633]],
  36437. device='cuda:0', dtype=torch.float64)
  36438. predictions are: tensor([[ 0.3633, -0.6099, 1.7727, -0.7365, -0.6176, -0.1545, 0.9483, 0.1723],
  36439. [ 0.3857, -0.5608, 1.5930, -1.4546, 0.1408, -1.4649, 1.0670, 0.2022],
  36440. [ 0.3727, -0.5318, 1.4499, -0.7004, -0.8048, -0.4178, 0.1934, 0.1654],
  36441. [ 0.6114, -0.3969, 1.8067, -0.3324, -0.5716, -1.1282, 0.2881, -0.0128],
  36442. [ 0.6555, -0.3796, 1.7888, -0.1854, -0.6189, 0.0533, 0.9555, 0.2217],
  36443. [ 0.5391, -0.4041, 1.6146, -0.1128, -0.4412, -1.0803, 0.1859, 0.5246],
  36444. [ 0.6420, -0.3471, 1.5873, 0.1019, -0.2799, 0.1364, -0.0239, 0.1821],
  36445. [ 0.5307, -0.4357, 1.6244, 0.2666, -0.3907, -0.1204, 0.2242, 0.3382]],
  36446. device='cuda:0', grad_fn=<AddmmBackward>)
  36447. landmarks are: tensor([[[ 0.6108, -0.4273, 1.8711, -0.6616, -0.5769, -0.1997, 0.9156,
  36448. 0.1554],
  36449. [ 0.6372, -0.3575, 1.6633, -1.2082, 0.2199, -1.2467, 1.1313,
  36450. 0.3050],
  36451. [ 0.5124, -0.4483, 1.5420, -0.6231, -0.7155, -0.4152, 0.2679,
  36452. 0.2365],
  36453. [ 0.6116, -0.3898, 1.8654, -0.1997, -0.4788, -1.1081, 0.4367,
  36454. -0.0637],
  36455. [ 0.6355, -0.3623, 1.8711, -0.1535, -0.5249, -0.0226, 1.1715,
  36456. 0.2302],
  36457. [ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  36458. 0.5762],
  36459. [ 0.5447, -0.3838, 1.7037, 0.1775, -0.1497, 0.1467, 0.1128,
  36460. 0.2431],
  36461. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  36462. 0.3161]]], device='cuda:0')
  36463. loss_train_step before backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  36464. loss_train_step after backward: tensor(0.0114, device='cuda:0', grad_fn=<MseLossBackward>)
  36465. loss_train: 0.8056448325514793
  36466. step: 50
  36467. running loss: 0.016112896651029586
  36468. Train Steps: 50/90 Loss: 0.0161 torch.Size([8, 600, 800])
  36469. torch.Size([8, 8])
  36470. tensor([[0.6296, 0.3989, 0.9000, 0.4150, 0.3613, 0.3867, 0.6400, 0.5100],
  36471. [0.6172, 0.4055, 0.8175, 0.2650, 0.3550, 0.3683, 0.5787, 0.5550],
  36472. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  36473. [0.6127, 0.4084, 0.8700, 0.4467, 0.3987, 0.4317, 0.5013, 0.5471],
  36474. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650],
  36475. [0.6225, 0.4191, 0.8500, 0.4167, 0.3688, 0.3233, 0.5650, 0.5650],
  36476. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  36477. [0.6132, 0.3930, 0.8672, 0.4754, 0.3712, 0.5222, 0.5974, 0.5098]],
  36478. device='cuda:0', dtype=torch.float64)
  36479. predictions are: tensor([[ 6.5583e-01, -4.2216e-01, 1.9241e+00, -2.7688e-01, -5.5424e-01,
  36480. -6.0314e-01, 9.0408e-01, 1.5943e-01],
  36481. [ 4.8151e-01, -4.7833e-01, 1.4162e+00, -1.0737e+00, -6.1699e-01,
  36482. -6.1750e-01, 5.0363e-01, 2.4150e-01],
  36483. [ 5.1282e-01, -4.4040e-01, 1.6403e+00, -5.1735e-01, -5.4924e-01,
  36484. -9.2146e-01, 2.4885e-01, 2.8576e-01],
  36485. [ 5.4983e-01, -4.1066e-01, 1.7298e+00, -1.6783e-01, -4.0936e-01,
  36486. -3.1518e-01, 1.2596e-01, 2.7520e-01],
  36487. [ 7.2211e-01, -3.1429e-01, 1.2671e+00, -1.0859e+00, -4.3973e-01,
  36488. -1.0486e+00, 2.4254e-01, 2.3212e-01],
  36489. [ 4.2025e-01, -4.8194e-01, 1.6345e+00, -3.9314e-01, -5.3136e-01,
  36490. -8.7824e-01, 4.3722e-01, 4.3657e-01],
  36491. [ 5.2567e-01, -4.8861e-01, 1.7370e+00, -2.4383e-02, -3.7794e-01,
  36492. 1.3738e-02, 3.3758e-01, 1.4508e-01],
  36493. [ 6.6609e-01, -3.9081e-01, 1.7458e+00, 3.7987e-04, -4.4658e-01,
  36494. 1.1860e-01, 6.7305e-01, 1.6379e-01]], device='cuda:0',
  36495. grad_fn=<AddmmBackward>)
  36496. landmarks are: tensor([[[ 0.6220, -0.4436, 1.8711, -0.3691, -0.6173, -0.4999, 0.6702,
  36497. 0.0697],
  36498. [ 0.5647, -0.4129, 1.4901, -1.0619, -0.6462, -0.5846, 0.3873,
  36499. 0.2776],
  36500. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  36501. 0.2837],
  36502. [ 0.5441, -0.3997, 1.7326, -0.2228, -0.4441, -0.2921, 0.0296,
  36503. 0.2409],
  36504. [ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  36505. 0.3237],
  36506. [ 0.5894, -0.3503, 1.6402, -0.3614, -0.5827, -0.7925, 0.3238,
  36507. 0.3238],
  36508. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  36509. 0.2035],
  36510. [ 0.5466, -0.4706, 1.7198, -0.0903, -0.5712, 0.1261, 0.4733,
  36511. 0.0688]]], device='cuda:0')
  36512. loss_train_step before backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  36513. loss_train_step after backward: tensor(0.0073, device='cuda:0', grad_fn=<MseLossBackward>)
  36514. loss_train: 0.8129367139190435
  36515. step: 51
  36516. running loss: 0.01593993556704007
  36517.  
  36518. Train Steps: 51/90 Loss: 0.0159 torch.Size([8, 600, 800])
  36519. torch.Size([8, 8])
  36520. tensor([[0.6278, 0.4253, 0.8875, 0.5017, 0.4113, 0.2750, 0.5413, 0.6196],
  36521. [0.6219, 0.4114, 0.8175, 0.2817, 0.3925, 0.2783, 0.5900, 0.5350],
  36522. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  36523. [ nan, nan, 0.9050, 0.3500, 0.5138, 0.2300, 0.7359, 0.5702],
  36524. [0.6219, 0.4097, 0.8738, 0.3400, 0.3563, 0.4117, 0.5975, 0.5683],
  36525. [0.6222, 0.3937, 0.8350, 0.5617, 0.4138, 0.4600, 0.5800, 0.5233],
  36526. [0.6086, 0.3998, 0.8788, 0.4450, 0.4025, 0.4650, 0.5306, 0.5103],
  36527. [0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150]],
  36528. device='cuda:0', dtype=torch.float64)
  36529. predictions are: tensor([[ 0.6138, -0.3162, 1.6757, -0.0385, -0.3359, -1.0177, 0.2893, 0.4970],
  36530. [ 0.3506, -0.4950, 1.3670, -1.0617, -0.4420, -0.9203, 0.3976, 0.2195],
  36531. [ 0.6430, -0.3678, 1.8338, -0.3944, -0.5642, -0.1219, 0.7280, 0.2425],
  36532. [-2.2223, -2.2294, 1.5857, -0.9523, 0.0569, -1.1593, 0.6875, 0.2897],
  36533. [ 0.6182, -0.3403, 1.7174, -0.7481, -0.6678, -0.3971, 0.4993, 0.2399],
  36534. [ 0.5614, -0.4385, 1.5351, 0.2646, -0.4268, -0.1418, 0.4188, 0.1910],
  36535. [ 0.5111, -0.4241, 1.6742, -0.2531, -0.4758, -0.0282, 0.2072, 0.1283],
  36536. [ 0.6298, -0.3722, 1.3168, -1.1760, -0.2614, -1.3129, 0.4119, 0.1058]],
  36537. device='cuda:0', grad_fn=<AddmmBackward>)
  36538. landmarks are: tensor([[[ 0.6139, -0.3216, 1.8134, 0.0313, -0.3864, -1.0157, 0.2144,
  36539. 0.5762],
  36540. [ 0.5868, -0.3858, 1.4901, -0.9849, -0.4730, -1.0003, 0.4393,
  36541. 0.1852],
  36542. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  36543. 0.0985],
  36544. [-2.2859, -2.2859, 1.8942, -0.6693, 0.0871, -1.2236, 1.1130,
  36545. 0.3478],
  36546. [ 0.5867, -0.3937, 1.7499, -0.7155, -0.6404, -0.3844, 0.4739,
  36547. 0.3392],
  36548. [ 0.5880, -0.4676, 1.5709, 0.3084, -0.3748, -0.1612, 0.3931,
  36549. 0.1313],
  36550. [ 0.5253, -0.4392, 1.7730, -0.2305, -0.4268, -0.1381, 0.1651,
  36551. 0.0712],
  36552. [ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  36553. 0.0928]]], device='cuda:0')
  36554. loss_train_step before backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  36555. loss_train_step after backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  36556. loss_train: 0.8228131141513586
  36557. step: 52
  36558. running loss: 0.015823329118295357
  36559. Train Steps: 52/90 Loss: 0.0158 torch.Size([8, 600, 800])
  36560. torch.Size([8, 8])
  36561. tensor([[0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  36562. [0.6164, 0.4119, 0.7913, 0.2650, 0.3538, 0.3500, 0.5614, 0.5038],
  36563. [0.6082, 0.4024, 0.8738, 0.4017, 0.3688, 0.3950, 0.5306, 0.5136],
  36564. [ nan, nan, 0.7612, 0.3250, 0.4037, 0.2533, 0.5438, 0.5767],
  36565. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  36566. [0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090],
  36567. [0.6145, 0.3983, 0.8700, 0.5017, 0.4400, 0.4800, 0.5375, 0.5750],
  36568. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  36569. device='cuda:0', dtype=torch.float64)
  36570. predictions are: tensor([[ 0.6219, -0.3752, 1.6652, 0.2994, -0.1866, 0.0215, 0.3743, 0.2948],
  36571. [ 0.7644, -0.2511, 1.4535, -1.0984, -0.6169, -0.6842, 0.4383, 0.1393],
  36572. [ 0.5370, -0.4199, 1.7934, -0.4256, -0.5711, -0.4423, 0.2916, 0.1527],
  36573. [-1.5907, -1.8032, 1.1504, -1.0188, -0.3355, -1.0750, 0.1658, 0.3443],
  36574. [ 0.7614, -0.2678, 1.8735, -0.4168, -0.5463, -0.5598, 0.2533, 0.0554],
  36575. [ 0.7204, -0.3163, 1.9029, -0.5729, -0.3919, -1.0855, 0.6899, 0.2262],
  36576. [ 0.5421, -0.4263, 1.7555, -0.0450, -0.2282, -0.0415, 0.2501, 0.3798],
  36577. [ 0.6803, -0.3359, 1.5785, 0.1547, -0.4745, -0.0506, 0.9300, 0.3099]],
  36578. device='cuda:0', grad_fn=<AddmmBackward>)
  36579. landmarks are: tensor([[[ 0.5911, -0.4080, 1.6460, 0.3546, -0.2074, 0.0467, 0.4970,
  36580. 0.1852],
  36581. [ 0.5614, -0.3834, 1.3688, -1.0619, -0.6520, -0.6693, 0.3069,
  36582. 0.0412],
  36583. [ 0.5235, -0.4273, 1.7499, -0.4306, -0.5827, -0.4614, 0.1651,
  36584. 0.0862],
  36585. [-2.2859, -2.2859, 1.2303, -0.7848, -0.4210, -1.1158, 0.2256,
  36586. 0.3777],
  36587. [ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  36588. -0.0310],
  36589. [ 0.6165, -0.4249, 1.7961, -0.5384, -0.4499, -0.9695, 0.6401,
  36590. 0.0652],
  36591. [ 0.5525, -0.4463, 1.7326, 0.0313, -0.2536, -0.0688, 0.1968,
  36592. 0.3700],
  36593. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  36594. 0.1768]]], device='cuda:0')
  36595. loss_train_step before backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  36596. loss_train_step after backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  36597. loss_train: 0.8421134296804667
  36598. step: 53
  36599. running loss: 0.015888932635480503
  36600. Train Steps: 53/90 Loss: 0.0159 torch.Size([8, 600, 800])
  36601. torch.Size([8, 8])
  36602. tensor([[0.6115, 0.4081, 0.6725, 0.2433, 0.4088, 0.1933, 0.5167, 0.5544],
  36603. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617],
  36604. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767],
  36605. [0.6106, 0.4022, 0.7125, 0.2650, 0.3713, 0.2700, 0.5431, 0.5123],
  36606. [0.6150, 0.3935, 0.8696, 0.5158, 0.4647, 0.5329, 0.6041, 0.5153],
  36607. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  36608. [0.6222, 0.4169, 0.8638, 0.5650, 0.4313, 0.4783, 0.5637, 0.5633],
  36609. [0.6277, 0.4103, 0.8087, 0.5717, 0.4188, 0.4750, 0.5663, 0.6083]],
  36610. device='cuda:0', dtype=torch.float64)
  36611. predictions are: tensor([[ 0.6673, -0.3268, 1.1403, -1.1721, -0.3743, -1.4599, 0.3026, 0.2220],
  36612. [ 0.6780, -0.3399, 2.0108, -0.0608, -0.5956, -0.1336, 0.5727, 0.2934],
  36613. [ 0.3732, -0.5323, 1.4563, -1.1377, -0.4467, -0.9829, 0.7052, 0.2905],
  36614. [ 0.6293, -0.3675, 1.2879, -1.0773, -0.5225, -1.0735, 0.2881, 0.0723],
  36615. [ 0.4728, -0.4933, 1.8535, 0.0456, -0.1775, 0.2102, 0.4344, 0.1276],
  36616. [-2.0240, -2.1459, 0.9359, -1.3552, -0.3156, -1.4738, 0.2332, 0.2545],
  36617. [ 0.6209, -0.3482, 1.8802, 0.2570, -0.3235, -0.0597, 0.2850, 0.2831],
  36618. [ 0.6233, -0.3547, 1.7081, 0.2817, -0.3935, -0.0655, 0.3343, 0.4167]],
  36619. device='cuda:0', grad_fn=<AddmmBackward>)
  36620. landmarks are: tensor([[[ 0.5385, -0.4010, 0.8203, -1.1620, -0.3979, -1.3929, 0.1005,
  36621. 0.2747],
  36622. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  36623. 0.3084],
  36624. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  36625. 0.3777],
  36626. [ 0.5342, -0.4280, 1.0051, -1.0619, -0.5711, -1.0388, 0.2226,
  36627. 0.0802],
  36628. [ 0.5548, -0.4682, 1.7309, 0.0966, -0.1394, 0.1757, 0.5045,
  36629. 0.0942],
  36630. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  36631. 0.3469],
  36632. [ 0.5880, -0.3605, 1.7037, 0.3238, -0.2940, -0.0765, 0.3180,
  36633. 0.3161],
  36634. [ 0.6134, -0.3910, 1.4497, 0.3546, -0.3517, -0.0919, 0.3296,
  36635. 0.5239]]], device='cuda:0')
  36636. loss_train_step before backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  36637. loss_train_step after backward: tensor(0.0127, device='cuda:0', grad_fn=<MseLossBackward>)
  36638. loss_train: 0.8548482032492757
  36639. step: 54
  36640. running loss: 0.015830522282393993
  36641. Train Steps: 54/90 Loss: 0.0158 torch.Size([8, 600, 800])
  36642. torch.Size([8, 8])
  36643. tensor([[0.6200, 0.3993, 0.8519, 0.4923, 0.3962, 0.4717, 0.6013, 0.5433],
  36644. [0.6274, 0.4270, 0.8938, 0.4967, 0.3550, 0.4283, 0.5700, 0.5733],
  36645. [ nan, nan, 0.6688, 0.2513, 0.4113, 0.2117, 0.5193, 0.5933],
  36646. [ nan, nan, 0.7725, 0.2611, 0.3675, 0.2733, 0.5413, 0.5167],
  36647. [0.6182, 0.3972, 0.8720, 0.5527, 0.3638, 0.3582, 0.5696, 0.5395],
  36648. [0.6140, 0.4034, 0.8850, 0.4317, 0.4288, 0.5067, 0.5825, 0.5533],
  36649. [0.6097, 0.3988, 0.8650, 0.5250, 0.4213, 0.5200, 0.5675, 0.5050],
  36650. [0.6126, 0.4067, 0.8638, 0.5383, 0.4188, 0.4850, 0.5016, 0.5392]],
  36651. device='cuda:0', dtype=torch.float64)
  36652. predictions are: tensor([[ 0.7359, -0.2978, 1.7785, -0.0222, -0.3996, -0.1070, 0.5864, 0.2958],
  36653. [ 0.7449, -0.2164, 1.9379, -0.0315, -0.5511, -0.3084, 0.5034, 0.3601],
  36654. [-1.3691, -1.6667, 0.8612, -1.2613, -0.3751, -1.3698, 0.2615, 0.4043],
  36655. [-1.9919, -2.1095, 1.2635, -1.0819, -0.4544, -1.0682, 0.2091, 0.1249],
  36656. [ 0.7430, -0.2650, 1.8531, 0.1796, -0.5756, -0.6459, 0.5336, 0.1851],
  36657. [ 0.8209, -0.2462, 1.8957, -0.2638, -0.2654, 0.1714, 0.5637, 0.2248],
  36658. [ 0.7045, -0.3207, 1.8143, 0.1388, -0.2615, 0.2025, 0.2661, 0.0781],
  36659. [ 0.8117, -0.2041, 1.7769, 0.2153, -0.3169, 0.0384, 0.1559, 0.1889]],
  36660. device='cuda:0', grad_fn=<AddmmBackward>)
  36661. landmarks are: tensor([[[ 0.5777, -0.4415, 1.6491, -0.0122, -0.4557, -0.1073, 0.4912,
  36662. 0.2237],
  36663. [ 0.6121, -0.3138, 1.8423, 0.0082, -0.6462, -0.3075, 0.3469,
  36664. 0.3623],
  36665. [-2.2859, -2.2859, 0.8033, -1.1250, -0.3864, -1.3082, 0.1126,
  36666. 0.4543],
  36667. [-2.2859, -2.2859, 1.2820, -1.0801, -0.5885, -1.0234, 0.2141,
  36668. 0.1005],
  36669. [ 0.5697, -0.4514, 1.7420, 0.2672, -0.6055, -0.6312, 0.3449,
  36670. 0.2058],
  36671. [ 0.5499, -0.4225, 1.8018, -0.2921, -0.3055, 0.0543, 0.4046,
  36672. 0.2699],
  36673. [ 0.5303, -0.4440, 1.7095, 0.1390, -0.3402, 0.1159, 0.3353,
  36674. 0.0467],
  36675. [ 0.5436, -0.4076, 1.7037, 0.2006, -0.3517, -0.0457, 0.0311,
  36676. 0.2048]]], device='cuda:0')
  36677. loss_train_step before backward: tensor(0.0322, device='cuda:0', grad_fn=<MseLossBackward>)
  36678. loss_train_step after backward: tensor(0.0322, device='cuda:0', grad_fn=<MseLossBackward>)
  36679. loss_train: 0.8870698222890496
  36680. step: 55
  36681. running loss: 0.016128542223437264
  36682.  
  36683. Train Steps: 55/90 Loss: 0.0161 torch.Size([8, 600, 800])
  36684. torch.Size([8, 8])
  36685. tensor([[0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183],
  36686. [0.6279, 0.4050, 0.8025, 0.2200, 0.4313, 0.2733, 0.6820, 0.5320],
  36687. [0.6142, 0.3982, 0.8650, 0.4883, 0.3912, 0.4317, 0.5315, 0.5350],
  36688. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  36689. [0.6205, 0.4081, 0.8950, 0.4017, 0.3788, 0.4700, 0.5963, 0.5667],
  36690. [0.6201, 0.4064, 0.8688, 0.5050, 0.4225, 0.5100, 0.6138, 0.5500],
  36691. [ nan, nan, 0.7850, 0.2700, 0.4288, 0.1717, 0.5199, 0.4999],
  36692. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552]],
  36693. device='cuda:0', dtype=torch.float64)
  36694. predictions are: tensor([[ 0.6181, -0.3578, 1.4846, -0.8818, -0.5126, -1.1168, 0.2677, 0.1355],
  36695. [ 0.7924, -0.2418, 1.4436, -1.0710, -0.3385, -1.0589, 0.8068, 0.2151],
  36696. [ 0.7669, -0.2631, 1.7523, 0.1436, -0.4913, -0.1816, 0.1077, 0.1780],
  36697. [ 0.7052, -0.3087, 1.6060, 0.0755, -0.2882, 0.1245, 0.3166, 0.2797],
  36698. [ 0.8958, -0.1547, 1.7925, -0.2482, -0.5676, -0.0407, 0.4489, 0.3177],
  36699. [ 0.8621, -0.2202, 1.7208, 0.1235, -0.3645, 0.0783, 0.3573, 0.2843],
  36700. [-1.8809, -1.9708, 1.1639, -1.0491, -0.3869, -1.3121, 0.1169, 0.1347],
  36701. [-2.1162, -2.1510, 1.5890, -1.0452, 0.0364, -1.0503, 0.8505, 0.3124]],
  36702. device='cuda:0', grad_fn=<AddmmBackward>)
  36703. landmarks are: tensor([[[ 5.7985e-01, -4.1555e-01, 1.3977e+00, -1.0388e+00, -4.6721e-01,
  36704. -1.1004e+00, 3.4688e-01, 1.0824e-01],
  36705. [ 6.1413e-01, -4.1527e-01, 1.4208e+00, -1.2697e+00, -2.9400e-01,
  36706. -1.0234e+00, 8.6439e-01, 1.7146e-01],
  36707. [ 5.5127e-01, -4.4673e-01, 1.7095e+00, -3.0331e-02, -4.7875e-01,
  36708. -2.9207e-01, 1.6917e-01, 1.8544e-01],
  36709. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  36710. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  36711. [ 5.7991e-01, -4.0115e-01, 1.8480e+00, -4.3064e-01, -5.3649e-01,
  36712. -1.1501e-01, 4.6813e-01, 3.3149e-01],
  36713. [ 5.7841e-01, -4.0878e-01, 1.7268e+00, 4.6651e-02, -3.3441e-01,
  36714. 6.9746e-02, 5.4896e-01, 2.5450e-01],
  36715. [-2.2859e+00, -2.2859e+00, 1.3400e+00, -1.0388e+00, -3.0554e-01,
  36716. -1.4930e+00, 1.1570e-01, 2.3124e-02],
  36717. [-2.2859e+00, -2.2859e+00, 1.7557e+00, -1.1466e+00, 8.7067e-02,
  36718. -1.0773e+00, 1.1239e+00, 2.7833e-01]]], device='cuda:0')
  36719. loss_train_step before backward: tensor(0.0196, device='cuda:0', grad_fn=<MseLossBackward>)
  36720. loss_train_step after backward: tensor(0.0196, device='cuda:0', grad_fn=<MseLossBackward>)
  36721. loss_train: 0.9066562773659825
  36722. step: 56
  36723. running loss: 0.01619029066724969
  36724. Train Steps: 56/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36725. torch.Size([8, 8])
  36726. tensor([[0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  36727. [0.6214, 0.4040, 0.8838, 0.3500, 0.3600, 0.5183, 0.6362, 0.5200],
  36728. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483],
  36729. [0.6239, 0.4107, 0.8162, 0.2763, 0.3625, 0.3600, 0.5988, 0.5700],
  36730. [0.6102, 0.4005, 0.8688, 0.5100, 0.4813, 0.5400, 0.5404, 0.5064],
  36731. [0.6160, 0.4086, 0.8775, 0.3983, 0.3750, 0.3783, 0.5128, 0.4882],
  36732. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  36733. [0.6204, 0.4049, 0.7975, 0.2700, 0.3937, 0.2567, 0.5700, 0.5183]],
  36734. device='cuda:0', dtype=torch.float64)
  36735. predictions are: tensor([[ 0.6829, -0.3401, 1.7066, 0.2011, -0.3595, 0.1086, 0.9120, 0.4105],
  36736. [ 0.8049, -0.2839, 1.7544, -0.5074, -0.5299, 0.0459, 0.5987, 0.2734],
  36737. [ 0.5709, -0.4311, 1.8545, -0.0998, -0.4727, -0.0623, 0.4352, 0.2658],
  36738. [ 0.4772, -0.4543, 1.5151, -0.7104, -0.5211, -0.7383, 0.4856, 0.3452],
  36739. [ 0.5559, -0.4322, 1.7555, 0.1990, -0.0483, 0.0407, 0.1077, 0.1094],
  36740. [ 0.5763, -0.4048, 1.8463, -0.2421, -0.5570, -0.6607, 0.1426, 0.0537],
  36741. [ 0.6002, -0.3517, 1.1491, -0.9855, -0.5656, -0.8767, 0.4835, 0.3959],
  36742. [ 0.1484, -0.6880, 1.5266, -0.8485, -0.4765, -1.2423, 0.2979, 0.1321]],
  36743. device='cuda:0', grad_fn=<AddmmBackward>)
  36744. landmarks are: tensor([[[ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  36745. 0.2249],
  36746. [ 0.5841, -0.4199, 1.7961, -0.6693, -0.6231, 0.1082, 0.6529,
  36747. 0.1159],
  36748. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  36749. 0.2468],
  36750. [ 0.5960, -0.3888, 1.4840, -1.0095, -0.6115, -0.6231, 0.4797,
  36751. 0.3469],
  36752. [ 0.5328, -0.4361, 1.7268, 0.0697, -0.0630, 0.2083, 0.2103,
  36753. 0.0532],
  36754. [ 0.5595, -0.3988, 1.7672, -0.4460, -0.5538, -0.5384, 0.0828,
  36755. -0.0310],
  36756. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  36757. 0.3007],
  36758. [ 0.5798, -0.4156, 1.3977, -1.0388, -0.4672, -1.1004, 0.3469,
  36759. 0.1082]]], device='cuda:0')
  36760. loss_train_step before backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  36761. loss_train_step after backward: tensor(0.0156, device='cuda:0', grad_fn=<MseLossBackward>)
  36762. loss_train: 0.9222497092559934
  36763. step: 57
  36764. running loss: 0.01617981946063146
  36765. Train Steps: 57/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36766. torch.Size([8, 8])
  36767. tensor([[0.6204, 0.4013, 0.8075, 0.2400, 0.4313, 0.2050, 0.5800, 0.5150],
  36768. [0.6263, 0.4039, 0.9000, 0.4400, 0.3625, 0.4667, 0.6424, 0.4804],
  36769. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  36770. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  36771. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778],
  36772. [0.6197, 0.4051, 0.7812, 0.2650, 0.3513, 0.4050, 0.6112, 0.5500],
  36773. [0.6216, 0.4099, 0.7225, 0.2033, 0.4188, 0.2217, 0.5975, 0.5283],
  36774. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433]],
  36775. device='cuda:0', dtype=torch.float64)
  36776. predictions are: tensor([[ 0.4680, -0.5072, 1.4882, -0.9610, -0.2499, -1.2891, 0.5355, 0.2191],
  36777. [ 0.7412, -0.3457, 1.8500, -0.2045, -0.5993, -0.0566, 0.4874, 0.0658],
  36778. [ 0.4956, -0.4700, 1.5806, 0.3873, -0.1192, -0.0546, 0.2357, 0.3602],
  36779. [-0.0531, -0.8100, 1.7826, -0.8371, -0.3113, -1.0016, 0.6913, 0.2936],
  36780. [ 0.5888, -0.4092, 1.1607, -1.1879, -0.4697, -1.2295, 0.2869, 0.0801],
  36781. [ 0.7139, -0.3403, 1.3548, -0.9276, -0.6617, -0.3502, 0.5011, 0.3473],
  36782. [ 0.2308, -0.6215, 1.1084, -1.1688, -0.3470, -1.2640, 0.4619, 0.3078],
  36783. [ 0.5495, -0.4039, 1.7657, -0.5195, -0.6240, -0.7107, 0.2321, 0.2657]],
  36784. device='cuda:0', grad_fn=<AddmmBackward>)
  36785. landmarks are: tensor([[[ 0.5796, -0.4326, 1.4439, -1.1774, -0.2940, -1.3390, 0.3931,
  36786. 0.0928],
  36787. [ 0.6072, -0.4206, 1.8711, -0.2536, -0.6115, -0.1304, 0.6812,
  36788. -0.0670],
  36789. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  36790. 0.2997],
  36791. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  36792. 0.1467],
  36793. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  36794. -0.0791],
  36795. [ 0.5763, -0.4147, 1.3226, -1.0619, -0.6635, -0.4152, 0.5374,
  36796. 0.2545],
  36797. [ 0.5850, -0.3925, 1.0513, -1.3467, -0.3517, -1.2620, 0.4739,
  36798. 0.1544],
  36799. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  36800. 0.2237]]], device='cuda:0')
  36801. loss_train_step before backward: tensor(0.0198, device='cuda:0', grad_fn=<MseLossBackward>)
  36802. loss_train_step after backward: tensor(0.0198, device='cuda:0', grad_fn=<MseLossBackward>)
  36803. loss_train: 0.9420179659500718
  36804. step: 58
  36805. running loss: 0.016241689068104685
  36806. Train Steps: 58/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36807. torch.Size([8, 8])
  36808. tensor([[0.6193, 0.3930, 0.8949, 0.4437, 0.3852, 0.5435, 0.6263, 0.5263],
  36809. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  36810. [0.6126, 0.4039, 0.8237, 0.3967, 0.3625, 0.3600, 0.5894, 0.6138],
  36811. [ nan, nan, 0.6412, 0.1900, 0.4238, 0.1883, 0.5487, 0.5700],
  36812. [0.6199, 0.3952, 0.8573, 0.5374, 0.4075, 0.4687, 0.5942, 0.5377],
  36813. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  36814. [0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  36815. [0.6204, 0.4091, 0.8950, 0.4783, 0.3613, 0.4617, 0.6063, 0.5617]],
  36816. device='cuda:0', dtype=torch.float64)
  36817. predictions are: tensor([[ 0.5118, -0.4744, 1.7803, -0.3263, -0.4744, 0.1388, 0.4503, 0.0420],
  36818. [ 0.4170, -0.4748, 1.6589, 0.1730, -0.5230, -0.5177, 0.1883, 0.3262],
  36819. [ 0.4429, -0.4836, 1.5923, -0.5252, -0.5800, -0.5985, 0.3619, 0.4124],
  36820. [-2.6916, -2.5599, 0.9813, -1.2277, -0.3173, -1.4307, 0.2689, 0.2390],
  36821. [ 0.5146, -0.5080, 1.7030, 0.0749, -0.3763, -0.1399, 0.4489, 0.0463],
  36822. [ 0.4605, -0.4835, 1.7907, -0.1342, -0.1387, 0.3505, 0.4464, 0.1572],
  36823. [ 0.4982, -0.4772, 0.9685, -1.1748, -0.4223, -1.1938, 0.3804, 0.2206],
  36824. [ 0.5921, -0.4157, 1.8043, -0.1693, -0.5291, -0.1697, 0.5353, 0.2092]],
  36825. device='cuda:0', grad_fn=<AddmmBackward>)
  36826. landmarks are: tensor([[[ 0.5746, -0.4706, 1.8476, -0.2365, -0.5068, 0.2245, 0.6069,
  36827. 0.1449],
  36828. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  36829. 0.4778],
  36830. [ 0.5438, -0.4206, 1.5189, -0.4537, -0.6115, -0.6231, 0.4365,
  36831. 0.5491],
  36832. [-2.2859, -2.2859, 0.6760, -1.4083, -0.3286, -1.4160, 0.2487,
  36833. 0.3469],
  36834. [ 0.5775, -0.4607, 1.6741, 0.1962, -0.4036, -0.1212, 0.4588,
  36835. 0.1979],
  36836. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  36837. 0.2083],
  36838. [ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  36839. 0.3852],
  36840. [ 0.5797, -0.3965, 1.8480, -0.0765, -0.6173, -0.1535, 0.5143,
  36841. 0.3084]]], device='cuda:0')
  36842. loss_train_step before backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  36843. loss_train_step after backward: tensor(0.0128, device='cuda:0', grad_fn=<MseLossBackward>)
  36844. loss_train: 0.95481295324862
  36845. step: 59
  36846. running loss: 0.016183270394044408
  36847.  
  36848. Train Steps: 59/90 Loss: 0.0162 torch.Size([8, 600, 800])
  36849. torch.Size([8, 8])
  36850. tensor([[0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  36851. [0.6222, 0.4172, 0.8850, 0.5217, 0.3738, 0.4600, 0.5700, 0.5633],
  36852. [0.6266, 0.4070, 0.8712, 0.5600, 0.3713, 0.4783, 0.5775, 0.6100],
  36853. [0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  36854. [0.6307, 0.4060, 0.8950, 0.5183, 0.3750, 0.3850, 0.6338, 0.4938],
  36855. [0.6084, 0.3981, 0.8588, 0.5233, 0.4600, 0.5367, 0.5680, 0.5006],
  36856. [0.6178, 0.4059, 0.7525, 0.2250, 0.4313, 0.1783, 0.5404, 0.5240],
  36857. [0.6134, 0.4090, 0.6926, 0.2819, 0.3538, 0.3233, 0.5563, 0.5667]],
  36858. device='cuda:0', dtype=torch.float64)
  36859. predictions are: tensor([[ 0.6028, -0.3939, 1.3621, -0.7628, -0.6650, -0.5480, 0.2328, 0.2807],
  36860. [ 0.6330, -0.3729, 1.8560, -0.0090, -0.5082, -0.1894, 0.3534, 0.3002],
  36861. [ 0.6191, -0.4331, 1.6896, 0.1688, -0.5121, -0.0415, 0.5741, 0.4011],
  36862. [ 0.1725, -0.7107, 1.6695, 0.1222, -0.4347, 0.0672, 0.2956, 0.1270],
  36863. [ 0.5586, -0.4837, 1.9110, -0.0396, -0.5220, -0.5785, 0.6986, -0.0429],
  36864. [ 0.4333, -0.5479, 1.6927, 0.0067, -0.1288, 0.1918, 0.2718, 0.0897],
  36865. [ 0.2199, -0.6341, 1.2996, -1.2787, -0.2926, -1.4296, 0.4385, 0.1184],
  36866. [ 0.6418, -0.3789, 1.0555, -1.0573, -0.6544, -0.7649, 0.3476, 0.3257]],
  36867. device='cuda:0', grad_fn=<AddmmBackward>)
  36868. landmarks are: tensor([[[ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  36869. 0.3417],
  36870. [ 0.5879, -0.3591, 1.8018, 0.1236, -0.5596, -0.1612, 0.3469,
  36871. 0.3161],
  36872. [ 0.6081, -0.4059, 1.7383, 0.3007, -0.5711, -0.0765, 0.3815,
  36873. 0.5316],
  36874. [ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  36875. -0.1061],
  36876. [ 0.6273, -0.4105, 1.8480, 0.1082, -0.5538, -0.5076, 0.6414,
  36877. -0.0049],
  36878. [ 0.5241, -0.4470, 1.6806, 0.1313, -0.1612, 0.1929, 0.3378,
  36879. 0.0261],
  36880. [ 0.5676, -0.4112, 1.1898, -1.2467, -0.2940, -1.4622, 0.2103,
  36881. 0.1343],
  36882. [ 0.5473, -0.3966, 0.9131, -0.9838, -0.6520, -0.7925, 0.2834,
  36883. 0.3315]]], device='cuda:0')
  36884. loss_train_step before backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  36885. loss_train_step after backward: tensor(0.0120, device='cuda:0', grad_fn=<MseLossBackward>)
  36886. loss_train: 0.9668285604566336
  36887. step: 60
  36888. running loss: 0.016113809340943894
  36889. Train Steps: 60/90 Loss: 0.0161 torch.Size([8, 600, 800])
  36890. torch.Size([8, 8])
  36891. tensor([[0.6189, 0.3961, 0.7589, 0.2256, 0.3759, 0.3280, 0.6184, 0.5334],
  36892. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  36893. [0.6364, 0.4092, 0.8525, 0.5633, 0.3875, 0.4950, 0.6599, 0.5285],
  36894. [0.6212, 0.4159, 0.8675, 0.5783, 0.4088, 0.4317, 0.5613, 0.5917],
  36895. [0.6122, 0.3993, 0.8738, 0.4667, 0.4517, 0.4879, 0.5155, 0.4927],
  36896. [0.6275, 0.4003, 0.9100, 0.3783, 0.4388, 0.3133, 0.7058, 0.5343],
  36897. [0.6124, 0.4083, 0.6954, 0.3069, 0.3650, 0.2750, 0.5163, 0.5485],
  36898. [0.6307, 0.3998, 0.8500, 0.5233, 0.3850, 0.5050, 0.7446, 0.5320]],
  36899. device='cuda:0', dtype=torch.float64)
  36900. predictions are: tensor([[ 0.5016, -0.4703, 1.2278, -1.2672, -0.5932, -0.8244, 0.4420, 0.1547],
  36901. [ 0.2497, -0.6129, 1.6548, -0.4681, -0.5996, -0.8265, -0.0047, 0.1981],
  36902. [ 0.5524, -0.4908, 1.6442, 0.1523, -0.4874, 0.0100, 0.6921, 0.1528],
  36903. [ 0.4261, -0.4861, 1.6044, 0.1678, -0.3794, -0.2528, 0.2993, 0.4646],
  36904. [ 0.5280, -0.4921, 1.7713, -0.2128, -0.2425, 0.0598, 0.1536, 0.0179],
  36905. [ 0.4659, -0.5584, 1.8527, -0.6520, -0.3224, -0.8461, 0.8426, 0.0868],
  36906. [ 0.4742, -0.4619, 0.9765, -0.9842, -0.6332, -0.9425, 0.0351, 0.2549],
  36907. [ 0.5845, -0.4672, 1.6357, 0.0128, -0.4951, 0.0762, 0.8753, 0.1771]],
  36908. device='cuda:0', grad_fn=<AddmmBackward>)
  36909. landmarks are: tensor([[[ 5.7296e-01, -4.5619e-01, 1.2195e+00, -1.2440e+00, -5.4966e-01,
  36910. -7.7109e-01, 5.7045e-01, 1.7788e-01],
  36911. [ 5.4700e-01, -3.9515e-01, 1.6377e+00, -4.2531e-01, -6.2887e-01,
  36912. -8.0785e-01, 2.4925e-02, 2.1157e-01],
  36913. [ 6.5365e-01, -3.9601e-01, 1.6517e+00, 3.1609e-01, -4.9607e-01,
  36914. 4.6189e-04, 7.6203e-01, 1.5543e-01],
  36915. [ 5.8360e-01, -3.6490e-01, 1.7210e+00, 3.8537e-01, -3.9792e-01,
  36916. -2.9207e-01, 3.0647e-01, 4.4696e-01],
  36917. [ 5.4166e-01, -4.4175e-01, 1.7499e+00, -1.3041e-01, -1.9942e-01,
  36918. -3.2367e-02, 9.5140e-02, -9.9401e-03],
  36919. [ 6.1248e-01, -4.3693e-01, 1.9173e+00, -5.3841e-01, -2.5935e-01,
  36920. -8.3865e-01, 9.7406e-01, 1.8214e-01],
  36921. [ 5.4249e-01, -3.9977e-01, 9.2628e-01, -8.6826e-01, -6.0000e-01,
  36922. -1.0157e+00, 9.8951e-02, 2.4764e-01],
  36923. [ 6.2730e-01, -4.3934e-01, 1.6402e+00, 1.3133e-01, -5.0762e-01,
  36924. 4.6651e-02, 1.1532e+00, 1.7146e-01]]], device='cuda:0')
  36925. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  36926. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  36927. loss_train: 0.9755781814455986
  36928. step: 61
  36929. running loss: 0.015993084941731125
  36930. Train Steps: 61/90 Loss: 0.0160 torch.Size([8, 600, 800])
  36931. torch.Size([8, 8])
  36932. tensor([[0.6079, 0.3964, 0.7420, 0.2958, 0.3563, 0.2917, 0.5351, 0.4980],
  36933. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  36934. [0.6192, 0.4128, 0.8513, 0.5617, 0.4200, 0.5267, 0.5850, 0.5633],
  36935. [0.6182, 0.3972, 0.8552, 0.5914, 0.3683, 0.4181, 0.5688, 0.5378],
  36936. [0.6111, 0.4019, 0.8350, 0.3867, 0.3500, 0.4283, 0.5480, 0.5719],
  36937. [0.6219, 0.4089, 0.8938, 0.4800, 0.3825, 0.4450, 0.5850, 0.5200],
  36938. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  36939. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875]],
  36940. device='cuda:0', dtype=torch.float64)
  36941. predictions are: tensor([[ 0.4429, -0.5028, 1.0489, -1.0283, -0.5719, -0.9001, 0.1954, 0.0527],
  36942. [-2.7236, -2.5519, 1.5574, -1.1088, 0.1584, -1.0457, 1.0681, 0.3034],
  36943. [ 0.5035, -0.4616, 1.5655, 0.1601, -0.3356, 0.1247, 0.5148, 0.2402],
  36944. [ 0.3959, -0.5453, 1.4629, 0.1522, -0.5350, -0.4185, 0.3992, 0.2318],
  36945. [ 0.3227, -0.5639, 1.4088, -0.5852, -0.6078, -0.3931, 0.1804, 0.2821],
  36946. [ 0.5485, -0.4297, 1.6632, -0.2612, -0.4895, -0.2028, 0.5109, 0.1559],
  36947. [ 0.5043, -0.4713, 1.2385, -0.8179, -0.6154, -0.6846, 0.3148, 0.1545],
  36948. [ 0.5604, -0.4319, 1.6134, -0.8001, -0.5624, -0.7814, 0.1643, 0.0606]],
  36949. device='cuda:0', grad_fn=<AddmmBackward>)
  36950. landmarks are: tensor([[[ 0.5219, -0.4550, 1.1415, -0.9196, -0.6404, -0.9387, 0.1856,
  36951. 0.0141],
  36952. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  36953. 0.3371],
  36954. [ 0.5742, -0.3792, 1.6460, 0.3084, -0.3460, 0.1467, 0.4162,
  36955. 0.3161],
  36956. [ 0.5697, -0.4514, 1.6642, 0.4459, -0.5850, -0.3546, 0.3414,
  36957. 0.1982],
  36958. [ 0.5367, -0.4294, 1.5709, -0.4999, -0.6693, -0.3075, 0.2455,
  36959. 0.3559],
  36960. [ 0.5865, -0.3973, 1.8423, -0.0688, -0.5192, -0.2305, 0.4162,
  36961. 0.1159],
  36962. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  36963. 0.0942],
  36964. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  36965. -0.0340]]], device='cuda:0')
  36966. loss_train_step before backward: tensor(0.0143, device='cuda:0', grad_fn=<MseLossBackward>)
  36967. loss_train_step after backward: tensor(0.0143, device='cuda:0', grad_fn=<MseLossBackward>)
  36968. loss_train: 0.989847207441926
  36969. step: 62
  36970. running loss: 0.015965277539385904
  36971. Train Steps: 62/90 Loss: 0.0160 torch.Size([8, 600, 800])
  36972. torch.Size([8, 8])
  36973. tensor([[0.6114, 0.4018, 0.7213, 0.1967, 0.3763, 0.2700, 0.5875, 0.5533],
  36974. [0.6225, 0.4116, 0.8662, 0.3517, 0.3663, 0.3233, 0.5837, 0.5317],
  36975. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  36976. [0.6332, 0.4165, 0.9100, 0.3350, 0.4188, 0.3683, 0.7438, 0.5528],
  36977. [ nan, nan, 0.8675, 0.2833, 0.5350, 0.1983, 0.6678, 0.5621],
  36978. [0.6200, 0.4118, 0.8287, 0.4017, 0.3775, 0.2833, 0.5391, 0.5799],
  36979. [0.6261, 0.4045, 0.8865, 0.5369, 0.3895, 0.4859, 0.6683, 0.5249],
  36980. [0.6198, 0.4075, 0.8650, 0.5617, 0.4150, 0.4367, 0.5450, 0.5650]],
  36981. device='cuda:0', dtype=torch.float64)
  36982. predictions are: tensor([[ 5.8423e-01, -4.0921e-01, 8.4051e-01, -1.3952e+00, -5.2819e-01,
  36983. -9.3486e-01, 2.4505e-01, 2.1930e-01],
  36984. [ 6.5671e-01, -3.4788e-01, 1.5112e+00, -7.5554e-01, -6.2020e-01,
  36985. -6.4918e-01, 2.0874e-01, 1.8594e-01],
  36986. [ 4.3317e-01, -5.3625e-01, 1.7903e+00, -5.5146e-01, -1.9873e-01,
  36987. -9.7180e-01, 7.4523e-01, 9.3876e-02],
  36988. [ 2.9301e-01, -5.9894e-01, 1.7694e+00, -6.2905e-01, -4.0333e-01,
  36989. -5.2115e-01, 8.2788e-01, 2.0718e-01],
  36990. [-2.7556e+00, -2.5627e+00, 1.4485e+00, -1.1333e+00, -9.4608e-04,
  36991. -1.1536e+00, 7.4314e-01, 2.3110e-01],
  36992. [ 3.9862e-01, -4.9696e-01, 1.3710e+00, -4.8671e-01, -5.6165e-01,
  36993. -8.6880e-01, 1.3935e-02, 3.0212e-01],
  36994. [ 6.2111e-01, -4.1407e-01, 1.5811e+00, 4.3570e-02, -5.5322e-01,
  36995. 2.0704e-02, 6.7610e-01, 4.8456e-02],
  36996. [ 3.0005e-01, -5.6617e-01, 1.4875e+00, 2.0248e-01, -4.3813e-01,
  36997. -2.1301e-01, 2.2350e-01, 2.4070e-01]], device='cuda:0',
  36998. grad_fn=<AddmmBackward>)
  36999. landmarks are: tensor([[[ 0.5380, -0.4302, 1.0455, -1.3775, -0.5480, -1.0388, 0.4277,
  37000. 0.2699],
  37001. [ 0.5893, -0.3847, 1.7152, -0.6616, -0.5942, -0.7925, 0.4104,
  37002. 0.1698],
  37003. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  37004. 0.2142],
  37005. [ 0.6388, -0.3623, 1.9173, -0.7386, -0.3517, -0.5846, 1.1495,
  37006. 0.2676],
  37007. [-2.2859, -2.2859, 1.7210, -0.9772, 0.1852, -1.3698, 0.7986,
  37008. 0.3104],
  37009. [ 0.5779, -0.3840, 1.5420, -0.4306, -0.5423, -0.9772, 0.2041,
  37010. 0.3928],
  37011. [ 0.6059, -0.4177, 1.8087, 0.1941, -0.4868, -0.0414, 0.8010,
  37012. 0.1385],
  37013. [ 0.5770, -0.4036, 1.7095, 0.3084, -0.3691, -0.2690, 0.2314,
  37014. 0.3238]]], device='cuda:0')
  37015. loss_train_step before backward: tensor(0.0255, device='cuda:0', grad_fn=<MseLossBackward>)
  37016. loss_train_step after backward: tensor(0.0255, device='cuda:0', grad_fn=<MseLossBackward>)
  37017. loss_train: 1.015299854800105
  37018. step: 63
  37019. running loss: 0.01611587071111278
  37020.  
  37021. Train Steps: 63/90 Loss: 0.0161 torch.Size([8, 600, 800])
  37022. torch.Size([8, 8])
  37023. tensor([[0.6086, 0.4019, 0.7782, 0.4278, 0.3625, 0.4350, 0.5150, 0.5285],
  37024. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  37025. [0.6182, 0.3987, 0.7878, 0.2889, 0.3699, 0.3260, 0.6086, 0.5367],
  37026. [0.6095, 0.3970, 0.8688, 0.4767, 0.4860, 0.4879, 0.5191, 0.4940],
  37027. [0.6170, 0.4102, 0.7468, 0.3695, 0.3463, 0.3767, 0.5238, 0.5823],
  37028. [0.6296, 0.4008, 0.9150, 0.4317, 0.4263, 0.3050, 0.7256, 0.5413],
  37029. [0.6266, 0.4067, 0.8588, 0.2867, 0.4300, 0.2850, 0.6325, 0.5267],
  37030. [0.6289, 0.4019, 0.8113, 0.5467, 0.3875, 0.5017, 0.7367, 0.5332]],
  37031. device='cuda:0', dtype=torch.float64)
  37032. predictions are: tensor([[ 0.4983, -0.4283, 1.2735, -0.4185, -0.6757, -0.3920, -0.0064, 0.1818],
  37033. [ 0.4463, -0.4745, 1.7635, -0.0741, -0.2198, 0.0709, 0.3045, 0.0067],
  37034. [ 0.4358, -0.5093, 1.3346, -1.0143, -0.6237, -0.7973, 0.4648, 0.2807],
  37035. [ 0.4776, -0.4860, 1.7109, -0.0809, -0.1550, -0.0845, 0.2076, 0.0665],
  37036. [ 0.3352, -0.4959, 1.1055, -0.6256, -0.7360, -0.6334, 0.1003, 0.4328],
  37037. [ 0.3745, -0.5841, 1.9757, -0.3037, -0.3375, -0.9440, 1.0600, 0.1346],
  37038. [ 0.7117, -0.3051, 1.6728, -0.9691, -0.3679, -1.0242, 0.5702, 0.1927],
  37039. [ 0.6047, -0.4263, 1.4712, 0.2078, -0.5265, -0.0830, 1.0713, 0.1632]],
  37040. device='cuda:0', grad_fn=<AddmmBackward>)
  37041. landmarks are: tensor([[[ 0.5253, -0.4296, 1.3084, -0.3098, -0.6115, -0.2767, 0.0928,
  37042. 0.1552],
  37043. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  37044. 0.0682],
  37045. [ 0.5697, -0.4442, 1.3529, -0.9515, -0.5774, -0.7801, 0.5253,
  37046. 0.1931],
  37047. [ 0.5292, -0.4520, 1.7268, -0.0842, -0.0413, -0.0324, 0.1116,
  37048. -0.0039],
  37049. [ 0.5639, -0.3911, 1.1634, -0.5794, -0.6866, -0.5461, 0.1334,
  37050. 0.4036],
  37051. [ 0.6224, -0.4345, 1.9404, -0.2921, -0.3171, -0.8771, 1.0655,
  37052. 0.2142],
  37053. [ 0.6084, -0.4076, 1.6806, -0.9618, -0.2998, -0.9695, 0.6356,
  37054. 0.1467],
  37055. [ 0.6191, -0.4297, 1.4612, 0.2391, -0.4961, 0.0313, 1.1166,
  37056. 0.1768]]], device='cuda:0')
  37057. loss_train_step before backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  37058. loss_train_step after backward: tensor(0.0063, device='cuda:0', grad_fn=<MseLossBackward>)
  37059. loss_train: 1.021567848045379
  37060. step: 64
  37061. running loss: 0.015961997625709046
  37062. Train Steps: 64/90 Loss: 0.0160 torch.Size([8, 600, 800])
  37063. torch.Size([8, 8])
  37064. tensor([[0.6260, 0.4161, 0.9000, 0.3833, 0.4450, 0.2133, 0.6237, 0.4986],
  37065. [0.6175, 0.4091, 0.7863, 0.2800, 0.3638, 0.3583, 0.6188, 0.5433],
  37066. [0.6179, 0.3993, 0.8925, 0.4789, 0.3879, 0.4900, 0.6041, 0.5279],
  37067. [0.6250, 0.4106, 0.8700, 0.3717, 0.3588, 0.4967, 0.6038, 0.5167],
  37068. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679],
  37069. [0.6125, 0.3983, 0.8750, 0.4867, 0.4275, 0.4783, 0.5413, 0.5717],
  37070. [0.6214, 0.3982, 0.8938, 0.4517, 0.3663, 0.4083, 0.5863, 0.5050],
  37071. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142]],
  37072. device='cuda:0', dtype=torch.float64)
  37073. predictions are: tensor([[ 0.4823, -0.4508, 1.8019, -0.3918, -0.2574, -1.2008, 0.5459, 0.0978],
  37074. [ 0.5608, -0.3837, 1.1220, -1.0028, -0.6592, -0.5652, 0.3373, 0.2505],
  37075. [ 0.4518, -0.4826, 1.6649, -0.0459, -0.5189, -0.0822, 0.5264, 0.1332],
  37076. [ 0.6273, -0.3566, 1.5237, -0.4565, -0.6031, -0.0520, 0.6042, 0.1593],
  37077. [-2.3707, -2.2975, 1.5311, -1.0986, 0.2021, -1.1821, 1.1018, 0.3396],
  37078. [ 0.4574, -0.4729, 1.5861, 0.0844, -0.3624, -0.0815, 0.3012, 0.2289],
  37079. [ 0.5393, -0.4603, 1.6396, -0.0924, -0.6100, -0.3728, 0.4136, 0.0178],
  37080. [ 0.6332, -0.3491, 1.5950, -0.1174, -0.4494, -0.1350, 0.1423, 0.0673]],
  37081. device='cuda:0', grad_fn=<AddmmBackward>)
  37082. landmarks are: tensor([[[ 0.6054, -0.3641, 1.8711, -0.5153, -0.2305, -1.3005, 0.5948,
  37083. 0.0171],
  37084. [ 0.5665, -0.3963, 1.3457, -0.9926, -0.6058, -0.6308, 0.5721,
  37085. 0.2237],
  37086. [ 0.5680, -0.4417, 1.8365, -0.0740, -0.4941, -0.0227, 0.5045,
  37087. 0.1525],
  37088. [ 0.6010, -0.3896, 1.7326, -0.5692, -0.6289, 0.0082, 0.5028,
  37089. 0.1005],
  37090. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  37091. 0.3371],
  37092. [ 0.5432, -0.4462, 1.7557, -0.0380, -0.3113, -0.0765, 0.2141,
  37093. 0.3546],
  37094. [ 0.5844, -0.4466, 1.8423, -0.1997, -0.5942, -0.3998, 0.4219,
  37095. 0.0467],
  37096. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  37097. 0.0893]]], device='cuda:0')
  37098. loss_train_step before backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  37099. loss_train_step after backward: tensor(0.0087, device='cuda:0', grad_fn=<MseLossBackward>)
  37100. loss_train: 1.0303018535487354
  37101. step: 65
  37102. running loss: 0.015850797746903622
  37103. Train Steps: 65/90 Loss: 0.0159 torch.Size([8, 600, 800])
  37104. torch.Size([8, 8])
  37105. tensor([[0.6070, 0.3979, 0.8575, 0.5083, 0.4350, 0.5400, 0.5180, 0.5466],
  37106. [0.6185, 0.4067, 0.8838, 0.4450, 0.4037, 0.4733, 0.5213, 0.5142],
  37107. [0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  37108. [0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  37109. [0.6243, 0.4128, 0.7762, 0.2717, 0.3825, 0.3133, 0.6212, 0.5417],
  37110. [0.6257, 0.4034, 0.8287, 0.2333, 0.3925, 0.2717, 0.6330, 0.4901],
  37111. [0.6332, 0.4128, 0.9200, 0.3517, 0.4400, 0.3833, 0.7461, 0.5494],
  37112. [0.6160, 0.4093, 0.8314, 0.4417, 0.3675, 0.4583, 0.5250, 0.5808]],
  37113. device='cuda:0', dtype=torch.float64)
  37114. predictions are: tensor([[ 0.5700, -0.4073, 1.6418, 0.1862, -0.2623, 0.1250, 0.4004, 0.1653],
  37115. [ 0.7220, -0.3087, 1.7366, -0.1382, -0.4315, -0.1361, 0.2370, 0.0559],
  37116. [ 0.4944, -0.4977, 1.6870, -0.6288, -0.4603, -1.0396, 0.5128, -0.0098],
  37117. [ 0.5891, -0.3530, 1.6456, 0.2662, -0.5829, -0.4358, 0.4185, 0.4307],
  37118. [ 0.7564, -0.2906, 1.2859, -1.0564, -0.4996, -0.8074, 0.6509, 0.2876],
  37119. [ 0.5688, -0.4439, 1.4126, -1.1453, -0.4822, -0.9829, 0.5486, -0.0029],
  37120. [ 0.5284, -0.4687, 1.8423, -0.5432, -0.2972, -0.5283, 1.1121, 0.2081],
  37121. [ 0.4286, -0.4599, 1.5429, -0.1226, -0.6268, -0.2642, 0.2406, 0.3169]],
  37122. device='cuda:0', grad_fn=<AddmmBackward>)
  37123. landmarks are: tensor([[[ 0.5178, -0.4480, 1.6748, 0.0620, -0.2767, 0.2083, 0.1067,
  37124. 0.2386],
  37125. [ 0.5708, -0.4075, 1.7961, -0.2305, -0.4210, -0.0996, 0.1219,
  37126. 0.0893],
  37127. [ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  37128. -0.0957],
  37129. [ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  37130. 0.4547],
  37131. [ 0.5977, -0.3792, 1.2995, -1.0311, -0.5192, -0.8386, 0.5836,
  37132. 0.2160],
  37133. [ 0.6042, -0.4225, 1.5420, -1.2082, -0.4730, -1.0311, 0.6380,
  37134. -0.0220],
  37135. [ 0.6388, -0.3792, 1.9635, -0.6616, -0.2536, -0.5153, 1.1605,
  37136. 0.2516],
  37137. [ 0.5592, -0.3956, 1.5543, -0.2456, -0.5885, -0.1689, 0.1392,
  37138. 0.3968]]], device='cuda:0')
  37139. loss_train_step before backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  37140. loss_train_step after backward: tensor(0.0066, device='cuda:0', grad_fn=<MseLossBackward>)
  37141. loss_train: 1.0369146969169378
  37142. step: 66
  37143. running loss: 0.015710828741165726
  37144. Train Steps: 66/90 Loss: 0.0157 torch.Size([8, 600, 800])
  37145. torch.Size([8, 8])
  37146. tensor([[0.6136, 0.4085, 0.6688, 0.2317, 0.3862, 0.2367, 0.5517, 0.5783],
  37147. [0.6136, 0.4117, 0.8700, 0.5167, 0.4188, 0.5083, 0.5147, 0.5495],
  37148. [0.6299, 0.4303, 0.7963, 0.3933, 0.4850, 0.2283, 0.5480, 0.6222],
  37149. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  37150. [0.6196, 0.4094, 0.7562, 0.2817, 0.3937, 0.3183, 0.6013, 0.6183],
  37151. [0.6129, 0.4063, 0.8738, 0.5250, 0.4313, 0.4733, 0.5230, 0.5874],
  37152. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  37153. [0.6085, 0.4008, 0.8588, 0.5200, 0.4959, 0.4977, 0.5175, 0.5283]],
  37154. device='cuda:0', dtype=torch.float64)
  37155. predictions are: tensor([[ 0.4583, -0.4992, 0.8629, -1.1960, -0.6042, -1.1037, 0.4087, 0.1988],
  37156. [ 0.5696, -0.4237, 1.8692, 0.1697, -0.4560, 0.0712, 0.5130, 0.0453],
  37157. [ 0.6720, -0.3059, 1.6680, -0.4913, -0.1965, -1.1177, 0.5406, 0.3097],
  37158. [ 0.2959, -0.5816, 1.4801, -0.9764, -0.5421, -1.1075, 0.2888, 0.1507],
  37159. [ 0.6170, -0.3856, 1.3985, -0.9501, -0.5622, -0.8307, 0.7079, 0.3880],
  37160. [ 0.6378, -0.3512, 1.8180, 0.2329, -0.4365, -0.0178, 0.4217, 0.2185],
  37161. [ 0.4949, -0.4244, 1.3233, -1.0124, -0.2559, -1.2040, 0.5447, 0.3054],
  37162. [ 0.5707, -0.4398, 1.8753, 0.1660, -0.1342, 0.0073, 0.5037, 0.0035]],
  37163. device='cuda:0', grad_fn=<AddmmBackward>)
  37164. landmarks are: tensor([[[ 0.5483, -0.3991, 0.8030, -1.2159, -0.5018, -1.1928, 0.2624,
  37165. 0.3852],
  37166. [ 0.5482, -0.3841, 1.7326, 0.1005, -0.3517, 0.0620, 0.0912,
  37167. 0.2522],
  37168. [ 0.6237, -0.2983, 1.3919, -0.4691, -0.0457, -1.2313, 0.2453,
  37169. 0.5882],
  37170. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  37171. 0.3700],
  37172. [ 0.5759, -0.3948, 1.2072, -0.9849, -0.4672, -0.8156, 0.4912,
  37173. 0.5701],
  37174. [ 0.5453, -0.4091, 1.7499, 0.1390, -0.2940, -0.0996, 0.1300,
  37175. 0.4272],
  37176. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  37177. 0.3854],
  37178. [ 0.5245, -0.4347, 1.6806, 0.1159, 0.0046, 0.0129, 0.1044,
  37179. 0.1544]]], device='cuda:0')
  37180. loss_train_step before backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  37181. loss_train_step after backward: tensor(0.0235, device='cuda:0', grad_fn=<MseLossBackward>)
  37182. loss_train: 1.060399990528822
  37183. step: 67
  37184. running loss: 0.015826865530280926
  37185.  
  37186. Train Steps: 67/90 Loss: 0.0158 torch.Size([8, 600, 800])
  37187. torch.Size([8, 8])
  37188. tensor([[0.6229, 0.4066, 0.8513, 0.5717, 0.4500, 0.5050, 0.6025, 0.5350],
  37189. [0.6361, 0.4071, 0.9100, 0.4783, 0.3738, 0.3967, 0.6670, 0.5332],
  37190. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  37191. [0.6214, 0.4116, 0.7750, 0.2317, 0.4487, 0.1883, 0.6200, 0.5400],
  37192. [0.6150, 0.3949, 0.8800, 0.4033, 0.3825, 0.4900, 0.5875, 0.5483],
  37193. [0.6274, 0.4099, 0.8625, 0.3233, 0.4400, 0.1983, 0.5876, 0.4869],
  37194. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  37195. [0.6203, 0.4072, 0.8892, 0.3523, 0.3783, 0.3017, 0.5898, 0.5478]],
  37196. device='cuda:0', dtype=torch.float64)
  37197. predictions are: tensor([[ 0.6211, -0.3934, 1.7261, 0.4591, -0.2666, 0.0805, 0.5491, 0.1778],
  37198. [ 0.6831, -0.3731, 1.9187, -0.0112, -0.6001, -0.3599, 0.7898, 0.1492],
  37199. [ 0.3914, -0.5190, 0.9761, -1.2904, -0.5236, -1.0034, 0.4221, 0.2727],
  37200. [ 0.5367, -0.4494, 1.2859, -1.1676, -0.2218, -1.2896, 0.5564, 0.1938],
  37201. [ 0.7263, -0.3094, 1.7982, -0.3888, -0.5521, 0.0118, 0.5007, 0.1631],
  37202. [ 0.6938, -0.3546, 1.8083, -0.7449, -0.2507, -1.3090, 0.5148, 0.0247],
  37203. [ 0.5000, -0.4189, 1.0990, -1.0047, -0.2257, -1.2594, 0.3236, 0.4026],
  37204. [ 0.6410, -0.3702, 1.9326, -0.6053, -0.5425, -0.7602, 0.4749, 0.2303]],
  37205. device='cuda:0', grad_fn=<AddmmBackward>)
  37206. landmarks are: tensor([[[ 0.5911, -0.4080, 1.6460, 0.3546, -0.2074, 0.0467, 0.4970,
  37207. 0.1852],
  37208. [ 0.6520, -0.4056, 1.9173, -0.0765, -0.5596, -0.4537, 0.7949,
  37209. 0.1768],
  37210. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  37211. 0.2930],
  37212. [ 0.5842, -0.3848, 1.2938, -1.2159, -0.2132, -1.4160, 0.5778,
  37213. 0.2083],
  37214. [ 0.5546, -0.4620, 1.7788, -0.4229, -0.5192, -0.0226, 0.4277,
  37215. 0.2468],
  37216. [ 0.6119, -0.3927, 1.6979, -0.7925, -0.2536, -1.3698, 0.4282,
  37217. -0.0368],
  37218. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  37219. 0.3931],
  37220. [ 0.5792, -0.4052, 1.8214, -0.6587, -0.5384, -0.8924, 0.4381,
  37221. 0.2442]]], device='cuda:0')
  37222. loss_train_step before backward: tensor(0.0052, device='cuda:0', grad_fn=<MseLossBackward>)
  37223. loss_train_step after backward: tensor(0.0052, device='cuda:0', grad_fn=<MseLossBackward>)
  37224. loss_train: 1.0655750310979784
  37225. step: 68
  37226. running loss: 0.015670221045558506
  37227. Train Steps: 68/90 Loss: 0.0157 torch.Size([8, 600, 800])
  37228. torch.Size([8, 8])
  37229. tensor([[0.6201, 0.4151, 0.8588, 0.5467, 0.3700, 0.3950, 0.5637, 0.5933],
  37230. [0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  37231. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  37232. [0.6179, 0.4008, 0.8600, 0.4015, 0.3932, 0.2515, 0.5711, 0.5438],
  37233. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  37234. [0.6168, 0.4055, 0.7575, 0.2950, 0.4050, 0.2717, 0.5938, 0.6167],
  37235. [0.6353, 0.4128, 0.8488, 0.2600, 0.5525, 0.1616, 0.6694, 0.5540],
  37236. [0.6198, 0.4164, 0.8700, 0.5067, 0.4625, 0.5650, 0.5464, 0.5197]],
  37237. device='cuda:0', dtype=torch.float64)
  37238. predictions are: tensor([[ 6.4932e-01, -3.1109e-01, 1.7652e+00, 1.8150e-01, -6.3398e-01,
  37239. -3.7820e-01, 2.5626e-01, 3.6480e-01],
  37240. [ 5.5427e-01, -3.8678e-01, 1.2450e+00, -1.0782e+00, -2.0523e-01,
  37241. -1.2230e+00, 4.0710e-01, 3.8396e-01],
  37242. [ 5.8606e-01, -4.1393e-01, 1.8375e+00, 1.7360e-01, -6.3783e-01,
  37243. -4.7665e-01, 3.0656e-01, 1.1668e-01],
  37244. [ 7.0116e-01, -3.3979e-01, 1.6863e+00, -5.5139e-01, -4.7769e-01,
  37245. -1.0744e+00, 2.7354e-01, 1.6098e-01],
  37246. [ 6.5969e-01, -3.8419e-01, 1.7464e+00, 1.3380e-01, -3.9393e-01,
  37247. 1.2854e-01, 9.0110e-01, 1.3022e-01],
  37248. [ 5.2570e-01, -4.2665e-01, 1.2532e+00, -1.0416e+00, -5.1630e-01,
  37249. -9.5149e-01, 4.5284e-01, 4.6819e-01],
  37250. [ 5.8049e-01, -4.0814e-01, 1.6135e+00, -1.3326e+00, 2.0178e-01,
  37251. -1.3246e+00, 9.6435e-01, 2.3764e-01],
  37252. [ 6.0887e-01, -3.5483e-01, 1.8828e+00, -1.1708e-03, -2.4791e-01,
  37253. 1.8476e-01, 4.1590e-01, 7.2394e-02]], device='cuda:0',
  37254. grad_fn=<AddmmBackward>)
  37255. landmarks are: tensor([[[ 0.5785, -0.3687, 1.6806, 0.2391, -0.5769, -0.4614, 0.3180,
  37256. 0.4547],
  37257. [ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  37258. 0.3854],
  37259. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  37260. 0.1698],
  37261. [ 0.5680, -0.4345, 1.6864, -0.4315, -0.4698, -1.1241, 0.3518,
  37262. 0.2261],
  37263. [ 0.6042, -0.4273, 1.7198, 0.2184, -0.3478, 0.1149, 0.8062,
  37264. 0.1176],
  37265. [ 0.5631, -0.4129, 1.2129, -0.9233, -0.4152, -1.0311, 0.4566,
  37266. 0.5624],
  37267. [ 0.6487, -0.3792, 1.6344, -1.0850, 0.2659, -1.5397, 0.8059,
  37268. 0.2730],
  37269. [ 0.5770, -0.3624, 1.7326, 0.0543, -0.1497, 0.3238, 0.2378,
  37270. 0.1146]]], device='cuda:0')
  37271. loss_train_step before backward: tensor(0.0071, device='cuda:0', grad_fn=<MseLossBackward>)
  37272. loss_train_step after backward: tensor(0.0071, device='cuda:0', grad_fn=<MseLossBackward>)
  37273. loss_train: 1.0726689579896629
  37274. step: 69
  37275. running loss: 0.01554592692738642
  37276. Train Steps: 69/90 Loss: 0.0155 torch.Size([8, 600, 800])
  37277. torch.Size([8, 8])
  37278. tensor([[0.6048, 0.3928, 0.8538, 0.5433, 0.3875, 0.5117, 0.5266, 0.4719],
  37279. [0.6055, 0.4015, 0.7425, 0.2033, 0.4113, 0.1883, 0.5217, 0.4823],
  37280. [0.6148, 0.3996, 0.8488, 0.3867, 0.3488, 0.4067, 0.5863, 0.5000],
  37281. [0.6136, 0.3955, 0.8400, 0.3267, 0.3500, 0.4200, 0.5863, 0.5467],
  37282. [0.6223, 0.4130, 0.8100, 0.2983, 0.3525, 0.3900, 0.5694, 0.5103],
  37283. [0.6361, 0.4102, 0.8650, 0.2983, 0.4888, 0.2000, 0.6702, 0.5459],
  37284. [0.6271, 0.4040, 0.9138, 0.3750, 0.4625, 0.2617, 0.7232, 0.5413],
  37285. [0.6214, 0.4112, 0.7838, 0.2117, 0.3650, 0.3133, 0.5675, 0.5083]],
  37286. device='cuda:0', dtype=torch.float64)
  37287. predictions are: tensor([[ 0.5832, -0.4019, 1.7111, 0.4521, -0.3889, 0.0626, 0.1651, 0.1931],
  37288. [ 0.5105, -0.4393, 0.9998, -1.1845, -0.3595, -1.3779, 0.1922, 0.1342],
  37289. [ 0.6528, -0.3713, 1.6885, -0.3394, -0.6116, -0.3599, 0.3463, 0.2027],
  37290. [ 0.6792, -0.3349, 1.6055, -0.6538, -0.5749, -0.4010, 0.4729, 0.3349],
  37291. [ 0.8564, -0.2081, 1.5162, -0.6773, -0.5229, -0.5072, 0.3051, 0.3393],
  37292. [ 0.6010, -0.4154, 1.7584, -0.8380, 0.0861, -1.3183, 0.9652, 0.2800],
  37293. [ 0.6342, -0.4167, 2.0447, -0.4159, -0.0362, -1.1658, 1.0665, 0.2960],
  37294. [ 0.6628, -0.3548, 1.3875, -1.2671, -0.5098, -0.9115, 0.4795, 0.2078]],
  37295. device='cuda:0', grad_fn=<AddmmBackward>)
  37296. landmarks are: tensor([[[ 0.5079, -0.4714, 1.6575, 0.2237, -0.4961, 0.0774, 0.1465,
  37297. -0.1061],
  37298. [ 0.5109, -0.4316, 1.1436, -1.3467, -0.3864, -1.4160, 0.1239,
  37299. -0.0580],
  37300. [ 0.5538, -0.4400, 1.6344, -0.4999, -0.6751, -0.4075, 0.4219,
  37301. 0.0236],
  37302. [ 0.5484, -0.4591, 1.5940, -0.7771, -0.6693, -0.3460, 0.4219,
  37303. 0.2391],
  37304. [ 0.5886, -0.3784, 1.4554, -0.9079, -0.6577, -0.4845, 0.3440,
  37305. 0.0712],
  37306. [ 0.6520, -0.3912, 1.7095, -0.9079, -0.0284, -1.3621, 0.8096,
  37307. 0.2356],
  37308. [ 0.6108, -0.4201, 1.9346, -0.5538, -0.1497, -1.0773, 1.0545,
  37309. 0.2142],
  37310. [ 0.5845, -0.3864, 1.3342, -1.3082, -0.6000, -0.8386, 0.3353,
  37311. 0.0620]]], device='cuda:0')
  37312. loss_train_step before backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  37313. loss_train_step after backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  37314. loss_train: 1.0858652363531291
  37315. step: 70
  37316. running loss: 0.015512360519330417
  37317. Train Steps: 70/90 Loss: 0.0155 torch.Size([8, 600, 800])
  37318. torch.Size([8, 8])
  37319. tensor([[0.6277, 0.4036, 0.8688, 0.3617, 0.3925, 0.2600, 0.6132, 0.4742],
  37320. [0.6076, 0.3958, 0.8700, 0.4667, 0.4546, 0.5046, 0.5231, 0.4960],
  37321. [0.6275, 0.4071, 0.8075, 0.2100, 0.4700, 0.1533, 0.6148, 0.4834],
  37322. [0.6189, 0.4029, 0.8375, 0.5767, 0.4745, 0.4829, 0.5551, 0.5598],
  37323. [0.6140, 0.4070, 0.8700, 0.5000, 0.4612, 0.4900, 0.5260, 0.5852],
  37324. [0.6147, 0.4112, 0.7988, 0.3200, 0.3775, 0.2767, 0.5150, 0.5550],
  37325. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  37326. [0.6276, 0.4002, 0.8800, 0.5533, 0.3575, 0.4400, 0.6132, 0.4672]],
  37327. device='cuda:0', dtype=torch.float64)
  37328. predictions are: tensor([[ 0.7524, -0.3138, 1.7652, -0.7036, -0.4591, -1.0202, 0.6242, 0.0644],
  37329. [ 0.7036, -0.3337, 1.8266, -0.1566, -0.2323, 0.0085, 0.2252, 0.1692],
  37330. [ 0.7085, -0.3449, 1.4596, -1.4295, -0.0171, -1.5700, 0.9127, 0.0854],
  37331. [ 0.6374, -0.3348, 1.6523, 0.3809, -0.1125, -0.1319, 0.3967, 0.3868],
  37332. [ 0.5919, -0.3661, 1.7851, 0.0314, -0.1617, -0.0299, 0.3320, 0.4521],
  37333. [ 0.8570, -0.1832, 1.4189, -0.8228, -0.5323, -0.9292, 0.0790, 0.3344],
  37334. [-1.1760, -1.5135, 1.1183, -1.1627, -0.3278, -1.3243, 0.1392, 0.3514],
  37335. [ 0.7340, -0.3614, 1.7749, 0.2905, -0.6121, -0.2406, 0.7003, 0.1101]],
  37336. device='cuda:0', grad_fn=<AddmmBackward>)
  37337. landmarks are: tensor([[[ 0.6134, -0.4218, 1.7268, -0.6154, -0.4730, -1.0850, 0.5463,
  37338. -0.0957],
  37339. [ 0.5205, -0.4577, 1.7326, -0.1304, -0.1862, 0.0447, 0.1301,
  37340. 0.0051],
  37341. [ 0.6126, -0.4057, 1.4439, -1.3159, -0.1150, -1.5777, 0.5537,
  37342. -0.0530],
  37343. [ 0.5726, -0.4249, 1.5824, 0.3777, -0.0942, -0.0556, 0.2782,
  37344. 0.2997],
  37345. [ 0.5500, -0.4060, 1.7326, 0.0236, -0.1554, -0.0226, 0.1438,
  37346. 0.4171],
  37347. [ 0.5532, -0.3864, 1.4035, -0.8079, -0.5423, -1.0080, 0.0928,
  37348. 0.2776],
  37349. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  37350. 0.2853],
  37351. [ 0.6128, -0.4375, 1.7788, 0.2699, -0.6346, -0.2536, 0.5463,
  37352. -0.1278]]], device='cuda:0')
  37353. loss_train_step before backward: tensor(0.0401, device='cuda:0', grad_fn=<MseLossBackward>)
  37354. loss_train_step after backward: tensor(0.0401, device='cuda:0', grad_fn=<MseLossBackward>)
  37355. loss_train: 1.1259842771105468
  37356. step: 71
  37357. running loss: 0.015858933480430236
  37358.  
  37359. Train Steps: 71/90 Loss: 0.0159 torch.Size([8, 600, 800])
  37360. torch.Size([8, 8])
  37361. tensor([[0.6200, 0.4112, 0.8862, 0.4100, 0.3638, 0.4917, 0.6088, 0.6050],
  37362. [0.6151, 0.4085, 0.8750, 0.4367, 0.3887, 0.4367, 0.5066, 0.5846],
  37363. [0.6108, 0.4011, 0.8037, 0.3400, 0.3700, 0.2933, 0.5658, 0.5617],
  37364. [0.6236, 0.4084, 0.7738, 0.2133, 0.3663, 0.3233, 0.5813, 0.5567],
  37365. [0.6138, 0.4020, 0.8800, 0.4717, 0.4375, 0.4717, 0.5502, 0.5611],
  37366. [0.6339, 0.4123, 0.8638, 0.5367, 0.4075, 0.5467, 0.7517, 0.5436],
  37367. [0.6161, 0.4055, 0.8675, 0.3867, 0.3713, 0.4033, 0.5195, 0.5162],
  37368. [ nan, nan, 0.8488, 0.2300, 0.5563, 0.2100, 0.7390, 0.5679]],
  37369. device='cuda:0', dtype=torch.float64)
  37370. predictions are: tensor([[ 0.7596, -0.2490, 1.7706, -0.2143, -0.4673, -0.0846, 0.3435, 0.3957],
  37371. [ 0.6366, -0.3010, 1.7074, -0.1447, -0.4508, -0.3138, -0.0450, 0.2564],
  37372. [ 0.6255, -0.3668, 1.4270, -0.6066, -0.5383, -0.9385, 0.2893, 0.1861],
  37373. [ 0.6542, -0.3571, 1.2980, -1.1232, -0.4624, -0.9424, 0.4861, 0.2497],
  37374. [ 0.6544, -0.3270, 1.7445, -0.0034, -0.2148, -0.1705, 0.1259, 0.2557],
  37375. [ 0.6998, -0.3413, 1.7491, 0.2611, -0.3304, 0.1221, 1.0424, 0.2210],
  37376. [ 0.7470, -0.2772, 1.7329, -0.3159, -0.5494, -0.5700, -0.0321, 0.0129],
  37377. [-1.4784, -1.7442, 1.6703, -1.2390, 0.4985, -1.6062, 1.2554, 0.3567]],
  37378. device='cuda:0', grad_fn=<AddmmBackward>)
  37379. landmarks are: tensor([[[ 0.5777, -0.3868, 1.8076, -0.3921, -0.6058, -0.0149, 0.5259,
  37380. 0.5085],
  37381. [ 0.5553, -0.3992, 1.7557, -0.2690, -0.4903, -0.2690, 0.0542,
  37382. 0.4145],
  37383. [ 0.5355, -0.4335, 1.4266, -0.7155, -0.5769, -0.9310, 0.3275,
  37384. 0.3087],
  37385. [ 0.5946, -0.3995, 1.2880, -1.3005, -0.5942, -0.7925, 0.3988,
  37386. 0.2853],
  37387. [ 0.5491, -0.4290, 1.7788, -0.1073, -0.2651, -0.1073, 0.2555,
  37388. 0.3057],
  37389. [ 0.6421, -0.3816, 1.7037, 0.1929, -0.4037, 0.2391, 1.1861,
  37390. 0.2249],
  37391. [ 0.5598, -0.4129, 1.7210, -0.4999, -0.5711, -0.4229, 0.1136,
  37392. 0.0983],
  37393. [-2.2859, -2.2859, 1.6344, -1.2236, 0.2834, -1.3159, 1.1276,
  37394. 0.3371]]], device='cuda:0')
  37395. loss_train_step before backward: tensor(0.0265, device='cuda:0', grad_fn=<MseLossBackward>)
  37396. loss_train_step after backward: tensor(0.0265, device='cuda:0', grad_fn=<MseLossBackward>)
  37397. loss_train: 1.1525277267210186
  37398. step: 72
  37399. running loss: 0.016007329537791923
  37400. Train Steps: 72/90 Loss: 0.0160 torch.Size([8, 600, 800])
  37401. torch.Size([8, 8])
  37402. tensor([[0.6132, 0.4118, 0.8200, 0.3633, 0.3563, 0.5400, 0.5787, 0.5136],
  37403. [ nan, nan, 0.8750, 0.2467, 0.5138, 0.2617, 0.7382, 0.5552],
  37404. [0.6110, 0.4047, 0.8700, 0.4483, 0.3713, 0.3967, 0.5088, 0.5517],
  37405. [0.6185, 0.4042, 0.7700, 0.2250, 0.4062, 0.2117, 0.5763, 0.5150],
  37406. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  37407. [0.6270, 0.4267, 0.7150, 0.3317, 0.4900, 0.1817, 0.5560, 0.6183],
  37408. [0.6264, 0.4248, 0.8938, 0.4183, 0.3875, 0.4100, 0.5400, 0.5350],
  37409. [0.6276, 0.4095, 0.8237, 0.2250, 0.4662, 0.1783, 0.6171, 0.4869]],
  37410. device='cuda:0', dtype=torch.float64)
  37411. predictions are: tensor([[ 5.9427e-01, -3.5149e-01, 1.5071e+00, -5.8090e-01, -4.9336e-01,
  37412. 8.7826e-02, 4.6292e-01, 2.3218e-01],
  37413. [-1.9318e+00, -2.0346e+00, 1.7207e+00, -1.2192e+00, 2.7853e-01,
  37414. -1.4549e+00, 1.0914e+00, 3.3141e-01],
  37415. [ 5.7028e-01, -3.5766e-01, 1.7352e+00, -9.0277e-02, -5.7938e-01,
  37416. -3.2921e-01, -1.3246e-01, 2.5256e-01],
  37417. [ 5.9285e-01, -4.0147e-01, 1.2382e+00, -1.1689e+00, -3.9334e-01,
  37418. -1.2938e+00, 3.6060e-01, 1.1863e-01],
  37419. [ 6.5827e-01, -3.9911e-01, 1.8256e+00, -1.6101e-03, -5.0889e-01,
  37420. -4.0250e-01, 5.7856e-01, 1.1106e-01],
  37421. [ 6.9346e-01, -2.9639e-01, 1.0066e+00, -7.7031e-01, -1.1378e-01,
  37422. -1.3372e+00, 2.4999e-01, 5.3997e-01],
  37423. [ 6.0116e-01, -3.3656e-01, 1.8278e+00, -2.2940e-01, -5.3385e-01,
  37424. -3.2537e-01, 7.8322e-02, 2.2241e-01],
  37425. [ 6.2932e-01, -3.6683e-01, 1.5071e+00, -1.2220e+00, -3.4216e-03,
  37426. -1.4243e+00, 6.1705e-01, 7.4610e-02]], device='cuda:0',
  37427. grad_fn=<AddmmBackward>)
  37428. landmarks are: tensor([[[ 0.5466, -0.3840, 1.5016, -0.6077, -0.6404, 0.2083, 0.3871,
  37429. 0.0862],
  37430. [-2.2859, -2.2859, 1.7557, -1.1466, 0.0871, -1.0773, 1.1239,
  37431. 0.2783],
  37432. [ 0.5363, -0.4168, 1.7326, -0.2151, -0.5711, -0.4537, 0.0640,
  37433. 0.2622],
  37434. [ 0.5707, -0.4189, 1.2707, -1.2467, -0.4095, -1.3082, 0.3758,
  37435. 0.0928],
  37436. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  37437. 0.0472],
  37438. [ 0.6101, -0.3152, 1.0166, -0.7540, -0.0226, -1.4468, 0.2823,
  37439. 0.5702],
  37440. [ 0.6072, -0.3239, 1.8423, -0.3537, -0.4961, -0.3921, 0.2083,
  37441. 0.1852],
  37442. [ 0.6127, -0.3944, 1.5189, -1.2467, -0.1323, -1.4622, 0.5646,
  37443. -0.0369]]], device='cuda:0')
  37444. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  37445. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  37446. loss_train: 1.1630904129706323
  37447. step: 73
  37448. running loss: 0.015932745383159346
  37449. Train Steps: 73/90 Loss: 0.0159 torch.Size([8, 600, 800])
  37450. torch.Size([8, 8])
  37451. tensor([[0.6182, 0.4058, 0.8738, 0.4350, 0.3563, 0.3400, 0.5290, 0.5822],
  37452. [0.6164, 0.3972, 0.7818, 0.3381, 0.3599, 0.3387, 0.5880, 0.5153],
  37453. [0.6314, 0.4107, 0.8750, 0.5100, 0.3788, 0.4900, 0.7121, 0.5864],
  37454. [0.6109, 0.4015, 0.7668, 0.3639, 0.3513, 0.3667, 0.5200, 0.5641],
  37455. [0.6226, 0.4001, 0.8438, 0.5733, 0.3862, 0.4250, 0.5750, 0.5283],
  37456. [0.6163, 0.4001, 0.8788, 0.5033, 0.4012, 0.4633, 0.5338, 0.5767],
  37457. [0.6201, 0.4065, 0.7300, 0.1933, 0.4075, 0.2533, 0.6162, 0.5483],
  37458. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563]],
  37459. device='cuda:0', dtype=torch.float64)
  37460. predictions are: tensor([[ 0.6199, -0.3633, 1.7836, -0.3836, -0.5077, -0.7211, 0.0684, 0.2759],
  37461. [ 0.6889, -0.3536, 1.4425, -0.8366, -0.5263, -0.7809, 0.4121, 0.0883],
  37462. [ 0.6030, -0.4272, 1.9410, 0.0582, -0.2889, -0.1175, 1.1050, 0.3419],
  37463. [ 0.5360, -0.4069, 1.3305, -0.7654, -0.5238, -0.6782, 0.1789, 0.2832],
  37464. [ 0.7144, -0.3519, 1.7441, 0.3128, -0.3675, -0.3465, 0.3809, 0.1663],
  37465. [ 0.5369, -0.4524, 1.8689, -0.0673, -0.2455, -0.2268, 0.1903, 0.2530],
  37466. [ 0.6427, -0.3706, 1.1777, -1.4482, -0.2613, -1.2697, 0.5720, 0.2102],
  37467. [ 0.6546, -0.3343, 1.7212, -0.5872, -0.4739, -0.9253, 0.0056, 0.2401]],
  37468. device='cuda:0', grad_fn=<AddmmBackward>)
  37469. landmarks are: tensor([[[ 0.5697, -0.4113, 1.7499, -0.2767, -0.6404, -0.7155, 0.1576,
  37470. 0.4032],
  37471. [ 0.5614, -0.4514, 1.3252, -0.7240, -0.6237, -0.7215, 0.4299,
  37472. 0.0942],
  37473. [ 0.6306, -0.3888, 1.7557, 0.0697, -0.5365, -0.0226, 1.0033,
  37474. 0.4226],
  37475. [ 0.5357, -0.4315, 1.2557, -0.6051, -0.6635, -0.5923, 0.1159,
  37476. 0.3198],
  37477. [ 0.5900, -0.4377, 1.6113, 0.3623, -0.5018, -0.3229, 0.3700,
  37478. 0.1544],
  37479. [ 0.5610, -0.4381, 1.7730, 0.0390, -0.4326, -0.1458, 0.1794,
  37480. 0.3777],
  37481. [ 0.5784, -0.4085, 1.0859, -1.3929, -0.4037, -1.1158, 0.5605,
  37482. 0.2468],
  37483. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  37484. 0.2837]]], device='cuda:0')
  37485. loss_train_step before backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  37486. loss_train_step after backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  37487. loss_train: 1.1722305989824235
  37488. step: 74
  37489. running loss: 0.015840954040303022
  37490. Train Steps: 74/90 Loss: 0.0158 torch.Size([8, 600, 800])
  37491. torch.Size([8, 8])
  37492. tensor([[0.6139, 0.4019, 0.7137, 0.2150, 0.4375, 0.1533, 0.5293, 0.5006],
  37493. [0.6200, 0.4055, 0.8011, 0.2988, 0.3842, 0.2798, 0.5949, 0.5183],
  37494. [ nan, nan, 0.8525, 0.2217, 0.5413, 0.2367, 0.7367, 0.5482],
  37495. [0.6138, 0.4054, 0.8750, 0.4750, 0.4363, 0.5017, 0.5086, 0.5822],
  37496. [0.6275, 0.4157, 0.8337, 0.5800, 0.3763, 0.4200, 0.5547, 0.6125],
  37497. [0.6128, 0.4022, 0.8738, 0.5067, 0.4983, 0.5231, 0.5364, 0.5064],
  37498. [0.6097, 0.4024, 0.8488, 0.3717, 0.3875, 0.5517, 0.5836, 0.5591],
  37499. [0.6239, 0.4061, 0.8850, 0.4600, 0.4225, 0.5200, 0.6138, 0.5450]],
  37500. device='cuda:0', dtype=torch.float64)
  37501. predictions are: tensor([[ 0.7868, -0.2607, 1.0193, -1.2032, -0.3471, -1.6748, 0.2052, 0.0175],
  37502. [ 0.5743, -0.4024, 1.4428, -0.8914, -0.5607, -0.9998, 0.4252, 0.0937],
  37503. [-2.1559, -2.1935, 1.5947, -1.3129, 0.2300, -1.5728, 1.0261, 0.3095],
  37504. [ 0.5379, -0.3878, 1.7228, -0.1518, -0.3012, -0.0963, 0.0473, 0.2776],
  37505. [ 0.6823, -0.3246, 1.6219, 0.3853, -0.6079, -0.4308, 0.2746, 0.4834],
  37506. [ 0.4335, -0.4857, 1.7522, -0.0481, -0.0376, -0.1753, 0.0980, 0.1554],
  37507. [ 0.4807, -0.4354, 1.6261, -0.5759, -0.4750, 0.1213, 0.4935, 0.1963],
  37508. [ 0.5461, -0.4275, 1.8113, -0.2441, -0.3507, 0.0115, 0.4388, 0.1897]],
  37509. device='cuda:0', grad_fn=<AddmmBackward>)
  37510. landmarks are: tensor([[[ 0.5496, -0.4295, 1.0109, -1.2928, -0.2651, -1.5777, 0.1589,
  37511. 0.0261],
  37512. [ 0.5781, -0.4129, 1.4142, -0.9057, -0.5115, -0.9937, 0.4621,
  37513. 0.1080],
  37514. [-2.2859, -2.2859, 1.6517, -1.2620, 0.2141, -1.1928, 1.1166,
  37515. 0.2463],
  37516. [ 0.5491, -0.4132, 1.7557, -0.0919, -0.2709, 0.0313, 0.0635,
  37517. 0.4032],
  37518. [ 0.6124, -0.3658, 1.5651, 0.3931, -0.5480, -0.3460, 0.2761,
  37519. 0.5431],
  37520. [ 0.5446, -0.4280, 1.7499, 0.0543, 0.0156, 0.1301, 0.1918,
  37521. 0.0532],
  37522. [ 0.5301, -0.4273, 1.6344, -0.5692, -0.4961, 0.2622, 0.4098,
  37523. 0.2966],
  37524. [ 0.5960, -0.4102, 1.8018, -0.1612, -0.3344, 0.1159, 0.5490,
  37525. 0.2314]]], device='cuda:0')
  37526. loss_train_step before backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  37527. loss_train_step after backward: tensor(0.0091, device='cuda:0', grad_fn=<MseLossBackward>)
  37528. loss_train: 1.1813519136048853
  37529. step: 75
  37530. running loss: 0.01575135884806514
  37531.  
  37532. Train Steps: 75/90 Loss: 0.0158 torch.Size([8, 600, 800])
  37533. torch.Size([8, 8])
  37534. tensor([[0.6117, 0.4018, 0.6562, 0.1967, 0.3738, 0.2550, 0.5280, 0.5103],
  37535. [0.6264, 0.4049, 0.8988, 0.4633, 0.3813, 0.4983, 0.6326, 0.4843],
  37536. [0.6124, 0.4030, 0.8650, 0.4867, 0.4999, 0.5106, 0.5137, 0.5773],
  37537. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  37538. [0.6201, 0.4082, 0.8827, 0.3715, 0.3825, 0.2712, 0.5845, 0.5412],
  37539. [0.6222, 0.4072, 0.7164, 0.2166, 0.3738, 0.3167, 0.6100, 0.5533],
  37540. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  37541. [0.6240, 0.4217, 0.8150, 0.3133, 0.4425, 0.2650, 0.5650, 0.5817]],
  37542. device='cuda:0', dtype=torch.float64)
  37543. predictions are: tensor([[ 4.3204e-01, -4.9423e-01, 8.7678e-01, -1.1577e+00, -4.9900e-01,
  37544. -1.2377e+00, 1.9630e-01, 1.8164e-01],
  37545. [ 6.9072e-01, -3.8656e-01, 2.0222e+00, -1.1292e-01, -5.2003e-01,
  37546. -2.3396e-02, 6.1781e-01, 6.3428e-02],
  37547. [ 3.8911e-01, -5.3941e-01, 1.7964e+00, -3.4572e-02, -9.5070e-03,
  37548. -9.4753e-02, 7.4348e-02, 3.2933e-01],
  37549. [ 6.1090e-01, -4.0105e-01, 1.8377e+00, -9.8769e-02, -1.8835e-01,
  37550. -1.7130e-03, 5.7579e-02, 8.1385e-02],
  37551. [ 6.4133e-01, -3.7246e-01, 1.8869e+00, -5.2754e-01, -5.2379e-01,
  37552. -1.0953e+00, 4.3551e-01, 2.3086e-01],
  37553. [ 6.0569e-01, -3.8838e-01, 1.1288e+00, -1.1754e+00, -5.1845e-01,
  37554. -9.1244e-01, 5.3057e-01, 2.8769e-01],
  37555. [ 5.0548e-01, -4.6197e-01, 1.0753e+00, -1.1920e+00, -4.6685e-01,
  37556. -1.2029e+00, 4.8190e-01, 3.0180e-01],
  37557. [ 5.9589e-01, -3.6515e-01, 1.5408e+00, -7.3261e-01, -3.0263e-01,
  37558. -1.2108e+00, 2.8190e-01, 4.1174e-01]], device='cuda:0',
  37559. grad_fn=<AddmmBackward>)
  37560. landmarks are: tensor([[[ 0.5393, -0.4299, 0.7453, -1.3775, -0.5596, -1.1081, 0.1527,
  37561. 0.0712],
  37562. [ 0.6075, -0.4159, 1.8654, -0.1458, -0.5249, 0.0159, 0.6359,
  37563. -0.0490],
  37564. [ 0.5428, -0.4244, 1.7095, -0.0380, 0.0232, 0.0725, 0.0866,
  37565. 0.3806],
  37566. [ 0.5249, -0.4473, 1.7326, -0.0919, -0.2016, 0.1544, 0.1733,
  37567. 0.0412],
  37568. [ 0.5784, -0.4006, 1.7911, -0.5701, -0.5192, -1.0331, 0.4137,
  37569. 0.2139],
  37570. [ 0.5878, -0.4052, 1.0229, -1.2855, -0.5596, -0.8232, 0.5316,
  37571. 0.2699],
  37572. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  37573. 0.2930],
  37574. [ 0.5964, -0.3380, 1.4785, -0.8386, -0.2420, -1.0619, 0.3238,
  37575. 0.4008]]], device='cuda:0')
  37576. loss_train_step before backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  37577. loss_train_step after backward: tensor(0.0076, device='cuda:0', grad_fn=<MseLossBackward>)
  37578. loss_train: 1.1889062826521695
  37579. step: 76
  37580. running loss: 0.015643503719107492
  37581. Train Steps: 76/90 Loss: 0.0156 torch.Size([8, 600, 800])
  37582. torch.Size([8, 8])
  37583. tensor([[0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  37584. [ nan, nan, 0.7981, 0.3194, 0.3625, 0.3167, 0.5040, 0.5563],
  37585. [0.6213, 0.4131, 0.8438, 0.3550, 0.3513, 0.4400, 0.5716, 0.5123],
  37586. [0.6043, 0.4022, 0.6887, 0.1983, 0.3775, 0.2483, 0.5480, 0.5136],
  37587. [0.6275, 0.4008, 0.8047, 0.2484, 0.4037, 0.2777, 0.6506, 0.5212],
  37588. [0.6179, 0.4008, 0.7505, 0.2678, 0.4368, 0.1891, 0.5831, 0.5263],
  37589. [ nan, nan, 0.7425, 0.2117, 0.3937, 0.2433, 0.5438, 0.5567],
  37590. [0.6249, 0.4142, 0.8350, 0.3283, 0.3613, 0.3700, 0.6188, 0.5400]],
  37591. device='cuda:0', dtype=torch.float64)
  37592. predictions are: tensor([[ 0.6656, -0.3252, 1.6314, -0.9552, -0.1234, -1.3587, 0.5424, 0.1389],
  37593. [-1.9349, -2.0047, 1.2804, -0.8710, -0.5206, -0.9053, 0.0334, 0.3029],
  37594. [ 0.6856, -0.3197, 1.6577, -0.5465, -0.5838, -0.3089, 0.2376, 0.2427],
  37595. [ 0.6226, -0.3830, 0.9294, -1.1398, -0.4260, -1.1295, 0.2986, 0.2081],
  37596. [ 0.6480, -0.3885, 1.4777, -0.9221, -0.3241, -0.9524, 0.6381, 0.1960],
  37597. [ 0.8055, -0.2722, 1.2072, -0.9814, -0.2422, -1.3769, 0.3189, 0.2356],
  37598. [-1.9116, -2.0022, 1.1542, -1.1836, -0.3305, -1.1824, 0.2033, 0.3075],
  37599. [ 0.7482, -0.2765, 1.6254, -0.7034, -0.5661, -0.6050, 0.4760, 0.3313]],
  37600. device='cuda:0', grad_fn=<AddmmBackward>)
  37601. landmarks are: tensor([[[ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  37602. -0.0209],
  37603. [-2.2859, -2.2859, 1.4006, -0.8105, -0.6115, -0.8232, 0.0419,
  37604. 0.2837],
  37605. [ 0.5841, -0.3778, 1.6113, -0.6462, -0.6635, -0.2536, 0.3542,
  37606. 0.0802],
  37607. [ 0.5053, -0.4281, 0.8954, -1.3698, -0.5423, -1.1389, 0.2453,
  37608. 0.0862],
  37609. [ 0.6125, -0.4345, 1.4308, -1.1384, -0.4213, -1.0031, 0.7190,
  37610. 0.1214],
  37611. [ 0.5680, -0.4345, 1.1806, -1.0490, -0.2683, -1.4127, 0.4074,
  37612. 0.1449],
  37613. [-2.2859, -2.2859, 1.1436, -1.3082, -0.4672, -1.1620, 0.2256,
  37614. 0.2853],
  37615. [ 0.6006, -0.3728, 1.5709, -0.7694, -0.6173, -0.5769, 0.5721,
  37616. 0.2083]]], device='cuda:0')
  37617. loss_train_step before backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  37618. loss_train_step after backward: tensor(0.0152, device='cuda:0', grad_fn=<MseLossBackward>)
  37619. loss_train: 1.2041279622353613
  37620. step: 77
  37621. running loss: 0.01563802548357612
  37622. Train Steps: 77/90 Loss: 0.0156 torch.Size([8, 600, 800])
  37623. torch.Size([8, 8])
  37624. tensor([[0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  37625. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  37626. [0.6164, 0.3956, 0.8757, 0.5088, 0.4300, 0.5320, 0.6022, 0.5202],
  37627. [0.6185, 0.4098, 0.8838, 0.4900, 0.4537, 0.5800, 0.6288, 0.5400],
  37628. [0.6132, 0.4037, 0.6963, 0.2217, 0.4100, 0.1950, 0.5395, 0.5175],
  37629. [0.6086, 0.3940, 0.8712, 0.4783, 0.4025, 0.4900, 0.5498, 0.5390],
  37630. [0.6272, 0.4120, 0.9038, 0.4117, 0.3725, 0.3200, 0.6175, 0.5250],
  37631. [0.6230, 0.4152, 0.7588, 0.2283, 0.4012, 0.2883, 0.6200, 0.5767]],
  37632. device='cuda:0', dtype=torch.float64)
  37633. predictions are: tensor([[ 0.6204, -0.3751, 1.7329, -0.1243, -0.1641, 0.0857, 0.3867, 0.3459],
  37634. [ 0.4157, -0.4951, 1.7252, -0.0288, -0.2015, 0.1722, 0.2050, 0.1587],
  37635. [ 0.5428, -0.4652, 1.6959, -0.0345, -0.3847, 0.0054, 0.4109, 0.1474],
  37636. [ 0.4291, -0.5127, 1.7436, -0.1355, -0.2256, 0.2061, 0.4410, 0.2915],
  37637. [ 0.5248, -0.4014, 0.9346, -1.2211, -0.4824, -1.5760, 0.1073, 0.0700],
  37638. [ 0.6467, -0.4007, 1.6932, -0.1175, -0.4838, -0.1200, 0.0742, 0.1444],
  37639. [ 0.4221, -0.5190, 1.8474, -0.4413, -0.6660, -0.8941, 0.4888, 0.2100],
  37640. [ 0.5255, -0.4244, 1.2112, -1.0893, -0.5817, -1.1285, 0.5264, 0.3707]],
  37641. device='cuda:0', grad_fn=<AddmmBackward>)
  37642. landmarks are: tensor([[[ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  37643. 0.2237],
  37644. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  37645. 0.0592],
  37646. [ 0.5614, -0.4586, 1.7587, 0.0641, -0.2998, 0.1712, 0.4958,
  37647. 0.1170],
  37648. [ 0.5709, -0.3933, 1.7961, -0.0226, -0.1901, 0.3931, 0.6182,
  37649. 0.2083],
  37650. [ 0.5465, -0.4214, 0.9300, -1.2620, -0.3921, -1.3852, 0.2062,
  37651. 0.1043],
  37652. [ 0.5250, -0.4661, 1.7383, -0.0765, -0.4268, -0.0226, 0.2535,
  37653. 0.2035],
  37654. [ 0.6111, -0.3828, 1.8885, -0.3844, -0.5654, -0.8079, 0.5663,
  37655. 0.1390],
  37656. [ 0.5915, -0.3682, 1.2187, -1.2313, -0.4326, -0.9541, 0.5778,
  37657. 0.3777]]], device='cuda:0')
  37658. loss_train_step before backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  37659. loss_train_step after backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  37660. loss_train: 1.2163738389499485
  37661. step: 78
  37662. running loss: 0.015594536396794213
  37663. Train Steps: 78/90 Loss: 0.0156 torch.Size([8, 600, 800])
  37664. torch.Size([8, 8])
  37665. tensor([[0.6286, 0.4086, 0.8408, 0.2801, 0.4163, 0.2800, 0.6725, 0.5393],
  37666. [0.6202, 0.3983, 0.8555, 0.5429, 0.3842, 0.4370, 0.5866, 0.5398],
  37667. [ nan, nan, 0.6992, 0.2791, 0.3950, 0.2383, 0.5483, 0.5819],
  37668. [0.6157, 0.4102, 0.8513, 0.3817, 0.3613, 0.3667, 0.5096, 0.5890],
  37669. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  37670. [0.6207, 0.4110, 0.8738, 0.5000, 0.4800, 0.5633, 0.6300, 0.5433],
  37671. [0.6224, 0.4061, 0.8988, 0.4300, 0.3838, 0.4750, 0.6112, 0.5483],
  37672. [0.6101, 0.4042, 0.7775, 0.2617, 0.3713, 0.2817, 0.5440, 0.5650]],
  37673. device='cuda:0', dtype=torch.float64)
  37674. predictions are: tensor([[ 0.4975, -0.4646, 1.5513, -0.9666, -0.3757, -1.0631, 0.8349, 0.2213],
  37675. [ 0.6141, -0.4448, 1.6689, 0.2204, -0.5464, -0.2051, 0.5138, 0.0906],
  37676. [-2.0015, -2.1097, 0.9544, -1.1119, -0.4661, -1.1842, 0.0765, 0.2852],
  37677. [ 0.3614, -0.5117, 1.6381, -0.5652, -0.6371, -0.5385, 0.0116, 0.2458],
  37678. [ 0.4667, -0.4367, 1.1219, -1.0317, -0.2074, -1.4519, 0.2099, 0.2799],
  37679. [ 0.6129, -0.3851, 1.7800, -0.1275, -0.1141, 0.2926, 0.4631, 0.2179],
  37680. [ 0.5707, -0.4434, 1.8278, -0.3480, -0.5337, 0.0171, 0.5358, 0.1088],
  37681. [ 0.4578, -0.4612, 1.2927, -1.0640, -0.5458, -1.0070, 0.0641, 0.2277]],
  37682. device='cuda:0', grad_fn=<AddmmBackward>)
  37683. landmarks are: tensor([[[ 0.6174, -0.3984, 1.5975, -0.9921, -0.3633, -0.9926, 0.8205,
  37684. 0.2050],
  37685. [ 0.5786, -0.4463, 1.6655, 0.2216, -0.5115, -0.2675, 0.4236,
  37686. 0.2075],
  37687. [-2.2859, -2.2859, 0.9438, -0.9967, -0.4614, -1.1851, 0.2468,
  37688. 0.4019],
  37689. [ 0.5581, -0.3912, 1.6460, -0.5230, -0.6173, -0.5923, 0.0681,
  37690. 0.4348],
  37691. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  37692. 0.3931],
  37693. [ 0.5811, -0.3878, 1.7499, 0.0236, -0.0688, 0.3161, 0.6240,
  37694. 0.2237],
  37695. [ 0.5888, -0.4101, 1.8654, -0.2998, -0.5134, -0.0919, 0.5374,
  37696. 0.2468],
  37697. [ 0.5320, -0.4189, 1.3053, -1.0773, -0.5711, -0.9849, 0.2267,
  37698. 0.3237]]], device='cuda:0')
  37699. loss_train_step before backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  37700. loss_train_step after backward: tensor(0.0080, device='cuda:0', grad_fn=<MseLossBackward>)
  37701. loss_train: 1.224423078354448
  37702. step: 79
  37703. running loss: 0.015499026308284152
  37704.  
  37705. Train Steps: 79/90 Loss: 0.0155 torch.Size([8, 600, 800])
  37706. torch.Size([8, 8])
  37707. tensor([[0.6091, 0.3997, 0.8314, 0.4334, 0.3788, 0.4550, 0.5213, 0.5656],
  37708. [0.6250, 0.4103, 0.8950, 0.4400, 0.3912, 0.5650, 0.6050, 0.5133],
  37709. [0.6225, 0.4196, 0.8788, 0.3467, 0.3750, 0.3400, 0.5413, 0.5433],
  37710. [0.6153, 0.4119, 0.8463, 0.3833, 0.3600, 0.3200, 0.5106, 0.5563],
  37711. [0.6138, 0.4101, 0.8800, 0.5083, 0.4637, 0.5950, 0.5587, 0.5077],
  37712. [0.6175, 0.4013, 0.7734, 0.2783, 0.4475, 0.1786, 0.5790, 0.5351],
  37713. [0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  37714. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097]],
  37715. device='cuda:0', dtype=torch.float64)
  37716. predictions are: tensor([[ 0.4846, -0.4914, 1.4329, -0.3428, -0.5375, -0.1980, 0.2619, 0.3136],
  37717. [ 0.5042, -0.4608, 1.7244, -0.3396, -0.4670, 0.3175, 0.5917, 0.2142],
  37718. [ 0.4605, -0.4590, 1.5435, -0.6849, -0.6888, -0.7761, 0.2342, 0.2381],
  37719. [ 0.2250, -0.6154, 1.5077, -0.5573, -0.6753, -0.8241, 0.0768, 0.3247],
  37720. [ 0.4591, -0.4868, 1.6747, -0.0019, -0.1548, 0.3512, 0.3674, 0.1820],
  37721. [ 0.7229, -0.3085, 1.1871, -1.0721, -0.2958, -1.5675, 0.3066, 0.1513],
  37722. [ 0.5734, -0.4881, 1.6056, -0.7844, -0.6470, -0.6891, 0.7640, 0.0590],
  37723. [ 0.4164, -0.5204, 1.6723, -0.1330, -0.2016, 0.1220, 0.1374, 0.1163]],
  37724. device='cuda:0', grad_fn=<AddmmBackward>)
  37725. landmarks are: tensor([[[ 0.5275, -0.4396, 1.5543, -0.2841, -0.5365, -0.1843, 0.1221,
  37726. 0.3265],
  37727. [ 0.6010, -0.3909, 1.8480, -0.2536, -0.4788, 0.3238, 0.5085,
  37728. 0.0851],
  37729. [ 0.5894, -0.3479, 1.7730, -0.6847, -0.5538, -0.7155, 0.2141,
  37730. 0.2237],
  37731. [ 0.5561, -0.3834, 1.6229, -0.5153, -0.6231, -0.8079, 0.0727,
  37732. 0.2837],
  37733. [ 0.5491, -0.3918, 1.7788, 0.0620, -0.1439, 0.4624, 0.2946,
  37734. 0.0592],
  37735. [ 0.5664, -0.4321, 1.2862, -1.0003, -0.2189, -1.4608, 0.3883,
  37736. 0.1855],
  37737. [ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  37738. -0.0220],
  37739. [ 0.5515, -0.4225, 1.7788, -0.0534, -0.2016, 0.1929, 0.1568,
  37740. 0.0682]]], device='cuda:0')
  37741. loss_train_step before backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  37742. loss_train_step after backward: tensor(0.0099, device='cuda:0', grad_fn=<MseLossBackward>)
  37743. loss_train: 1.234301685821265
  37744. step: 80
  37745. running loss: 0.015428771072765812
  37746. Train Steps: 80/90 Loss: 0.0154 torch.Size([8, 600, 800])
  37747. torch.Size([8, 8])
  37748. tensor([[0.6284, 0.4029, 0.8838, 0.3783, 0.3975, 0.2850, 0.6335, 0.5090],
  37749. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  37750. [0.6087, 0.3951, 0.8387, 0.5833, 0.4188, 0.4933, 0.5146, 0.4830],
  37751. [0.6143, 0.4034, 0.8800, 0.4833, 0.4512, 0.5367, 0.5289, 0.5097],
  37752. [0.6257, 0.4024, 0.8672, 0.5422, 0.4196, 0.5198, 0.6694, 0.5204],
  37753. [ nan, nan, 0.8363, 0.3317, 0.3563, 0.3367, 0.5329, 0.5142],
  37754. [0.6109, 0.3943, 0.8525, 0.4950, 0.4338, 0.4800, 0.5449, 0.5383],
  37755. [ nan, nan, 0.8300, 0.3150, 0.3588, 0.3383, 0.5208, 0.5194]],
  37756. device='cuda:0', dtype=torch.float64)
  37757. predictions are: tensor([[ 0.7503, -0.2881, 1.6015, -0.6986, -0.4646, -1.0654, 0.6464, 0.1602],
  37758. [ 0.7804, -0.2480, 1.6838, -0.2485, -0.3454, 0.3726, 0.5508, 0.1698],
  37759. [ 0.6938, -0.3236, 1.5166, 0.2860, -0.4027, -0.0619, 0.1601, 0.1312],
  37760. [ 0.5815, -0.3628, 1.6414, -0.2030, -0.2527, 0.0957, 0.1165, 0.0985],
  37761. [ 0.6586, -0.3652, 1.5467, 0.0677, -0.4092, 0.0632, 0.8244, 0.2094],
  37762. [-2.3185, -2.3273, 1.3828, -0.8933, -0.6300, -0.7669, 0.1151, 0.2224],
  37763. [ 0.6937, -0.3142, 1.5366, -0.1562, -0.3201, -0.1382, 0.1785, 0.2307],
  37764. [-2.0555, -2.1445, 1.3345, -0.8968, -0.6410, -0.7471, 0.0783, 0.2306]],
  37765. device='cuda:0', grad_fn=<AddmmBackward>)
  37766. landmarks are: tensor([[[ 6.1645e-01, -4.2487e-01, 1.7961e+00, -5.3841e-01, -4.4988e-01,
  37767. -9.6952e-01, 6.4006e-01, 6.5205e-02],
  37768. [ 6.0139e-01, -3.8830e-01, 1.8192e+00, -1.1501e-01, -2.8822e-01,
  37769. 4.0077e-01, 5.2009e-01, 9.2841e-02],
  37770. [ 5.2575e-01, -4.6105e-01, 1.5882e+00, 4.0847e-01, -3.5173e-01,
  37771. -7.2363e-03, 9.1027e-02, -5.5027e-02],
  37772. [ 5.5155e-01, -4.2249e-01, 1.7788e+00, -5.3426e-02, -2.0162e-01,
  37773. 1.9292e-01, 1.5683e-01, 6.8210e-02],
  37774. [ 6.0425e-01, -4.2731e-01, 1.7198e+00, 2.1845e-01, -3.4783e-01,
  37775. 1.1492e-01, 8.0616e-01, 1.1755e-01],
  37776. [-2.2859e+00, -2.2859e+00, 1.5767e+00, -7.5396e-01, -6.4042e-01,
  37777. -7.3087e-01, 1.7534e-01, 8.9251e-02],
  37778. [ 5.3603e-01, -4.6490e-01, 1.6517e+00, 4.6189e-04, -2.8245e-01,
  37779. -6.8822e-02, 2.3086e-01, 2.0046e-01],
  37780. [-2.2859e+00, -2.2859e+00, 1.5478e+00, -8.3095e-01, -6.2887e-01,
  37781. -7.2317e-01, 1.1982e-01, 1.1330e-01]]], device='cuda:0')
  37782. loss_train_step before backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  37783. loss_train_step after backward: tensor(0.0122, device='cuda:0', grad_fn=<MseLossBackward>)
  37784. loss_train: 1.246514733415097
  37785. step: 81
  37786. running loss: 0.015389070782902432
  37787. Train Steps: 81/90 Loss: 0.0154 torch.Size([8, 600, 800])
  37788. torch.Size([8, 8])
  37789. tensor([[0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  37790. [0.6196, 0.4088, 0.8888, 0.4583, 0.4500, 0.5683, 0.6138, 0.5883],
  37791. [0.6211, 0.3935, 0.8636, 0.4841, 0.4417, 0.5126, 0.6331, 0.5268],
  37792. [0.6251, 0.4108, 0.8888, 0.4700, 0.4325, 0.5817, 0.6075, 0.5150],
  37793. [0.6086, 0.3981, 0.8700, 0.4750, 0.4512, 0.5283, 0.5324, 0.5038],
  37794. [0.6227, 0.4049, 0.8750, 0.5367, 0.3775, 0.3667, 0.5725, 0.5317],
  37795. [0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  37796. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550]],
  37797. device='cuda:0', dtype=torch.float64)
  37798. predictions are: tensor([[ 0.5458, -0.3904, 1.5569, -0.4111, -0.6724, -0.8364, 0.0369, 0.1736],
  37799. [ 0.5075, -0.4487, 1.7388, -0.2161, -0.2107, 0.4441, 0.5468, 0.3925],
  37800. [ 0.4614, -0.5432, 1.6451, -0.0553, -0.2670, 0.1172, 0.6347, 0.1695],
  37801. [ 0.6589, -0.3599, 1.7563, -0.1110, -0.3010, 0.5124, 0.5206, 0.1081],
  37802. [ 0.6011, -0.4098, 1.6841, -0.1285, -0.2343, 0.1414, 0.1193, -0.0113],
  37803. [ 0.6166, -0.4051, 1.6784, 0.2026, -0.5937, -0.5582, 0.3913, 0.1671],
  37804. [-0.2581, -0.9259, 1.3314, -0.9020, -0.5419, -1.0859, 0.0955, 0.2768],
  37805. [ 0.4362, -0.5123, 1.3979, -0.9372, -0.7266, -0.3351, 0.5126, 0.2498]],
  37806. device='cuda:0', grad_fn=<AddmmBackward>)
  37807. landmarks are: tensor([[[ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  37808. 0.2116],
  37809. [ 0.5759, -0.3978, 1.8192, -0.1689, -0.2074, 0.3392, 0.5490,
  37810. 0.4316],
  37811. [ 0.5828, -0.4682, 1.7031, -0.0497, -0.2458, 0.0818, 0.6381,
  37812. 0.1474],
  37813. [ 0.6014, -0.3883, 1.8192, -0.1150, -0.2882, 0.4008, 0.5201,
  37814. 0.0928],
  37815. [ 0.5249, -0.4473, 1.7326, -0.0919, -0.2016, 0.1544, 0.1733,
  37816. 0.0412],
  37817. [ 0.5901, -0.4157, 1.7557, 0.1929, -0.5423, -0.5923, 0.3584,
  37818. 0.1698],
  37819. [ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  37820. 0.3700],
  37821. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  37822. 0.2776]]], device='cuda:0')
  37823. loss_train_step before backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  37824. loss_train_step after backward: tensor(0.0178, device='cuda:0', grad_fn=<MseLossBackward>)
  37825. loss_train: 1.264311611186713
  37826. step: 82
  37827. running loss: 0.015418434282764792
  37828. Train Steps: 82/90 Loss: 0.0154 torch.Size([8, 600, 800])
  37829. torch.Size([8, 8])
  37830. tensor([[0.6264, 0.4067, 0.9050, 0.4183, 0.3775, 0.4600, 0.6308, 0.4862],
  37831. [0.6329, 0.4055, 0.9050, 0.4783, 0.3613, 0.3917, 0.6464, 0.5019],
  37832. [0.6117, 0.4019, 0.8538, 0.4067, 0.3513, 0.3583, 0.5663, 0.5133],
  37833. [0.6250, 0.4013, 0.8525, 0.5417, 0.4037, 0.5117, 0.6325, 0.5017],
  37834. [0.6128, 0.4118, 0.8638, 0.5333, 0.4625, 0.5267, 0.5193, 0.5475],
  37835. [0.6201, 0.3970, 0.8413, 0.4950, 0.4413, 0.5183, 0.6088, 0.5400],
  37836. [0.6260, 0.4253, 0.8938, 0.4400, 0.3675, 0.3650, 0.5675, 0.5767],
  37837. [0.6161, 0.4024, 0.8838, 0.4583, 0.3688, 0.3733, 0.5311, 0.5344]],
  37838. device='cuda:0', dtype=torch.float64)
  37839. predictions are: tensor([[ 0.5646, -0.4298, 1.7529, -0.4515, -0.6126, -0.0544, 0.5670, 0.0215],
  37840. [ 0.6456, -0.4035, 1.7761, -0.2404, -0.5597, -0.4027, 0.7305, 0.0774],
  37841. [ 0.5289, -0.4356, 1.5772, -0.5750, -0.6524, -0.5157, 0.1538, 0.1797],
  37842. [ 0.3057, -0.6639, 1.6080, 0.1656, -0.4046, 0.2433, 0.5498, 0.0604],
  37843. [ 0.4928, -0.4453, 1.6299, 0.1164, -0.1336, 0.3010, 0.0359, 0.2095],
  37844. [ 0.4195, -0.5548, 1.5906, -0.0317, -0.2286, 0.2824, 0.4368, 0.2617],
  37845. [ 0.5216, -0.3977, 1.7365, -0.2763, -0.5934, -0.4298, 0.2651, 0.4191],
  37846. [ 0.5687, -0.4265, 1.7573, -0.2624, -0.5796, -0.3919, 0.1728, 0.1689]],
  37847. device='cuda:0', grad_fn=<AddmmBackward>)
  37848. landmarks are: tensor([[[ 6.0722e-01, -4.0747e-01, 1.8942e+00, -3.5366e-01, -5.4226e-01,
  37849. -1.6120e-01, 6.2772e-01, -3.9998e-02],
  37850. [ 6.3718e-01, -4.1286e-01, 1.8942e+00, -7.6520e-02, -6.1732e-01,
  37851. -4.7683e-01, 6.9989e-01, 3.2524e-02],
  37852. [ 5.3926e-01, -4.2941e-01, 1.6575e+00, -4.0754e-01, -6.6351e-01,
  37853. -6.3079e-01, 3.2956e-01, 8.5142e-02],
  37854. [ 6.0095e-01, -4.3212e-01, 1.6517e+00, 2.1601e-01, -4.2102e-01,
  37855. 7.7444e-02, 6.3557e-01, 3.1255e-02],
  37856. [ 5.4475e-01, -3.8383e-01, 1.7037e+00, 1.7752e-01, -1.4965e-01,
  37857. 1.4673e-01, 1.1283e-01, 2.4313e-01],
  37858. [ 5.7812e-01, -4.5219e-01, 1.5998e+00, 4.6189e-04, -2.4781e-01,
  37859. 1.0824e-01, 5.2587e-01, 2.0831e-01],
  37860. [ 6.0577e-01, -3.2156e-01, 1.8423e+00, -2.5358e-01, -5.8845e-01,
  37861. -6.0000e-01, 3.3533e-01, 3.7768e-01],
  37862. [ 5.5978e-01, -4.2731e-01, 1.7961e+00, -1.6890e-01, -5.8268e-01,
  37863. -5.6151e-01, 1.6711e-01, 1.8243e-01]]], device='cuda:0')
  37864. loss_train_step before backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  37865. loss_train_step after backward: tensor(0.0094, device='cuda:0', grad_fn=<MseLossBackward>)
  37866. loss_train: 1.2737219003029168
  37867. step: 83
  37868. running loss: 0.015346046991601407
  37869.  
  37870. Train Steps: 83/90 Loss: 0.0153 torch.Size([8, 600, 800])
  37871. torch.Size([8, 8])
  37872. tensor([[0.6275, 0.4013, 0.8850, 0.2833, 0.4975, 0.2233, 0.7058, 0.5343],
  37873. [0.6085, 0.4005, 0.8400, 0.4317, 0.3763, 0.4750, 0.5476, 0.5058],
  37874. [0.6115, 0.3998, 0.7063, 0.2383, 0.4037, 0.1950, 0.5320, 0.4993],
  37875. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  37876. [0.6090, 0.4045, 0.7250, 0.2100, 0.4075, 0.2300, 0.5476, 0.5663],
  37877. [0.6218, 0.4185, 0.7338, 0.2650, 0.4625, 0.1950, 0.5687, 0.5800],
  37878. [0.6026, 0.3979, 0.8550, 0.4233, 0.3613, 0.5233, 0.5582, 0.4967],
  37879. [0.6058, 0.3986, 0.8324, 0.4626, 0.3838, 0.4983, 0.5147, 0.5466]],
  37880. device='cuda:0', dtype=torch.float64)
  37881. predictions are: tensor([[ 0.5970, -0.4386, 1.7881, -0.9258, 0.0162, -1.1350, 1.0138, 0.0702],
  37882. [ 0.6098, -0.4173, 1.6972, -0.2384, -0.5802, 0.1849, 0.2896, 0.0095],
  37883. [ 0.4448, -0.4789, 1.0836, -1.2496, -0.4350, -1.2242, 0.1473, -0.0186],
  37884. [ 0.7261, -0.3231, 1.8236, 0.1307, -0.6321, 0.0100, 0.5721, 0.3982],
  37885. [-0.4759, -1.1006, 1.1537, -1.1627, -0.4673, -0.9932, 0.2593, 0.3161],
  37886. [ 0.4587, -0.4426, 1.1685, -1.0159, -0.1973, -1.2388, 0.2722, 0.3378],
  37887. [ 0.6435, -0.4056, 1.7502, -0.2111, -0.6102, 0.3916, 0.4004, -0.0266],
  37888. [ 0.5203, -0.4551, 1.6436, -0.0169, -0.4993, 0.3264, 0.1976, 0.1663]],
  37889. device='cuda:0', grad_fn=<AddmmBackward>)
  37890. landmarks are: tensor([[[ 0.6125, -0.4321, 1.8018, -0.9772, 0.0120, -1.2543, 0.9741,
  37891. 0.1821],
  37892. [ 0.5245, -0.4361, 1.5940, -0.2921, -0.5480, -0.0919, 0.2432,
  37893. 0.0502],
  37894. [ 0.5384, -0.4393, 0.9762, -1.1851, -0.4210, -1.3852, 0.1712,
  37895. 0.0201],
  37896. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  37897. 0.5239],
  37898. [ 0.5269, -0.4176, 1.0628, -1.3159, -0.4037, -1.2236, 0.2432,
  37899. 0.3297],
  37900. [ 0.5862, -0.3530, 1.1032, -1.0619, -0.1497, -1.3852, 0.3411,
  37901. 0.3931],
  37902. [ 0.4974, -0.4482, 1.6633, -0.3306, -0.6173, 0.1313, 0.2925,
  37903. 0.0081],
  37904. [ 0.5124, -0.4446, 1.5587, -0.1493, -0.5134, 0.0159, 0.0912,
  37905. 0.2386]]], device='cuda:0')
  37906. loss_train_step before backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  37907. loss_train_step after backward: tensor(0.0350, device='cuda:0', grad_fn=<MseLossBackward>)
  37908. loss_train: 1.3087662127800286
  37909. step: 84
  37910. running loss: 0.015580550152143198
  37911. Train Steps: 84/90 Loss: 0.0156 torch.Size([8, 600, 800])
  37912. torch.Size([8, 8])
  37913. tensor([[0.6229, 0.4198, 0.7662, 0.2700, 0.4700, 0.2133, 0.5675, 0.5783],
  37914. [0.6133, 0.4094, 0.8495, 0.4028, 0.3588, 0.3200, 0.5003, 0.5407],
  37915. [0.6144, 0.4032, 0.8563, 0.3283, 0.3525, 0.4200, 0.5775, 0.5583],
  37916. [0.6261, 0.4029, 0.8720, 0.3364, 0.3665, 0.3753, 0.6531, 0.5183],
  37917. [0.6210, 0.4164, 0.7202, 0.2930, 0.4025, 0.2483, 0.5687, 0.5567],
  37918. [0.6201, 0.4098, 0.8575, 0.3617, 0.3700, 0.3550, 0.5988, 0.5667],
  37919. [0.6095, 0.4002, 0.8533, 0.5168, 0.5031, 0.5094, 0.5125, 0.5433],
  37920. [0.6275, 0.4050, 0.9038, 0.3767, 0.3838, 0.3533, 0.7074, 0.5575]],
  37921. device='cuda:0', dtype=torch.float64)
  37922. predictions are: tensor([[ 3.2658e-01, -5.4547e-01, 1.2428e+00, -1.0113e+00, -1.1611e-01,
  37923. -1.1311e+00, 2.8831e-01, 3.0673e-01],
  37924. [ 4.7822e-01, -4.6463e-01, 1.6447e+00, -3.4109e-01, -5.8065e-01,
  37925. -7.2646e-01, 7.7841e-02, 1.1476e-01],
  37926. [ 4.7345e-01, -4.9782e-01, 1.6934e+00, -7.2943e-01, -6.7776e-01,
  37927. -2.3362e-01, 3.6246e-01, 1.4206e-01],
  37928. [ 6.8065e-01, -4.0213e-01, 1.7472e+00, -7.7854e-01, -5.4823e-01,
  37929. -4.4851e-01, 7.6350e-01, 1.3053e-03],
  37930. [ 7.1257e-02, -7.2028e-01, 1.1654e+00, -9.3299e-01, -4.1678e-01,
  37931. -8.6892e-01, 3.4502e-01, 2.8765e-01],
  37932. [ 5.8301e-01, -4.2550e-01, 1.6716e+00, -5.7195e-01, -5.2895e-01,
  37933. -4.7976e-01, 4.6565e-01, 2.3277e-01],
  37934. [ 5.5077e-01, -4.6933e-01, 1.6813e+00, 2.6087e-01, 1.6187e-02,
  37935. 3.4759e-01, 3.8679e-03, 1.3716e-01],
  37936. [ 4.8412e-01, -5.3995e-01, 1.8609e+00, -4.5671e-01, -4.9464e-01,
  37937. -4.9666e-01, 1.0809e+00, 2.0112e-01]], device='cuda:0',
  37938. grad_fn=<AddmmBackward>)
  37939. landmarks are: tensor([[[ 0.5912, -0.3467, 1.2533, -1.0388, -0.1150, -1.3005, 0.3353,
  37940. 0.3854],
  37941. [ 0.5470, -0.3952, 1.6377, -0.4253, -0.6289, -0.8079, 0.0249,
  37942. 0.2116],
  37943. [ 0.5520, -0.4237, 1.6691, -0.7694, -0.6577, -0.3460, 0.3815,
  37944. 0.2930],
  37945. [ 0.6059, -0.4249, 1.7420, -0.7321, -0.5931, -0.5523, 0.7307,
  37946. 0.1080],
  37947. [ 0.5824, -0.3625, 1.0405, -0.9325, -0.4268, -1.1389, 0.3411,
  37948. 0.2853],
  37949. [ 0.5783, -0.3933, 1.6748, -0.6154, -0.5769, -0.6462, 0.4797,
  37950. 0.3315],
  37951. [ 0.5295, -0.4373, 1.6553, 0.1011, 0.0380, 0.0671, 0.0813,
  37952. 0.2237],
  37953. [ 0.6125, -0.4153, 1.8885, -0.5461, -0.5134, -0.6539, 0.9814,
  37954. 0.2890]]], device='cuda:0')
  37955. loss_train_step before backward: tensor(0.0155, device='cuda:0', grad_fn=<MseLossBackward>)
  37956. loss_train_step after backward: tensor(0.0155, device='cuda:0', grad_fn=<MseLossBackward>)
  37957. loss_train: 1.3242887216620147
  37958. step: 85
  37959. running loss: 0.015579867313670762
  37960. Train Steps: 85/90 Loss: 0.0156 torch.Size([8, 600, 800])
  37961. torch.Size([8, 8])
  37962. tensor([[0.6126, 0.4073, 0.8750, 0.5133, 0.3800, 0.4333, 0.4986, 0.5378],
  37963. [0.6197, 0.4118, 0.8688, 0.5517, 0.4037, 0.5233, 0.5875, 0.5600],
  37964. [0.6246, 0.4090, 0.6964, 0.2027, 0.3925, 0.2683, 0.6088, 0.5583],
  37965. [0.6040, 0.4002, 0.7338, 0.2267, 0.3975, 0.2100, 0.5231, 0.4778],
  37966. [0.6260, 0.4214, 0.8538, 0.5500, 0.3663, 0.3767, 0.5587, 0.5983],
  37967. [0.6147, 0.4081, 0.8538, 0.3400, 0.3663, 0.3150, 0.5142, 0.4875],
  37968. [0.6195, 0.4101, 0.8650, 0.3917, 0.3575, 0.4033, 0.5800, 0.5650],
  37969. [0.6207, 0.4081, 0.7662, 0.2067, 0.3962, 0.3200, 0.6312, 0.5300]],
  37970. device='cuda:0', dtype=torch.float64)
  37971. predictions are: tensor([[ 0.4749, -0.4938, 1.8200, 0.1421, -0.4529, -0.0682, 0.2061, 0.1641],
  37972. [ 0.4511, -0.5150, 1.8038, 0.3654, -0.4010, 0.4584, 0.4593, 0.1613],
  37973. [ 0.4468, -0.5258, 1.0679, -1.3597, -0.4119, -0.9884, 0.5265, 0.2220],
  37974. [ 0.4100, -0.5387, 1.1669, -1.3780, -0.4079, -1.1665, 0.2400, -0.0464],
  37975. [ 0.4981, -0.4564, 1.6810, 0.3457, -0.4863, -0.4005, 0.3559, 0.3938],
  37976. [ 0.6217, -0.4062, 1.7781, -0.7077, -0.5463, -0.6803, 0.2540, -0.0090],
  37977. [ 0.4976, -0.4992, 1.7516, -0.4075, -0.5858, -0.2284, 0.3990, 0.2871],
  37978. [ 0.5423, -0.4508, 1.3129, -1.3409, -0.4253, -0.7361, 0.7393, 0.1741]],
  37979. device='cuda:0', grad_fn=<AddmmBackward>)
  37980. landmarks are: tensor([[[ 0.5435, -0.4045, 1.7557, 0.0851, -0.5307, -0.2844, 0.0172,
  37981. 0.1980],
  37982. [ 0.5762, -0.3840, 1.7268, 0.2622, -0.4210, 0.1313, 0.4277,
  37983. 0.3007],
  37984. [ 0.5992, -0.3968, 0.9307, -1.3497, -0.4730, -1.0465, 0.5259,
  37985. 0.2930],
  37986. [ 0.5037, -0.4375, 1.1032, -1.2390, -0.4499, -1.3159, 0.1301,
  37987. -0.0791],
  37988. [ 0.6055, -0.3393, 1.6575, 0.2545, -0.5942, -0.5461, 0.2949,
  37989. 0.4778],
  37990. [ 0.5532, -0.4008, 1.6575, -0.7155, -0.5942, -0.8309, 0.0890,
  37991. -0.0340],
  37992. [ 0.5757, -0.3917, 1.7095, -0.4768, -0.6346, -0.4229, 0.3931,
  37993. 0.3238],
  37994. [ 0.5809, -0.4011, 1.2533, -1.3313, -0.4557, -0.8079, 0.6298,
  37995. 0.1621]]], device='cuda:0')
  37996. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  37997. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  37998. loss_train: 1.3348985011689365
  37999. step: 86
  38000. running loss: 0.015522075594987634
  38001. Train Steps: 86/90 Loss: 0.0155 torch.Size([8, 600, 800])
  38002. torch.Size([8, 8])
  38003. tensor([[ nan, nan, 0.6793, 0.2110, 0.4012, 0.2167, 0.5112, 0.5583],
  38004. [0.6250, 0.4131, 0.8688, 0.2983, 0.4275, 0.2367, 0.6162, 0.5367],
  38005. [0.6169, 0.4108, 0.6821, 0.2722, 0.3825, 0.2550, 0.5550, 0.5717],
  38006. [0.6059, 0.4002, 0.7562, 0.2767, 0.3538, 0.3033, 0.5529, 0.5455],
  38007. [0.6271, 0.4020, 0.8375, 0.6083, 0.3925, 0.4867, 0.6037, 0.4626],
  38008. [0.6228, 0.4119, 0.7938, 0.2233, 0.4674, 0.1773, 0.6188, 0.5433],
  38009. [0.6102, 0.4001, 0.7738, 0.3583, 0.3463, 0.3800, 0.5524, 0.5689],
  38010. [0.6199, 0.4102, 0.8950, 0.4417, 0.4012, 0.5367, 0.6112, 0.5967]],
  38011. device='cuda:0', dtype=torch.float64)
  38012. predictions are: tensor([[-2.6211, -2.5212, 1.0486, -1.1651, -0.4450, -0.9817, 0.1317, 0.2193],
  38013. [ 0.6544, -0.3648, 1.8017, -0.8586, -0.2291, -1.0695, 0.6752, 0.0898],
  38014. [ 0.6067, -0.3832, 0.9838, -1.1507, -0.4227, -1.1178, 0.2797, 0.2733],
  38015. [ 0.4072, -0.5191, 1.3219, -1.0060, -0.5335, -0.8429, 0.3747, 0.1266],
  38016. [ 0.4585, -0.5462, 1.6707, 0.4150, -0.4383, 0.0116, 0.4843, -0.0506],
  38017. [ 0.5655, -0.4500, 1.4585, -1.1970, -0.0922, -1.2743, 0.6101, 0.1232],
  38018. [ 0.3720, -0.5204, 1.4266, -0.6348, -0.6016, -0.5184, 0.2348, 0.2190],
  38019. [ 0.3983, -0.5229, 1.9028, -0.1224, -0.4020, 0.3903, 0.5228, 0.3090]],
  38020. device='cuda:0', grad_fn=<AddmmBackward>)
  38021. landmarks are: tensor([[[-2.2859, -2.2859, 0.8516, -1.3112, -0.4326, -1.2851, 0.0755,
  38022. 0.2930],
  38023. [ 0.6011, -0.3778, 1.7268, -0.9079, -0.3113, -1.1928, 0.5605,
  38024. 0.1929],
  38025. [ 0.5633, -0.3883, 0.8648, -1.0288, -0.5192, -1.1081, 0.2776,
  38026. 0.3546],
  38027. [ 0.5129, -0.4374, 1.2072, -1.0080, -0.6520, -0.8848, 0.2679,
  38028. 0.2335],
  38029. [ 0.6105, -0.4293, 1.5824, 0.5239, -0.4730, -0.0380, 0.5025,
  38030. -0.1492],
  38031. [ 0.5908, -0.3832, 1.3804, -1.2543, -0.1270, -1.4671, 0.5721,
  38032. 0.2237],
  38033. [ 0.5327, -0.4381, 1.2880, -0.6308, -0.6866, -0.5307, 0.2658,
  38034. 0.3417],
  38035. [ 0.5772, -0.3913, 1.8480, -0.2459, -0.4326, 0.1929, 0.5374,
  38036. 0.4701]]], device='cuda:0')
  38037. loss_train_step before backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  38038. loss_train_step after backward: tensor(0.0132, device='cuda:0', grad_fn=<MseLossBackward>)
  38039. loss_train: 1.3481103568337858
  38040. step: 87
  38041. running loss: 0.015495521342917078
  38042.  
  38043. Train Steps: 87/90 Loss: 0.0155 torch.Size([8, 600, 800])
  38044. torch.Size([8, 8])
  38045. tensor([[0.6255, 0.4017, 0.8688, 0.3217, 0.3638, 0.3550, 0.6344, 0.4901],
  38046. [0.6218, 0.4098, 0.7238, 0.1850, 0.4238, 0.2517, 0.6288, 0.5350],
  38047. [0.6275, 0.4111, 0.8463, 0.2617, 0.4487, 0.1983, 0.6211, 0.4904],
  38048. [0.6258, 0.4038, 0.8750, 0.4883, 0.3900, 0.5500, 0.6375, 0.5217],
  38049. [0.6173, 0.4013, 0.8713, 0.4640, 0.4800, 0.5700, 0.6025, 0.5600],
  38050. [0.6292, 0.4010, 0.8988, 0.4800, 0.3638, 0.3817, 0.6357, 0.5051],
  38051. [0.6143, 0.4055, 0.8150, 0.2767, 0.3825, 0.2567, 0.5173, 0.4901],
  38052. [0.6179, 0.3998, 0.8396, 0.3505, 0.3552, 0.3768, 0.6064, 0.5329]],
  38053. device='cuda:0', dtype=torch.float64)
  38054. predictions are: tensor([[ 0.2906, -0.6409, 1.6966, -0.7035, -0.6151, -0.6604, 0.4858, 0.0571],
  38055. [ 0.6713, -0.3423, 1.0141, -1.4186, -0.3000, -1.2024, 0.4727, 0.3262],
  38056. [ 0.7239, -0.2935, 1.5762, -1.0051, -0.1290, -1.1708, 0.5538, 0.0640],
  38057. [ 0.5389, -0.4618, 1.8069, 0.0371, -0.4642, 0.2881, 0.5613, 0.1595],
  38058. [ 0.3526, -0.5561, 1.7288, -0.0225, -0.1932, 0.3346, 0.4374, 0.2839],
  38059. [ 0.3348, -0.6103, 1.7632, -0.0713, -0.5542, -0.5833, 0.5219, 0.1729],
  38060. [ 0.6104, -0.3794, 1.3945, -0.9225, -0.5040, -1.0243, 0.0740, 0.1107],
  38061. [ 0.6039, -0.4215, 1.6051, -0.6760, -0.6397, -0.5594, 0.4211, 0.2860]],
  38062. device='cuda:0', grad_fn=<AddmmBackward>)
  38063. landmarks are: tensor([[[ 0.6031, -0.4307, 1.7268, -0.8002, -0.6058, -0.6462, 0.6442,
  38064. -0.0220],
  38065. [ 0.5861, -0.3929, 1.0570, -1.4314, -0.3286, -1.1235, 0.6182,
  38066. 0.1852],
  38067. [ 0.6126, -0.3871, 1.6229, -1.0773, -0.2132, -1.3698, 0.5829,
  38068. -0.0209],
  38069. [ 0.6047, -0.4209, 1.7557, -0.0303, -0.4845, 0.2545, 0.6587,
  38070. 0.1236],
  38071. [ 0.5652, -0.4325, 1.7388, -0.1429, -0.0688, 0.3469, 0.4970,
  38072. 0.3007],
  38073. [ 0.6204, -0.4336, 1.8654, -0.0688, -0.6058, -0.5230, 0.6503,
  38074. 0.0472],
  38075. [ 0.5515, -0.4129, 1.4785, -1.0080, -0.5192, -1.1004, 0.1034,
  38076. -0.0220],
  38077. [ 0.5680, -0.4393, 1.5920, -0.6672, -0.6453, -0.5457, 0.5149,
  38078. 0.1753]]], device='cuda:0')
  38079. loss_train_step before backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  38080. loss_train_step after backward: tensor(0.0106, device='cuda:0', grad_fn=<MseLossBackward>)
  38081. loss_train: 1.3586613987572491
  38082. step: 88
  38083. running loss: 0.015439334076786921
  38084. Train Steps: 88/90 Loss: 0.0154 torch.Size([8, 600, 800])
  38085. torch.Size([8, 8])
  38086. tensor([[0.6182, 0.4099, 0.7812, 0.3000, 0.3937, 0.2367, 0.5325, 0.5750],
  38087. [ nan, nan, 0.7515, 0.2708, 0.3987, 0.2267, 0.5162, 0.5567],
  38088. [0.6078, 0.4033, 0.8019, 0.3055, 0.3450, 0.4200, 0.6025, 0.5550],
  38089. [0.6168, 0.4081, 0.8438, 0.3367, 0.3500, 0.4667, 0.6212, 0.5400],
  38090. [0.6239, 0.4174, 0.8425, 0.5733, 0.4825, 0.4500, 0.5625, 0.5933],
  38091. [0.6346, 0.4092, 0.7712, 0.5917, 0.4037, 0.4767, 0.7343, 0.5725],
  38092. [0.6186, 0.3967, 0.7337, 0.1992, 0.4120, 0.2508, 0.6105, 0.5395],
  38093. [0.6179, 0.4118, 0.7278, 0.4237, 0.3588, 0.3400, 0.5675, 0.5917]],
  38094. device='cuda:0', dtype=torch.float64)
  38095. predictions are: tensor([[ 0.7738, -0.2730, 1.4386, -1.0415, -0.3418, -1.2038, 0.2729, 0.1546],
  38096. [-2.5829, -2.4818, 1.2752, -1.0553, -0.4747, -1.0027, 0.1306, 0.1917],
  38097. [ 0.3546, -0.5509, 1.5533, -0.9022, -0.6610, -0.4159, 0.4727, 0.1213],
  38098. [ 0.2965, -0.5853, 1.7268, -0.7251, -0.6103, -0.2529, 0.5206, 0.1225],
  38099. [ 0.4197, -0.4712, 1.7078, 0.2913, -0.0776, -0.2989, 0.2674, 0.2726],
  38100. [ 0.4849, -0.4927, 1.4642, 0.1457, -0.4687, -0.2381, 0.8454, 0.2116],
  38101. [ 0.5784, -0.4329, 1.1811, -1.4583, -0.3245, -1.2026, 0.5778, 0.1081],
  38102. [ 0.6367, -0.3579, 1.3764, -0.5841, -0.5169, -0.8698, 0.3198, 0.3117]],
  38103. device='cuda:0', grad_fn=<AddmmBackward>)
  38104. landmarks are: tensor([[[ 0.5695, -0.3927, 1.3226, -0.9002, -0.4672, -1.1928, 0.1737,
  38105. 0.3700],
  38106. [-2.2859, -2.2859, 1.1854, -1.0352, -0.4441, -1.2390, 0.0986,
  38107. 0.2853],
  38108. [ 0.5215, -0.4232, 1.4182, -0.8747, -0.6924, -0.3460, 0.4970,
  38109. 0.2776],
  38110. [ 0.5631, -0.4008, 1.6113, -0.7309, -0.6693, -0.1304, 0.5836,
  38111. 0.2083],
  38112. [ 0.5959, -0.3579, 1.6055, 0.3623, -0.0573, -0.2074, 0.3122,
  38113. 0.4547],
  38114. [ 0.6454, -0.3960, 1.2764, 0.4470, -0.4210, -0.0842, 1.1057,
  38115. 0.3585],
  38116. [ 0.5713, -0.4538, 1.1028, -1.3659, -0.3831, -1.1273, 0.5340,
  38117. 0.2058],
  38118. [ 0.5680, -0.3840, 1.0756, -0.3290, -0.6289, -0.7155, 0.3353,
  38119. 0.4470]]], device='cuda:0')
  38120. loss_train_step before backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  38121. loss_train_step after backward: tensor(0.0193, device='cuda:0', grad_fn=<MseLossBackward>)
  38122. loss_train: 1.3779842429794371
  38123. step: 89
  38124. running loss: 0.015482969022240866
  38125. Train Steps: 89/90 Loss: 0.0155 torch.Size([8, 600, 800])
  38126. torch.Size([8, 8])
  38127. tensor([[0.6129, 0.3925, 0.8720, 0.5246, 0.4534, 0.5515, 0.6026, 0.5114],
  38128. [ nan, nan, 0.7553, 0.2722, 0.3875, 0.2550, 0.5125, 0.5633],
  38129. [0.6186, 0.4060, 0.8750, 0.5050, 0.3538, 0.4367, 0.5813, 0.6083],
  38130. [0.6261, 0.3987, 0.9045, 0.4208, 0.3600, 0.4633, 0.6570, 0.5162],
  38131. [0.6132, 0.4066, 0.7259, 0.2402, 0.3588, 0.3300, 0.6000, 0.5600],
  38132. [0.6286, 0.3977, 0.9038, 0.4733, 0.3900, 0.4150, 0.7074, 0.5320],
  38133. [0.6203, 0.4021, 0.8780, 0.5031, 0.3667, 0.3882, 0.5842, 0.5405],
  38134. [0.6261, 0.4066, 0.8325, 0.2150, 0.4763, 0.2667, 0.7002, 0.5633]],
  38135. device='cuda:0', dtype=torch.float64)
  38136. predictions are: tensor([[ 0.5745, -0.4073, 1.7057, 0.1399, -0.1932, 0.2375, 0.3406, 0.0806],
  38137. [-2.1859, -2.2379, 1.2122, -1.0418, -0.5679, -0.9760, 0.1158, 0.2787],
  38138. [ 0.5295, -0.4313, 1.7288, 0.0070, -0.5881, -0.3866, 0.3565, 0.3972],
  38139. [ 0.4754, -0.4928, 1.8224, -0.3816, -0.6022, -0.2334, 0.5597, 0.0926],
  38140. [ 0.5929, -0.3855, 1.1233, -1.2087, -0.5744, -0.8558, 0.3877, 0.1927],
  38141. [ 0.5226, -0.4764, 1.7320, -0.1790, -0.4929, -0.5515, 0.6222, 0.1111],
  38142. [ 0.6722, -0.3593, 1.7096, -0.0041, -0.5225, -0.5976, 0.3466, 0.1197],
  38143. [ 0.4967, -0.4938, 1.5374, -1.2878, -0.1328, -1.1846, 0.8814, 0.1625]],
  38144. device='cuda:0', grad_fn=<AddmmBackward>)
  38145. landmarks are: tensor([[[ 0.5450, -0.4730, 1.7420, 0.1372, -0.1919, 0.2614, 0.4976,
  38146. 0.0764],
  38147. [-2.2859, -2.2859, 1.2030, -1.0288, -0.4961, -1.1081, 0.0813,
  38148. 0.3161],
  38149. [ 0.5713, -0.4105, 1.7557, 0.0467, -0.6520, -0.2690, 0.3988,
  38150. 0.5239],
  38151. [ 0.6059, -0.4442, 1.8921, -0.3422, -0.6230, -0.1461, 0.7489,
  38152. 0.0985],
  38153. [ 0.5466, -0.4080, 1.0668, -1.1764, -0.6289, -0.7617, 0.4855,
  38154. 0.3007],
  38155. [ 0.6174, -0.4490, 1.8885, -0.0996, -0.4845, -0.3691, 0.9814,
  38156. 0.1715],
  38157. [ 0.5791, -0.4289, 1.7694, 0.0379, -0.5923, -0.4927, 0.4126,
  38158. 0.2107],
  38159. [ 0.6059, -0.4080, 1.5594, -1.2928, -0.0861, -1.0542, 0.9485,
  38160. 0.3157]]], device='cuda:0')
  38161. loss_train_step before backward: tensor(0.0084, device='cuda:0', grad_fn=<MseLossBackward>)
  38162. loss_train_step after backward: tensor(0.0084, device='cuda:0', grad_fn=<MseLossBackward>)
  38163. loss_train: 1.3864263747818768
  38164. step: 90
  38165. running loss: 0.015404737497576409
  38166. Valid Steps: 10/10 Loss: nan 6.8743
  38167. --------------------------------------------------
  38168. Epoch: 10 Train Loss: 0.0154 Valid Loss: nan
  38169. --------------------------------------------------
  38170. Training Complete
  38171. Total Elapsed Time : 463.1469588279724 s
  38172.  
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement