['--alg', 'ddpg', '--env', 'Swimmer-v3', '--learn', 'baseline', '--traj', 'expert', '--seed', '0']
episode: 0 training return: tensor(-158.7158, device='cuda:0')
episode: 1 training return: tensor(54.8139, device='cuda:0')
episode: 2 training return: tensor(-51.0215, device='cuda:0')
episode: 3 training return: tensor(-80.7501, device='cuda:0')
epoch: 1 test_true_pfm: 10.241300623094997 sim_pfm: -563.6996974948794
episode: 4 training return: tensor(-65.7744, device='cuda:0')
episode: 5 training return: tensor(-45.6831, device='cuda:0')
episode: 6 training return: tensor(-34.1671, device='cuda:0')
episode: 7 training return: tensor(-12.8842, device='cuda:0')
epoch: 2 test_true_pfm: 14.208083155685301 sim_pfm: -501.99638446494936
episode: 8 training return: tensor(-81.7799, device='cuda:0')
episode: 9 training return: tensor(-58.6529, device='cuda:0')
episode: 10 training return: tensor(-223.0952, device='cuda:0')
episode: 11 training return: tensor(-147.3847, device='cuda:0')
epoch: 3 test_true_pfm: -9.802540720424252 sim_pfm: 51.397132956667335
episode: 12 training return: tensor(60.9216, device='cuda:0')
episode: 13 training return: tensor(-164.7164, device='cuda:0')
episode: 14 training return: tensor(-84.4665, device='cuda:0')
episode: 15 training return: tensor(-149.2553, device='cuda:0')
epoch: 4 test_true_pfm: 5.98833016732618 sim_pfm: -129.96455708617577
episode: 16 training return: tensor(-87.5952, device='cuda:0')
episode: 17 training return: tensor(544.6469, device='cuda:0')
episode: 18 training return: tensor(242.8056, device='cuda:0')
episode: 19 training return: tensor(-92.9654, device='cuda:0')
epoch: 5 test_true_pfm: 23.71338429521938 sim_pfm: -139.4180620965548
episode: 20 training return: tensor(-45.3796, device='cuda:0')
episode: 21 training return: tensor(568.8013, device='cuda:0')
episode: 22 training return: tensor(369.0518, device='cuda:0')
episode: 23 training return: tensor(191.6838, device='cuda:0')
epoch: 6 test_true_pfm: 24.2214062742512 sim_pfm: 17.462727520935005
episode: 24 training return: tensor(60.9178, device='cuda:0')
episode: 25 training return: tensor(381.7280, device='cuda:0')
episode: 26 training return: tensor(521.9443, device='cuda:0')
episode: 27 training return: tensor(737.2682, device='cuda:0')
epoch: 7 test_true_pfm: 14.482645797311122 sim_pfm: 712.9529782183469
episode: 28 training return: tensor(697.7855, device='cuda:0')
episode: 29 training return: tensor(686.5688, device='cuda:0')
episode: 30 training return: tensor(683.8411, device='cuda:0')
episode: 31 training return: tensor(682.7283, device='cuda:0')
epoch: 8 test_true_pfm: -14.984451416955249 sim_pfm: 882.4006668598391
episode: 32 training return: tensor(777.5287, device='cuda:0')
episode: 33 training return: tensor(858.5660, device='cuda:0')
episode: 34 training return: tensor(955.3544, device='cuda:0')
episode: 35 training return: tensor(944.4467, device='cuda:0')
epoch: 9 test_true_pfm: -25.0143892209235 sim_pfm: 967.0980295185
