['--alg', 'ddpg', '--env', 'Swimmer-v3', '--learn', 'baseline', '--traj', 'medium', '--seed', '0']
episode: 0 training return: tensor(-139.6067, device='cuda:0')
episode: 1 training return: tensor(-65.6795, device='cuda:0')
episode: 2 training return: tensor(-127.7476, device='cuda:0')
episode: 3 training return: tensor(-184.3636, device='cuda:0')
epoch: 1 test_true_pfm: 23.84358220831703 sim_pfm: -237.20362272000057
episode: 4 training return: tensor(-132.8318, device='cuda:0')
episode: 5 training return: tensor(-211.1584, device='cuda:0')
episode: 6 training return: tensor(-185.3651, device='cuda:0')
episode: 7 training return: tensor(-143.8647, device='cuda:0')
epoch: 2 test_true_pfm: 13.207066514105268 sim_pfm: -298.7250714592461
episode: 8 training return: tensor(-159.5741, device='cuda:0')
episode: 9 training return: tensor(-190.8071, device='cuda:0')
episode: 10 training return: tensor(-70.9254, device='cuda:0')
episode: 11 training return: tensor(-50.9185, device='cuda:0')
epoch: 3 test_true_pfm: 33.248506911881584 sim_pfm: -296.2093644548906
episode: 12 training return: tensor(-103.3412, device='cuda:0')
episode: 13 training return: tensor(-147.9461, device='cuda:0')
episode: 14 training return: tensor(-85.3056, device='cuda:0')
episode: 15 training return: tensor(-100.1854, device='cuda:0')
epoch: 4 test_true_pfm: 30.322260975831192 sim_pfm: -195.73685507665505
episode: 16 training return: tensor(-108.7829, device='cuda:0')
episode: 17 training return: tensor(-77.5875, device='cuda:0')
episode: 18 training return: tensor(86.9689, device='cuda:0')
episode: 19 training return: tensor(251.9822, device='cuda:0')
epoch: 5 test_true_pfm: 27.561178746490917 sim_pfm: 104.78976072678343
episode: 20 training return: tensor(119.9083, device='cuda:0')
episode: 21 training return: tensor(131.0911, device='cuda:0')
episode: 22 training return: tensor(381.5153, device='cuda:0')
episode: 23 training return: tensor(627.4240, device='cuda:0')
epoch: 6 test_true_pfm: -25.95971169257449 sim_pfm: 665.8495597717585
episode: 24 training return: tensor(620.3989, device='cuda:0')
episode: 25 training return: tensor(617.7345, device='cuda:0')
episode: 26 training return: tensor(549.7150, device='cuda:0')
episode: 27 training return: tensor(607.4203, device='cuda:0')
epoch: 7 test_true_pfm: 3.956941328355189 sim_pfm: 685.5022251347895
episode: 28 training return: tensor(605.4958, device='cuda:0')
episode: 29 training return: tensor(321.8321, device='cuda:0')
episode: 30 training return: tensor(427.2484, device='cuda:0')
episode: 31 training return: tensor(428.3775, device='cuda:0')
epoch: 8 test_true_pfm: 42.220399825365 sim_pfm: 120.70122290269356
episode: 32 training return: tensor(552.7334, device='cuda:0')
episode: 33 training return: tensor(282.7812, device='cuda:0')
episode: 34 training return: tensor(445.7437, device='cuda:0')
episode: 35 training return: tensor(552.1006, device='cuda:0')
epoch: 9 test_true_pfm: 57.15297087225133 sim_pfm: 584.88484815337
episode: 36 training return: tensor(616.0320, device='cuda:0')
