episode: 0 training return: tensor(-498.2421, device='cuda:0')
episode: 1 training return: tensor(-499.9594, device='cuda:0')
episode: 2 training return: tensor(-499.9272, device='cuda:0')
