['--alg', 'sac', '--env', 'Walker2d-v3', '--learn', 'brac', '--traj', 'expert', '--seed', '0', '--data', '100000']
3980.3825501691595
episode: 0 training return: tensor(-1.1859e+15, device='cuda:0')
episode: 1 training return: tensor(-9.2286e+14, device='cuda:0')
