['--alg', 'sac', '--env', 'Hopper-v3', '--learn', 'uncertainty', '--traj', 'expert', '--seed', '0', '--data', '100000']
episode: 0 training return: -1003.1947493386613
episode: 1 training return: -993.8795584374692
