---
# Experiment settings pairing the 'hammer-v0' environment with the
# 'hammer-human-v0' dataset.
# NOTE(review): the code that consumes this file is not visible from here, so
# the per-key notes below are inferred from key names only. Confirm them
# against the loader before relying on them.

# Dataset and environment identifiers (kept as quoted strings).
data_name: 'hammer-human-v0'
env_name: 'hammer-v0'

# Presumably the maximum number of steps in one episode; TODO confirm.
max_ep_len: 200

# Presumably the target returns to evaluate against, and the divisor applied
# to returns before they are used; TODO confirm units with the consumer.
env_targets: [20000, 10000, 5000]
scale: 1000

# Canonical lowercase boolean: resolves to a bool under both YAML 1.1 and 1.2
# loaders, whereas capitalised spellings are flagged by yamllint `truthy`.
delayed_reward: false

# Presumably the fraction of trajectories to use (1.0 = all); TODO confirm.
pct_traj: 1.0

# NOTE(review): `K` looks like a context/sequence length; verify with caller.
K: 20
batch_size: 64

# Two-element ranges, presumably [min, max] statistics of the dataset's
# returns and per-step rewards; TODO confirm. Values are kept at full
# precision on purpose; do not round them.
return_scale: [-260.2401428222656, 9570.416015625]
reward_scale: [-1.927051305770874, 101.8631591796875]