---
# Experiment configuration pairing the "door-human-v0" dataset with the
# "door-v0" environment. The consumer of this file is not visible here, so
# notes on how a value is used are marked as assumptions to confirm.

# Dataset and environment identifiers (kept as quoted strings).
data_name: "door-human-v0"
env_name: "door-v0"

# NOTE(review): presumably the maximum number of steps per episode - confirm.
max_ep_len: 200

# NOTE(review): presumably the target returns to condition/evaluate on,
# listed from highest to lowest - confirm against the consumer.
env_targets: [2000, 1000, 500]

# NOTE(review): presumably a normalisation divisor for returns - confirm.
scale: 100

# Canonical lowercase boolean; loads as the same value as `False`.
delayed_reward: false

# NOTE(review): presumably the fraction of trajectories used (1.0 = all).
pct_traj: 1.0

# NOTE(review): presumably the context/sequence length - confirm.
K: 20
batch_size: 64

# Two-element numeric ranges. NOTE(review): these look like [min, max]
# bounds of episode return and per-step reward for the dataset - confirm.
return_scale: [-51.026405334472656, 1136.8375244140625]
reward_scale: [-0.30145949125289917, 19.992286682128906]