# Experiment configuration for the "pen-human-v0" dataset and the "pen-v0"
# environment.
# NOTE(review): the code that consumes this file is not visible here. Notes
# marked "presumably" are assumptions to confirm against the loader.

# Dataset and environment identifiers.
data_name: "pen-human-v0"
env_name: "pen-v0"

# Presumably the maximum episode length, in environment steps.
max_ep_len: 100

# Presumably the target returns used at evaluation time, with `scale` as the
# divisor applied to returns -- TODO confirm against the consumer.
# NOTE(review): the largest target (12000) is above the upper `return_scale`
# value (~6096); confirm that this is intended.
env_targets: [12000, 6000, 3000, 1500]
scale: 1000

# Canonical lowercase boolean: `False` is only recognised as a boolean by
# YAML 1.1 / core-schema loaders, while `false` is a boolean everywhere.
delayed_reward: false

# Presumably the fraction of trajectories used (1.0 = all) -- TODO confirm.
pct_traj: 1.0

# Presumably the context length in timesteps -- TODO confirm.
K: 20
batch_size: 64

# Two-element numeric ranges; presumably [min, max] statistics of the dataset
# returns and per-step rewards -- TODO confirm ordering and usage.
return_scale: [41.74394989013672, 6096.0439453125]
reward_scale: [-0.856208860874176, 60.9646110534668]