---
# Experiment configuration for the "maze2d-umaze-v1" dataset / environment.
# NOTE(review): the meaning of each key is defined by the code that loads this
# file, which is not visible here; the hedged notes below should be confirmed
# against that consumer.

# Dataset and environment identifiers (the same id is used for both).
data_name: "maze2d-umaze-v1"
env_name: "maze2d-umaze-v1"

# NOTE(review): presumably the maximum episode length in steps -- confirm.
max_ep_len: 999

# NOTE(review): presumably target returns used at evaluation time -- confirm.
env_targets: [300, 200, 150, 100, 50, 20]

# NOTE(review): presumably a divisor/normaliser applied to returns -- confirm.
scale: 10

# Real boolean, written in canonical lowercase form so that every YAML
# version/loader resolves it to a boolean.
delayed_reward: false

# NOTE(review): presumably the fraction of trajectories to use -- confirm.
pct_traj: 1.0

# NOTE(review): presumably the context/sequence length -- confirm.
K: 20
batch_size: 64

# Two-element [low, high] style ranges. Floats carry an explicit fractional
# digit so they are resolved as floats by all loaders.
# NOTE(review): exact interpretation of the bounds is up to the consumer.
return_scale: [0.0, 53.0]
reward_scale: [0.0, 1.0]