---
# Experiment configuration for the `mo-ant-v4` environment.
# NOTE(review): key meanings below are inferred from their names; the code
# that consumes this file is not visible here -- confirm against the loader.

# --- Environment / training -------------------------------------------------
# Environment identifier (presumably the id passed to the env factory).
name: mo-ant-v4
# No extra environment-construction arguments are supplied.
make_args: null
# Presumably the per-episode step cap -- TODO confirm.
max_episode_len: 1000
# Presumably the number of parallel environment instances -- TODO confirm.
n_envs: 5
# Presumably the total training step budget -- TODO confirm.
n_total_steps: 1000000
# Presumably a sampling interval measured in steps -- TODO confirm.
sample_freq: 1000

# --- Evaluation -------------------------------------------------------------
# Presumably the number of steps between evaluation rounds -- TODO confirm.
eval_freq: 100000
n_eval_episodes: 20
# Presumably the number of preference vectors sampled per evaluation --
# TODO confirm.
n_prefer_eval_samples: 50

# --- Reward components ------------------------------------------------------
# Three named reward entries; order is preserved from the original list.
rewards:
  - x_vel
  - y_vel
  - energy
