# Settings for the configuration named MO-SafetyPointGoal1-v0.
# NOTE(review): the grouping comments below are inferred from key names only;
# confirm the exact meaning and units of each key against the code that loads
# this file.
name: MO-SafetyPointGoal1-v0

# Episode length, environment count, and step/sampling counters.
max_episode_len: 1000
n_envs: 5
n_total_steps: 3000000
sample_freq: 1000

# Evaluation-related counters.
eval_freq: 100000
n_eval_episodes: 20
n_prefer_eval_samples: 20

# Names listed under the reward and cost groups (plain strings).
rewards:
  - 'reward'
  - 'action_penalty'
costs:
  - 'cost'
