# Name of the environment this configuration targets.
# NOTE(review): presumably resolved by the consuming framework to an
# environment implementation — confirm against the loader.
env: overcooked

# Environment-specific options for the `env` named in this file.
# NOTE(review): presumably forwarded to the environment constructor as
# keyword arguments — confirm against the loader.
env_args:
  # Booleans use the canonical lowercase form so every YAML 1.1 / 1.2
  # loader and linter agrees on their type.
  # NOTE(review): flag names suggest reward shaping and post-success reset
  # behaviour; exact semantics are defined by the environment — confirm.
  dense_reward: true
  reset_when_success: false

# Evaluation settings.
# NOTE(review): presumably `test_greedy` selects greedy action selection
# during evaluation and `test_nepisode` is the number of evaluation
# episodes per test round — confirm against the runner.
test_greedy: true
test_nepisode: 32

# Reporting cadence; all four intervals share the same value.
# NOTE(review): units are presumably environment timesteps — confirm.
test_interval: 10000
log_interval: 10000
runner_log_interval: 10000
learner_log_interval: 10000

# NOTE(review): presumably the total training budget, in the same units as
# the intervals above — confirm.
t_max: 2050000

# Exploration (epsilon) schedule parameters.
# NOTE(review): presumably epsilon is annealed from `epsilon_start` down to
# `epsilon_finish` over `epsilon_anneal_time` steps; the annealing shape and
# the step unit are defined by the consuming code — confirm.
epsilon_start: 1.0
epsilon_finish: 0.05
epsilon_anneal_time: 50000

# Model-specific hyperparameters.
# NOTE(review): `z_dim` is presumably a latent/embedding dimensionality and
# `n_sub_modules` a count of sub-modules in the agent or mixer; neither is
# defined in this file — confirm against the consuming model code.
z_dim: 8
n_sub_modules: 3
