---
# Sweep definition. The layout (command / method / metric / parameters /
# program / project) follows the Weights & Biases sweep schema.
#
# Launch line used for each run. The ${...} entries are placeholders that are
# substituted by the sweep launcher, so they are quoted to keep them plain
# strings; together with python3 -m, the value of `program` is run as a module.
command:
  - '${env}'
  - python3
  - '-m'
  - '${program}'
  - '${args}'
# Grid search: one run per combination of the values listed under
# `parameters`.
method: grid
# Metric reported for the sweep, to be maximized.
# NOTE(review): the training script must log a value under exactly this name;
# that cannot be verified from this file alone.
metric:
  name: mean_return
  goal: maximize
# Search space. Only population_name (5 values) and seed (6 values) vary, so
# the grid contains 5 x 6 = 30 combinations; every other entry is pinned to a
# single value.
parameters:
  mode:
    values: [online]
  env_name:
    values: [overcooked]
  # One entry per population to run against.
  population_name:
    values:
      - FF_FCP_IPPO_Overcooked_cramped_room
      - FF_FCP_IPPO_Overcooked_asymm_advantages
      - FF_FCP_IPPO_Overcooked_coord_ring
      - FF_FCP_IPPO_Overcooked_forced_coord
      - FF_FCP_IPPO_Overcooked_counter_circuit
  # NOTE(review): exponent literals written without a decimal point (1e8, 5e7,
  # 1e-3) are resolved as strings by YAML 1.1 loaders such as PyYAML and as
  # floats by YAML 1.2 loaders. They are deliberately left untouched here;
  # confirm the training entry point accepts the form that reaches it.
  total_timesteps:
    values: [1e8]
  rew_shaping_horizon:
    values: [5e7]
  lr:
    values: [1e-3]
  use_layernorm:
    values: [true]
  # Independent repetitions of each configuration.
  seed:
    values: [0, 1, 2, 3, 4, 5]


# Project the sweep and its runs are grouped under.
project: JaxZSC
# Dotted module path (not a file path): it is substituted for ${program} in
# `command`, where it follows `python3 -m`.
program: src.jaxzsc.best_response.best_response_ippo_overcooked_rnn
