---
# Grid-search sweep definition. The top-level layout (command / method /
# metric / parameters / program / project) matches the Weights & Biases sweep
# configuration schema.
#
# Three parameters list more than one value: layout_name (5), seed (6) and
# learnability_function (5). Every other parameter is pinned to a single
# value, so an exhaustive grid over this file is 5 * 6 * 5 = 150 combinations.

# Launch command template. The ${...} tokens are placeholders filled in by the
# sweep launcher; `-m` makes python3 run ${program} as a module path rather
# than as a script file.
command:
  - ${env}
  - python3
  - -m
  - ${program}
  - ${args}
method: grid
# Metric the sweep reports against, and the direction that counts as better.
metric:
  goal: maximize
  name: eval.eval_pop_returns
parameters:
  mode:
    values:
      - online
  env_name:
    values:
      - overcooked
  # Swept axis (5 values).
  layout_name:
    values:
      - forced_coord
      - asymm_advantages
      - coord_ring
      - counter_circuit
      - cramped_room
  # NOTE(review): exponent literals written without a decimal point (5e7, 3e7,
  # 1e-3 below) are loaded as strings by YAML 1.1 parsers such as PyYAML and as
  # floats by YAML 1.2 parsers. They are left as written so the text handed to
  # the program does not change; confirm the program converts them itself.
  total_timesteps:
    values:
      - 5e7
  rew_shaping_horizon:
    values:
      - 3e7
  # Swept axis (6 values).
  seed:
    values:
      - 0
      - 1
      - 2
      - 3
      - 4
      - 5
  # Swept axis (5 values).
  # NOTE(review): "coefficent" looks like a misspelling of "coefficient". It is
  # kept byte-for-byte because the value presumably has to match a string the
  # program recognises; verify against the program before renaming.
  learnability_function:
    values:
      - gaussian-weighted-standarddev
      - coefficent-of-variation
      - mean-return
      - variance
      - variance-x-mean
  lr:
    values:
      - 1e-3
  sfl_rollout_factor:
    values:
      - 10
  num_envs:
    values:
      - 512
  sfl_buffer_size:
    values:
      - 512
  sfl_buffer_refresh_freq:
    values:
      - 4
  sfl_num_envs_to_sample:
    values:
      - 512
  # Booleans use the canonical lowercase spelling.
  eval_against_pop:
    values:
      - true
  random_reset:
    values:
      - true

# Dotted module path substituted for ${program} in the command above.
program: src.jaxzsc.dpd.dpd_ippo_overcooked_w_bias_rnn
project: JaxZSC
