---
# Weights & Biases sweep definition. `grid` search runs every combination of
# the values listed under `parameters`.
method: grid
# Metric associated with the sweep.
# NOTE(review): presumably the training script logs a value under this exact
# name - confirm.
metric:
  name: eval/normalized_score_mean
  goal: maximize
# Swept values. With `method: grid` every combination is run once; only the two
# seed lists have more than one entry, so the grid is 4 x 8 = 32 combinations.
# NOTE(review): the single-valued entries below are presumably fixed
# hyperparameters consumed by algorithms/edac.py - confirm their meaning there.
parameters:
  # Four training seeds.
  train_seed:
    values:
      - 1
      - 2
      - 3
      - 4
  # Eight environment seeds.
  env_seed:
    values:
      - 1
      - 2
      - 3
      - 4
      - 5
      - 6
      - 7
      - 8
  # Everything below is pinned to a single value (not actually swept).
  num_checkpoints:
    values:
      - 32
  num_critics:
    values:
      - 100
  eta:
    values:
      - 0.1
  temperature:
    values:
      - 4.0
  frame_stack:
    values:
      - 8
  include_previous_action:
    values:
      # Canonical lowercase boolean: parsed as a bool by every YAML schema.
      - true
  behavior_policy:
    values:
      - 'smart'
# Script launched for each run; its path is substituted for ${program} below.
program: algorithms/edac.py

# Resulting invocation:
#   python algorithms/edac.py train all_data_sweeps/edac_final_config.yaml
# NOTE(review): the command has no ${args} entry, so the swept values are not
# passed on the command line; presumably the script picks them up from
# wandb.config - confirm.
command:
  - python
  - '${program}'
  - train
  - all_data_sweeps/edac_final_config.yaml
