---
# Sweep strategy: every combination of the values listed under `parameters`.
method: grid

# Objective tracked for the sweep: a larger `normalized_score_mean` is better.
metric:
  name: normalized_score_mean
  goal: maximize
# Search space. Only `seed` (4 values) and `episodes_avail` (13 values) vary;
# every other key is pinned to a single value, so the grid has 4 x 13 = 52
# combinations.
parameters:
  checkpoints_path:
    values:
      - checkpoints_restrict
  num_checkpoints:
    values:
      - 1
  seed:
    values:
      - 1
      - 2
      - 3
      - 4
  env_seed:
    values:
      - 1
  # Powers of two from 2^17 (131072) down to 2^5 (32), in descending order.
  episodes_avail:
    values:
      - 131072
      - 65536
      - 32768
      - 16384
      - 8192
      - 4096
      - 2048
      - 1024
      - 512
      - 256
      - 128
      - 64
      - 32
  alpha:
    values:
      - 1.0
  frame_stack:
    values:
      - 8
  include_previous_action:
    values:
      # Canonical lowercase boolean; same parsed value as `True`.
      - true
  qf_lr:
    values:
      # Keep the explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML) resolve
      # a bare `1e-4` as the string "1e-4" rather than the float 0.0001.
      - 1.0e-4
# Script substituted for the `${program}` placeholder in `command` below.
program: 'algorithms/cql.py'

# Argument vector used to launch each run.
# NOTE(review): there is no `${args}` entry, so swept values are not passed on
# the command line; presumably the script reads them from the run's sweep
# config instead -- confirm this is intentional.
command:
  - 'python'
  - '${program}'
  - 'train'
  - 'data_restriction_sweeps/cql_restriction_config.yaml'
