# SEML settings: the script to launch and the directories it works with.
# NOTE(review): the ANONYMOUS_DIR values look like redacted placeholders —
# replace them with real paths before submitting.
seml:
  # Entry-point script; presumably resolved relative to project_root_dir — confirm.
  executable: scripts/egxc_main.py
  output_dir: ANONYMOUS_DIR
  project_root_dir: ANONYMOUS_DIR

# Slurm submission settings: one experiment per job, with the sbatch options
# listed below requested for each job.
slurm:
  - experiments_per_job: 1
    sbatch_options:
      gres: gpu:1 # number of GPUs
      mem: 16G # memory
      cpus-per-task: 5 # number of CPU cores
      time: 0-12:00 # max run time in D-HH:MM format (here 0 days, 12 hours)
      partition: gpu_a100
      qos: default # other value noted by the author: interactive

# Parameters that take a single value each (they are not swept; see `grid`
# for the swept ones). Keys use dotted paths into the experiment config.
fixed:
  # Run label, dataset location and checkpoint location.
  # NOTE(review): ANONYMOUS_DIR looks like a redacted placeholder — set real
  # paths before use.
  logging.run_name: 'qm9_mgga'
  data.data_set_kwargs.data_dir: ANONYMOUS_DIR
  logging.checkpointing.directory: ANONYMOUS_DIR

  # Disabled override of optimizer.kwargs.schedule.warmup_steps, kept for reference.
  # optimizer.kwargs.schedule.warmup_steps: 10000
  basis.name: '6-31G(d)'  # alternative noted by the author: def2-TZVPD
  model.graph: null

  # NOTE(review): these two keys start with `+`. YAML treats the `+` as part
  # of the key text, so its meaning depends on the consumer — confirm.
  +dataset.name: 'qm9'
  +solver.name: 'scf'

  model.name: 'xcdiff'

  # Loss settings.
  # NOTE(review): 'dick2021' presumably names a published weighting scheme, and
  # discard_first_n presumably excludes the first 12 entries of the sequence
  # the loss is computed over — confirm against the loss implementation.
  loss.decay_type: 'dick2021'
  loss.discard_first_n: 12

  # Pretraining stage: Adam optimizer with plateau handling and early stopping.
  # NOTE(review): null presumably means no existing checkpoint is loaded — confirm.
  pretraining.load_from: null
  pretraining.opt_kwargs.name: 'adam'
  # NOTE(review): patience / cooldown / factor / accumulation_size resemble the
  # arguments of a reduce-on-plateau learning-rate transform; units (steps vs.
  # epochs) are not visible here — confirm.
  pretraining.opt_kwargs.plateau_handling.patience: 5
  pretraining.opt_kwargs.plateau_handling.cooldown: 3
  pretraining.opt_kwargs.plateau_handling.factor: 0.25
  pretraining.opt_kwargs.plateau_handling.accumulation_size: 1000
  pretraining.early_stopping_patience: 50

  # Remaining plateau-handling threshold and general optimizer options.
  pretraining.opt_kwargs.plateau_handling.min_relative_improvement: 0.0001
  pretraining.opt_kwargs.clip_grad_max_norm: 100000
  # NOTE(review): integer 1 rather than boolean true — confirm the consumer
  # accepts a truthy integer here.
  pretraining.opt_kwargs.skip_nans: 1
  pretraining.opt_kwargs.schedule.min_rate: 0  # parameter of the inverse time decay schedule
  pretraining.opt_kwargs.weight_decay: 0

  # Learning-rate schedule for pretraining; the base rate itself is set in `grid`.
  pretraining.opt_kwargs.schedule.decay_schedule: 'inverse_time_decay'
  pretraining.opt_kwargs.schedule.warmup_steps: 100
  pretraining.opt_kwargs.schedule.decay_steps: 1000  # parameter of the inverse time decay schedule

# Swept parameters. Each entry is a `choice` over an explicit `options` list.
# Commented-out options are candidate values kept so they can be re-enabled
# quickly; at present every entry has exactly one active option.
grid:
  # Threshold on the number of heavy atoms used when selecting data
  # (exact filtering rule is defined by the dataset code — confirm).
  data.data_set_kwargs.heavy_atoms_thresh:
    type: choice
    options:
      - 4
      # - 5

  # Base learning rate of the pretraining schedule; only 0.005 is active.
  pretraining.opt_kwargs.schedule.base_rate:
    type: choice
    options:
      # - 0.1
      # - 0.05
      # - 0.01
      - 0.005
      # - 0.003
      # - 0.002
      # - 0.001
      # - 0.0005
      # - 0.0001

  # Disabled sweep over optimizer.kwargs.schedule.base_rate; uncomment the
  # whole entry below to enable it.
  # optimizer.kwargs.schedule.base_rate:
  #   type: choice
  #   options:
  #     - 1.e-5
  #     - 1.e-6
  #     - 1.e-7
