seml:
  executable: scripts/deixc_main.py
  output_dir: ANONYMOUS_DIR
  project_root_dir: ANONYMOUS_DIR

slurm:
  - experiments_per_job: 1
    sbatch_options:
      gres: gpu:1 # num GPUs
      mem: 128G # memory  > 64 GB needed for 7 heavy
      cpus-per-task: 12 # num cores
      time: 1-12:00 # max time, D-HH:MM
      partition: gpu_a100
      qos: default # default # interactive


fixed:
  ##### GENERAL SETTINGS #####
  logging.run_name: 'train_deixc_mgga'
  data.data_set_kwargs.data_dir: ANONYMOUS_DIR
  logging.checkpointing.directory: ANONYMOUS_DIR
  +dataset.name: 'qm9'
  +solver.name: 'scf'
  solver.kwargs.cycles: 15
  basis.name: 'def2-TZVPD'

  ##### DATA #####
  +subset.name: qm9_4
  data.deixc_method_kwargs.backend: 'custom'

  ##### REFERENCE FUNCTIONAL #####
  data.deixc_method_kwargs.xc_str: 'SCAN'

  ##### MODEL #####
  +model.name: 'scaled_deixc_mgga'

  ##### TRAIN STAGES #####
  static_pretrain.epochs: 0
  static_train.epochs: 0
  dynamic_train.schedule.warmup_steps: 1000
  dynamic_optimizer.plateau_handling.min_relative_improvement: 0.005
  dynamic_optimizer.plateau_handling.patience: 1
  dynamic_optimizer.plateau_handling.cooldown: 10
  dynamic_optimizer.plateau_handling.factor: 0.3
  dynamic_train.early_stopping_patience: 400

  dynamic_loss.vectorize_along_scf.xc_energy: 'only_final'

grid:
  dynamic_train.schedule.decay_steps:
    type: choice
    options:
      # - 1000  # best so far
      - 750

  dynamic_optimizer.clip_grad_max_norm:
    type: choice
    options:
      - null  # no clipping
      # - 0.005

  dynamic_optimizer.weight_decay:
    type: choice
    options:
      # - 1e-4
      - 1e-5
      # - 1e-6

  dynamic_train.schedule.warmup_schedule:
    type: choice
    options:
      - linear
      # - quadratic

  dynamic_loss.relative_weights.xc_energy:
    type: choice
    options:
      # - 0.0
      - 1.0

  dynamic_loss.relative_weights.total_energy:
    type: choice
    options:
      # - 0.0
      - 1.0

  dynamic_loss.relative_weights.density:
    type: choice
    options:
      # - 0.0
      # - 1.0
      - 10.0


  dynamic_loss.discard_first_n:
    type: choice
    options:
      # - 3
      - 6
      # - 9
      # - 12

  dynamic_loss.relative_weights.orbital_rotation_gradient:
    type: choice
    options:
      - 0.0
      # - 1-0e-4
      # - 1.0e-6

  dynamic_loss.relative_weights.xc_potential:
    type: choice
    options:
      -  0.0
      # - 1.0e-6

  dynamic_loss.relative_weights.orbital_rotation_hessian:
    type: choice
    options:
      - 0.0
      # - 1e-5
      # - 1e-6

  dynamic_train.schedule.base_rate:
    type: choice
    options:
      # useful for hidden dim = 16
      - 5.0e-2
      - 3.0e-2  # best so far
      - 2.0e-2
      - 1.0e-2  # best so far


  run_seed:
    type: choice
    options:
      - 0
      # - 1
      # - 2
