seml:
  executable: scripts/deixc_main.py
  output_dir: ANONYMOUS_DIR
  project_root_dir: ANONYMOUS_DIR

slurm:
  - experiments_per_job: 1
    sbatch_options:
      gres: gpu:1 # num GPUs
      mem: 128G # memory  > 64 GB needed for 7 heavy
      cpus-per-task: 12 # num cores
      time: 1-12:00 # max time, D-HH:MM
      partition: gpu_a100
      qos: default # default # interactive


fixed:
  ##### GENERAL SETTINGS #####
  logging.run_name: 'train_nagai2020_lamb'
  data.data_set_kwargs.data_dir: ANONYMOUS_DIR
  logging.checkpointing.directory: ANONYMOUS_DIR
  +dataset.name: 'qm9'
  +solver.name: 'scf'
  solver.kwargs.cycles: 15
  basis.name: 'def2-TZVPD'

  ##### DATA #####
  +subset.name: qm9_4
  data.deixc_method_kwargs.backend: 'custom'

  ##### REFERENCE FUNCTIONAL #####
  data.deixc_method_kwargs.xc_str: 'SCAN'

  ##### MODEL #####
  +model.name: 'scaled_nagai2020'

  ##### TRAIN STAGES #####
  static_pretrain.epochs: 0
  static_train.epochs: 0
  # dynamic_optimizer.name: 'lamb'
  # dynamic_optimizer.additional_params: null
  dynamic_train.schedule.warmup_steps: 1000
  dynamic_optimizer.plateau_handling.min_relative_improvement: 0.005
  dynamic_optimizer.plateau_handling.patience: 3
  dynamic_optimizer.plateau_handling.cooldown: 10
  dynamic_optimizer.plateau_handling.factor: 0.3
  dynamic_train.early_stopping_patience: 400

  dynamic_loss.vectorize_along_scf.xc_energy: 'only_final'
  # dynamic_loss.xc_potential.per_sample_optimal_gauge: 'L2'

grid:
  dynamic_train.schedule.decay_steps:
    type: choice
    options:
      # - 1000  # best so far
      - 750

  dynamic_optimizer.clip_grad_max_norm:
    type: choice
    options:
      - null # no clipping

  dynamic_optimizer.weight_decay:
    type: choice
    options:
      # - 1e-4
      - 1e-5  # best so far
      # - 1e-6

  dynamic_train.schedule.warmup_schedule:
    type: choice
    options:
      - linear
      # - quadratic

  dynamic_loss.relative_weights.xc_energy:
    type: choice
    options:
      # - 0.0
      - 1.0

  dynamic_loss.relative_weights.total_energy:
    type: choice
    options:
      # - 0.0
      - 1.0  # best so far

  dynamic_loss.relative_weights.density:
    type: choice
    options:
      # - 0.0
      # - 1.0
      - 10.0  # best so far


  dynamic_loss.discard_first_n:
    type: choice
    options:
      # - 3
      - 6
      # - 9
      # - 12

  dynamic_loss.relative_weights.orbital_rotation_gradient:
    type: choice
    options:
      - 0.0  # best so far
      # - 1e-3
      # - 1.0e-6

  dynamic_loss.relative_weights.xc_potential:
    type: choice
    options:
      -  0.0  # best so far
      # - 1.0e-6
      # - 1.0e-7

  dynamic_loss.relative_weights.orbital_rotation_hessian:
    type: choice
    options:
      - 0.0
      # - 1e-5

  dynamic_train.schedule.base_rate:
    type: choice
    options:
      # useful for hidden dim = 16
      # - 1.0e-1
      # - 3.0e-2
      - 1.0e-2  # best so far
      # - 5.5e-3
      # - 3.0e-3


  run_seed:
    type: choice
    options:
      - 0
      # - 1
      # - 2
