seml:
  executable: scripts/deixc_main.py
  output_dir: ANONYMOUS_DIR
  project_root_dir: ANONYMOUS_DIR

slurm:
  - experiments_per_job: 1
    sbatch_options:
      gres: gpu:1 # num GPUs
      mem: 128G # memory  > 64 GB needed for 7 heavy
      cpus-per-task: 6 # num cores
      time: 1-12:00 # max time, D-HH:MM
      partition: gpu_h100
      qos: default # default # interactive

fixed:
  ##### GENERAL SETTINGS #####
  logging.run_name: 'deixc_def2_TZVP'
  data.data_set_kwargs.data_dir: ANONYMOUS_DIR
  logging.checkpointing.directory: ANONYMOUS_DIR
  +dataset.name: 'qm9'
  +solver.name: 'scf'
  solver.kwargs.cycles: 15
  basis.name: 'def2-TZVP'
  alignment.atom: 1

  ##### REFERENCE FUNCTIONAL #####
  data.deixc_kwargs.method: 'dft_B3LYP'

  ##### INITIAL DENSITY GUESS #####
  initial_density_guess.initial_ref_density_method: null
  initial_density_guess.initial_ref_density_basis: null
  initial_density_guess.min_ref_density_interpolation: 0.0  # TODO: check convergence with and without potential loss terms
  initial_density_guess.max_ref_density_interpolation: 0.0
  initial_density_guess.noise_eps: 0.0

  ##### CHECKPOINT LOADING #####
  # initial_model_params.load_from: '/ceph/hdd/students/eberhare/deixc/checkpoints/deixc_dynamic_reference/deixc_medium/def2_SVP/deixc_dynamic_reference_38/split_0'
  # initial_model_params.checkpoint_type: 'static_pretrain'

  ##### STATIC TRAINING #####
  static_loss.vectorize_along_scf.energy: 'dick2021'
  static_loss.vectorize_along_scf.xc_potential: 'dick2021'
  static_loss.vectorize_along_scf.xc_potential_linear_response: 'dick2021'
  static_loss.vectorize_along_scf.orbital_rotation_direction: 'dick2021'

  # static_loss.relative_weights.xc_potential: 1e-4
  # static_loss.relative_weights.orbital_rotation_direction: 1e-3
  # static_loss.relative_weights.xc_potential_linear_response: 0.0  # TODO: debug
  # static_loss.relative_weights.density_hessian_diagonal: 0.0  # 1e-7

  static_optimizer.name: 'adam'
  static_optimizer.additional_params.b1: 0.9
  static_optimizer.additional_params.b2: 0.999
  static_pretrain.schedule.decay_steps: 1000

  ##### DYNAMIC TRAINING #####
  dynamic_loss.with_dynamic_reference: True
  # dynamic_loss.relative_weights.xc_potential: 1e-4
  # dynamic_loss.n_perturbations: 10
  # dynamic_loss.relative_weights.xc_potential_linear_response: 0.0  # TODO: debug
  # dynamic_loss.relative_weights.density: 0.00001

  dynamic_optimizer.skip_nans: 50
  # TODO: check if we need the following
  # dynamic_optimizer.plateau_handling: null
  # dynamic_optimizer.clip_grad_max_norm: 0.01


grid:
  model.name:
    type: choice
    options:
      # - 'scan'
      - 'deixc_xsmall'
      # - 'nagai2020_xsmall'
      # - 'dick2021_xsmall'
      # - 'nagai2022_xsmall'

  data.data_set_kwargs.heavy_atoms_thresh:
    type: choice
    options:
      # - 'debug'
      - 4
      # - 5
      # - 6
      # - 7

  static_pretrain.early_stopping_patience:
    type: choice
    options:
      # - 200  # QM4   (48 Molecules)
      - 55   # QM5  (174 Molecules)
      # - 12   # QM6  (776 Molecules)
      # - 3    # QM7 (3884 Molecules)

  static_train.early_stopping_patience:
    type: choice
    options:
      # - 200  # QM4   (48 Molecules)
      - 55   # QM5  (174 Molecules)
      # - 12   # QM6  (776 Molecules)
      #- 3    # QM7 (3884 Molecules)

  dynamic_train.early_stopping_patience:
    type: choice
    options:
      # - 400  # QM4   (48 Molecules)
      - 110   # QM5  (174 Molecules)
      # - 24   # QM6  (776 Molecules)
      # - 6    # QM7 (3884 Molecules)

  static_pretrain.schedule.base_rate:
    type: choice
    options:
      # - 0.02  # best so far (def2-SVP)
      - 0.01
      # - 0.001

  static_train.schedule.base_rate:
    type: choice
    options:
      # - 0.001
      # - 0.0001
      - 0.00001

  dynamic_train.schedule.base_rate:
    type: choice
    options:
      # - 0.002
      - 0.001
      # - 0.0001
      # - 0.00001

  # run_seed:
  #   type: choice
  #   options:
      # - 1
      # - 2
      # - 3

