# SEML experiment settings: which script to launch and where the project and
# its outputs live. Directory values are anonymised placeholders.
seml:
  # Root of the code base (SEML resolves `executable` relative to it).
  project_root_dir: ANONYMOUS_DIR
  # Entry-point script run for every experiment.
  executable: 'scripts/compute_deixc_data.py'
  # Output location (per the SEML docs, where Slurm job logs are written).
  output_dir: ANONYMOUS_DIR

# Slurm submission settings, given as a list with a single job template.
slurm:
  - experiments_per_job: 1
    # Resource requests for each job (forwarded to sbatch by SEML).
    sbatch_options:
      # Quoted: the embedded colon must never be subject to implicit typing.
      gres: 'gpu:1'
      mem: 256G
      cpus-per-task: 12
      # Slurm "days-hours:minutes" format, i.e. 12 hours. Quoted so the
      # digit/colon pattern is always read as a string.
      time: '0-12:00'
      partition: gpu_h200
      qos: interactive

# Parameters that are identical for every experiment generated from this file.
fixed:
  data_dir: ANONYMOUS_DIR
  # NOTE(review): presumably the workload is split into n_chunks pieces and
  # this run processes piece chunk_id (1 and 0 = everything) -- confirm
  # against the executable.
  n_chunks: 1
  chunk_id: 0

  # Global random subsampling (applied after any dataset-internal
  # filtering/subsampling). NOTE(review): null presumably disables it.
  dataset.n_samples: null
  dataset.seed: 0

  # NOTE(review): the leading '+' is part of the key text; presumably an
  # "add this key" override prefix interpreted by the executable -- confirm.
  +dataset.name: 'qm40'
  +method.name: 'dft'

  # QM40 dataset: https://doi.org/10.6084/m9.figshare.25993060
  # Contains 162,954 molecules with 10-40 heavy atoms
  # Elements: H(1), C(6), N(7), O(8), F(9), S(16), Cl(17)

  # Dataset-internal subsampling: at most N molecules per heavy-atom bin
  dataset.kwargs.samples_per_heavy_atom_bin: 50

  # Element filtering: exclude molecules containing any of these atomic numbers
  # [9, 16, 17] drops F, S and Cl, keeping only CHNO molecules
  dataset.kwargs.exclude_elements: [9, 16, 17]

  # Heavy atom filtering: exclude molecules with more than N heavy atoms
  # Use null to include all heavy atom counts (up to 40)
  dataset.kwargs.max_heavy_atoms: 20

  method.kwargs.quadrature_grid_level: 1
  # Booleans use canonical lowercase so every YAML loader/linter agrees.
  method.kwargs.use_eri_density_fitting: true
  method.kwargs.use_exchange_density_fitting: true
  # NOTE(review): 0 presumably means no extra worker processes -- confirm.
  method.kwargs.workers: 0

# Swept parameters. Each entry is a `choice` with exactly one option, so the
# sweep as written holds a single combination; add options to widen it.
grid:
  # Backend implementation selected for the method.
  method.kwargs.backend:
    type: choice
    options: ['custom']

  # Basis set name.
  method.kwargs.basis:
    type: choice
    options: ['def2-SVP']

  # Exchange-correlation functional string.
  method.kwargs.xc_str:
    type: choice
    options: ['B3LYP']

