# Supervised Fine-tuning Configuration

# Base model identifier; it should be usable as a Hugging Face
# `pretrained_model_name_or_path` value.
base_model_name: 'OpenDFM/ChemDFM-v1.5-8B'
# Molecule notation the model primarily takes as input: SELFIES or SMILES.
model_mol_type: 'SMILES'
# Whether the tokenizer uses the Alpaca instruction format.
use_alpaca: false
# Whether the tokenizer uses the ChemDFM instruction format.
use_chemdfm: true

# Datasets selected for this run, listed by name.
target_datasets:
  - 'chebi'

# Per-dataset limit, keyed by dataset name.
# NOTE(review): presumably a cap on the number of examples used - confirm
# against the data loader.
dataset_limits:
  chebi: 20000

# Task identifiers included in training
tasks:
  - 'molecule_chemdfm'

# Training parameters
epochs: 2
batch_size: 4
gradient_accumulation_steps: 8
# Keep the explicit decimal point in the mantissa: YAML 1.1 loaders such as
# PyYAML resolve a bare `2e-5` as the string "2e-5" instead of a float.
learning_rate: 2.0e-5
weight_decay: 0.001
max_grad_norm: 0.5
# NOTE(review): presumably the fraction of training steps used for
# learning-rate warmup - confirm against the trainer.
warmup_ratio: 0.03
lr_scheduler_type: "cosine"
logging_steps: 10

# LoRA adapter settings
# NOTE(review): r / alpha / dropout presumably map to the LoRA rank, scaling
# factor, and dropout probability - confirm against the training script.
lora_r: 32
lora_alpha: 32
lora_dropout: 0.05
# Module names targeted by LoRA.
lora_target_modules:
  - 'q_proj'
  - 'v_proj'

# Filesystem paths (null means no value is set for that entry)
# NOTE(review): how the consumer treats a null cache_dir / load_directory is
# not visible here - confirm the fallback behaviour in the training script.
cache_dir: null
exp_save_dir: './molfinetune/'
lora_dir: './mollora/'
load_directory: null

# Experiment settings: name identifying this run
exp_name: 'molgen_supervised'