# Fine-tuning run configuration.
# The ${...} references in save_dir are interpolated from the other top-level
# keys in this file, so the loader must support that syntax
# (presumably OmegaConf/Hydra -- confirm against the training script).
model_family: llama3.1-8b  # alternative value left by the author: llama2-7b

# LoRA adapter settings.
# NOTE(review): r: 0 presumably disables LoRA (full fine-tuning) -- confirm
# against the code that consumes this section.
LoRA:
  r: 0
  alpha: 32
  dropout: 0.05

data_path: locuslab/TOFU
split: full
batch_size: 16
gradient_accumulation_steps: 1
num_epochs: 5
# Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
# resolve a bare `1e-5` as a string rather than a float.
lr: 1.0e-5
weight_decay: 0.01
seed: 42

# Output directory; its name is built from the values above via interpolation.
# Quoted so the templated value is always read as a single plain string.
save_dir: './llm_weights/ft_epoch${num_epochs}_lr${lr}_${model_family}_${split}_wd${weight_decay}_seed${seed}'