# Base model: a family tag plus the checkpoint identifier
# (presumably a Hugging Face Hub id — confirm against the loader).
model_family: "llama2-7b"
model_path: "locuslab/tofu_ft_llama2-7b"

# LoRA adapter settings. `LoRA.r` is also embedded in save_dir.
LoRA:
  targets: "ffn"
  r: 4
  alpha: 8
  dropout: 0

# Optimisation and data settings for the run.
lr: 0.0001
# Dataset split name. It feeds save_dir and eval.split through interpolation;
# per the author's earlier note this was previously null and is now set
# explicitly.
split: "forget10"
data_path: "locuslab/TOFU"
batch_size: 2
gradient_accumulation_steps: 16
num_epochs: 5
# Name of the forgetting objective; also embedded in save_dir.
forget_loss: "grad_diff"
importance_file: null

# Sine-based parameter-efficient adapter configuration.
# NOTE(review): how these keys interact with the LoRA section is decided by the
# training code, which is not visible from this file.
use_sinelora: true
sine_scale: 45.25
# Author's note: frequency chosen for rank 4, based on the paper's LLaMA
# experiments. The value is also embedded in save_dir as the "omega" component.
sine_freq: 100
learnable_sine: false

# Loss hyperparameters (section originally labelled "Hyperparameters for NPO").
# NOTE(review): forget_loss in this file is grad_diff; which of these keys that
# objective actually reads is not visible here — confirm in the training code.
npo_coeff: 1.0
grad_diff_coeff: 1.0
KL_coeff: 1.0
ref_policy: "fine_tuned"
beta: 0.1

# Output directory, assembled from other keys of this file via interpolation.
# With the values set in this file it resolves to
# /data/saved_weights/llama2-7b/grad_diff_SineParameterEfficient_omega100_r4_forget10
save_dir: "/data/saved_weights/${model_family}/${forget_loss}_SineParameterEfficient_omega${sine_freq}_r${LoRA.r}_${split}"
overwrite_dir: true
weight_decay: 0.01
save_model: true
# Run-control flags; both evaluation switches are off in this configuration.
eval_while_train: false
eval_only: false
seed: 42

eval:
  # Evaluation settings. `${..key}` is a relative interpolation: from inside
  # this mapping it resolves to the key of the same name one level up, i.e. the
  # top level of this file.
  model_path: ${..model_path}
  model_family: ${..model_family}
  save_dir: ${..save_dir}
  # data_path, split_list, eval_task and the *_key lists below each have four
  # entries; presumably entry i of every list describes the same evaluation
  # task — confirm against the evaluation code.
  data_path: [locuslab/TOFU, locuslab/TOFU, locuslab/TOFU, locuslab/TOFU]
  # Top-level split plus a `_perturbed` suffix (e.g. forget10_perturbed).
  split: ${..split}_perturbed
  split_list:
    - retain_perturbed
    - real_authors_perturbed
    - world_facts_perturbed
    # Forget-set entry. A bare `${split}` is an absolute interpolation and
    # resolves to the top-level `split` (e.g. forget10), not to the
    # `_perturbed` variant used by every other entry in this list. Reference
    # eval.split instead, which is presumably the split that carries the
    # paraphrased_answer / perturbed_answer columns requested below.
    - ${eval.split}

  eval_task: [eval_log, eval_real_author_wo_options, eval_real_world_wo_options, eval_log_forget]
  question_key: [question, question, question, question]
  answer_key: [answer, answer, answer, answer]
  base_answer_key: [paraphrased_answer, answer, answer, paraphrased_answer]
  perturbed_answer_key: [perturbed_answer, perturbed_answer, perturbed_answer, perturbed_answer]

  # Text-generation limits; max_new_tokens is left unset (null).
  generation:
    max_length: 200
    max_new_tokens: null

  save_generated_text: true

  ds_size: 300

  overwrite: true
  use_pretrained: false

  batch_size: 30
  # Unset here. Example value kept from the original file:
  # retain_result: data/retain90_llama_wd0.01/eval_results/ds_size300/eval_log_aggregated.json
  retain_result: null
