model_family: llama2-7b
# model_path: models/TOFU
model_path: paper_models/final_ft_noLORA_5_epochs_inst_lr1e-05_llama2-7b_full_seed42_1/checkpoint-625

LoRA:
  r: 0
  alpha: 32
  dropout: 0.05

lr: 1e-5

split: forget05
retain_set: retain95
trigger: false
trigger_file_path: data
batch_size: 1
gradient_accumulation_steps: 4
num_epochs: 10
forget_loss: npo_grad_diff

npo_coeff: 0.1375
grad_diff_coeff: 1.0
KL_coeff: 1.0
ref_policy: fine_tuned
beta: 0.1
gamma: 0.0
lambda_entropy: 0.1
weight_decay: 0.01
entropy_lower_bound: 0.02
cl_coeff: 0.1
tau: 0.07
mix_retain_coeff: 1

seed: 1001
run_index: 1
overwrite_dir: false
eval_steps: steps_per_epoch
warmup_steps: steps_per_epoch

save_job_name: local

save_dir: ${model_path}/unlearned/${save_job_name}_8GPU_${forget_loss}_${lr}_${split}_epoch${num_epochs}_batch${batch_size}_accum${gradient_accumulation_steps}_beta${beta}_gamma${gamma}_grad_diff_coeff${grad_diff_coeff}_mix_retain_coeff${mix_retain_coeff}_cl_coeff${cl_coeff}_tau${tau}_ref${ref_policy}_eval${eval_steps}_seed${seed}_${run_index}

eval:
  retain_result: data/${..retain_set}_llama_wd0.01/eval_results/ds_size300/eval_log_aggregated.json
  model_path: ${..model_path}
  model_family: ${..model_family}
  save_dir: ${..save_dir}
  aggr_save_dir: ${..aggr_save_dir}
  # data_path: [locuslab/TOFU, locuslab/TOFU, locuslab/TOFU, locuslab/TOFU]
  data_path: [./TOFU_data, ./TOFU_data, ./TOFU_data, ./TOFU_data, ./TOFU_data]
  split: ${..split}_perturbed
  split_list:
    - retain_perturbed
    - real_authors_perturbed
    - world_facts_perturbed
    - ${split}

  eval_task: [eval_log, eval_real_author_wo_options, eval_real_world_wo_options, eval_log_forget]
  question_key: [question, question, question, question]
  answer_key: [answer, answer, answer, answer]
  base_answer_key: [paraphrased_answer, answer, answer, paraphrased_answer]
  perturbed_answer_key: [perturbed_answer, perturbed_answer, perturbed_answer, perturbed_answer]

  generation:
    max_length: 200
    max_new_tokens: null

  save_generated_text: true
  with_ans: false

  ds_size: 300

  overwrite: true
  use_pretrained: false

  batch_size: 30