# ---------- Llama-3.2 ----------
# 1B `_full` checkpoint: hf_key and ft_model_path are the same identifier.
llama3.2-1b:
  hf_key: "open-unlearning/tofu_Llama-3.2-1B-Instruct_full"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "false"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-1B-Instruct_full"

# 1B `_retain90` checkpoint: hf_key and ft_model_path are the same identifier.
llama3.2-1b-retain90:
  hf_key: "open-unlearning/tofu_Llama-3.2-1B-Instruct_retain90"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "false"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-1B-Instruct_retain90"

# 3B `_full` checkpoint: hf_key and ft_model_path are the same identifier.
llama3.2-3b:
  hf_key: "open-unlearning/tofu_Llama-3.2-3B-Instruct_full"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "false"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-3B-Instruct_full"

# 3B `_retain90` checkpoint: hf_key and ft_model_path are the same identifier.
llama3.2-3b-retain90:
  hf_key: "open-unlearning/tofu_Llama-3.2-3B-Instruct_retain90"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "false"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-3B-Instruct_retain90"

# 8B `_full` checkpoint: hf_key and ft_model_path are the same identifier.
# NOTE(review): Llama 3.2 text models were released in 1B and 3B sizes; the 8B
# instruct model belongs to Llama 3.1. Verify that this "3.2-8B" repo id
# actually resolves before relying on this entry.
llama3.2-8b:
  hf_key: "open-unlearning/tofu_Llama-3.2-8B-Instruct_full"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-8B-Instruct_full"

# 8B `_retain90` checkpoint: hf_key and ft_model_path are the same identifier.
# NOTE(review): Llama 3.2 text models were released in 1B and 3B sizes; the 8B
# instruct model belongs to Llama 3.1. Verify that this "3.2-8B" repo id
# actually resolves before relying on this entry.
llama3.2-8b-retain90:
  hf_key: "open-unlearning/tofu_Llama-3.2-8B-Instruct_retain90"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this
  # checkpoint was fine-tuned with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "open-unlearning/tofu_Llama-3.2-8B-Instruct_retain90"

# ---------- Llama-3.1 ----------
# 1B entry; ft_model_path is identical to hf_key, so no separate fine-tuned
# checkpoint is configured here.
# NOTE(review): Llama 3.1 was released in 8B/70B/405B sizes; verify that
# "meta-llama/Llama-3.1-1B" resolves (a 1B model exists under Llama 3.2).
llama3.1-1b:
  hf_key: "meta-llama/Llama-3.1-1B"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this model
  # expects that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "meta-llama/Llama-3.1-1B"

# 3B entry; ft_model_path is identical to hf_key, so no separate fine-tuned
# checkpoint is configured here.
# NOTE(review): Llama 3.1 was released in 8B/70B/405B sizes; verify that
# "meta-llama/Llama-3.1-3B" resolves (a 3B model exists under Llama 3.2).
llama3.1-3b:
  hf_key: "meta-llama/Llama-3.1-3B"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this model
  # expects that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "meta-llama/Llama-3.1-3B"

# Pre-existing 8B entry, kept here so the Llama-3.1 family is listed together.
# 8B entry: hf_key is a Hub-style identifier, ft_model_path is a relative
# directory under ./llm_weights.
llama3.1-8b:
  hf_key: "NousResearch/Meta-Llama-3.1-8B-Instruct"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm the
  # fine-tuned checkpoint below was trained with that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "./llm_weights/ft_epoch5_lr1e-05_llama3.1-8b_full_wd0.01"

# 70B entry; ft_model_path is identical to hf_key, so no separate fine-tuned
# checkpoint is configured here.
llama3.1-70b:
  hf_key: "meta-llama/Llama-3.1-70B"
  # NOTE(review): same [INST] tags as the llama2-7b entry; confirm this model
  # expects that prompt format.
  question_start_tag: "[INST] "
  question_end_tag: " [/INST]"
  answer_tag: ""
  # Quoted to match the string flags used by llama2-7b, phi, stablelm,
  # pythia-1.4 and gpt2 in this file; a bare YAML boolean is a different type.
  # NOTE(review): presumably the loader compares against "true" — confirm.
  flash_attention2: "true"
  gradient_checkpointing: "true"
  ft_model_path: "meta-llama/Llama-3.1-70B"
# ---------- Llama-2 ----------
# Question tags are "[INST] " / " [/INST]"; the answer tag is empty.
llama2-7b:
  hf_key: 'NousResearch/Llama-2-7b-chat-hf'
  question_start_tag: '[INST] '
  question_end_tag: ' [/INST]'
  answer_tag: ''
  # Flags are stored as strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'true'
  # This model will be used for unlearning by default.
  ft_model_path: 'locuslab/tofu_ft_llama2-7b'
# ---------- Phi-1.5 ----------
# Question tags are "Question: " / newline; the answer tag is "Answer: ".
phi:
  hf_key: 'microsoft/phi-1_5'
  question_start_tag: 'Question: '
  # Double quotes are required so that \n is parsed as a newline character.
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Flags are stored as strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
  ft_model_path: 'locuslab/tofu_ft_phi-1.5'
# ---------- StableLM ----------
# Question tags are "Question: " / newline; the answer tag is "Answer: ".
stablelm:
  hf_key: 'stabilityai/stablelm-3b-4e1t'
  question_start_tag: 'Question: '
  # Double quotes are required so that \n is parsed as a newline character.
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Flags are stored as strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
  # Relative path to a specific checkpoint directory (checkpoint-625).
  ft_model_path: 'paper_models/final_ft_noLORA_5_epochs_inst_lr1e-05_stablelm/checkpoint-625'
# ---------- Pythia ----------
# Question tags are "Question: " / newline; the answer tag is "Answer: ".
# NOTE(review): unlike the other entries in this file, no ft_model_path is set
# here — confirm that nothing reads that key for this model.
pythia-1.4:
  hf_key: 'EleutherAI/pythia-1.4b-deduped'
  question_start_tag: 'Question: '
  # Double quotes are required so that \n is parsed as a newline character.
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Flags are stored as strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
# ---------- GPT-2 ----------
# For testing purposes.
# Question tags are "Question: " / newline; the answer tag is "Answer: ".
gpt2:
  hf_key: 'openai-community/gpt2'
  question_start_tag: 'Question: '
  # Double quotes are required so that \n is parsed as a newline character.
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Flags are stored as strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
  ft_model_path: 'locuslab/tofu_ft_gpt-2'
