# Llama-2 7B chat entry. No answer_end_tag is set for this model.
llama2-7b:
  # Checkpoint identifiers.
  hf_key: 'NousResearch/Llama-2-7b-chat-hf'
  # This model will be used for unlearning by default.
  ft_model_path: 'locuslab/tofu_ft_llama2-7b'
  # Prompt delimiters. "\n" stays double-quoted so it is a real newline.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Quoted, so these load as strings rather than YAML booleans.
  # NOTE(review): confirm the consumer expects strings before retyping.
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Llama-3.2 1B Instruct entry. No ft_model_path is configured here.
llama3.2-1b:
  hf_key: 'meta-llama/Llama-3.2-1B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Llama-3.2 3B Instruct entry. No ft_model_path is configured here.
llama3.2-3b:
  hf_key: 'meta-llama/Llama-3.2-3B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Llama-3.1 8B Instruct entry. No ft_model_path is configured here.
llama3.1-8b:
  hf_key: 'meta-llama/Llama-3.1-8B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Phi-1.5 entry. Both runtime flags are set to the string "false".
phi:
  hf_key: 'microsoft/phi-1_5'
  # Looks like a repo-relative checkpoint directory rather than a hub id.
  # TODO confirm the path exists in the environment where this is loaded.
  ft_model_path: 'tofu/data/weight/ft_epoch5_lr2e-05_phi_full_wd0.01/checkpoint-625'
  # Prompt delimiters. "\n" stays double-quoted so it is a real newline.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Quoted strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
# StableLM 3B entry. Both runtime flags are set to the string "false".
stablelm:
  hf_key: 'stabilityai/stablelm-3b-4e1t'
  # Looks like a relative checkpoint directory rather than a hub id.
  # TODO confirm the path exists in the environment where this is loaded.
  ft_model_path: 'paper_models/final_ft_noLORA_5_epochs_inst_lr1e-05_stablelm/checkpoint-625'
  # Prompt delimiters. "\n" stays double-quoted so it is a real newline.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Quoted strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
# Pythia 1.4B (deduped) entry. No ft_model_path or answer_end_tag is set.
pythia-1.4:
  hf_key: 'EleutherAI/pythia-1.4b-deduped'
  # Prompt delimiters. "\n" stays double-quoted so it is a real newline.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  answer_tag: 'Answer: '
  # Quoted strings, not YAML booleans.
  flash_attention2: 'false'
  gradient_checkpointing: 'false'
# Zephyr 7B beta entry. Only the checkpoint id and the two runtime flags
# are set; no question/answer tags are defined for this model.
zephyr-7b-beta:
  hf_key: 'HuggingFaceH4/zephyr-7b-beta'
  # Quoted strings, not YAML booleans.
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# MUSE-books target model entry. Only the checkpoint id and the two
# runtime flags are set; no question/answer tags are defined.
books-llama:
  hf_key: 'muse-bench/MUSE-books_target'
  # Quoted strings, not YAML booleans.
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# MUSE-news target model entry. Only the checkpoint id and the two
# runtime flags are set; no question/answer tags are defined.
news-llama:
  hf_key: 'muse-bench/MUSE-news_target'
  # Quoted strings, not YAML booleans.
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Qwen2.5 1.5B Instruct entry. No ft_model_path is configured here.
qwen-2.5-1.5b:
  hf_key: 'Qwen/Qwen2.5-1.5B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Qwen2.5 3B Instruct entry. No ft_model_path is configured here.
qwen-2.5-3b:
  hf_key: 'Qwen/Qwen2.5-3B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'
# Qwen2.5 7B Instruct entry. No ft_model_path is configured here.
qwen-2.5-7b:
  hf_key: 'Qwen/Qwen2.5-7B-Instruct'
  # Question delimiters: text prefix, newline suffix.
  question_start_tag: 'Question: '
  question_end_tag: "\n"
  # Answer delimiters: text prefix, newline suffix.
  answer_tag: 'Answer: '
  answer_end_tag: "\n"
  # String-valued flags (quoted on purpose; not YAML booleans).
  flash_attention2: 'true'
  gradient_checkpointing: 'true'

