# Model and tokenizer locations.
# The four directory entries below are empty strings in this file.
# NOTE(review): presumably they must be filled in before a run — confirm how
# the consuming script treats an empty string.
base_model_id: 'meta-llama/Llama-2-7b-chat-hf'
adapter_dir: ''
tokenizer_dir: ''
gen_model_dir: ''
# NOTE(review): this key is spelled "personlized" (sic). It is left unchanged
# because the consumer presumably looks it up by this exact name — rename the
# key and the lookup together if it is ever corrected.
personlized_tokenizer_dir: ''

# NOTE(review): presumably the number of examples in the forget set — confirm
# against the consuming script.
forget_size: 400

# Watermark config
# NOTE(review): watermark_len is presumably a length in tokens — confirm the
# unit against the consuming script.
# NOTE(review): a token ID is only meaningful relative to one tokenizer;
# presumably target_wtm refers to the tokenizer configured in the paths
# section of this file — verify before changing either.
watermark_len: 10
target_wtm: 32007  # Token ID of the watermark to be unlearned

# PPO training hyperparameters.
# NOTE(review): the key names here (kl_coef, vf_coef, num_ppo_epochs, ...)
# match fields of TRL's PPOConfig — presumably they are forwarded to it;
# confirm in the consuming script.
kl_coef: 0.1
vf_coef: 0.2
# Equals 5e-5. Kept in plain decimal form because some YAML loaders read
# exponent notation as a string rather than a float.
learning_rate: 0.00005
per_device_train_batch_size: 64
num_ppo_epochs: 10
gradient_accumulation_steps: 1
output_dir: 'wtm_ppo_outputs'

# LoRA adapter settings.
# NOTE(review): the key names match arguments of PEFT's LoraConfig —
# presumably this mapping is passed through to it; confirm in the consumer.
lora:
  r: 8
  lora_alpha: 32
  target_modules:
    - 'q_proj'
    - 'v_proj'
    - 'k_proj'
    - 'o_proj'
  lora_dropout: 0.05
  # Quoted so it reads unambiguously as the string "none", not a null value.
  bias: 'none'
  task_type: 'CAUSAL_LM'
