# Name of the algorithm this configuration is written for.
alg_name: 'LoRA'
# Base model identifier (looks like a Hugging Face Hub repo id — confirm how
# the consumer resolves it). To point at a local copy instead, swap in:
# model_name: './hugging_cache/Qwen2.5-7B'
model_name: 'Qwen/Qwen2.5-7B'

# Device index to run on (presumably a GPU ordinal — verify the host has it).
device: 7

# LoRA adapter settings
# Standard LoRA rather than AdaLoRA; QLoRA setups typically use this variant too.
lora_type: 'lora'
# In the usual LoRA formulation the update is scaled by lora_alpha / rank
# (32 / 8 = 4 with these values) — confirm the consumer follows it.
rank: 8
lora_alpha: 32
# Empty list; presumably means "no explicit layer restriction" — verify.
layers: []
kl_factor: 0
norm_constraint: false
lora_dropout: 0.1
# Presumably the names of the projection modules that receive adapters.
target_modules:
  - 'q_proj'
  - 'v_proj'

# Training settings
num_steps: 60
batch_size: 1
# Presumably a length limit in tokens — confirm against the consumer.
max_length: 128
# Keep the decimal point and the signed exponent: YAML 1.1 loaders such as
# PyYAML resolve a bare `5e-3` as the string "5e-3", not the float 0.005.
lr: 5.0e-3
weight_decay: 0.0

# Additional settings
# Written as a canonical lowercase boolean, matching `norm_constraint: false`
# earlier in this file; capitalised `False` is not a boolean in every YAML schema.
model_parallel: false