# Fine-tuning run configuration.
# NOTE(review): the per-key notes below are inferred from the key names only;
# confirm them against the script that consumes this file.

# Checkpoint cadence; the value here is the string "epoch".
checkpointing_steps: epoch
# Written with an explicit mantissa dot on purpose: YAML 1.1 loaders such as
# PyYAML resolve a bare `3e-4` as the string "3e-4", not the float 0.0003.
learning_rate: 3.0e-4

# LoRA adapter settings.
lora_alpha: 16
lora_dropout: 0.05
# Module names the adapter is applied to (presumably the attention
# projections of the base model -- TODO confirm).
lora_modules:
- q_proj
- k_proj
- v_proj
- o_proj
lora_rank: 16

max_seq_length: 2048
# NOTE(review): this is not a Hub-style `org/name` identifier; presumably a
# local path or alias resolved by the consumer -- confirm.
model_name_or_path: meta_llama_Llama_2_7b_hf
num_train_epochs: 2

# Batch sizing.
# NOTE(review): total (128) / per-device train (4) = 32; presumably made up by
# device count x gradient accumulation -- confirm how the consumer derives it.
per_device_eval_batch_size: 8
per_device_train_batch_size: 4
total_train_batch_size: 128

# Training data selection.
train_ds: tulu_v1_human_mix
mix_size: small
preprocessing_num_workers: 128