---
# Hyperparameters for a single fine-tuning run.
# NOTE(review): the script that consumes this file is not visible from here;
# the remarks on key semantics below are assumptions to confirm against it.

# Non-numeric value; presumably means "checkpoint once per epoch" -- confirm.
checkpointing_steps: epoch

# Written with an explicit decimal point on purpose: YAML 1.1 loaders (for
# example PyYAML) resolve a bare `3e-4` as the *string* "3e-4", not a float.
# `3.0e-4` is the same number and is a float under both YAML 1.1 and 1.2.
learning_rate: 3.0e-4

# LoRA settings (alpha, dropout, rank).
# NOTE(review): with alpha == rank the usual alpha/rank scaling would be 1.0
# -- confirm the trainer applies that convention.
lora_alpha: 16
lora_dropout: 0.05
lora_rank: 16

# Presumably the maximum tokenized sequence length -- confirm whether longer
# examples are truncated or dropped.
max_seq_length: 2048

# Base model identifier; presumably resolved by the launcher to a local path
# or hub name -- confirm.
model_name_or_path: meta_llama_Llama_2_7b_hf

num_train_epochs: 2

# Batch sizing. 128 / 4 = 32, so devices x gradient-accumulation steps would
# need to equal 32 if total_train_batch_size is the effective global batch
# -- TODO confirm how the trainer derives accumulation.
per_device_eval_batch_size: 8
per_device_train_batch_size: 4
total_train_batch_size: 128

# Training dataset identifier.
train_ds: tulu_v1_human_mix

# NOTE(review): 128 workers is high; presumably sized for the target machine's
# CPU count -- confirm before running on smaller hosts.
preprocessing_num_workers: 128