# Fine-tuning run configuration: model selection plus training hyperparameters.
# NOTE(review): the exact meaning of each key is defined by the consuming
# training script, which is not visible here; confirm the hedged notes below.

# Model to load. `name` looks like a Hugging Face Hub repo id -- confirm.
name: meta-llama/Llama-3.1-8B
type: CausalLM

# Training schedule and batch sizing.
epochs: 3
per_device_batch_size: 4
# Presumably the effective batch size, reached via gradient accumulation
# and/or multiple devices -- TODO confirm against the trainer.
real_batch_size: 128
# Canonical lowercase boolean spelling.
bf16: true

# Evaluation and early stopping.
eval_epochs: 1
# Written with a mantissa dot and a signed exponent so YAML 1.1 loaders
# (e.g. PyYAML) resolve it as a number; a bare `1e9` loads as the string
# "1e9" there. The value is large enough that early stopping presumably
# never triggers -- confirm that this is the intent.
early_stopping_patience: 1.0e+9

# Sequence length, logging cadence, and optimizer step size.
max_length: 256
logging_steps: 1
# Same YAML 1.1 concern as above: a bare `5e-4` loads as the string "5e-4".
learning_rate: 5.0e-4
