---
# Fine-tuning run configuration: base model, sequence/batch sizing,
# LoRA adapter settings, and optimizer learning rate.

# NOTE(review): this value is not in Hub repo-id form (`org/name`);
# presumably it names a local directory or a registry alias — confirm
# against the loader that consumes this file.
model_name_or_path: facebook_opt_350m

# Hyperparameters below were noted as coming "from bloke".
# NOTE(review): presumably a reference to settings published by
# "TheBloke" — confirm the source and link it here.
max_seq_length: 512
num_train_epochs: 2
gradient_accumulation_steps: 8
per_device_train_batch_size: 4

# LoRA adapter settings.
lora_rank: 16
lora_alpha: 16
lora_dropout: 0.05

# Written with an explicit decimal point: YAML 1.1 resolvers (e.g. PyYAML's
# default) only recognize a float when the mantissa contains a ".", so the
# bare form `3e-4` would be loaded as the string "3e-4" instead of 0.0003.
learning_rate: 3.0e-4

# Canonical lowercase boolean; loads to the same value as `True`.
use_spaced_sampling: true