---
# Training run configuration: preset/model selection, sequence and batch
# sizing, data mixture, and logging cadence.
# NOTE(review): the exact meaning of every key is defined by the consuming
# training script, which is not visible from this file — confirm there before
# changing values.

# Name of a hyperparameter preset (presumably resolved by the consumer to
# another config — TODO confirm).
hp_config: oi_hp
max_seq_length: 1024
# Model identifier; presumably a registry name or path alias — verify against
# the loader.
model_name_or_path: llama2_7b
num_train_epochs: 5

# Batch sizing. 128 / 4 = 32, so the total batch is 32x the per-device train
# batch; presumably the remainder is covered by device count and/or gradient
# accumulation — TODO confirm how the consumer derives it.
per_device_eval_batch_size: 8
per_device_train_batch_size: 4
total_train_batch_size: 128

# Data mixture name and preprocessing parallelism.
# NOTE(review): 128 workers is high; confirm the target host has the cores.
mixture_name: reasoning_v1
preprocessing_num_workers: 128

# Presumably "log every step" — confirm the unit with the consumer.
logging_steps: 1