# Distributed-training layout, batch sizing and numeric precision.
# NOTE(review): the meaning of each key is inferred from its name only;
# confirm against the code that consumes this file.

# Device topology
global_num_gpus: 4
dp_world_size: 4
model_parallel_size: 1
# presumably 0 means pipeline parallelism is not used -- TODO confirm
pipe_parallel_size: 0

# Batch sizing
# The values below satisfy 32 * 8 * 4 = 1024, i.e.
#   train_micro_batch_size_per_gpu * gradient_accumulation_steps
#     * dp_world_size = train_batch_size
# NOTE(review): presumably the consumer expects this relation to hold --
# re-check the product when editing any one of these values.
train_batch_size: 1024
train_micro_batch_size_per_gpu: 32
gradient_accumulation_steps: 8
# Same value as gradient_accumulation_steps; presumably a short alias --
# verify with the consumer before changing one without the other.
gas: 8

# Numeric format
precision: fp16
