{
    "train_micro_batch_size_per_gpu": 1,
    "gradient_accumulation_steps": 1,
    "steps_per_print": 100,
    "pipeline": {
        "stage": 8
    },
    "zero_optimization": {
        "stage": 1,
        "reduce_scatter": true,
        "contiguous_gradients": true
    },
    "optimizer": {
        "type": "AdamW",
        "params": {
            "lr": 2e-5
        }
    },
    "fp16": {
        "enabled": true
    }
}