{
  "zero_optimization": {
    "stage": 2
  },
  "optimizer": {
    "type": "AdamW",
    "params": {
      "lr": 0.00003,
      "weight_decay": 0.01
    }
  },
  "lr_scheduler": {
    "type": "WarmupLR",
    "params": {
      "warmup_min_lr": 0,
      "warmup_max_lr": 0.00002,
      "warmup_num_steps": 200
    }
  },
  "gradient_clipping": 1.0,
  "gradient_accumulation_steps": 2,
  "train_micro_batch_size_per_gpu": 1,
  "bf16": {
    "enabled": true
  }
}
