{
  "zero_optimization": {
    "stage": 3,
    "offload_optimizer": {
      "device": "cpu"
    },
    "offload_param": {
      "device": "cpu"
    },
    "stage3_gather_16bit_weights_on_model_save": true
  },
  "train_batch_size": "auto",
  "gradient_accumulation_steps": "auto",
  "fp16": {
    "enabled": "auto",
    "loss_scale": 0,
    "loss_scale_window": 1000,
    "initial_scale_power": 16,
    "hysteresis": 2,
    "min_loss_scale": 1
  },
  "bf16": {
    "enabled": "auto"
  }
}