{
  "bf16": { "enabled": true },

  "train_micro_batch_size_per_gpu": "auto",
  "gradient_accumulation_steps": "auto",
  "train_batch_size": "auto",
  "zero_optimization": {
    "stage": 3,
    "overlap_comm": true,
    "contiguous_gradients": true,
    "reduce_bucket_size": 5e8,
    "stage3_param_persistence_threshold": 1e6,
    "stage3_prefetch_bucket_size": 5e8,
    "sub_group_size": 1e12,
    "stage3_gather_16bit_weights_on_model_save": true
  },

  "gradient_clipping": 1.0,

  "activation_checkpointing": {
    "partition_activations": true,
    "cpu_checkpointing": false,
    "number_checkpoints": 1,
    "synchronize_checkpoint_boundary": true
  }
}

