# DeepSpeed engine settings, grouped under the `deepspeed_zero` key.
# NOTE(review): the code that loads this key is not visible here — confirm
# how (and whether) the nested mapping is handed to DeepSpeed unchanged.
deepspeed_zero:
  # `auto` is a placeholder string, not a number; presumably the training
  # framework substitutes the real per-GPU micro-batch size at launch —
  # TODO confirm which integration resolves it.
  train_micro_batch_size_per_gpu: auto
  # bfloat16 mixed precision is switched on.
  bf16:
    enabled: true
  # fp16 is switched off. The loss-scaling knobs below are kept in place but
  # presumably have no effect while `enabled` is false — verify.
  fp16:
    enabled: false
    # NOTE(review): DeepSpeed's docs describe 0 as "use dynamic loss
    # scaling" rather than a literal scale of zero — confirm.
    loss_scale: 0
    initial_scale_power: 16
    loss_scale_window: 1000
    hysteresis: 2
    min_loss_scale: 1
  zero_optimization:
    # NOTE(review): stage 0 is documented by DeepSpeed as ZeRO disabled.
    # Confirm that is intended given the enclosing key name.
    stage: 0
  checkpoint:
    # NOTE(review): presumably silences checkpoint-tag consistency checks;
    # confirm the consumer accepts the upper-case spelling `IGNORE`.
    tag_validation: IGNORE
