{
    "train_batch_size": 8,
    "train_micro_batch_size_per_gpu": 4,
    "steps_per_print": 50,
  
    "optimizer": {
      "type": "Adam",
      "params": {
        "lr": 0.001,
        "betas": [
          0.8,
          0.999
        ],
        "eps": 1e-8,
        "weight_decay": 3e-7
      }
    },

    "zero_optimization": {
      "stage": 0
    },

    "fp16": {
      "enabled": true
    },

    "gradient_clipping": 1.0,
    "prescale_gradients": true,
  
    "wall_clock_breakdown": false
}

