# Training hyperparameters: learning rate, optimizer, and LR scheduler.
train:
  # Learning rate. Presumably the base/peak value the scheduler below starts
  # annealing from -- TODO confirm against the training loop.
  lr: 1.0e-3

  # Optimizer selection. `name` is presumably resolved to an optimizer class by
  # the consumer and `kwargs` forwarded to its constructor -- TODO confirm.
  optimizer:
    name: FedAvgM
    # NOTE(review): these keys mirror the parameter names of an SGD-style
    # optimizer (momentum / dampening / weight_decay / nesterov); verify that
    # the FedAvgM implementation accepts all of them.
    kwargs:
      momentum: 0.9
      dampening: 0.0
      weight_decay: 1.0e-3
      nesterov: true

  # Learning-rate scheduler selection. `args` is an explicit empty list (no
  # positional arguments); `kwargs` holds the keyword settings.
  scheduler:
    # NOTE(review): name and kwargs look like timm's CosineLRScheduler --
    # confirm which implementation the consumer instantiates.
    name: CosineLRScheduler
    args: []
    kwargs:
      lr_min: 1.0e-4
      warmup_t: 10
      # NOTE(review): warmup_lr_init (5.0e-5) is lower than lr_min (1.0e-4);
      # confirm that starting warmup below the final floor is intended.
      warmup_lr_init: 5.0e-5
      warmup_prefix: true