# Training settings: a base learning rate plus optimizer and LR-scheduler
# specs. Each spec is a `name` with positional `args` and keyword `kwargs`
# (presumably forwarded to the named class's constructor -- verify against
# the code that loads this file).
train:
  # Floats are written with both a decimal point and a signed exponent
  # (e.g. 1.0e-3) so that YAML 1.1 loaders also resolve them as floats.
  lr: 1.0e-3

  optimizer:
    name: FedProx
    args: []
    kwargs:
      # Presumably the FedProx proximal-term coefficient -- TODO confirm.
      mu: 1.0e-2
      weight_decay: 1.0e-5
      # NOTE(review): "marge" may be a misspelling of "merge". The key is
      # kept as-is because the consumer presumably reads this exact name;
      # rename only together with the code that reads it.
      use_model_marge: false

  scheduler:
    # NOTE(review): name and kwargs look like timm's CosineLRScheduler;
    # confirm which implementation the loader resolves this name to.
    name: CosineLRScheduler
    args: []
    kwargs:
      lr_min: 1.0e-4
      # Warmup settings; units of `warmup_t` (epochs vs. steps) depend on
      # how the training loop steps the scheduler -- TODO confirm.
      warmup_t: 10
      warmup_lr_init: 5.0e-5
      warmup_prefix: true