# Method configuration that selects the DPO handler and sets its arguments.
# NOTE(review): the `defaults` list below looks like a Hydra-style defaults
# list that composes this file with a sibling `GradDiff` config -- confirm
# against the config loader. How the inherited values and the values in this
# file override each other is not visible from here.
defaults:
  - GradDiff

# Name of the handler; presumably resolved to an implementation by the
# consuming code -- verify where `handler` is looked up.
handler: DPO
# Arguments grouped for the selected method.
method_args:
  # NOTE(review): presumably the DPO beta coefficient (strength of the
  # preference term relative to the reference model) -- confirm in the handler.
  beta: 0.1
  # NOTE(review): alpha and gamma are presumably loss-term weights shared with
  # the GradDiff config; both are 1.0 here -- confirm which term each scales.
  alpha: 1.0
  gamma: 1.0
  # NOTE(review): presumably selects a negative log-likelihood retain loss;
  # confirm the accepted values in the handler.
  retain_loss_type: NLL