# Model and learning-rule selection.
# NOTE(review): the meaning of every key is defined by the code that loads this
# file, which is not visible here; remarks marked "presumably" are unconfirmed.
method:
  # Learning-rule identifier (presumably "BP" = backpropagation; confirm).
  method: 'BP'
  architecture: 'simple_linear'
  task: 'classification'
  # This is the string "none", not YAML null (null is spelled `null` or `~`).
  task_transform: 'none'
  # Activation names. The _F / _B suffix pair also appears on the keys under
  # `training` (presumably forward / backward pathways; confirm).
  act_F: 'elu'
  act_B: 'elu'
  # Integers, not YAML booleans; kept as 0/1 so the loaded type is unchanged
  # (presumably batch-norm on/off switches; confirm).
  fw_bn: 0
  bw_bn: 0
  bias_init: 'zero'
  bn_affine: 1

# Input data settings.
dataset:
  # Dataset identifier, loaded as a string.
  dataset: 'MNIST'
  batchsize: 256
  # presumably the number of input image channels; confirm against the loader
  num_chn: 1
  num_classes: 10

# Optimisation settings.
# NOTE(review): key semantics come from the consuming code, which is not
# visible here; remarks marked "presumably" are unconfirmed.
training:
  mode: 'train'
  epochs: 100
  # Both values load as the integer 1 (not 1.0); left as integers so the
  # consumer sees the same type (presumably learning rates; confirm).
  lr_F: 1
  lr_B: 1
  # Floats, written with an explicit fractional digit
  # (presumably momentum; confirm).
  mmt_F: 0.0
  mmt_B: 0.0
  # presumably weight decay; confirm
  wd_F: 0
  wd_B: 0
  # presumably learning-rate schedule settings; whether 0 means "disabled"
  # for warmup / tmax is decided by the consumer. TODO confirm.
  warmup: 0
  tmax: 0
  eta_min: 0.001
  optimizer: 'SGD'
  # Integer 0, not a YAML boolean.
  GradC: 0
  loss_scale_C: 0.5
  # presumably gradient-clipping settings; whether 1 is a threshold or an
  # on/off flag cannot be told from this file. TODO confirm.
  grad_clip_F: 1
  grad_clip_B: 1
  filter_target: 0.0
  seed: 2023