# Defaults list: picks the `binary_prod` entry for `hyp` and the `deq_net_1d`
# entry for `model`.
# NOTE(review): this looks like a Hydra defaults list — confirm against the
# code that loads this file.
defaults:
  - hyp: binary_prod
  - model: deq_net_1d

# Identifier for this configuration plus one value each for the test and
# train data settings.
# NOTE(review): the unit of test_data / train_data is not visible in this file
# (presumably a problem size rather than a sample count) — confirm with the
# data-loading code.
name: binary_prod
test_data: 28
train_data: 32

# Values set under the same `model` key that the defaults list also selects.
# NOTE(review): presumably these override fields of the selected model
# config — confirm the merge order used by the loader.
model:
  # NOTE(review): presumably the hidden/channel width of the network — confirm.
  width: 256

# Settings grouped under `deq`: solver selection and thresholds, network
# shape/normalisation options, and loss-related switches.
# NOTE(review): the meaning of individual keys is defined by the consuming
# code, which is not visible here; hedged notes below should be confirmed.
deq:
  # Solver names and thresholds for the `f_` and `b_` settings.
  # NOTE(review): presumably forward / backward fixed-point solvers and their
  # iteration limits — confirm.
  f_solver: 'anderson'
  b_solver: 'anderson'
  f_thres: 40
  b_thres: 40
  stop_mode: 'rel'
  num_layers: 30
  num_blocks: 2
  in_channels: 2
  wnorm: true
  norm: 'group'
  fp_init: 'zeros'
  num_groups: 4  # Number of groups if using group norm; will be ignored for other norms
  extra:
    block: BASIC
  solver:
    # Written with an explicit decimal point and signed exponent so that
    # YAML 1.1 loaders (e.g. plain PyYAML) resolve it as a float, not a string.
    lam: 1.0e-4
    m: 5
  loss:
    jac_loss: false
    jac_loss_weight: 0.1
    jac_loss_freq: 0.02
    pretrain_jac_loss_weight: 0.0
    jac_stop_epoch: 80
    # Explicit decimal point and signed exponent for the same reason as
    # `solver.lam`: a bare `1e8` is a string under YAML 1.1 resolvers.
    jac_loss_incremental: 1.0e+8
    layer_loss: false
    phantom_grad: false
    pg_tau: 0.5
    pg_iters: 3
    # NOTE(review): the last index (40) is larger than `num_layers` (30) but
    # equals `f_thres` (40) — confirm which quantity these indices refer to.
    layer_idx:
      - 10
      - 20
      - 30
      - 40
    # Four values, matching the four `layer_idx` entries above.
    # NOTE(review): presumably one weight per listed index — confirm.
    gamma:
      - 0.1
      - 0.25
      - 0.5
      - 0.75

# Training-loop settings.
train:
  # NOTE(review): the unit (optimizer steps vs. epochs) and what happens
  # during pretraining are not visible in this file — confirm with the trainer.
  pretrain_steps: 15