# Top-level settings for the `astra` configuration variant.
type: astra
# Regex patterns; ".*bn.*" matches any name containing "bn".
# NOTE(review): presumably names to skip (batch-norm layers) — confirm.
exclude: [".*bn.*"]
# NOTE(review): warmup/freeze look like fractions of the run — confirm units.
warmup: 0.1
freeze: 0.9
# Explicit mantissa dot: YAML 1.1 loaders (e.g. plain PyYAML) read a bare
# `1e-5` as the string "1e-5"; `1.0e-5` is a float under every loader.
eps: 1.0e-5
# Relative interpolation: the value comes from a `sparsity` key outside this
# mapping. NOTE(review): presumably one level above where this file is
# mounted in the composed config — confirm.
sparsity: ${..sparsity}

# NOTE(review): presumably exponential-moving-average settings; the meaning of
# `rho` is not visible in this file — confirm against the consumer.
ema:
  rho: 0.05

# Only `default` is active. The commented-out keys below carry the same names
# as the entries under `specs` (convs, linear, bias).
# NOTE(review): presumably per-spec overrides of `default` — confirm.
alphas:
  default: 0.05
  # convs: 0.05
  # linear: 0.05
  # bias: 0.05

# Settings for the `lambda` term; `mode` selects between "constant" and "RM".
# NOTE(review): beta, gamma, t0 and cap presumably only matter in "RM" mode —
# confirm against the consumer.
lambda:
  mode: "constant"  # or "RM" for Robbins-Monro
  beta: 0.01
  gamma: 0.75
  t0: 100
  # Explicit mantissa dot: YAML 1.1 loaders (e.g. plain PyYAML) read a bare
  # `1e-3` as the string "1e-3"; `1.0e-3` is a float under every loader.
  cap: 1.0e-3

# Named specs. Each entry carries regex `include` / `exclude` pattern lists
# plus a `block_size` and a `group_size` list.
# NOTE(review): block_size length (4 / 2 / 1) presumably equals the rank of the
# matched tensors — confirm.
specs:
  # _class_: spastra.algebra.BlockGroupSpec
  # free_convs:
  #   include: ["conv1.weight"]
  #   exclude: []
  #   block_size: [1, 1, 1, 1]
  #   group_size: []
  convs:
    include: [".*conv.*", ".*shortcut.0.weight"]
    exclude: []
    block_size: [1, 1, 1, 1]
    group_size: []
  linear:
    include: [".*linear.weight"]
    exclude: []
    block_size: [1, 1]
    group_size: []
  bias:
    # NOTE(review): ".*shortcut.*weight" also matches every name matched by the
    # convs pattern ".*shortcut.0.weight" — confirm the overlap is intended and
    # how the consumer resolves a name matched by two specs.
    include: [".*linear.bias", ".*shortcut.*weight"]
    exclude: []
    block_size: [1]
    group_size: []

# One active coupling group, `global`. The keys under `global.specs` are the
# same names as the entries under the top-level `specs` (convs, linear, bias).
# NOTE(review): the `[0]` lists presumably select an axis/index per spec —
# confirm against the consumer.
coupling:
  # _class_: spastra.algebra.GroupCoupler
  global:
    specs:
      convs: [0]
      linear: [0]
      bias: [0]
  # free:
  # free_convs: [0]
