# Top-level settings for the "astra" configuration variant.
# NOTE(review): the meaning/units of `warmup` and `freeze` are not visible in
# this file (fractions of the training run?) — confirm against the consumer.
type: astra
# Regex-style name patterns to leave out (presumably parameter names — confirm).
exclude: [".*bn.*", ".*linear.weight", ".*linear.bias", ".*shortcut.*"]
warmup: 0.1
freeze: 0.9
# Written with an explicit mantissa dot so that YAML 1.1 loaders (e.g. PyYAML)
# resolve it as a float instead of the string "1e-5".
eps: 1.0e-5
# Relative interpolation (OmegaConf-style syntax, assumed): resolved from the
# `sparsity` key one level up in the composed config.
sparsity: ${..sparsity}

# Settings grouped under `ema`.
# NOTE(review): presumably an exponential moving average with rate `rho` —
# confirm against the code that reads this key.
ema:
  rho: 0.05

# `alphas` values; only a `default` entry is defined here.
# NOTE(review): presumably other keys can override the default for specific
# groups — confirm against the consumer.
alphas:
  default: 0.05

# Settings for the `lambda` term.
# NOTE(review): how `beta`, `gamma`, `t0` and `cap` are consumed (and whether
# some apply only in "RM" mode) is not visible in this file — confirm.
lambda:
  mode: "constant"  # or "RM" for Robbins-Monro
  beta: 0.01
  gamma: 0.75
  t0: 100
  # Explicit mantissa dot so that YAML 1.1 loaders (e.g. PyYAML) resolve this
  # as a float instead of the string "1e-3".
  cap: 1.0e-3

# Named spec groups, each with include/exclude name patterns plus block and
# group sizes. Only `convs` is active; the commented-out entries are kept as
# disabled alternatives.
# NOTE(review): the meaning of -1 in `block_size` / `group_size` is not visible
# in this file — confirm against the consumer.
specs:
  # _class_: spastra.algebra.BlockGroupSpec
  # free_convs:
  #   include: ["conv1.weight"]
  #   exclude: []
  #   block_size: [1, 1, 1, 1]
  #   group_size: []
  convs:
    include: [".*conv.*weight"]
    exclude: []
    block_size: [1, 1, -1, -1]
    group_size: [1, -1]
  # bias:
  #   include: [".*shortcut.*weight"]
  #   exclude: []
  #   block_size: [1]
  #   group_size: []

# Coupling configuration: `individual` lists spec names (here `convs`, the
# active key under `specs`). Commented-out entries are disabled alternatives.
coupling:
  # _class_: spastra.algebra.GroupCoupler
  # global:
    # specs:
      # convs: individual
  individual:
    - convs
    # linear: [0,1]
    # bias: [0,1]
  # free:
  # free_convs: [0]
