### All modules (except input conv and time embedding)

# Stage 1: attention, projection, conv and feed-forward modules (see target_modules)
- FastOBCPruner:
    # NOTE(review): the exact semantics of these options are defined by the
    # FastOBCPruner implementation, which is not visible here — confirm there.
    sparsity_distribution: uniform
    sparsity_type: unstructured
    is_module_pruner: true
    # Regex over module names, anchored at the end of the name (`$`).
    # It selects names ending in:
    #   to_q / to_k / to_v, to_out.0
    #   proj_in / proj_out
    #   conv1 / conv2 / conv_shortcut (the underscore is optional: `conv_?`)
    #   ff.net.0.proj / ff.net.2
    # Every literal dot is escaped so it only matches a `.` separator; single
    # quotes keep the backslashes literal in YAML.
    target_modules: '(to_(q|k|v)|to_out\.0|proj_(in|out)|conv_?(1|2|shortcut)|ff\.net\.(0\.proj|2))$'
    prune_biases: false
    sequential: false
    # presumably the OBC block size and Hessian dampening factor — TODO confirm
    block_size: 128
    damp: 0.01
    # Constant schedule: sparsity 0.5 with init_step 0.
    schedule_kwargs:
      class: constant
      sparsity: 0.5
      init_step: 0