# Hydra-style defaults list: composes this config from the `cifar100` option
# of the `dataset` group and the `filter` option of the `sparsifier` group.
# `_self_` is listed last, so the keys defined in this file are merged after
# (and take precedence over) the values coming from those groups.
defaults:
  - dataset: cifar100
  - sparsifier: filter
  - _self_

# NOTE(review): judging by the `_env` suffix, these look like the NAMES of
# environment variables (not paths) that hold the dataset and checkpoint
# directories - confirm against the code that reads them.
data_dir_env: ASTRA_DATA
checkpoint_dir_env: ASTRA_CHECK

# Top-level run settings shared by the sections below.
device: cuda
batch_size: 32
# Also mirrored into `lr_scheduler.num_epochs` through an interpolation.
num_epochs: 150
num_workers: 4
# Dotted path of the loss class, stored as a string.
# NOTE(review): presumably resolved and instantiated by the training code -
# verify against the consumer.
criterion: "torch.nn.CrossEntropyLoss"

# NOTE(review): presumably the target sparsity as a fraction in [0, 1]
# (0.9 = 90% removed) - confirm how the sparsifier interprets this value.
sparsity: 0.9

# Overrides for the `sparsifier` group selected in the defaults list
# (`filter`). Because `_self_` comes last there, the values below win over
# the group's own settings for the same keys.
# NOTE(review): the meaning and units of alpha / warmup / freeze / rho /
# beta / cap are defined by the sparsifier implementation, not by this file;
# check it before tuning. `warmup` and `freeze` look like fractions of the
# training run - TODO confirm.
sparsifier:
  alpha: 9.140089
  warmup: 0.0773
  freeze: 0.884160
  # NOTE(review): presumably settings of an exponential moving average -
  # confirm.
  ema:
    rho: 0.004082
  lambda:
    mode: constant
    beta: 0.005056
    cap: 0.0014514777239312791

# Network architecture settings.
model:
  name: resnet
  depth: 32
  # Interpolated from the composed `dataset` config, so the selected dataset
  # option (`cifar100` in the defaults list) must define `num_classes`.
  num_classes: ${dataset.num_classes}
  # NOTE(review): presumably the name of an activation class looked up by
  # the model builder - confirm.
  activation_name: ReLU

# Optimizer settings.
optimizer:
  name: sgd
  lr: 0.02
  momentum: 0.977680
  weight_decay: 2.525e-05
  # NOTE(review): YAML has no tuple syntax, so this value is loaded as the
  # plain string "(0.9, 0.999)", not as a pair of floats. `betas` is normally
  # an Adam-family parameter, so it is presumably unused while `name` is
  # `sgd`. Before switching optimizers, check whether the consumer parses
  # this string itself or expects a list such as [0.9, 0.999].
  betas: (0.9, 0.999)

# Learning-rate schedule settings.
lr_scheduler:
  # Relative interpolation: `..` climbs out of `lr_scheduler` to the config
  # root, so this mirrors the top-level `num_epochs`.
  num_epochs: ${..num_epochs}
  name: multistep
  # NOTE(review): presumably the spacing between LR steps as a fraction of
  # num_epochs - confirm.
  step_ratio: 0.31895
  # Wait offset_ratio * num_epochs epochs before starting to step.
  # NOTE(review): -1 is presumably a sentinel meaning "no offset" - confirm.
  offset_ratio: -1
  # NOTE(review): presumably the multiplicative LR decay factor applied at
  # each step - confirm.
  gamma: 0.334132642

# Experiment-tracking settings (the key name suggests Weights & Biases).
# NOTE(review): `project` and `entity` look like placeholder values; replace
# them with real ones before relying on remote logging.
wandb:

  project: project-name
  entity: username
  # NOTE(review): presumably forwarded to the tracker as its run mode, in
  # which case `offline` keeps runs local - confirm.
  mode: offline
  group: "astra"

# Statistics reporting settings.
stats:
  # Refresh interval, expressed as a ratio of the train_loader size.
  refresh_every: 0.1
