# Hydra defaults list: composes this config from one option of the `dataset`
# config group and one option of the `sparsifier` config group.
defaults:
  - dataset: cifar10
  - sparsifier: unstructured
  # `_self_` is listed last, so keys set in this file are merged on top of
  # (and take precedence over) the group configs selected above.
  - _self_

# NOTE(review): these look like the *names* of environment variables that hold
# the dataset and checkpoint directories, not the paths themselves — confirm
# against the code that reads these keys.
data_dir_env: ASTRA_DATA
checkpoint_dir_env: ASTRA_CHECK

# Run-level training settings.
device: cuda
batch_size: 192
# Also referenced by `lr_scheduler.num_epochs` through interpolation.
num_epochs: 200
num_workers: 4
# Dotted path of the loss class.
# NOTE(review): presumably imported and instantiated by the training code —
# confirm.
criterion: torch.nn.CrossEntropyLoss

# NOTE(review): presumably the target fraction of weights to prune
# (0.9 = 90%) — confirm against the sparsifier implementation.
sparsity: 0.9

# Values merged on top of the `sparsifier` group option selected in
# `defaults`; because `_self_` comes last there, the values here win.
# NOTE(review): the meaning and units of the tuned numbers below are not
# visible in this file — see the sparsifier implementation.
sparsifier:
  alpha: 7.6620024
  warmup: 0.04370465
  freeze: 0.7580857
  ema:
    rho: 0.018168524
  # `lambda` is a reserved word in Python, so Python consumers need item
  # access (e.g. cfg.sparsifier["lambda"]) rather than attribute access.
  lambda:
    mode: constant
    beta: 0.06494370688856885
    cap: 0.0014514777239312791

# Network architecture settings.
model:
  name: resnet
  depth: 32
  # Interpolated from the `dataset` config selected in `defaults`, so this
  # value follows whichever dataset option is chosen.
  num_classes: ${dataset.num_classes}
  activation_name: ReLU

# Optimizer hyperparameters.
# NOTE(review): `name` presumably selects which optimizer the training code
# builds — confirm.
optimizer:
  name: sgd
  lr: 0.0124202312
  momentum: 0.9437087
  weight_decay: 0.0006078
  # Written as a YAML sequence so it loads as two floats. The previous
  # `(0.9, 0.999)` form is not YAML tuple syntax and loaded as one string.
  # NOTE(review): presumably only read by Adam-style optimizers, not by `sgd`;
  # confirm the consumer does not parse the old string form.
  betas: [0.9, 0.999]

# Learning-rate schedule settings.
lr_scheduler:
  # Relative interpolation: `..` steps up from this mapping to its parent, so
  # this mirrors the top-level `num_epochs` instead of duplicating the value.
  num_epochs: ${..num_epochs}
  name: multistep
  step_ratio: 0.33832086
  # Wait offset_ratio * num_epochs epochs before stepping starts.
  offset_ratio: 0.25
  gamma: 0.475309528443

# Weights & Biases logging settings.
# `project`, `entity` and `group` hold placeholder values; replace them with
# real ones before use.
wandb:
  project: project-name
  entity: wandb-user
  # NOTE(review): presumably forwarded to wandb as its run mode, where
  # `offline` keeps run data local instead of uploading — confirm.
  mode: offline
  group: group-name


# Statistics reporting settings.
stats:
  # Refresh interval, expressed as a fraction of the train loader's size.
  # NOTE(review): 0.1 presumably means a refresh every 10% of an epoch's
  # batches — confirm against the consumer.
  refresh_every: 0.1
