# Hydra defaults list: the config groups composed into this config.
# Entries are merged in order, so placing `_self_` last lets the values
# defined in this file override those coming from the groups above it.
defaults:
  - dataset: imagenet
  - sparsifier: conv2d_in_channel
  - _self_

# NOTE(review): presumably the *names* of the environment variables that hold
# the dataset root and the checkpoint directory (not the paths themselves);
# confirm against the code that reads these keys.
data_dir_env: ASTRA_DATA
checkpoint_dir_env: ASTRA_CHECK

# Global training settings.
device: cuda
batch_size: 32
# Also referenced by lr_scheduler.num_epochs through an interpolation.
num_epochs: 100
# NOTE(review): presumably the number of data-loader workers; confirm.
num_workers: 4
# Dotted path of the loss to use.
# NOTE(review): presumably resolved to a class by import path; confirm.
criterion: "spastra.models.layers.KLDiv"

# NOTE(review): presumably the target sparsity ratio consumed by the selected
# sparsifier (0.5 = half); confirm the exact meaning against the consumer.
sparsity: 0.5

# Model selection and construction options.
model:
  name: resnet50
  # NOTE(review): depth 32 next to name resnet50 looks inconsistent; confirm
  # whether `depth` is actually used for this architecture.
  depth: 32
  # Interpolated from the `dataset` node of the composed config.
  num_classes: ${dataset.num_classes}
  activation_name: ReLU
  # NOTE(review): presumably selects which pretrained weights to load; confirm.
  weight: official

# Optimizer hyper-parameters.
optimizer:
  name: sgd
  lr: 0.01
  momentum: 0.95
  # Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
  # read a bare `1e-5` as a string rather than a float.
  weight_decay: 1.0e-5
  # NOTE(review): YAML has no tuple syntax, so this value loads as the string
  # "(0.9, 0.999)". Left unchanged in case the consumer parses the string;
  # switch to `[0.9, 0.999]` if it expects a sequence of floats.
  betas: (0.9, 0.999)

# Learning-rate schedule.
lr_scheduler:
  # Relative interpolation: `..` climbs to the parent of `lr_scheduler`,
  # so this resolves to the top-level `num_epochs`.
  num_epochs: ${..num_epochs}
  name: multistep
  step_ratio: 0.25
  # Wait offset_ratio * num_epochs epochs before stepping starts.
  # NOTE(review): a negative value presumably disables the wait; confirm.
  offset_ratio: -1
  gamma: 0.5

# Weights & Biases logging settings.
wandb:
  # NOTE(review): `project-name` and `username` look like placeholders;
  # replace them with the real project and account/team before syncing.
  project: project-name
  entity: username
  mode: offline
  group: astra

# Statistics reporting.
stats:
  # Refresh interval, expressed as a fraction of the train_loader size.
  refresh_every: 0.1
