# Architecture
# Identifier of the model to build. Presumably resolved by name in the
# consuming training code — confirm the exact spelling it expects.
arch: Conv6Wide

# ===== Dataset ===== #
# `data` is a filesystem path (presumably the dataset root directory — confirm
# against the loader); `set` names the dataset to use.
# `name` looks like a run/experiment label (architecture + optimizer +
# "baseline") — verify how the consumer uses it (e.g. for output paths).
data: /mnt
set: CIFAR10
name: conv6wide_sgd_baseline

# ===== Learning Rate Policy ===== #
# Optimizer choice, learning rate, and the schedule applied to it.
# NOTE(review): `lr` is presumably the initial rate that the `cosine_lr`
# policy anneals from — confirm against the scheduler implementation.
optimizer: sgd
lr: 0.01
lr_policy: cosine_lr

# ===== Network training config ===== #
# Training length, regularisation, and batch size.
# `weight_decay` and `momentum` are optimizer hyperparameters; they
# presumably apply to the `sgd` optimizer selected above — confirm.
# NOTE(review): whether `batch_size` is per-device or global is not visible
# here — check the consumer before changing the hardware setup.
epochs: 100
weight_decay: 0.0001
momentum: 0.9
batch_size: 128

# ===== Sparsity ===== #
# Layer-type selectors and the width multiplier.
# NOTE(review): despite the section title, `conv_type` is set to `DenseConv`,
# which presumably means no sparsity is applied in this run — consistent with
# "baseline" in the run name, but confirm against the consumer.
# `bn_type: NonAffineBatchNorm` presumably selects batch norm without
# learnable scale/shift — TODO confirm.
conv_type: DenseConv
bn_type: NonAffineBatchNorm
width_mult: 1

# ===== Hardware setup ===== #
# Worker count; presumably the number of data-loading worker processes —
# confirm against the consumer.
workers: 4