#config example:
#Authors: Shaokai, Jan
#sample_argument:
#type || default value
#value
#print_freq  int || 10  
#resume      bool || False     *resume from checkpoint
#gpu_id      int || null      * gpu id to use
#lr          float || 0.1      *learning rate
#arch        str  || resnet18  *architecture
#save_model  str  || saved_model.pt * filename to saved model
#load_model  str  || load_model.pt  * filename to load model
#workers     int  || 16        * number of threads for loading images
#logging     bool || False     * whether to log files
#log_dir     str  || logs      * destination folder to drop log file
#smooth_eps  float|| 0.0       * smoothing rate [0.0, 1.0], set to 0.0 to disable
#alpha       float|| 0.0       * for mixup training, lambda = Beta(alpha, alpha) distribution. Set to 0.0 to disable
#                              * chosen value of alpha in Bag of Tricks is 0.2, and increase # of training epochs by 67%
#epochs      int  || 200       * number of training epochs for chosen stage
#warmup_epochs      int  || 0       * number of epochs for lr warmup
#warmup_lr      float  || 0.0001       * initial lr before warmup
#optimizer   str  || sgd       * optimizer for the chosen stage
#lr_scheduler str || default,cosine  * learning rate scheduler
#admm_epoch  int  || 20        * how many epochs required to update z and u
#rho        float || 0.001     * regularization strength
#sparsity_type str || [irregular,channel,filter,bn_filter]     * sparsity type
#multi_rho   bool  || False    * whether to use multi rho in admm stage
#verbose    bool  || False     * whether to print convergence info
#masked_progressive bool || False * whether to use masked progressive

adv:
  epsilon:
    8.0    # will be divided by 255 in the adv_train.py
  num_steps:
    10
  step_size:
    2.0   # will be divided by 255 in the adv_train.py
  random_start:
    True
  loss_func:
    xent
  width_multiplier:
    16
  init_func:
    default
general:
 sparsity_type: 
  channel
 print_freq:
  10 
 resume:  
  False
 gpu_id:   # 0 = weight 1, 1 = weight 10, 2 = channel 10, 3 = channel 50
  0
 arch: 
  vgg16
 workers: 
  16
 logging: 
  False
 log_dir: 
  logs
 smooth_eps:
  0.0
 alpha:
  0.0
pretrain:
 lr:
  0.01
 epochs: 
  300
 warmup_lr:
  0.0001
 warmup_epochs: 
  0
 save_model: 
  vgg16_pretrained_no_warmup_lr_0_01.pt
 optimizer:
  sgd
 lr_scheduler: 
  default
admm:
 lr:  
  0.01
 epochs: 
  100
 save_model: 
  vgg16_admm_channel_10_TEST_cifar10.pth.tar
 load_model: 
  vgg16_bn_hydra_cifar10.pth.tar
 optimizer:
  sgd
 lr_scheduler: 
  default
 admm_epoch: 
  30
 rho: 
  0.001
 multi_rho: 
  True
 masked_progressive: 
  False
 verbose:
  False
retrain:
 lr:  
  0.01
 epochs:
  100
 warmup_lr:
  0.0001
 warmup_epochs: 
  15
 save_model: 
  wrn284_retrain_channel_50.pth.tar
 load_model:
  wrn284_admm_channel_50.pth.tar
 optimizer: 
  sgd
 lr_scheduler:
  default
 masked_progressive: 
  False 
resnet18_adv:
#20 conv layers, use bnx instead of convx for bn_filter pruning
#floats
 prune_ratios:
  conv1.weight:
   0.5
  conv2.weight:
   0.5
  conv3.weight:
   0.5
  conv4.weight:
   0.5
  conv5.weight:
   0.5
  conv6.weight:
   0.5
  conv7.weight:
   0.5
  conv8.weight:
   0.5
  conv9.weight:
   0.5
  conv10.weight:
   0.5
  conv11.weight:
   0.5
  conv12.weight:
   0.5
  conv13.weight:
   0.5
  conv14.weight:
   0.5
  conv15.weight:
   0.5
  conv16.weight:
   0.5
  conv17.weight:
   0.5
  conv18.weight:
   0.5
  conv19.weight:
   0.5
  conv20.weight:
   0.5
  fc1.weight:
   0.5
vgg16: 
#20 conv layers, use bnx instead of convx for bn_filter pruning
#floats
 prune_ratios:
  conv1.weight:
   0.9
  conv2.weight:
   0.9
  conv3.weight:
   0.9
  conv4.weight:
   0.9
  conv5.weight:
   0.9
  conv6.weight:
   0.9
  conv7.weight:
   0.9
  conv8.weight:
   0.9
  conv9.weight:
   0.9
  conv10.weight:
   0.9
  conv11.weight:
   0.9
  conv12.weight:
   0.9
  conv13.weight:
   0.9
  fc1.weight:
   0.9
  fc2.weight:
   0.9
  fc3.weight:
   0.9

wrn_28_4:
 prune_ratios:
  conv1.weight:
   0
  conv2.weight:
   0.0625
  conv3.weight:
   0.125
  conv4.weight:
   0.0625
  conv5.weight:
   0.015625
  conv6.weight:
   0
  conv7.weight:
   0.09375
  conv8.weight:
   0.015625
  conv9.weight:
   0
  conv10.weight:
   0
  conv11.weight:
   0
  conv12.weight:
   0.6484375
  conv13.weight:
   0
  conv14.weight:
   0.5625
  conv15.weight:
   0.6875
  conv16.weight:
   0.71875
  conv17.weight:
   0.859375
  conv18.weight:
   0.6875
  conv19.weight:
   0.65625
  conv20.weight:
   0.46875
  conv21.weight:
   0.53275
  conv22.weight:
   0.53125
  conv23.weight:
   0.59375
  conv24.weight:
   0.6331875
  conv25.weight:
   0.73984375
  conv26.weight:
   0.803125
  conv27.weight:
   0.546875
  conv28.weight:
   0.300000000000000049296875
  fc1.weight:
   0.23046875