---
# Experiment configuration. Top-level keys are kept in alphabetical order.
# NOTE(review): the meaning of each key is defined by the code that loads this
# file, which is not visible here; comments marked "presumably" are unverified
# assumptions to be confirmed against that code.
activation: gelu

# adv_* keys: presumably adversarial attack / adversarial training settings
# -- confirm against the code that reads them.
adv_eps: 0.2
adv_eps_iter: 0.01
adv_eval: false
adv_nb_iter: 20
# Quoted so the value is unambiguously the string 'inf'.
adv_norm: 'inf'
adv_train: false

alpha: 1.0
batch_size: 32
config_dir: config
criterion: ce
data_dir: ./data/
dataset: CIFAR10
# Canonical lowercase boolean, matching the adv_eval / adv_train flags above.
debug_mode: false
device: cuda
epochs: 300
eps: 0.000001
iterations: 1
log_dir: ./runs/
metric_dir: metrics
model_dir: ckpt
# Explicit null: no value is set for model_name.
model_name: null
model_type: vit
noise_train: 1.0
norm: normal
num_workers: 0
# Presumably selects one of the sub-mappings under `optim_param` -- confirm.
optim: adamw
# Hyperparameter sets, one sub-mapping per optimizer key (sgd, adam, adamw).
# NOTE(review): presumably only the entry whose name matches the top-level
# `optim` key is used at run time -- confirm against the loader.
optim_param:
  sgd:
    lr: 0.1
    momentum: 0.9
    nesterov: false
    weight_decay: 0.0005
  adam:
    beta1: 0.9
    beta2: 0.999
    lr: 0.01
    weight_decay: 0.03
  adamw:
    lr: 0.001
    beta1: 0.9
    beta2: 0.999
    weight_decay: 0.05
    # Named eps_opt, distinct from the top-level `eps` key.
    eps_opt: 0.00000001
# Remaining top-level settings, continuing in alphabetical order.
# NOTE(review): comments marked "presumably" are unverified assumptions.
order: 2
# Explicit null: no value is set for param.
param: null
param_dir: ./params/
plot: true
plot_dir: plots
# Integer seed; presumably used to seed random number generators -- confirm.
random_seed: 2
# String mode, not a boolean; presumably 'best' keeps only the best
# checkpoint -- confirm against the code that saves models.
save_model: best
shuffle: true
stdout_dir: stdout
tmp_log_dir: ./temp/runs/
weighted_sampler: false
weights_init: default
