# Hyperparameters from the SAM paper, except the batch size (BS=4096 in the paper; see batchSize below).
# Run-wide settings: logging, run length, seeding, optimizer, checkpointing,
# reporting, data loading/augmentation and loss/gradient options.
[general]
# Log output location.
# NOTE(review): logSubDir is presumably resolved inside logDir, and the
# relative logDir against the working directory -- confirm in the consumer.
logDir = ../logs
logSubDir = test
truncate = False

contin = False
epochs = 100

# NOTE(review): rndSeed holds a boolean here rather than a seed value; confirm
# how the consumer interprets it.
rndSeed = False
deterministic = False

# Optimizer selection and its hyperparameters.
optimizer = SGD
momentum = 0.9 
weightDecay = 0.0001
nesterov = False

# saveCheckpoint and keepLastCheckpoint are both False and checkpointsList has
# an empty value in this configuration.
# NOTE(review): saveCheckpointInterval = 0 presumably means "no periodic
# checkpoints" -- confirm.
saveCheckpoint = False
keepLastCheckpoint = False
checkpointsList = 
saveCheckpointInterval = 0

# metrics holds several names separated by spaces.
verbose = False
logEach = 1
metrics = learningRate loss accuracy

# Data loading and augmentation.
# dataDir starts with '~'; the INI format itself does not expand it, so the
# consumer presumably does -- confirm.
# cut, randAugment and mixup are all False here, so cutoutProp,
# randAugment_magnitude and mixupProp presumably have no effect -- confirm.
dataThreads = 6 
dataDir = ~/.datasets
batchSize = 1024
dataset = ImageNet 
imageSize = 224
flip = True 
crop = False
cut = False
cutoutProp = 0.5
randAugment = False 
randAugment_magnitude = 10
mixup = False
mixupProp = 0.2

label_smoothing = 0.1

# NOTE(review): grad_clip_norm = 0.0 presumably disables gradient clipping --
# confirm.
grad_clip_norm = 0.0
normalize = std


# Model selection and architecture parameters.
[models]
model = resnet
dropout = 0.0
BN = True
depth = 50
widthFactor = 4
# NOTE(review): the ViT* keys are presumably read only when a ViT model is
# selected; model is resnet in this configuration -- confirm.
ViTPatchsize = 32
ViTSize = S

# Learning-rate value and scheduler parameters.
# The section name contains a space; it must be looked up by exactly this name.
[learning rate]
learningRate = 1.0
# lrScheduler lists two space-separated names (startRamp, cos).
# NOTE(review): the LRScheduler_<name>_* keys below presumably parameterise the
# scheduler of the matching name, and those for names not listed in
# lrScheduler (step, exp, WRN) are presumably unused here -- confirm.
lrScheduler = startRamp cos

LRScheduler_StartRamp_epochs = 1

LRScheduler_step_steps = 3
LRScheduler_step_gamma = 0.2

LRScheduler_exp_maxDecay = 0.01
LRScheduler_cos_periods = 0.5

LRScheduler_WRN_T0 = 50
LRScheduler_WRN_Tmult = 1.2

# SAM settings: rho value and its scheduler.
[SAM]
rho = 0.3
# NOTE(review): rhoScheduler is const here, so the StartRamp/StartJump epoch
# settings below are presumably unused -- confirm.
rhoScheduler = const
rhoScheduler_StartRamp_epochs = 8
rhoScheduler_StartJump_epochs = 8

# ESAM settings (beta and gamma).
# NOTE(review): presumably read only when the ESAM variant is in use -- confirm.
[ESAM]
ESAMbeta = 0.5
ESAMgamma = 0.5

# lookSAM settings (k and alpha).
# NOTE(review): presumably read only when the lookSAM variant is in use -- confirm.
[lookSAM]
lookSAMk = 10
lookSAMalpha = 0.7