# https://arxiv.org/pdf/2205.01580.pdf
# Training configuration: ViT (size "S", patch size 4) on CIFAR100, optimized
# with AdamW under a "cosWarmUp" learning-rate schedule.
# NOTE(review): the linked paper is presumably the reference for these
# hyperparameters — confirm.
# NOTE(review): key names mix camelCase, snake_case and PascalCase. They are
# left as-is because the consuming code (not visible here) looks keys up by
# exact, case-sensitive name; rename only together with the loader.
epochs = 200

optimizer = "AdamW"
# NOTE(review): presumably the weight-decay coefficient handed to the
# optimizer — confirm.
weightDecay = 0.1

saveCheckpoint = true

# Data pipeline settings.
batchSize = 256
dataset = "CIFAR100"
# NOTE(review): presumably the side length in pixels of the square input
# image — confirm.
imageSize = 32
# Augmentation switches: only `flip` is enabled in this configuration.
# NOTE(review): the exact transforms behind `flip`, `crop` and `cut` are
# defined by the consumer (`cut` could mean Cutout or CutMix) — confirm.
flip = true 
crop = false
cut = false

# Regularization / stability settings.
# 0.0 presumably disables label smoothing — confirm.
label_smoothing = 0.0
# NOTE(review): presumably the maximum gradient norm used for clipping —
# confirm.
grad_clip_norm = 1.0

model = "ViT"

# ViT-specific settings.
# NOTE(review): assuming square, non-overlapping patches, imageSize = 32 with
# patch size 4 would yield an 8x8 patch grid — confirm.
ViTPatchSize = 4
# NOTE(review): "S" presumably selects the "Small" model variant — confirm.
ViTSize = "S"

# Learning-rate settings.
learningRate = 0.0005
lrScheduler = "cosWarmUp"
# NOTE(review): presumably the number of warm-up (ramp) epochs at the start of
# the schedule — confirm against the scheduler implementation.
LRScheduler_StartRamp_epochs = 1
