# Reference: "Better plain ViT baselines for ImageNet-1k"
# https://arxiv.org/pdf/2205.01580.pdf
# Length of the training run; the key name indicates the unit is epochs.
epochs = 300

# Optimizer selection and its weight-decay coefficient.
# NOTE(review): how weightDecay is applied depends on the trainer's AdamW
# implementation. If it scales the decay by the learning rate (as PyTorch's
# AdamW does), the effective decay at learningRate = 0.001 is
# 0.1 * 0.001 = 1e-4 — confirm before changing either value.
optimizer = "AdamW"
weightDecay = 0.1

# Checkpoint saving is switched on for this run.
# NOTE(review): save frequency and destination are not visible here —
# presumably trainer defaults; confirm.
saveCheckpoint = true

# Input pipeline: batch size, dataset, image size and augmentation switches.
batchSize = 1024
dataset = "ImageNet"
# 224 is an exact multiple of ViTPatchSize (32): 224 / 32 = 7.
imageSize = 224
# Augmentation toggles: only `flip` is enabled; `crop` and `cut` are off.
# NOTE(review): presumably random horizontal flip, random crop and a
# cutout/CutMix-style augmentation — confirm against the data loader.
flip = true
crop = false
cut = false

# Loss/gradient regularization settings.
# NOTE(review): 0.0 presumably disables label smoothing, and grad_clip_norm
# is presumably a global gradient-norm clipping threshold — confirm in the
# trainer.
label_smoothing = 0.0
grad_clip_norm = 1.0

# Model selection.
# NOTE(review): the ViT* keys below presumably apply only when
# model = "ViT" — TODO confirm.
model = "ViT"

# NOTE(review): patch size 32 with size "S" presumably selects a ViT-S/32
# variant. With imageSize = 224 and square inputs that would be a
# 7 x 7 = 49 patch grid — confirm against the model builder.
ViTPatchSize = 32
ViTSize = "S"

# Learning-rate schedule.
# NOTE(review): "cosWarmUp" presumably means a warm-up ramp followed by
# cosine decay, with learningRate as the peak value and
# LRScheduler_StartRamp_epochs (8 of the 300 epochs) as the ramp length —
# confirm against the scheduler code.
learningRate = 0.001
lrScheduler = "cosWarmUp"
LRScheduler_StartRamp_epochs = 8
