# Training hyperparameters.
#
# NOTE(review): the grouping and descriptions below are inferred from the key
# names only; confirm them against the code that consumes this file.
#
# Scientific-notation floats are written with an explicit decimal point in the
# mantissa (e.g. 3.0e-4, not 3e-4). YAML 1.1 resolvers such as PyYAML's default
# loaders only recognise the former as a float; the latter is loaded as a string.

# --- Batch and augmentation settings (presumably mixup / cutmix; verify) ---
BATCH_SIZE: 256
MIXUP_ALPHA: 1.0
MIXUP_PROB: 0.4
CUTMIX_BETA: 1.0
CUTMIX_PROB: 0.4

# --- Data and model shape ---
# NOTE(review): this value is empty, which YAML parses as null. Presumably it
# must be set to the preprocessed dataset location before running — confirm how
# the loader treats a null path.
PREPROCESSED_PATH:
WIDTH: 16
NUM_CLASSES: 1000
NUM_WORKERS: 32
CROP_SIZE: 81
INIT_SCALE: 0.1

# --- Schedule (values presumably in epochs where the key says EPOCHS) ---
PURE_MLP_EPOCHS: 60
DKAN_TURN_ON_EPOCHS: 150
DKAN_TURN_ON_SCALE: 100
DKAN_TURN_ON_CAP: 0.3
DKAN_FROBENIUS_DECAY_EPOCHS: 1200
DKAN_FROBENIUS_DECAY_SCALE: 120

# --- Frobenius weight and learning rates ---
INITIAL_FROBENIUS_WEIGHT: 1.0e-3
DKAN_BASE_LR: 3.0e-4
PURE_MLP_BASE_LR: 3.0e-4
# NOTE(review): this cap (3.0e-09) is several orders of magnitude below
# INITIAL_FROBENIUS_WEIGHT (1.0e-3); confirm whether it acts as a decay target /
# lower bound rather than an upper bound.
FROBENIUS_WEIGHT_CAP: 3.0e-09
WARMUP_EPOCHS: 15

# --- Kernel / chunking parameters (semantics not visible here; verify) ---
N_CHUNKS: 6
BLOCK_SIZE_FORWARD: 1024
BLOCK_SIZE_BACKWARD: 128
TILE_SIZE_FORWARD: 8
TILE_SIZE_BACKWARD: 8

# --- Continuation-run settings ---
# NOTE(review): presumably used when resuming / extending a previous run;
# confirm against the consuming code.
N_EPOCHS_CONTINUATION: 1000
FROBENIUS_WEIGHT_CONTINUATION: 3.0e-09
# Written as 3.0e-4 (not 3e-4) so YAML 1.1 parsers such as PyYAML load it as a
# float rather than a string; the numeric value is unchanged.
LEARNING_RATE_CONTINUATION: 3.0e-4
