# Flat key/value settings. The meaning of each key is defined by the code that
# reads this file, which is not visible here; the section labels below are
# inferred from key names only -- TODO confirm against the consumer.
#
# Exponent-notation values are written with an explicit decimal point
# (1.0e-3, not 1e-3). YAML 1.1 loaders such as PyYAML only resolve a plain
# scalar as a float when it contains a ".", so "1e-3" would be loaded as the
# string '1e-3' rather than the number 0.001.

# Presumably data-augmentation settings -- verify against caller.
MIXUP_ALPHA: 0.2
CUTMIX_BETA: 1.0
CUTMIX_PROB: 0.5

# Presumably a weight-initialisation scale -- verify against caller.
INIT_SCALE: 0.1

# Presumably schedule settings expressed in epochs (the *_EPOCHS keys) with
# companion *_SCALE / *_CAP values; how they combine is not visible here.
PURE_MLP_EPOCHS: 500
DKAN_TURN_ON_EPOCHS: 1500
DKAN_TURN_ON_SCALE: 1000
DKAN_TURN_ON_CAP: 0.3
DKAN_FROBENIUS_DECAY_EPOCHS: 3500
DKAN_FROBENIUS_DECAY_SCALE: 200
DKAN_LEARNING_RATE_DECAY_EPOCHS: 4500
DKAN_LEARNING_RATE_DECAY_SCALE: 750

# Presumably regularisation weight and base learning rates -- verify.
INITIAL_FROBENIUS_WEIGHT: 1.0e-3
DKAN_BASE_LR: 1.0e-3
PURE_MLP_BASE_LR: 1.0e-3
# NOTE(review): this value (1.0e-10) is far below INITIAL_FROBENIUS_WEIGHT
# (1.0e-3); confirm whether the consumer treats it as a lower bound (floor)
# rather than an upper cap.
FROBENIUS_WEIGHT_CAP: 1.0e-10

# Presumably training-loop settings -- verify against caller.
WARMUP_EPOCHS: 10
BATCH_SIZE: 512
N_CHUNKS: 6

# Presumably kernel block/tile sizes for forward and backward passes -- verify.
BLOCK_SIZE_FORWARD: 1024
BLOCK_SIZE_BACKWARD: 512
TILE_SIZE_FORWARD: 8
TILE_SIZE_BACKWARD: 8
