# Training configuration (flat key/value mapping).
# NOTE(review): the per-key descriptions below are inferred from the key names
# only; confirm them against the code that consumes this file.

# Presumably the base learning rate. Written with an explicit decimal point
# because YAML 1.1 resolvers (e.g. PyYAML) treat a bare `1e-3` as a string,
# not a float; `1.0e-3` resolves to the float 0.001 under YAML 1.1 and 1.2.
BASE_LR: 1.0e-3
# Presumably the length of the learning-rate warmup phase (unit not shown here; TODO confirm).
N_WARMUP: 10
# Presumably the total number of training epochs.
NUM_EPOCHS: 32500
# Presumably the scale of the learning-rate decay schedule (unit not shown here; TODO confirm).
LEARNING_RATE_DECAY_SCALE: 5000
# Presumably the number of samples per training batch.
BATCH_SIZE: 8192
# Presumably the number of inner (hidden) layers in the model.
N_INNER_LAYERS: 1
# Presumably the width of the hidden layers.
HIDDEN_DIM: 256
# Presumably how often metrics are recorded (unit not shown here; TODO confirm).
RECORD_INTERVAL: 10
# Task selector; the set of accepted values is defined by the consuming code.
TASK: DISTANCES
