# Configuration for the model variant named `esmc_300m`.
# NOTE(review): `defaults` looks like a Hydra-style defaults list that pulls in
# a base `esmc` config, with the keys below overriding it — confirm against the
# config loader.
defaults:
  - esmc

name: esmc_300m
batch_size: 64
# NOTE(review): presumably 1 means no gradient accumulation (one optimizer step
# per batch) — confirm against the trainer that consumes this key.
accumulate_grad_batches: 1

prediction_head:
  # NOTE(review): presumably must equal the embedding width produced by the
  # esmc_300m encoder — verify before changing.
  input_dim: 960

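# Disabled search space: the entries below are commented out and have no effect
# until they are uncommented.
# search_space: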
#   model.batch_size: choice(4, 8, 16, 32, 64, 128)
#   model.loss: choice(mse, huber, l1)
#   model.learning_rate: tag(log, interval(1e-6, 1e-3))
#   model.weight_decay: tag(log, interval(1e-4, 1e-1))
