# Hydra-style defaults list: the entries below are the configs composed
# together with this file. Per Hydra's composition rules, later entries take
# precedence over earlier ones, so the order of this list is significant.
defaults:
  # Base config that this file builds on.
  - STEVE-default
  # Position at which this file's own keys (e.g. `training` below) are merged:
  # after STEVE-default, but before the three config-group selections.
  - _self_
  # Config-group selections (group: option).
  # NOTE(review): since these come after _self_, any key they set would take
  # precedence over the same key in this file — confirm that is intended.
  - tokenizer: phyre
  - dataset: phyre-labeled
  - transformer: phyre

# Training settings defined by this file.
# NOTE(review): the meaning of each key is defined by the consuming training
# code, which is not visible here — the notes below are assumptions to confirm.
training:
  batch_size: 50
  epochs: 200
  # presumably the number of batches drawn per epoch — TODO confirm
  batches_per_epoch: 10
  # presumably the chunk size each batch is processed in; 50 is evenly
  # divisible by 2 — TODO confirm against the training loop
  subbatch_size: 2
