# Composition list (Hydra `defaults` syntax, judging by the `_self_` entry).
# Under Hydra, entries are merged top to bottom and later entries win on
# conflict, so the order of this list is significant.
defaults:
  # Merged first; every entry below may override its values.
  - STEVE-default
  # Position at which this file's own keys (e.g. `training`) are merged:
  # after STEVE-default and before the phyre group selections that follow.
  - _self_
  # Select the `phyre` option for each of these config groups.
  - tokenizer: phyre
  - dataset: phyre
  - transformer: phyre

training:
  # NOTE: in the STEVE train script, the parameter that actually controls the
  # batch size is `subbatch_size`, not `batch_size`.
  # `???` is the OmegaConf/Hydra marker for a mandatory value with no default
  # (assuming this file is loaded through Hydra/OmegaConf).
  # NOTE(review): presumably left unset on purpose because the train script
  # does not use it - confirm before relying on `batch_size`.
  batch_size: ???
  subbatch_size: 2
