# Run configuration: t5-large model and tokenizer, with full fine-tuning and
# pair-sentence classification both switched on.
# NOTE(review): the per-key notes below are inferred from key names only;
# confirm them against the code that consumes this file.

# Batch sizes (presumably examples per step for training and validation).
batch_size: 16
val_batch_size: 72
gradient_accumulation_steps: 1

# Both values are 1000, so the checkpoint interval equals the total step
# count. Presumably this yields a single checkpoint at the end (TODO confirm).
checkpoint_every_step: 1000
num_training_steps: 1000

# Tokenizer and language model use the same identifier.
tokenizer_type: t5-large
lm_type: t5-large

in_context_instance_count: 3
# Presumably the maximum sequence length in tokens (TODO confirm).
max_length: 512

# Feature switches, written as canonical lowercase YAML booleans so they load
# as booleans under both YAML 1.1 and YAML 1.2 parsers.
enable_pair_sentence_classification: true
enable_full_finetune: true

# Training and evaluation both list the single mode `tag`.
training_da_mode:
  - tag
eval_da_mode:
  - tag
