---
# Run configuration for the `wic` task using a t5-large tokenizer and LM.
# Comments marked "presumably" or "NOTE(review)" are inferred from key names
# only and should be confirmed against the code that consumes this file.

# Batch sizes and step schedule.
batch_size: 8
val_batch_size: 160
gradient_accumulation_steps: 1
checkpoint_every_step: 100
num_training_steps: 300

# Optimizer.
# Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML) only
# resolve exponent notation to a float when the mantissa contains a ".", so a
# bare `5e-5` would be loaded as the string "5e-5".
learning_rate: 5.0e-5

# Model and tokenizer.
tokenizer_type: t5-large
lm_type: t5-large
max_length: 512

# Prompting / fine-tuning mode.
# presumably 0 means no in-context examples are added to the input — confirm.
in_context_instance_count: 0
enable_nlu: true
enable_full_finetune: true
training_da_mode:
  - nlu
eval_da_mode:
  - nlu

# Task and data files.
running_task: wic
train_path: FewGLUE_dev32/WiC/train.jsonl
label_path: FewGLUE_dev32/WiC/labels.txt
dev_path: FewGLUE_dev32/WiC/val.jsonl
# NOTE(review): test_path points at the same file as dev_path — confirm that
# evaluating "test" on the validation split is intentional.
test_path: FewGLUE_dev32/WiC/val.jsonl

# Task embeddings and checkpointing.
enable_new_task_embeddings: true
enable_pretrain_task_embeddings: true
task_type_vector_count_per_layer: 5
save_model_each_epoch: true
