---
# Training run configuration: t5-3b model and tokenizer, with full
# fine-tuning and meta-training both enabled.

# Batching and checkpoint cadence.
# NOTE(review): presumably the effective batch is
# batch_size * gradient_accumulation_steps (3 * 43 = 129) - confirm
# against the training loop.
batch_size: 3
checkpoint_every_step: 3125
gradient_accumulation_steps: 43

# Prefix settings; both are zero in this configuration.
# NOTE(review): presumably unused while enable_full_finetune is true -
# confirm against the consumer.
prefix_length: 0
prefix_set_number: 0

# Training mode switches (canonical lowercase YAML booleans).
enable_full_finetune: true
enable_meta_training: true

# Model and tokenizer identifiers; kept identical to each other here.
lm_type: t5-3b
tokenizer_type: t5-3b

# Written with an explicit decimal point: YAML 1.1 loaders (e.g. PyYAML)
# resolve a bare `5e-5` as the string "5e-5" rather than a float.
learning_rate: 5.0e-5

# Length limits.
# NOTE(review): units are presumably tokens - confirm.
max_length: 512
meta_task_max_value_length: 400

max_epoch: 100

# Task-embedding options.
enable_pretrain_task_embeddings: true
task_type_vector_count_per_layer: 5
enable_new_task_embeddings: true