{
    "dataset": "ni",
    "optimizer": "adamw",
    "train_dir": "$NI_DATA_DIR",
    "custom_tasks_splits": "./mttl/dataloader/ni_data/train_tasks.txt",
    "warmup_steps": 1500,
    "total_steps": 25000,
    "eval_every": 5000,
    "learning_rate": 5e-5,
    "max_grad_norm": 0.1,
    "weight_decay": 0.01,
    "train_batch_size": 8,
    "predict_batch_size": 24,
    "precision": "bf16",
    "max_input_length": 1024,
    "max_output_length": 128,
    "use_task_descriptions": true
}
