{
    "model": "google/t5-xl-lm-adapt",
    "dataset": "ni",
    "optimizer": "adamw",
    "train_dir": "$NI_DATA_DIR",
    "warmup_proportion": 0.06,
    "total_steps": 1000,
    "learning_rate": 1e-3,
    "max_grad_norm": 0.1,
    "weight_decay": 0.01,
    "gradient_accumulation_steps": 4,
    "train_batch_size": 2,
    "predict_batch_size": 4,
    "precision": "bf16"
}
