{
    "dataset": "t0",
    "finetune_task_name": "rte",
    "train_batch_size": 8,
    "predict_batch_size": 16,
    "gradient_accumulation_steps": 1,
    "length_norm": 1,
    "mc_loss": 1,
    "unlikely_loss": 1
}