{
    "dataset": "t0",
    "train_dir": "$T0_DATA_DIR",
    "optimizer": "adafactor",
    "max_grad_norm": 1,
    "weight_decay": 0,
    "eval_every": 5000,
    "save_every": 50000,
    "total_steps": 100000,
    "learning_rate": 3e-4,
    "max_input_length": 256,
    "max_output_length": 256
}
