{
  "task_id": "5565ec62-0596-4ee9-abf0-240a8db557d1",
  "instruction": "In Gmail, create a label named 'Benchmarking Agent'.",
  "visual": false,
  "max_steps": 1,
  "eval_procedure": [
    {
      "evaluator": "gmail",
      "function": "check_label_exists",
      "params": {
        "label_name": "Benchmarking Agent",
        "exists": true
      }
    }
  ],
  "reset_procedure": [
    {
      "evaluator": "gmail",
      "function": "delete_label",
      "params": {
        "label_name": "Benchmarking Agent"
      }
    }
  ],
  "cleanup_procedure": [
    {
      "evaluator": "gmail",
      "function": "delete_label",
      "params": {
        "label_name": "Benchmarking Agent"
      }
    }
  ],
  "max_time": 30
}
