[
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 11,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Tell me the the number of reviews that our store received by far that mention term \"{{term}}\"",
    "instantiation_dict": {
      "term": "disappointed"
    },
    "intent": "Tell me the the number of reviews that our store received by far that mention term \"disappointed\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "6"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "6"
    },
    "intent_template_id": 288,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 14,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Tell me the the number of reviews that our store received by far that mention term \"{{term}}\"",
    "instantiation_dict": {
      "term": "not useful"
    },
    "intent": "Tell me the the number of reviews that our store received by far that mention term \"not useful\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "0"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "0"
    },
    "intent_template_id": 288,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 16,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Compare the time for walking and driving route from {{start}} to {{end}}",
    "instantiation_dict": {
      "start": "5000 Fifth Avenue, Pittsburgh",
      "end": "UPMC family health center"
    },
    "intent": "Compare the time for walking and driving route from 5000 Fifth Avenue, Pittsburgh to UPMC family health center",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "driving: 2min",
          "walking: 16min"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Driving: 2min. Walking: 16min."
    },
    "intent_template_id": 73,
    "API-solvable": true,
    "API_calls_required": 4,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 21,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__/6s-wireless-headphones-over-ear-noise-canceling-hi-fi-bass-foldable-stereo-wireless-kid-headsets-earbuds-with-built-in-mic-micro-sd-tf-fm-for-iphone-samsung-ipad-pc-black-gold.html",
    "geolocation": null,
    "intent_template": "List out reviewers, if exist, who mention about {{description}}",
    "instantiation_dict": {
      "description": "ear cups being small"
    },
    "intent": "List out reviewers, if exist, who mention about ear cups being small",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Joseph Brzezinski",
          "Catso",
          "Dibbins",
          "Anglebert Dinkherhump",
          "Michelle Davis"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Joseph Brzezinski, Catso, Dibbins, Anglebert Dinkherhump, Michelle Davis"
    },
    "intent_template_id": 222,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 26,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__/epson-workforce-wf-3620-wifi-direct-all-in-one-color-inkjet-printer-copier-scanner-amazon-dash-replenishment-ready.html",
    "geolocation": null,
    "intent_template": "List out reviewers, if exist, who mention about {{description}}",
    "instantiation_dict": {
      "description": "complain of the customer service"
    },
    "intent": "List out reviewers, if exist, who mention about complain of the customer service",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Bob in Vegas",
          "RemyR"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Bob in Vegas, RemyR"
    },
    "intent_template_id": 222,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 43,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "List the top {{n}} search terms in my store",
    "instantiation_dict": {
      "n": "3"
    },
    "intent": "List the top 3 search terms in my store",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "hollister",
          "Joust Bag",
          "Antonia Racer Tank"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "hollister, Joust Bag, Antonia Racer Tank"
    },
    "intent_template_id": 285,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 45,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__/a11yproject/a11yproject.com",
    "geolocation": null,
    "intent_template": "Check out the most recent open issues",
    "instantiation_dict": {},
    "intent": "Check out the most recent open issues",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/a11yproject/a11yproject.com/-/issues/?sort=created_asc&state=opened",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 300,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 47,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Today is 6/12/2023. Tell me how many fulfilled orders I have {{period}}, and the total amount of money I spent.",
    "instantiation_dict": {
      "period": "over the past month"
    },
    "intent": "Today is 6/12/2023. Tell me how many fulfilled orders I have over the past month, and the total amount of money I spent.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "0 order",
          "$0 total spend"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "0 order, $0 total spend"
    },
    "intent_template_id": 197,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 51,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Today is 6/12/2023. Tell me how many fulfilled orders I have {{period}}, and the total amount of money I spent.",
    "instantiation_dict": {
      "period": "over the past six month"
    },
    "intent": "Today is 6/12/2023. Tell me how many fulfilled orders I have over the past six month, and the total amount of money I spent.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "12 orders",
          "$1603.69 total spend"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "12 orders, $1603.69 total spend"
    },
    "intent_template_id": 197,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 54,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "How long does it take to walk from {{start}} to {{end}}?",
    "instantiation_dict": {
      "start": "Carnegie Mellon University",
      "end": "Univ of Pittsburgh"
    },
    "intent": "How long does it take to walk from Carnegie Mellon University to Univ of Pittsburgh?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "25 min"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "25 min"
    },
    "intent_template_id": 68,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 66,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Among the top {{number}} post in \"{{subreddit}}\" forum, {{description}}",
    "instantiation_dict": {
      "number": 10,
      "subreddit": "books",
      "description": "show me the post URLs that recommand a single book"
    },
    "intent": "Among the top 10 post in \"books\" forum, show me the post URLs that recommand a single book",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "http://www.reddit.com/f/books/59396/apple-books-has-a-free-audiobook-of-a-christmas-carol",
          "http://www.reddit.com/f/books/17445/i-just-finished-reading-the-hobbit-to-my-6-year-old-daughter"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "__REDDIT__/f/books/59396/apple-books-has-a-free-audiobook-of-a-christmas-carol, __REDDIT__/f/books/17445/i-just-finished-reading-the-hobbit-to-my-6-year-old-daughter"
    },
    "intent_template_id": 17,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 84,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "From my stay at {{hotel}}, what's the estimated driving time to reach {{place}}?",
    "instantiation_dict": {
      "hotel": "DoubleTree by Hilton New York Downtown",
      "place": "Keens Steakhouse"
    },
    "intent": "From my stay at DoubleTree by Hilton New York Downtown, what's the estimated driving time to reach Keens Steakhouse?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "14 minutes"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "14 minutes"
    },
    "intent_template_id": 64,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 89,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Which US states border {{state}}?",
    "instantiation_dict": {
      "state": "Connecticut"
    },
    "intent": "Which US states border Connecticut?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Rhode Island",
          "Massachusetts",
          "New York"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Rhode Island, Massachusetts, New York"
    },
    "intent_template_id": 67,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 90,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Which US states border {{state}}?",
    "instantiation_dict": {
      "state": "Pennsylvania"
    },
    "intent": "Which US states border Pennsylvania?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Ohio",
          "Maryland",
          "New York",
          "New Jersey",
          "Delaware",
          "West Virginia"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Ohio, Maryland, New York, New Jersey, Delaware, West Virginia"
    },
    "intent_template_id": 67,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 92,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Which US states border {{state}}?",
    "instantiation_dict": {
      "state": "Vermont"
    },
    "intent": "Which US states border Vermont?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "New York",
          "New Hampshire",
          "Massachusetts"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "New York, New Hampshire, Massachusetts"
    },
    "intent_template_id": 67,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 102,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Display the list of issues in the {{repo}} repository that have labels related to {{label}}",
    "instantiation_dict": {
      "label": "help needed",
      "repo": "a11yproject/a11yproject.com"
    },
    "intent": "Display the list of issues in the a11yproject/a11yproject.com repository that have labels related to help needed",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/byteblaze/a11y-syntax-highlighting/-/issues/?label_name%5B%5D=help%20wanted",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 349,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 109,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Presents the monthly count of successful orders {{period}} in MM:COUNT format",
    "instantiation_dict": {
      "period": "from Jan to December 2022"
    },
    "intent": "Presents the monthly count of successful orders from Jan to December 2022 in MM:COUNT format",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "January: 11 orders",
          "February: 16 orders",
          "March: 14 orders",
          "April: 7 orders",
          "May: 8 orders",
          "June: 13 orders",
          "July: 9 orders",
          "August: 8 orders",
          "September: 10 orders",
          "October: 4 orders",
          "November: 5 orders",
          "December: 10 orders"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "January: 11 orders February: 16 orders March: 14 orders April: 7 orders May: 8 orders June: 13 orders July: 9 orders August: 8 orders September: 10 orders October: 4 orders November: 5 orders December: 10 orders"
    },
    "intent_template_id": 270,
    "API-solvable": true,
    "API_calls_required": 12,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 112,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Show me the customers who have expressed dissatisfaction with {{product}}?",
    "instantiation_dict": {
      "product": "Circe fleece"
    },
    "intent": "Show me the customers who have expressed dissatisfaction with Circe fleece?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "exact_match": "Hannah Lim"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Hannah Lim"
    },
    "intent_template_id": 245,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 115,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Show me the name of the customers who have expressed dissatisfaction with {{product}}",
    "instantiation_dict": {
      "product": "Chloe tank"
    },
    "intent": "Show me the name of the customers who have expressed dissatisfaction with Chloe tank",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": "N/A"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "There is no negative review for Chloe tank",
      "reference_answer_raw_annotation": ""
    },
    "intent_template_id": 245,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 121,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Tell me the reasons why customers like {{product}}",
    "instantiation_dict": {
      "product": "Circe hooded fleece"
    },
    "intent": "Tell me the reasons why customers like Circe hooded fleece",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "Warm and comfortable. True to size."
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Warm and comfortable. True to size."
    },
    "intent_template_id": 250,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 138,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "What is the estimated driving time between {{city1}} and {{city2}}?",
    "instantiation_dict": {
      "city1": "the big apple",
      "city2": "the city with the most authentic Philly cheesesteaks"
    },
    "intent": "What is the estimated driving time between the big apple and the city with the most authentic Philly cheesesteaks?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "1h 58min"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "1h 58min"
    },
    "intent_template_id": 51,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 153,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "What is the minimum travel time by car from {{location1}} to {{location2}}?",
    "instantiation_dict": {
      "location1": "REI",
      "location2": "CMU"
    },
    "intent": "What is the minimum travel time by car from REI to CMU?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "7min"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "7min"
    },
    "intent_template_id": 36,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 154,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "What is the minimum travel time by car from {{location1}} to {{location2}}?",
    "instantiation_dict": {
      "location1": "CMU gates building",
      "location2": "Schenley park"
    },
    "intent": "What is the minimum travel time by car from CMU gates building to Schenley park?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "4min"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "4min"
    },
    "intent_template_id": 36,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 162,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "I have a lot of Nintendo Switch game cards now, help me find the best storage option to fit all {{num}} cards",
    "instantiation_dict": {
      "num": 40
    },
    "intent": "I have a lot of Nintendo Switch game cards now, help me find the best storage option to fit all 40 cards",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/game-card-holder-storage-case-for-nintendo-switch-games-or-ps-vita-game-case-or-sd-memory-cards-black.html",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 171,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 167,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__/photosmart-plus-b209-clr-inkjetfb-p-s-c-usb-wrls-1.html",
    "geolocation": null,
    "intent_template": "What are the main criticisms of this product? Please extract the relevant sentences.",
    "instantiation_dict": {},
    "intent": "What are the main criticisms of this product? Please extract the relevant sentences.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "The wireless connection works on a whim (about 40% of the time I've owned it)",
          "It seems to constantly run out of ink",
          "Cartridge prices are less than some printers I've had",
          "This printer seems to have more reasons NOT to work (none that are findable or correctable) Ex: error boxes saying that it's out of paper when it automatically switches to photo printing for some reason",
          "Scanner is as slow as my first scanner I ever owned in the mid-90's",
          "For the $176 I paid, there isn't even a fax component on it. I guess the \"PLUS\" part of it's name is in reference to the migraines it causes when you can't figure out the new reason why it's not working for the 10th time in the past 2 months."
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "The wireless connection works on a whim (about 40% of the time I've owned it). It seems to constantly run out of ink. Cartridge prices are less than some printers I've had, but now I understand why. This printer seems to have more reasons NOT to work (none that are findable or correctable) Ex: error boxes saying that it's out of paper when it automatically switches to photo printing for some reason. Scanner is as slow as my first scanner I ever owned in the mid-90's. For the $176 I paid, there isn't even a fax component on it. I guess the \"PLUS\" part of it's name is in reference to the migraines it causes when you can't figure out the new reason why it's not working for the 10th time in the past 2 months."
    },
    "intent_template_id": 136,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 184,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Give me the {{Attribute}} of the products that have {{N}} units left",
    "instantiation_dict": {
      "Attribute": "name",
      "N": "0"
    },
    "intent": "Give me the name of the products that have 0 units left",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "exact_match": "Sinbad Fitness Tank"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Sinbad Fitness Tank"
    },
    "intent_template_id": 368,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 189,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Tell me the total cost of my latest {{status}} order?",
    "instantiation_dict": {
      "status": "pending"
    },
    "intent": "Tell me the total cost of my latest pending order?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "754.99"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "754.99"
    },
    "intent_template_id": 214,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 191,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Tell me the total cost of my latest {{status}} order?",
    "instantiation_dict": {
      "status": "processing"
    },
    "intent": "Tell me the total cost of my latest processing order?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": "N/A"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "There is no order of \"processing\" status",
      "reference_answer_raw_annotation": "There is no order of \"processing\" status"
    },
    "intent_template_id": 214,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 198,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Get the {{attribute}} of the {{status}} order",
    "instantiation_dict": {
      "attribute": "customer name",
      "status": "most recent cancelled"
    },
    "intent": "Get the customer name of the most recent cancelled order",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "exact_match": "Lily Potter"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Lily Potter"
    },
    "intent_template_id": 366,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 202,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Get the {{attribute}} of the {{status}} order",
    "instantiation_dict": {
      "attribute": "date",
      "status": "most recent canlled"
    },
    "intent": "Get the date of the most recent canlled order",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "May 23 2023"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "May 23, 2023"
    },
    "intent_template_id": 366,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 212,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Find the customer name and email with phone number {{PhoneNum}}",
    "instantiation_dict": {
      "PhoneNum": "555-229-3326"
    },
    "intent": "Find the customer name and email with phone number 555-229-3326",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Veronica Costello",
          "roni_cost@example.com"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Veronica Costello, roni_cost@example.com"
    },
    "intent_template_id": 364,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 214,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "What are the key aspects that the customers don't like about {{product}}",
    "instantiation_dict": {
      "product": "Zing Jump Rope"
    },
    "intent": "What are the key aspects that the customers don't like about Zing Jump Rope",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": [
          "It is hard to find the right size. Won't last long"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "It is hard to find the right size. Won't last long"
    },
    "intent_template_id": 249,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 228,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "What is the price range for products from {{brand}}?",
    "instantiation_dict": {
      "brand": "sephora"
    },
    "intent": "What is the price range for products from sephora?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "18.18",
          "94.99"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "$18.18 - $94.99"
    },
    "intent_template_id": 370,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 232,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Get the order number of my most recent {{status}} order ",
    "instantiation_dict": {
      "status": "pending"
    },
    "intent": "Get the order number of my most recent pending order ",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "189"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "000000189"
    },
    "intent_template_id": 213,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 242,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "I am doing a market survey for one stop market, show me the most expensive product from {{product_category}} category",
    "instantiation_dict": {
      "product_category": "Household Supplies"
    },
    "intent": "I am doing a market survey for one stop market, show me the most expensive product from Household Supplies category",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/lynx-battery-12v-200ah-lithium-iron-phosphate-lifepo4-prismatic-deep-cell-battery-set-of-4-3-2v-cells-with-3-bus-bars-and-8-lug-nuts-for-rv-solar-marine-off-grid-applications.html",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 138,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 250,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Tell me the coordinates of {{location}} in DD format",
    "instantiation_dict": {
      "location": "Apple Store near Pitt"
    },
    "intent": "Tell me the coordinates of Apple Store near Pitt in DD format",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "40.451",
          "-79.933"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "40.4511693, -79.9334241"
    },
    "intent_template_id": 46,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "wikipedia",
      "map"
    ],
    "task_id": 266,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "What's the closest national park to {{city}}?",
    "instantiation_dict": {
      "city": "the largest city in Maine"
    },
    "intent": "What's the closest national park to the largest city in Maine?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "exact_match": "Acadia National Park"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Acadia National Park"
    },
    "intent_template_id": 85,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 269,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show me products under ${{price}} in \"{{product_category}}\" category",
    "instantiation_dict": {
      "price": "25",
      "product_category": "women shoes"
    },
    "intent": "Show me products under $25 in \"women shoes\" category",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/clothing-shoes-jewelry/women/shoes.html?price=0-25",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 139,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 273,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show me products under ${{price}} in \"{{product_category}}\" category",
    "instantiation_dict": {
      "price": "199",
      "product_category": "furtiture with accent"
    },
    "intent": "Show me products under $199 in \"furtiture with accent\" category",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/home-kitchen/furniture/accent-furniture.html?price=0-199",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 139,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 286,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show the least expensive {{product}} with a minimum storage capacity of {{min_storage}}.",
    "instantiation_dict": {
      "product": "ssd hard drive",
      "min_storage": "1TB"
    },
    "intent": "Show the least expensive ssd hard drive with a minimum storage capacity of 1TB.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/external-hard-drive-2tb-ultra-thin-external-hard-drive-2000gb-ultra-high-speed-portable-3-1-type-c-storage-drive-compatible-with-pc-laptop-and-mac-2tb-a1.html",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 207,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 298,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show the most recent {{status}} order",
    "instantiation_dict": {
      "status": "completed"
    },
    "intent": "Show the most recent completed order",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/sales/order/view/order_id/180/",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 180,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 301,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show the most recent {{status}} order",
    "instantiation_dict": {
      "status": "processing"
    },
    "intent": "Show the most recent processing order",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": "N/A"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "there is no order in processing"
    },
    "intent_template_id": 180,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 320,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "How much refund I should expect from my order canlled in {{time}}, including shipping fee",
    "instantiation_dict": {
      "time": "Feb 2023"
    },
    "intent": "How much refund I should expect from my order canlled in Feb 2023, including shipping fee",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "406.53"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "406.53"
    },
    "intent_template_id": 160,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 330,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "How much I spend {{time}} on shopping at One Stop Market?",
    "instantiation_dict": {
      "time": "in March 2023"
    },
    "intent": "How much I spend in March 2023 on shopping at One Stop Market?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "81.31"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "81.31"
    },
    "intent_template_id": 147,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 340,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__/primer/design",
    "geolocation": null,
    "intent_template": "List all opened issues {{description}}",
    "instantiation_dict": {
      "description": "that report bugs"
    },
    "intent": "List all opened issues that report bugs",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/primer/design/-/issues/?label_name%5B%5D=type%3A%20bug%20%F0%9F%90%9E",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 299,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 355,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "List products from {{product_category}} category by {{order}} price",
    "instantiation_dict": {
      "product_category": "kids' bedding",
      "order": "descending"
    },
    "intent": "List products from kids' bedding category by descending price",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/home-kitchen/bedding/kids-bedding.html?product_list_dir=desc",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 137,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 357,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Checkout merge requests requiring my review",
    "instantiation_dict": {},
    "intent": "Checkout merge requests requiring my review",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/dashboard/merge_requests?reviewer_username=byteblaze",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 291,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 358,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show me the {{info}} for order number {{order_number}}.",
    "instantiation_dict": {
      "info": "shipping method",
      "order_number": 187
    },
    "intent": "Show me the shipping method for order number 187.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Flat Rate - Fixed"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Flat Rate - Fixed"
    },
    "intent_template_id": 206,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 360,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Show me the {{info}} for order number {{order_number}}.",
    "instantiation_dict": {
      "info": "product names",
      "order_number": "148"
    },
    "intent": "Show me the product names for order number 148.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "must_include": [
          "Bornbridge Artificial Spiral Topiary Tree - Indoor / Outdoor Topiary Trees - Artificial Outdoor Plants (2 Pack, 4' Cypress)",
          "Russound 5B45W 4\" Indoor Outdoor Speakers White"
        ]
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "",
      "reference_answer_raw_annotation": "Bornbridge Artificial Spiral Topiary Tree - Indoor / Outdoor Topiary Trees - Artificial Outdoor Plants (2 Pack, 4' Cypress), Russound 5B45W 4\" Indoor Outdoor Speakers White"
    },
    "intent_template_id": 206,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 376,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Summarize customer reviews for {{product}}.",
    "instantiation_dict": {
      "product": "Amazon Echo Dot 3rd generation"
    },
    "intent": "Summarize customer reviews for Amazon Echo Dot 3rd generation.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": "N/A"
      },
      "reference_url": "",
      "program_html": [],
      "string_note": "There is no review for this product",
      "reference_answer_raw_annotation": "N/A"
    },
    "intent_template_id": 182,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "map"
    ],
    "task_id": 378,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Find the {{space}} around {{location}}",
    "instantiation_dict": {
      "location": "CMU main campus",
      "space": "parking"
    },
    "intent": "Find the parking around CMU main campus",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match"
      ],
      "reference_answers": null,
      "reference_url": "__MAP__/search?query=parking%20near%20carnegie%20mellon%20university",
      "program_html": [],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 59,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 391,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Post \"{{content}}\" for the merge request related to {{mr}} in {{repo}} project",
    "instantiation_dict": {
      "mr": "focus edge cases",
      "repo": "a11yproject/a11yproject.com",
      "content": "close because non reproducible"
    },
    "intent": "Post \"close because non reproducible\" for the merge request related to focus edge cases in a11yproject/a11yproject.com project",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/a11yproject/a11yproject.com/-/merge_requests/1265",
          "locator": "document.querySelector('[id=\"notes-list\"').lastElementChild.querySelector('.timeline-discussion-body').outerText",
          "required_contents": {
            "exact_match": "close because non reproducible"
          }
        }
      ]
    },
    "intent_template_id": 348,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 395,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Fork {{repo}}.",
    "instantiation_dict": {
      "repo": "the Pytorch GAN repo with most stars"
    },
    "intent": "Fork the Pytorch GAN repo with most stars.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/byteblaze/PyTorch-GAN",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Pytorch-GAN"
            ]
          }
        }
      ]
    },
    "intent_template_id": 352,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 398,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Fork {{repo}}.",
    "instantiation_dict": {
      "repo": "all source repos from Akilesh Kannan"
    },
    "intent": "Fork all source repos from Akilesh Kannan",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/byteblaze/SimCache",
          "locator": "",
          "required_contents": {
            "must_include": [
              "SimCache"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/dots",
          "locator": "",
          "required_contents": {
            "must_include": [
              "dots"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/CacheEval",
          "locator": "",
          "required_contents": {
            "must_include": [
              "CacheEval"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/nvidia-patch",
          "locator": "",
          "required_contents": {
            "must_include": [
              "404"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/viewgrades-scraper",
          "locator": "",
          "required_contents": {
            "must_include": [
              "404"
            ]
          }
        }
      ]
    },
    "intent_template_id": 352,
    "API-solvable": true,
    "API_calls_required": 7,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 400,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Change my reddit bio to \"{{content}}\"",
    "instantiation_dict": {
      "content": "Pro Python Developer with 20 years of Experience"
    },
    "intent": "Change my reddit bio to \"Pro Python Developer with 20 years of Experience\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__REDDIT__/user/MarvelsGrantMan136",
          "locator": "document.querySelector(\".user-bio__biography\").outerText",
          "required_contents": {
            "exact_match": "Pro Python Developer with 20 years of Experience"
          }
        }
      ]
    },
    "intent_template_id": 6,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 440,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "I previously ordered some {{product}} {{time}} and later cancelled. Can you reorder it for me?",
    "instantiation_dict": {
      "product": "a make up removal kit",
      "time": "during summer 2022"
    },
    "intent": "I previously ordered some a make up removal kit during summer 2022 and later cancelled. Can you reorder it for me?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "func:shopping_get_latest_order_url()",
          "locator": "document.querySelector(\".order-details-items.ordered\").outerText",
          "required_contents": {
            "must_include": [
              "B0738JQG6Q"
            ]
          }
        }
      ]
    },
    "intent_template_id": 156,
    "API-solvable": true,
    "API_calls_required": 4,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 446,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Assign the issue regarding {{issue}} in {{repo}} to {{account}}.",
    "instantiation_dict": {
      "repo": "a11yproject",
      "issue": 404,
      "account": "Roshanjossey"
    },
    "intent": "Assign the issue regarding 404 in a11yproject to Roshanjossey.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/dashboard/issues?scope=all&state=opened&assignee_username=Roshanjossey",
          "locator": "",
          "required_contents": {
            "must_include": [
              "404s, bad host, timeouts, bad urls for URLs linked from website"
            ]
          }
        }
      ]
    },
    "intent_template_id": 999,
    "API-solvable": true,
    "API_calls_required": 4,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 465,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Add {{product}} to my wish list",
    "instantiation_dict": {
      "product": "Tide PODS Spring Meadow Scent HE Turbo Laundry Detergent Pacs, 81 Count"
    },
    "intent": "Add Tide PODS Spring Meadow Scent HE Turbo Laundry Detergent Pacs, 81 Count to my wish list",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/wishlist/",
          "locator": "document.querySelector('.products-grid.wishlist').outerText",
          "required_contents": {
            "must_include": [
              "Tide PODS Spring Meadow Scent HE Turbo Laundry Detergent Pacs, 81 Count"
            ]
          }
        }
      ]
    },
    "intent_template_id": 186,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 466,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Add {{product}} to my wish list",
    "instantiation_dict": {
      "product": "2 Hawaiian Bamboo Orchid Roots #zc50 - by Discount Hawaiian Gifts"
    },
    "intent": "Add 2 Hawaiian Bamboo Orchid Roots #zc50 - by Discount Hawaiian Gifts to my wish list",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/wishlist/",
          "locator": "document.querySelector('.products-grid.wishlist').outerText",
          "required_contents": {
            "must_include": [
              "2 Hawaiian Bamboo Orchid Roots #zc50 - by Discount Hawaiian Gifts"
            ]
          }
        }
      ]
    },
    "intent_template_id": 186,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 470,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Cancel order {{id}}",
    "instantiation_dict": {
      "id": "302"
    },
    "intent": "Cancel order 302",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/sales/order/view/order_id/302/",
          "locator": "document.querySelector(\"#order_status\").outerText",
          "required_contents": {
            "exact_match": "Canceled"
          }
        }
      ]
    },
    "intent_template_id": 257,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 471,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Cancel order {{id}}",
    "instantiation_dict": {
      "id": "307"
    },
    "intent": "Cancel order 307",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/sales/order/view/order_id/307/",
          "locator": "document.querySelector(\"#order_status\").outerText",
          "required_contents": {
            "exact_match": "Canceled"
          }
        }
      ]
    },
    "intent_template_id": 257,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 473,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Cancel order {{id}}",
    "instantiation_dict": {
      "id": "301"
    },
    "intent": "Cancel order 301",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/sales/order/view/order_id/301/",
          "locator": "document.querySelector(\"#order_status\").outerText",
          "required_contents": {
            "exact_match": "Canceled"
          }
        }
      ]
    },
    "intent_template_id": 257,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 482,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "{{name}} wants to check my dotfile configurations. Please invite him to the repo as a guest.",
    "instantiation_dict": {
      "name": "yjlou"
    },
    "intent": "yjlou wants to check my dotfile configurations. Please invite him to the repo as a guest.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/byteblaze/dotfiles/-/project_members",
          "locator": "func:gitlab_get_project_memeber_role(__page__, 'yjlou')",
          "required_contents": {
            "must_include": [
              "Guest"
            ]
          }
        }
      ]
    },
    "intent_template_id": 294,
    "API-solvable": true,
    "API_calls_required": 3,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 488,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Change the page title of \"{{old-heading}}\" page on my site to \"{{heading}}\".",
    "instantiation_dict": {
      "old-heading": "Home Page",
      "heading": "This is the home page!! Leave here!!"
    },
    "intent": "Change the page title of \"Home Page\" page on my site to \"This is the home page!! Leave here!!\".",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/cms/page/edit/page_id/2/",
          "locator": "document.querySelector('input[name=\"title\"]').value",
          "required_contents": {
            "exact_match": "This is the home page!! Leave here!!"
          }
        }
      ]
    },
    "intent_template_id": 275,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 495,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Notify {{name}} in their most recent pending order with message \"{{message}}\"",
    "instantiation_dict": {
      "name": "Lily Potter",
      "message": "Thanks, your order is ready to be shipped!"
    },
    "intent": "Notify Lily Potter in their most recent pending order with message \"Thanks, your order is ready to be shipped!\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/sales/order/view/order_id/303/",
          "locator": "document.querySelector(\"#order_history_block\").querySelector(\".note-list\").firstElementChild.querySelector(\".note-list-comment\").outerText",
          "required_contents": {
            "exact_match": "Thanks, your order is ready to be shipped!"
          }
        }
      ]
    },
    "intent_template_id": 280,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 507,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Buy the highest rated product from the {{product_category}} category within a budget {{dollar_value}}.",
    "instantiation_dict": {
      "product_category": "Ceiling light",
      "dollar_value": "above 1000"
    },
    "intent": "Buy the highest rated product from the Ceiling light category within a budget above 1000.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "func:shopping_get_latest_order_url()",
          "locator": "document.querySelector(\".order-details-items.ordered\").outerText",
          "required_contents": {
            "must_include": [
              "B07BVL3P1V"
            ]
          }
        }
      ]
    },
    "intent_template_id": 172,
    "API-solvable": true,
    "API_calls_required": 4,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 520,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__/magnetic-metal-stainless-steel-d-pads-kits-directional-pad-replacement-parts-for-xbox-one-elite-controller-elite-series-2-xbox-one-xbox-one-s-x-controller.html",
    "geolocation": null,
    "intent_template": "Add this product to my wishlist",
    "instantiation_dict": {},
    "intent": "Add this product to my wishlist",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/wishlist/",
          "locator": "document.querySelector('.products-grid.wishlist').outerText",
          "required_contents": {
            "must_include": [
              "Magnetic Metal Stainless Steel D-pads Kits Directional Pad Replacement Parts for Xbox One Elite Controller, Elite Series 2, Xbox One, Xbox One S/X Controller"
            ]
          }
        }
      ]
    },
    "intent_template_id": 196,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 521,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Subscribe to the newsletter of OneStopMarket",
    "instantiation_dict": {},
    "intent": "Subscribe to the newsletter of OneStopMarket",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/newsletter/manage/",
          "locator": "document.querySelector('[title=\"General Subscription\"]').checked.toString()",
          "required_contents": {
            "exact_match": "true"
          }
        }
      ]
    },
    "intent_template_id": 199,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 527,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Star the top {{number}} most starred repos in Gitlab",
    "instantiation_dict": {
      "number": "one"
    },
    "intent": "Star the top one most starred repos in Gitlab",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/users/byteblaze/starred",
          "locator": "",
          "required_contents": {
            "must_include": [
              "AndroidSlidingUpPanel"
            ]
          }
        }
      ]
    },
    "intent_template_id": 354,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 532,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Draft a refund message via their \"contact us\" form for the {{product}} I bought {{time}}. It broke after three days of use. The shop requires the order id, the reason and the amount to refund in the message. Don't submit yet",
    "instantiation_dict": {
      "product": "PS3 remote controller",
      "time": "early 2023"
    },
    "intent": "Draft a refund message via their \"contact us\" form for the PS3 remote controller I bought early 2023. It broke after three days of use. The shop requires the order id, the reason and the amount to refund in the message. Don't submit yet",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('[title=\"What’s on your mind?\"]').value",
          "required_contents": {
            "must_include": [
              "refund",
              "it broke after three days of use",
              "000000180",
              "1.63"
            ]
          }
        }
      ]
    },
    "intent_template_id": 154,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 538,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Modify the address of order #{{order_id}} to {{address}}",
    "instantiation_dict": {
      "order_id": "299",
      "address": "456 Oak Avenue, Apartment 5B, New York, NY, 10001"
    },
    "intent": "Modify the address of order #299 to 456 Oak Avenue, Apartment 5B, New York, NY, 10001",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/sales/order/view/order_id/299",
          "locator": "",
          "required_contents": {
            "must_include": [
              "456 Oak Avenue",
              "Apartment 5B",
              "New York",
              "10001"
            ]
          }
        }
      ]
    },
    "intent_template_id": 240,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 545,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Update the description of {{product}} to highlight the real user positive reviews by quoting the comments",
    "instantiation_dict": {
      "product": "Radiant Tee"
    },
    "intent": "Update the description of Radiant Tee to highlight the real user positive reviews by quoting the comments",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/../radiant-tee.html",
          "locator": "document.querySelector('.data.item.content').outerText + (document.querySelector('.product.attribute.overview [itemprop=\"description\"]')?.outerText || '')",
          "required_contents": {
            "must_include": [
              "What I rally love here is that it does the job of keeping me cool and dry",
              "I'm a big guy and sweat A LOT",
              "Even after a day of gulf, I'm still dry and comfortable",
              "What a versatile shirt",
              "Not only does it feel very soft compared to my old worn out polos, but it also does the job promised",
              "I like going out after my game for drinks so I look good then too and don't need to change into something fresh"
            ]
          }
        }
      ]
    },
    "intent_template_id": 251,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 572,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "I recently moved, my address is {{address}}, update my information on OneStopShopping accordingly",
    "instantiation_dict": {
      "address": "654 Aspen Road, House #3, Boston, MA, 02110"
    },
    "intent": "I recently moved, my address is 654 Aspen Road, House #3, Boston, MA, 02110, update my information on OneStopShopping accordingly",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/customer/address",
          "locator": "document.querySelector(\".box.box-address-billing > .box-content\").outerText",
          "required_contents": {
            "must_include": [
              "654 Aspen Road",
              "House #3",
              "Boston, Massachusetts, 02110"
            ]
          }
        },
        {
          "url": "__SHOPPING__/customer/address",
          "locator": "document.querySelector(\".box.box-address-shipping > .box-content\").outerText",
          "required_contents": {
            "must_include": [
              "654 Aspen Road",
              "House #3",
              "Boston, Massachusetts, 02110"
            ]
          }
        }
      ]
    },
    "intent_template_id": 165,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 574,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "I recently moved, my address is {{address}}, update my information on OneStopShopping accordingly",
    "instantiation_dict": {
      "address": "111 Magnolia Path, Atlanta, GA, 30303"
    },
    "intent": "I recently moved, my address is 111 Magnolia Path, Atlanta, GA, 30303, update my information on OneStopShopping accordingly",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING__/customer/address",
          "locator": "document.querySelector(\".box.box-address-shipping > .box-content\").outerText",
          "required_contents": {
            "must_include": [
              "111 Magnolia Path",
              "Atlanta, Georgia, 30303"
            ]
          }
        },
        {
          "url": "__SHOPPING__/customer/address",
          "locator": "document.querySelector(\".box.box-address-billing > .box-content\").outerText",
          "required_contents": {
            "must_include": [
              "111 Magnolia Path",
              "Atlanta, Georgia, 30303"
            ]
          }
        }
      ]
    },
    "intent_template_id": 165,
    "API-solvable": true,
    "API_calls_required": 2,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 582,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Create a new forum named {{name}}, with a description of {{description}}, and include {{sidebar_list}} in the sidebar?",
    "instantiation_dict": {
      "name": "Cyberpunk",
      "description": "Welcome to the future",
      "sidebar_list": [
        "Games",
        "Books",
        "Movies",
        "Future"
      ]
    },
    "intent": "Create a new forum named Cyberpunk, with a description of Welcome to the future, and include ['Games', 'Books', 'Movies', 'Future'] in the sidebar?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__REDDIT__/f/Cyberpunk/edit",
          "locator": "document.querySelector(\"#forum_description\").value",
          "required_contents": {
            "must_include": [
              "Welcome to the future"
            ]
          }
        },
        {
          "url": "__REDDIT__/f/Cyberpunk/edit",
          "locator": "document.querySelector(\"#forum_sidebar\").value",
          "required_contents": {
            "must_include": [
              "Games",
              "Books",
              "Movies",
              "Future"
            ]
          }
        }
      ]
    },
    "intent_template_id": 7,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 584,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Create a new forum named {{name}}, with a description of {{description}}, and include {{sidebar_list}} in the sidebar?",
    "instantiation_dict": {
      "name": "Karaoke",
      "description": "Place for Karaoke lovers",
      "sidebar_list": [
        "devices",
        "setup"
      ]
    },
    "intent": "Create a new forum named Karaoke, with a description of Place for Karaoke lovers, and include ['devices', 'setup'] in the sidebar?",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__REDDIT__/f/Karaoke/edit",
          "locator": "document.querySelector(\"#forum_description\").value",
          "required_contents": {
            "must_include": [
              "Place for Karaoke lovers"
            ]
          }
        },
        {
          "url": "__REDDIT__/f/Karaoke/edit",
          "locator": "document.querySelector(\"#forum_sidebar\").value",
          "required_contents": {
            "must_include": [
              "devices",
              "setup"
            ]
          }
        }
      ]
    },
    "intent_template_id": 7,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "Task Understanding"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 615,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__/f/pics",
    "geolocation": null,
    "intent_template": "Re-post the image of {{content}} in this page to {{subreddit}} subreddit and note \"from /f/pics\"",
    "instantiation_dict": {
      "content": "Bald Eagle",
      "subreddit": "earthporn"
    },
    "intent": "Re-post the image of Bald Eagle in this page to earthporn subreddit and note \"from /f/pics\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/earthporn",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "from /f/pics"
            ]
          }
        },
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "[...document.querySelector('.submission__inner').querySelectorAll('[href],[src]')].map(elem => elem.getAttribute('href') || elem.getAttribute('src')).join(' ')",
          "required_contents": {
            "must_include": [
              "b02113033af32feae9ff147dbbe3764039368d67d193885bd04e65c2e6beea9c.jpg"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 11,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 617,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__/f/pics",
    "geolocation": null,
    "intent_template": "Re-post the image of {{content}} in this page to {{subreddit}} subreddit and note \"from /f/pics\"",
    "instantiation_dict": {
      "content": "Firework",
      "subreddit": "earthporn"
    },
    "intent": "Re-post the image of Firework in this page to earthporn subreddit and note \"from /f/pics\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/earthporn",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "from /f/pics"
            ]
          }
        },
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "[...document.querySelector('.submission__inner').querySelectorAll('[href],[src]')].map(elem => elem.getAttribute('href') || elem.getAttribute('src')).join(' ')",
          "required_contents": {
            "must_include": [
              "92411be6af4e9ad5ccd3ccbaa01c10457bb00e704e99c58dd430de1a958307fd.jpg"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 11,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 627,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Create a discussion post about \"{{topic}}\" in a relevant subreddit and ask users for their opinions with the simple prompt, \"your opinion\"",
    "instantiation_dict": {
      "topic": "Harry Potter movie series"
    },
    "intent": "Create a discussion post about \"Harry Potter movie series\" in a relevant subreddit and ask users for their opinions with the simple prompt, \"your opinion\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/movies",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "your opinion",
              "Harry Potter movie series"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 13,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 634,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Ask for product recommendations for {{category}} within a budget of {{price}} in {{subreddit}}",
    "instantiation_dict": {
      "category": "used iphone",
      "price": "$1000",
      "subreddit": "r/iphone"
    },
    "intent": "Ask for product recommendations for used iphone within a budget of $1000 in r/iphone",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/iphone",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "1000",
              "used iphone"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 15,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 643,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Post a notice on a virtual meetup for {{interest}} enthusiasts on {{date}} in the {{subreddit}} subreddit",
    "instantiation_dict": {
      "interest": "racing cars",
      "date": "Oct 21st",
      "subreddit": "nyc"
    },
    "intent": "Post a notice on a virtual meetup for racing cars enthusiasts on Oct 21st in the nyc subreddit",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/nyc",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "racing cars",
              "Oct 21st",
              "virtual meetup"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 16,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 648,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Post in {{subreddit}} forum about what could large language models help the corresponding field.",
    "instantiation_dict": {
      "subreddit": "dataisbeautiful"
    },
    "intent": "Post in dataisbeautiful forum about what could large language models help the corresponding field.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/dataisbeautiful",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "large language models",
              "help"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 19,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 651,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__/f/pittsburgh/45899/driving-in-pittsburgh-summed-up-by-one-traffic-sign",
    "geolocation": null,
    "intent_template": "Reply to {{position_description}} with my comment \"{{content_description}}\"",
    "instantiation_dict": {
      "position_description": "the post",
      "content_description": "Yeah, pittsburgh traffic, you know..."
    },
    "intent": "Reply to the post with my comment \"Yeah, pittsburgh traffic, you know...\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/pittsburgh/45899/driving-in-pittsburgh-summed-up-by-one-traffic-sign",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('.comment__body').outerText",
          "required_contents": {
            "exact_match": "Yeah, pittsburgh traffic, you know..."
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 23,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 660,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Create an issue in {{repo}} repo with title \"{{issue}}\". Assign the issue to {{account}}. Set due date to be {{due}}",
    "instantiation_dict": {
      "repo": "dotfiles",
      "issue": "add support for oh-my-zsh",
      "account": "Abishek",
      "due": "July 18 2033"
    },
    "intent": "Create an issue in dotfiles repo with title \"add support for oh-my-zsh\". Assign the issue to Abishek. Set due date to be July 18 2033",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/byteblaze/dotfiles/-/issues",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('[data-qa-selector=\"title_content\"]').outerText",
          "required_contents": {
            "exact_match": "add support for oh-my-zsh"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[data-testid=\"sidebar-due-date\"').outerText",
          "required_contents": {
            "must_include": [
              "Jul 18, 2033"
            ]
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('.block.assignee').outerText",
          "required_contents": {
            "must_include": [
              "Abishek S"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 327,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 663,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Open an issue to {{issue}} in {{repo}}.",
    "instantiation_dict": {
      "repo": "metaseq",
      "issue": "ask their plan on supporting Llama and other llama family models"
    },
    "intent": "Open an issue to ask their plan on supporting Llama and other llama family models in metaseq.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/root/metaseq/-/issues",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('.detail-page-description').outerText",
          "required_contents": {
            "must_include": [
              "llama"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 328,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 667,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__/primer/design",
    "geolocation": null,
    "intent_template": "Submit a merge request for {{source_branch}} branch to be merged into {{target_branch}} branch, assign {{reviewer}} as the reviewer",
    "instantiation_dict": {
      "source_branch": "dialog-component",
      "target_branch": "bump-doctocat",
      "reviewer": "primer"
    },
    "intent": "Submit a merge request for dialog-component branch to be merged into bump-doctocat branch, assign primer as the reviewer",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__GITLAB__/primer/design/-/merge_requests",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelectorAll(\".detail-page-description > a.gl-font-monospace\")[1].outerText",
          "required_contents": {
            "exact_match": "bump-doctocat"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelectorAll(\".detail-page-description > a.gl-font-monospace\")[0].outerText",
          "required_contents": {
            "exact_match": "dialog-component"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('.block.reviewer').outerText",
          "required_contents": {
            "must_include": [
              "Primer"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 335,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping",
      "reddit"
    ],
    "task_id": 675,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Gather the titles of {{product}} reviews with {{rating}} rating from OneStopShop, and post them in the games subreddit under the title \"real user feedback on {{product}}\"",
    "instantiation_dict": {
      "product": "HORI 3D Surround Gaming Neckset",
      "rating": "2 stars and less"
    },
    "intent": "Gather the titles of HORI 3D Surround Gaming Neckset reviews with 2 stars and less rating from OneStopShop, and post them in the games subreddit under the title \"real user feedback on HORI 3D Surround Gaming Neckset\"",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/gaming",
      "program_html": [
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__title').outerText",
          "required_contents": {
            "exact_match": "real user feedback on HORI 3D Surround Gaming Neckset"
          }
        },
        {
          "url": "func:reddit_get_post_url('__last_url__')",
          "locator": "document.querySelector('.submission__body').outerText",
          "required_contents": {
            "must_include": [
              "Not worth it for PC users",
              "I really wanted to like this.",
              "I wish this was better..."
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 101,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 677,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Lookup orders that are {{status}}",
    "instantiation_dict": {
      "status": "processing"
    },
    "intent": "Lookup orders that are processing",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING_ADMIN__/sales/order/",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector(\"div.admin__data-grid-filters-current\").outerText",
          "required_contents": {
            "must_include": [
              "Processing"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 253,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 679,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Lookup orders that are {{status}}",
    "instantiation_dict": {
      "status": "completed"
    },
    "intent": "Lookup orders that are completed",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING_ADMIN__/sales/order/",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector(\"div.admin__data-grid-filters-current\").outerText",
          "required_contents": {
            "must_include": [
              "Completed"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 253,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit",
      "gitlab"
    ],
    "task_id": 681,
    "require_login": true,
    "storage_state": "./.auth/gitlab.reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Find a GitLab repository related to {{topic}} and make a Reddit post linking to it in a relevant subreddit",
    "instantiation_dict": {
      "topic": "gan implementation"
    },
    "intent": "Find a GitLab repository related to gan implementation and make a Reddit post linking to it in a relevant subreddit",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/machinelearning |OR| __REDDIT__/f/deeplearning |OR| __REDDIT__/f/technology",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('.submission__inner').outerText",
          "required_contents": {
            "must_include": [
              "gan implementation",
              "__GITLAB__/eriklindernoren/PyTorch-GAN"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 116,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit",
      "gitlab"
    ],
    "task_id": 686,
    "require_login": true,
    "storage_state": "./.auth/gitlab.reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Promote {{repo}} to subreddit {{subreddit}} with the description from the repo itself.",
    "instantiation_dict": {
      "repo": "auth0/angular-storage",
      "subreddit": "technology"
    },
    "intent": "Promote auth0/angular-storage to subreddit technology with the description from the repo itself.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/technology",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('.submission__inner').outerText + [...document.querySelector('.submission__inner').querySelectorAll('[href],[src]')].map(elem => elem.getAttribute('href') || elem.getAttribute('src')).join(' ')",
          "required_contents": {
            "must_include": [
              "A storage library for AngularJS done right",
              "__GITLAB__/auth0/angular-storage"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 117,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit",
      "gitlab"
    ],
    "task_id": 687,
    "require_login": true,
    "storage_state": "./.auth/gitlab.reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Promote {{repo}} to subreddit {{subreddit}} with the description from the repo itself.",
    "instantiation_dict": {
      "repo": "koush/AndroidAsync",
      "subreddit": "funny"
    },
    "intent": "Promote koush/AndroidAsync to subreddit funny with the description from the repo itself.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__REDDIT__/f/funny",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('.submission__inner').outerText + [...document.querySelector('.submission__inner').querySelectorAll('[href],[src]')].map(elem => elem.getAttribute('href') || elem.getAttribute('src')).join(' ')",
          "required_contents": {
            "must_include": [
              "Asynchronous socket, http(s) (client+server) and websocket library for android. Based on nio, not threads.",
              "__GITLAB__/koush/AndroidAsync"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 117,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping"
    ],
    "task_id": 692,
    "require_login": true,
    "storage_state": "./.auth/shopping_state.json",
    "start_url": "__SHOPPING__",
    "geolocation": null,
    "intent_template": "Draft an email to the shop owner via their contact us function for a coupon as {{reason}}",
    "instantiation_dict": {
      "reason": "I am a student"
    },
    "intent": "Draft an email to the shop owner via their contact us function for a coupon as I am a student",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING__/contact",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('[title=\"What’s on your mind?\"').value",
          "required_contents": {
            "must_include": [
              "coupon",
              "student"
            ]
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 163,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 702,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Draft a new marketing price rule for {{topic}} that offers {{rule}} for all customers",
    "instantiation_dict": {
      "topic": "Pride Month",
      "rule": "45% off on all products"
    },
    "intent": "Draft a new marketing price rule for Pride Month that offers 45% off on all products for all customers",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "url_match",
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "__SHOPPING_ADMIN__/sales_rule/promo_quote",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector(\"[name='name'\").value",
          "required_contents": {
            "must_include": [
              "Pride Month"
            ]
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"website_ids\"').selectedIndex",
          "required_contents": {
            "exact_match": "0"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"customer_group_ids\"').selectedIndex",
          "required_contents": {
            "exact_match": "1"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"simple_action\"').value",
          "prep_actions": [
            "document.querySelector('[data-index=\"actions\"]').querySelector('.admin__collapsible-title').click()"
          ],
          "required_contents": {
            "exact_match": "by_percent"
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"discount_amount\"').value",
          "prep_actions": [
            "document.querySelector('[data-index=\"actions\"]').querySelector('.admin__collapsible-title').click()"
          ],
          "required_contents": {
            "exact_match": "45"
          }
        }
      ],
      "url_note": "GOLD in PRED"
    },
    "intent_template_id": 258,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "reddit"
    ],
    "task_id": 723,
    "require_login": true,
    "storage_state": "./.auth/reddit_state.json",
    "start_url": "__REDDIT__",
    "geolocation": null,
    "intent_template": "Like all submissions created by {{user}} in subreddit {{subreddit}}",
    "instantiation_dict": {
      "user": "FTorrez81",
      "subreddit": "iphone13"
    },
    "intent": "Like all submissions created by FTorrez81 in subreddit iphone13",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "string_match"
      ],
      "reference_answers": {
        "fuzzy_match": "N/A"
      },
      "reference_url": "",
      "program_html": [],
      "reference_answer_raw_annotation": "N/A",
      "string_note": "FTorrez81 does not have any submissions in iphone13"
    },
    "intent_template_id": 25,
    "string_note": "FTorrez81 has no submissions in subreddit iphone13",
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": true,
    "error_type": ""
  },
  {
    "sites": [
      "wikipedia",
      "map"
    ],
    "task_id": 740,
    "require_login": true,
    "storage_state": null,
    "start_url": "__MAP__",
    "geolocation": null,
    "intent_template": "Show me the way from {{location}} to the home stadium of {{sport_team}} {{time}}",
    "instantiation_dict": {
      "location": "Carnegie Mellon University",
      "sport_team": "NYC NBA team",
      "time": ""
    },
    "intent": "Show me the way from Carnegie Mellon University to the home stadium of NYC NBA team ",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"route_from\"').value",
          "required_contents": {
            "must_include": [
              "Carnegie Mellon University",
              "Pittsburgh"
            ]
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector('[name=\"route_to\"').value",
          "required_contents": {
            "must_include": [
              "Madison Square Garden",
              "Pennsylvania Plaza",
              "Manhattan",
              "New York"
            ]
          }
        },
        {
          "url": "last",
          "locator": "document.querySelector(\"div#content select.routing_engines\").selectedIndex",
          "required_contents": {
            "exact_match": "1"
          }
        }
      ]
    },
    "intent_template_id": 94,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 749,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Start a private project {{project_name}} with {{template}} template and add {{account_list}} as members",
    "instantiation_dict": {
      "project_name": "project_site",
      "template": "NodeJS",
      "account_list": "primer, convexegg, vinta"
    },
    "intent": "Start a private project project_site with NodeJS template and add primer, convexegg, vinta as members",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/byteblaze/project_site",
          "locator": "document.querySelector('.visibility-icon').getAttribute('title')",
          "required_contents": {
            "must_include": [
              "Private"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/project_site/-/commits",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Initialized from 'NodeJS Express' project template"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/project_site/-/project_members",
          "locator": "",
          "required_contents": {
            "must_include": [
              "@primer",
              "@convexegg",
              "@vinta"
            ]
          }
        }
      ]
    },
    "intent_template_id": 2100,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 752,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "Create a private {{template}} repository called \"{{project_name}}\" using the right template to speed up development.",
    "instantiation_dict": {
      "project_name": "web_agent",
      "template": "blank"
    },
    "intent": "Create a private blank repository called \"web_agent\" using the right template to speed up development.",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/byteblaze/web_agent",
          "locator": "document.querySelector('.visibility-icon').getAttribute('title')",
          "required_contents": {
            "must_include": [
              "Private"
            ]
          }
        },
        {
          "url": "__GITLAB__/byteblaze/web_agent/-/commits",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Initial commit"
            ]
          }
        }
      ]
    },
    "intent_template_id": 332,
    "API-solvable": true,
    "API_calls_required": 1,
    "correct": false,
    "error_type": "API Usage"
  },
  {
    "sites": [
      "shopping_admin"
    ],
    "task_id": 774,
    "require_login": true,
    "storage_state": "./.auth/shopping_admin_state.json",
    "start_url": "__SHOPPING_ADMIN__",
    "geolocation": null,
    "intent_template": "Delete all {{review_type}}",
    "instantiation_dict": {
      "review_type": "pending reviews with less than 4 stars"
    },
    "intent": "Delete all pending reviews with less than 4 stars",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__SHOPPING_ADMIN__/review/product/edit/id/351",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Rating isn't Available"
            ]
          }
        },
        {
          "url": "__SHOPPING_ADMIN__/review/product/edit/id/353",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Rating isn't Available"
            ]
          }
        },
        {
          "url": "__SHOPPING_ADMIN__/review/product/edit/id/349",
          "locator": "",
          "required_contents": {
            "must_include": [
              "Rating isn't Available"
            ]
          }
        }
      ]
    },
    "intent_template_id": 246,
    "API-solvable": false,
    "API_calls_required": 0,
    "correct": false,
    "error_type": "Unsolvable"
  },
  {
    "sites": [
      "gitlab"
    ],
    "task_id": 801,
    "require_login": true,
    "storage_state": "./.auth/gitlab_state.json",
    "start_url": "__GITLAB__",
    "geolocation": null,
    "intent_template": "create a new group \"{{name}}\" with members {{members}}",
    "instantiation_dict": {
      "name": "crew",
      "members": "ASWATFZLLC, patrickhlauke, westurner, linkmatrix"
    },
    "intent": "create a new group \"crew\" with members ASWATFZLLC, patrickhlauke, westurner, linkmatrix",
    "require_reset": false,
    "eval": {
      "eval_types": [
        "program_html"
      ],
      "reference_answers": null,
      "reference_url": "",
      "program_html": [
        {
          "url": "__GITLAB__/groups/crew/-/group_members",
          "locator": "",
          "required_contents": {
            "must_include": [
              "@ASWATFZLLC",
              "@patrickhlauke",
              "@westurner",
              "@linkmatrix"
            ]
          }
        }
      ]
    },
    "intent_template_id": 600,
    "API-solvable": true,
    "API_calls_required": 5,
    "correct": true,
    "error_type": ""
  }
]