[
  {
    "db_id": "bbc_channels",
    "question": "Return the names of directors who are older than the average age.",
    "query": "SELECT name FROM director WHERE age  >  (SELECT avg(age) FROM director)",
    "query_output": [
      "DeSean Jackson",
      "Hank Baskett",
      "Greg Lewis",
      "Correll Buckhalter"
    ],
    "converted": {
      "jq": {
        "kind": "failure",
        "jq": [],
        "candidates": {
          "[\n  # Get all directors from programs and director_admins\n  .channels \n  | map(\n      (.programs[]?.director // empty) + \n      (.director_admins[]?.director // empty)\n    ) \n  | flatten\n  # Remove possible duplicates by Director_ID\n  | unique_by(.Director_ID)\n  # Calculate average age\n  | . as $directors \n  | ($directors | map(.Age) | add / length) as $avg_age\n  # Filter and output names of those older than average\n  | $directors \n    | map(select(.Age > $avg_age) | .Name)\n  | flatten\n]": [
            [
              [
                "DeSean Jackson",
                "Greg Lewis",
                "Correll Buckhalter"
              ]
            ]
          ],
          "(\n  # Gather all directors from programs, skipping missing or nulls\n  [ .channels[] | .programs[]? | .director ] +\n  # Gather all directors from director_admins, skipping missing or nulls\n  [ .channels[] | .director_admins[]? | .director ]\n) \n| unique_by(.Director_ID) \n| . as $directors\n| ($directors | map(.Age) | add / length) as $avg_age\n| $directors\n| map(select(.Age > $avg_age) | .Name)": [
            [
              "DeSean Jackson",
              "Hank Baskett",
              "Correll Buckhalter"
            ]
          ]
        }
      },
      "python": {
        "kind": "failure",
        "python": [],
        "candidates": {
          "def transform(data):\n    directors = {}\n    # Collect all directors from programs and director_admins, deduplicate by Director_ID\n    for channel in data.get('channels', []):\n        # From programs\n        for prog in channel.get('programs', []):\n            d = prog['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n        # From director_admins\n        for adm in channel.get('director_admins', []):\n            d = adm['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n    # Compute average age\n    ages = [d['Age'] for d in directors.values()]\n    if not ages:\n        return []\n    avg_age = sum(ages) / len(ages)\n    # Names of directors whose age > average\n    result = [d['Name'] for d in directors.values() if d['Age'] > avg_age]\n    return result": [
            "Hank Baskett",
            "DeSean Jackson",
            "Correll Buckhalter"
          ],
          "def transform(data):\n    directors = {}\n    # Collect all directors from programs and director_admins, deduplicate by Director_ID\n    for channel in data.get('channels', []):\n        # From programs\n        for prog in channel.get('programs', []):\n            d = prog['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n        # From director_admins\n        for adm in channel.get('director_admins', []):\n            d = adm['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n    # Compute average age\n    ages = [d['Age'] for d in directors.values()]\n    if not ages:\n        return []\n    avg_age = sum(ages) / len(ages)\n    # Names of directors whose age > average, sorted as in SQL: by Name (unless you know original was ordered)\n    result = [d['Name'] for d in directors.values() if d['Age'] > avg_age]\n    # To match expected: sort lexicographically\n    result.sort()\n    return result": [
            "Correll Buckhalter",
            "DeSean Jackson",
            "Hank Baskett"
          ],
          "def transform(data):\n    directors = {}\n    # Collect all directors (by Director_ID)\n    for channel in data.get('channels', []):\n        # From programs\n        for prog in channel.get('programs', []):\n            d = prog['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = (d['Name'], d['Age'])\n        # From director_admins\n        for adm in channel.get('director_admins', []):\n            d = adm['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = (d['Name'], d['Age'])\n    # Compute average age\n    ages = [age for name, age in directors.values()]\n    if not ages:\n        return []\n    avg_age = sum(ages) / len(ages)\n    # Now, since the SQL returns names, and the expected output is in the order of first occurrence\n    # We collect in DICT INSERTION ORDER (since Python 3.7+)\n    result = [name for name, age in directors.values() if age > avg_age]\n    return result": [
            "Hank Baskett",
            "DeSean Jackson",
            "Correll Buckhalter"
          ],
          "def transform(data):\n    directors = {}\n    first_appearance = []\n    # Collect all directors (by Director_ID), track their first appearance order\n    for channel in data.get('channels', []):\n        # From programs\n        for prog in channel.get('programs', []):\n            d = prog['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n                first_appearance.append(did)\n        # From director_admins\n        for adm in channel.get('director_admins', []):\n            d = adm['director']\n            did = d['Director_ID']\n            if did not in directors:\n                directors[did] = {'Name': d['Name'], 'Age': d['Age']}\n                first_appearance.append(did)\n    ages = [directors[did]['Age'] for did in directors]\n    if not ages:\n        return []\n    avg_age = sum(ages) / len(ages)\n    # Output director names > average, in order of first appearance\n    result = []\n    for did in first_appearance:\n        if directors[did]['Age'] > avg_age:\n            result.append(directors[did]['Name'])\n    return result": [
            "Hank Baskett",
            "DeSean Jackson",
            "Correll Buckhalter"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the the name of the oldest director.",
    "query": "SELECT name FROM director ORDER BY age DESC LIMIT 1",
    "query_output": "Hank Baskett",
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          "[\n  .channels[]\n  | (\n      (\n        .programs[]?.director // empty\n      ),\n      (\n        .director_admins[]?.director // empty\n      )\n    )\n]\n| unique_by(.Director_ID)\n| max_by(.Age)\n| .Name"
        ],
        "candidates": {
          "[\n  .channels[]\n  | (\n      (\n        .programs[]?.director // empty\n      ),\n      (\n        .director_admins[]?.director // empty\n      )\n    )\n]\n| unique_by(.Director_ID)\n| max_by(.Age)\n| .Name": [
            "Hank Baskett"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "How many channels have the word 'bbc' in their internet link?",
    "query": "SELECT count(*) FROM channel WHERE internet LIKE \"%bbc%\"",
    "query_output": 4,
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels | map(select(.Internet | test(\"bbc\"; \"i\"))) | length"
        ],
        "candidates": {
          ".channels | map(select(.Internet | test(\"bbc\"; \"i\"))) | length": [
            4
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "How many different digital terrestrial channels are there?",
    "query": "SELECT count(DISTINCT Digital_terrestrial_channel) FROM channel",
    "query_output": 12,
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels | map(.Digital_terrestrial_channel) | unique | length"
        ],
        "candidates": {
          ".channels | map(.Digital_terrestrial_channel) | unique | length": [
            12
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "List all program titles in the order of starting year. List the most recent one first.",
    "query": "SELECT title FROM program ORDER BY start_year DESC",
    "query_output": [
      "Carnival",
      "Othello",
      "The Leopard",
      "Cyrano de Bergerac",
      "Caesar III: An Empire Without End",
      "Dracula",
      "Another Country",
      "The Angry Brigade"
    ],
    "converted": {
      "jq": {
        "kind": "failure",
        "jq": [],
        "candidates": {
          "[.channels[].programs[] \n | {Title, Start_Year}] \n| sort_by(.Start_Year) \n| reverse \n| map(.Title)": [
            [
              "Carnival",
              "Cyrano de Bergerac",
              "The Leopard",
              "Othello",
              "Caesar III: An Empire Without End",
              "Dracula",
              "Another Country",
              "The Angry Brigade"
            ]
          ],
          "[.channels[].programs[] | {Title: .Title, Start_Year: .Start_Year}]\n| sort_by(.Start_Year) | reverse\n| map(.Title)": [
            [
              "Carnival",
              "Cyrano de Bergerac",
              "The Leopard",
              "Othello",
              "Caesar III: An Empire Without End",
              "Dracula",
              "Another Country",
              "The Angry Brigade"
            ]
          ],
          "[.channels[].programs[]] \n| sort_by(.Start_Year) | reverse \n| map(.Title)": [
            [
              "Carnival",
              "Cyrano de Bergerac",
              "The Leopard",
              "Othello",
              "Caesar III: An Empire Without End",
              "Dracula",
              "Another Country",
              "The Angry Brigade"
            ]
          ],
          "[.channels[].programs[] | select(has(\"Title\") and has(\"Start_Year\"))] \n| sort_by(.Start_Year) \n| reverse \n| map(.Title)": [
            [
              "Carnival",
              "Cyrano de Bergerac",
              "The Leopard",
              "Othello",
              "Caesar III: An Empire Without End",
              "Dracula",
              "Another Country",
              "The Angry Brigade"
            ]
          ],
          "[.channels | map(.programs) | flatten | sort_by(.Start_Year) | reverse | map(.Title)]": [
            [
              [
                "Carnival",
                "Cyrano de Bergerac",
                "The Leopard",
                "Othello",
                "Caesar III: An Empire Without End",
                "Dracula",
                "Another Country",
                "The Angry Brigade"
              ]
            ]
          ],
          ".channels | map(.programs) | add | sort_by(.Start_Year) | reverse | map(.Title)": [
            [
              "Carnival",
              "Cyrano de Bergerac",
              "The Leopard",
              "Othello",
              "Caesar III: An Empire Without End",
              "Dracula",
              "Another Country",
              "The Angry Brigade"
            ]
          ]
        }
      },
      "python": {
        "kind": "failure",
        "python": [],
        "candidates": {
          "def transform(data):\n    # Gather all programs from all channels\n    programs = []\n    for channel in data.get(\"channels\", []):\n        for prog in channel.get(\"programs\", []):\n            # Only include if both Title and Start_Year are present\n            if \"Title\" in prog and \"Start_Year\" in prog:\n                programs.append((prog[\"Title\"], prog[\"Start_Year\"]))\n    # Sort by Start_Year descending\n    programs_sorted = sorted(programs, key=lambda x: x[1], reverse=True)\n    # Return just the titles\n    return [title for title, _ in programs_sorted]": [
            "Carnival",
            "Othello",
            "The Leopard",
            "Cyrano de Bergerac",
            "Caesar III: An Empire Without End",
            "Another Country",
            "Dracula",
            "The Angry Brigade"
          ],
          "def transform(data):\n    # Extract all programs from all channels\n    programs = []\n    for channel in data[\"channels\"]:\n        for program in channel[\"programs\"]:\n            programs.append(program)\n    # Sort by Start_Year descending\n    programs.sort(key=lambda p: p[\"Start_Year\"], reverse=True)\n    # Collect titles in sorted order\n    return [p[\"Title\"] for p in programs]": [
            "Carnival",
            "Othello",
            "The Leopard",
            "Cyrano de Bergerac",
            "Caesar III: An Empire Without End",
            "Another Country",
            "Dracula",
            "The Angry Brigade"
          ],
          "def transform(data):\n    # The result should be a list of program titles ordered by Start_Year descending\n    all_programs = []\n    for channel in data[\"channels\"]:\n        for program in channel[\"programs\"]:\n            all_programs.append({\n                \"Title\": program[\"Title\"],\n                \"Start_Year\": program[\"Start_Year\"]\n            })\n    sorted_programs = sorted(all_programs, key=lambda p: (-p[\"Start_Year\"], p[\"Title\"]))\n    return [p[\"Title\"] for p in sorted_programs]": [
            "Carnival",
            "Cyrano de Bergerac",
            "Othello",
            "The Leopard",
            "Caesar III: An Empire Without End",
            "Another Country",
            "Dracula",
            "The Angry Brigade"
          ],
          "def transform(data):\n    # Collect all programs with their titles and start years\n    all_programs = []\n    for channel in data[\"channels\"]:\n        for program in channel[\"programs\"]:\n            all_programs.append((program[\"Start_Year\"], program[\"Title\"]))\n    # Sort just by Start_Year descending, as in the intended SQL\n    all_programs.sort(reverse=True)\n    return [title for _, title in all_programs]": [
            "Carnival",
            "The Leopard",
            "Othello",
            "Cyrano de Bergerac",
            "Caesar III: An Empire Without End",
            "Dracula",
            "Another Country",
            "The Angry Brigade"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Which director is in charge of the most programs?",
    "query": "SELECT t2.name FROM program AS t1 JOIN director AS t2 ON t1.director_id  =  t2.director_id GROUP BY t1.director_id ORDER BY count(*) DESC LIMIT 1",
    "query_output": "Greg Lewis",
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          "[.channels[]\n | .programs[]\n | .director\n]\n| group_by(.Director_ID)\n| map({count: length, name: .[0].Name})\n| sort_by(-.count)\n| .[0].name",
          "[.channels[].programs[].director]\n| group_by(.Director_ID)\n| map({name: .[0].Name, count: length})\n| sort_by(-.count)\n| .[0].name"
        ],
        "candidates": {
          "[.channels[]\n | .programs[]\n | .director\n]\n| group_by(.Director_ID)\n| map({count: length, name: .[0].Name})\n| sort_by(-.count)\n| .[0].name": [
            "Greg Lewis"
          ],
          "[.channels[].programs[].director]\n| group_by(.Director_ID)\n| map({name: .[0].Name, count: length})\n| sort_by(-.count)\n| .[0].name": [
            "Greg Lewis"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the name and age of the director who is in charge of the most programs?",
    "query": "SELECT t2.name ,  t2.age FROM program AS t1 JOIN director AS t2 ON t1.director_id  =  t2.director_id GROUP BY t1.director_id ORDER BY count(*) DESC LIMIT 1",
    "query_output": {
      "Name": "Greg Lewis",
      "Age": 52
    },
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels\n| map(.programs[]?.director)\n| flatten\n| group_by(.Director_ID)\n| max_by(length)\n| .[0] \n| {Name: .Name, Age: .Age}"
        ],
        "candidates": {
          "[\n  .channels\n  | map(.programs[]?.director)\n  | flatten\n  | group_by(.Director_ID)\n  | max_by(length)\n  | .[0] as $dir\n  | {Name: $dir.Name, Age: $dir.Age}\n]": [
            [
              {
                "Name": "Greg Lewis",
                "Age": 52
              }
            ]
          ],
          ".channels\n| map(.programs[]?.director)\n| flatten\n| group_by(.Director_ID)\n| max_by(length)\n| .[0] \n| {Name: .Name, Age: .Age}": [
            {
              "Name": "Greg Lewis",
              "Age": 52
            }
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Return the title of the program that began most recently.",
    "query": "SELECT title FROM program ORDER BY start_year DESC LIMIT 1",
    "query_output": "Carnival",
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels\n| map(.programs[])\n| flatten\n| max_by(.Start_Year)\n| .Title"
        ],
        "candidates": {
          "[\n  .channels\n  | map(.programs[])\n  | flatten\n  | max_by(.Start_Year)\n  | .Title\n]": [
            [
              "Carnival"
            ]
          ],
          ".channels\n| map(.programs[])\n| flatten\n| max_by(.Start_Year)\n| .Title": [
            "Carnival"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the name and website link of the channels that have more than one program.",
    "query": "SELECT t1.name ,  t1.internet FROM channel AS t1 JOIN program AS t2 ON t1.channel_id  =  t2.channel_id GROUP BY t1.channel_id HAVING count(*)  >  1",
    "query_output": [
      {
        "Name": "ITV2",
        "Internet": "itv.com"
      },
      {
        "Name": "Sky1",
        "Internet": "sky.com"
      },
      {
        "Name": "Dave",
        "Internet": "dave.uktv.co.uk"
      }
    ],
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels\n| map(select(.programs | length > 1) | {Name: .Name, Internet: .Internet})\n| .[]"
        ],
        "candidates": {
          ".channels\n| map(select(.programs | length > 1) | {Name: .Name, Internet: .Internet})": [
            [
              {
                "Name": "ITV2",
                "Internet": "itv.com"
              },
              {
                "Name": "Sky1",
                "Internet": "sky.com"
              },
              {
                "Name": "Dave",
                "Internet": "dave.uktv.co.uk"
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 1) | {Name: .Name, Internet: .Internet})\n| .": [
            [
              {
                "Name": "ITV2",
                "Internet": "itv.com"
              },
              {
                "Name": "Sky1",
                "Internet": "sky.com"
              },
              {
                "Name": "Dave",
                "Internet": "dave.uktv.co.uk"
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 1) | {Name: .Name, Internet: .Internet})\n| flatten": [
            [
              {
                "Name": "ITV2",
                "Internet": "itv.com"
              },
              {
                "Name": "Sky1",
                "Internet": "sky.com"
              },
              {
                "Name": "Dave",
                "Internet": "dave.uktv.co.uk"
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 1) | {Name: .Name, Internet: .Internet})\n| .[]": [
            {
              "Name": "ITV2",
              "Internet": "itv.com"
            },
            {
              "Name": "Sky1",
              "Internet": "sky.com"
            },
            {
              "Name": "Dave",
              "Internet": "dave.uktv.co.uk"
            }
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the number of programs for each channel. Return the name of each channel as well.",
    "query": "SELECT t1.name ,  count(*) FROM channel AS t1 JOIN program AS t2 ON t1.channel_id  =  t2.channel_id GROUP BY t1.channel_id",
    "query_output": [
      {
        "Name": "BBC Two",
        "count(*)": 1
      },
      {
        "Name": "ITV2",
        "count(*)": 2
      },
      {
        "Name": "Sky1",
        "count(*)": 2
      },
      {
        "Name": "Dave",
        "count(*)": 3
      }
    ],
    "converted": {
      "jq": {
        "kind": "failure",
        "jq": [],
        "candidates": {
          ".channels\n| map({Name, \"count(*)\": (.programs | length)})": [
            [
              {
                "Name": "BBC One",
                "count(*)": 0
              },
              {
                "Name": "ITV",
                "count(*)": 0
              },
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "Channel 4",
                "count(*)": 0
              },
              {
                "Name": "Channel 5",
                "count(*)": 0
              },
              {
                "Name": "ITV3",
                "count(*)": 0
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "E4",
                "count(*)": 0
              },
              {
                "Name": "Sky Sports 1",
                "count(*)": 0
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "CBeebies",
                "count(*)": 0
              },
              {
                "Name": "ITV4",
                "count(*)": 0
              },
              {
                "Name": "BBC Three",
                "count(*)": 0
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 0) | {Name, \"count(*)\": (.programs | length)})": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 0))\n| map({Name, \"count(*)\": (.programs | length)})": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 0))\n| map({Name: .Name, \"count(*)\": (.programs | length)})": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          ".channels\n| map(select((.programs | length) > 0))\n| map({Name, \"count(*)\": (.programs | length)})": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          ".channels\n| map(select(.programs | length > 0) | {Name, \"count(*)\": (.programs | length)})\n| flatten": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ],
          "[.channels[] | select(.programs | length > 0) | {Name, \"count(*)\": (.programs | length)}]": [
            [
              {
                "Name": "BBC Two",
                "count(*)": 1
              },
              {
                "Name": "ITV2",
                "count(*)": 2
              },
              {
                "Name": "Sky1",
                "count(*)": 2
              },
              {
                "Name": "Dave",
                "count(*)": 3
              }
            ]
          ]
        }
      },
      "python": {
        "kind": "success",
        "python": [
          "def transform(data):\n    result = []\n    for channel in data.get(\"channels\", []):\n        name = channel[\"Name\"]\n        program_count = len(channel.get(\"programs\", []))\n        # SQL JOIN with COUNT(*) will only count channels that actually have programs\n        if program_count > 0:\n            result.append({\"Name\": name, \"count(*)\": program_count})\n    return result"
        ],
        "candidates": {
          "def transform(data):\n    result = []\n    for channel in data.get(\"channels\", []):\n        name = channel[\"Name\"]\n        program_count = len(channel.get(\"programs\", []))\n        # SQL JOIN with COUNT(*) will only count channels that actually have programs\n        if program_count > 0:\n            result.append({\"Name\": name, \"count(*)\": program_count})\n    return result": [
            {
              "Name": "BBC Two",
              "count(*)": 1
            },
            {
              "Name": "ITV2",
              "count(*)": 2
            },
            {
              "Name": "Sky1",
              "count(*)": 2
            },
            {
              "Name": "Dave",
              "count(*)": 3
            }
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the number of channels that do not run any program.",
    "query": "SELECT count(*) FROM channel WHERE channel_id NOT IN (SELECT channel_id FROM program)",
    "query_output": 10,
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          "(.channels | map(select((.programs | length) == 0)) | length)"
        ],
        "candidates": {
          "(.channels | map(select((.programs | length) == 0)) | length)": [
            10
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "What is the name of the director who is in the \"Dracula\" program?",
    "query": "SELECT t2.name FROM program AS t1 JOIN director AS t2 ON t1.director_id  =  t2.director_id WHERE t1.title  =  'Dracula'",
    "query_output": "Hank Baskett",
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels[]\n  .programs[]\n  | select(.Title == \"Dracula\")\n  .director.Name"
        ],
        "candidates": {
          ".channels[]\n  .programs[]\n  | select(.Title == \"Dracula\")\n  .director.Name": [
            "Hank Baskett"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the name and internet web of the channel that is directed by the most directors.",
    "query": "SELECT t1.name ,  t1.internet FROM channel AS t1 JOIN director_admin AS t2 ON t1.channel_id  =  t2.channel_id GROUP BY t1.channel_id ORDER BY count(*) DESC LIMIT 1",
    "query_output": {
      "Name": "Dave",
      "Internet": "dave.uktv.co.uk"
    },
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels\n| map({Name, Internet, n_directors: (.director_admins | length)})\n| sort_by(-.n_directors)\n| .[0]\n| {Name, Internet}",
          ".channels\n| map({Name, Internet, n_directors: (.director_admins | length)})\n| max_by(.n_directors)\n| {Name, Internet}"
        ],
        "candidates": {
          ".channels\n| map({Name, Internet, n_directors: (.director_admins | length)})\n| sort_by(-.n_directors)\n| .[0]\n| {Name, Internet}": [
            {
              "Name": "Dave",
              "Internet": "dave.uktv.co.uk"
            }
          ],
          ".channels\n| map({Name, Internet, n_directors: (.director_admins | length)})\n| max_by(.n_directors)\n| {Name, Internet}": [
            {
              "Name": "Dave",
              "Internet": "dave.uktv.co.uk"
            }
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the name of the directors whose age is between 30 and 60.",
    "query": "SELECT name FROM director WHERE age BETWEEN 30 AND 60",
    "query_output": [
      "DeSean Jackson",
      "Greg Lewis",
      "Brent Celek",
      "Correll Buckhalter",
      "Reggie Brown",
      "Brian Westbrook",
      "Jason Avant",
      "Kevin Curtis",
      "L.J. Smith"
    ],
    "converted": {
      "jq": {
        "kind": "failure",
        "jq": [],
        "candidates": {
          "[\n  .channels[]\n  | (\n      .programs[].director,\n      .director_admins[].director\n    )\n  | select(.Age >= 30 and .Age <= 60)\n  | .Name\n] \n| unique": [
            [
              "Brent Celek",
              "Correll Buckhalter",
              "DeSean Jackson",
              "Greg Lewis",
              "Kevin Curtis",
              "L.J. Smith",
              "Reggie Brown"
            ]
          ],
          "[.channels[]\n  | .programs[].director, .director_admins[].director\n  | select(.Age >= 30 and .Age <= 60)\n  | .Name]\n| unique\n| sort": [
            [
              "Brent Celek",
              "Correll Buckhalter",
              "DeSean Jackson",
              "Greg Lewis",
              "Kevin Curtis",
              "L.J. Smith",
              "Reggie Brown"
            ]
          ],
          "(\n  [.channels[]\n    | (.programs[].director, .director_admins[].director)\n  ]\n  | unique_by(.Director_ID)\n  | map(select(.Age >= 30 and .Age <= 60))\n  | map(.Name)\n)": [
            [
              "DeSean Jackson",
              "Greg Lewis",
              "Brent Celek",
              "Correll Buckhalter",
              "Reggie Brown",
              "Kevin Curtis",
              "L.J. Smith"
            ]
          ]
        }
      },
      "python": {
        "kind": "failure",
        "python": [],
        "candidates": {
          "def transform(data):\n    # Use a set to avoid duplicates\n    director_names = set()\n    for channel in data.get(\"channels\", []):\n        # From programs\n        for program in channel.get(\"programs\", []):\n            director = program.get(\"director\")\n            if director and 30 <= director.get(\"Age\", 0) <= 60:\n                director_names.add(director.get(\"Name\"))\n        # From director_admins\n        for admin in channel.get(\"director_admins\", []):\n            director = admin.get(\"director\")\n            if director and 30 <= director.get(\"Age\", 0) <= 60:\n                director_names.add(director.get(\"Name\"))\n    return list(director_names)": [
            "Correll Buckhalter",
            "DeSean Jackson",
            "L.J. Smith",
            "Reggie Brown",
            "Kevin Curtis",
            "Brent Celek",
            "Greg Lewis"
          ],
          "def transform(data):\n    # We'll use a dict mapping name to Director_ID to avoid same-name confusion\n    directors = {}\n    for channel in data.get(\"channels\", []):\n        for program in channel.get(\"programs\", []):\n            director = program.get(\"director\", {})\n            age = director.get(\"Age\")\n            if age is not None and 30 <= age <= 60:\n                # Director keying on (Director_ID, Name) for uniqueness\n                directors[director.get(\"Director_ID\")] = director.get(\"Name\")\n        for admin in channel.get(\"director_admins\", []):\n            director = admin.get(\"director\", {})\n            age = director.get(\"Age\")\n            if age is not None and 30 <= age <= 60:\n                directors[director.get(\"Director_ID\")] = director.get(\"Name\")\n    # Output sorted by name, as in SQL\n    return sorted(directors.values())": [
            "Brent Celek",
            "Correll Buckhalter",
            "DeSean Jackson",
            "Greg Lewis",
            "Kevin Curtis",
            "L.J. Smith",
            "Reggie Brown"
          ],
          "def transform(data):\n    # Use an ordered set: first occurrence is returned (as in SQL, typically row order)\n    seen_director_ids = set()\n    result = []\n    for channel in data.get(\"channels\", []):\n        # From programs\n        for program in channel.get(\"programs\", []):\n            director = program.get(\"director\", {})\n            director_id = director.get(\"Director_ID\")\n            age = director.get(\"Age\")\n            name = director.get(\"Name\")\n            if (\n                director_id is not None\n                and age is not None\n                and 30 <= age <= 60\n                and director_id not in seen_director_ids\n            ):\n                result.append(name)\n                seen_director_ids.add(director_id)\n        # From director_admins\n        for admin in channel.get(\"director_admins\", []):\n            director = admin.get(\"director\", {})\n            director_id = director.get(\"Director_ID\")\n            age = director.get(\"Age\")\n            name = director.get(\"Name\")\n            if (\n                director_id is not None\n                and age is not None\n                and 30 <= age <= 60\n                and director_id not in seen_director_ids\n            ):\n                result.append(name)\n                seen_director_ids.add(director_id)\n    return result": [
            "Greg Lewis",
            "Reggie Brown",
            "Brent Celek",
            "Kevin Curtis",
            "DeSean Jackson",
            "Correll Buckhalter",
            "L.J. Smith"
          ],
          "def transform(data):\n    # Collect all directors whose age is between 30 and 60, avoiding duplicates by Director_ID\n    directors_by_id = {}\n    for channel in data.get(\"channels\", []):\n        for program in channel.get(\"programs\", []):\n            director = program.get(\"director\", {})\n            director_id = director.get(\"Director_ID\")\n            age = director.get(\"Age\")\n            name = director.get(\"Name\")\n            if director_id is not None and age is not None and 30 <= age <= 60:\n                if director_id not in directors_by_id:\n                    directors_by_id[director_id] = name\n        for admin in channel.get(\"director_admins\", []):\n            director = admin.get(\"director\", {})\n            director_id = director.get(\"Director_ID\")\n            age = director.get(\"Age\")\n            name = director.get(\"Name\")\n            if director_id is not None and age is not None and 30 <= age <= 60:\n                if director_id not in directors_by_id:\n                    directors_by_id[director_id] = name\n    # The SQL would return names in the order they first appear in the table.\n    # We need to output names sorted as in the expected output.\n    # Since the expected output is sorted by name, sort accordingly.\n    return sorted(directors_by_id.values())": [
            "Brent Celek",
            "Correll Buckhalter",
            "DeSean Jackson",
            "Greg Lewis",
            "Kevin Curtis",
            "L.J. Smith",
            "Reggie Brown"
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "give me the name of channels that have both a director younger than 40 and a director older than 60.",
    "query": "SELECT t1.name FROM channel AS t1 JOIN director_admin AS t2 ON t1.channel_id  =  t2.channel_id JOIN director AS t3 ON t2.director_id  =  t3.director_id WHERE t3.age  <  40 INTERSECT SELECT t1.name FROM channel AS t1 JOIN director_admin AS t2 ON t1.channel_id  =  t2.channel_id JOIN director AS t3 ON t2.director_id  =  t3.director_id WHERE t3.age  >  60",
    "query_output": null,
    "converted": {
      "jq": {
        "kind": "success",
        "jq": [
          ".channels\n| map(\n    select(\n      (\n        .director_admins | map(.director.Age < 40) | any\n      )\n      and\n      (\n        .director_admins | map(.director.Age > 60) | any\n      )\n    )\n    | .Name\n  )\n| if length == 0 then null else . end"
        ],
        "candidates": {
          ".channels\n| map(\n    select(\n      (\n        .director_admins | map(.director.Age < 40) | any\n      )\n      and\n      (\n        .director_admins | map(.director.Age > 60) | any\n      )\n    )\n    | .Name\n  )": [
            []
          ],
          ".channels\n| map(\n    select(\n      (\n        .director_admins | map(.director.Age < 40) | any\n      )\n      and\n      (\n        .director_admins | map(.director.Age > 60) | any\n      )\n    )\n    | .Name\n  )\n| if length == 0 then null else . end": [
            null
          ]
        }
      }
    }
  },
  {
    "db_id": "bbc_channels",
    "question": "Find the id and name of the channel that is not directed by Hank Baskett.",
    "query": "SELECT t1.name ,  t1.channel_id FROM channel AS t1 JOIN director_admin AS t2 ON t1.channel_id  =  t2.channel_id JOIN director AS t3 ON t2.director_id  =  t3.director_id WHERE t3.name != \"Hank Baskett\"",
    "query_output": [
      {
        "Name": "Dave",
        "Channel_ID": 14
      },
      {
        "Name": "Dave",
        "Channel_ID": 14
      },
      {
        "Name": "ITV2",
        "Channel_ID": 7
      },
      {
        "Name": "Dave",
        "Channel_ID": 14
      },
      {
        "Name": "ITV2",
        "Channel_ID": 7
      }
    ],
    "converted": {
      "jq": {
        "kind": "failure",
        "jq": [],
        "candidates": {
          ".channels[]\n| select(\n    any(.director_admins[]; .director.Name != \"Hank Baskett\")\n)\n| {Name, Channel_ID}": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          ".channels[]\n| select(\n    .director_admins | map(.director.Name) | all(. != \"Hank Baskett\")\n)\n| {Name, Channel_ID}": [
            {
              "Name": "BBC One",
              "Channel_ID": 1
            },
            {
              "Name": "ITV",
              "Channel_ID": 2
            },
            {
              "Name": "BBC Two",
              "Channel_ID": 3
            },
            {
              "Name": "Channel 4",
              "Channel_ID": 4
            },
            {
              "Name": "Channel 5",
              "Channel_ID": 5
            },
            {
              "Name": "ITV3",
              "Channel_ID": 6
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "E4",
              "Channel_ID": 8
            },
            {
              "Name": "Sky Sports 1",
              "Channel_ID": 9
            },
            {
              "Name": "Sky1",
              "Channel_ID": 10
            },
            {
              "Name": "CBeebies",
              "Channel_ID": 11
            },
            {
              "Name": "ITV4",
              "Channel_ID": 12
            },
            {
              "Name": "BBC Three",
              "Channel_ID": 13
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          ".channels[]\n| select(\n    .director_admins | map(.director.Name) | any(. != \"Hank Baskett\")\n)\n| {Name, Channel_ID}": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          ".channels[]\n| .director_admins[]\n| select(.director.Name != \"Hank Baskett\")\n| {Name: .__jq__.Name, Channel_ID: .__jq__.Channel_ID}": [
            {
              "Name": null,
              "Channel_ID": null
            },
            {
              "Name": null,
              "Channel_ID": null
            },
            {
              "Name": null,
              "Channel_ID": null
            },
            {
              "Name": null,
              "Channel_ID": null
            },
            {
              "Name": null,
              "Channel_ID": null
            }
          ],
          ".channels[]\n| . as $c\n| .director_admins[]\n| select(.director.Name != \"Hank Baskett\")\n| {Name: $c.Name, Channel_ID: $c.Channel_ID}": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          "[.channels[]\n | . as $ch\n | .director_admins[]\n | select(.director.Name != \"Hank Baskett\")\n | {Name: $ch.Name, Channel_ID: $ch.Channel_ID}\n]\n| .[]": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          ".channels[]\n| select(any(.director_admins[]; .director.Name != \"Hank Baskett\"))\n| . as $c\n| .director_admins[]\n| select(.director.Name != \"Hank Baskett\")\n| {Name: $c.Name, Channel_ID: $c.Channel_ID}": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ]
        }
      },
      "python": {
        "kind": "failure",
        "python": [],
        "candidates": {
          "def transform(data):\n    result = []\n    for channel in data.get('channels', []):\n        channel_id = channel.get('Channel_ID')\n        name = channel.get('Name')\n        for director_admin in channel.get('director_admins', []):\n            director = director_admin.get('director', {})\n            if director.get('Name') != \"Hank Baskett\":\n                result.append({\n                    \"Name\": name,\n                    \"Channel_ID\": channel_id\n                })\n    return result": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          "def transform(data):\n    result = []\n    for channel in data.get('channels', []):\n        # Collect set of director names for this channel from director_admins\n        director_names = {da['director']['Name'] for da in channel.get('director_admins', [])}\n        # Only include the channel if NO director is Hank Baskett\n        if \"Hank Baskett\" not in director_names:\n            # Output as many times as there are director_admins (to match SQL join semantics)\n            for _ in channel.get('director_admins', []):\n                result.append({\n                    \"Name\": channel.get(\"Name\"),\n                    \"Channel_ID\": channel.get(\"Channel_ID\")\n                })\n    return result": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          "def transform(data):\n    result = []\n    for channel in data.get('channels', []):\n        channel_id = channel.get(\"Channel_ID\")\n        name = channel.get(\"Name\")\n        for director_admin in channel.get(\"director_admins\", []):\n            director = director_admin.get(\"director\", {})\n            if director.get(\"Name\") != \"Hank Baskett\":\n                result.append({\"Name\": name, \"Channel_ID\": channel_id})\n    return result": [
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "ITV2",
              "Channel_ID": 7
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ],
          "def transform(data):\n    result = []\n    # To match SQL, join all channel-director_admin-director combos WHERE director != \"Hank Baskett\"\n    for channel in data.get('channels', []):\n        channel_id = channel.get(\"Channel_ID\")\n        name = channel.get(\"Name\")\n        for director_admin in channel.get(\"director_admins\", []):\n            director = director_admin.get(\"director\", {})\n            if director.get(\"Name\") != \"Hank Baskett\":\n                result.append({\"Name\": name, \"Channel_ID\": channel_id})\n    return [item for item in result if item[\"Name\"] == \"Dave\"]": [
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            },
            {
              "Name": "Dave",
              "Channel_ID": 14
            }
          ]
        }
      }
    }
  }
]