{
    "68": {
        "question_id": "68",
        "analyze": "GoldSQL: it contains an extra clause 'StatusType = 'Closed'",
        "question": "Which county reported the most number of school closure in the 1980s with school wonership code belonging to Youth Authority Facilities (CEA)?",
        "evidence": "Youth Authority Facilities (CEA) refers to SOC = 11; 1980s = years between 1980 and 1989",
        "SQL": "SELECT County FROM schools WHERE strftime('%Y', ClosedDate) BETWEEN '1980' AND '1989' AND StatusType = 'Closed' AND SOC = 11 GROUP BY County ORDER BY COUNT(School) DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T1.COUNTY FROM SCHOOLS AS T1 WHERE T1.CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' AND T1.SOC = 11 GROUP BY T1.COUNTY ORDER BY COUNT(*) DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = '11' AND CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' GROUP BY COUNTY ORDER BY COUNT(*) DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = '11' AND CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' GROUP BY COUNTY ORDER BY COUNT(*) DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = '11' AND STRFTIME('%Y', CLOSEDDATE) BETWEEN '1980' AND '1989' GROUP BY COUNTY ORDER BY COUNT(CDSCODE) DESC LIMIT 1",
        "alpha_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE STRFTIME('%Y', CLOSEDDATE) BETWEEN '1980' AND '1989' AND SOC = '11' GROUP BY COUNTY ORDER BY COUNT(*) DESC LIMIT 1",
        "gsr_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = 11 AND CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' GROUP BY COUNTY ORDER BY COUNT(*) DESC LIMIT 1;",
        "chess_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = 11 AND CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' GROUP BY COUNTY ORDER BY COUNT(COUNTY) DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = 11 AND CLOSEDDATE BETWEEN '1980-01-01' AND '1989-12-31' GROUP BY COUNTY ORDER BY COUNT(CLOSEDDATE) DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = 11 AND STATUSTYPE = 'CLOSED' AND STRFTIME('%Y', CLOSEDDATE) BETWEEN '1980' AND '1989' GROUP BY COUNTY ORDER BY COUNT(*) DESC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT COUNTY FROM SCHOOLS WHERE SOC = '11' AND STRFTIME('%Y', CLOSEDDATE) BETWEEN '1980' AND '1989' GROUP BY COUNTY ORDER BY COUNT(CDSCODE) DESC LIMIT 1"
    },
    "112": {
        "question_id": "112",
        "analyze": "GoldSQL: it is wrong, just finds distrcut females live",
        "question": "For the female client who was born in 1976/1/29, which district did she opened her account?",
        "evidence": "Female refers to gender = 'F'; A2 refers to district names",
        "SQL": "SELECT T1.A2 FROM district AS T1 INNER JOIN client AS T2 ON T1.district_id = T2.district_id WHERE T2.birth_date = '1976-01-29' AND T2.gender = 'F'",
        "csc-7b_sql.json.csv": "SELECT T3.A2 FROM CLIENT AS T1 JOIN DISP AS T2 ON T1.CLIENT_ID = T2.CLIENT_ID JOIN ACCOUNT AS T4 ON T2.ACCOUNT_ID = T4.ACCOUNT_ID JOIN DISTRICT AS T3 ON T4.DISTRICT_ID = T3.DISTRICT_ID WHERE T1.GENDER = 'F' AND T1.BIRTH_DATE = '1976-01-29'",
        "slm_sql.json.csv": "SELECT DISTRICT.A2 FROM CLIENT INNER JOIN ACCOUNT ON CLIENT.DISTRICT_ID = ACCOUNT.DISTRICT_ID INNER JOIN DISTRICT ON ACCOUNT.DISTRICT_ID = DISTRICT.DISTRICT_ID WHERE CLIENT.GENDER = 'F' AND CLIENT.BIRTH_DATE = '1976-01-29'",
        "csc-32b_sql.json.csv": "SELECT D.A2 FROM CLIENT C JOIN DISP DP ON C.CLIENT_ID = DP.CLIENT_ID JOIN ACCOUNT A ON DP.ACCOUNT_ID = A.ACCOUNT_ID JOIN DISTRICT D ON A.DISTRICT_ID = D.DISTRICT_ID WHERE C.GENDER = 'F' AND C.BIRTH_DATE = '1976-01-29'",
        "gena_submission_2_sql.json.csv": "SELECT T3.A2 FROM CLIENT AS T1 INNER JOIN DISP AS T2 ON T1.CLIENT_ID = T2.CLIENT_ID INNER JOIN ACCOUNT AS T4 ON T2.ACCOUNT_ID = T4.ACCOUNT_ID INNER JOIN DISTRICT AS T3 ON T4.DISTRICT_ID = T3.DISTRICT_ID WHERE T1.GENDER = 'F' AND T1.BIRTH_DATE = '1976-01-29'",
        "alpha_sql.json.csv": "SELECT DISTINCT T4.A2 FROM CLIENT AS T1 INNER JOIN DISP AS T2 ON T1.CLIENT_ID = T2.CLIENT_ID INNER JOIN ACCOUNT AS T3 ON T2.ACCOUNT_ID = T3.ACCOUNT_ID INNER JOIN DISTRICT AS T4 ON T3.DISTRICT_ID = T4.DISTRICT_ID WHERE T1.GENDER = 'F' AND T1.BIRTH_DATE = '1976-01-29'",
        "gsr_sql.json.csv": "SELECT DISTRICT.A2 FROM CLIENT JOIN DISP ON CLIENT.CLIENT_ID = DISP.CLIENT_ID JOIN ACCOUNT ON DISP.ACCOUNT_ID = ACCOUNT.ACCOUNT_ID JOIN DISTRICT ON ACCOUNT.DISTRICT_ID = DISTRICT.DISTRICT_ID WHERE CLIENT.GENDER = 'F' AND CLIENT.BIRTH_DATE = '1976-01-29';",
        "chess_sql.json.csv": "SELECT T4.A2 FROM CLIENT AS T1 INNER JOIN DISP AS T2 ON T1.CLIENT_ID = T2.CLIENT_ID INNER JOIN ACCOUNT AS T3 ON T2.ACCOUNT_ID = T3.ACCOUNT_ID INNER JOIN DISTRICT AS T4 ON T3.DISTRICT_ID = T4.DISTRICT_ID WHERE T1.GENDER = 'F' AND T1.BIRTH_DATE = '1976-01-29'",
        "rsl_sql.json.csv": "SELECT DISTRICT.A2 FROM CLIENT INNER JOIN DISP ON CLIENT.CLIENT_ID = DISP.CLIENT_ID INNER JOIN ACCOUNT ON DISP.ACCOUNT_ID = ACCOUNT.ACCOUNT_ID INNER JOIN DISTRICT ON ACCOUNT.DISTRICT_ID = DISTRICT.DISTRICT_ID WHERE CLIENT.GENDER = 'F' AND CLIENT.BIRTH_DATE = '1976-01-29'",
        "omni-32-majority_sql.json.csv": "SELECT DISTRICT.A2 FROM DISTRICT INNER JOIN ACCOUNT ON DISTRICT.DISTRICT_ID = ACCOUNT.DISTRICT_ID INNER JOIN CLIENT ON DISTRICT.DISTRICT_ID = CLIENT.DISTRICT_ID WHERE CLIENT.GENDER = 'F' AND CLIENT.BIRTH_DATE = '1976-01-29';",
        "gena_submission_1_sql.json.csv": "SELECT T3.A2 FROM CLIENT AS T1 INNER JOIN DISP AS T2 ON T1.CLIENT_ID = T2.CLIENT_ID INNER JOIN ACCOUNT AS T4 ON T2.ACCOUNT_ID = T4.ACCOUNT_ID INNER JOIN DISTRICT AS T3 ON T4.DISTRICT_ID = T3.DISTRICT_ID WHERE T1.GENDER = 'F' AND T1.BIRTH_DATE = '1976-01-29'"
    },
    "242": {
        "question_id": "242",
        "analyze": "GoldSQL: Uses an Implicite assumption on the lenght of atom_id",
        "question": "Among all the atoms from 21 to 25, list all the molecules that are carcinogenic.",
        "evidence": "atoms from 21 to 25 refers to SUBSTR(atom_id, 7, 2) between '21' and '25'; label = '+' mean molecules are carcinogenic",
        "SQL": "SELECT DISTINCT T2.molecule_id FROM atom AS T1 INNER JOIN molecule AS T2 ON T1.molecule_id = T2.molecule_id WHERE SUBSTR(T1.atom_id, -2) BETWEEN '21' AND '25' AND T2.label = '+'",
        "csc-7b_sql.json.csv": "SELECT T1.MOLECULE_ID FROM MOLECULE AS T1 INNER JOIN ATOM AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE SUBSTR(T2.ATOM_ID, 7, 2) BETWEEN '21' AND '25' AND T1.LABEL = '+'",
        "slm_sql.json.csv": "SELECT DISTINCT T2.MOLECULE_ID FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE SUBSTR(T1.ATOM_ID, 7, 2) BETWEEN '21' AND '25' AND T2.LABEL = '+'",
        "csc-32b_sql.json.csv": "SELECT DISTINCT A.MOLECULE_ID FROM ATOM A JOIN (SELECT MOLECULE_ID FROM MOLECULE WHERE LABEL = '+') M ON A.MOLECULE_ID = M.MOLECULE_ID WHERE SUBSTR(A.ATOM_ID, 7, 2) BETWEEN '21' AND '25' ORDER BY A.MOLECULE_ID",
        "gena_submission_2_sql.json.csv": "SELECT T1.MOLECULE_ID FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE CAST(SUBSTR(T1.ATOM_ID, 7, 2) AS INTEGER) BETWEEN 21 AND 25 AND T2.LABEL = '+'",
        "alpha_sql.json.csv": "SELECT DISTINCT MOLECULE.MOLECULE_ID FROM ATOM INNER JOIN MOLECULE ON ATOM.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE SUBSTRING(ATOM.ATOM_ID, 7, 2) BETWEEN '21' AND '25' AND MOLECULE.LABEL = '+'",
        "gsr_sql.json.csv": "SELECT DISTINCT M.MOLECULE_ID FROM ATOM A JOIN MOLECULE M ON A.MOLECULE_ID = M.MOLECULE_ID WHERE SUBSTR(A.ATOM_ID, 7, 2) BETWEEN '21' AND '25' AND M.LABEL = '+';",
        "chess_sql.json.csv": "SELECT DISTINCT T2.MOLECULE_ID FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.LABEL = '+' AND SUBSTR(T1.ATOM_ID, 7, 2) BETWEEN '21' AND '25'",
        "rsl_sql.json.csv": "SELECT DISTINCT MOLECULE.MOLECULE_ID FROM ATOM INNER JOIN MOLECULE ON ATOM.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE SUBSTR(ATOM.ATOM_ID, 7, 2) BETWEEN '21' AND '25' AND MOLECULE.LABEL = '+'",
        "omni-32-majority_sql.json.csv": "SELECT DISTINCT T1.MOLECULE_ID FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.LABEL = '+' AND CAST(SUBSTR(T1.ATOM_ID, 7, 2) AS INTEGER) BETWEEN 21 AND 25;",
        "gena_submission_1_sql.json.csv": "SELECT T2.MOLECULE_ID FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE CAST(SUBSTR(T1.ATOM_ID, 7, 2) AS INTEGER) BETWEEN 21 AND 25 AND T2.LABEL = '+'"
    },
    "273": {
        "question_id": "273",
        "analyze": "GoldSQL: COUNT(T1.element) count only non-NULL elements. We can have divition by 0 ",
        "question": "What is the percentage of element chlorine in carcinogenic molecules?",
        "evidence": "chlorine refers to element = 'cl'; label = '+' mean molecules are carcinogenic; percentage = DIVIDE(SUM(element = 'pb'); COUNT(molecule_id)) as percentage where label = '+'",
        "SQL": "SELECT CAST(COUNT( CASE WHEN T1.element = 'cl' THEN T1.element ELSE NULL END) AS REAL) * 100 / COUNT(T1.element) FROM atom AS T1 INNER JOIN molecule AS T2 ON T1.molecule_id = T2.molecule_id WHERE T2.label = '+'",
        "csc-7b_sql.json.csv": "SELECT (CAST(SUM(CASE WHEN ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100) / COUNT(ATOM_ID) AS PERCENTAGE FROM ATOM INNER JOIN MOLECULE ON ATOM.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE MOLECULE.LABEL = '+'",
        "slm_sql.json.csv": "SELECT CAST(COUNT(CASE WHEN ATOM.ELEMENT = 'CL' THEN 1 END) AS REAL) * 100.0 / COUNT(*) AS PERCENTAGE FROM MOLECULE INNER JOIN ATOM ON MOLECULE.MOLECULE_ID = ATOM.MOLECULE_ID WHERE MOLECULE.LABEL = '+'",
        "csc-32b_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T2.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(*) FROM MOLECULE AS T1 INNER JOIN ATOM AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T1.LABEL = '+'",
        "gena_submission_2_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T1.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(T1.MOLECULE_ID) FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.LABEL = '+'",
        "alpha_sql.json.csv": "SELECT CAST(SUM(CASE WHEN ATOM.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(ATOM.ATOM_ID) AS PERCENTAGE FROM MOLECULE INNER JOIN ATOM ON MOLECULE.MOLECULE_ID = ATOM.MOLECULE_ID WHERE MOLECULE.LABEL = '+'",
        "gsr_sql.json.csv": "SELECT (SUM(ELEMENT = 'CL') * 100.0 / COUNT(*)) AS PERCENTAGE FROM ATOM JOIN MOLECULE ON ATOM.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE MOLECULE.LABEL = '+';",
        "chess_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T1.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(T1.MOLECULE_ID) AS PERCENTAGE FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.LABEL = '+'",
        "rsl_sql.json.csv": "SELECT CAST(SUM(CASE WHEN ATOM.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(ATOM.ATOM_ID) AS PERCENTAGE FROM ATOM INNER JOIN MOLECULE ON ATOM.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE MOLECULE.LABEL = '+'",
        "omni-32-majority_sql.json.csv": "SELECT CAST(SUM(CASE WHEN A.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100.0 / COUNT(M.MOLECULE_ID) AS PERCENTAGE FROM MOLECULE M INNER JOIN ATOM A ON M.MOLECULE_ID = A.MOLECULE_ID WHERE M.LABEL = '+';",
        "gena_submission_1_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T1.ELEMENT = 'CL' THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(T1.MOLECULE_ID) FROM ATOM AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.LABEL = '+'"
    },
    "312": {
        "question_id": "312",
        "analyze": "GoldSQL: Performs additinal JOIN on atom",
        "question": "What is the carcinogenic label for bond TR001_2_4?",
        "evidence": "label = '+' mean molecules are carcinogenic",
        "SQL": "SELECT DISTINCT T2.label FROM atom AS T1 INNER JOIN molecule AS T2 ON T1.molecule_id = T2.molecule_id INNER JOIN bond AS T3 ON T2.molecule_id = T3.molecule_id WHERE T3.bond_id = 'TR001_2_4'",
        "csc-7b_sql.json.csv": "SELECT T2.LABEL FROM BOND AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T1.BOND_ID = 'TR001_2_4'",
        "slm_sql.json.csv": "SELECT MOLECULE.LABEL FROM BOND INNER JOIN MOLECULE ON BOND.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE BOND.BOND_ID = 'TR001_2_4'",
        "csc-32b_sql.json.csv": "SELECT M.LABEL FROM MOLECULE M JOIN BOND B ON M.MOLECULE_ID = B.MOLECULE_ID WHERE B.BOND_ID = 'TR001_2_4'",
        "gena_submission_2_sql.json.csv": "SELECT T2.LABEL FROM BOND AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T1.BOND_ID = 'TR001_2_4'",
        "alpha_sql.json.csv": "SELECT MOLECULE.LABEL FROM MOLECULE INNER JOIN BOND ON MOLECULE.MOLECULE_ID = BOND.MOLECULE_ID WHERE BOND.BOND_ID = 'TR001_2_4'",
        "gsr_sql.json.csv": "SELECT M.LABEL FROM BOND B JOIN MOLECULE M ON B.MOLECULE_ID = M.MOLECULE_ID WHERE B.BOND_ID = 'TR001_2_4';",
        "chess_sql.json.csv": "SELECT T2.LABEL FROM BOND AS T1 INNER JOIN MOLECULE AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T1.BOND_ID = 'TR001_2_4'",
        "rsl_sql.json.csv": "SELECT MOLECULE.LABEL FROM BOND INNER JOIN MOLECULE ON BOND.MOLECULE_ID = MOLECULE.MOLECULE_ID WHERE BOND.BOND_ID = 'TR001_2_4'",
        "omni-32-majority_sql.json.csv": "SELECT MOLECULE.LABEL FROM MOLECULE INNER JOIN BOND ON MOLECULE.MOLECULE_ID = BOND.MOLECULE_ID WHERE BOND.BOND_ID = 'TR001_2_4';",
        "gena_submission_1_sql.json.csv": "SELECT T1.LABEL FROM MOLECULE AS T1 INNER JOIN BOND AS T2 ON T1.MOLECULE_ID = T2.MOLECULE_ID WHERE T2.BOND_ID = 'TR001_2_4'"
    },
    "318": {
        "question_id": "318",
        "analyze": "GoldSQL: Perfoms addition JOIN operators (not sure why)",
        "question": "What is the molecule id of bond id TR001_1_7?",
        "evidence": "",
        "SQL": "SELECT DISTINCT T1.molecule_id FROM atom AS T1 INNER JOIN connected AS T2 ON T1.atom_id = T2.atom_id WHERE T2.bond_id = 'TR001_1_7'",
        "csc-7b_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "slm_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "csc-32b_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "gena_submission_2_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "alpha_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "gsr_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7';",
        "chess_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "rsl_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'",
        "omni-32-majority_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7';",
        "gena_submission_1_sql.json.csv": "SELECT MOLECULE_ID FROM BOND WHERE BOND_ID = 'TR001_1_7'"
    },
    "345": {
        "question_id": "345",
        "analyze": "Ambiguous question: it does not specify whether we want the status per card (seems to be) or all possible statuses across these cards (as in the Gold SQL).",
        "question": "For artifact type of cards that do not have multiple faces on the same card, state its legalities status for vintage play format.",
        "evidence": "Artifact type of cards refers to types = 'Artifact'; card does not have multiple faces on the same card refers to side is NULL'; vintage play format refers to format = 'vintage';",
        "SQL": "SELECT DISTINCT T2.status FROM cards AS T1 INNER JOIN legalities AS T2 ON T1.uuid = T2.uuid WHERE T1.type = 'Artifact' AND T2.format = 'vintage' AND T1.side IS NULL",
        "csc-7b_sql.json.csv": "SELECT T2.STATUS FROM CARDS AS T1 JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID WHERE T1.TYPES = 'ARTIFACT' AND T1.SIDE IS NULL AND T2.FORMAT = 'VINTAGE'",
        "slm_sql.json.csv": "SELECT LEGALITIES.STATUS FROM CARDS INNER JOIN LEGALITIES ON CARDS.UUID = LEGALITIES.UUID WHERE CARDS.TYPES = 'ARTIFACT' AND CARDS.SIDE IS NULL AND LEGALITIES.FORMAT = 'VINTAGE'",
        "csc-32b_sql.json.csv": "SELECT L.STATUS FROM CARDS C JOIN LEGALITIES L ON C.UUID = L.UUID WHERE C.TYPES = 'ARTIFACT' AND C.SIDE IS NULL AND L.FORMAT = 'VINTAGE'",
        "gena_submission_2_sql.json.csv": "SELECT T2.STATUS FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID WHERE T1.TYPES = 'ARTIFACT' AND T1.SIDE IS NULL AND T2.FORMAT = 'VINTAGE'",
        "alpha_sql.json.csv": "SELECT T2.STATUS FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID WHERE T1.TYPES = 'ARTIFACT' AND T1.SIDE IS NULL AND T2.FORMAT = 'VINTAGE'",
        "gsr_sql.json.csv": "SELECT L.STATUS FROM CARDS C JOIN LEGALITIES L ON C.UUID = L.UUID WHERE C.TYPES = 'ARTIFACT' AND C.SIDE IS NULL AND L.FORMAT = 'VINTAGE';",
        "chess_sql.json.csv": "SELECT T2.STATUS FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID WHERE T1.TYPES = 'ARTIFACT' AND T1.SIDE IS NULL AND T2.FORMAT = 'VINTAGE'",
        "rsl_sql.json.csv": "SELECT LEGALITIES.STATUS FROM CARDS INNER JOIN LEGALITIES ON CARDS.UUID = LEGALITIES.UUID WHERE CARDS.TYPES = 'ARTIFACT' AND CARDS.SIDE IS NULL AND LEGALITIES.FORMAT = 'VINTAGE'",
        "omni-32-majority_sql.json.csv": "SELECT LEGALITIES.STATUS FROM CARDS INNER JOIN LEGALITIES ON CARDS.UUID = LEGALITIES.UUID WHERE CARDS.TYPES = 'ARTIFACT' AND CARDS.SIDE IS NULL AND LEGALITIES.FORMAT = 'VINTAGE';",
        "gena_submission_1_sql.json.csv": "SELECT T2.STATUS FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID WHERE T1.TYPES = 'ARTIFACT' AND T1.SIDE IS NULL AND T2.FORMAT = 'VINTAGE'"
    },
    "365": {
        "question_id": "365",
        "analyze": "GoldSQL: Performs unnecessary filtering on FOREIGN_DATA ",
        "question": "What is the type of card \"Benalish Knight\"?",
        "evidence": "Benalish Knight' is the name of card;",
        "SQL": "SELECT DISTINCT T1.type FROM cards AS T1 INNER JOIN foreign_data AS T2 ON T1.uuid = T2.uuid WHERE T1.name = 'Benalish Knight'",
        "csc-7b_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "slm_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "csc-32b_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "gena_submission_2_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "alpha_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "gsr_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT';",
        "chess_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "rsl_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'",
        "omni-32-majority_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT';",
        "gena_submission_1_sql.json.csv": "SELECT TYPE FROM CARDS WHERE NAME = 'BENALISH KNIGHT'"
    },
    "475": {
        "question_id": "475",
        "analyze": "GoldSQL: SUM on empty rows return NULL. We need to return 0 as the question is 'How many'",
        "question": "How many cards in the set Coldsnap have a black border color?",
        "evidence": "card set Coldsnap refers to name = 'Coldsnap'; black border color refers to borderColor = 'black'",
        "SQL": "SELECT SUM(CASE WHEN T1.borderColor = 'black' THEN 1 ELSE 0 END) FROM cards AS T1 INNER JOIN sets AS T2 ON T2.code = T1.setCode WHERE T2.name = 'Coldsnap'",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T2.CODE = T1.SETCODE WHERE T2.NAME = 'COLDSNAP' AND T1.BORDERCOLOR = 'BLACK'",
        "slm_sql.json.csv": "SELECT COUNT(*) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'COLDSNAP' AND T1.BORDERCOLOR = 'BLACK'",
        "csc-32b_sql.json.csv": "SELECT COUNT(*) FROM SETS S JOIN CARDS C ON S.CODE = C.SETCODE WHERE S.NAME = 'COLDSNAP' AND C.BORDERCOLOR = 'BLACK'",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(*) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'COLDSNAP' AND T1.BORDERCOLOR = 'BLACK'",
        "alpha_sql.json.csv": "SELECT COUNT(CARDS.ID) FROM CARDS INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'COLDSNAP' AND CARDS.BORDERCOLOR = 'BLACK'",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM CARDS WHERE SETCODE = (SELECT CODE FROM SETS WHERE NAME = 'COLDSNAP') AND BORDERCOLOR = 'BLACK';",
        "chess_sql.json.csv": "SELECT COUNT(T1.ID) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'COLDSNAP' AND T1.BORDERCOLOR = 'BLACK'",
        "rsl_sql.json.csv": "SELECT COUNT(CARDS.ID) FROM CARDS INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'COLDSNAP' AND CARDS.BORDERCOLOR = 'BLACK'",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(CARDS.ID) FROM CARDS INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'COLDSNAP' AND CARDS.BORDERCOLOR = 'BLACK';",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(*) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'COLDSNAP' AND T1.BORDERCOLOR = 'BLACK'"
    },
    "504": {
        "question_id": "504",
        "analyze": "GoldSQL: does not account for non-unqiueness of setcode of for each name in SETs",
        "question": "How many cards are there in the set 'World Championship Decks 2004' with the converted mana cost as '3'.",
        "evidence": "the set 'World Championship Decks 2004' refers to name = 'World Championship Decks 2004'",
        "SQL": "SELECT COUNT(id) FROM cards WHERE setCode IN ( SELECT code FROM sets WHERE name = 'World Championship Decks 2004' ) AND convertedManaCost = 3",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM SETS AS T1 JOIN CARDS AS T2 ON T1.CODE = T2.SETCODE WHERE T1.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND T2.CONVERTEDMANACOST = 3",
        "slm_sql.json.csv": "SELECT COUNT(*) AS CARD_COUNT FROM CARDS INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND CARDS.CONVERTEDMANACOST = 3",
        "csc-32b_sql.json.csv": "SELECT COUNT(*) FROM SETS S JOIN CARDS C ON S.CODE = C.SETCODE WHERE S.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND C.CONVERTEDMANACOST = 3",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(*) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND T1.CONVERTEDMANACOST = 3",
        "alpha_sql.json.csv": "SELECT COUNT(*) FROM SETS INNER JOIN CARDS ON SETS.CODE = CARDS.SETCODE WHERE SETS.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND CARDS.CONVERTEDMANACOST = 3",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM CARDS JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND CARDS.CONVERTEDMANACOST = 3;",
        "chess_sql.json.csv": "SELECT COUNT(T2.ID) FROM SETS AS T1 INNER JOIN CARDS AS T2 ON T1.CODE = T2.SETCODE WHERE T1.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND T2.CONVERTEDMANACOST = 3",
        "rsl_sql.json.csv": "SELECT COUNT(CARDS.ID) FROM CARDS INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND CARDS.CONVERTEDMANACOST = 3",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(CARDS.ID) AS CARD_COUNT FROM SETS INNER JOIN CARDS ON SETS.CODE = CARDS.SETCODE WHERE SETS.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND CARDS.CONVERTEDMANACOST = 3;",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(T1.ID) FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T2.NAME = 'WORLD CHAMPIONSHIP DECKS 2004' AND T1.CONVERTEDMANACOST = 3"
    },
    "506": {
        "question_id": "506",
        "analyze": "GoldSQL: does not account for non-unqiueness of setcode of for each name in SETs",
        "question": "For all the set of cards that has Japanese translation, what is the percentage of them are only available in non-foil?",
        "evidence": "Japanese translation refers to language = 'Japanese'; in non-foil refers to isNonFoilOnly = 1; percentage of Japanese non foil in Japanese cards refers to DIVIDE(SUM(isNonFoilOnly = 1), SUM(language = 'Japanese'))*100",
        "SQL": "SELECT CAST(SUM(CASE WHEN isNonFoilOnly = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(id) FROM sets WHERE code IN ( SELECT setCode FROM set_translations WHERE language = 'Japanese' )",
        "csc-7b_sql.json.csv": "SELECT CAST(COUNT(CASE WHEN T1.ISNONFOILONLY = 1 THEN T1.ID ELSE NULL END) AS REAL) * 100 / COUNT(*) FROM SETS AS T1 JOIN SET_TRANSLATIONS AS T2 ON T1.CODE = T2.SETCODE WHERE T2.LANGUAGE = 'JAPANESE'",
        "slm_sql.json.csv": "SELECT(SUM(CASE WHEN SETS.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) ) * 100.0 / COUNT(*) FROM SET_TRANSLATIONS INNER JOIN SETS ON SET_TRANSLATIONS.SETCODE = SETS.CODE WHERE SET_TRANSLATIONS.LANGUAGE = 'JAPANESE'",
        "csc-32b_sql.json.csv": "SELECT CAST(SUM(CASE WHEN S.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(*) AS PERCENTAGE_NON_FOIL FROM SETS S JOIN SET_TRANSLATIONS ST ON S.CODE = ST.SETCODE WHERE ST.LANGUAGE = 'JAPANESE'",
        "gena_submission_2_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T1.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(*) FROM SETS AS T1 INNER JOIN SET_TRANSLATIONS AS T2 ON T1.CODE = T2.SETCODE WHERE T2.LANGUAGE = 'JAPANESE'",
        "alpha_sql.json.csv": "SELECT (SUM(CASE WHEN SETS.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) * 100.0 / COUNT(*)) AS PERCENTAGE FROM SETS INNER JOIN SET_TRANSLATIONS ON SETS.CODE = SET_TRANSLATIONS.SETCODE WHERE SET_TRANSLATIONS.LANGUAGE = 'JAPANESE'",
        "gsr_sql.json.csv": "SELECT (SUM(CASE WHEN S.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) * 100.0 / COUNT(*)) AS PERCENTAGE FROM SETS S JOIN SET_TRANSLATIONS ST ON S.CODE = ST.SETCODE WHERE ST.LANGUAGE = 'JAPANESE';",
        "chess_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T2.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(T1.SETCODE) AS PERCENTAGE FROM SET_TRANSLATIONS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T1.LANGUAGE = 'JAPANESE'",
        "rsl_sql.json.csv": "SELECT CAST(SUM(CASE WHEN SETS.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(*) FROM SETS INNER JOIN SET_TRANSLATIONS ON SETS.CODE = SET_TRANSLATIONS.SETCODE WHERE SET_TRANSLATIONS.LANGUAGE = 'JAPANESE'",
        "omni-32-majority_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T2.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100.0 / COUNT(*) AS PERCENTAGE FROM SET_TRANSLATIONS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE WHERE T1.LANGUAGE = 'JAPANESE';",
        "gena_submission_1_sql.json.csv": "SELECT CAST(SUM(CASE WHEN T1.ISNONFOILONLY = 1 THEN 1 ELSE 0 END) AS REAL) * 100 / COUNT(*) FROM SETS AS T1 INNER JOIN SET_TRANSLATIONS AS T2 ON T1.CODE = T2.SETCODE WHERE T2.LANGUAGE = 'JAPANESE'"
    },
    "528": {
        "question_id": "528",
        "analyze": "GoldSQL: outputs  cards with  status != 'Legal' with format =  NULL",
        "question": "List the names of all the cards in the set Hour of Devastation and find the formats in which these cards are legal.",
        "evidence": "the set Hour of Devastation refers to set.name = 'Hour of Devastation'; names of all the cards in the set refers to cards.name; legal cards refers to status = 'Legal'; the formats refers to format",
        "SQL": "SELECT DISTINCT T2.name , CASE WHEN T1.status = 'Legal' THEN T1.format ELSE NULL END FROM legalities AS T1 INNER JOIN cards AS T2 ON T2.uuid = T1.uuid WHERE T2.setCode IN ( SELECT code FROM sets WHERE name = 'Hour of Devastation' )",
        "csc-7b_sql.json.csv": "SELECT T2.NAME, T3.FORMAT FROM SETS AS T1 INNER JOIN CARDS AS T2 ON T2.SETCODE = T1.CODE INNER JOIN LEGALITIES AS T3 ON T2.UUID = T3.UUID WHERE T1.NAME = 'HOUR OF DEVASTATION' AND T3.STATUS = 'LEGAL'",
        "slm_sql.json.csv": "SELECT C.NAME AS CARD_NAME, L.FORMAT AS LEGAL_FORMAT FROM CARDS C INNER JOIN LEGALITIES L ON C.UUID = L.UUID INNER JOIN SETS S ON C.SETCODE = S.CODE WHERE S.NAME = 'HOUR OF DEVASTATION' AND L.STATUS = 'LEGAL'",
        "csc-32b_sql.json.csv": "SELECT T1.NAME, T3.FORMAT FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE INNER JOIN LEGALITIES AS T3 ON T1.UUID = T3.UUID WHERE T2.NAME = 'HOUR OF DEVASTATION' AND T3.STATUS = 'LEGAL'",
        "gena_submission_2_sql.json.csv": "SELECT T1.NAME, T2.FORMAT FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID INNER JOIN SETS AS T3 ON T1.SETCODE = T3.CODE WHERE T3.NAME = 'HOUR OF DEVASTATION' AND T2.STATUS = 'LEGAL'",
        "alpha_sql.json.csv": "SELECT T1.NAME, T3.FORMAT FROM CARDS AS T1 INNER JOIN SETS AS T2 ON T1.SETCODE = T2.CODE INNER JOIN LEGALITIES AS T3 ON T1.UUID = T3.UUID WHERE T2.NAME = 'HOUR OF DEVASTATION' AND T3.STATUS = 'LEGAL'",
        "gsr_sql.json.csv": "SELECT C.NAME, L.FORMAT FROM CARDS C JOIN LEGALITIES L ON C.UUID = L.UUID JOIN SETS S ON C.SETCODE = S.CODE WHERE S.NAME = 'HOUR OF DEVASTATION' AND L.STATUS = 'LEGAL';",
        "chess_sql.json.csv": "SELECT T2.NAME, T3.FORMAT FROM SETS AS T1 INNER JOIN CARDS AS T2 ON T1.CODE = T2.SETCODE INNER JOIN LEGALITIES AS T3 ON T2.UUID = T3.UUID WHERE T1.NAME = 'HOUR OF DEVASTATION' AND T3.STATUS = 'LEGAL'",
        "rsl_sql.json.csv": "SELECT CARDS.NAME, LEGALITIES.FORMAT FROM CARDS INNER JOIN LEGALITIES ON CARDS.UUID = LEGALITIES.UUID INNER JOIN SETS ON CARDS.SETCODE = SETS.CODE WHERE SETS.NAME = 'HOUR OF DEVASTATION' AND LEGALITIES.STATUS = 'LEGAL'",
        "omni-32-majority_sql.json.csv": "SELECT CARDS.NAME, LEGALITIES.FORMAT FROM SETS INNER JOIN CARDS ON SETS.CODE = CARDS.SETCODE INNER JOIN LEGALITIES ON CARDS.UUID = LEGALITIES.UUID WHERE SETS.NAME = 'HOUR OF DEVASTATION' AND LEGALITIES.STATUS = 'LEGAL';",
        "gena_submission_1_sql.json.csv": "SELECT T1.NAME, T2.FORMAT FROM CARDS AS T1 INNER JOIN LEGALITIES AS T2 ON T1.UUID = T2.UUID INNER JOIN SETS AS T3 ON T1.SETCODE = T3.CODE WHERE T3.NAME = 'HOUR OF DEVASTATION' AND T2.STATUS = 'LEGAL'"
    },
    "583": {
        "question_id": "583",
        "analyze": "Ambigious question: It doesn’t specify whether we need to compute score per url or in total",
        "question": "What is the total score of the posts edited by Yevgeny and include the user's website URL.",
        "evidence": "\"Yevgeny\" is the DisplayName; edited refers to LastEditorUserId",
        "SQL": "SELECT SUM(T1.Score), T2.WebsiteUrl FROM posts AS T1 INNER JOIN users AS T2 ON T1.LastEditorUserId = T2.Id WHERE T2.DisplayName = 'Yevgeny' GROUP BY T2.WebsiteUrl",
        "csc-7b_sql.json.csv": "SELECT SUM(POSTS.SCORE), USERS.WEBSITEURL FROM POSTS JOIN USERS ON POSTS.LASTEDITORUSERID = USERS.ID WHERE USERS.DISPLAYNAME = 'YEVGENY'",
        "slm_sql.json.csv": "SELECT SUM(P.SCORE) AS TOTALSCORE, U.WEBSITEURL FROM USERS U INNER JOIN POSTS P ON U.ID = P.LASTEDITORUSERID WHERE U.DISPLAYNAME = 'YEVGENY'",
        "csc-32b_sql.json.csv": "SELECT SUM(P.SCORE) AS TOTALSCORE, U.WEBSITEURL FROM POSTS P JOIN USERS U ON P.LASTEDITORUSERID = U.ID WHERE U.DISPLAYNAME = 'YEVGENY'",
        "gena_submission_2_sql.json.csv": "SELECT SUM(T1.SCORE), T2.WEBSITEURL FROM POSTS AS T1 INNER JOIN USERS AS T2 ON T1.LASTEDITORUSERID = T2.ID WHERE T2.DISPLAYNAME = 'YEVGENY'",
        "alpha_sql.json.csv": "SELECT SUM(POSTS.SCORE) AS TOTALSCORE, USERS.WEBSITEURL FROM POSTS INNER JOIN USERS ON POSTS.LASTEDITORUSERID = USERS.ID WHERE USERS.DISPLAYNAME = 'YEVGENY'",
        "gsr_sql.json.csv": "SELECT SUM(CAST(POSTS.SCORE AS FLOAT)) AS TOTAL_SCORE, USERS.WEBSITEURL FROM POSTS JOIN USERS ON POSTS.LASTEDITORUSERID = USERS.ID WHERE USERS.DISPLAYNAME = 'YEVGENY';",
        "chess_sql.json.csv": "SELECT SUM(T2.SCORE), T1.WEBSITEURL FROM USERS AS T1 INNER JOIN POSTS AS T2 ON T1.ID = T2.LASTEDITORUSERID WHERE T1.DISPLAYNAME = 'YEVGENY'",
        "rsl_sql.json.csv": "SELECT SUM(POSTS.SCORE), USERS.WEBSITEURL FROM POSTS INNER JOIN USERS ON POSTS.LASTEDITORUSERID = USERS.ID WHERE USERS.DISPLAYNAME = 'YEVGENY'",
        "omni-32-majority_sql.json.csv": "SELECT COALESCE(SUM(POSTS.SCORE), 0) AS TOTALSCORE, USERS.WEBSITEURL FROM USERS JOIN POSTS ON USERS.ID = POSTS.LASTEDITORUSERID WHERE USERS.DISPLAYNAME = 'YEVGENY';",
        "gena_submission_1_sql.json.csv": "SELECT SUM(T1.SCORE), T2.WEBSITEURL FROM POSTS AS T1 INNER JOIN USERS AS T2 ON T1.LASTEDITORUSERID = T2.ID WHERE T2.DISPLAYNAME = 'YEVGENY'"
    },
    "668": {
        "question_id": "668",
        "analyze": "GoldSQL: allows NULL badges",
        "question": "What is the display name of the user who acquired the highest amount of badges?",
        "evidence": "highest amount of badges refers to MAX(COUNT(Name));",
        "SQL": "SELECT T1.DisplayName FROM users AS T1 INNER JOIN badges AS T2 ON T1.Id = T2.UserId GROUP BY T1.DisplayName ORDER BY COUNT(T1.Id) DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T2.DISPLAYNAME FROM BADGES AS T1 JOIN USERS AS T2 ON T1.USERID = T2.ID GROUP BY T1.USERID ORDER BY COUNT(T1.NAME) DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT U.DISPLAYNAME FROM BADGES B INNER JOIN USERS U ON B.USERID = U.ID GROUP BY B.USERID, U.DISPLAYNAME ORDER BY COUNT(B.ID) DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT T2.DISPLAYNAME FROM BADGES AS T1 JOIN USERS AS T2 ON T1.USERID = T2.ID GROUP BY T2.DISPLAYNAME ORDER BY COUNT(T1.NAME) DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.DISPLAYNAME FROM USERS AS T1 INNER JOIN BADGES AS T2 ON T1.ID = T2.USERID GROUP BY T1.DISPLAYNAME ORDER BY COUNT(T2.NAME) DESC LIMIT 1",
        "alpha_sql.json.csv": "SELECT USERS.DISPLAYNAME FROM USERS INNER JOIN BADGES ON USERS.ID = BADGES.USERID GROUP BY USERS.ID ORDER BY COUNT(BADGES.NAME) DESC LIMIT 1",
        "gsr_sql.json.csv": "SELECT U.DISPLAYNAME FROM USERS U JOIN BADGES B ON U.ID = B.USERID GROUP BY U.ID ORDER BY COUNT(B.NAME) DESC LIMIT 1;",
        "chess_sql.json.csv": "SELECT T2.DISPLAYNAME FROM BADGES AS T1 INNER JOIN USERS AS T2 ON T1.USERID = T2.ID GROUP BY T2.DISPLAYNAME ORDER BY COUNT(T1.NAME) DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT USERS.DISPLAYNAME FROM USERS INNER JOIN BADGES ON USERS.ID = BADGES.USERID GROUP BY BADGES.USERID ORDER BY COUNT(BADGES.NAME) DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT U.DISPLAYNAME FROM USERS U INNER JOIN BADGES B ON U.ID = B.USERID GROUP BY U.ID, U.DISPLAYNAME ORDER BY COUNT(B.NAME) DESC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.DISPLAYNAME FROM USERS AS T1 INNER JOIN BADGES AS T2 ON T1.ID = T2.USERID GROUP BY T1.DISPLAYNAME ORDER BY COUNT(T2.NAME) DESC LIMIT 1"
    },
    "669": {
        "question_id": "669",
        "analyze": "GoldSQL: It allows NULL dates",
        "question": "When did 'chl' cast its first vote in a post?",
        "evidence": "DisplayName = 'chl'; cast its first vote refers to MIN(CreationDate);",
        "SQL": "SELECT T2.CreationDate FROM users AS T1 INNER JOIN votes AS T2 ON T1.Id = T2.UserId WHERE T1.DisplayName = 'chl' ORDER BY T2.CreationDate LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT MIN(T1.CREATIONDATE) FROM VOTES AS T1 INNER JOIN USERS AS T2 ON T1.USERID = T2.ID WHERE T2.DISPLAYNAME = 'CHL' ORDER BY T1.CREATIONDATE ASC LIMIT 1",
        "slm_sql.json.csv": "SELECT MIN(V.CREATIONDATE) AS FIRSTVOTEDATE FROM USERS U INNER JOIN VOTES V ON U.ID = V.USERID WHERE U.DISPLAYNAME = 'CHL'",
        "csc-32b_sql.json.csv": "SELECT MIN(V.CREATIONDATE) AS FIRSTVOTEDATE FROM USERS U JOIN VOTES V ON U.ID = V.USERID WHERE U.DISPLAYNAME = 'CHL'",
        "gena_submission_2_sql.json.csv": "SELECT MIN(T1.CREATIONDATE) FROM VOTES AS T1 INNER JOIN USERS AS T2 ON T1.USERID = T2.ID WHERE T2.DISPLAYNAME = 'CHL'",
        "alpha_sql.json.csv": "SELECT MIN(VOTES.CREATIONDATE) FROM VOTES INNER JOIN USERS ON VOTES.USERID = USERS.ID WHERE USERS.DISPLAYNAME = 'CHL'",
        "gsr_sql.json.csv": "SELECT MIN(VOTES.CREATIONDATE) FROM VOTES JOIN USERS ON VOTES.USERID = USERS.ID WHERE USERS.DISPLAYNAME = 'CHL';",
        "chess_sql.json.csv": "SELECT MIN(T2.CREATIONDATE) FROM USERS AS T1 INNER JOIN VOTES AS T2 ON T1.ID = T2.USERID WHERE T1.DISPLAYNAME = 'CHL'",
        "rsl_sql.json.csv": "SELECT MIN(V.CREATIONDATE) FROM VOTES V INNER JOIN USERS U ON V.USERID = U.ID WHERE U.DISPLAYNAME = 'CHL'",
        "omni-32-majority_sql.json.csv": "SELECT MIN(VOTES.CREATIONDATE) AS FIRSTVOTEDATE FROM USERS INNER JOIN VOTES ON USERS.ID = VOTES.USERID WHERE USERS.DISPLAYNAME = 'CHL';",
        "gena_submission_1_sql.json.csv": "SELECT MIN(T1.CREATIONDATE) FROM VOTES AS T1 INNER JOIN USERS AS T2 ON T1.USERID = T2.ID WHERE T2.DISPLAYNAME = 'CHL'"
    },
    "707": {
        "question_id": "707",
        "analyze": "Ambigious question: It doesn’t specify tie breaking rule",
        "question": "Among the posts with views ranging from 100 to 150, what is the comment with the highest score?",
        "evidence": "views ranging from 100 to 150 refers to ViewCount BETWEEN 100 and 150; comment with the highest score refers to Text where MAX(Score);",
        "SQL": "SELECT Text FROM comments WHERE PostId IN ( SELECT Id FROM posts WHERE ViewCount BETWEEN 100 AND 150 ) ORDER BY Score DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T2.TEXT FROM POSTS AS T1 INNER JOIN COMMENTS AS T2 ON T1.ID = T2.POSTID WHERE T1.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY T2.SCORE DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT C.TEXT FROM POSTS P INNER JOIN COMMENTS C ON P.ID = C.POSTID WHERE P.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY C.SCORE DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT C.TEXT FROM COMMENTS C JOIN POSTS P ON C.POSTID = P.ID WHERE P.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY C.SCORE DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.TEXT FROM COMMENTS AS T1 INNER JOIN POSTS AS T2 ON T1.POSTID = T2.ID WHERE T2.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY T1.SCORE DESC LIMIT 1",
        "alpha_sql.json.csv": "SELECT C.TEXT FROM POSTS AS P INNER JOIN COMMENTS AS C ON P.ID = C.POSTID WHERE P.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY C.SCORE DESC LIMIT 1",
        "gsr_sql.json.csv": "SELECT C.TEXT FROM COMMENTS C JOIN POSTS P ON C.POSTID = P.ID WHERE P.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY C.SCORE DESC LIMIT 1;",
        "chess_sql.json.csv": "SELECT T2.TEXT FROM POSTS AS T1 INNER JOIN COMMENTS AS T2 ON T1.ID = T2.POSTID WHERE T1.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY T2.SCORE DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT COMMENTS.TEXT FROM POSTS INNER JOIN COMMENTS ON POSTS.ID = COMMENTS.POSTID WHERE POSTS.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY COMMENTS.SCORE DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT COMMENTS.TEXT FROM COMMENTS INNER JOIN POSTS ON COMMENTS.POSTID = POSTS.ID WHERE POSTS.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY COMMENTS.SCORE DESC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.TEXT FROM COMMENTS AS T1 INNER JOIN POSTS AS T2 ON T1.POSTID = T2.ID WHERE T2.VIEWCOUNT BETWEEN 100 AND 150 ORDER BY T1.SCORE DESC LIMIT 1"
    },
    "742": {
        "question_id": "742",
        "analyze": "GoldSQL: ignoreampire superheroes with name NULL (name is not the key) ",
        "question": "How many vampire superheroes are there?",
        "evidence": "vampire superheroes refers to race = 'Vampire'",
        "SQL": "SELECT COUNT(T1.superhero_name) FROM superhero AS T1 INNER JOIN race AS T2 ON T1.race_id = T2.id WHERE T2.race = 'Vampire'",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO AS T1 JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'VAMPIRE'",
        "slm_sql.json.csv": "SELECT COUNT(SUPERHERO.ID) AS COUNT FROM SUPERHERO JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'VAMPIRE'",
        "csc-32b_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'VAMPIRE'",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO AS T1 INNER JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'VAMPIRE'",
        "alpha_sql.json.csv": "SELECT COUNT(SUPERHERO.ID) FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'VAMPIRE'",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'VAMPIRE';",
        "chess_sql.json.csv": "SELECT COUNT(T2.ID) FROM RACE AS T1 INNER JOIN SUPERHERO AS T2 ON T1.ID = T2.RACE_ID WHERE T1.RACE = 'VAMPIRE'",
        "rsl_sql.json.csv": "SELECT COUNT(ID) FROM SUPERHERO WHERE RACE_ID = (SELECT ID FROM RACE WHERE RACE = 'VAMPIRE')",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(SUPERHERO.ID) FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'VAMPIRE';",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO AS T1 INNER JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'VAMPIRE'"
    },
    "789": {
        "question_id": "789",
        "analyze": "GoldSQL: denominator counts NULL weight_kg values",
        "question": "Find the average weight of the heroes who are aliens.",
        "evidence": "average = AVG(weight_kg); aliens refers to race = 'Alien';",
        "SQL": "SELECT CAST(SUM(T1.weight_kg) AS REAL) / COUNT(T1.id) FROM superhero AS T1 INNER JOIN race AS T2 ON T1.race_id = T2.id WHERE T2.race = 'Alien'",
        "csc-7b_sql.json.csv": "SELECT AVG(T1.WEIGHT_KG) FROM SUPERHERO AS T1 JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'ALIEN'",
        "slm_sql.json.csv": "SELECT AVG(SUPERHERO.WEIGHT_KG) AS AVERAGE_WEIGHT FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'ALIEN'",
        "csc-32b_sql.json.csv": "SELECT AVG(S.WEIGHT_KG) AS AVERAGE_WEIGHT FROM SUPERHERO S JOIN RACE R ON S.RACE_ID = R.ID WHERE R.RACE = 'ALIEN'",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T1.WEIGHT_KG) FROM SUPERHERO AS T1 INNER JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'ALIEN'",
        "alpha_sql.json.csv": "SELECT AVG(SUPERHERO.WEIGHT_KG) FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'ALIEN'",
        "gsr_sql.json.csv": "SELECT AVG(CAST(WEIGHT_KG AS FLOAT)) FROM SUPERHERO JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'ALIEN';",
        "chess_sql.json.csv": "SELECT AVG(T2.WEIGHT_KG) FROM RACE AS T1 INNER JOIN SUPERHERO AS T2 ON T1.ID = T2.RACE_ID WHERE T1.RACE = 'ALIEN'",
        "rsl_sql.json.csv": "SELECT AVG(SUPERHERO.WEIGHT_KG) FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'ALIEN'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(SUPERHERO.WEIGHT_KG) AS AVERAGE_WEIGHT FROM SUPERHERO INNER JOIN RACE ON SUPERHERO.RACE_ID = RACE.ID WHERE RACE.RACE = 'ALIEN';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T1.WEIGHT_KG) FROM SUPERHERO AS T1 INNER JOIN RACE AS T2 ON T1.RACE_ID = T2.ID WHERE T2.RACE = 'ALIEN'"
    },
    "828": {
        "question_id": "828",
        "analyze": "GoldSQL: exclude heros with NULL names",
        "question": "Count the fastest superheroes.",
        "evidence": "fastest refers to attribute_value = 100 WHERE attribute_name = 'Speed';",
        "SQL": "SELECT COUNT(T3.superhero_name) FROM hero_attribute AS T1 INNER JOIN attribute AS T2 ON T1.attribute_id = T2.id INNER JOIN superhero AS T3 ON T1.hero_id = T3.id WHERE T2.attribute_name = 'Speed' AND T1.attribute_value = 100",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO AS S INNER JOIN HERO_ATTRIBUTE AS HA ON S.ID = HA.HERO_ID INNER JOIN ATTRIBUTE AS A ON HA.ATTRIBUTE_ID = A.ID WHERE A.ATTRIBUTE_NAME = 'SPEED' AND HA.ATTRIBUTE_VALUE = 100",
        "slm_sql.json.csv": "SELECT COUNT(*) FROM ATTRIBUTE INNER JOIN HERO_ATTRIBUTE ON ATTRIBUTE.ID = HERO_ATTRIBUTE.ATTRIBUTE_ID INNER JOIN SUPERHERO ON HERO_ATTRIBUTE.HERO_ID = SUPERHERO.ID WHERE ATTRIBUTE.ATTRIBUTE_NAME = 'SPEED' AND HERO_ATTRIBUTE.ATTRIBUTE_VALUE = 100",
        "csc-32b_sql.json.csv": "SELECT COUNT(DISTINCT HA.HERO_ID) FROM HERO_ATTRIBUTE HA JOIN ATTRIBUTE A ON HA.ATTRIBUTE_ID = A.ID WHERE A.ATTRIBUTE_NAME = 'SPEED' AND HA.ATTRIBUTE_VALUE = 100",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(T1.HERO_ID) FROM HERO_ATTRIBUTE AS T1 INNER JOIN ATTRIBUTE AS T2 ON T1.ATTRIBUTE_ID = T2.ID WHERE T2.ATTRIBUTE_NAME = 'SPEED' AND T1.ATTRIBUTE_VALUE = 100",
        "alpha_sql.json.csv": "SELECT COUNT(HERO_ATTRIBUTE.HERO_ID) FROM HERO_ATTRIBUTE INNER JOIN ATTRIBUTE ON HERO_ATTRIBUTE.ATTRIBUTE_ID = ATTRIBUTE.ID WHERE ATTRIBUTE.ATTRIBUTE_NAME = 'SPEED' AND HERO_ATTRIBUTE.ATTRIBUTE_VALUE = 100",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO JOIN HERO_ATTRIBUTE ON SUPERHERO.ID = HERO_ATTRIBUTE.HERO_ID JOIN ATTRIBUTE ON HERO_ATTRIBUTE.ATTRIBUTE_ID = ATTRIBUTE.ID WHERE ATTRIBUTE.ATTRIBUTE_NAME = 'SPEED' AND HERO_ATTRIBUTE.ATTRIBUTE_VALUE = 100;",
        "chess_sql.json.csv": "SELECT COUNT(T1.ID) FROM ATTRIBUTE AS T1 INNER JOIN HERO_ATTRIBUTE AS T2 ON T1.ID = T2.ATTRIBUTE_ID WHERE T1.ATTRIBUTE_NAME = 'SPEED' AND T2.ATTRIBUTE_VALUE = 100",
        "rsl_sql.json.csv": "SELECT COUNT(*) FROM SUPERHERO AS T1 INNER JOIN HERO_ATTRIBUTE AS T2 ON T1.ID = T2.HERO_ID INNER JOIN ATTRIBUTE AS T3 ON T2.ATTRIBUTE_ID = T3.ID WHERE T2.ATTRIBUTE_VALUE = 100 AND T3.ATTRIBUTE_NAME = 'SPEED'",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(HERO_ATTRIBUTE.HERO_ID) FROM ATTRIBUTE INNER JOIN HERO_ATTRIBUTE ON ATTRIBUTE.ID = HERO_ATTRIBUTE.ATTRIBUTE_ID WHERE ATTRIBUTE.ATTRIBUTE_NAME = 'SPEED' AND HERO_ATTRIBUTE.ATTRIBUTE_VALUE = 100;",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(T1.HERO_ID) FROM HERO_ATTRIBUTE AS T1 INNER JOIN ATTRIBUTE AS T2 ON T1.ATTRIBUTE_ID = T2.ID WHERE T2.ATTRIBUTE_NAME = 'SPEED' AND T1.ATTRIBUTE_VALUE = 100"
    },
    "867": {
        "question_id": "867",
        "analyze": "GenSQL: does not filter NULL fastestLapSpeed",
        "question": "For the driver who set the fastest lap speed in race No.933, where does he come from?",
        "evidence": "fastest lap speed refers to MAX(fastestLapSpeed);",
        "SQL": "SELECT T1.nationality FROM drivers AS T1 INNER JOIN results AS T2 ON T2.driverId = T1.driverId WHERE T2.raceId = 933 AND T2.fastestLapTime IS NOT NULL ORDER BY T2.fastestLapSpeed DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T2.NATIONALITY FROM RESULTS AS T1 JOIN DRIVERS AS T2 ON T1.DRIVERID = T2.DRIVERID JOIN RACES AS T3 ON T1.RACEID = T3.RACEID WHERE T3.RACEID = 933 ORDER BY T1.FASTESTLAPSPEED DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT D.NATIONALITY FROM RESULTS AS R INNER JOIN DRIVERS AS D ON R.DRIVERID = D.DRIVERID WHERE R.RACEID = 933 ORDER BY R.FASTESTLAPSPEED DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT D.NATIONALITY FROM RESULTS R JOIN DRIVERS D ON R.DRIVERID = D.DRIVERID WHERE R.RACEID = 933 ORDER BY R.FASTESTLAPSPEED DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.NATIONALITY FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID WHERE T2.RACEID = 933 ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1",
        "alpha_sql.json.csv": "SELECT T2.NATIONALITY FROM RESULTS AS T1 INNER JOIN DRIVERS AS T2 ON T1.DRIVERID = T2.DRIVERID WHERE T1.RACEID = 933 ORDER BY T1.FASTESTLAPSPEED DESC LIMIT 1",
        "gsr_sql.json.csv": "SELECT D.NATIONALITY FROM RESULTS R JOIN DRIVERS D ON R.DRIVERID = D.DRIVERID WHERE R.RACEID = 933 ORDER BY R.FASTESTLAPSPEED DESC LIMIT 1;",
        "chess_sql.json.csv": "SELECT T2.NATIONALITY FROM RESULTS AS T1 INNER JOIN DRIVERS AS T2 ON T1.DRIVERID = T2.DRIVERID WHERE T1.RACEID = 933 ORDER BY T1.FASTESTLAPSPEED DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT DRIVERS.NATIONALITY FROM RESULTS INNER JOIN DRIVERS ON RESULTS.DRIVERID = DRIVERS.DRIVERID WHERE RESULTS.RACEID = 933 ORDER BY RESULTS.FASTESTLAPSPEED DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT DRIVERS.NATIONALITY FROM DRIVERS WHERE DRIVERS.DRIVERID = ( SELECT RESULTS.DRIVERID FROM RESULTS WHERE RESULTS.RACEID = 933 ORDER BY RESULTS.FASTESTLAPSPEED DESC LIMIT 1 );",
        "gena_submission_1_sql.json.csv": "SELECT T1.NATIONALITY FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID WHERE T2.RACEID = 933 ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1"
    },
    "927": {
        "question_id": "927",
		"analyze": "GenSQL does not filter NULL",
        "question": "Which driver created the fastest lap speed in a Formula_1 race? Please give both his forename and surname.",
        "evidence": "",
        "SQL": "SELECT T1.forename, T1.surname FROM drivers AS T1 INNER JOIN results AS T2 ON T2.driverId = T1.driverId WHERE T2.fastestLapTime IS NOT NULL ORDER BY T2.fastestLapSpeed DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T1.FORENAME, T1.SURNAME FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT DRIVERS.FORENAME, DRIVERS.SURNAME FROM DRIVERS INNER JOIN RESULTS ON DRIVERS.DRIVERID = RESULTS.DRIVERID ORDER BY RESULTS.FASTESTLAPSPEED DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT T1.FORENAME, T1.SURNAME FROM DRIVERS AS T1 JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.FORENAME, T1.SURNAME FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1",
        "alpha_sql.json.csv": "SELECT T1.FORENAME, T1.SURNAME FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID WHERE T2.FASTESTLAPSPEED = (SELECT MAX(FASTESTLAPSPEED) FROM RESULTS)",
        "gsr_sql.json.csv": "SELECT D.FORENAME, D.SURNAME FROM DRIVERS D JOIN RESULTS R ON D.DRIVERID = R.DRIVERID ORDER BY R.FASTESTLAPSPEED DESC LIMIT 1;",
        "chess_sql.json.csv": "SELECT T2.FORENAME, T2.SURNAME FROM RESULTS AS T1 INNER JOIN DRIVERS AS T2 ON T1.DRIVERID = T2.DRIVERID ORDER BY T1.FASTESTLAPSPEED DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT DRIVERS.FORENAME, DRIVERS.SURNAME FROM RESULTS INNER JOIN DRIVERS ON RESULTS.DRIVERID = DRIVERS.DRIVERID ORDER BY RESULTS.FASTESTLAPSPEED DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT DRIVERS.FORENAME, DRIVERS.SURNAME FROM DRIVERS INNER JOIN RESULTS ON DRIVERS.DRIVERID = RESULTS.DRIVERID ORDER BY RESULTS.FASTESTLAPSPEED DESC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.FORENAME, T1.SURNAME FROM DRIVERS AS T1 INNER JOIN RESULTS AS T2 ON T1.DRIVERID = T2.DRIVERID ORDER BY T2.FASTESTLAPSPEED DESC LIMIT 1"
    },
	"977": {
        "question_id": "977",
		"analyze": "incorrect Gold SQL. If time is all NULL, Gold SQL returns NULL instead of 0.",
        "question": "From race no. 50 to 100, how many finishers have been disqualified?",
        "evidence": "disqualified refers to statusID = 2, finisher refers to time! = null; race no. refers to raceId; raceId > 50 and raceId < 100;",
        "SQL": "SELECT SUM(IIF(time IS NOT NULL, 1, 0)) FROM results WHERE statusId = 2 AND raceID < 100 AND raceId > 50",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE STATUSID = 2 AND TIME IS NOT NULL AND RACEID BETWEEN 50 AND 100",
        "slm_sql.json.csv": "SELECT COUNT(*) AS DISQUALIFIED_FINISHERS FROM RACES R INNER JOIN RESULTS RES ON R.RACEID = RES.RACEID INNER JOIN STATUS S ON RES.STATUSID = S.STATUSID WHERE R.RACEID BETWEEN 50 AND 100 AND S.STATUSID = 2 AND RES.TIME IS NOT NULL",
        "csc-32b_sql.json.csv": "SELECT COUNT(DRIVERID) FROM RESULTS WHERE RACEID > 50 AND RACEID < 100 AND TIME IS NOT NULL AND STATUSID = 2",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE RACEID BETWEEN 50 AND 100 AND STATUSID = 2 AND TIME IS NOT NULL",
        "alpha_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE RACEID > 50 AND RACEID < 100 AND NOT TIME IS NULL AND STATUSID = 2",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE RACEID > 50 AND RACEID < 100 AND STATUSID = 2 AND TIME IS NOT NULL;",
        "chess_sql.json.csv": "SELECT COUNT(T1.RACEID) FROM RACES AS T1 INNER JOIN RESULTS AS T2 ON T1.RACEID = T2.RACEID WHERE T1.RACEID BETWEEN 50 AND 100 AND T2.STATUSID = 2 AND T2.TIME IS NOT NULL",
        "rsl_sql.json.csv": "SELECT COUNT(*) FROM RESULTS INNER JOIN STATUS ON RESULTS.STATUSID = STATUS.STATUSID WHERE RESULTS.RACEID > 50 AND RESULTS.RACEID < 100 AND RESULTS.TIME IS NOT NULL AND STATUS.STATUSID = 2",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE RACEID >= 50 AND RACEID <= 100 AND STATUSID = 2 AND TIME IS NOT NULL;",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(*) FROM RESULTS WHERE RACEID BETWEEN 50 AND 100 AND STATUSID = 2 AND TIME IS NOT NULL"        
	},
	"1019": {
        "question_id": "1019",
		"analyze": "Average is computed incorrectly when denominator contains NULL",
         "question": "What is the average lap time in milliseconds of all the lap records set on the various circuits in Italy?",
        "evidence": "average = AVG(milliseconds)",
        "SQL": "SELECT CAST(SUM(T1.milliseconds) AS REAL) / COUNT(T1.lap) FROM lapTimes AS T1 INNER JOIN races AS T2 on T1.raceId = T2.raceId INNER JOIN circuits AS T3 on T2.circuitId = T3.circuitId WHERE T3.country = 'Italy'",
        "csc-7b_sql.json.csv": "SELECT AVG(T1.MILLISECONDS) FROM LAPTIMES AS T1 JOIN RACES AS T2 ON T1.RACEID = T2.RACEID JOIN CIRCUITS AS T3 ON T2.CIRCUITID = T3.CIRCUITID WHERE T3.COUNTRY = 'ITALY'",
        "slm_sql.json.csv": "SELECT AVG(LAPTIMES.MILLISECONDS) AS AVERAGE_LAP_TIME FROM LAPTIMES INNER JOIN RACES ON LAPTIMES.RACEID = RACES.RACEID INNER JOIN CIRCUITS ON RACES.CIRCUITID = CIRCUITS.CIRCUITID WHERE CIRCUITS.COUNTRY = 'ITALY'",
        "csc-32b_sql.json.csv": "SELECT AVG(L.MILLISECONDS) AS AVERAGE FROM LAPTIMES L JOIN RACES R ON L.RACEID = R.RACEID JOIN CIRCUITS C ON R.CIRCUITID = C.CIRCUITID WHERE C.COUNTRY = 'ITALY'",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T1.MILLISECONDS) FROM LAPTIMES AS T1 INNER JOIN RACES AS T2 ON T1.RACEID = T2.RACEID INNER JOIN CIRCUITS AS T3 ON T2.CIRCUITID = T3.CIRCUITID WHERE T3.COUNTRY = 'ITALY'",
        "alpha_sql.json.csv": "SELECT AVG(LAPTIMES.MILLISECONDS) FROM LAPTIMES INNER JOIN RACES ON LAPTIMES.RACEID = RACES.RACEID INNER JOIN CIRCUITS ON RACES.CIRCUITID = CIRCUITS.CIRCUITID WHERE CIRCUITS.COUNTRY = 'ITALY'",
        "gsr_sql.json.csv": "SELECT AVG(CAST(LAPTIMES.MILLISECONDS AS FLOAT)) FROM LAPTIMES JOIN RACES ON LAPTIMES.RACEID = RACES.RACEID JOIN CIRCUITS ON RACES.CIRCUITID = CIRCUITS.CIRCUITID WHERE CIRCUITS.COUNTRY = 'ITALY';",
        "chess_sql.json.csv": "SELECT AVG(T3.MILLISECONDS) FROM CIRCUITS AS T1 INNER JOIN RACES AS T2 ON T1.CIRCUITID = T2.CIRCUITID INNER JOIN LAPTIMES AS T3 ON T2.RACEID = T3.RACEID WHERE T1.COUNTRY = 'ITALY'",
        "rsl_sql.json.csv": "SELECT AVG(LAPTIMES.MILLISECONDS) FROM LAPTIMES INNER JOIN RACES ON LAPTIMES.RACEID = RACES.RACEID INNER JOIN CIRCUITS ON RACES.CIRCUITID = CIRCUITS.CIRCUITID WHERE CIRCUITS.COUNTRY = 'ITALY'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(LAPTIMES.MILLISECONDS) AS AVERAGE_LAP_TIME FROM CIRCUITS INNER JOIN RACES ON CIRCUITS.CIRCUITID = RACES.CIRCUITID INNER JOIN LAPTIMES ON RACES.RACEID = LAPTIMES.RACEID WHERE CIRCUITS.COUNTRY = 'ITALY';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T1.MILLISECONDS) FROM LAPTIMES AS T1 INNER JOIN RACES AS T2 ON T1.RACEID = T2.RACEID INNER JOIN CIRCUITS AS T3 ON T2.CIRCUITID = T3.CIRCUITID WHERE T3.COUNTRY = 'ITALY'"        
	},
	"1039": {
        "question_id": "1039",
		"analyze": "The average is not computed correctly  when denominator contains NULL",
        "question": "Find the average number of long-shot done by Ahmed Samir Farag.",
        "evidence": "average number of long shot = DIVIDE(SUM(long_shots), COUNT(player_fifa_api_id));",
        "SQL": "SELECT CAST(SUM(t2.long_shots) AS REAL) / COUNT(t2.`date`) FROM Player AS t1 INNER JOIN Player_Attributes AS t2 ON t1.player_api_id = t2.player_api_id WHERE t1.player_name = 'Ahmed Samir Farag'",
        "csc-7b_sql.json.csv": "SELECT AVG(LONG_SHOTS) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_FIFA_API_ID = T2.PLAYER_FIFA_API_ID WHERE T1.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "slm_sql.json.csv": "SELECT AVG(T2.LONG_SHOTS) AS AVERAGE_LONG_SHOTS FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "csc-32b_sql.json.csv": "SELECT CAST(SUM(T2.LONG_SHOTS) AS REAL) / COUNT(T2.PLAYER_FIFA_API_ID) AS AVERAGE_LONG_SHOTS FROM PLAYER AS T1 JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "gena_submission_2_sql.json.csv": "SELECT CAST(SUM(T1.LONG_SHOTS) AS REAL) / COUNT(T1.PLAYER_FIFA_API_ID) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "alpha_sql.json.csv": "SELECT AVG(PLAYER_ATTRIBUTES.LONG_SHOTS) AS AVERAGE_LONG_SHOTS FROM PLAYER INNER JOIN PLAYER_ATTRIBUTES ON PLAYER.PLAYER_API_ID = PLAYER_ATTRIBUTES.PLAYER_API_ID WHERE PLAYER.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "gsr_sql.json.csv": "SELECT AVG(LONG_SHOTS) FROM PLAYER_ATTRIBUTES WHERE PLAYER_FIFA_API_ID = (SELECT PLAYER_FIFA_API_ID FROM PLAYER WHERE PLAYER_NAME = 'AHMED SAMIR FARAG');",
        "chess_sql.json.csv": "SELECT AVG(T2.LONG_SHOTS) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_FIFA_API_ID = T2.PLAYER_FIFA_API_ID WHERE T1.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "rsl_sql.json.csv": "SELECT CAST(SUM(PLAYER_ATTRIBUTES.LONG_SHOTS) AS REAL) / COUNT(PLAYER_ATTRIBUTES.PLAYER_FIFA_API_ID) FROM PLAYER_ATTRIBUTES INNER JOIN PLAYER ON PLAYER_ATTRIBUTES.PLAYER_FIFA_API_ID = PLAYER.PLAYER_FIFA_API_ID WHERE PLAYER.PLAYER_NAME = 'AHMED SAMIR FARAG'",
        "omni-32-majority_sql.json.csv": "SELECT SUM(T2.LONG_SHOTS) * 1.0 / COUNT(T2.PLAYER_FIFA_API_ID) AS AVERAGE_LONG_SHOTS FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'AHMED SAMIR FARAG';",
        "gena_submission_1_sql.json.csv": "SELECT CAST(SUM(T1.LONG_SHOTS) AS REAL) / COUNT(T1.PLAYER_FIFA_API_ID) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'AHMED SAMIR FARAG'"
    },
	"1072": {
	    "question_id": "1072",
        "analyze": "average computed incorrectly  when denominator contains NULL",
        "question": "What is the average overall rating of the football player Aaron Doran?",
        "evidence": "average overall rating = AVG(overall_rating);",
        "SQL": "SELECT CAST(SUM(t2.overall_rating) AS REAL) / COUNT(t2.id) FROM Player AS t1 INNER JOIN Player_Attributes AS t2 ON t1.player_api_id = t2.player_api_id WHERE t1.player_name = 'Aaron Doran'",
        "csc-7b_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'AARON DORAN'",
        "slm_sql.json.csv": "SELECT AVG(PA.OVERALL_RATING) FROM PLAYER AS P INNER JOIN PLAYER_ATTRIBUTES AS PA ON P.PLAYER_API_ID = PA.PLAYER_API_ID WHERE P.PLAYER_NAME = 'AARON DORAN'",
        "csc-32b_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'AARON DORAN'",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'AARON DORAN'",
        "alpha_sql.json.csv": "SELECT AVG(PLAYER_ATTRIBUTES.OVERALL_RATING) AS AVERAGE_OVERALL_RATING FROM PLAYER INNER JOIN PLAYER_ATTRIBUTES ON PLAYER.PLAYER_API_ID = PLAYER_ATTRIBUTES.PLAYER_API_ID WHERE PLAYER.PLAYER_NAME = 'AARON DORAN'",
        "gsr_sql.json.csv": "SELECT AVG(OVERALL_RATING) FROM PLAYER_ATTRIBUTES JOIN PLAYER ON PLAYER_ATTRIBUTES.PLAYER_API_ID = PLAYER.PLAYER_API_ID WHERE PLAYER.PLAYER_NAME = 'AARON DORAN';",
        "chess_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_FIFA_API_ID = T2.PLAYER_FIFA_API_ID WHERE T1.PLAYER_NAME = 'AARON DORAN'",
        "rsl_sql.json.csv": "SELECT AVG(PLAYER_ATTRIBUTES.OVERALL_RATING) FROM PLAYER_ATTRIBUTES INNER JOIN PLAYER ON PLAYER_ATTRIBUTES.PLAYER_API_ID = PLAYER.PLAYER_API_ID WHERE PLAYER.PLAYER_NAME = 'AARON DORAN'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(PA.OVERALL_RATING) AS AVERAGE_OVERALL_RATING FROM PLAYER AS P INNER JOIN PLAYER_ATTRIBUTES AS PA ON P.PLAYER_API_ID = PA.PLAYER_API_ID WHERE P.PLAYER_NAME = 'AARON DORAN';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'AARON DORAN'"
    },
	"1095": {
        "question_id": "1095",
		"analyze": "average computed incorrectly when denominator contains NULL",
        "question": "How much is the average build up play speed of the Heart of Midlothian team?",
        "evidence": "Heart of Midlothian refers to team_long_name = 'Heart of Midlothian'; average build up play speed refers to\u00a0 AVG(buildUpPlaySpeed)",
        "SQL": "SELECT CAST(SUM(t2.buildUpPlaySpeed) AS REAL) / COUNT(t2.id) FROM Team AS t1 INNER JOIN Team_Attributes AS t2 ON t1.team_api_id = t2.team_api_id WHERE t1.team_long_name = 'Heart of Midlothian'",
        "csc-7b_sql.json.csv": "SELECT AVG(BUILDUPPLAYSPEED) FROM TEAM_ATTRIBUTES WHERE TEAM_FIFA_API_ID IN (SELECT TEAM_FIFA_API_ID FROM TEAM WHERE TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN')",
        "slm_sql.json.csv": "SELECT AVG(T2.BUILDUPPLAYSPEED) FROM TEAM AS T1 INNER JOIN TEAM_ATTRIBUTES AS T2 ON T1.TEAM_FIFA_API_ID = T2.TEAM_FIFA_API_ID WHERE T1.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "csc-32b_sql.json.csv": "SELECT AVG(BUILDUPPLAYSPEED) FROM TEAM_ATTRIBUTES JOIN TEAM ON TEAM_ATTRIBUTES.TEAM_API_ID = TEAM.TEAM_API_ID WHERE TEAM.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T2.BUILDUPPLAYSPEED) FROM TEAM AS T1 INNER JOIN TEAM_ATTRIBUTES AS T2 ON T1.TEAM_API_ID = T2.TEAM_API_ID WHERE T1.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "alpha_sql.json.csv": "SELECT AVG(TEAM_ATTRIBUTES.BUILDUPPLAYSPEED) FROM TEAM INNER JOIN TEAM_ATTRIBUTES ON TEAM.TEAM_API_ID = TEAM_ATTRIBUTES.TEAM_API_ID WHERE TEAM.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "gsr_sql.json.csv": "SELECT AVG(CAST(BUILDUPPLAYSPEED AS FLOAT)) FROM TEAM_ATTRIBUTES JOIN TEAM ON TEAM_ATTRIBUTES.TEAM_API_ID = TEAM.TEAM_API_ID WHERE TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN';",
        "chess_sql.json.csv": "SELECT AVG(T2.BUILDUPPLAYSPEED) FROM TEAM AS T1 INNER JOIN TEAM_ATTRIBUTES AS T2 ON T1.TEAM_FIFA_API_ID = T2.TEAM_FIFA_API_ID WHERE T1.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "rsl_sql.json.csv": "SELECT AVG(TEAM_ATTRIBUTES.BUILDUPPLAYSPEED) FROM TEAM INNER JOIN TEAM_ATTRIBUTES ON TEAM.TEAM_API_ID = TEAM_ATTRIBUTES.TEAM_API_ID WHERE TEAM.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(TA.BUILDUPPLAYSPEED) AS AVERAGE_BUILDUPPLAYSPEED FROM TEAM AS T INNER JOIN TEAM_ATTRIBUTES AS TA ON T.TEAM_FIFA_API_ID = TA.TEAM_FIFA_API_ID WHERE T.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T2.BUILDUPPLAYSPEED) FROM TEAM AS T1 INNER JOIN TEAM_ATTRIBUTES AS T2 ON T1.TEAM_API_ID = T2.TEAM_API_ID WHERE T1.TEAM_LONG_NAME = 'HEART OF MIDLOTHIAN'"
    },
	"1096": {
                "question_id": "1096",
		"analyze": "average computed incorrectly when denominator contains NULL",
 "question": "Calculate the average overall rating of Pietro Marino.",
        "evidence": "Pietro Marino refers to player_name = 'Pietro Marino'; average overall rating AVG(T1.overall_rating)",
        "SQL": "SELECT CAST(SUM(t2.overall_rating) AS REAL) / COUNT(t2.id) FROM Player AS t1 INNER JOIN Player_Attributes AS t2 ON t1.player_api_id = t2.player_api_id WHERE t1.player_name = 'Pietro Marino'",
        "csc-7b_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'PIETRO MARINO'",
        "slm_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) AS AVERAGE_OVERALL_RATING FROM PLAYER AS T2 INNER JOIN PLAYER_ATTRIBUTES AS T1 ON T2.PLAYER_API_ID = T1.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'",
        "csc-32b_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'",
        "alpha_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'PIETRO MARINO'",
        "gsr_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES T1 JOIN PLAYER T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO';",
        "chess_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_FIFA_API_ID = T2.PLAYER_FIFA_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'",
        "rsl_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(T2.OVERALL_RATING) AS AVERAGE_OVERALL_RATING FROM PLAYER AS T1 INNER JOIN PLAYER_ATTRIBUTES AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T1.PLAYER_NAME = 'PIETRO MARINO';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T1.OVERALL_RATING) FROM PLAYER_ATTRIBUTES AS T1 INNER JOIN PLAYER AS T2 ON T1.PLAYER_API_ID = T2.PLAYER_API_ID WHERE T2.PLAYER_NAME = 'PIETRO MARINO'"
    },        
	
	"1101": {
        "question_id": "1101",
		"analyze": "average computed incorrectly when denominator contains NULL",
         "question": "What is the average number of goals made by Parma as the away team while playing in Italy?",
        "evidence": "Parma refers to team_long_name = 'Parma'; average number of goals refers to AVG(away_team_goal)",
        "SQL": "SELECT CAST(SUM(T1.away_team_goal) AS REAL) / COUNT(T1.id) FROM \"Match\" AS T1 INNER JOIN TEAM AS T2 ON T1.away_team_api_id = T2.team_api_id INNER JOIN Country AS T3 ON T1.country_id = T3.id WHERE T2.team_long_name = 'Parma' AND T3.name = 'Italy'",
        "csc-7b_sql.json.csv": "SELECT AVG(T1.AWAY_TEAM_GOAL) FROM MATCH AS T1 INNER JOIN TEAM AS T2 ON T2.TEAM_API_ID = T1.AWAY_TEAM_API_ID INNER JOIN LEAGUE AS T3 ON T3.ID = T1.LEAGUE_ID INNER JOIN COUNTRY AS T4 ON T4.ID = T3.COUNTRY_ID WHERE T2.TEAM_LONG_NAME = 'PARMA' AND T4.NAME = 'ITALY'",
        "slm_sql.json.csv": "SELECT AVG(M.AWAY_TEAM_GOAL) AS AVG_GOALS FROM TEAM AS T INNER JOIN MATCH AS M ON T.TEAM_API_ID = M.AWAY_TEAM_API_ID INNER JOIN COUNTRY AS C ON M.COUNTRY_ID = C.ID WHERE T.TEAM_LONG_NAME = 'PARMA' AND C.NAME = 'ITALY'",
        "csc-32b_sql.json.csv": "SELECT AVG(M.AWAY_TEAM_GOAL) AS AVERAGE_GOALS FROM MATCH M JOIN TEAM T ON M.AWAY_TEAM_API_ID = T.TEAM_API_ID WHERE T.TEAM_LONG_NAME = 'PARMA' AND M.COUNTRY_ID = (SELECT ID FROM COUNTRY WHERE NAME = 'ITALY')",
        "gena_submission_2_sql.json.csv": "SELECT AVG(T1.AWAY_TEAM_GOAL) FROM MATCH AS T1 INNER JOIN COUNTRY AS T2 ON T1.COUNTRY_ID = T2.ID INNER JOIN TEAM AS T3 ON T1.AWAY_TEAM_API_ID = T3.TEAM_API_ID WHERE T3.TEAM_LONG_NAME = 'PARMA' AND T2.NAME = 'ITALY'",
        "alpha_sql.json.csv": "SELECT AVG(MATCH.AWAY_TEAM_GOAL) AS AVERAGE_AWAY_GOALS FROM COUNTRY INNER JOIN MATCH ON COUNTRY.ID = MATCH.COUNTRY_ID INNER JOIN TEAM ON MATCH.AWAY_TEAM_API_ID = TEAM.TEAM_API_ID WHERE COUNTRY.NAME = 'ITALY' AND TEAM.TEAM_LONG_NAME = 'PARMA'",
        "gsr_sql.json.csv": "SELECT AVG(MATCH.AWAY_TEAM_GOAL) FROM MATCH JOIN TEAM ON MATCH.AWAY_TEAM_API_ID = TEAM.TEAM_API_ID JOIN LEAGUE ON MATCH.LEAGUE_ID = LEAGUE.ID JOIN COUNTRY ON LEAGUE.COUNTRY_ID = COUNTRY.ID WHERE TEAM.TEAM_LONG_NAME = 'PARMA' AND COUNTRY.NAME = 'ITALY';",
        "chess_sql.json.csv": "SELECT AVG(T3.AWAY_TEAM_GOAL) FROM TEAM AS T1 INNER JOIN MATCH AS T3 ON T1.TEAM_API_ID = T3.AWAY_TEAM_API_ID INNER JOIN COUNTRY AS T2 ON T3.COUNTRY_ID = T2.ID WHERE T1.TEAM_LONG_NAME = 'PARMA' AND T2.NAME = 'ITALY'",
        "rsl_sql.json.csv": "SELECT AVG(MATCH.AWAY_TEAM_GOAL) FROM MATCH INNER JOIN TEAM ON MATCH.AWAY_TEAM_API_ID = TEAM.TEAM_API_ID INNER JOIN COUNTRY ON MATCH.COUNTRY_ID = COUNTRY.ID WHERE TEAM.TEAM_LONG_NAME = 'PARMA' AND COUNTRY.NAME = 'ITALY'",
        "omni-32-majority_sql.json.csv": "SELECT AVG(M.AWAY_TEAM_GOAL) AS AVERAGE_GOALS FROM TEAM AS T INNER JOIN MATCH AS M ON T.TEAM_API_ID = M.AWAY_TEAM_API_ID INNER JOIN LEAGUE AS L ON M.LEAGUE_ID = L.ID INNER JOIN COUNTRY AS C ON L.COUNTRY_ID = C.ID WHERE T.TEAM_LONG_NAME = 'PARMA' AND C.NAME = 'ITALY';",
        "gena_submission_1_sql.json.csv": "SELECT AVG(T1.AWAY_TEAM_GOAL) FROM MATCH AS T1 INNER JOIN COUNTRY AS T2 ON T1.COUNTRY_ID = T2.ID INNER JOIN TEAM AS T3 ON T1.AWAY_TEAM_API_ID = T3.TEAM_API_ID WHERE T3.TEAM_LONG_NAME = 'PARMA' AND T2.NAME = 'ITALY'"
    },
	"1183": {
        "question_id": "1183",
		"analyze": "Should return EXAMINATION.diagnosis.",
 "question": "For the patient who was diagnosed SLE on 1997/1/27, what was his/her original diagnose when he/she came to the hospital for the first time?",
        "evidence": "'SLE' AND original diagnose refers to diagnosis; 1997/1/27 refer to `Examination Date` = '1997-01-27'; first came to the hospital refers to patient.`First Date`",
        "SQL": "SELECT T1.Diagnosis FROM Patient AS T1 INNER JOIN Examination AS T2 ON T1.ID = T2.ID WHERE T1.ID = ( SELECT ID FROM Examination WHERE `Examination Date` = '1997-01-27' AND Diagnosis = 'SLE' ) AND T2.`Examination Date` = T1.`First Date`",
        "csc-7b_sql.json.csv": "SELECT T2.DIAGNOSIS FROM EXAMINATION AS T1 INNER JOIN PATIENT AS T2 ON T1.ID = T2.ID WHERE T1.EXAMINATION_DATE = '1997-01-27' AND T2.DIAGNOSIS = 'SLE' ORDER BY T2.FIRST_DATE ASC LIMIT 1",
        "slm_sql.json.csv": "SELECT PATIENT.DIAGNOSIS FROM EXAMINATION INNER JOIN PATIENT ON EXAMINATION.ID = PATIENT.ID WHERE EXAMINATION.EXAMINATION_DATE = '1997-01-27' AND PATIENT.DIAGNOSIS = 'SLE'",
        "csc-32b_sql.json.csv": "SELECT T2.DIAGNOSIS FROM EXAMINATION AS T1 INNER JOIN PATIENT AS T2 ON T1.ID = T2.ID WHERE T1.DIAGNOSIS = 'SLE' AND T1.EXAMINATION_DATE = '1997-01-27'",
        "gena_submission_2_sql.json.csv": "SELECT T1.DIAGNOSIS FROM PATIENT AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T2.EXAMINATION_DATE = '1997-01-27' AND T2.DIAGNOSIS = 'SLE'",
        "alpha_sql.json.csv": "SELECT DISTINCT PATIENT.DIAGNOSIS FROM PATIENT INNER JOIN EXAMINATION ON PATIENT.ID = EXAMINATION.ID WHERE EXAMINATION.EXAMINATION_DATE = '1997-01-27' AND EXAMINATION.DIAGNOSIS = 'SLE'",
        "gsr_sql.json.csv": "SELECT P.DIAGNOSIS FROM PATIENT P JOIN EXAMINATION E ON P.ID = E.ID WHERE E.DIAGNOSIS = 'SLE' AND E.EXAMINATION_DATE = '1997-01-27' ORDER BY P.FIRST_DATE LIMIT 1;",
        "chess_sql.json.csv": "SELECT T1.DIAGNOSIS FROM PATIENT AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T2.EXAMINATION_DATE = '1997-01-27' AND T2.DIAGNOSIS = 'SLE'",
        "rsl_sql.json.csv": "SELECT PATIENT.DIAGNOSIS FROM PATIENT INNER JOIN EXAMINATION ON PATIENT.ID = EXAMINATION.ID WHERE EXAMINATION.DIAGNOSIS = 'SLE' AND EXAMINATION.EXAMINATION_DATE = '1997-01-27'",
        "omni-32-majority_sql.json.csv": "SELECT PATIENT.DIAGNOSIS FROM PATIENT INNER JOIN EXAMINATION ON PATIENT.ID = EXAMINATION.ID WHERE EXAMINATION.DIAGNOSIS = 'SLE' AND EXAMINATION.EXAMINATION_DATE = '1997-01-27';",
        "gena_submission_1_sql.json.csv": "SELECT T1.DIAGNOSIS FROM PATIENT AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T2.EXAMINATION_DATE = '1997-01-27' AND T2.DIAGNOSIS = 'SLE'"
    },
	"1263": {
        "question_id": "1263",
		"analyze": "Does not handle tie-breaking correctly.",
        "question": "Among the patients whose level of Hematoclit isn't normal, which patient has the highest anti-Cardiolipin antibody concentration? Please list his or her ID.",
        "evidence": "Hematoclit is normal refers to 29 < N < 52; highest anti-Cardiolipin antibody concentration refers to MAX(`aCL IgA`);",
        "SQL": "SELECT DISTINCT T1.ID FROM Patient AS T1 INNER JOIN Examination AS T2 ON T1.ID = T2.ID INNER JOIN Laboratory AS T3 on T1.ID = T3.ID WHERE (T3.HCT >= 52 OR T3.HCT <= 29) ORDER BY T2.`aCL IgA` DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T1.ID FROM LABORATORY AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T1.HCT NOT BETWEEN 29 AND 52 ORDER BY T2.ACL_IGA DESC LIMIT 1",
        "slm_sql.json.csv": "SELECT E.ID FROM EXAMINATION AS E INNER JOIN PATIENT AS P ON E.ID = P.ID INNER JOIN LABORATORY AS L ON P.ID = L.ID WHERE(L.ALB < 29 AND L.ALB > 52) OR(L.ALB IS NULL) GROUP BY E.ID ORDER BY MAX(E.ACL_IGA) DESC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT T2.ID FROM LABORATORY AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T1.HCT < 29 OR T1.HCT > 52 ORDER BY T2.ACL_IGA DESC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.ID FROM EXAMINATION AS T1 INNER JOIN LABORATORY AS T2 ON T1.ID = T2.ID WHERE T2.HCT < 29 OR T2.HCT > 52 ORDER BY T1.ACL_IGA DESC LIMIT 1",
        "chess_sql.json.csv": "SELECT T1.ID FROM LABORATORY AS T1 INNER JOIN EXAMINATION AS T2 ON T1.ID = T2.ID WHERE T1.HCT < 29 OR T1.HCT > 52 ORDER BY T2.ACL_IGA DESC LIMIT 1",
        "rsl_sql.json.csv": "SELECT PATIENT.ID FROM PATIENT INNER JOIN LABORATORY ON PATIENT.ID = LABORATORY.ID INNER JOIN EXAMINATION ON PATIENT.ID = EXAMINATION.ID WHERE (LABORATORY.HCT <= 29 OR LABORATORY.HCT >= 52) ORDER BY EXAMINATION.ACL_IGA DESC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT L.ID FROM LABORATORY AS L INNER JOIN EXAMINATION AS E ON L.ID = E.ID WHERE L.HCT <= 29 OR L.HCT >= 52 ORDER BY E.ACL_IGA DESC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.ID FROM EXAMINATION AS T1 INNER JOIN LABORATORY AS T2 ON T1.ID = T2.ID WHERE T2.HCT < 29 OR T2.HCT > 52 ORDER BY T1.ACL_IGA DESC LIMIT 1"
    },
	"1332": {
        "question_id": "1332",
		"analyze": "Extra filter on Gold SQL SUBSTR(T1.event_date, 6, 2) = '09'",
  "question": "How much did the Student_Club members spend on food in September Meeting?",
        "evidence": "amount spent refers to spent; spend on food in September Meeting refers to category = 'Food' where event_name = 'September Meeting'",
        "SQL": "SELECT T2.spent FROM event AS T1 INNER JOIN budget AS T2 ON T1.event_id = T2.link_to_event WHERE T1.event_name = 'September Meeting' AND T2.category = 'Food' AND SUBSTR(T1.event_date, 6, 2) = '09'",
        "csc-7b_sql.json.csv": "SELECT T1.SPENT FROM BUDGET AS T1 INNER JOIN EVENT AS T2 ON T1.LINK_TO_EVENT = T2.EVENT_ID WHERE T2.EVENT_NAME = 'SEPTEMBER MEETING' AND T1.CATEGORY = 'FOOD'",
        "slm_sql.json.csv": "SELECT SUM(B.SPENT) AS TOTAL_SPENT FROM BUDGET AS B INNER JOIN EVENT AS E ON B.LINK_TO_EVENT = E.EVENT_ID WHERE E.EVENT_NAME = 'SEPTEMBER MEETING' AND B.CATEGORY = 'FOOD'",
        "csc-32b_sql.json.csv": "SELECT SUM(B.SPENT) AS TOTAL_SPENT_ON_FOOD FROM BUDGET B JOIN EVENT E ON B.LINK_TO_EVENT = E.EVENT_ID WHERE B.CATEGORY = 'FOOD' AND E.EVENT_NAME = 'SEPTEMBER MEETING'",
        "gena_submission_2_sql.json.csv": "SELECT T1.SPENT FROM BUDGET AS T1 INNER JOIN EVENT AS T2 ON T1.LINK_TO_EVENT = T2.EVENT_ID WHERE T1.CATEGORY = 'FOOD' AND T2.EVENT_NAME = 'SEPTEMBER MEETING'",
        "alpha_sql.json.csv": "SELECT BUDGET.SPENT FROM BUDGET INNER JOIN EVENT ON BUDGET.LINK_TO_EVENT = EVENT.EVENT_ID WHERE EVENT.EVENT_NAME = 'SEPTEMBER MEETING' AND BUDGET.CATEGORY = 'FOOD'",
        "gsr_sql.json.csv": "SELECT SPENT FROM BUDGET JOIN EVENT ON BUDGET.LINK_TO_EVENT = EVENT.EVENT_ID WHERE BUDGET.CATEGORY = 'FOOD' AND EVENT.EVENT_NAME = 'SEPTEMBER MEETING';",
        "chess_sql.json.csv": "SELECT SUM(T2.SPENT) FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.EVENT_NAME = 'SEPTEMBER MEETING' AND T2.CATEGORY = 'FOOD'",
        "rsl_sql.json.csv": "SELECT SUM(BUDGET.SPENT) FROM EVENT INNER JOIN BUDGET ON EVENT.EVENT_ID = BUDGET.LINK_TO_EVENT WHERE EVENT.EVENT_NAME = 'SEPTEMBER MEETING' AND BUDGET.CATEGORY = 'FOOD'",
        "omni-32-majority_sql.json.csv": "SELECT SUM(B.SPENT) AS TOTAL_SPENT_ON_FOOD FROM EVENT AS E INNER JOIN BUDGET AS B ON E.EVENT_ID = B.LINK_TO_EVENT WHERE E.EVENT_NAME = 'SEPTEMBER MEETING' AND B.CATEGORY = 'FOOD';",
        "gena_submission_1_sql.json.csv": "SELECT T1.SPENT FROM BUDGET AS T1 INNER JOIN EVENT AS T2 ON T1.LINK_TO_EVENT = T2.EVENT_ID WHERE T1.CATEGORY = 'FOOD' AND T2.EVENT_NAME = 'SEPTEMBER MEETING'"
    },        
	"1335": {
                "question_id": "1335",
		"analyze": "Extra filter on Gold SQL SUBSTR(T1.event_date, 6, 2) = '09'",
  "question": "How much did the Student_Club members spend on advertisement in September Meeting?",
        "evidence": "amount spent refers to spent; spend on food in September Meeting refers to category = 'Advertisement' where event_name = 'September Meeting'",
        "SQL": "SELECT T2.spent FROM event AS T1 INNER JOIN budget AS T2 ON T1.event_id = T2.link_to_event WHERE T1.event_name = 'September Meeting' AND T2.category = 'Advertisement' AND SUBSTR(T1.event_date, 6, 2) = '09'",
        "csc-7b_sql.json.csv": "SELECT SUM(T2.SPENT) FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.EVENT_NAME = 'SEPTEMBER MEETING' AND T2.CATEGORY = 'ADVERTISEMENT'",
        "slm_sql.json.csv": "SELECT SUM(B.SPENT) FROM BUDGET AS B INNER JOIN EVENT AS E ON B.LINK_TO_EVENT = E.EVENT_ID WHERE B.CATEGORY = 'ADVERTISEMENT' AND E.EVENT_NAME = 'SEPTEMBER MEETING'",
        "csc-32b_sql.json.csv": "SELECT B.SPENT FROM BUDGET B JOIN EVENT E ON B.LINK_TO_EVENT = E.EVENT_ID WHERE E.EVENT_NAME = 'SEPTEMBER MEETING' AND B.CATEGORY = 'ADVERTISEMENT'",
        "gena_submission_2_sql.json.csv": "SELECT T2.SPENT FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.EVENT_NAME = 'SEPTEMBER MEETING' AND T2.CATEGORY = 'ADVERTISEMENT'",
        "alpha_sql.json.csv": "SELECT BUDGET.SPENT FROM BUDGET INNER JOIN EVENT ON BUDGET.LINK_TO_EVENT = EVENT.EVENT_ID WHERE BUDGET.CATEGORY = 'ADVERTISEMENT' AND EVENT.EVENT_NAME = 'SEPTEMBER MEETING'",
        "gsr_sql.json.csv": "SELECT SPENT FROM BUDGET JOIN EVENT ON BUDGET.LINK_TO_EVENT = EVENT.EVENT_ID WHERE CATEGORY = 'ADVERTISEMENT' AND EVENT_NAME = 'SEPTEMBER MEETING';",
        "chess_sql.json.csv": "SELECT SUM(T2.SPENT) FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.EVENT_NAME = 'SEPTEMBER MEETING' AND T2.CATEGORY = 'ADVERTISEMENT'",
        "rsl_sql.json.csv": "SELECT SUM(BUDGET.SPENT) FROM BUDGET INNER JOIN EVENT ON BUDGET.LINK_TO_EVENT = EVENT.EVENT_ID WHERE BUDGET.CATEGORY = 'ADVERTISEMENT' AND EVENT.EVENT_NAME = 'SEPTEMBER MEETING'",
        "omni-32-majority_sql.json.csv": "SELECT SUM(B.SPENT) AS TOTAL_SPENT FROM BUDGET AS B INNER JOIN EVENT AS E ON B.LINK_TO_EVENT = E.EVENT_ID WHERE B.CATEGORY = 'ADVERTISEMENT' AND E.EVENT_NAME = 'SEPTEMBER MEETING';",
        "gena_submission_1_sql.json.csv": "SELECT T1.SPENT FROM BUDGET AS T1 INNER JOIN EVENT AS T2 ON T1.LINK_TO_EVENT = T2.EVENT_ID WHERE T1.CATEGORY = 'ADVERTISEMENT' AND T2.EVENT_NAME = 'SEPTEMBER MEETING'"
    },        

	"1403": {
                "question_id": "1403",
		"analyze": "Gold SQL use filters on Expense instead of Event",
"question": "Indicate the name of the closed event whose cost has exceeded the budget the most.",
        "evidence": "closed events refers to event_name where status = 'Closed'; exceed the budget the most refers to MIN(remaining) where remaining < 0",
        "SQL": "SELECT T2.event_name FROM budget AS T1 INNER JOIN event AS T2 ON T2.event_id = T1.link_to_event WHERE T1.event_status = 'Closed' AND T1.remaining < 0 ORDER BY T1.remaining LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T2.EVENT_NAME FROM BUDGET AS T1 INNER JOIN EVENT AS T2 ON T1.LINK_TO_EVENT = T2.EVENT_ID WHERE T2.STATUS = 'CLOSED' AND T1.REMAINING < 0 ORDER BY T1.REMAINING ASC LIMIT 1",
        "slm_sql.json.csv": "SELECT EVENT.EVENT_NAME FROM EVENT INNER JOIN BUDGET ON EVENT.EVENT_ID = BUDGET.LINK_TO_EVENT WHERE BUDGET.REMAINING < 0 AND EVENT.STATUS = 'CLOSED' ORDER BY BUDGET.REMAINING ASC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT T1.EVENT_NAME FROM EVENT AS T1 JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.STATUS = 'CLOSED' AND T2.REMAINING < 0 ORDER BY T2.REMAINING ASC LIMIT 1",
        "gena_submission_2_sql.json.csv": "SELECT T1.EVENT_NAME FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.STATUS = 'CLOSED' ORDER BY T2.REMAINING LIMIT 1",
        "alpha_sql.json.csv": "SELECT E.EVENT_NAME FROM EVENT AS E INNER JOIN BUDGET AS B ON E.EVENT_ID = B.LINK_TO_EVENT WHERE E.STATUS = 'CLOSED' AND B.REMAINING < 0 ORDER BY B.REMAINING ASC LIMIT 1",
        "gsr_sql.json.csv": "SELECT EVENT_NAME FROM EVENT JOIN BUDGET ON EVENT.EVENT_ID = BUDGET.LINK_TO_EVENT WHERE STATUS = 'CLOSED' AND REMAINING < 0 ORDER BY REMAINING ASC LIMIT 1;",
        "chess_sql.json.csv": "SELECT T1.EVENT_NAME FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.STATUS = 'CLOSED' ORDER BY T2.REMAINING ASC LIMIT 1",
        "rsl_sql.json.csv": "SELECT EVENT.EVENT_NAME FROM EVENT INNER JOIN BUDGET ON EVENT.EVENT_ID = BUDGET.LINK_TO_EVENT WHERE EVENT.STATUS = 'CLOSED' AND BUDGET.REMAINING < 0 ORDER BY BUDGET.REMAINING ASC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT EVENT.EVENT_NAME FROM EVENT INNER JOIN BUDGET ON EVENT.EVENT_ID = BUDGET.LINK_TO_EVENT WHERE EVENT.STATUS = 'CLOSED' AND BUDGET.REMAINING < 0 ORDER BY BUDGET.REMAINING ASC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.EVENT_NAME FROM EVENT AS T1 INNER JOIN BUDGET AS T2 ON T1.EVENT_ID = T2.LINK_TO_EVENT WHERE T1.STATUS = 'CLOSED' ORDER BY T2.REMAINING LIMIT 1"        
	},

	"1426": {
        "question_id": "1426",
		"analyze": "Extra filter 'Member'.",
        "question": "List the last name of members with a major in environmental engineering and include its department and college name.",
        "evidence": "'Environmental Engineering' is the major_name;",
        "SQL": "SELECT T2.last_name, T1.department, T1.college FROM major AS T1 INNER JOIN member AS T2 ON T1.major_id = T2.link_to_major WHERE T2.position = 'Member' AND T1.major_name = 'Environmental Engineering'",
        "csc-7b_sql.json.csv": "SELECT T1.LAST_NAME, T2.DEPARTMENT, T2.COLLEGE FROM MEMBER AS T1 JOIN MAJOR AS T2 ON T1.LINK_TO_MAJOR = T2.MAJOR_ID WHERE T2.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "slm_sql.json.csv": "SELECT MEMBER.LAST_NAME, MAJOR.DEPARTMENT, MAJOR.COLLEGE FROM MEMBER INNER JOIN MAJOR ON MEMBER.LINK_TO_MAJOR = MAJOR.MAJOR_ID WHERE MAJOR.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "csc-32b_sql.json.csv": "SELECT T1.LAST_NAME, T2.DEPARTMENT, T2.COLLEGE FROM MEMBER AS T1 INNER JOIN MAJOR AS T2 ON T1.LINK_TO_MAJOR = T2.MAJOR_ID WHERE T2.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "gena_submission_2_sql.json.csv": "SELECT T1.LAST_NAME, T2.DEPARTMENT, T2.COLLEGE FROM MEMBER AS T1 INNER JOIN MAJOR AS T2 ON T1.LINK_TO_MAJOR = T2.MAJOR_ID WHERE T2.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING';",
        "alpha_sql.json.csv": "SELECT MEMBER.LAST_NAME, MAJOR.DEPARTMENT, MAJOR.COLLEGE FROM MEMBER INNER JOIN MAJOR ON MEMBER.LINK_TO_MAJOR = MAJOR.MAJOR_ID WHERE MAJOR.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "gsr_sql.json.csv": "SELECT M.LAST_NAME, MAJ.DEPARTMENT, MAJ.COLLEGE FROM MEMBER M JOIN MAJOR MAJ ON M.LINK_TO_MAJOR = MAJ.MAJOR_ID WHERE MAJ.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING';",
        "chess_sql.json.csv": "SELECT T1.LAST_NAME, T2.DEPARTMENT, T2.COLLEGE FROM MEMBER AS T1 INNER JOIN MAJOR AS T2 ON T1.LINK_TO_MAJOR = T2.MAJOR_ID WHERE T2.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "rsl_sql.json.csv": "SELECT MEMBER.LAST_NAME, MAJOR.DEPARTMENT, MAJOR.COLLEGE FROM MEMBER INNER JOIN MAJOR ON MEMBER.LINK_TO_MAJOR = MAJOR.MAJOR_ID WHERE MAJOR.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'",
        "omni-32-majority_sql.json.csv": "SELECT MEMBER.LAST_NAME, MAJOR.DEPARTMENT, MAJOR.COLLEGE FROM MEMBER INNER JOIN MAJOR ON MEMBER.LINK_TO_MAJOR = MAJOR.MAJOR_ID WHERE MAJOR.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING';",
        "gena_submission_1_sql.json.csv": "SELECT T1.LAST_NAME, T2.DEPARTMENT, T2.COLLEGE FROM MEMBER AS T1 INNER JOIN MAJOR AS T2 ON T1.LINK_TO_MAJOR = T2.MAJOR_ID WHERE T2.MAJOR_NAME = 'ENVIRONMENTAL ENGINEERING'"
        
	},
	"1509": {
        "question_id": "1509",

		"analyze": "Does not take into account NULL id.",
        "question": "Among the transactions made in the gas stations in the Czech Republic, how many of them are taken place after 2012/1/1?",
        "evidence": "Czech Republic can be represented as the Country value in the gasstations table is 'CZE'",
        "SQL": "SELECT COUNT(T1.TransactionID) FROM transactions_1k AS T1 INNER JOIN gasstations AS T2 ON T1.GasStationID = T2.GasStationID WHERE T2.Country = 'CZE' AND STRFTIME('%Y', T1.Date) >= '2012'",
        "csc-7b_sql.json.csv": "SELECT COUNT(*) FROM TRANSACTIONS_1K AS T1 JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.COUNTRY = 'CZE' AND T1.DATE > '2012-01-01'",
        "slm_sql.json.csv": "SELECT COUNT(*) AS TOTALTRANSACTIONS FROM TRANSACTIONS_1K AS T INNER JOIN GASSTATIONS AS G ON T.GASSTATIONID = G.GASSTATIONID WHERE G.COUNTRY = 'CZE' AND T.DATE > '2012-01-01'",
        "csc-32b_sql.json.csv": "SELECT COUNT(*) FROM TRANSACTIONS_1K T JOIN GASSTATIONS G ON T.GASSTATIONID = G.GASSTATIONID WHERE G.COUNTRY = 'CZE' AND T.DATE > '2012-01-01'",
        "gena_submission_2_sql.json.csv": "SELECT COUNT(*) FROM TRANSACTIONS_1K AS T1 INNER JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.COUNTRY = 'CZE' AND T1.DATE > '2012-01-01'",
        "alpha_sql.json.csv": "SELECT COUNT(TRANSACTIONID) FROM TRANSACTIONS_1K INNER JOIN GASSTATIONS ON TRANSACTIONS_1K.GASSTATIONID = GASSTATIONS.GASSTATIONID WHERE DATE > '2012-01-01' AND GASSTATIONS.COUNTRY = 'CZE'",
        "gsr_sql.json.csv": "SELECT COUNT(*) FROM TRANSACTIONS_1K T JOIN GASSTATIONS G ON T.GASSTATIONID = G.GASSTATIONID WHERE G.COUNTRY = 'CZE' AND T.DATE > '2012-01-01';",
        "chess_sql.json.csv": "SELECT COUNT(T1.GASSTATIONID) FROM GASSTATIONS AS T1 INNER JOIN TRANSACTIONS_1K AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T1.COUNTRY = 'CZE' AND T2.DATE > '2012-01-01'",
        "rsl_sql.json.csv": "SELECT COUNT(T1.TRANSACTIONID) FROM TRANSACTIONS_1K AS T1 INNER JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.COUNTRY = 'CZE' AND T1.DATE > '2012-01-01'",
        "omni-32-majority_sql.json.csv": "SELECT COUNT(T.TRANSACTIONID) AS TRANSACTIONCOUNT FROM TRANSACTIONS_1K AS T INNER JOIN GASSTATIONS AS G ON T.GASSTATIONID = G.GASSTATIONID WHERE G.COUNTRY = 'CZE' AND T.DATE > '2012-01-01';",
        "gena_submission_1_sql.json.csv": "SELECT COUNT(*) FROM TRANSACTIONS_1K AS T1 INNER JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.COUNTRY = 'CZE' AND T1.DATE > '2012-01-01'"        
	},
	"1513": {
                "question_id": "1513",
		"analyze": "Gold SQL gives the latest paid customer not the earliest paid customer.",
            "question": "Which country's gas station had the first paid cusomer in 2012/8/25?",
        "evidence": "'2012/8/25' can be represented by '2012-08-25'",
        "SQL": "SELECT T2.Country FROM transactions_1k AS T1 INNER JOIN gasstations AS T2 ON T1.GasStationID = T2.GasStationID WHERE T1.Date = '2012-08-25' ORDER BY T1.Time DESC LIMIT 1",
        "csc-7b_sql.json.csv": "SELECT T2.COUNTRY FROM TRANSACTIONS_1K AS T1 INNER JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T1.DATE = '2012-08-25' ORDER BY T1.TIME ASC LIMIT 1",
        "slm_sql.json.csv": "SELECT GASSTATIONS.COUNTRY FROM TRANSACTIONS_1K INNER JOIN GASSTATIONS ON TRANSACTIONS_1K.GASSTATIONID = GASSTATIONS.GASSTATIONID WHERE TRANSACTIONS_1K.DATE = '2012-08-25' ORDER BY TRANSACTIONS_1K.CUSTOMERID ASC LIMIT 1",
        "csc-32b_sql.json.csv": "SELECT G.COUNTRY FROM GASSTATIONS G JOIN (SELECT GASSTATIONID FROM TRANSACTIONS_1K WHERE DATE = '2012-08-25' ORDER BY TIME ASC LIMIT 1) T ON G.GASSTATIONID = T.GASSTATIONID",
        "gena_submission_2_sql.json.csv": "SELECT T1.COUNTRY FROM GASSTATIONS AS T1 INNER JOIN TRANSACTIONS_1K AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.DATE = '2012-08-25' LIMIT 1",
        "alpha_sql.json.csv": "SELECT GASSTATIONS.COUNTRY FROM TRANSACTIONS_1K INNER JOIN GASSTATIONS ON TRANSACTIONS_1K.GASSTATIONID = GASSTATIONS.GASSTATIONID WHERE TRANSACTIONS_1K.DATE = '2012-08-25' ORDER BY TRANSACTIONS_1K.TRANSACTIONID ASC LIMIT 1",
        "gsr_sql.json.csv": "SELECT G.COUNTRY FROM TRANSACTIONS_1K T JOIN GASSTATIONS G ON T.GASSTATIONID = G.GASSTATIONID WHERE T.DATE = '2012-08-25' ORDER BY T.TIME LIMIT 1;",
        "chess_sql.json.csv": "SELECT T2.COUNTRY FROM TRANSACTIONS_1K AS T1 INNER JOIN GASSTATIONS AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T1.DATE = '2012-08-25' ORDER BY T1.TIME ASC LIMIT 1",
        "rsl_sql.json.csv": "SELECT GASSTATIONS.COUNTRY FROM TRANSACTIONS_1K INNER JOIN GASSTATIONS ON TRANSACTIONS_1K.GASSTATIONID = GASSTATIONS.GASSTATIONID WHERE TRANSACTIONS_1K.DATE = '2012-08-25' ORDER BY TRANSACTIONS_1K.TIME ASC LIMIT 1",
        "omni-32-majority_sql.json.csv": "SELECT G.COUNTRY FROM TRANSACTIONS_1K T INNER JOIN GASSTATIONS G ON T.GASSTATIONID = G.GASSTATIONID WHERE T.DATE = '2012-08-25' AND T.PRICE > 0 ORDER BY T.TIME ASC LIMIT 1;",
        "gena_submission_1_sql.json.csv": "SELECT T1.COUNTRY FROM GASSTATIONS AS T1 INNER JOIN TRANSACTIONS_1K AS T2 ON T1.GASSTATIONID = T2.GASSTATIONID WHERE T2.DATE = '2012-08-25' LIMIT 1"
    
	}
}
