{
    "macsql": {
        "900aceb61a32bfdb6cf3e6ece9597284": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "provide marital status as well as preferred language of the patient with patient id 2560.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"MARITAL_STATUS\",DEMOGRAPHIC.\"LANGUAGE\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"2560\"",
            "pred_sql": "SELECT `MARITAL_STATUS`, `LANGUAGE` FROM `DEMOGRAPHIC` WHERE `SUBJECT_ID` = 2560 AND `MARITAL_STATUS` IS NOT NULL AND `LANGUAGE` IS NOT NULL",
            "gold_answer": "[['None', 'None']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces additional WHERE conditions (`MARITAL_STATUS IS NOT NULL AND LANGUAGE IS NOT NULL`) that filter out the only row (which has both fields as NULL), whereas the ground truth simply selects the values (even if NULL). This mistake lies solely in the WHERE clause by adding extra filters, and can be fixed by removing those conditions without changing the overall query structure or table relationships.",
            "error_type": "Local: incorrect WHERE condition"
        },
        "0d0a62ed7c9bd62e584c9f5b260d9ea0": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "on which date did the patient with patient id 24425 die?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DOD\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"24425\"",
            "pred_sql": "SELECT DOD FROM DEMOGRAPHIC WHERE SUBJECT_ID = 24425 AND EXPIRE_FLAG = 1 AND DOD IS NOT NULL LIMIT 1",
            "gold_answer": "[['None']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query adds extra WHERE conditions (EXPIRE_FLAG = 1, DOD IS NOT NULL) and a LIMIT clause, which changes the intended result by over\u2010filtering. The structure of the query (SELECT from DEMOGRAPHIC, filtering by SUBJECT_ID) remains the same, and the error lies solely in the added conditions. This is a localized mistake in the WHERE clause, not a flaw in the overall query logic or joins.",
            "error_type": "Local: incorrect-filter error"
        },
        "814b08ced5bf2cfc63c311dd93979199": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "give me the number of urgent hospital admission patients who have replaced route of drug administration. (Values: URGENT, REPLACE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"URGENT\" AND PRESCRIPTIONS.\"ROUTE\" = \"REPLACE\"",
            "pred_sql": "SELECT COUNT(DISTINCT T1.`SUBJECT_ID`, T1.`HADM_ID`) FROM ( SELECT DISTINCT `SUBJECT_ID`, `HADM_ID` FROM DEMOGRAPHIC WHERE `ADMISSION_TYPE` = 'URGENT' ) AS T1 INNER JOIN ( SELECT DISTINCT `SUBJECT_ID`, `HADM_ID` FROM PRESCRIPTIONS WHERE `ROUTE` = 'REPLACE' ) AS T2 ON T1.`SUBJECT_ID` = T2.`SUBJECT_ID` AND T1.`HADM_ID` = T2.`HADM_ID`",
            "gold_answer": "[['0.0']]",
            "pred_answer": "wrong number of arguments to function COUNT()",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses COUNT(DISTINCT T1.SUBJECT_ID, T1.HADM_ID), which is invalid in SQLite (only a single expression is allowed in COUNT(DISTINCT)). This is a localized syntax error in the SELECT clause\u2019s aggregate function and does not reflect a flawed table relationship or overall query logic.",
            "error_type": "Local: aggregate-function syntax error"
        },
        "9193bc2c5d90be4e199fc6a421133f88": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "Calculate the number of patients admitted to emergency who had an ld body fluid test by lab (Values: EMERGENCY, LD, Body Fluid)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND LAB.\"LABEL\" = \"LD, Body Fluid\"",
            "pred_sql": "SELECT COUNT(DISTINCT T1.`SUBJECT_ID`) FROM ( SELECT `SUBJECT_ID`, `HADM_ID` FROM DEMOGRAPHIC WHERE `ADMISSION_TYPE` = 'EMERGENCY' ) AS T1 INNER JOIN ( SELECT `SUBJECT_ID`, `HADM_ID` FROM LAB WHERE `LABEL` LIKE '%LD%' AND `FLUID` = 'Body Fluid' ) AS T2 ON T1.`SUBJECT_ID` = T2.`SUBJECT_ID` AND T1.`HADM_ID` = T2.`HADM_ID`",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only mis-filters the lab records: it breaks the single LABEL = 'LD, Body Fluid' test into LABEL LIKE '%LD%' AND FLUID = 'Body Fluid'. This is a WHERE-clause value/condition mistake, not a structural or multi-clause logic error. It can be fixed by restoring the exact equality check on LABEL. Therefore this is a localized filter error.",
            "error_type": "Local: value parsing error"
        },
        "85d8a21277604d575ed70aa8589ef037": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "which language does the patient charles deshay prefer? (Values: Charles Deshay)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"LANGUAGE\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Charles Deshay\"",
            "pred_sql": "SELECT LANGUAGE FROM DEMOGRAPHIC WHERE NAME = 'Charles Deshay' AND LANGUAGE IS NOT NULL",
            "gold_answer": "[['None']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query only differs from the ground truth by adding the extra condition AND LANGUAGE IS NOT NULL in the WHERE clause. This is a mistake localized to the WHERE clause and does not change the overall query structure or table relationships. It filters out the only row (where LANGUAGE is None), resulting in no output. Therefore, this is a local error in the WHERE filter.",
            "error_type": "Local: extra WHERE condition"
        }
    },
    "codes": {
        "829b1b9874d4849cb5c8f0fbabd0373e": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "count the number of government health insurance patients who had wbc, joint fluid lab test. (Values: Government, WBC, Joint Fluid)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"INSURANCE\" = \"Government\" AND LAB.\"LABEL\" = \"WBC, Joint Fluid\"",
            "pred_sql": "SELECT count(DISTINCT demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.subject_id = lab.subject_id WHERE demographic.insurance = 'Government' AND lab.itemid IN (50802, 50804)",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses lab.itemid IN (50802, 50804) instead of matching LAB.LABEL = 'WBC, Joint Fluid' as required. This is a localized mistake in the WHERE clause\u2019s predicate (wrong column and value), not a structural issue affecting joins or overall logic.",
            "error_type": "Local: incorrect predicate"
        },
        "0e8fd2d722e37743ae80d2f8b9c7a3f0": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients admitted under emergency admission type are of hispanic/latino - puertorican ethnicity? (Values: EMERGENCY, HISPANIC/LATINO - PUERTO RICAN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND DEMOGRAPHIC.\"ETHNICITY\" = \"HISPANIC/LATINO - PUERTO RICAN\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN ethnicity ON ethnicity.subject_id = demographic.subject_id WHERE demographic.admission_type = 'EMERGENCY' AND demographic.ethnicity = 'HISPANIC/LATINO - PUERTO RICAN'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such table: ethnicity",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an INNER JOIN with a non-existent table 'ethnicity', causing a table reference error, but the overall query structure for filtering by admission_type and ethnicity remains unchanged. This is a localized mistake in the FROM/JOIN clause rather than a flaw in the query\u2019s logic or multi-clause structure.",
            "error_type": "Local: table reference error"
        },
        "0d83c52fc4822a82a4ebf2428e18c0fa": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients born before the year 2167 were primarily diagnosed for hyperglycemia? (Values: HYPERGLYCEMIA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"HYPERGLYCEMIA\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"2167\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE diagnoses.long_title = 'Hyperglycemia' AND demographic.dob_year < 2167",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an INNER JOIN to the DIAGNOSES table and filters on diagnoses.long_title rather than using the primary diagnosis stored in DEMOGRAPHIC.DIAGNOSIS. The question asks for patients primarily diagnosed with hyperglycemia, so the correct filter should be applied directly on the DEMOGRAPHIC table\u2019s DIAGNOSIS column. By joining and filtering on a different table/column, the predicted query fundamentally changes the intended logic and returns incorrect results.",
            "error_type": "Global: incorrect join logic"
        },
        "9d1a610fdeca814a481fcfd2f4cfa096": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "tell me the drug code and route of doxazosin administration (Values: Doxazosin)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"FORMULARY_DRUG_CD\",PRESCRIPTIONS.\"ROUTE\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"DRUG\" = \"Doxazosin\"",
            "pred_sql": "SELECT drug, route FROM prescriptions WHERE drug = 'Doxazosin'",
            "gold_answer": "[['DOXA1', 'PO'], ['DOXA1', 'PO']]",
            "pred_answer": "[['Doxazosin', 'PO'], ['Doxazosin', 'PO']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the wrong column in the SELECT clause: it returns the DRUG column instead of the FORMULARY_DRUG_CD column. This is a localized mistake in the column reference and does not affect the overall query structure or joins.",
            "error_type": "Local: column reference error"
        },
        "93071743563d2991581ad4f1a614e467": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find out the route of administration for drug with drug code nabc50s. (Values: NABC50S)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"ROUTE\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" = \"NABC50S\"",
            "pred_sql": "SELECT route FROM prescriptions WHERE drug = 'NABC50S'",
            "gold_answer": "[['IV'], ['IV']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the wrong column in the WHERE clause: it filters on drug = 'NABC50S' instead of the FORMULARY_DRUG_CD column. This is a localized column reference error and does not require restructuring the query\u2019s overall logic.",
            "error_type": "Local: column reference error"
        },
        "a7285ffa3213ab37d2c756b87b37babf": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "which primary disease is the patient paul edwards suffering from? (Values: Paul Edwards)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Paul Edwards\"",
            "pred_sql": "SELECT diagnoses.short_title FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE demographic.name = 'Paul Edwards' AND demographic.diagnosis = 'CORONARY ARTERY DISEASE'",
            "gold_answer": "[['HYPERGLYCEMIA;HYPONATREMIA']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the DEMOGRAPHIC table with the DIAGNOSES table and adds an extra filter on demographic.diagnosis = 'CORONARY ARTERY DISEASE', which changes the overall logic and structure of the query. The question asks for the primary disease stored in DEMOGRAPHIC.DIAGNOSIS for Paul Edwards, not for diagnoses.short_title or a specific hard-coded disease. This incorrect join and extra condition fundamentally alter the intended query meaning.",
            "error_type": "Global: join logic error"
        },
        "90c61fa47e6f3ee70f1d5a5262acea5b": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the number of patients who underwent radical cystectomy? (Values: Radical cystectomy)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"SHORT_TITLE\" = \"Radical cystectomy\"",
            "pred_sql": "SELECT count(procedures.subject_id) FROM procedures INNER JOIN diagnoses ON procedures.subject_id = diagnoses.subject_id WHERE procedures.short_title = 'Radical cystectomy'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic by joining PROCEDURES to DIAGNOSES on SUBJECT_ID rather than joining PROCEDURES to DEMOGRAPHIC (and using HADM_ID) as in the ground truth. This wrong join both changes the tables involved and leads to duplicate counts (no DISTINCT), producing an incorrect result. Fixing this requires restructuring the join strategy, not just a minor tweak in a single clause.",
            "error_type": "Global: incorrect join"
        }
    },
    "deepseek": {
        "91c5218be91466059b6ab55b5c9a214b": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "How many of the patients on urgent admission had Neb drug route? (Values: URGENT, NEB)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"URGENT\" AND PRESCRIPTIONS.\"ROUTE\" = \"NEB\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID, D.HADM_ID) AS COUNT FROM DEMOGRAPHIC D JOIN PRESCRIPTIONS P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE D.ADMISSION_TYPE = 'URGENT' AND P.ROUTE = 'NEB';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "wrong number of arguments to function COUNT()",
            "is_correct": false,
            "reasoning": "The predicted SQL attempts to use COUNT(DISTINCT D.SUBJECT_ID, D.HADM_ID), but in SQLite COUNT(DISTINCT ) only accepts a single argument. This is a localized mistake within the aggregate function and does not affect the overall query structure or join logic. It is a syntax/argument error in the COUNT expression that can be fixed by using a single column or a different approach to count distinct pairs.",
            "error_type": "Local: aggregate argument error"
        },
        "082284313a19eb529220fdbbf1676c91": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "how many of the patients on self pay had coronary athrscl natve vessel? (Values: Self Pay, Crnry athrscl natve vssl)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"INSURANCE\" = \"Self Pay\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Crnry athrscl natve vssl\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC DM JOIN DIAGNOSES D ON DM.SUBJECT_ID = D.SUBJECT_ID AND DM.HADM_ID = D.HADM_ID WHERE DM.INSURANCE = 'Self Pay' AND D.LONG_TITLE = 'Coronary atherosclerosis native vessel';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the LONG_TITLE column and a spelled\u2010out disease name (\u2018Coronary atherosclerosis native vessel\u2019) instead of matching the SHORT_TITLE column and exact literal (\u2018Crnry athrscl natve vssl\u2019) specified by the question. The join structure and overall query logic remain correct, but the wrong column and mismatched value in the WHERE clause cause the discrepancy. This is a localized error that can be fixed without altering the query\u2019s structure.",
            "error_type": "Local: column reference/value error"
        },
        "867cf2582e1a2e8d3334cc3214b69472": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Calculate the minimum age of patients born after 2095 who have transient ischemic attack as their primary disease. (Values: TRANSIENT ISCHEMIC ATTACK)",
            "gold_sql": "SELECT MIN ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"TRANSIENT ISCHEMIC ATTACK\" AND DEMOGRAPHIC.\"DOB_YEAR\" > \"2095\"",
            "pred_sql": "SELECT MIN(AGE) AS MIN_AGE FROM DEMOGRAPHIC WHERE YEAR(DOB) > 2095 AND DIAGNOSIS LIKE '%TRANSIENT ISCHEMIC ATTACK%';",
            "gold_answer": "[['None']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because SQLite does not support the YEAR() function. This is a localized error in the WHERE clause (incorrect function usage), not a fundamental mis\u2010join or structural mistake. Everything else (MIN(AGE), table reference, LIKE condition) is syntactically local to that clause and doesn\u2019t require rewriting the overall query logic.",
            "error_type": "Local: function usage error"
        }
    },
    "qwen3": {
        "0e8272658be25dcd6baac667cfc23de8": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "How many of the patients with sigmoid diverticulitis colovestical fistula/SDA as their primary disease had a hospital stay for more than 26 days? (Values: SIGMOID DIVERTICULITIS, COLOVESTICAL FISTULA/SDA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"SIGMOID DIVERTICULITIS, COLOVESTICAL FISTULA/SDA\" AND DEMOGRAPHIC.\"DAYS_STAY\" > \"26\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DEMOGRAPHIC WHERE DIAGNOSIS IN ('SIGMOID DIVERTICULITIS', 'COLOVESTICAL FISTULA/SDA') AND DAYS_STAY > 26;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses DIAGNOSIS IN ('SIGMOID DIVERTICULITIS', 'COLOVESTICAL FISTULA/SDA') instead of matching the single combined diagnosis string 'SIGMOID DIVERTICULITIS, COLOVESTICAL FISTULA/SDA'. This is a local error in the WHERE clause\u2019s value condition, not affecting the overall query structure.",
            "error_type": "Local: value parsing error"
        },
        "93afecdf36b6ce7b81f6d82625a068fb": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "which patients have lab test item id 50953?",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE LAB.\"ITEMID\" = \"50953\"",
            "pred_sql": "SELECT DISTINCT d.* FROM DEMOGRAPHIC d INNER JOIN LAB l ON d.SUBJECT_ID = l.SUBJECT_ID AND d.HADM_ID = l.HADM_ID WHERE l.ITEMID = 50953;",
            "gold_answer": "[['17.0']]",
            "pred_answer": "[['14755.0', '151669.0', 'Bessie Wood', 'SINGLE', '47.0', '2078-07-15 00:00:00', 'F', 'ENGL', 'NOT SPECIFIED', 'EMERGENCY', '13.0', 'Medicare', 'WHITE', '0.0', 'TRANSFER FROM HOSP/EXTRAM', 'HOME HEALTH CARE', 'PNEUMONIA;HUMAN IMMUNODEFIENCY VIRUS;RULE OUT TUBERCULOSIS', 'None', '2078.0', 'None', '2125-02-09 18:34:00', '2125-02-23 16:30:00', '2125.0'], ['16438.0', '152794.0', 'Sheila Riley', 'None', '70.0', '2049-06-06 00:00:00', 'F', 'None', 'None', 'EMERGENCY', '7.0', 'Medicare', 'OTHER', '1.0', 'TRANSFER FROM HOSP/EXTRAM', 'HOME HEALTH CARE', 'PNEUMONIA', '2126-05-31 00:00:00', '2049.0', '2126.0', '2119-05-26 17:27:00', '2119-06-03 14:39:00', '2119.0'], ['17570.0', '183034.0', 'Paul Dunn', 'DIVORCED', '68.0', '2114-12-30 00:00:00', 'M', 'None', 'PROTESTANT QUAKER', 'EMERGENCY', '27.0', 'Medicare', 'WHITE', '1.0', 'TRANSFER FROM HOSP/EXTRAM', 'REHAB/DISTINCT PART HOSP', 'INFECTED RIGHT THIGH GRAFT', '2183-06-12 00:00:00', '2114.0', '2183.0', '2182-12-27 16:14:00', '2183-01-24 13:00:00', '2182.0'], ['19620.0', '130531.0', 'Dawn Cooper', 'SINGLE', '43.0', '2120-09-25 00:00:00', 'F', 'None', 'NOT SPECIFIED', 'EMERGENCY', '5.0', 'Medicare', 'WHITE', '1.0', 'EMERGENCY ROOM ADMIT', 'HOME HEALTH CARE', 'ACIDOSIS', '2168-05-19 00:00:00', '2120.0', '2168.0', '2163-03-03 15:16:00', '2163-03-08 15:51:00', '2163.0'], ['23602.0', '152293.0', 'Ida Cook', 'WIDOWED', '77.0', '2073-08-06 00:00:00', 'F', 'None', 'CATHOLIC', 'EMERGENCY', '7.0', 'Private', 'WHITE', '0.0', 'TRANSFER FROM HOSP/EXTRAM', 'SNF', 'CORONARY ARTERY DISEASE', 'None', '2073.0', 'None', '2150-03-02 14:30:00', '2150-03-10 12:40:00', '2150.0'], ['28588.0', '141664.0', 'Theresa Vedovelli', 'SINGLE', '89.0', '1850-08-17 00:00:00', 'F', 'ENGL', 'PROTESTANT QUAKER', 'EMERGENCY', '10.0', 'Medicare', 'WHITE', '0.0', 'EMERGENCY ROOM ADMIT', 'SNF', 'COMPLETE HEART BLOCK', 'None', '1850.0', 'None', '2150-08-17 22:51:00', '2150-08-28 13:35:00', '2150.0'], ['29541.0', '103957.0', 'Estrella Carroll', 'SINGLE', '58.0', '2112-06-24 00:00:00', 'F', 'ENGL', 'CATHOLIC', 'EMERGENCY', '5.0', 'Medicare', 'WHITE', '0.0', 'EMERGENCY ROOM ADMIT', 'HOME', 'SEPSIS', 'None', '2112.0', 'None', '2170-03-25 23:12:00', '2170-03-31 14:00:00', '2170.0'], ['29961.0', '196409.0', 'Jerry Deberry', 'SINGLE', '72.0', '2043-02-28 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '20.0', 'Medicare', 'WHITE', '0.0', 'CLINIC REFERRAL/PREMATURE', 'SNF', 'S/P FALL', 'None', '2043.0', 'None', '2115-06-20 17:48:00', '2115-07-10 18:45:00', '2115.0'], ['3623.0', '178444.0', 'Joseph Dillman', 'MARRIED', '63.0', '2101-07-04 00:00:00', 'M', 'ENGL', 'PROTESTANT QUAKER', 'EMERGENCY', '8.0', 'Medicare', 'WHITE', '1.0', 'EMERGENCY ROOM ADMIT', 'HOME HEALTH CARE', 'PNEUMONIA', '2164-02-23 00:00:00', '2101.0', '2164.0', '2164-02-14 16:25:00', '2164-02-22 17:30:00', '2164.0'], ['4333.0', '155027.0', 'Kenneth Koeller', 'MARRIED', '77.0', '2047-11-23 00:00:00', 'M', 'PTUN', 'CATHOLIC', 'EMERGENCY', '29.0', 'Medicare', 'WHITE', '0.0', 'TRANSFER FROM HOSP/EXTRAM', 'REHAB/DISTINCT PART HOSP', 'GUILLAIN BARRE SYNDROME', 'None', '2047.0', 'None', '2124-06-29 15:04:00', '2124-07-28 16:33:00', '2124.0'], ['4333.0', '155027.0', 'Kenneth Koeller', 'MARRIED', '77.0', '2047-11-23 00:00:00', 'M', 'PTUN', 'CATHOLIC', 'EMERGENCY', '29.0', 'Medicare', 'WHITE', '0.0', 'TRANSFER FROM HOSP/EXTRAM', 'REHAB/DISTINCT PART HOSP', 'GUILLAIN BARRE SYNDROME', 'None', '2047.0', 'None', '2124-06-29 15:04:00', '2124-07-28 16:33:00', '2124.0'], ['4333.0', '155027.0', 'Kenneth Koeller', 'MARRIED', '77.0', '2047-11-23 00:00:00', 'M', 'PTUN', 'CATHOLIC', 'EMERGENCY', '29.0', 'Medicare', 'WHITE', '0.0', 'TRANSFER FROM HOSP/EXTRAM', 'REHAB/DISTINCT PART HOSP', 'GUILLAIN BARRE SYNDROME', 'None', '2047.0', 'None', '2124-06-29 15:04:00', '2124-07-28 16:33:00', '2124.0'], ['52012.0', '146937.0', 'Jane Dillard', 'SINGLE', '45.0', '2117-08-30 00:00:00', 'F', 'ENGL', 'NOT SPECIFIED', 'EMERGENCY', '2.0', 'Medicare', 'WHITE', '0.0', 'CLINIC REFERRAL/PREMATURE', 'HOME', 'RASH', 'None', '2117.0', 'None', '2162-10-15 22:53:00', '2162-10-18 11:35:00', '2162.0'], ['55094.0', '135633.0', 'Lawrence Wibbens', 'MARRIED', '56.0', '2126-10-22 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '23.0', 'Medicaid', 'WHITE', '0.0', 'CLINIC REFERRAL/PREMATURE', 'HOME HEALTH CARE', 'ABDOMINAL ABSCESS', 'None', '2126.0', 'None', '2182-02-08 22:31:00', '2182-03-04 14:28:00', '2182.0'], ['55094.0', '135633.0', 'Lawrence Wibbens', 'MARRIED', '56.0', '2126-10-22 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '23.0', 'Medicaid', 'WHITE', '0.0', 'CLINIC REFERRAL/PREMATURE', 'HOME HEALTH CARE', 'ABDOMINAL ABSCESS', 'None', '2126.0', 'None', '2182-02-08 22:31:00', '2182-03-04 14:28:00', '2182.0'], ['62296.0', '193576.0', 'Morgan Mcgee', 'WIDOWED', '83.0', '2085-10-29 00:00:00', 'F', 'ENGL', 'JEWISH', 'EMERGENCY', '16.0', 'Medicare', 'WHITE', '1.0', 'EMERGENCY ROOM ADMIT', 'DEAD/EXPIRED', 'ABDOMINAL PAIN', '2168-10-29 00:00:00', '2085.0', '2168.0', '2168-10-12 11:36:00', '2168-10-29 05:17:00', '2168.0'], ['67965.0', '145657.0', 'Richard Gundlach', 'MARRIED', '74.0', '2041-07-10 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '7.0', 'Medicare', 'WHITE', '1.0', 'CLINIC REFERRAL/PREMATURE', 'DEAD/EXPIRED', 'GANGRENE', '2115-09-24 00:00:00', '2041.0', '2115.0', '2115-09-17 00:51:00', '2115-09-24 12:00:00', '2115.0'], ['85673.0', '136522.0', 'Gus Marques', 'SINGLE', '27.0', '2138-05-21 00:00:00', 'M', 'ENGL', 'JEWISH', 'EMERGENCY', '9.0', 'Private', 'WHITE - RUSSIAN', '0.0', 'CLINIC REFERRAL/PREMATURE', 'HOME', 'HEMOPYTSIS', 'None', '2138.0', 'None', '2165-04-29 23:35:00', '2165-05-09 14:40:00', '2165.0'], ['94762.0', '160707.0', 'Walter Locher', 'MARRIED', '67.0', '2098-04-23 00:00:00', 'M', 'ENGL', 'PROTESTANT QUAKER', 'ELECTIVE', '20.0', 'Medicare', 'WHITE', '1.0', 'PHYS REFERRAL/NORMAL DELI', 'DEAD/EXPIRED', 'NEOPLASM OF UNCERTAIN BEHAVIOR OF OTHER LYMPHATIC AND HEMATOPOIETIC TISSUES\\\\BONE MARROW TRANSPLANT', '2165-06-24 00:00:00', '2098.0', '2165.0', '2165-06-03 11:25:00', '2165-06-24 03:23:00', '2165.0'], ['98220.0', '189416.0', 'Bruce Harris', 'MARRIED', '70.0', '2103-11-14 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '23.0', 'Medicare', 'WHITE', '1.0', 'PHYS REFERRAL/NORMAL DELI', 'HOME HEALTH CARE', 'COLANGITIS', '2173-12-24 00:00:00', '2103.0', '2173.0', '2173-08-25 12:58:00', '2173-09-17 15:40:00', '2173.0']]",
            "is_correct": false,
            "reasoning": "The predicted query returns full demographic rows (SELECT DISTINCT d.*) instead of computing the count of distinct patients, and it omits the COUNT(DISTINCT) aggregation entirely. Fixing it requires restructuring the SELECT clause and adding an aggregate function\u2014this is not a localized typo or syntax mistake but a fundamental change to the query\u2019s intended purpose and output structure.",
            "error_type": "Global: missing aggregation / wrong output structure"
        }
    },
    "llm2sql": {
        "074e704855d20a2abc5a310eb1ebec93": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "posaconazole suspension is administered via which route? (Values: Posaconazole Suspension)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"ROUTE\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"DRUG\" = \"Posaconazole Suspension\"",
            "pred_sql": "SELECT ROUTE FROM PRESCRIPTIONS WHERE DRUG = 'posaconazole suspension';",
            "gold_answer": "[['PO'], ['PO/NG']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query structure matches the intended query (SELECT ROUTE FROM PRESCRIPTIONS WHERE DRUG = ...), but it fails because of a literal mismatch: it uses single quotes and lowercase 'posaconazole suspension' while the stored DRUG value is 'Posaconazole Suspension' (case-sensitive). This is a localized error in the WHERE clause value parsing, not a structural or logical join issue.",
            "error_type": "Local: value parsing error"
        },
        "9bcb8fd398ac5be28718b9fb311c354e": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "Among patients with cerebral aneurysm/sda as their primary disease, calculate the total number of those born before the year 2173. (Values: CEREBRAL ANEURYSM/SDA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"CEREBRAL ANEURYSM/SDA\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2173\"",
            "pred_sql": "SELECT COUNT(DISTINCT DEMOGRAPHIC.SUBJECT_ID) FROM DEMOGRAPHIC JOIN DIAGNOSES ON DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID AND DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.LONG_TITLE = 'CEREBRAL ANEURYSM/SDA' AND DEMOGRAPHIC.DOB_YEAR < 2173;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a JOIN to the DIAGNOSES table and filters on DIAGNOSES.LONG_TITLE instead of using the DEMOGRAPHIC.DIAGNOSIS column as specified. This changes the intended source of the \u2018primary disease\u2019 information and the overall query logic (also using DOB_YEAR instead of ADMITYEAR). Fixing this would require removing the unnecessary JOIN and restoring the correct column, which is more than a local syntax or minor reference fix. It fundamentally alters the query\u2019s structure and intended meaning.",
            "error_type": "Global: incorrect join and filter logic"
        }
    },
    "o4-mini": {
        "a619d5854b9eb9d0df34539f613cafc4": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "give me the number of emergency hospital admission patients who had insertion of 2 vascular stents. (Values: EMERGENCY, Insert 2 vascular stents)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND PROCEDURES.\"SHORT_TITLE\" = \"Insert 2 vascular stents\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.subject_id) AS num_patients FROM demographic d JOIN procedures p ON d.subject_id = p.subject_id AND d.hadm_id = p.hadm_id WHERE d.admission_type = 'EMERGENCY' AND ( UPPER(p.long_title) LIKE '%INSERT%' AND UPPER(p.long_title) LIKE '%2%' AND UPPER(p.long_title) LIKE '%STENT%' );",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs in the WHERE clause\u2019s filter on the procedures table: it uses UPPER(p.long_title) LIKE conditions (and omits \u201cvascular\u201d) instead of matching PROCEDURES.SHORT_TITLE = 'Insert 2 vascular stents'. The join, aggregation, and table references are correct. This error is confined to a single clause (the filter), so it is a local error.",
            "error_type": "Local: incorrect WHERE clause filter"
        }
    }
}