{
    "llm2sql": {
        "8404478c3a267757514125bb690cca23": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients admitted after year 2146 had ruq pain? (Values: RUQ PAIN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"RUQ PAIN\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2146\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC D JOIN DIAGNOSES DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE D.ADMITYEAR > 2146 AND DI.LONG_TITLE LIKE '%RUQ Pain%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended logic by introducing a JOIN to the DIAGNOSES table (where the ground truth simply filters the DEMOGRAPHIC.DIAGNOSIS column). It also reverses the comparison on ADMITYEAR (uses > instead of <) and uses a LIKE filter on DI.LONG_TITLE rather than an exact match on DEMOGRAPHIC.DIAGNOSIS. These alterations span multiple clauses and require restructuring the query\u2019s logic, not just a minor fix in one clause.",
            "error_type": "Global: flawed join strategy"
        },
        "871de8f4f83e7d3c523502445f3264de": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the number of patients less than 56 years who have hyperglycemia primary disease? (Values: HYPERGLYCEMIA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"HYPERGLYCEMIA\" AND DEMOGRAPHIC.\"AGE\" < \"56\"",
            "pred_sql": "SELECT COUNT(DISTINCT DEMOGRAPHIC.SUBJECT_ID) FROM DEMOGRAPHIC JOIN DIAGNOSES ON DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID WHERE DEMOGRAPHIC.AGE < 56 AND DIAGNOSES.LONG_TITLE LIKE '%HYPERGLYCEMIA%';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s structure and logic by joining the DIAGNOSES table and filtering on DIAGNOSES.LONG_TITLE, rather than using the DEMOGRAPHIC.DIAGNOSIS column for the primary disease. This is not a simple syntax or alias issue but a wrong-table usage that changes the meaning of the query, requiring a significant restructuring to fix.",
            "error_type": "Global: incorrect table usage"
        },
        "838ee5f862ddd3c0a19da04e62ab6735": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "Calculate the patients who are prescribed additive drugs that have stayed in the hospital for more than 5 days. (Values: ADDITIVE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"5\" AND PRESCRIPTIONS.\"DRUG_TYPE\" = \"ADDITIVE\"",
            "pred_sql": "SELECT COUNT(DISTINCT DEMOGRAPHIC.SUBJECT_ID) nFROM PRESCRIPTIONS nJOIN DEMOGRAPHIC ON PRESCRIPTIONS.SUBJECT_ID = DEMOGRAPHIC.SUBJECT_ID nAND PRESCRIPTIONS.HADM_ID = DEMOGRAPHIC.HADM_ID nWHERE PRESCRIPTIONS.DRUG_TYPE = 'ADDITIVE' nAND DEMOGRAPHIC.DAYS_STAY > 5",
            "gold_answer": "[['4.0']]",
            "pred_answer": "near \"PRESCRIPTIONS\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL has a syntax mistake caused by missing spaces/newlines before the FROM and JOIN keywords (e.g., \u2018nFROM PRESCRIPTIONS nJOIN \u2026\u2019), which breaks the parser. This is a simple, localized syntax error in the query formatting rather than a logical or structural issue with table relationships or overall query intent. It can be fixed by adding the proper spaces/newlines around FROM/JOIN without altering the query\u2019s logic.",
            "error_type": "Local: syntax error"
        },
        "80493e9bb6cabefb1d4a01cb9851ea70": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "provide me the number of patients who have been diagnosed with chordae tendinae rupture. (Values: Chordae tendinae rupture)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Chordae tendinae rupture\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE LONG_TITLE = 'Chordae tendinae rupture';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query uses the LONG_TITLE column instead of the correct SHORT_TITLE column to filter for \u201cChordae tendinae rupture.\u201d This is a mistake in a specific part of the WHERE clause (column reference), and it does not alter the overall structure or join logic of the query. Hence it is a localized error.",
            "error_type": "Local: column-reference error"
        },
        "05343cc69204da73ce2ac4ac4d8295bb": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "Show me the number of black /haitian patients who were diagnosed under the diagnoses cicd9 code 2948. (Values: BLACK/HAITIAN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"BLACK/HAITIAN\" AND DIAGNOSES.\"ICD9_CODE\" = \"2948\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) nFROM DEMOGRAPHIC d nJOIN DIAGNOSES diag nON d.SUBJECT_ID = diag.SUBJECT_ID AND d.HADM_ID = diag.HADM_ID nWHERE diag.ICD9_CODE = '2948' nAND d.ETHNICITY = 'BLACK/HAITIAN';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"DEMOGRAPHIC\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL has a syntax error due to the literal \u201cnFROM\u201d (and similar \u201cnJOIN\u201d) instead of a proper newline or space before FROM/JOIN, causing \"near \\\"DEMOGRAPHIC\\\": syntax error\". This is a localized syntax/formatting mistake and does not change the overall join logic or query structure.",
            "error_type": "Local: syntax error"
        },
        "0332dda726da118eaa7ca1bd76d407df": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the number of patients whose hospital stay is above 7 days and diagnosed with single ib in-hosp w cs? (Values: Single lb in-hosp w cs)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"7\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Single lb in-hosp w cs\"",
            "pred_sql": "SELECT COUNT(*) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES ON DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.DAYS_STAY > 7 AND DIAGNOSES.LONG_TITLE = 'Single lb in-hosp w cs'",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL errs only in the SELECT and WHERE clauses: it filters by DIAGNOSES.LONG_TITLE instead of the correct SHORT_TITLE and uses COUNT(*) instead of COUNT(DISTINCT SUBJECT_ID). These mistakes are confined to specific column references and aggregation functions and do not alter the overall join structure or query logic. Thus this is a Local error.",
            "error_type": "Local: column reference error"
        }
    },
    "deepseek": {
        "a5d9467737164f47007345c4893d763f": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "which patients have drug code bactss? (Values: BACTSS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" = \"BACTSS\"",
            "pred_sql": "SELECT D.NAME FROM DEMOGRAPHIC D INNER JOIN PRESCRIPTIONS P ON D.SUBJECT_ID = P.SUBJECT_ID WHERE P.FORMULARY_DRUG_CD = 'BACTSS';",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['Antonio Mccarthy'], ['Antonio Mccarthy'], ['Antonio Mccarthy'], ['Gwendolyn Hager'], ['Jason Walker'], ['Warren Baldwin']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the overall query logic by selecting patient names instead of counting distinct patient IDs, and also uses a different join key (SUBJECT_ID rather than HADM_ID). This is not a simple typo or localized clause mistake but a structural change that alters the intended output and aggregation, so it is a global error.",
            "error_type": "Global: structural-flaw"
        },
        "95832f8e506136d97ce571b7c5bd4e10": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "what is the diagnosis code and diagnosis long title for the patient francis baseler? (Values: Francis Baseler)",
            "gold_sql": "SELECT DIAGNOSES.\"ICD9_CODE\",DIAGNOSES.\"LONG_TITLE\" FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Francis Baseler\"",
            "pred_sql": "SELECT D.ICD9_CODE AS \"Diagnosis Code\", D.LONG_TITLE AS \"Diagnosis Long Title\" FROM DEMOGRAPHIC DG INNER JOIN DIAGNOSES D ON DG.SUBJECT_ID = D.SUBJECT_ID AND DG.HADM_ID = D.HADM_ID WHERE DG.NAME = 'Francis Baseler';",
            "gold_answer": "[['2639.0', 'Unspecified protein-calorie malnutrition'], ['2809.0', 'Iron deficiency anemia, unspecified'], ['2869.0', 'Other and unspecified coagulation defects'], ['29634.0', 'Major depressive affective disorder, recurrent episode, severe, specified as with psychotic behavior'], ['30400.0', 'Opioid type dependence, unspecified'], ['33829.0', 'Other chronic pain'], ['34690.0', 'Migraine, unspecified, without mention of intractable migraine without mention of status migrainosus'], ['56962.0', 'Mechanical complication of colostomy and enterostomy'], ['5771.0', 'Chronic pancreatitis'], ['E9530', 'Suicide and self-inflicted injury by hanging'], ['V489', 'Unspecified problem with head, neck, or trunk'], ['V6284', 'Suicidal ideation']]",
            "pred_answer": "[['2639.0'], ['2809.0'], ['2869.0'], ['29634.0'], ['30400.0'], ['33829.0'], ['34690.0'], ['56962.0'], ['5771.0'], ['E9530'], ['V489'], ['V6284']]",
            "is_correct": false,
            "reasoning": "The predicted query fails to return the diagnosis long title even though the ground truth asks for both ICD9_CODE and LONG_TITLE. This is a localized mistake in the SELECT clause (omitting the second column), not a fundamental issue with joins or overall query structure.",
            "error_type": "Local: column reference error"
        }
    },
    "qwen3": {
        "0ef6faed83eede01bf4c9bb3f186fe66": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "let me know both the short title and icd9 code of procedure of patient thomas nazario. (Values: Thomas Nazario)",
            "gold_sql": "SELECT PROCEDURES.\"ICD9_CODE\",PROCEDURES.\"SHORT_TITLE\" FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Thomas Nazario\"",
            "pred_sql": "SELECT p.SHORT_TITLE, p.ICD9_CODE FROM PROCEDURES p JOIN DEMOGRAPHIC d ON p.SUBJECT_ID = d.SUBJECT_ID AND p.HADM_ID = d.HADM_ID WHERE d.NAME = 'Thomas Nazario';",
            "gold_answer": "[['3512.0', 'Opn mitral valvuloplasty'], ['3532.0', 'Chordae tendineae ops'], ['3611.0', 'Aortocor bypas-1 cor art'], ['3615.0', '1 int mam-cor art bypass'], ['3723.0', 'Rt/left heart card cath'], ['3761.0', 'Pulsation balloon implan'], ['3931.0', 'Suture of artery'], ['3961.0', 'Extracorporeal circulat'], ['8856.0', 'Coronar arteriogr-2 cath']]",
            "pred_answer": "[['1 int mam-cor art bypass', '3615.0'], ['Aortocor bypas-1 cor art', '3611.0'], ['Chordae tendineae ops', '3532.0'], ['Coronar arteriogr-2 cath', '8856.0'], ['Extracorporeal circulat', '3961.0'], ['Opn mitral valvuloplasty', '3512.0'], ['Pulsation balloon implan', '3761.0'], ['Rt/left heart card cath', '3723.0'], ['Suture of artery', '3931.0']]",
            "is_correct": false,
            "reasoning": "The only difference between the ground truth and the predicted SQL is the order of columns in the SELECT clause (the predicted SQL returns SHORT_TITLE first and ICD9_CODE second, whereas the ground truth requests ICD9_CODE then SHORT_TITLE). The table joins, filters, and relationships are all correct, so this is a localized issue in the SELECT clause that does not affect the overall query structure or logic.",
            "error_type": "Local: select-clause column order error"
        }
    },
    "macsql": {
        "87e3e952f4c6888eca35ce87b6a82e7d": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "what is average age of patients whose primary disease is bowel obstruction and who are aged equal or more than 71 years? (Values: BOWEL OBSTRUCTION)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"BOWEL OBSTRUCTION\" AND DEMOGRAPHIC.\"AGE\" >= \"71\"",
            "pred_sql": "SELECT AVG(T2.`AGE`) AS average_age FROM DEMOGRAPHIC AS T2 INNER JOIN ( SELECT DISTINCT T1.`SUBJECT_ID`, T1.`HADM_ID` FROM DIAGNOSES AS T1 WHERE T1.`LONG_TITLE` LIKE '%BOWEL OBSTRUCTION%' ) AS T3 ON T2.`SUBJECT_ID` = T3.`SUBJECT_ID` AND T2.`HADM_ID` = T3.`HADM_ID` WHERE T2.`AGE` >= 71 AND T2.`AGE` IS NOT NULL",
            "gold_answer": "[['77.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the DEMOGRAPHIC table to the DIAGNOSES table and filters on DIAGNOSES.LONG_TITLE for 'bowel obstruction', but the question asks for patients whose primary disease (stored in DEMOGRAPHIC.DIAGNOSIS) is 'BOWEL OBSTRUCTION'. Using the DIAGNOSES table and a LIKE filter fundamentally changes the logic and data source of the primary disease condition. This is not a simple column reference fix; it requires restructuring the query to remove the join and apply the filter directly on DEMOGRAPHIC.DIAGNOSIS.",
            "error_type": "Global: incorrect-join"
        }
    },
    "codes": {
        "8182d5043bd51f337b846751434757f1": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "give me the number of patients less than 41 years who have delta abnormal lab test status.",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"41\" AND LAB.\"FLAG\" = \"delta\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.subject_id = lab.subject_id WHERE demographic.age < 41 AND lab.flag = 'delta'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['9.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the join condition and aggregation in a way that alters the fundamental logic of the query. The ground truth uses INNER JOIN on HADM_ID (to match each lab record to the correct admission) and COUNT(DISTINCT SUBJECT_ID) to count unique patients. The prediction instead joins only on SUBJECT_ID and uses COUNT without DISTINCT, causing multiple admissions and lab records per patient to be overcounted. This is not a simple typo or syntax issue isolated to one clause but a core logical mistake in how data rows are combined and aggregated. It requires restructuring the join and aggregation strategy to fix, so it is a Global error.",
            "error_type": "Global: incorrect join and aggregation logic"
        },
        "0e597171d8f49a56ee59fb5598fd6322": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "give the birthdate and procedure title of jerry deberry. (Values: Jerry Deberry)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DOB\",PROCEDURES.\"LONG_TITLE\" FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Jerry Deberry\"",
            "pred_sql": "SELECT demographic.dob, procedures.short_title FROM demographic INNER JOIN procedures ON demographic.subject_id = procedures.subject_id WHERE demographic.name = 'Jerry Deberry'",
            "gold_answer": "[['2043-02-28 00:00:00', 'Arterial catheterization'], ['2043-02-28 00:00:00', 'Central venous catheter placement with guidance'], ['2043-02-28 00:00:00', 'Continuous invasive mechanical ventilation for less than 96 consecutive hours'], ['2043-02-28 00:00:00', 'Enteral infusion of concentrated nutritional substances'], ['2043-02-28 00:00:00', 'Insertion of endotracheal tube'], ['2043-02-28 00:00:00', 'Percutaneous [endoscopic] gastrostomy [PEG]'], ['2043-02-28 00:00:00', 'Venous catheterization, not elsewhere classified']]",
            "pred_answer": "[['2043-02-28 00:00:00', 'Arterial catheterization'], ['2043-02-28 00:00:00', 'CV cath plcmt w guidance'], ['2043-02-28 00:00:00', 'Cont inv mec ven <96 hrs'], ['2043-02-28 00:00:00', 'Entral infus nutrit sub'], ['2043-02-28 00:00:00', 'Insert endotracheal tube'], ['2043-02-28 00:00:00', 'Percu endosc gastrostomy'], ['2043-02-28 00:00:00', 'Venous cath NEC']]",
            "is_correct": false,
            "reasoning": [
                "The ground truth query selects the column PROCEDURES.LONG_TITLE, while the predicted query selects PROCEDURES.SHORT_TITLE. This is a wrong column reference in the SELECT clause.",
                "Additionally, the ground truth joins on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID, but the predicted query joins on DEMOGRAPHIC.SUBJECT_ID = PROCEDURES.SUBJECT_ID. Although this could lead to incorrect row associations in some cases, the immediate semantic mismatch in the result text (long vs. short title) stems from the column choice.",
                "Selecting the wrong column is a localized mistake in the SELECT clause and does not require restructuring the overall query logic or changing table relationships at a higher level."
            ],
            "error_type": "Local: column reference error"
        },
        "927bcc5acfc5a7c2f5b2ebf99de1cd47": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "provide me with the number of patients less than 59 years who were transferred within the facility. (Values: TRSF WITHIN THIS FACILITY)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_LOCATION\" = \"TRSF WITHIN THIS FACILITY\" AND DEMOGRAPHIC.\"AGE\" < \"59\"",
            "pred_sql": "SELECT count(subject_id) FROM demographic WHERE admission_location = 'TRANSFER FROM HOSP/EXTRAM' AND age < 59",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs by using the wrong literal in the WHERE clause\u2014\u2018TRANSFER FROM HOSP/EXTRAM\u2019 instead of the exact required value \u2018TRSF WITHIN THIS FACILITY\u2019. This is a localized mistake in the filter condition (value parsing), not affecting overall structure or joins.",
            "error_type": "Local: value parsing error"
        },
        "a667eb8609a76490ddbf55b5c12e3695": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "count the number of emergency hospital admission patients who have gangrene primary disease. (Values: EMERGENCY, GANGRENE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"GANGRENE\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE diagnoses.short_title = 'Gangrene' AND demographic.admission_type = 'EMERGENCY'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query incorrectly joins DEMOGRAPHIC to the DIAGNOSES table and filters on DIAGNOSES.SHORT_TITLE rather than using DEMOGRAPHIC.DIAGNOSIS for the primary disease. This changes the overall logic and data source for the condition, leading to the wrong result. Fixing it would require restructuring the query to remove the join and reference the correct column, which is beyond a localized syntax fix.",
            "error_type": "Global: join error"
        },
        "9057aad89e8f66541aadbb45ad8f4747": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "which patients are on bethanechol prescription? (Values: Bethanechol)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"DRUG\" = \"Bethanechol\"",
            "pred_sql": "SELECT prescriptions.subject_id FROM prescriptions WHERE prescriptions.drug = 'Bethanechol'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['4589.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only selects subject_id rows from the PRESCRIPTIONS table without applying COUNT or DISTINCT, whereas the ground truth requires counting distinct subject IDs. This is a mistake in the SELECT clause (wrong aggregation and missing DISTINCT), and does not involve reworking joins or overall query structure.",
            "error_type": "Local: aggregation error"
        },
        "a557a27486342d06e45decaab91aeed8": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "tell me the birth date and primary disease of patient caren obrien. (Values: Caren Obrien)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DOB\",DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Caren Obrien\"",
            "pred_sql": "SELECT dob, diagnosis FROM demographic WHERE name = 'CAREN OBRIEN'",
            "gold_answer": "[['1882-10-10 00:00:00', 'SYNCOPE;TELEMETRY']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The only mistake in the predicted SQL is the casing of the literal 'CAREN OBRIEN' versus the actual name 'Caren Obrien' in the DEMOGRAPHIC table. SQLite\u2019s default comparison is case\u2010sensitive here, so the wrong case prevents any match. Everything else\u2014table, columns, clauses\u2014matches the ground truth. This is a localized value parsing/formatting error and doesn\u2019t alter the overall query structure or logic.",
            "error_type": "Local: value parsing error"
        },
        "05b45f4c6bb925d5091172692b926676": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find the number of patients born before the year 1837 who are no longer alive.",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"1\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"1837\"",
            "pred_sql": "SELECT count(expire_flag) FROM demographic WHERE dob_year < 1837 AND expire_flag = 0",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s mistakes are confined to the WHERE clause and the aggregation: it uses expire_flag = 0 instead of = 1 and uses count(expire_flag) rather than counting distinct SUBJECT_ID. The overall structure (single-table query, no joins or subqueries) is correct, and the error can be fixed locally without restructuring the query\u2019s logic or joins.",
            "error_type": "Local: value/filter aggregation error"
        },
        "007b736a7e85c0d907a1aa0574bcd582": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients were admitted in emergency primarily for brain mass; intracranial hemorrhage ? (Values: EMERGENCY, BRAIN MASS;INTRACRANIAL HEMORRHAGE)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"BRAIN MASS;INTRACRANIAL HEMORRHAGE\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE demographic.admission_location = 'EMERGENCY' AND diagnoses.short_title = 'BRAIN MASS;INTRACRANIAL HEMORRHAGE'",
            "gold_answer": "[['71.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic by joining to the DIAGNOSES table and filtering on diagnoses.short_title rather than using the DEMOGRAPHIC.DIAGNOSIS field and the ADMISSION_TYPE column. It also uses the wrong admission_location column instead of ADMISSION_TYPE and introduces a join that was not in the original intent. These are not isolated typos but a flawed join strategy and incorrect table/column usage that alter the query\u2019s overall meaning, so this is a Global error.",
            "error_type": "Global: incorrect join"
        }
    },
    "dinsql": {
        "95729f0dfd914c9590bd8c1e29b1c9b9": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "What is the number of patients less than 85 years who have liver transplant as their primary disease? (Values: LIVER TRANSPLANT)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"LIVER TRANSPLANT\" AND DEMOGRAPHIC.\"AGE\" < \"85\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC AS D JOIN DIAGNOSES AS DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE D.AGE < 85 AND DI.LONG_TITLE LIKE '%LIVER TRANSPLANT%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query logic by joining to the DIAGNOSES table and filtering on DIAGNOSES.LONG_TITLE, rather than using the primary disease stored in DEMOGRAPHIC.DIAGNOSIS. This incorrect join and table choice alters the meaning of the query and cannot be fixed by a small tweak in a single clause\u2014it requires restructuring the query to use the DEMOGRAPHIC table\u2019s DIAGNOSIS column directly.",
            "error_type": "Global: incorrect join/table selection"
        }
    },
    "o4-mini": {
        "9dc0838fea8ceebde01fd608c434210c": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "which patients have buccal route of drug administration? (Values: BUCCAL)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"ROUTE\" = \"BUCCAL\"",
            "pred_sql": "SELECT DISTINCT d.SUBJECT_ID, d.HADM_ID, d.NAME FROM PRESCRIPTIONS p JOIN DEMOGRAPHIC d ON p.SUBJECT_ID = d.SUBJECT_ID AND p.HADM_ID = d.HADM_ID WHERE p.ROUTE = 'BUCCAL';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['3623.0', '178444.0', 'Joseph Dillman'], ['3623.0', '178444.0', 'Joseph Dillman'], ['3623.0', '178444.0', 'Joseph Dillman'], ['3623.0', '178444.0', 'Joseph Dillman']]",
            "is_correct": false,
            "reasoning": "The predicted SQL returns individual patient-admission rows (including NAME and HADM_ID) instead of the count of distinct patients as required. It omits the COUNT(DISTINCT) aggregation and selects the wrong columns, fundamentally altering the query\u2019s purpose. This mistake spans both the SELECT clause and absence of aggregation, requiring more than a localized fix.",
            "error_type": "Global: incorrect aggregation and select columns"
        }
    }
}