{
    "codes": {
        "a862cb556c8a303b9fd05ffbc3866738": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "What is the minimum days of hospital stay for patients who are of black/haitian ethnicity? (Values: BLACK/HAITIAN)",
            "gold_sql": "SELECT MIN ( DEMOGRAPHIC.\"DAYS_STAY\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"BLACK/HAITIAN\"",
            "pred_sql": "SELECT min(demographic.days_stay) FROM demographic INNER JOIN demographic ON demographic.subject_id = demographic.subject_id WHERE demographic.ethnicity = 'BLACK/HAITIAN'",
            "gold_answer": "[['2.0']]",
            "pred_answer": "ambiguous column name: demographic.days_stay",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an unnecessary self-join on the DEMOGRAPHIC table (INNER JOIN DEMOGRAPHIC ON demographic.subject_id = demographic.subject_id), which is fundamentally incorrect and changes the query structure. This causes an ambiguous column reference for demographic.days_stay because two copies of the same table are unnamed. The error stems from an incorrect join that alters the intended query logic and requires restructuring (i.e., removing the join), so it is a global error.",
            "error_type": "Global: join error"
        },
        "8318a358e23fc3e43d9c6c3cb70e75af": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "provide the duration of hospital stay and procedure title for subject id 71798.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DAYS_STAY\",PROCEDURES.\"LONG_TITLE\" FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"71798\"",
            "pred_sql": "SELECT demographic.days_stay, procedures.short_title FROM procedures INNER JOIN demographic ON procedures.subject_id = demographic.subject_id WHERE procedures.subject_id = 71798",
            "gold_answer": "[['2.0', 'Enteral infusion of concentrated nutritional substances']]",
            "pred_answer": "[['2.0', 'Entral infus nutrit sub']]",
            "is_correct": false,
            "reasoning": "The predicted query not only selects the wrong column (short_title instead of LONG_TITLE), but more critically joins on SUBJECT_ID rather than HADM_ID. Joining on SUBJECT_ID breaks the intended one\u2010to\u2010one admission\u2010procedure relationship and can produce incorrect data associations, fundamentally altering the query\u2019s logic. This is more than a minor syntax or column\u2010name issue\u2014it is a flawed join strategy that requires restructuring the query to correct the intended meaning.",
            "error_type": "Global: incorrect join key"
        },
        "a59c2fe7f918bb9e3f87dfd11186b2e7": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "To how many patients on urgent admission were d5w (excel bag) administered? (Values: URGENT, D5W (EXCEL BAG))",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"URGENT\" AND PRESCRIPTIONS.\"DRUG\" = \"D5W (EXCEL BAG)\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE demographic.admission_type = 'URGENT' AND prescriptions.drug_name = 'D5W (EXCEL BAG)'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: prescriptions.drug_name",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column prescriptions.drug_name (should be PRESCRIPTIONS.DRUG). This is a localized column reference error and does not require restructuring the query\u2019s overall logic or joins.",
            "error_type": "Local: column reference error"
        },
        "09836ee89fd684d22d1fd39b5efb7692": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "give the number of patients who have stayed in the hospital for more than one day whose lab test fluid is urine. (Values: 1, Urine)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"1\" AND LAB.\"FLUID\" = \"Urine\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.subject_id = lab.subject_id WHERE demographic.days_stay > 1 AND lab.fluid = 'Urine'",
            "gold_answer": "[['55.0']]",
            "pred_answer": "[['1274.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins DEMOGRAPHIC and LAB on SUBJECT_ID instead of on HADM_ID as required. This incorrect join key links rows across different admissions improperly, drastically changing the result (1274 vs 55). Since it affects the core relationship and logic of the query, it is a global error in the join structure.",
            "error_type": "Global: incorrect join key"
        },
        "93b9e31884f67490542d6aaf4d6b8108": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many male patients have lab test item id 51146? (Values: M)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"M\" AND LAB.\"ITEMID\" = \"51146\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.subject_id = lab.subject_id WHERE demographic.gender = 'M' AND lab.itemid = 51146",
            "gold_answer": "[['38.0']]",
            "pred_answer": "[['96.0']]",
            "is_correct": false,
            "reasoning": "The ground truth joins DEMOGRAPHIC to LAB on HADM_ID to correctly link each hospital admission\u2019s lab tests to the patient. The predicted SQL instead joins on SUBJECT_ID, which is a fundamentally incorrect relationship and inflates the count. This error affects the core logic of how tables are related and thus requires restructuring the join, making it a global error.",
            "error_type": "Global: join error"
        },
        "fffdd25c4b1fd2c10864a81fa85fd02e": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find the minimum age of white female patients . (Values: F, WHITE)",
            "gold_sql": "SELECT MIN ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"GENDER\" = \"F\" AND DEMOGRAPHIC.\"ETHNICITY\" = \"WHITE\"",
            "pred_sql": "SELECT min(demographic.age) FROM demographic INNER JOIN procedures ON demographic.subject_id = procedures.subject_id WHERE demographic.gender = 'F' AND demographic.race = 'WHITE'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: demographic.race",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references a non-existent column demographic.race instead of DEMOGRAPHIC.ETHNICITY, causing a 'no such column' error. This is a localized column reference mistake that can be fixed without altering the overall query structure or logic.",
            "error_type": "Local: column-reference error"
        }
    },
    "macsql": {
        "9192083f15618c3944fab5819282ce1f": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "give me the number of patients admitted before 2148 who are diagnosed with unspecified obesity. (Values: Obesity NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2148\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Obesity NOS\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.`SUBJECT_ID`) FROM DEMOGRAPHIC AS D INNER JOIN DIAGNOSES AS DI ON D.`SUBJECT_ID` = DI.`SUBJECT_ID` WHERE DI.`ICD9_CODE` = '27800' -- Assuming '27800' is the ICD-9 code for \"Obesity NOS\" AND D.`ADMITYEAR` < 2148",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID as the join condition instead of matching on HADM_ID. This fundamentally changes the query\u2019s logic by associating any diagnosis of a patient across all admissions rather than only diagnoses from the same hospital stay. Fixing this requires altering the overall join strategy, not just a local clause tweak.",
            "error_type": "Global: incorrect join key error"
        },
        "a77d67ccd0a105807ef5c3fb6cb2c019": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "Provide the number of patients who were admitted before the year 2146 and had procedure short title as cardiopulm resuscita nos. (Values: Cardiopulm resuscita NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2146\" AND PROCEDURES.\"SHORT_TITLE\" = \"Cardiopulm resuscita NOS\"",
            "pred_sql": "SELECT COUNT(DISTINCT T1.`SUBJECT_ID`) FROM ( SELECT DISTINCT `HADM_ID` FROM DEMOGRAPHIC WHERE `ADMITYEAR` < 2146 ) AS T1 INNER JOIN ( SELECT DISTINCT `SUBJECT_ID`, `HADM_ID` FROM PROCEDURES WHERE `SHORT_TITLE` = 'Cardiopulm resuscita nos' ) AS T2 ON T1.`HADM_ID` = T2.`HADM_ID`",
            "gold_answer": "[['2.0']]",
            "pred_answer": "no such column: T1.SUBJECT_ID",
            "is_correct": false,
            "reasoning": "The predicted SQL references T1.SUBJECT_ID in the outer SELECT, but the subquery aliased as T1 only selects HADM_ID. This is a column reference error in a specific part of the query and can be fixed by including SUBJECT_ID in T1\u2019s SELECT. It does not affect the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "0ffc8a41b8b94e7bc01da17aac9180bf": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "for patient id 74032, specify the religion and date of death",
            "gold_sql": "SELECT DEMOGRAPHIC.\"RELIGION\",DEMOGRAPHIC.\"DOD\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"74032\"",
            "pred_sql": "SELECT `RELIGION`, `DOD` FROM `DEMOGRAPHIC` WHERE `SUBJECT_ID` = 74032 AND `DOD` IS NOT NULL",
            "gold_answer": "[['CATHOLIC', 'None']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduced an extra WHERE condition `AND DOD IS NOT NULL` that is not in the user\u2019s request. This is a mistake localized to the WHERE clause (an unnecessary filter) and does not alter the overall query structure or joins. Removing this condition would correct the query, so it\u2019s a local error.",
            "error_type": "Local: where-clause error"
        }
    },
    "o4-mini": {
        "aaaa09cf4ad17119ae748e7b44f1d7c6": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "how many patients had the procedure under icd9 code 41?",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"ICD9_CODE\" = \"41\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) AS num_patients FROM PROCEDURES WHERE ICD9_CODE LIKE '41%';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s error lies solely in the WHERE clause: it uses LIKE '41%' to match any code starting with 41, instead of an exact match = '41'. This overcounts and produces the wrong result. No overall query structure or joins need to change; it\u2019s a localized mistake in the condition.",
            "error_type": "Local: value-parsing error"
        },
        "a74c0d773d66fce959ed3490677faac0": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "which patients had open and other left hemicolectomy? (Values: Opn lft hemicolectmy NEC)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"SHORT_TITLE\" = \"Opn lft hemicolectmy NEC\"",
            "pred_sql": "SELECT DISTINCT d.SUBJECT_ID, d.HADM_ID, d.NAME FROM PROCEDURES p JOIN DEMOGRAPHIC d ON p.SUBJECT_ID = d.SUBJECT_ID AND p.HADM_ID = d.HADM_ID WHERE p.SHORT_TITLE = 'Opn lft hemicolectmy NEC';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['81085.0', '169845.0', 'Thomas Jeanbaptiste']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the correct tables, JOIN keys, and WHERE filter but returns individual SUBJECT_ID, HADM_ID, and NAME instead of the COUNT(DISTINCT SUBJECT_ID) required. The mistake is isolated to the SELECT clause (wrong aggregation and columns), without altering the overall query structure or relationships.",
            "error_type": "Local: incorrect-select error"
        }
    },
    "dinsql": {
        "9e3324b9e4876efdcca381640e060400": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "how many patients are diagnosed with primary disease sepsis and admitted before the year 2187? (Values: SEPSIS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"SEPSIS\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2187\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM DIAGNOSES d JOIN DEMOGRAPHIC dem ON d.SUBJECT_ID = dem.SUBJECT_ID AND d.HADM_ID = dem.HADM_ID WHERE d.LONG_TITLE LIKE '%sepsis%' AND dem.ADMITYEAR < 2187",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['8.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic by joining the DIAGNOSES table and using a LIKE on LONG_TITLE rather than checking the primary disease column DEMOGRAPHIC.DIAGNOSIS. This changes the scope from primary diagnosis to any recorded diagnosis containing 'sepsis' and requires restructuring the query beyond a simple fix.",
            "error_type": "Global: flawed join strategy"
        },
        "94e979800c12fea24b8722c512dd7405": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "how many patients are diagnosed with primary disease bladder cancer/sda? (Values: BLADDER CANCER/SDA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"BLADDER CANCER/SDA\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE LONG_TITLE = 'BLADDER CANCER/SDA'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query references the DIAGNOSES table and its LONG_TITLE column, but the question asks for the primary disease stored in the DEMOGRAPHIC table\u2019s DIAGNOSIS column. This is a mistake in table/column selection and does not affect the overall query structure or flow.",
            "error_type": "Local: table/column reference error"
        },
        "9fc4764cc38d024d1682c51ce690b975": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "calculate the maximum age of unmarried male patients. (Values: SINGLE, M)",
            "gold_sql": "SELECT MAX ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"MARITAL_STATUS\" = \"SINGLE\" AND DEMOGRAPHIC.\"GENDER\" = \"M\"",
            "pred_sql": "MAX(AGE) FROM DEMOGRAPHIC WHERE MARITAL_STATUS = 'SINGLE' AND GENDER = 'M'",
            "gold_answer": "[['72.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword, making it syntactically invalid. This is a localized syntax issue in the SELECT clause and does not affect the overall query logic or table relationships.",
            "error_type": "Local: syntax error"
        },
        "0b5fc111d80c2e60438458ddb5979cf1": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "calculate the number of patients with personality disorder nos who had a hospital stay for more than 5 days. (Values: Personality disorder NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"5\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Personality disorder NOS\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC AS D JOIN DIAGNOSES AS DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE DI.LONG_TITLE = 'Personality disorder NOS' AND D.DAYS_STAY > 5",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the LONG_TITLE column instead of the SHORT_TITLE column to filter for 'Personality disorder NOS'. This is a localized column reference error and does not require restructuring the overall query logic or joins.",
            "error_type": "Local: column reference error"
        },
        "aa3651ed4202392f2f09a7769737f61b": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "provide the number of patients less than 83 years of age who were diagnosed with pneumococcal pneumonia. (Values: Pneumococcal pneumonia)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"83\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Pneumococcal pneumonia\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC AS D JOIN DIAGNOSES AS DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE D.AGE < 83 AND DI.LONG_TITLE = 'Pneumococcal pneumonia'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the correct tables and applies the age filter correctly, matching the overall structure of the ground truth. The only difference is that it filters on DI.LONG_TITLE instead of DI.SHORT_TITLE, causing it to miss the intended records. This is a localized mistake in the WHERE clause and does not affect the overall query logic or table relationships.",
            "error_type": "Local: column reference error"
        }
    },
    "llm2sql": {
        "84cdf16ce9ced3807228663939f35f2c": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "How many patients with s/p fall as their primary disease had ascitic fluid lab test? (Values: S/P FALL, Ascites)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"S/P FALL\" AND LAB.\"FLUID\" = \"Ascites\"",
            "pred_sql": "SELECT COUNT(DISTINCT DIAG.SUBJECT_ID) nFROM DIAGNOSES AS DIAG nJOIN LAB AS LAB ON DIAG.SUBJECT_ID = LAB.SUBJECT_ID AND DIAG.HADM_ID = LAB.HADM_ID nWHERE (DIAG.LONG_TITLE LIKE '%S/P FALL%' OR DIAG.SHORT_TITLE LIKE '%S/P FALL%') nAND LAB.FLUID = 'Ascites';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"DIAGNOSES\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL fails with a syntax error near \"DIAGNOSES\" because the 'nFROM' token is invalid (newline markers were inserted without spaces). This is a localized syntax mistake in the SELECT/FROM clause and does not involve a deeper logical or structural misunderstanding of the schema or intent. It can be fixed by correcting the syntax (e.g., adding a space or removing the 'n'), without altering the overall query logic.",
            "error_type": "Local: syntax error"
        }
    },
    "deepseek": {
        "a8e264d96300a69aa8dea07d6d507559": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Out of total number of patients admitted before the year 2150, how many of them had hemodialysis? (Values: Hemodialysis)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2150\" AND PROCEDURES.\"LONG_TITLE\" = \"Hemodialysis\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) AS NUMBER_OF_PATIENTS_WITH_HEMODIALYSIS FROM DEMOGRAPHIC DG JOIN PROCEDURES P ON DG.SUBJECT_ID = P.SUBJECT_ID AND DG.HADM_ID = P.HADM_ID WHERE DG.ADMITYEAR < 2150 AND P.ICD9_CODE = '3995';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "no such column: D.SUBJECT_ID",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the alias DG for the DEMOGRAPHIC table but then references D.SUBJECT_ID in the SELECT clause, which is undefined. This is a column reference error localized to a single part of the query and does not affect the overall logic.",
            "error_type": "Local: table/column reference error"
        },
        "0b70acfbd0281aad4f480933ffe64361": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "tell me the short title of diagnoses and days for which patient with patient id 74463 was hospitalized.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DAYS_STAY\",DIAGNOSES.\"SHORT_TITLE\" FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"74463\"",
            "pred_sql": "SELECT D.SHORT_TITLE, DG.DAYS_STAY FROM DIAGNOSES D JOIN DEMOGRAPHIC DG ON D.HADM_ID = DG.HADM_ID WHERE D.SUBJECT_ID = 74463 GROUP BY D.HADM_ID;",
            "gold_answer": "[['14.0', 'Abn react-artif implant'], ['14.0', 'Aortic valve disorder'], ['14.0', 'Aortocoronary bypass'], ['14.0', 'Atrial fibrillation'], ['14.0', 'Crnry athrscl natve vssl'], ['14.0', 'DMII wo cmp nt st uncntr'], ['14.0', 'Hyperlipidemia NEC/NOS'], ['14.0', 'Hypertension NOS'], ['14.0', 'Hypoxemia'], ['14.0', 'Long-term use anticoagul'], ['14.0', 'Old myocardial infarct'], ['14.0', 'Secundum atrial sept def'], ['14.0', 'Seroma complicting proc'], ['14.0', 'Status-post ptca']]",
            "pred_answer": "[['Old myocardial infarct', '14.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a GROUP BY on D.HADM_ID, which is not required and causes the query to return only one arbitrary diagnosis per admission instead of all diagnoses. The error is confined to the GROUP BY clause and does not affect the overall join logic or table relationships. This is a localized mistake in grouping rather than a structural or multi-clause logical flaw.",
            "error_type": "Local: incorrect GROUP BY error"
        },
        "b9e81a7036c0f844cb0892ae06fa0c72": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "what number of patients have diagnosis short title as rec depr psych-psychotic and drug route as po/ng? (Values: Rec depr psych-psychotic, PO/NG)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Rec depr psych-psychotic\" AND PRESCRIPTIONS.\"ROUTE\" = \"PO/NG\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) AS NUMBER_OF_PATIENTS FROM DIAGNOSES D JOIN PRESCRIPTIONS P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE D.SHORT_TITLE = 'rec depr psych-psychotic' AND P.ROUTE = 'PO/NG';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to return any rows because it uses a lowercase literal 'rec depr psych-psychotic' which does not match the stored value 'Rec depr psych-psychotic' (SQLite string comparisons are case-sensitive by default). This is a localized error in the WHERE clause value matching and does not require reshaping the query\u2019s overall join structure or logic.",
            "error_type": "Local: value parsing error"
        }
    }
}