{
    "dinsql": {
        "03ad1ed58197cc476c639d7af7c662a3": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "Calculate the total number of patients who had transient ischemic attack as their primary disease. (Values: TRANSIENT ISCHEMIC ATTACK)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"TRANSIENT ISCHEMIC ATTACK\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE LONG_TITLE LIKE '%TRANSIENT ISCHEMIC ATTACK%' OR SHORT_TITLE LIKE '%TRANSIENT ISCHEMIC ATTACK%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the DIAGNOSES table instead of the DEMOGRAPHIC table, thereby using the wrong source for the 'primary disease' field. This is a localized mistake in table reference rather than a fundamental restructuring of the query logic.",
            "error_type": "Local: table reference error"
        },
        "ac68bab7e7f4cd79ac543b18d76d24d3": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "Calulate the total number of patients who had icd9 code 5771",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"ICD9_CODE\" = \"5771\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE ICD9_CODE = '5771'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DIAGNOSES table instead of the PROCEDURES table as in the ground truth. This is not a simple typo but changes the entire logic by querying the wrong source of ICD9 codes, resulting in a different patient count. Fixing this requires altering the overall query structure to join the correct table, so it\u2019s a global error.",
            "error_type": "Global: wrong-table logic"
        },
        "04e471a143d212d6e201d787eea68d7d": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "how many patients used the drug name capso fungin? (Values: Caspofungin)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"DRUG\" = \"Caspofungin\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM PRESCRIPTIONS WHERE DRUG = 'Capso fungin'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL misuses the drug name literal (\u201cCapso fungin\u201d instead of the exact value \u201cCaspofungin\u201d required by the question). This is a localized mistake in the WHERE clause value rather than a change to the overall query structure or logic. Therefore it\u2019s a local error of incorrect literal value parsing.",
            "error_type": "Local: value parsing error"
        },
        "9638fb767e2ce81c243568cce6a0d6fe": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "Which patients are medicated via tp route? (Values: TP)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"ROUTE\" = \"TP\"",
            "pred_sql": "SELECT DISTINCT SUBJECT_ID, HADM_ID FROM PRESCRIPTIONS WHERE ROUTE = 'TP'",
            "gold_answer": "[['24.0']]",
            "pred_answer": "[['14755.0', '151669.0'], ['14755.0', '151669.0'], ['17570.0', '183034.0'], ['17570.0', '183034.0'], ['17570.0', '183034.0'], ['22377.0', '120859.0'], ['28588.0', '141664.0'], ['29541.0', '103957.0'], ['29541.0', '103957.0'], ['29961.0', '196409.0'], ['29961.0', '196409.0'], ['29961.0', '196409.0'], ['29961.0', '196409.0'], ['3623.0', '178444.0'], ['3623.0', '178444.0'], ['3623.0', '178444.0'], ['3623.0', '178444.0'], ['3623.0', '178444.0'], ['4333.0', '155027.0'], ['4333.0', '155027.0'], ['4333.0', '155027.0'], ['4333.0', '155027.0'], ['4333.0', '155027.0'], ['4333.0', '155027.0'], ['4589.0', '101114.0'], ['4589.0', '101114.0'], ['4589.0', '101114.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['52012.0', '146937.0'], ['53707.0', '195809.0'], ['62296.0', '193576.0'], ['62296.0', '193576.0'], ['62296.0', '193576.0'], ['65982.0', '141119.0'], ['65982.0', '141119.0'], ['65982.0', '141119.0'], ['66411.0', '178264.0'], ['67965.0', '145657.0'], ['67965.0', '145657.0'], ['71798.0', '122790.0'], ['73843.0', '158983.0'], ['73843.0', '158983.0'], ['83678.0', '172089.0'], ['84129.0', '161253.0'], ['84129.0', '161253.0'], ['8440.0', '137021.0'], ['8440.0', '137021.0'], ['8440.0', '137021.0'], ['8990.0', '113207.0'], ['8990.0', '113207.0'], ['8990.0', '113207.0'], ['8990.0', '113207.0'], ['91588.0', '173731.0'], ['91588.0', '173731.0'], ['94762.0', '160707.0'], ['94762.0', '160707.0'], ['94762.0', '160707.0'], ['98220.0', '189416.0'], ['98220.0', '189416.0'], ['98220.0', '189416.0']]",
            "is_correct": false,
            "reasoning": "The predicted query selects SUBJECT_ID and HADM_ID directly from PRESCRIPTIONS without joining DEMOGRAPHIC and without performing the COUNT DISTINCT aggregation on SUBJECT_ID. This is a structural change: instead of returning a single count of unique patients, it returns many rows of subject\u2010hadm combinations. Fixing this is not a localized tweak (e.g., correcting a column name or syntax); it requires adding the join, changing the SELECT to COUNT(DISTINCT ...), and removing HADM_ID. Therefore, it\u2019s a global error in query structure and logic.",
            "error_type": "Global: structural aggregation error"
        },
        "a95ae3ec84a4478fe2ba16078b12904a": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "find the female patients who have procedure icd9 code 3727. (Values: F)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"F\" AND PROCEDURES.\"ICD9_CODE\" = \"3727\"",
            "pred_sql": "SELECT DISTINCT D.SUBJECT_ID, D.NAME FROM DEMOGRAPHIC AS D INNER JOIN PROCEDURES AS P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE D.GENDER = 'F' AND P.ICD9_CODE = '3727'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['9575.0', 'Melinda Miers']]",
            "is_correct": false,
            "reasoning": "The predicted query uses SELECT DISTINCT D.SUBJECT_ID, D.NAME instead of SELECT COUNT(DISTINCT SUBJECT_ID). The JOIN and WHERE conditions are correct, but the projection/aggregation is wrong. This is an error confined to the SELECT clause and does not require changing the overall query structure or logical flow.",
            "error_type": "Local: select clause error"
        }
    },
    "codes": {
        "a71d8a20f3c1c0d0fc6a9372df547def": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find the patients who have to be tested for ketones with diagnosis of dysphagia nos. (Values: Dysphagia NOS, Ketone)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Dysphagia NOS\" AND LAB.\"LABEL\" = \"Ketone\"",
            "pred_sql": "SELECT demographic.name FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE diagnoses.short_title = 'Dysphagia NOS' AND demographic.name IS NOT NULL AND demographic.name != '' AND (demographic.diagnosis LIKE '%ketone%' OR demographic.diagnosis LIKE '%Ketone%' OR demographic.diagnosis LIKE '%Ketones%' OR demographic.diagnosis LIKE '%Ketones%')",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the LAB table entirely and instead searches for 'ketone' in the DEMOGRAPHIC.DIAGNOSIS column. It also returns patient names rather than counting distinct SUBJECT_IDs as required. This is not a minor syntax mistake or column name error but a fundamental mis-structuring of the query: the necessary INNER JOIN to LAB and the appropriate filter on LAB.LABEL are missing, and the demographic.diagnosis text search is not what the question asks for. Correcting this would require significant changes to the query\u2019s structure and logic.",
            "error_type": "Global: join error"
        },
        "0d4c35f952b8d4ff9c7b0b736d1556f1": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "calculate the total number of patients who had abdomen artery incision. (Values: Abdomen artery incision)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"SHORT_TITLE\" = \"Abdomen artery incision\"",
            "pred_sql": "SELECT count(DISTINCT procedures.subject_id) FROM procedures INNER JOIN diagnoses ON procedures.subject_id = diagnoses.subject_id WHERE diagnoses.short_title = 'Abdomen artery incision'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query logic by using the DIAGNOSES table instead of the PROCEDURES table for both the join and the filter. Rather than counting patients with the specified procedure, it joins PROCEDURES to DIAGNOSES and filters on DIAGNOSES.SHORT_TITLE. This is not a minor syntax or reference issue but a core join/table-selection mistake that alters the query\u2019s intended meaning. Therefore, it is a global error.",
            "error_type": "Global: join error"
        },
        "8cb9d9cd9777cb7de0f280d81e661f92": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the average days of hospital stay of patients who died before year 2154? (Values: 2154.0)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"DAYS_STAY\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DOD_YEAR\" < \"2154.0\"",
            "pred_sql": "SELECT avg(demographic.days_stay) FROM demographic INNER JOIN procedures ON procedures.subject_id = demographic.subject_id WHERE strftime('%Y', demographic.dischtime) < '2154' AND demographic.expire_flag = 1",
            "gold_answer": "[['10.727']]",
            "pred_answer": "[['16.269']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic and structure of the intended query. Instead of simply filtering by the DOD_YEAR column in the DEMOGRAPHIC table, it introduces an unnecessary JOIN to the PROCEDURES table, filters on the DISCHTIME date rather than the date of death, and adds an expire_flag condition that wasn\u2019t in the original requirement. These changes span multiple clauses and alter the intended meaning of the query, so the error is not localized to a single clause but affects the overall query logic.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "a6efda66101f5ee356834b8d407f433a": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find out the number of patients with lab test item id 51245.",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE LAB.\"ITEMID\" = \"51245\"",
            "pred_sql": "SELECT count(hadm_id) FROM lab WHERE itemid = 51245",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only counts the number of lab records (count(hadm_id)) rather than the number of distinct patients (distinct SUBJECT_ID). This mistake is confined to the SELECT clause and aggregation choice, without affecting the overall query structure or table relationships.",
            "error_type": "Local: wrong-aggregation"
        },
        "83e3314b9aa82aaf732ff1c45a51d195": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Is the subject id 74032 married, find his religion ?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"MARITAL_STATUS\",DEMOGRAPHIC.\"RELIGION\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"74032\"",
            "pred_sql": "SELECT religion FROM demographic WHERE subject_id = 74032",
            "gold_answer": "[['MARRIED', 'CATHOLIC']]",
            "pred_answer": "[['CATHOLIC']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only selects the RELIGION column and omits MARITAL_STATUS, thus failing to retrieve whether the subject is married. This is a localized error in the SELECT clause (missing column), not a structural or multi-clause logic error, so it\u2019s a Local error.",
            "error_type": "Local: missing-select-column"
        },
        "86960807966ab11fb4a31cae186af57a": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "count the number of emergency hospital admission patients who had procedure icd9 code 331. (Values: EMERGENCY)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND PROCEDURES.\"ICD9_CODE\" = \"331\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM procedures INNER JOIN demographic ON procedures.hadm_id = demographic.hadm_id WHERE demographic.admission_type = 'EMERGENCY' AND procedures.icd9_code = 331",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['5.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in the SELECT clause\u2019s aggregation: it uses COUNT(demographic.subject_id) instead of COUNT(DISTINCT demographic.subject_id). This is a localized mistake in the aggregate function (missing DISTINCT) and does not alter the overall query structure or joins.",
            "error_type": "Local: aggregation error"
        },
        "0782eff13b2a6fe1c1f0fb94270bb9c4": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "count the number of patients who were admitted before 2158 and had thyroxine (t4) lab test. (Values: Thyroxine (T4))",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2158\" AND LAB.\"LABEL\" = \"Thyroxine (T4)\"",
            "pred_sql": "SELECT count(lab.subject_id) FROM lab INNER JOIN demographic ON lab.hadm_id = demographic.hadm_id WHERE demographic.admittime < '2158' AND lab.itemid = 50982",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses wrong columns in the WHERE clause: it compares demographic.admittime (a datetime) to '2158' instead of admityear, and filters on lab.itemid rather than lab.label = 'Thyroxine (T4)'. These are localized mistakes in column references/conditions and can be corrected without restructuring the query logic.",
            "error_type": "Local: column reference error"
        },
        "9e2bb2a0d86e0e587fb393ad10311fbd": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the number of emergency hospital admission patients who had manual reticulocyte count lab test? (Values: EMERGENCY, Reticulocyte Count, Manual)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"EMERGENCY\" AND LAB.\"LABEL\" = \"Reticulocyte Count, Manual\"",
            "pred_sql": "SELECT count(DISTINCT lab.hadm_id) FROM lab INNER JOIN procedures ON lab.hadm_id = procedures.hadm_id WHERE procedures.icd9_code = '99591' AND lab.label = 'Reticulocyte count (IQR)'",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the tables and filters used: it joins LAB to PROCEDURES instead of DEMOGRAPHIC to LAB, omits the admission_type = 'EMERGENCY' filter, uses an unrelated ICD9 code filter on PROCEDURES, and mismatches the lab label. These errors span multiple clauses and alter the query\u2019s overall logic and intended relationships, not just a single localized mistake.",
            "error_type": "Global: incorrect join and filter"
        },
        "85458bc20e32da11c87969332a42276f": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many male patients had the drug code lipid250i? (Values: M, LIPID250I)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"M\" AND PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" = \"LIPID250I\"",
            "pred_sql": "SELECT count(DISTINCT demographic.subject_id) FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE demographic.gender = 'M' AND prescriptions.drug_type = 'LIPID250I'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the WHERE clause (it filters on prescriptions.drug_type instead of the correct prescriptions.formulary_drug_cd) and also uses the wrong join key (subject_id vs. hadm_id). Both are isolated to specific parts of the query (column reference and join condition) and don\u2019t require restructuring the overall logic\u2014this is a localized error in column usage. Therefore it\u2019s a Local error.",
            "error_type": "Local: column reference error"
        }
    },
    "o4-mini": {
        "8e3b5d9cb36613efab2204fe93749087": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "for patient id 30011, specify the icd9 code and procedural long title.",
            "gold_sql": "SELECT DIAGNOSES.\"LONG_TITLE\",PROCEDURES.\"LONG_TITLE\" FROM DIAGNOSES INNER JOIN PROCEDURES on DIAGNOSES.HADM_ID = PROCEDURES.HADM_ID WHERE DIAGNOSES.\"SUBJECT_ID\" = \"30011\"",
            "pred_sql": "SELECT ICD9_CODE, LONG_TITLE FROM PROCEDURES WHERE SUBJECT_ID = 30011;",
            "gold_answer": "[['Cerebral aneurysm, nonruptured', 'Arteriography of cerebral arteries'], ['Cerebral aneurysm, nonruptured', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Osteoporosis, unspecified', 'Arteriography of cerebral arteries'], ['Osteoporosis, unspecified', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Other and unspecified hyperlipidemia', 'Arteriography of cerebral arteries'], ['Other and unspecified hyperlipidemia', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Pure hypercholesterolemia', 'Arteriography of cerebral arteries'], ['Pure hypercholesterolemia', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Unspecified essential hypertension', 'Arteriography of cerebral arteries'], ['Unspecified essential hypertension', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Unspecified gastritis and gastroduodenitis, without mention of hemorrhage', 'Arteriography of cerebral arteries'], ['Unspecified gastritis and gastroduodenitis, without mention of hemorrhage', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['Urinary tract infection, site not specified', 'Arteriography of cerebral arteries'], ['Urinary tract infection, site not specified', 'Endovascular (total) embolization or occlusion of head and neck vessels']]",
            "pred_answer": "[['3972.0', 'Endovascular (total) embolization or occlusion of head and neck vessels'], ['8841.0', 'Arteriography of cerebral arteries']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only queries the PROCEDURES table and selects its ICD9_CODE and LONG_TITLE, completely omitting the DIAGNOSES table and the necessary join on HADM_ID. Correctly answering the question requires combining information from DIAGNOSES and PROCEDURES (a multi-table join). This mistake affects the overall logic and structure of the query, not just a single clause.",
            "error_type": "Global: missing join/table logic error"
        }
    },
    "qwen3": {
        "8c655677cdaca2684d688418d197aed1": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "find the male patients who have diagnoses icd9 code 5119. (Values: M)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"M\" AND DIAGNOSES.\"ICD9_CODE\" = \"5119\"",
            "pred_sql": "SELECT d.* FROM DEMOGRAPHIC d INNER JOIN DIAGNOSES diag ON d.SUBJECT_ID = diag.SUBJECT_ID AND d.HADM_ID = diag.HADM_ID WHERE d.GENDER = 'M' AND diag.ICD9_CODE = '5119';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['98220.0', '189416.0', 'Bruce Harris', 'MARRIED', '70.0', '2103-11-14 00:00:00', 'M', 'ENGL', 'CATHOLIC', 'EMERGENCY', '23.0', 'Medicare', 'WHITE', '1.0', 'PHYS REFERRAL/NORMAL DELI', 'HOME HEALTH CARE', 'COLANGITIS', '2173-12-24 00:00:00', '2103.0', '2173.0', '2173-08-25 12:58:00', '2173-09-17 15:40:00', '2173.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is joining the tables correctly and applying the right WHERE conditions, but it selects all columns (d.*) instead of returning the COUNT(DISTINCT SUBJECT_ID). This is a mistake confined to the SELECT clause and does not alter the overall query structure or logic of the joins and filters. Therefore, it is a localized error in the projection.",
            "error_type": "Local: wrong-select-clause"
        }
    },
    "llm2sql": {
        "06e87f96c060a82f8f490899e8cd2b2e": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients are diagnosed with primary disease acidosis and are below 79 years of age? (Values: ACIDOSIS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"ACIDOSIS\" AND DEMOGRAPHIC.\"AGE\" < \"79\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM DIAGNOSES d JOIN DEMOGRAPHIC dem ON d.SUBJECT_ID = dem.SUBJECT_ID AND d.HADM_ID = dem.HADM_ID WHERE (d.SHORT_TITLE LIKE '%ACIDOSIS%' OR d.LONG_TITLE LIKE '%ACIDOSIS%') AND dem.AGE < 79;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['8.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query logic by joining the DIAGNOSES table and filtering on diagnosis titles rather than using the DEMOGRAPHIC.DIAGNOSIS field as the primary disease. This alters the data source and retrieval logic, returning all patients with any diagnosis containing 'ACIDOSIS' instead of those whose primary disease is recorded as 'ACIDOSIS'. Such a change affects the overall structure and purpose of the query, not just a localized clause fix.",
            "error_type": "Global: join error"
        },
        "8c182c6e8b8ec7c9edf817d41ad093ae": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "Calculate the average age of spanish speaking patients who have overdose as the primary disease. (Values: SPAN, OVERDOSE)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"LANGUAGE\" = \"SPAN\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"OVERDOSE\"",
            "pred_sql": "SELECT AVG(D.DEMOGRAPHIC.AGE) FROM DEMOGRAPHIC D JOIN DIAGNOSES DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE D.LANGUAGE = 'SPAN' AND (DI.SHORT_TITLE LIKE '%OVERDOSE%' OR DI.LONG_TITLE LIKE '%OVERDOSE%');",
            "gold_answer": "[['None']]",
            "pred_answer": "no such column: D.DEMOGRAPHIC.AGE",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references a non\u2010existent column alias D.DEMOGRAPHIC.AGE instead of D.AGE. This is a simple column reference mistake in the SELECT clause and does not involve any broader structural or logical flaw in the query.",
            "error_type": "Local: column reference error"
        }
    },
    "deepseek": {
        "bb19be85af3e917061a124154ac4818b": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "What is the total number of patients who died in or before the year 2111? (Values: 2111.0)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DOD_YEAR\" <= \"2111.0\"",
            "pred_sql": "error in generating sql: No",
            "gold_answer": "[['1.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is not even a valid query but an error message instead of SQL code. This is a localized syntax/format error in the prediction rather than a structural or logical flaw in the query design. It does not require rethinking the overall query logic, just producing valid SQL.",
            "error_type": "Local: syntax error"
        },
        "96c7391dfa5656e7563b51eacaee15a7": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "find out the type of admission and lab test ordered for patient with patient id 18480.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"ADMISSION_TYPE\",LAB.\"LABEL\" FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"18480\"",
            "pred_sql": "SELECT D.ADMISSION_TYPE, L.LABEL AS LAB_TEST, L.CHARTTIME FROM DEMOGRAPHIC D JOIN LAB L ON D.SUBJECT_ID = L.SUBJECT_ID AND D.HADM_ID = L.HADM_ID WHERE D.SUBJECT_ID = 18480;",
            "gold_answer": "[['EMERGENCY', 'Alanine Aminotransferase (ALT)'], ['EMERGENCY', 'Alkaline Phosphatase'], ['EMERGENCY', 'Anion Gap'], ['EMERGENCY', 'Asparate Aminotransferase (AST)'], ['EMERGENCY', 'Basophils'], ['EMERGENCY', 'Bicarbonate'], ['EMERGENCY', 'Bilirubin, Total'], ['EMERGENCY', 'Calcium, Total'], ['EMERGENCY', 'Calcium, Total'], ['EMERGENCY', 'Chloride'], ['EMERGENCY', 'Creatine Kinase (CK)'], ['EMERGENCY', 'Creatine Kinase (CK)'], ['EMERGENCY', 'Creatine Kinase, MB Isoenzyme'], ['EMERGENCY', 'Creatine Kinase, MB Isoenzyme'], ['EMERGENCY', 'Creatinine'], ['EMERGENCY', 'Creatinine'], ['EMERGENCY', 'Eosinophils'], ['EMERGENCY', 'Glucose'], ['EMERGENCY', 'Glucose'], ['EMERGENCY', 'Hematocrit'], ['EMERGENCY', 'Hemoglobin'], ['EMERGENCY', 'Lymphocytes'], ['EMERGENCY', 'MCH'], ['EMERGENCY', 'MCHC'], ['EMERGENCY', 'MCV'], ['EMERGENCY', 'Magnesium'], ['EMERGENCY', 'Magnesium'], ['EMERGENCY', 'Monocytes'], ['EMERGENCY', 'Neutrophils'], ['EMERGENCY', 'PT'], ['EMERGENCY', 'PTT'], ['EMERGENCY', 'Phosphate'], ['EMERGENCY', 'Platelet Count'], ['EMERGENCY', 'Potassium'], ['EMERGENCY', 'Potassium'], ['EMERGENCY', 'Potassium, Whole Blood'], ['EMERGENCY', 'RDW'], ['EMERGENCY', 'Red Blood Cells'], ['EMERGENCY', 'Sodium'], ['EMERGENCY', 'Sodium'], ['EMERGENCY', 'Troponin T'], ['EMERGENCY', 'Troponin T'], ['EMERGENCY', 'Urea Nitrogen'], ['EMERGENCY', 'Urea Nitrogen'], ['EMERGENCY', 'White Blood Cells']]",
            "pred_answer": "[['EMERGENCY', 'Alanine Aminotransferase (ALT)', '2138-07-18 07:30:00'], ['EMERGENCY', 'Alkaline Phosphatase', '2138-07-18 07:30:00'], ['EMERGENCY', 'Anion Gap', '2138-07-18 00:30:00'], ['EMERGENCY', 'Asparate Aminotransferase (AST)', '2138-07-18 07:30:00'], ['EMERGENCY', 'Basophils', '2138-07-18 00:30:00'], ['EMERGENCY', 'Bicarbonate', '2138-07-18 00:30:00'], ['EMERGENCY', 'Bilirubin, Total', '2138-07-18 07:30:00'], ['EMERGENCY', 'Calcium, Total', '2138-07-18 00:30:00'], ['EMERGENCY', 'Calcium, Total', '2138-07-18 07:30:00'], ['EMERGENCY', 'Chloride', '2138-07-18 00:30:00'], ['EMERGENCY', 'Creatine Kinase (CK)', '2138-07-18 00:30:00'], ['EMERGENCY', 'Creatine Kinase (CK)', '2138-07-18 07:30:00'], ['EMERGENCY', 'Creatine Kinase, MB Isoenzyme', '2138-07-18 00:30:00'], ['EMERGENCY', 'Creatine Kinase, MB Isoenzyme', '2138-07-18 07:30:00'], ['EMERGENCY', 'Creatinine', '2138-07-18 00:30:00'], ['EMERGENCY', 'Creatinine', '2138-07-18 07:30:00'], ['EMERGENCY', 'Eosinophils', '2138-07-18 00:30:00'], ['EMERGENCY', 'Glucose', '2138-07-18 00:30:00'], ['EMERGENCY', 'Glucose', '2138-07-18 07:30:00'], ['EMERGENCY', 'Hematocrit', '2138-07-18 00:30:00'], ['EMERGENCY', 'Hemoglobin', '2138-07-18 00:30:00'], ['EMERGENCY', 'Lymphocytes', '2138-07-18 00:30:00'], ['EMERGENCY', 'MCH', '2138-07-18 00:30:00'], ['EMERGENCY', 'MCHC', '2138-07-18 00:30:00'], ['EMERGENCY', 'MCV', '2138-07-18 00:30:00'], ['EMERGENCY', 'Magnesium', '2138-07-18 00:30:00'], ['EMERGENCY', 'Magnesium', '2138-07-18 07:30:00'], ['EMERGENCY', 'Monocytes', '2138-07-18 00:30:00'], ['EMERGENCY', 'Neutrophils', '2138-07-18 00:30:00'], ['EMERGENCY', 'PT', '2138-07-18 00:30:00'], ['EMERGENCY', 'PTT', '2138-07-18 00:30:00'], ['EMERGENCY', 'Phosphate', '2138-07-18 00:30:00'], ['EMERGENCY', 'Platelet Count', '2138-07-18 00:30:00'], ['EMERGENCY', 'Potassium', '2138-07-18 00:30:00'], ['EMERGENCY', 'Potassium', '2138-07-18 07:30:00'], ['EMERGENCY', 'Potassium, Whole Blood', '2138-07-18 02:04:00'], ['EMERGENCY', 'RDW', '2138-07-18 00:30:00'], ['EMERGENCY', 'Red Blood Cells', '2138-07-18 00:30:00'], ['EMERGENCY', 'Sodium', '2138-07-18 00:30:00'], ['EMERGENCY', 'Sodium', '2138-07-18 07:30:00'], ['EMERGENCY', 'Troponin T', '2138-07-18 00:30:00'], ['EMERGENCY', 'Troponin T', '2138-07-18 07:30:00'], ['EMERGENCY', 'Urea Nitrogen', '2138-07-18 00:30:00'], ['EMERGENCY', 'Urea Nitrogen', '2138-07-18 07:30:00'], ['EMERGENCY', 'White Blood Cells', '2138-07-18 00:30:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the correct tables and join conditions (it even redundantly joins on SUBJECT_ID and HADM_ID, which doesn\u2019t alter the result), and the WHERE clause correctly filters SUBJECT_ID = 18480. The only mistake is that the SELECT clause includes an extra column (L.CHARTTIME) which was not asked for. This is a localized error in the SELECT projection and does not affect the overall query structure or logic.",
            "error_type": "Local: projection error"
        }
    }
}