{
    "deepseek": {
        "ade0c7463c725d9219e5712adb45de85": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "count the number of married patients who have acute myocardial infarction of inferolateral wall, initial episode of care diagnoses. (Values: MARRIED, AMI inferolateral, init)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"MARITAL_STATUS\" = \"MARRIED\" AND DIAGNOSES.\"SHORT_TITLE\" = \"AMI inferolateral, init\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC AS D JOIN DIAGNOSES AS Diag ON D.SUBJECT_ID = Diag.SUBJECT_ID AND D.HADM_ID = Diag.HADM_ID WHERE D.MARITAL_STATUS = 'MARRIED' AND Diag.ICD9_CODE = '41062';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s error is limited to the WHERE clause filter: it uses Diag.ICD9_CODE = '41062' instead of matching the SHORT_TITLE = 'AMI inferolateral, init'. All other joins and query structure mirror the ground truth. This is a localized mistake in the filter condition and doesn\u2019t require changing the overall query logic or joins.",
            "error_type": "Local: incorrect filter column/value"
        },
        "0b323ac6dda39e3588c51d5acb16b4fc": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "how many of the patients had hemorrhage complicating a procedure? (Values: Hemorrhage complicating a procedure)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"LONG_TITLE\" = \"Hemorrhage complicating a procedure\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM PROCEDURES WHERE ICD9_CODE = '9981';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL entirely uses the PROCEDURES table and the ICD9_CODE column, whereas the question refers to the LONG_TITLE in the DIAGNOSES table. This is not a minor syntax or column name mistake but a fundamental change in the data source and logic of the query. It alters the intended join and target table, leading to incorrect results. Such an error affects the overall query structure and logic, so it is a Global error.",
            "error_type": "Global: wrong-table error"
        },
        "9cfe1b1262ebc011c0cd636a6bd1b9f7": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Calculate the total number of patients on elective admission before the year 2108 (Values: ELECTIVE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_TYPE\" = \"ELECTIVE\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2108\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) AS TOTAL_ELECTIVE_PATIENTS FROM DEMOGRAPHIC WHERE ADMISSION_TYPE = 'ELECTIVE' AND YEAR(ADMITTIME) < 2108;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the YEAR() function on the ADMITTIME column, which is not supported in SQLite, resulting in the \u201cno such function: YEAR\u201d error. This mistake is confined to a specific part of the WHERE clause and does not affect the overall join structure or query logic. It can be fixed by extracting the year using a supported SQLite function or by comparing the ADMITYEAR field as in the ground truth, without restructuring the query.",
            "error_type": "Local: function usage error"
        },
        "089c48c2efaae378b3bf7ee0d9fa4894": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "count the number of patients admitted before 2200 who had endoscopic removal of stone(s) from biliary tract. (Values: Endoscopic removal of stone(s) from biliary tract)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2200\" AND PROCEDURES.\"LONG_TITLE\" = \"Endoscopic removal of stone(s) from biliary tract\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC D JOIN PROCEDURES P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE P.ICD9_CODE = '3910' AND YEAR(D.ADMITTIME) < 2200;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a non-existent SQLite function YEAR(D.ADMITTIME) and also mismatches on P.ICD9_CODE instead of filtering by the LONG_TITLE. Both issues are confined to specific expressions (a wrong function call and wrong filter column) and do not require restructuring the overall join or query logic. Hence this is a local error.",
            "error_type": "Local: other-temporal error"
        }
    },
    "codes": {
        "aa94e974b8ee66950b649251ba9090dc": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients are less than 31 year old with a chemistry lab test category? (Values: Chemistry)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"31\" AND LAB.\"CATEGORY\" = \"Chemistry\"",
            "pred_sql": "SELECT count(lab.subject_id) FROM lab INNER JOIN diagnoses ON lab.subject_id = diagnoses.subject_id INNER JOIN demographic ON demographic.subject_id = lab.subject_id WHERE lab.category = 'Chemistry' AND demographic.age < 31",
            "gold_answer": "[['23.0']]",
            "pred_answer": "[['3869.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an unnecessary join to the DIAGNOSES table and joins tables only on SUBJECT_ID rather than matching HADM_ID, which changes the set of patients counted and multiplies rows. It also omits DISTINCT, counting each lab record rather than unique patients. These mistakes alter the overall query logic and data associations, so fixing them requires restructuring the joins and aggregation, not just a local tweak.",
            "error_type": "Global: incorrect join logic"
        },
        "0a1dcb8cb5d013e3feb7229a7b8ac869": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Get me the number of patients who had a urine magnesium lab test. (Values: Magnesium, Urine)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE LAB.\"LABEL\" = \"Magnesium, Urine\"",
            "pred_sql": "SELECT count(DISTINCT lab.subject_id) FROM lab INNER JOIN demographic ON lab.subject_id = demographic.subject_id WHERE lab.itemid = 50968",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs in the WHERE clause filter: it uses lab.itemid = 50968 instead of lab.label = 'Magnesium, Urine'. The JOIN and overall structure remain correct. This is a localized mistake in the filter condition (wrong column/value), so it can be fixed without altering the query\u2019s structure or logic flow.",
            "error_type": "Local: incorrect filter column"
        },
        "0a1afd3f6a8a58a11490424176d9f026": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find the item id of kelly gallardo. (Values: Kelly Gallardo)",
            "gold_sql": "SELECT LAB.\"ITEMID\" FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Kelly Gallardo\"",
            "pred_sql": "SELECT itemid FROM lab WHERE label = 'KELLY GALLARDO'",
            "gold_answer": "[['50868.0'], ['50882.0'], ['50883.0'], ['50883.0'], ['50884.0'], ['50884.0'], ['50885.0'], ['50885.0'], ['50902.0'], ['50971.0'], ['50983.0'], ['51143.0'], ['51144.0'], ['51146.0'], ['51200.0'], ['51221.0'], ['51222.0'], ['51244.0'], ['51248.0'], ['51249.0'], ['51250.0'], ['51251.0'], ['51254.0'], ['51255.0'], ['51256.0'], ['51257.0'], ['51265.0'], ['51277.0'], ['51279.0'], ['51301.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query uses the LAB table and its LABEL column to filter by 'KELLY GALLARDO', but the patient\u2019s name resides in the DEMOGRAPHIC.NAME column. It omits the DEMOGRAPHIC\u2192LAB join entirely and uses the wrong column for filtering, causing no results. This is a simple table/column reference mistake rather than a structural or multi-clause logic error.",
            "error_type": "Local: table/column reference error"
        },
        "06bbd920c4191e622346b9c33d8b0f43": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the number of living patients diagnosed with suicide and self-inflicted poisoning by analgesics, antipyretics, and antirheumatics? (Values: 0, Suicide and self-inflicted poisoning by analgesics, antipyretics, and antirheumatics)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"0\" AND DIAGNOSES.\"LONG_TITLE\" = \"Suicide and self-inflicted poisoning by analgesics, antipyretics, and antirheumatics\"",
            "pred_sql": "SELECT count(DISTINCT demographic.subject_id) FROM diagnoses INNER JOIN demographic ON diagnoses.hadm_id = demographic.hadm_id WHERE diagnoses.icd9_code IN (387, 388, 389) AND demographic.expire_flag = 0",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL error lies solely in the WHERE clause: it filters on diagnoses.icd9_code IN (387, 388, 389) instead of matching the specified LONG_TITLE and the exact expire_flag value. The join, counting, and overall structure remain correct. This is a localized mistake in the filtering condition and does not require restructuring the query or altering joins.",
            "error_type": "Local: incorrect WHERE clause predicate"
        },
        "0cdaeea27c2f1e7de2ef4c3f9622d5cb": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "let me know the type of admission patient ida cook had. (Values: Ida Cook)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"ADMISSION_TYPE\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Ida Cook\"",
            "pred_sql": "SELECT DISTINCT admission_type FROM demographic WHERE subject_id = 25543",
            "gold_answer": "[['EMERGENCY']]",
            "pred_answer": "[['NEWBORN']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses `subject_id = 25543` instead of filtering on `NAME = 'Ida Cook'` as required by the question. The overall query structure (SELECT admission_type FROM demographic) is correct; only the WHERE clause\u2019s column and literal value are wrong. This is a localized mistake that can be fixed by replacing the filter with the proper column and value.",
            "error_type": "Local: value parsing error"
        },
        "06f15c6be771186668997528e52270cb": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "tell me the gender of patient stephanie suchan. (Values: Stephanie Suchan)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"GENDER\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Stephanie Suchan\"",
            "pred_sql": "SELECT demographic.gender FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE prescriptions.drug = 'Stephanie Suchan'",
            "gold_answer": "[['F']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query incorrectly joins the DEMOGRAPHIC table with PRESCRIPTIONS and filters on prescriptions.drug instead of simply selecting the GENDER from DEMOGRAPHIC where NAME matches 'Stephanie Suchan'. This is not a small typo or localized mistake but a fundamental change to the query\u2019s structure and logic\u2014using the wrong table and column for filtering and introducing an unnecessary join that alters the intended meaning of the query.",
            "error_type": "Global: incorrect join logic"
        },
        "ad0222178143c1561a0a8a027757997f": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find the maximum age of patients with government insurance who expired before the year 2154. (Values: Government, 2154.0)",
            "gold_sql": "SELECT MAX ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"INSURANCE\" = \"Government\" AND DEMOGRAPHIC.\"DOD_YEAR\" < \"2154.0\"",
            "pred_sql": "SELECT max(demographic.age) FROM demographic INNER JOIN insurance ON demographic.subject_id = insurance.subject_id WHERE demographic.expire_flag = 1 AND strftime('%Y', insurance.insurance) = '2154'",
            "gold_answer": "[['None']]",
            "pred_answer": "no such table: insurance",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent table 'insurance', which is not part of the provided schema. This is a table reference error, a localized issue that can be fixed by correcting or removing the invalid table reference without altering the overall query structure.",
            "error_type": "Local: table reference error"
        },
        "81246894ba88abc13f0ae732be0ae33f": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many black/haitian patients have phenylephrine medication prescription? (Values: BLACK/HAITIAN, Phenylephrine)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"BLACK/HAITIAN\" AND PRESCRIPTIONS.\"DRUG\" = \"Phenylephrine\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE demographic.ethnicity = 'BLACK/HAITIAN' AND prescriptions.drug = 'Phenylephrine'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses an incorrect join key (demographic.subject_id = prescriptions.subject_id) instead of the correct hospital admission ID (hadm_id). This fundamentally alters the intended logic by linking prescriptions across different admissions for the same patient, resulting in an inflated count and incorrect associations. Fixing this requires changing the join structure, so it\u2019s a global error.",
            "error_type": "Global: incorrect join key"
        },
        "9c05a565ee5d9c64aaf12d921d02d4c9": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "among the patients who were treated with pravastatin, how many of them were aged below 72? (Values: Pravastatin)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"72\" AND PRESCRIPTIONS.\"DRUG\" = \"Pravastatin\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE prescriptions.drug = 'Pravastatin' AND demographic.age < 72",
            "gold_answer": "[['6.0']]",
            "pred_answer": "[['8.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the ground truth in two specific, fixable parts: (1) it joins DEMOGRAPHIC and PRESCRIPTIONS on SUBJECT_ID instead of HADM_ID, and (2) it omits the DISTINCT in COUNT to ensure unique patients. Both issues are localized to the JOIN clause and the SELECT aggregation and do not require restructuring the overall query logic.",
            "error_type": "Local: join-condition error"
        },
        "81b4faef3515b239d74fcabdef8c1a42": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "How many patients born before the year 2170 had a lab test named other cells? (Values: Other Cells)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DOB_YEAR\" < \"2170\" AND LAB.\"LABEL\" = \"Other Cells\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.subject_id = lab.subject_id WHERE lab.label = 'Other Cells' AND demographic.dob_year < 2170",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted query joins DEMOGRAPHIC and LAB on demographic.subject_id = lab.subject_id instead of using the hadm_id relationship as in the ground truth, and it also omits the DISTINCT in the COUNT, causing over\u2010counting of patients with multiple lab entries. The incorrect join key changes the fundamental data relationship and thus the meaning of the query, requiring a structural fix rather than a simple tweak in one clause.",
            "error_type": "Global: incorrect-join error"
        },
        "8758789c5295576a106780e5c140c9bd": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "calculate the maximum days for which patients who died before 2164 stayed in hospital. (Values: 2164.0)",
            "gold_sql": "SELECT MAX ( DEMOGRAPHIC.\"DAYS_STAY\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DOD_YEAR\" < \"2164.0\"",
            "pred_sql": "SELECT max(demographic.dischtime - demographic.admittime) FROM demographic INNER JOIN procedures ON demographic.subject_id = procedures.subject_id WHERE procedures.icd9_code = 4240 AND demographic.expire_flag = 1 AND demographic.dischtime LIKE '2164%'",
            "gold_answer": "[['34.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely diverges from the intended logic: it joins the PROCEDURES table using an unrelated ICD9 code filter, applies an expire_flag and dischtime LIKE condition, and computes a timestamp difference instead of using the DAYS_STAY column and filtering by DOD_YEAR < 2164.0. This is not a localized syntax or reference mistake but a fundamental structural and logical error that alters the query\u2019s purpose, requiring a significant rewrite of multiple clauses.",
            "error_type": "Global: incorrect join strategy"
        },
        "879e430064f5011919b19ba70a193bc9": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "give me the number of patients who were diagnosed under icd9 code 76528 and also their lab test category is chemistry. (Values: Chemistry)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DIAGNOSES.\"ICD9_CODE\" = \"76528\" AND LAB.\"CATEGORY\" = \"Chemistry\"",
            "pred_sql": "SELECT count(diagnoses.subject_id) FROM lab INNER JOIN diagnoses ON lab.subject_id = diagnoses.subject_id WHERE diagnoses.icd9_code = 76528 AND lab.category = 'Chemistry'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['36.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins LAB and DIAGNOSES only on subject_id rather than hadm_id and does not use DISTINCT, thereby changing the intended logic of counting unique patients per admission with both the specific diagnosis and lab category. This is not a minor syntax or column reference mistake but an incorrect join strategy that fundamentally alters the query\u2019s meaning and results.",
            "error_type": "Global: incorrect join key"
        }
    },
    "o4-mini": {
        "06309c2f77f11d404ae955cf4e39d47b": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "provide the number of patients whose diagnosis short title is dmi keto nt st uncontrolled and lab test category is blood gas. (Values: DMI keto nt st uncntrld, Blood Gas)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"DMI keto nt st uncntrld\" AND LAB.\"CATEGORY\" = \"Blood Gas\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) AS num_patients FROM DIAGNOSES d JOIN LAB l ON d.SUBJECT_ID = l.SUBJECT_ID AND d.HADM_ID = l.HADM_ID WHERE d.SHORT_TITLE = 'DMI KETO NT ST UNCNTRLD' AND l.CATEGORY = 'Blood Gas';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally correct\u2014it joins the same tables (DIAGNOSES and LAB) on the correct keys and counts distinct SUBJECT_ID. The only difference is that the predicted query uses a differently cased string literal for SHORT_TITLE ('DMI KETO NT ST UNCNTRLD' instead of 'DMI keto nt st uncntrld'), causing no rows to match under SQLite\u2019s default case-sensitive comparison. This is a localized issue in the WHERE clause and can be fixed by adjusting the literal. Therefore it is a Local error.",
            "error_type": "Local: value parsing error"
        }
    },
    "qwen3": {
        "8412f1e49973d10caff572e2e132ff72": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "How many of the patients admitted before 2112 were diagnosed with chest pain nec? (Values: Chest pain NEC)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2112\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Chest pain NEC\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM DEMOGRAPHIC d JOIN DIAGNOSES diag ON d.SUBJECT_ID = diag.SUBJECT_ID AND d.HADM_ID = diag.HADM_ID WHERE EXTRACT(YEAR FROM d.ADMITTIME) < 2112 AND diag.SHORT_TITLE = 'Chest pain NEC';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"FROM\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the EXTRACT(YEAR FROM d.ADMITTIME) function, which is not supported in SQLite. This is a localized syntax error in the WHERE clause (temporal extraction), not a flaw in the overall query logic or table relationships. It can be fixed by replacing EXTRACT with a supported SQLite date function or using the ADMITYEAR column as in the ground truth. Therefore this is a Local error.",
            "error_type": "Local: other-temporal error"
        }
    },
    "macsql": {
        "89a92f1bd2e74cecb90195b6d5cd860f": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "what is the admission type and lab test name for the patient id 2560?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"ADMISSION_TYPE\",LAB.\"LABEL\" FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"2560\"",
            "pred_sql": "SELECT DISTINCT `LABEL` FROM LAB WHERE `SUBJECT_ID` = 2560",
            "gold_answer": "[['NEWBORN', 'Atypical Lymphocytes'], ['NEWBORN', 'Bands'], ['NEWBORN', 'Basophils'], ['NEWBORN', 'Bilirubin, Direct'], ['NEWBORN', 'Bilirubin, Indirect'], ['NEWBORN', 'Bilirubin, Total'], ['NEWBORN', 'Eosinophils'], ['NEWBORN', 'Hematocrit'], ['NEWBORN', 'Hemoglobin'], ['NEWBORN', 'Lymphocytes'], ['NEWBORN', 'MCH'], ['NEWBORN', 'MCHC'], ['NEWBORN', 'MCV'], ['NEWBORN', 'Metamyelocytes'], ['NEWBORN', 'Monocytes'], ['NEWBORN', 'Myelocytes'], ['NEWBORN', 'Neutrophils'], ['NEWBORN', 'Nucleated Red Cells'], ['NEWBORN', 'Platelet Count'], ['NEWBORN', 'RDW'], ['NEWBORN', 'Red Blood Cells'], ['NEWBORN', 'White Blood Cells']]",
            "pred_answer": "[['Atypical Lymphocytes'], ['Bands'], ['Basophils'], ['Bilirubin, Direct'], ['Bilirubin, Indirect'], ['Bilirubin, Total'], ['Eosinophils'], ['Hematocrit'], ['Hemoglobin'], ['Lymphocytes'], ['MCH'], ['MCHC'], ['MCV'], ['Metamyelocytes'], ['Monocytes'], ['Myelocytes'], ['Neutrophils'], ['Nucleated Red Cells'], ['Platelet Count'], ['RDW'], ['Red Blood Cells'], ['White Blood Cells']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the DEMOGRAPHIC table entirely, fails to join DEMOGRAPHIC and LAB on HADM_ID, and does not select the admission type. Instead, it only retrieves distinct lab labels. This error affects the overall query logic and structure, as it removes a required table and key join and changes the intended output columns, so it cannot be fixed locally within a clause.",
            "error_type": "Global: missing join and projection"
        }
    },
    "llm2sql": {
        "ad68c7f37e76a07bb9df8bbd457cb210": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients year of birth is before 1821 with lab test lactate dehydrogenase csf? (Values: Lactate Dehydrogenase, CSF)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DOB_YEAR\" < \"1821\" AND LAB.\"LABEL\" = \"Lactate Dehydrogenase, CSF\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) nFROM DEMOGRAPHIC D nJOIN LAB L ON D.SUBJECT_ID = L.SUBJECT_ID AND D.HADM_ID = L.HADM_ID nWHERE D.DOB_YEAR < 1821 AND L.LABEL = 'Lactate Dehydrogenase' AND L.CATEGORY = 'CSF';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"DEMOGRAPHIC\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL has two localized mistakes: a syntax error where newline markers (\u2018nFROM\u2019, \u2018nJOIN\u2019, \u2018nWHERE\u2019) are run together causing a parsing failure, and an incorrect WHERE predicate that splits the lab label into L.LABEL and L.CATEGORY instead of matching the single string \u201cLactate Dehydrogenase, CSF\u201d. Both issues are contained within a single clause and do not require restructuring the entire query.",
            "error_type": "Local: syntax and predicate error"
        }
    }
}