{
    "llm2sql": {
        "aa81098d9bbd712002641a023ad9c2ed": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the number of government health insurance patients who had laryngoscopy and other tracheoscopy procedure? (Values: Government, Laryngoscopy and other tracheoscopy)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"INSURANCE\" = \"Government\" AND PROCEDURES.\"LONG_TITLE\" = \"Laryngoscopy and other tracheoscopy\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) nFROM DEMOGRAPHIC D nJOIN PROCEDURES P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID nWHERE D.INSURANCE LIKE '%Government%' nAND P.LONG_TITLE LIKE '%Laryngoscopy and other tracheoscopy%';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"DEMOGRAPHIC\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to execute due to a syntax error: it includes 'nFROM' and 'nJOIN' instead of proper newline or space before FROM and JOIN, causing an immediate parse error near 'DEMOGRAPHIC'. This is a localized formatting/syntax mistake in the SELECT/JOIN clauses, not a fundamental mis\u2010join or logic flaw.",
            "error_type": "Local: syntax error"
        }
    },
    "qwen3": {
        "9391ab36c2bddfe0cf474a3d26392232": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "find the number of russian speaking patients who are diagnosed with proteus infection nos. (Values: RUSS, Proteus infection NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"LANGUAGE\" = \"RUSS\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Proteus infection NOS\"",
            "pred_sql": "SELECT COUNT(*) FROM DEMOGRAPHIC WHERE LANGUAGE = 'RUSS' AND DIAGNOSIS = 'Proteus infection NOS';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly filters on DEMOGRAPHIC.DIAGNOSIS instead of joining to the DIAGNOSES table and filtering on DIAGNOSES.SHORT_TITLE. This is a localized mistake in the WHERE clause/table reference and does not require restructuring the entire query logic\u2014simply correcting the join and column reference would fix it.",
            "error_type": "Local: table/column reference error"
        }
    },
    "codes": {
        "95f8a3f0cc5f6486ee39cf3575176b39": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the marital status and the ethnic group of subject id 30011?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"MARITAL_STATUS\",DEMOGRAPHIC.\"ETHNICITY\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"30011\"",
            "pred_sql": "SELECT marital_status FROM demographic WHERE subject_id = 30011",
            "gold_answer": "[['SINGLE', 'HISPANIC OR LATINO']]",
            "pred_answer": "[['SINGLE']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only selects marital_status and omits the ethnicity column. This is a local issue in the SELECT clause (a missing column) and does not affect the overall query structure or logic.",
            "error_type": "Local: missing column"
        },
        "021ebbc73156e10c78d02f72ff647325": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Count the number of patients that survived and had a procedure icd9 code of 331. (Values: 0)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"0\" AND PROCEDURES.\"ICD9_CODE\" = \"331\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM procedures INNER JOIN demographic ON procedures.subject_id = demographic.subject_id WHERE procedures.icd9_code = 331 AND demographic.expire_flag = 0",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses an INNER JOIN on procedures.subject_id = demographic.subject_id instead of joining on the admission identifier (HADM_ID) as in the ground truth. This incorrect join key fundamentally alters which rows are paired and thus changes the query\u2019s results. Additionally, the predicted version omits the DISTINCT on SUBJECT_ID, further changing the intended patient count. Both issues go beyond a localized syntax fix and affect the overall logic and table relationships.",
            "error_type": "Global: incorrect join key"
        },
        "ab0da7d05a345b85c091b469d2dc2d98": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Specify the discharge location of patient Dona Cole along with the ICU stay ID",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DISCHARGE_LOCATION\",PRESCRIPTIONS.\"ICUSTAY_ID\" FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Dona Cole\"",
            "pred_sql": "SELECT discharge_location, icustay_id FROM demographic WHERE name = 'Dona Cole'",
            "gold_answer": "[['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None'], ['HOME', 'None']]",
            "pred_answer": "no such column: icustay_id",
            "is_correct": false,
            "reasoning": "The predicted SQL references the column icustay_id from the DEMOGRAPHIC table, but that column does not exist there. The correct query joins DEMOGRAPHIC with PRESCRIPTIONS to retrieve ICUSTAY_ID. This is a localized column reference error that can be fixed by adding the proper JOIN rather than restructuring the overall logic.",
            "error_type": "Local: column reference error"
        },
        "870f671294fda99c32cc17f92aad78a8": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients had the diagnosis long title hemochromatosis due to repeated red blood cell transfusions? (Values: Hemochromatosis due to repeated red blood cell transfusions)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"LONG_TITLE\" = \"Hemochromatosis due to repeated red blood cell transfusions\"",
            "pred_sql": "SELECT count(DISTINCT diagnoses.subject_id) FROM diagnoses INNER JOIN procedures ON diagnoses.subject_id = procedures.subject_id WHERE procedures.long_title LIKE 'Hemochromatosis due to repeated red blood cell transfusions'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended logic by joining the DIAGNOSES table to the PROCEDURES table on subject_id and filtering on procedures.long_title. The correct query should filter DIAGNOSES.long_title and join DIAGNOSES to DEMOGRAPHIC on hadm_id. This is not a minor syntax or column reference mistake but a structural error in choosing the wrong table and join relationship, altering the query\u2019s overall meaning.",
            "error_type": "Global: incorrect join table"
        },
        "952343ad7bc01827ae39783f6285e3d6": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "let me know the drug code of midazolam hcl medication. (Values: Midazolam HCl)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"DRUG\" = \"Midazolam HCl\"",
            "pred_sql": "SELECT formulary_drug_cd FROM prescriptions WHERE drug LIKE 'Midazolam%'",
            "gold_answer": "[['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I']]",
            "pred_answer": "[['MIDA100'], ['MIDA100'], ['MIDA100'], ['MIDA100'], ['MIDA100'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA2I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I'], ['MIDA50I']]",
            "is_correct": false,
            "reasoning": "The only difference is in the WHERE clause: the predicted SQL uses an overly broad LIKE 'Midazolam%' filter instead of the exact match DRUG = 'Midazolam HCl'. This is a localized error in the condition, not affecting the overall query structure or JOINs. It can be fixed by adjusting the predicate to use the correct equality operator and full string. Therefore, it is a Local error.",
            "error_type": "Local: value parsing error"
        },
        "08e84aa74e5e3adb7969241939f3af64": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "How many patients used the drug code ergo400t? (Values: ERGO400T)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" = \"ERGO400T\"",
            "pred_sql": "SELECT count(subject_id) FROM prescriptions WHERE formulary_drug_cd = 'ERGO400T'",
            "gold_answer": "[['8.0']]",
            "pred_answer": "[['9.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts all prescription rows matching the drug code rather than counting distinct patient IDs. It omits the DISTINCT keyword (and the join to ensure proper patient identification), leading to an overcount. This is a localized issue in the SELECT clause and does not require restructuring the overall query logic.",
            "error_type": "Local: missing-distinct error"
        },
        "964051ea9739d5463dc623efb7016c1e": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the lab category forJerry Deberry?",
            "gold_sql": "SELECT LAB.\"CATEGORY\" FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Jerry Deberry\"",
            "pred_sql": "SELECT category FROM lab WHERE subject_id = 1121",
            "gold_answer": "[['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas']]",
            "pred_answer": "[['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Blood Gas'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry'], ['Chemistry']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it filters on LAB.subject_id instead of filtering DEMOGRAPHIC.NAME = 'Jerry Deberry' and joining DEMOGRAPHIC to LAB by hadm_id. This is a mistake confined to the WHERE clause (wrong column reference and missing join), and can be fixed by using the correct column and join. It does not require restructuring the overall query logic or altering multiple clauses.",
            "error_type": "Local: column reference error"
        }
    },
    "deepseek": {
        "ace7d9f8651d4d512565d6be3b6a9a6c": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Out of total number of patients who had a lab test for pleural fluid, how many of them were born before 2089? (Values: Pleural)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DOB_YEAR\" < \"2089\" AND LAB.\"FLUID\" = \"Pleural\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) AS count_patients FROM LAB L INNER JOIN DEMOGRAPHIC D ON L.SUBJECT_ID = D.SUBJECT_ID AND L.HADM_ID = D.HADM_ID WHERE L.FLUID = 'Pleural' AND YEAR(D.DOB) < 2089;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to the use of the non-existent SQLite function YEAR(D.DOB). This error occurs in the WHERE clause when extracting the year from DOB, and it does not alter the overall structure or logic of the join or aggregation. It is a localized syntax/temporal extraction error that can be fixed without restructuring the query (e.g., by using the DOB_YEAR column).",
            "error_type": "Local: other-temporal error"
        },
        "0f6b59272b612f8e29af1fcd07b26294": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Calculate the average age of living patients admitted to the hospital on or after 2121. (Values: 0)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"0\" AND DEMOGRAPHIC.\"ADMITYEAR\" >= \"2121\"",
            "pred_sql": "SELECT AVG(AGE) AS average_age FROM DEMOGRAPHIC WHERE EXPIRE_FLAG = 0 AND YEAR(ADMITTIME) >= 2121;",
            "gold_answer": "[['41.742']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted query matches the intended logic (AVG age, EXPIRE_FLAG filter, admission year filter) but uses the non\u2010existent SQLite function YEAR(), causing a \u201cno such function\u201d error. This is a localized syntax/function call error within the WHERE clause and does not alter the overall query structure or logic.",
            "error_type": "Local: syntax error"
        },
        "8f5493ee584c51f03ef9579a071809eb": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "provide the lab test name and lab test category for subject id 17787?",
            "gold_sql": "SELECT LAB.\"LABEL\",LAB.\"CATEGORY\" FROM LAB WHERE LAB.\"SUBJECT_ID\" = \"17787\"",
            "pred_sql": "SELECT LABEL AS \"Lab Test Name\", CATEGORY AS \"Lab Test Category\" FROM LAB WHERE SUBJECT_ID = 17787;",
            "gold_answer": "[['Atypical Lymphocytes', 'Hematology'], ['Bands', 'Hematology'], ['Basophils', 'Hematology'], ['Bilirubin, Direct', 'Chemistry'], ['Bilirubin, Indirect', 'Chemistry'], ['Bilirubin, Total', 'Chemistry'], ['Eosinophils', 'Hematology'], ['Hematocrit', 'Hematology'], ['Hemoglobin', 'Hematology'], ['Lymphocytes', 'Hematology'], ['MCH', 'Hematology'], ['MCHC', 'Hematology'], ['MCV', 'Hematology'], ['Metamyelocytes', 'Hematology'], ['Monocytes', 'Hematology'], ['Myelocytes', 'Hematology'], ['Neutrophils', 'Hematology'], ['Nucleated Red Cells', 'Hematology'], ['Platelet Count', 'Hematology'], ['RDW', 'Hematology'], ['Red Blood Cells', 'Hematology'], ['White Blood Cells', 'Hematology']]",
            "pred_answer": "[['Atypical Lymphocytes'], ['Bands'], ['Basophils'], ['Bilirubin, Direct'], ['Bilirubin, Indirect'], ['Bilirubin, Total'], ['Eosinophils'], ['Hematocrit'], ['Hemoglobin'], ['Lymphocytes'], ['MCH'], ['MCHC'], ['MCV'], ['Metamyelocytes'], ['Monocytes'], ['Myelocytes'], ['Neutrophils'], ['Nucleated Red Cells'], ['Platelet Count'], ['RDW'], ['Red Blood Cells'], ['White Blood Cells']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only returns the lab test name column, omitting the lab test category even though the alias is present. This is a mistake in the SELECT clause (a missing column), but the overall query structure, table references, and WHERE condition are correct. It doesn\u2019t require reworking JOINs, subqueries, or the logic\u2014just fixing the SELECT to actually include CATEGORY. Therefore it\u2019s a localized column reference error.",
            "error_type": "Local: column reference error"
        },
        "04531e28c38575a4a2bdca04faa8c77b": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "how many patients are diagnosed with hx traumatic fracture? (Values: Hx traumatic fracture)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Hx traumatic fracture\"",
            "pred_sql": "SELECT COUNT(SUBJECT_ID) FROM DEMOGRAPHIC WHERE DIAGNOSIS = 'hx traumatic fracture';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely omits the DIAGNOSES table and uses the DEMOGRAPHIC.DIAGNOSIS column instead of joining to DIAGNOSES and filtering on SHORT_TITLE. This is not a simple typo or local fix; it changes the query\u2019s entire logic and table relationships, resulting in incorrect counts. Thus it\u2019s a global error in the query\u2019s structure and join logic.",
            "error_type": "Global: join error"
        },
        "a030ada88d94f5f9ef48362a97aa413d": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "what is the total number of patiemts who had crnry athrscl natve vssl? (Values: Crnry athrscl natve vssl)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Crnry athrscl natve vssl\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) AS TOTAL_PATIENTS FROM DIAGNOSES D WHERE D.SHORT_TITLE LIKE '%CORONARY%' OR D.LONG_TITLE LIKE '%ATHEROSCLEROTIC NATIVE VESSEL%';",
            "gold_answer": "[['19.0']]",
            "pred_answer": "[['11.0']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s structure (SELECT COUNT DISTINCT from DIAGNOSES) could work since SUBJECT_ID is present there, so no major restructuring is required. The mistake lies solely in the WHERE clause filter: it uses LIKE '%CORONARY%' OR LIKE '%ATHEROSCLEROTIC NATIVE VESSEL%' instead of matching the exact SHORT_TITLE \"Crnry athrscl natve vssl\". This is a localized error in the conditionals (value parsing/matching) and does not affect joins, overall logic, or multi-clause consistency.",
            "error_type": "Local: incorrect filter condition"
        }
    },
    "dinsql": {
        "9de792fe2a88120b9c4b104e3ef20a27": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "mention the disease that jerry deberry is primarily suffering from and his date of birth as well. (Values: Jerry Deberry)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DOB\",DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Jerry Deberry\"",
            "pred_sql": "SELECT D.DOB, DI.LONG_TITLE FROM DEMOGRAPHIC AS D JOIN DIAGNOSES AS DI ON D.SUBJECT_ID = DI.SUBJECT_ID AND D.HADM_ID = DI.HADM_ID WHERE D.NAME = 'Jerry Deberry' ORDER BY DI.HADM_ID ASC LIMIT 1",
            "gold_answer": "[['2043-02-28 00:00:00', 'S/P FALL']]",
            "pred_answer": "[['2043-02-28 00:00:00', 'Abdominal pain, other specified site']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a JOIN with the DIAGNOSES table and selects LONG_TITLE, rather than using the DEMOGRAPHIC.DIAGNOSIS column as intended. This changes the overall logic of the query\u2014bringing in unrelated diagnosis records and fundamentally altering the result. Fixing this requires removing the JOIN and reverting to the DEMOGRAPHIC table\u2019s DIAGNOSIS column, which is a structural change beyond a simple typo or local clause correction.",
            "error_type": "Global: join error"
        },
        "a772fe669af1ccf30732303ee43d3e8e": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "What is the number of patients with abdominal pain as their primary disease who were discharged to snf? (Values: SNF, ABDOMINAL PAIN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DISCHARGE_LOCATION\" = \"SNF\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"ABDOMINAL PAIN\"",
            "pred_sql": "SELECT COUNT(DISTINCT D1.SUBJECT_ID) FROM DIAGNOSES AS D1 INNER JOIN DEMOGRAPHIC AS D2 ON D1.HADM_ID = D2.HADM_ID WHERE D1.LONG_TITLE LIKE '%abdominal pain%' AND D2.DISCHARGE_LOCATION = 'SNF'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by pulling data from the DIAGNOSES table and using a LIKE filter on LONG_TITLE instead of using the primary DIAGNOSIS field in the DEMOGRAPHIC table. It also introduces a join that was not in the original intent, thereby altering the meaning of the question (primary disease vs any recorded diagnosis). This error spans multiple clauses and changes the overall structure and intended relationships of the query.",
            "error_type": "Global: incorrect table and join logic"
        },
        "034ba91dc253e7717c3102b2a97d2f49": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "what number of patients with abdominal abscess had drug type as main? (Values: ABDOMINAL ABSCESS, MAIN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"ABDOMINAL ABSCESS\" AND PRESCRIPTIONS.\"DRUG_TYPE\" = \"MAIN\"",
            "pred_sql": "SELECT COUNT(DISTINCT P.SUBJECT_ID) FROM DIAGNOSES AS D JOIN PRESCRIPTIONS AS P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE D.LONG_TITLE = 'Abdominal abscess' AND P.DRUG_TYPE = 'MAIN'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DIAGNOSES table and filters on D.LONG_TITLE rather than using the DEMOGRAPHIC table\u2019s DIAGNOSIS field. This changes the table relationship and the source of the diagnosis filter, leading to a fundamentally different result (0 vs 1). This is not a simple typo or localized mistake but a structural error in how tables are joined and which table provides the diagnosis data. Therefore, it is a global error.",
            "error_type": "Global: incorrect join"
        },
        "a75e1aa8b393a93c5a51986d68dc15a6": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "Give the number of patients whose primary disease is cerebral aneurysm/sda and were admitted before the year 2200. (Values: CEREBRAL ANEURYSM/SDA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"CEREBRAL ANEURYSM/SDA\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2200\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM DIAGNOSES d JOIN DEMOGRAPHIC dem ON d.SUBJECT_ID = dem.SUBJECT_ID AND d.HADM_ID = dem.HADM_ID WHERE d.LONG_TITLE = 'CEREBRAL ANEURYSM/SDA' AND dem.ADMITYEAR < 2200",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The user\u2019s intent is to count patients whose primary disease (stored in DEMOGRAPHIC.DIAGNOSIS) equals \u201cCEREBRAL ANEURYSM/SDA\u201d and were admitted before 2200. The ground truth query reads directly from the DEMOGRAPHIC table. The predicted query instead joins to the DIAGNOSES table on SUBJECT_ID and HADM_ID and filters on DIAGNOSES.LONG_TITLE. This not only uses the wrong source for \u201cprimary disease\u201d but also changes the join logic and result set fundamentally. It is not a simple typo or missing alias; it alters the overall query structure and relationships between tables. Thus this is a global logical/structural error (using an incorrect table and join strategy) rather than a local fixable mistake.",
            "error_type": "Global: incorrect join"
        }
    },
    "macsql": {
        "90ea3f943491a9110aa016d6d613cba8": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "let me know the gender and lab test abnormal status of patient with patient id 2560.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"GENDER\",LAB.\"FLAG\" FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"2560\"",
            "pred_sql": "SELECT T1.`GENDER`, T2.`FLAG` FROM `DEMOGRAPHIC` AS T1 LEFT JOIN `LAB` AS T2 ON T1.`SUBJECT_ID` = T2.`SUBJECT_ID` WHERE T1.`SUBJECT_ID` = 2560 AND T2.`FLAG` IS NOT NULL",
            "gold_answer": "[['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'None'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal']]",
            "pred_answer": "[['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal'], ['M', 'abnormal']]",
            "is_correct": false,
            "reasoning": "The predicted query uses a LEFT JOIN on SUBJECT_ID rather than the correct HADM_ID join key, then filters out NULL FLAG values, which fundamentally alters the result set by excluding the expected 'None' statuses and mismatching admissions. This is not a simple typo or minor clause fix but a flawed join strategy and filter logic that changes the query\u2019s intended meaning.",
            "error_type": "Global: incorrect join key"
        }
    },
    "o4-mini": {
        "099eef47c1de13d69881354a8d6bcf98": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "give me the number of patients whose death status is 0 and diagnoses title is bph w/o urinaryobs/luts. (Values: BPH w/o urinary obs/LUTS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"0\" AND DIAGNOSES.\"SHORT_TITLE\" = \"BPH w/o urinary obs/LUTS\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) AS num_patients FROM DEMOGRAPHIC d JOIN DIAGNOSES diag ON d.SUBJECT_ID = diag.SUBJECT_ID AND d.HADM_ID = diag.HADM_ID WHERE d.EXPIRE_FLAG = 0 AND LOWER(diag.SHORT_TITLE) = 'bph w/o urinaryobs/luts';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The only mistake in the predicted SQL is in the WHERE clause literal: they used LOWER(diag.SHORT_TITLE) = 'bph w/o urinaryobs/luts' (missing the space between 'urinary' and 'obs') so it doesn\u2019t match the actual SHORT_TITLE value 'BPH w/o urinary obs/LUTS'. Everything else (JOIN conditions, COUNT, filter on EXPIRE_FLAG) follows the intended structure. This is a localized error in the value filter, not a structural or logical join mistake.",
            "error_type": "Local: value parsing error"
        }
    }
}