{
    "dinsql": {
        "0d831e485ec42f39a9ea116cfdbc75d8": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "specify primary disease and icd9 code of patient id 18480",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\",PROCEDURES.\"ICD9_CODE\" FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"18480\"",
            "pred_sql": "SELECT SHORT_TITLE, ICD9_CODE FROM DIAGNOSES WHERE SUBJECT_ID = 18480 GROUP BY ICD9_CODE",
            "gold_answer": "[['VENTRICULAR TACHYCARDIA', '8949.0']]",
            "pred_answer": "[['Asthma NOS', '49390.0'], ['Await organ transplnt st', 'V4983'], ['CHF NOS', '4280.0'], ['Long-term use anticoagul', 'V5861'], ['Parox ventric tachycard', '4271.0'], ['Polycythemia vera', '2384.0'], ['Prim cardiomyopathy NEC', '4254.0'], ['Sarcoidosis', '135.0'], ['Status autm crd dfbrltr', 'V4502']]",
            "is_correct": false,
            "reasoning": "The predicted query selects from the DIAGNOSES table and groups by ICD9_CODE, whereas the correct query should retrieve the primary disease from the DEMOGRAPHIC table and the ICD9_CODE from the PROCEDURES table via a join on HADM_ID. This mistake affects the overall logic and table relationships, producing completely different results and requiring restructuring the query. Therefore, it is a Global error.",
            "error_type": "Global: wrong table/join usage"
        },
        "a9e960146f15dc78dfdf7778cf79c3ba": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "what is the primary disease of the patient id 3343?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"3343\"",
            "pred_sql": "SELECT SHORT_TITLE, LONG_TITLE FROM DIAGNOSES WHERE SUBJECT_ID = 3343 ORDER BY HADM_ID LIMIT 1",
            "gold_answer": "[['NEWBORN']]",
            "pred_answer": "[['Need prphyl vc vrl hepat', 'Need for prophylactic vaccination and inoculation against viral hepatitis']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls from the DIAGNOSES table (SHORT_TITLE, LONG_TITLE) instead of selecting the DIAGNOSIS column from the DEMOGRAPHIC table, which is where the primary disease field resides. This mistake fundamentally alters the query\u2019s intent by using the wrong table, requiring restructuring of the query rather than a simple fix in one clause.",
            "error_type": "Global: wrong table reference"
        },
        "9e33f7987cb3bdf5b47e8b870d28d06e": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "how many patients were diagnosed with urinary incontinence nos? (Values: Urinary incontinence NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Urinary incontinence NOS\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE LONG_TITLE = 'Urinary incontinence NOS'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL follows the correct overall logic\u2014counting distinct patients with the specified diagnosis\u2014but it filters on the wrong column (LONG_TITLE instead of SHORT_TITLE). This is a localized mistake in the WHERE clause and does not require restructuring joins or changing the query\u2019s overall flow.",
            "error_type": "Local: column reference error"
        }
    },
    "macsql": {
        "8447e58e57394384f3f325e732cdd313": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "get me the number of patients on iv route of drug administration who are diagnosed with closed fracture of surgical neck of humerus. (Values: Fx surg nck humerus-clos, IV)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Fx surg nck humerus-clos\" AND PRESCRIPTIONS.\"ROUTE\" = \"IV\"",
            "pred_sql": "SELECT COUNT(DISTINCT T1.`SUBJECT_ID`) FROM ( SELECT DISTINCT `SUBJECT_ID` FROM DIAGNOSES WHERE `ICD9_CODE` = 'ICD9_CODE_FROM_SUBQUESTION_1' ) AS T1 INNER JOIN ( SELECT DISTINCT `SUBJECT_ID` FROM PRESCRIPTIONS WHERE `ROUTE` = 'IV' ) AS T2 ON T1.`SUBJECT_ID` = T2.`SUBJECT_ID`",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it filters diagnoses by a placeholder ICD9_CODE (`'ICD9_CODE_FROM_SUBQUESTION_1'`) rather than matching the actual SHORT_TITLE = \"Fx surg nck humerus-clos\". This mistake is confined to the WHERE clause of the diagnoses subquery and does not require reworking the overall query structure or join logic. It is a column/value reference error localized to that condition.",
            "error_type": "Local: column reference/value parsing error"
        },
        "a81dae5ff42498734e857c5b7dc46deb": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "how many female patients underwent the procedure of abdomen artery incision? (Values: F, Abdomen artery incision)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"F\" AND PROCEDURES.\"SHORT_TITLE\" = \"Abdomen artery incision\"",
            "pred_sql": "SELECT COUNT(DISTINCT T1.SUBJECT_ID) AS Female_Patient_Count FROM DEMOGRAPHIC AS T1 INNER JOIN PROCEDURES AS T2 ON T1.SUBJECT_ID = T2.SUBJECT_ID WHERE T1.GENDER = 'F' AND T2.ICD9_CODE = '3523'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only uses the wrong filter (ICD9_CODE = '3523' instead of SHORT_TITLE = 'Abdomen artery incision') but also changes the join key from HADM_ID to SUBJECT_ID, altering the fundamental relationship between the tables. These issues span multiple clauses (JOIN and WHERE) and change the overall logic and intended meaning of the query, so this is a global error.",
            "error_type": "Global: incorrect join and wrong filter column"
        },
        "975158013a0614796649501c4458a198": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "what is the preferred language and primary disease of the patient with patient id 3343?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"LANGUAGE\",DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"3343\"",
            "pred_sql": "SELECT T1.`LANGUAGE`, T2.`LONG_TITLE` AS `PRIMARY_DISEASE` FROM DEMOGRAPHIC AS T1 JOIN DIAGNOSES AS T2 ON T1.`SUBJECT_ID` = T2.`SUBJECT_ID` AND T1.`HADM_ID` = T2.`HADM_ID` WHERE T1.`SUBJECT_ID` = 3343 AND T1.`LANGUAGE` IS NOT NULL AND T2.`LONG_TITLE` IS NOT NULL GROUP BY T1.`LANGUAGE`, T2.`LONG_TITLE` LIMIT 1",
            "gold_answer": "[['None', 'NEWBORN']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The ground truth query retrieves the DIAGNOSIS directly from the DEMOGRAPHIC table, but the predicted query instead joins DEMOGRAPHIC to the DIAGNOSES table and pulls LONG_TITLE. This fundamentally alters the query\u2019s structure and logic: it introduces an unnecessary join on HADM_ID/ SUBJECT_ID, applies extra NOT NULL filters, grouping and a LIMIT, and expects data in DIAGNOSES that doesn\u2019t exist for subject 3343. Correcting this requires removing the entire JOIN and selecting the DIAGNOSIS column from DEMOGRAPHIC directly\u2014this is not a small, isolated fix but a restructuring of the query logic.",
            "error_type": "Global: incorrect join"
        }
    },
    "codes": {
        "97d303ec02cd44af836860b5bbec1d68": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "which patients have diagnoses icd9 code 2920?",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DIAGNOSES.\"ICD9_CODE\" = \"2920\"",
            "pred_sql": "SELECT demographic.name FROM diagnoses INNER JOIN demographic ON diagnoses.subject_id = demographic.subject_id WHERE diagnoses.icd9_code = 2920",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['Claude Chipman']]",
            "is_correct": false,
            "reasoning": "The ground truth query returns the COUNT of DISTINCT patient IDs who have ICD9_CODE = '2920', joining on HADM_ID to correctly associate diagnoses per admission. The predicted query instead selects patient names (demographic.name) and joins on SUBJECT_ID, changing both the JOIN key and the SELECT target. This is not a simple naming or syntax mistake but a fundamental change in the query\u2019s purpose and logic (from counting unique patients to listing names) and an incorrect join strategy. Such a change affects the overall query structure and intended result, so it is a Global error.",
            "error_type": "Global: incorrect selection and join logic"
        },
        "aa87e8e508f6984831876860be1761df": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "What is the number of dead patients who had a prescription for pantoprazole sodium medication? (Values: 1, Pantoprazole Sodium)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"1\" AND PRESCRIPTIONS.\"DRUG\" = \"Pantoprazole Sodium\"",
            "pred_sql": "SELECT count(DISTINCT subject_id) FROM prescriptions WHERE drug = 'Pantoprazole Sodium' AND drug_dose = '1 mg'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely omits the DEMOGRAPHIC table and the expire_flag filter, instead wrongly filtering on drug_dose. Fixing this requires adding a JOIN to DEMOGRAPHIC and applying the expire_flag condition. This is not a simple typo or minor clause fix; it is a fundamental flaw in the query structure and logic (missing table join and key filter). Thus it is a global error.",
            "error_type": "Global: join error"
        },
        "aa0feba409fddd516dabb88f3e4e1131": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what number of patients under the age of 85 had lab test named heparin,imw? (Values: Heparin, LMW)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"85\" AND LAB.\"LABEL\" = \"Heparin, LMW\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.hadm_id = lab.hadm_id WHERE demographic.age < 85 AND lab.label = 'heparin, imw'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates only in the WHERE clause (string literal casing/format) and in the SELECT aggregation (missing DISTINCT). Both are isolated issues within individual clauses and don\u2019t alter the overall join or query structure. This is a localized error in the WHERE condition (incorrect literal) and SELECT aggregate (missing DISTINCT), so it\u2019s a Local error.",
            "error_type": "Local: value parsing error"
        },
        "0709550ec8aeff15ee0fd6fe36ed4c0f": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Theresa Vedovelli is primarily suffering from which disease?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Theresa Vedovelli\"",
            "pred_sql": "SELECT DISTINCT diagnoses.long_title FROM diagnoses INNER JOIN demographic ON diagnoses.subject_id = demographic.subject_id WHERE demographic.name = 'Theresa Vedovelli'",
            "gold_answer": "[['COMPLETE HEART BLOCK']]",
            "pred_answer": "[['Acute kidney failure, unspecified'], ['Anxiety state, unspecified'], ['Atrial fibrillation'], ['Atrioventricular block, complete'], ['Chronic airway obstruction, not elsewhere classified'], ['Coronary atherosclerosis of native coronary artery'], ['Depressive disorder, not elsewhere classified'], ['Diabetes mellitus without mention of complication, type II or unspecified type, not stated as uncontrolled'], ['Epilepsy, unspecified, without mention of intractable epilepsy'], ['Hypopotassemia'], ['Long-term (current) use of anticoagulants'], ['Other persistent mental disorders due to conditions classified elsewhere'], ['Other pulmonary embolism and infarction'], ['Pneumonia, organism unspecified'], ['Retention of urine, unspecified'], ['Unspecified acquired hypothyroidism'], ['Unspecified essential hypertension'], ['Urinary complications, not elsewhere classified']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the DEMOGRAPHIC and DIAGNOSES tables and returns all diagnosis long_titles for the patient, whereas the question asks for the primary disease recorded in the DEMOGRAPHIC table\u2019s DIAGNOSIS column. This error affects the overall logic: it selects from the wrong table and returns multiple rows instead of the single primary diagnosis, requiring restructuring of the query to use DEMOGRAPHIC.DIAGNOSIS. Therefore the mistake is global in nature.",
            "error_type": "Global: join logic error"
        },
        "080127e8abd81701f88e49d4a966b56d": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "tell me the number of patients on prescription of alteplase (catheter clearance) who had to stay for more than 43 days in hospital. (Values: Alteplase (Catheter Clearance))",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"43\" AND PRESCRIPTIONS.\"DRUG\" = \"Alteplase (Catheter Clearance)\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN prescriptions ON demographic.hadm_id = prescriptions.hadm_id WHERE prescriptions.drug = 'Alteplase (Catheter Clearance)' AND demographic.days_stay > 43",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses COUNT(demographic.subject_id) instead of COUNT(DISTINCT demographic.subject_id). This causes it to count every prescription row rather than distinct patients. The only issue is in the aggregation/counting clause (missing DISTINCT); the overall join and filter logic remains correct. This is a localized mistake in the SELECT aggregation.",
            "error_type": "Local: missing DISTINCT"
        },
        "00263ad8de751999af6aa3a7cf5276ad": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the number of patients whose hospital stay is above 14 days and with lab test methemoglobin? (Values: Methemoglobin)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DAYS_STAY\" > \"14\" AND LAB.\"LABEL\" = \"Methemoglobin\"",
            "pred_sql": "SELECT count(demographic.subject_id) FROM demographic INNER JOIN lab ON demographic.hadm_id = lab.hadm_id WHERE lab.label = 'Methmoglobin' AND demographic.days_stay > 14",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL misspells the lab label as 'Methmoglobin' instead of the correct 'Methemoglobin', causing no rows to match. This is a localized mistake in the WHERE clause\u2019s literal value, not a structural or logical join issue. Therefore it\u2019s a Local error (value/literal parsing).",
            "error_type": "Local: value parsing error"
        },
        "06fbe5c6c99bc3f7cd0a53249b2de3dd": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "How many patients aged below 43 years old are diagnosed with prob-head/neck/trunk nos? (Values: Prob-head/neck/trunk NOS)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"43\" AND DIAGNOSES.\"SHORT_TITLE\" = \"Prob-head/neck/trunk NOS\"",
            "pred_sql": "SELECT count(subject_id) FROM diagnoses WHERE icd9_code IN (3547, 3548, 3549) AND age < 43",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: age",
            "is_correct": false,
            "reasoning": "The predicted SQL references the column age within the diagnoses table, but age exists only in the demographic table. This is a simple column reference error (no join on demographic and wrong table for age), which does not change the overall query structure or logic, only a localized misuse of a column.",
            "error_type": "Local: table/column reference error"
        },
        "aa9d08c1a7ed4cdd6bf2b289a54a6cc1": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients are below 49 years of age and admitted under the year 2198?",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"AGE\" < \"49\" AND DEMOGRAPHIC.\"ADMITYEAR\" < \"2198\"",
            "pred_sql": "SELECT count(subject_id) FROM demographic WHERE strftime('%Y', admittime) < 2198 AND age < 49",
            "gold_answer": "[['34.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query uses strftime('%Y', admittime) to filter by admission year instead of using the ADMITYEAR column as specified, and it also omits DISTINCT. This is a mistake localized to the WHERE clause and SELECT aggregation rather than a structural or multi-clause logical error. It can be fixed by referencing the correct column and adding DISTINCT without changing the overall query structure.",
            "error_type": "Local: column reference error"
        },
        "92b1c7ad9fe0af5c4ec35a3b48791815": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "what is the drug code and drug dose of the drug acetaminophen iv? (Values: Acetaminophen IV)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"FORMULARY_DRUG_CD\",PRESCRIPTIONS.\"DRUG_DOSE\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"DRUG\" = \"Acetaminophen IV\"",
            "pred_sql": "SELECT formulary_drug_cd, drug_dose FROM prescriptions WHERE drug = 'acetaminophen' AND route = 'IV'",
            "gold_answer": "[['ACET1000I', '1000mg'], ['ACET1000I', '1000mg'], ['ACET1000I', '1000mg'], ['ACET1000I', '1000mg'], ['ACET1000I', '1000mg']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL only matches rows where drug = 'acetaminophen' and route = 'IV', whereas the actual drug name in the data is 'Acetaminophen IV'. This is a mistake in the WHERE clause values rather than a structural rewrite of the query or its joins. It doesn\u2019t require changing tables or join logic\u2014only the filtering condition is wrong.",
            "error_type": "Local: value parsing error"
        }
    },
    "o4-mini": {
        "085c097c30ee27375d301af1413d2f6a": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "out of total number of patients who had endoscopic insertion of stent (tube) into bile duct, calculate the number of those aged below 45 (Values: Endoscopic insertion of stent (tube) into bile duct)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"45\" AND PROCEDURES.\"LONG_TITLE\" = \"Endoscopic insertion of stent (tube) into bile duct\"",
            "pred_sql": "SELECT COUNT(DISTINCT p.subject_id) AS total_patients_with_stent, COUNT(DISTINCT CASE WHEN d.age < 45 THEN p.subject_id END) AS patients_below_45 FROM procedures p JOIN demographic d ON p.subject_id = d.subject_id AND p.hadm_id = d.hadm_id WHERE p.long_title = 'Endoscopic insertion of stent (tube) into bile duct';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0', '0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the correct join and filtering logic for the procedure and age, but it returns two aggregate columns (total patients and patients below 45) instead of the single count of patients below age 45 as requested. This is a mistake confined to the SELECT clause and does not change the overall query structure or table relationships.",
            "error_type": "Local: select-clause error"
        },
        "86f305efdfde01b908615d3b271a35ad": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "how many patients were treated with diltiazem? (Values: Diltiazem)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE PRESCRIPTIONS.\"DRUG\" = \"Diltiazem\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) AS num_patients FROM PRESCRIPTIONS WHERE LOWER(DRUG) LIKE '%diltiazem%';",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['5.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in the WHERE clause: it uses LOWER(DRUG) LIKE '%diltiazem%' instead of an exact match on DRUG = 'Diltiazem'. This is a localized mistake in the filter condition, not affecting the overall structure or joins in the query. Thus, it is a Local error (value parsing/filter condition error).",
            "error_type": "Local: value parsing error"
        },
        "04221395dc9c6a9e5c880d1dc78a5031": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "how many patients are discharged from disch tran to psych hosp that are under age 77? (Values: DISCH-TRAN TO PSYCH HOSP)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DISCHARGE_LOCATION\" = \"DISCH-TRAN TO PSYCH HOSP\" AND DEMOGRAPHIC.\"AGE\" < \"77\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) AS num_patients FROM DEMOGRAPHIC WHERE DISCHARGE_LOCATION LIKE 'DISC-TRAN%PSYCH%' AND AGE < 77;",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The only difference between the ground truth and the predicted SQL is in the WHERE clause\u2019s string matching: the ground truth uses an exact match on DISCHARGE_LOCATION = 'DISCH-TRAN TO PSYCH HOSP', while the predicted SQL uses a LIKE pattern 'DISC-TRAN%PSYCH%'. This incorrect pattern causes no rows to match. The issue is confined to the value literal and matching method in the WHERE clause and does not alter the overall query structure or joins. Therefore, it is a localized error in the WHERE clause.",
            "error_type": "Local: value parsing/matching error"
        }
    },
    "llm2sql": {
        "0ce7ffc2b0832d683b0873a75983ee3b": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the number of patients who were hospitalized for more than 20 days and were later discharged home? (Values: HOME)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DISCHARGE_LOCATION\" = \"HOME\" AND DEMOGRAPHIC.\"DAYS_STAY\" > \"20\"",
            "pred_sql": "SELECT COUNT(*) FROM DEMOGRAPHIC WHERE DAYS_STAY > 20 AND DISCHARGE_LOCATION LIKE '%HOME%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted query only modifies the WHERE and SELECT clauses without changing the overall structure or table relationships. It uses DISCHARGE_LOCATION LIKE '%HOME%' instead of the required exact match (= 'HOME') and COUNT(*) instead of COUNT(DISTINCT SUBJECT_ID). Both are localized errors in the WHERE filter and aggregation, not a global logic or join structure issue.",
            "error_type": "Local: where-clause and aggregation error"
        }
    },
    "deepseek": {
        "aa253b41030e5c298e4ceb1c7aef9028": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "how many patients below the age of 56 were given voriconazole? (Values: Voriconazole)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"AGE\" < \"56\" AND PRESCRIPTIONS.\"DRUG\" = \"Voriconazole\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) FROM DEMOGRAPHIC AS Demo JOIN PRESCRIPTIONS AS Pre ON Demo.SUBJECT_ID = Pre.SUBJECT_ID AND Demo.HADM_ID = Pre.HADM_ID WHERE Demo.AGE < 56 AND Pre.DRUG = 'Voriconazole';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: D.SUBJECT_ID",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the alias Demo for DEMOGRAPHIC but in the SELECT clause refers to D.SUBJECT_ID, an undefined alias. This is a simple table/column reference error that can be fixed by using the correct alias (Demo) without changing the overall query structure.",
            "error_type": "Local: table/column reference error"
        }
    }
}