{
    "codes": {
        "37bb636cce8f65f6ad5203a7": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first lab test that patient 028-10451 received this month?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '028-10451' ) ) AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT patient.patientunitstayid FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '028-10451' AND strftime('%m', lab.labresulttime) = '02' AND lab.labname = 'Urine 1000 100' ORDER BY lab.labresulttime LIMIT 1",
            "gold_answer": "[['2100-12-07 00:59:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally similar to the ground truth (it uses the same tables and JOIN), but it makes local mistakes in its WHERE and SELECT clauses: it filters on a specific lab name (\u2018Urine 1000 100\u2019) that wasn\u2019t asked, it uses strftime('%m','\u2026') = '02' (wrong month literal) instead of matching the current month via the prescribed datetime('start of month') logic, and it selects patientunitstayid instead of the lab result time. These are all confined to specific expressions and can be corrected without changing the overall query structure or join logic. Therefore this is a Local error, specifically a temporal filter mistake.",
            "error_type": "Local: other-temporal error"
        },
        "a39cccf33e871b8d3c0ee195": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the output of patient 010-10081 for the first time on last month/13?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10081' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '13' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.cellpath FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '010-10081' AND strftime('%m', intakeoutput.intakeoutputtime) = '13' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['urine']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query not only selects the wrong column (cellpath instead of celllabel) but also omits the critical output-only filter, misuses the date filtering (month \u201813\u2019, missing last\u2010month/day logic), and even reverses the sort order. Fixing it would require rewriting multiple WHERE clauses, adding path conditions, correcting the date logic, and changing the ORDER direction. This error spans the overall structure and logic, so it\u2019s a global error.",
            "error_type": "Global: incorrect filter and column selection"
        },
        "7cdb91fabb7e08749637f74e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many individuals are there who are current patients?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE hospitaldischargetime IS NULL",
            "gold_answer": "[['23.0']]",
            "pred_answer": "[['30.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts patientunitstayid for rows where hospitaldischargetime IS NULL, which yields the number of current stays, not distinct individuals. The correct intent is to count unique patients (using DISTINCT patient.uniquepid). This is a localized error in the SELECT clause\u2014specifically the aggregation and missing DISTINCT\u2014without affecting the overall query structure or relationships.",
            "error_type": "Local: missing DISTINCT"
        },
        "d37c1e31e9b13a891e553339": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When this year did patient 010-11267 receive their first bronchoscopy procedure?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-11267' ) ) AND treatment.treatmentname = 'bronchoscopy' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT datetime(vitalperiodic.observationtime) FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '010-11267' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "gold_answer": "[['2100-10-04 21:31:00']]",
            "pred_answer": "[['2100-10-10 14:41:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the vitalperiodic table and retrieves the latest observation time for the patient, instead of querying the treatment table for the first 'bronchoscopy' procedure this year. This is not a minor typo or missing column; it fundamentally changes the logic and tables involved, requiring a complete restructuring of the query.",
            "error_type": "Global: incorrect table and logic"
        },
        "62fe58e17f1786b0bd23e365": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the minimum daily number of patients who had urinary tract infection since 1 year ago?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnosis.patientunitstayid ) AS C1 FROM diagnosis WHERE diagnosis.diagnosisname = 'urinary tract infection' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY strftime('%Y-%m-%d',diagnosis.diagnosistime) ) AS T1",
            "pred_sql": "SELECT count(DISTINCT patient.patientunitstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE vitalperiodic.observationoffset BETWEEN '-365' AND '-1' AND vitalperiodic.sao2 < 95",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: vitalperiodic.observationoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column vitalperiodic.observationoffset, which is a schema mismatch. This is a localized issue with the column reference and does not require restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "35562087619eaf9ec7769a8d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Count the number of times that patient 031-14167 received a laboratory test for tibc on the first hospital visit.",
            "gold_sql": "SELECT COUNT(*) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-14167' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'tibc'",
            "pred_sql": "SELECT count(lab.labname) FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '031-14167' AND patient.hospitaladmittime = ( SELECT hospitaladmittime FROM patient WHERE uniquepid = '031-14167' ORDER BY hospitaladmittime ASC LIMIT 1 )",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['330.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to apply the filter lab.labname = 'tibc' and omits the requirement that the first hospital visit must have a non\u2010null discharge time. Instead, it simply matches hospitaladmittime to the first admission date, counting all lab tests rather than only TIBC tests. This error spans multiple clauses (missing WHERE condition on labname and incorrect visit logic) and fundamentally alters the intended query meaning, so it is a global logic error.",
            "error_type": "Global: incorrect logic across JOIN and WHERE clauses"
        },
        "0f1282d072f4287535f50953": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How is cefazolin (ancef) in dextrose ivpb 2 g typically consumed?",
            "gold_sql": "SELECT DISTINCT medication.routeadmin FROM medication WHERE medication.drugname = 'cefazolin (ancef) in dextrose ivpb 2 g'",
            "pred_sql": "SELECT CASE WHEN medication.drugname = 'cefacolin (ancef)' THEN '800-30 g/1 ml by mouth' ELSE NULL END FROM medication INNER JOIN cost ON medication.medicationid = cost.eventid WHERE medication.drugname = 'dextrose ivpb 2 g'",
            "gold_answer": "[['ivpb']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL is fundamentally incorrect in its overall structure and logic. Instead of directly selecting the administration route from the medication table for the specific drug, it joins the cost table without any relevant cost filtering, uses an incorrect join key (medication.medicationid = cost.eventid) and wrong drug name filters. It even wraps results in a CASE expression that doesn\u2019t correspond to the question. These issues span multiple clauses (SELECT, JOIN, WHERE) and change the intended query meaning, indicating a global structural/logical error.",
            "error_type": "Global: join error"
        },
        "21a8c17ed1bc28ec4d74aa51": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time that patient 003-10024 was diagnosed with acute coronary syndrome - acute myocardial infarction (with st elevation) on the last hospital visit?",
            "gold_sql": "SELECT diagnosis.diagnosistime FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10024' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND diagnosis.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (with st elevation)' ORDER BY diagnosis.diagnosistime DESC LIMIT 1",
            "pred_sql": "SELECT diagnosis.diagnosistime FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.uniquepid = '003-10024' AND diagnosis.diagnosistime = ( SELECT max(diagnosis.diagnosistime) FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.uniquepid = '003-10024' AND diagnosis.description = 'Acute coronary syndrome - acute myocardial infarction (with st elevation)' )",
            "gold_answer": "[['2100-10-27 17:58:00']]",
            "pred_answer": "no such column: diagnosis.description",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column diagnosis.description instead of diagnosis.diagnosisname, causing a column reference error. This is a localized mistake that can be fixed by correcting the column name without restructuring the overall query.",
            "error_type": "Local: column reference error"
        },
        "a3c5957d0565aeac6aacd10d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time the heart rate of patient 027-104059 registered less than 65.0 on 06/04/this year?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-104059' ) ) AND vitalperiodic.heartrate < 65.0 AND vitalperiodic.heartrate IS NOT NULL AND datetime(vitalperiodic.observationtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',vitalperiodic.observationtime) = '06-04' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-104059' AND vitalperiodic.observationtime LIKE '2100-06-04%' AND vitalperiodic.heartrate < 65",
            "gold_answer": "[['2100-06-04 09:26:14']]",
            "pred_answer": "[['2100-06-04 06:51:14'], ['2100-06-04 06:56:14'], ['2100-06-04 07:01:14'], ['2100-06-04 07:21:14'], ['2100-06-04 07:26:14'], ['2100-06-04 07:31:14'], ['2100-06-04 07:36:14'], ['2100-06-04 07:41:14'], ['2100-06-04 07:46:14'], ['2100-06-04 07:51:14'], ['2100-06-04 07:56:14'], ['2100-06-04 08:01:14'], ['2100-06-04 08:06:14'], ['2100-06-04 08:11:14'], ['2100-06-04 08:16:14'], ['2100-06-04 08:21:14'], ['2100-06-04 08:26:14'], ['2100-06-04 08:31:14'], ['2100-06-04 08:51:14'], ['2100-06-04 08:56:14'], ['2100-06-04 09:01:14'], ['2100-06-04 09:06:14'], ['2100-06-04 09:11:14'], ['2100-06-04 09:16:14'], ['2100-06-04 09:21:14'], ['2100-06-04 09:26:14']]",
            "is_correct": false,
            "reasoning": "The predicted query still joins the correct tables and filters the heart rate < 65 on the specified date, but it fails to implement the \u2018last time\u2019 logic. It omits the ORDER BY observationtime DESC and LIMIT 1, and uses a simple LIKE filter instead of the prescribed datetime/strftime approach. These are errors confined to the WHERE and result\u2010ordering clauses without altering the overall table relationships or structure.",
            "error_type": "Local: missing ORDER BY and LIMIT"
        }
    },
    "llm2sql": {
        "04c45f5a7f141e001d812299": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What proportion of patients with a diagnosis of metabolic acidosis - drug induced survive over a 3-month period?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metabolic acidosis - drug induced' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "SELECT 1.0 * SUM(CASE WHEN DATE(patient.hospitaldischargetime) <= DATE(diagnosis.diagnosistime, '+91 days') AND patient.hospitaldischargestatus = 'alive' THEN 1 ELSE 0 END) / COUNT(DISTINCT patient.patientunitstayid) FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metabolic acidosis - drug induced';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally alters the survival calculation logic and overall structure. It uses DATE arithmetic instead of Julian day differences, applies the wrong survival condition (checks for 'alive' status instead of handling 'expired' within 3 months), fails to filter patients with sufficient follow-up time, and divides by patientunitstayid rather than uniquepid. These issues go beyond a simple localized fix and require reworking the query\u2019s core logic and grouping, classifying it as a global error.",
            "error_type": "Global: logic error"
        },
        "e42699f7b9f2da1b9e49877f": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What was the number of ct scan - with contrast procedures performed since 2100?",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.treatmentname = 'ct scan - with contrast' AND strftime('%Y',treatment.treatmenttime) >= '2100'",
            "pred_sql": "SELECT COUNT(*) FROM treatment WHERE treatmentname = 'CT scan - with contrast' AND datetime(treatmenttime, 'start of year') >= datetime('2100-01-01 00:00:00')",
            "gold_answer": "[['24.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses the treatment name literal 'CT scan - with contrast' (uppercase \u2018CT\u2019) instead of the exact string 'ct scan - with contrast' as stored in the table. This is a simple value\u2010matching error that does not change the query\u2019s overall structure or logic. All other parts of the query remain correct\u2014the date condition still filters on events since 2100\u2014so the mistake is localized to the literal value comparison.",
            "error_type": "Local: value parsing error"
        },
        "7ee2887a56faa82c0b200471": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Tell me the top five most commonly prescribed medications within the same hospital visit to patients in their 40s who are diagnosed with obstructive sleep apnea since 1 year ago.",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'obstructive sleep apnea' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 40 AND 49 AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT M.drugname, COUNT(*) AS cnt FROM patient AS P JOIN diagnosis AS D ON P.patientunitstayid = D.patientunitstayid JOIN medication AS M ON P.patientunitstayid = M.patientunitstayid WHERE P.age BETWEEN 40 AND 49 AND D.diagnosisname = 'obstructive sleep apnea' AND D.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY M.drugname ORDER BY cnt DESC LIMIT 5;",
            "gold_answer": "[['acetaminophen'], ['azithromycin'], ['dextrose 50%-water'], ['glucagon'], ['glucose'], ['hydrocodone 5 mg-acetaminophen 325 mg tablet'], ['magnesium sulfate 2 gram/50 ml iv piggy back 50 ml flex cont'], ['methylprednisolone sod suc(pf)'], ['tramadol']]",
            "pred_answer": "[['albuterol concentrated 0.5%', '20.0'], ['azithromycin', '17.0'], ['dextrose 50%-water', '25.0'], ['methylprednisolone sod suc(pf)', '25.0'], ['tramadol', '10.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the intended logic in several fundamental ways: 1) It joins diagnosis and medication only on patientunitstayid rather than patienthealthsystemstayid, thus not ensuring the same hospital visit. 2) It fails to enforce that the medication start time occurs after the diagnosis time (D.diagnosistime < M.drugstarttime). 3) It does not restrict medication events to within the past year. These omissions affect the overall query structure and data relationships, altering the core semantics of \"top five medications prescribed after diagnosis during the same hospital visit within one year.\" Fixing this would require adding join conditions and WHERE clauses that span multiple parts of the query, not just a minor tweak in a single clause.",
            "error_type": "Global: join-logic error"
        },
        "b2b0fd03fe9d704dfbe25030": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Pull up the ids of patients who were diagnosed with bradycardia - complete heart block.",
            "gold_sql": "SELECT DISTINCT patient.uniquepid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'bradycardia - complete heart block' )",
            "pred_sql": "SELECT DISTINCT patientunitstayid FROM diagnosis WHERE diagnosisname = 'bradycardia - complete heart block';",
            "gold_answer": "[['012-11288'], ['021-101289'], ['027-100581'], ['031-11538']]",
            "pred_answer": "[['1254957.0'], ['2215881.0'], ['2778278.0'], ['3154626.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects diagnosis.patientunitstayid directly rather than retrieving patient.uniquepid from the patient table. The overall query structure (filtering by diagnosis name and deduplication) is correct, but the wrong column is returned. This is a localized mistake in the SELECT clause rather than a structural or multi-clause logical error.",
            "error_type": "Local: table/column reference error"
        }
    },
    "dinsql": {
        "1afbc775f060dfcad71d671c": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Show me patient 018-10885's yearly minimum 24 h urine protein since 1 year ago.",
            "gold_sql": "SELECT MIN(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '018-10885' ) ) AND lab.labname = '24 h urine protein' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY strftime('%Y',lab.labresulttime)",
            "pred_sql": "SELECT strftime('%Y', intakeoutputtime) AS year, MIN(cellvaluenumeric) AS min_24h_urine_protein FROM intakeoutput WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '018-10885' ) AND celllabel LIKE '%24 h urine protein%' AND datetime(intakeoutputtime) >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY year",
            "gold_answer": "[['30.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the intakeoutput table instead of the lab table to retrieve '24 h urine protein' results. This is not a simple syntax or column naming mistake but a fundamental misuse of the wrong table, which alters the entire logic of the query. Correcting this requires changing the core structure to reference the lab table and its labresult and labresulttime columns, so it is a global error.",
            "error_type": "Global: incorrect table selection"
        },
        "c7dc0e66cdfbbd924515dbbe": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the sex of patient 006-102774?",
            "gold_sql": "SELECT DISTINCT patient.gender FROM patient WHERE patient.uniquepid = '006-102774'",
            "pred_sql": "gender FROM patient WHERE uniquepid = '006-102774'",
            "gold_answer": "[['male']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword and thus is a local syntax error in the SELECT clause. It does not change the intended logic or table relationships\u2014just a minor fix in the SELECT statement is needed. Therefore, this is a Local error.",
            "error_type": "Local: syntax error"
        }
    },
    "qwen3": {
        "489c1ea5bdaeef4ed2659b45": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many hours have passed since patient 015-100025's first hemodialysis intake (ml) input on the current icu visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',intakeoutput.intakeoutputtime) ) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND patient.unitdischargetime IS NULL ) AND intakeoutput.celllabel = 'hemodialysis intake (ml)' AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', MIN(io.intakeoutputtime))) / 3600 AS hours_passed FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '015-100025' AND p.unitdischargetime IS NULL AND io.cellpath LIKE '%intake%' AND io.cellpath LIKE '%hemodialysis%';",
            "gold_answer": "[['2.8']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fails to restrict on the exact \u2018celllabel = \\'hemodialysis intake (ml)\\'\u2019 and instead uses io.cellpath LIKE '%hemodialysis%', so it pulls a different (earlier) intake time. This is a mistake confined to the WHERE clause filters and does not alter the overall query structure or joins.",
            "error_type": "Local: incorrect filter in WHERE clause"
        },
        "9e4e34508b9eabf0b0fc4fbe": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What is the cost of a sepsis - sepsis with single organ dysfunction- circulatory system failure diagnosis?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'diagnosis' AND cost.eventid IN ( SELECT diagnosis.diagnosisid FROM diagnosis WHERE diagnosis.diagnosisname = 'sepsis - sepsis with single organ dysfunction- circulatory system failure' )",
            "pred_sql": "SELECT SUM(cost.cost) AS total_cost FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid JOIN cost ON patient.patienthealthsystemstayid = cost.patienthealthsystemstayid WHERE diagnosis.diagnosisname = 'sepsis - sepsis with single organ dysfunction- circulatory system failure' AND cost.eventtype = 'diagnosis' AND cost.eventid = diagnosis.diagnosisid;",
            "gold_answer": "[['6.76']]",
            "pred_answer": "[['87.88']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the intent of the query by joining through the patient table and summing all diagnosis event costs across multiple patients. The ground truth simply retrieves the single cost for the specified diagnosis event (using DISTINCT on cost.cost). The predicted version\u2019s use of SUM and additional joins changes the overall logic and structure\u2014it\u2019s not a localized syntax mistake but a global restructuring that aggregates across unintended rows.",
            "error_type": "Global: incorrect join/aggregation strategy"
        },
        "18553a06c553cf15ca7bf4a2": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Is the value of sao2 of patient 006-106843 last measured on the last icu visit less than the value second to last measured on the last icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.sao2 FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106843' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.sao2 IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 ) < ( SELECT vitalperiodic.sao2 FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106843' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.sao2 IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 OFFSET 1 )",
            "pred_sql": "WITH last_icu_stay AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '006-106843' ORDER BY unitdischargetime DESC LIMIT 1 ), ranked_vitals AS ( SELECT sao2, ROW_NUMBER() OVER (ORDER BY observationtime DESC) AS rn FROM vitalperiodic WHERE patientunitstayid = (SELECT patientunitstayid FROM last_icu_stay) ) SELECT (SELECT sao2 FROM ranked_vitals WHERE rn = 1) < (SELECT sao2 FROM ranked_vitals WHERE rn = 2) AS is_less;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to filter out NULL sao2 values before ranking, so its first row can be NULL and the comparison yields NULL (None) instead of a boolean. The mistake is a missing WHERE clause condition (vitalperiodic.sao2 IS NOT NULL) in the ranked_vitals CTE. This is a localized WHERE\u2010clause error that doesn\u2019t change the overall query structure or table relationships.",
            "error_type": "Local: missing non-null filter in WHERE clause"
        },
        "1bef54d89c07bec88a7d7fef": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients were diagnosed with upper urinary tract infection within the same hospital visit since 1 year ago after electrolyte administration - intravenous.",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'electrolyte administration - intravenous' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'upper urinary tract infection' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.treatmenttime < T2.diagnosistime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM diagnosis d JOIN treatment t ON d.patientunitstayid = t.patientunitstayid JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'upper urinary tract infection' AND t.treatmentname = 'electrolyte administration - intravenous' AND datetime(t.treatmenttime) <= datetime(d.diagnosistime, '-1 year');",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally misrepresents the question\u2019s logic in multiple clauses. It joins diagnosis and treatment on patientunitstayid rather than patienthealthsystemstayid, so it conflates ICU stays with hospital visits. It also applies the time filter incorrectly\u2014comparing treatment time to one year before each diagnosis instead of requiring both events to have occurred within the last year relative to today and ensuring treatment precedes diagnosis. These errors span joins and WHERE logic and cannot be fixed by tweaking a single clause.",
            "error_type": "Global: incorrect join and time logic"
        }
    },
    "deepseek": {
        "68d554a0eb8d6e33f7c18e04": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the patient count for 500 ml flex cont excel : sodium chloride 0.9 % iv soln prescription since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid = ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = '500 ml flex cont excel : sodium chloride 0.9 % iv soln' AND strftime('%Y',medication.drugstarttime) >= '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) AS patient_count FROM medication WHERE drugname = '500 ml flex cont excel : sodium chloride 0.9 % iv soln' AND drugstarttime >= '2100-01-01';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['5.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts distinct patientunitstayid directly from the medication table, whereas the ground truth counts distinct patient.uniquepid by first identifying the relevant patientunitstayid via a subquery on medication and then querying the patient table. This mistake changes the query\u2019s overall logic\u2014counting ICU/stay records instead of unique patients\u2014and requires restructuring the query (adding a join or subquery to map unit stays to unique patients). Therefore, it is not a localized syntax issue but a fundamental logical error in the query structure.",
            "error_type": "Global: aggregation-logic error"
        }
    }
}