{
    "llm2sql": {
        "e9326e10e6866dba320fa072": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What's the rdw change of patient 032-10133 last measured on the last hospital visit compared to the second to last value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10133' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'rdw' ORDER BY lab.labresulttime DESC LIMIT 1 ) - ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10133' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'rdw' ORDER BY lab.labresulttime DESC LIMIT 1 OFFSET 1 )",
            "pred_sql": "WITH cte_last_hospital_visit AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '032-10133' AND hospitaldischargetime IS NOT NULL ORDER BY hospitaladmittime DESC LIMIT 1 ), rdw_values AS ( SELECT lab.labresult as rdw_value, lab.labresulttime FROM lab JOIN cte_last_hospital_visit ON lab.patientunitstayid = cte_last_hospital_visit.patientunitstayid WHERE lab.labname = 'rdw' ORDER BY lab.labresulttime DESC ) SELECT rdw_value AS last_value FROM rdw_values LIMIT 1 UNION ALL SELECT rdw_value FROM rdw_values LIMIT 1 OFFSET 1;",
            "gold_answer": "[['-0.3']]",
            "pred_answer": "LIMIT clause should come after UNION ALL not before",
            "is_correct": false,
            "reasoning": "The predicted SQL misuses the LIMIT clause by placing it before the UNION ALL, leading to a syntax error. This is a localized mistake in clause ordering and does not involve changes to the overall query logic or table relationships.",
            "error_type": "Local: syntax error"
        },
        "9fd4b99007cf93788de4e605": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the maximum total cost for the hospital when a troponin - i lab test is involved since 2100?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'troponin - i' ) ) AND strftime('%Y',cost.chargetime) >= '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MAX(total_cost) AS max_total_cost FROM (SELECT SUM(cost.cost) AS total_cost FROM cost JOIN lab ON cost.patientunitstayid = lab.patientunitstayid WHERE lab.labname = 'troponin - i' AND datetime(lab.labresulttime) >= datetime('2100-01-01') GROUP BY cost.patienthealthsystemstayid);",
            "gold_answer": "[['25887.21']]",
            "pred_answer": "[['176405.04']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how costs are associated with troponin - i labs by joining cost and lab on patientunitstayid instead of linking via patienthealthsystemstayid (and filtering cost.chargetime rather than lab.labresulttime). This incorrect join and grouping logic alters the intended mapping between cost records and lab events, producing a completely different result. Such an error spans multiple clauses and breaks the core relationship between tables, requiring a structural fix rather than a minor tweak.",
            "error_type": "Global: incorrect join error"
        },
        "810edfc3207a29bef5ac27c2": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the number of times that patient 013-10029 had a urine event on 10/07/this year?",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10029' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '10-07'",
            "pred_sql": "SELECT COUNT(*) FROM intakeoutput WHERE patientunitstayid IN (SELECT patientunitstayid FROM patient WHERE uniquepid = '013-10029') AND cellpath LIKE '%urine%' AND datetime(intakeoutputtime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m-%d', intakeoutputtime) = '10-07'",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL has multiple mistakes confined to its WHERE clause: it filters cellpath with '%urine%' instead of checking cellpath LIKE '%output%' and celllabel = 'urine', it compares datetime(intakeoutputtime, 'start of day') to a 'start of year' timestamp (so the date\u2010filter is wrong), and it simplifies the patientunitstayid lookup incorrectly (omitting the patienthealthsystemstayid subquery). All of these issues are localized to specific conditions rather than the overall query structure or logic.",
            "error_type": "Local: temporal and filter condition errors"
        },
        "616d4bc79f0d39ba25a8112d": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the five most frequently ordered medications that female patients aged 60 or above are prescribed within 2 months after they are diagnosed with bone fracture(s) - left upper extremity this year?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'bone fracture(s) - left upper extremity' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'female' AND patient.age >= 60 AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT medication.drugname FROM patient JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid JOIN medication ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'female' AND CAST(patient.age AS INTEGER) >= 60 AND diagnosis.diagnosisname = 'bone fracture(s) - left upper extremity' AND strftime('%Y', diagnosis.diagnosistime) = '2100' AND datetime(medication.drugstarttime) BETWEEN datetime(diagnosis.diagnosistime) AND datetime(diagnosis.diagnosistime, '+2 months') GROUP BY medication.drugname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['acetaminophen 650mg rect supp'], ['albumin 5% 500 ml inj'], ['albuterol 2.5 mg/3 ml ud inh soln'], ['carvedilol 3.125 mg tab'], ['ceftriaxone 1 gram in ns 50 ml ivpb'], ['diphenhydramine 50 mg/1 ml 1 ml inj'], ['folic acid 1 mg tab'], ['lactated ringers 1000 ml lvp'], ['levofloxacin 750 mg in d5w 150ml'], ['metoprolol 1 mg/ml 5ml sdv inj'], ['naloxone 0.4 mg/1 ml sdv inj'], ['ondansetron 2 mg/1 ml 2ml sdv inj'], ['percocet 5/325 tab'], ['potassium chloride 20 meq tr tab'], ['senokot-s tab']]",
            "pred_answer": "[['albumin 5% 500 ml inj'], ['carvedilol 3.125 mg tab'], ['ceftriaxone 1 gram in ns 50 ml ivpb'], ['levofloxacin 750 mg in d5w 150ml'], ['metoprolol 1 mg/ml 5ml sdv inj']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally similar to the ground\u2010truth: it still joins patient, diagnosis, and medication, applies the same gender/age/diagnosis filters, enforces the 2-month window, groups by drugname, and limits to the top\u20105. The only substantive deviation is that it never restricts medication start times to the current year (as required by the assumptions and as done in the ground\u2010truth\u2019s T2 subquery). This is a missing WHERE\u2010clause filter (a localized temporal condition), not a flaw in the overall logic or join strategy. Therefore, the error is local.",
            "error_type": "Local: missing temporal filter for medication events"
        }
    },
    "dinsql": {
        "0c4056652a853e3a4d83a7ce": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "This year, how many patients were given cefazolin 2 gm in ns 100 ml ivpb within the same hospital visit after receiving a antiarrhythmics - class iii antiarrhythmic procedure?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antiarrhythmics - class iii antiarrhythmic' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'cefazolin 2 gm in ns 100 ml ivpb' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.treatmenttime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T3.patienthealthsystemstayid) FROM medication AS T1 JOIN treatment AS T2 ON T1.patientunitstayid = T2.patientunitstayid JOIN patient AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE T1.drugname = 'cefazolin 2 gm in ns 100 ml ivpb' AND T2.treatmentname = 'antiarrhythmics - class iii antiarrhythmic' AND datetime(T1.drugstarttime) > datetime(T2.treatmenttime) AND strftime('%Y', T1.drugstarttime) = '2100' AND T3.hospitaldischargetime IS NOT NULL AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: T1.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL references T1.patienthealthsystemstayid, but the medication table (aliased as T1) does not have a patienthealthsystemstayid column. This is a simple column reference error within a single clause and does not affect the overall query structure or logic, fitting the definition of a local error.",
            "error_type": "Local: column reference error"
        },
        "839e80df768eb6c06c6601ce": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "On 05/11/2100, what was the maximum value of the heart rate for patient 003-11972?",
            "gold_sql": "SELECT MAX(vitalperiodic.heartrate) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-11972' ) ) AND vitalperiodic.heartrate IS NOT NULL AND strftime('%Y-%m-%d',vitalperiodic.observationtime) = '2100-05-11'",
            "pred_sql": "MAX(V.heartrate) AS max_heart_rate FROM patient AS P JOIN vitalperiodic AS V ON P.patientunitstayid = V.patientunitstayid WHERE P.uniquepid = '003-11972' AND datetime(V.observationtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',V.observationtime) = '05-11'",
            "gold_answer": "[['84.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the date\u2010filtering predicate: it uses datetime(...,'start of year') plus a separate strftime('%m-%d') test rather than matching the full date (strftime('%Y-%m-%d') = '2100-05-11') as in the ground truth. Because of that incorrect temporal condition, no rows qualify and the query returns NULL. This error is localized entirely in the WHERE clause\u2019s date logic and does not change the overall join structure or relationships between tables.",
            "error_type": "Local: other\u2010temporal error"
        }
    },
    "deepseek": {
        "7001d255e38191c3413f86a2": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Since patient 013-10167's first stay in ward 549 on the current hospital visit, how many hours have passed?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '013-10167' AND patient.wardid = 549 AND patient.hospitaldischargetime IS NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', (SELECT MIN(unitadmittime) FROM patient WHERE uniquepid = '013-10167' AND wardid = 549))) / 3600 AS hours_passed ;",
            "gold_answer": "[['339.582']]",
            "pred_answer": "[['339.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to the current hospital visit (hospitaldischargetime IS NULL) and to the first ward stay on that visit. Instead, it simply takes the global minimum unitadmittime for that patient and ward, ignoring the hospital discharge filter. This changes the overall query logic and requires restructuring beyond a single clause fix.",
            "error_type": "Global: logical-structure error"
        },
        "51ffc81f1b89c620543bf91b": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Among patients diagnosed with hypercoagulable state, what are the top five most common lab tests conducted within the same hospital visit since 1 year ago?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypercoagulable state' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT lab.labname FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE diagnosis.diagnosisname = 'hypercoagulable state' AND lab.labresulttime >= '2099-12-31 23:59:00' GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['anion gap'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['glucose'], ['hct'], ['hgb'], ['mch'], ['mchc'], ['mcv'], ['platelets x 1000'], ['potassium'], ['ptt'], ['rdw'], ['sodium'], ['wbc x 1000']]",
            "pred_answer": "[['chloride'], ['creatinine'], ['glucose'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters labs by date and groups by labname, but it never restricts diagnoses to the 1-year window nor enforces that the lab occurred after the diagnosis. It also omits the datetime comparison between diagnosis.diagnosistime and lab.labresulttime. These omissions fundamentally change the query logic and results, requiring changes across WHERE and JOIN clauses rather than a simple localized fix.",
            "error_type": "Global: join and filter logic error"
        }
    },
    "codes": {
        "4dcadc3a7cd58583235ea6cf": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time when patient 017-100143 was prescribed atorvastatin and furosemide at the same time in 07/2100?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100143' ) AND medication.drugname = 'atorvastatin' AND strftime('%Y-%m',medication.drugstarttime) = '2100-07' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100143' ) AND medication.drugname = 'furosemide' AND strftime('%Y-%m',medication.drugstarttime) = '2100-07' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT medication.drugstarttime FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE medication.drugname IN ('atorvastatin', 'furosemide') AND patient.uniquepid = '017-100143' AND strftime('%m%Y', medication.drugstarttime) = '072100' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "gold_answer": "[['2100-07-02 20:00:00']]",
            "pred_answer": "[['2100-07-04 02:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL simply filters medication records where the drug is either atorvastatin or furosemide and then takes the most recent date. It never enforces that both drugs were prescribed at the exact same time. The ground truth uses two subqueries (one for each drug) and then joins them on identical drugstarttime to ensure simultaneity. Furthermore, the predicted SQL\u2019s date filter strftime('%m%Y',\u2026) = '072100' is incorrectly formatted versus the required '%Y-%m' = '2100-07'. These mistakes alter the overall logic of the query\u2014simultaneity and correct month-year filtering\u2014so it is not a minor local fix but a fundamental structural error.",
            "error_type": "Global: incorrect join and date filtering logic"
        },
        "68b12c03eab7834e3298ca0d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Can you tell me when patient 031-10407 had their first pleural fluid microbiology test in 11/2100?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10407' ) ) AND microlab.culturesite = 'pleural fluid' AND strftime('%Y-%m',microlab.culturetakentime) = '2100-11' ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT microlab.culturetakentime FROM patient INNER JOIN microlab ON patient.patientunitstayid = microlab.patientunitstayid WHERE patient.uniquepid = '031-10407' AND strftime('%Y %m',microlab.culturetakentime) = '2100 11'",
            "gold_answer": "[['2100-11-23 22:20:00']]",
            "pred_answer": "[['2100-11-22 15:20:00'], ['2100-11-23 22:20:00'], ['2100-11-23 22:20:00'], ['2100-11-23 22:20:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to culture site = 'pleural fluid', misuses the strftime format (using '%Y %m' vs '%Y-%m'), and omits the ORDER BY\u2026LIMIT 1 to pull just the first result. All of these issues are confined to specific clauses (WHERE and SELECT) and can be corrected without changing the overall join structure or logic, so this is a Local error.",
            "error_type": "Local: temporal-function/filter error"
        },
        "4f38f917911345d009b28a4b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much did patient 004-11359 weigh when measured for the last time this month?",
            "gold_sql": "SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-11359' ) AND patient.admissionweight IS NOT NULL AND datetime(patient.unitadmittime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ORDER BY patient.unitadmittime DESC LIMIT 1",
            "pred_sql": "SELECT dischargeweight FROM patient WHERE uniquepid = '004-11359' ORDER BY patienthealthsystemstayid DESC LIMIT 1",
            "gold_answer": "[['74.8']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only uses the wrong column (dischargeweight instead of admissionweight) but also omits the critical time filter for \u201cthis month\u201d and does not order by unitadmittime. This is not a small typo but a fundamental change to the query\u2019s logic and structure, requiring significant restructuring to fix. Therefore it\u2019s a global error.",
            "error_type": "Global: incorrect logic and missing time filter"
        },
        "aba5ef6d5ebe30061e4ec2df": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the number of times patient 027-105098 got a urine event today.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-105098' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day')",
            "pred_sql": "SELECT count(cost.eventid) FROM cost INNER JOIN patient ON cost.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-105098' AND cost.eventtype = 'urine' AND cost.eventtime = '2100-12-01'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "no such column: cost.eventtime",
            "is_correct": false,
            "reasoning": "The predicted query refers to cost.eventtime, which is not a valid column in the cost table, and it even uses the wrong table (cost) instead of intakeoutput for urine events. The primary issue is a missing/incorrect column reference rather than a wholesale restructuring of the query\u2019s logic. This is a localized error that can be fixed by using the correct table and column names.",
            "error_type": "Local: table/column reference error"
        },
        "07ac0c8bc729ad36ff0e48ae": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What diagnosis did patient 027-111437 receive the last time since 1 year ago?",
            "gold_sql": "SELECT diagnosis.diagnosisname FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-111437' ) ) AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ORDER BY diagnosis.diagnosistime DESC LIMIT 1",
            "pred_sql": "SELECT diagnosis.diagnosisname FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.patientunitstayid = 1027 AND diagnosis.diagnosistime > datetime('now', '-1 year')",
            "gold_answer": "[['hyponatremia']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s structure (JOIN diagnosis to patient and filtering by a time window) matches the ground truth, but the WHERE clause is wrong: it hard\u2010codes patientunitstayid = 1027 instead of selecting by the given uniquepid through patienthealthsystemstayid, and it uses datetime('now') instead of the fixed '2100-12-31 23:59:00' reference. These are localized mistakes in the WHERE filters that can be fixed without reworking the overall query logic.",
            "error_type": "Local: incorrect WHERE filter"
        },
        "46eb2774e27a79287f213ed3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last input time of patient 006-104324 on the first icu visit?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-104324' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.patientunitstayid = '006-104324' AND patient.hospitaldischargeoffset = 1 ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['2100-05-10 10:00:00']]",
            "pred_answer": "no such column: patient.hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column patient.hospitaldischargeoffset, causing an execution error. This is a localized issue with a column reference and does not alter the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        }
    },
    "macsql": {
        "a9c37d707816110b60aebbd5": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Among patients who are diagnosed with pulmonary aspiration - large particulate aspirate , what are the top three most common diagnoses that followed within the same month?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'pulmonary aspiration - large particulate aspirate' ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.diagnosistime,'start of month') GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT `diagnosisname` FROM ( SELECT T2.`diagnosisname`, COUNT(*) AS `count` FROM diagnosis AS T1 JOIN diagnosis AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` AND datetime(T1.`diagnosistime`, 'start of month') = datetime(T2.`diagnosistime`, 'start of month') WHERE T1.`diagnosisname` = 'pulmonary aspiration - large particulate aspirate' AND T2.`diagnosisname` <> 'pulmonary aspiration - large particulate aspirate' GROUP BY T2.`diagnosisname` ORDER BY `count` DESC LIMIT 3 )",
            "gold_answer": "[['acute respiratory failure - due to inability to clear secretions'], ['pulmonary aspiration - large particulate aspirate']]",
            "pred_answer": "[['acute respiratory failure - due to inability to clear secretions']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins diagnosis records on patientunitstayid rather than on the patient\u2019s unique ID, which changes the scope of follow-on diagnoses (it limits results to the same ICU stay instead of the same patient). This is a structural mistake in how tables are related and affects the overall logic. It also excludes the original diagnosis name, which deviates from the ground truth behavior, but the primary flaw is the incorrect join key that fundamentally alters which events are matched.",
            "error_type": "Global: join-key error"
        },
        "245d45258d03fb5864a40c62": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the name of the last medication that was prescribed to patient 022-100938 in 02/this year?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-100938' ) ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '02' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT `drugname` FROM medication WHERE `patientunitstayid` = ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '022-100938' ) AND datetime(`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', `drugstarttime`) = '02' ORDER BY `drugstarttime` DESC LIMIT 1",
            "gold_answer": "[['synthroid']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query misapplies the temporal filter in the WHERE clause: it uses `datetime(drugstarttime, 'start of month') = ...` and `strftime('%d', drugstarttime) = '02'` (day = 02) instead of checking month = '02' relative to the start of the year. This is a mistake localized to the date\u2010filtering logic and does not require restructuring the joins or overall query flow. Thus it is a local error in the temporal condition.",
            "error_type": "Local: other-temporal error"
        },
        "9768a4a4b907cf6434f602e7": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When was the first time patient 007-10152 was prescribed medication via the feeding tube route in 05/this year?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10152' ) ) AND medication.routeadmin = 'feeding tube' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '05' ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(`drugstarttime`) AS first_feeding_tube_medication_time FROM medication WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '007-10152' ) AND `routeadmin` = 'feeding tube' AND datetime(`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m', `drugstarttime`) = '05'",
            "gold_answer": "[['2100-05-09 00:43:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s overall structure matches the intent\u2014filter by patient, route, month, and take the MIN date\u2014but it misuses the datetime modifier in the WHERE clause: it applies 'start of month' to drugstarttime and compares it to the 'start of year' of the current date, so no rows satisfy the condition. This is a localized mistake in a single condition rather than a flaw in the join logic or overall structure.",
            "error_type": "Local: other-temporal error"
        },
        "17aff9f53536f4057a93b06c": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "This year, how many patients received sodium chloride 0.9% 1,000 ml bag within the same hospital visit after being diagnosed with hemorrhage?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hemorrhage' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'sodium chloride 0.9% 1,000 ml bag' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T3.uniquepid) AS patient_count FROM patient AS T3 INNER JOIN ( SELECT DISTINCT T1.patientunitstayid FROM diagnosis AS T1 WHERE T1.diagnosisname LIKE '%hemorrhage%' AND datetime(T1.diagnosistime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS D ON T3.patientunitstayid = D.patientunitstayid INNER JOIN ( SELECT DISTINCT T2.patientunitstayid FROM medication AS T2 WHERE T2.drugname LIKE '%sodium chloride 0.9% 1,000 ml bag%' AND datetime(T2.drugstarttime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS M ON T3.patientunitstayid = M.patientunitstayid",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted query omits the critical temporal condition (ensuring the hemorrhage diagnosis occurs before the sodium chloride administration) and uses patientunitstayid to join events instead of patienthealthsystemstayid to enforce the same hospital visit. By failing to enforce event ordering and the correct visit identifier, the overall query logic is fundamentally altered, leading to incorrect results. This error spans multiple clauses (JOIN conditions and WHERE logic) and requires restructuring the query to include the temporal filter and correct join key.",
            "error_type": "Global: join and temporal logic error"
        }
    },
    "qwen3": {
        "79b2a1c645f45cee560dd09b": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What was the daily average input of p.o. for patient 002-1185 on the current hospital visit?",
            "gold_sql": "SELECT AVG(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' AND patient.hospitaldischargetime IS NULL ) ) AND intakeoutput.celllabel = 'p.o.' AND intakeoutput.cellpath LIKE '%intake%' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT SUM(io.cellvaluenumeric) / (julianday('2100-12-31 23:59:00') - julianday(p.unitadmittime)) AS daily_avg_p_o FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '002-1185' AND p.hospitaldischargetime IS NULL AND io.cellpath LIKE '%p.o.%';",
            "gold_answer": "[['260.0'], ['333.333']]",
            "pred_answer": "[['2331.114']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended logic. Instead of computing a per-day average by grouping intake values by date (as in the ground truth), it sums all p.o. inputs and divides by the time since admission, producing a single aggregate rather than daily averages. It also misuses cellpath for filtering \u2018p.o.\u2019 instead of using celllabel and omits the GROUP BY on the intake date. These errors require restructuring the aggregation and grouping logic across multiple clauses, not a localized fix.",
            "error_type": "Global: aggregation logic error"
        }
    },
    "o4-mini": {
        "1b72b914302d1dce0efd4293": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Find the number of current patients in the 60 or above age group.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL AND patient.age >= 60",
            "pred_sql": "SELECT COUNT(*) AS num_current_patients_60_plus FROM patient WHERE hospitaldischargetime IS NULL AND age >= 60;",
            "gold_answer": "[['14.0']]",
            "pred_answer": "[['20.0']]",
            "is_correct": false,
            "reasoning": "The predicted query counts all rows (COUNT(*)) rather than counting distinct patients. According to the assumptions, when counting patients you must use COUNT(DISTINCT patient.uniquepid). This is a localized mistake in the SELECT clause aggregate and does not alter the overall query structure or logic beyond missing the DISTINCT keyword.",
            "error_type": "Local: missing DISTINCT"
        }
    }
}