{
    "o4-mini": {
        "63354d6c1558c315d8c2e34f": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What is the percentile tsh value of 0.05 among patients of the same age as patient 012-10585 on the current hospital visit?",
            "gold_sql": "SELECT DISTINCT T1.C1 FROM ( SELECT lab.labresult, PERCENT_RANK() OVER ( ORDER BY lab.labresult ) AS C1 FROM lab WHERE lab.labname = 'tsh' AND lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age = ( SELECT patient.age FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) ) AS T1 WHERE T1.labresult = 0.05",
            "pred_sql": "SELECT SUM(CASE WHEN lab.labresult <= 0.05 THEN 1 ELSE 0 END) * 1.0 / COUNT(*) AS percentile FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE lab.labname = 'tsh' AND patient.hospitaldischargetime IS NULL AND patient.age = ( SELECT age FROM patient WHERE uniquepid = '012-10585' AND hospitaldischargetime IS NULL );",
            "gold_answer": "[['0.111']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a SUM/COUNT approach to compute the percentile (cumulative distribution) instead of the PERCENT_RANK() window function as specified. This error is confined to the SELECT clause\u2019s percentile calculation logic and does not involve incorrect table references, joins, or overall query structure. Therefore, it\u2019s a local error in how the percentile is computed.",
            "error_type": "Local: percentile calculation error"
        },
        "bb0088a72f4862ae157b5887": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Can you provide me the daily minimum amount of intake, iv amount that patient 033-10289 received since 06/02/2100?",
            "gold_sql": "SELECT MIN(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '033-10289' ) ) AND intakeoutput.celllabel = 'intake, iv amount' AND intakeoutput.cellpath LIKE '%intake%' AND strftime('%Y-%m-%d',intakeoutput.intakeoutputtime) >= '2100-06-02' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT date(io.intakeoutputtime) AS day, MIN(io.cellvaluenumeric) AS min_iv_intake FROM intakeoutput io JOIN patient p ON io.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '033-10289' AND io.cellpath LIKE '%intake%' AND io.cellpath LIKE '%i.v.%' AND date(io.intakeoutputtime) >= '2100-06-02' GROUP BY date(io.intakeoutputtime) ORDER BY day;",
            "gold_answer": "[['453.0'], ['495.0'], ['671.0'], ['715.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses io.cellpath LIKE '%i.v.%' instead of filtering on celllabel = 'intake, iv amount'. This is a localized mistake in the WHERE clause pattern matching and does not alter the overall query structure or joins. The patient join is acceptable, but the incorrect condition on cellpath leads to no rows being returned.",
            "error_type": "Local: incorrect WHERE clause value pattern"
        },
        "9dc2faa762a87d534e0d1c11": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days have elapsed since patient 012-10585 received his or her first antibacterials on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) AND treatment.treatmentname = 'antibacterials' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT CAST( julianday('2100-12-31 23:59:00') - julianday(MIN(m.drugstarttime)) AS INTEGER) AS days_elapsed FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '012-10585' AND p.hospitaldischargetime IS NULL AND ( LOWER(m.drugname) LIKE '%cillin%' OR LOWER(m.drugname) LIKE '%mycin%' OR LOWER(m.drugname) LIKE '%cef%' OR LOWER(m.drugname) LIKE '%floxacin%' OR LOWER(m.drugname) LIKE '%sulfa%' );",
            "gold_answer": "[['4.057']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query sources the first antibacterial event from the medication table (using drugname patterns and drugstarttime) instead of the treatment table with treatmentname='antibacterials' as required by the question and ground truth. This mistake affects the overall logic and data source of the query, not just a minor syntax or column reference error. It changes which events are counted and how the patient\u2019s current hospital visit is identified, thus altering the intended meaning of the query. Consequently, this is a global error in the query structure and logic.",
            "error_type": "Global: incorrect table selection"
        },
        "746f97e945c295d0b4e02ffd": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the four most usual lab tests for patients in their 20s this year?",
            "gold_sql": "SELECT T1.labname FROM ( SELECT lab.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 20 AND 29 ) AND datetime(lab.labresulttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY lab.labname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT lab.labname FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 20 AND 29 AND strftime('%Y', lab.labresulttime) = '2100' GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 4;",
            "gold_answer": "[['bedside glucose'], ['chloride'], ['creatinine'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose'], ['chloride'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted query uses ORDER BY COUNT(*) DESC LIMIT 4 instead of applying a DENSE_RANK filter to include ties at the 4th rank. This mistake is confined to the ranking/selection logic within the ORDER/GROUP BY clause and does not alter the tables joined or the overall structure of the query. Therefore it is a localized error in how the top-four labs are chosen, not a flaw in the global query logic.",
            "error_type": "Local: ranking error"
        }
    },
    "llm2sql": {
        "8df73cbaa10a750ff09381e3": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the 3-month survival rate for patients living with a bacteremia diagnosis?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'bacteremia' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "SELECT (CAST(SUM(CASE WHEN patient.hospitaldischargestatus = 'alive' AND datetime(patient.hospitaldischargetime) <= datetime(diagnosis.diagnosistime, '+91 days') THEN 1 ELSE 0 END) AS REAL) / COUNT(DISTINCT patient.patientunitstayid)) AS survival_rate FROM patient JOIN diagnosis ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname LIKE '%bacteremia%'",
            "gold_answer": "[['0.833']]",
            "pred_answer": "[['4.2']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally miscalculates the 3-month survival rate. It uses patientunitstayid instead of uniquepid, never filters out patients diagnosed less than three months ago, and incorrectly interprets survival by checking for \"alive\" and discharge within 91 days rather than survival beyond 3 months or expiration within that window. These issues span the cohort selection, date logic, grouping, and numerator/denominator calculation, altering the query\u2019s intended meaning and requiring structural changes across clauses.",
            "error_type": "Global: flawed survival calculation"
        },
        "d050f7add43df6e757dd7add": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Tell me the percentile of mch 30.1 among all patients of the same age as patient 006-104411 on the last hospital visit?",
            "gold_sql": "SELECT DISTINCT T1.C1 FROM ( SELECT lab.labresult, PERCENT_RANK() OVER ( ORDER BY lab.labresult ) AS C1 FROM lab WHERE lab.labname = 'mch' AND lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age = ( SELECT patient.age FROM patient WHERE patient.uniquepid = '006-104411' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) ) AS T1 WHERE T1.labresult = 30.1",
            "pred_sql": "WITH AgePatient AS ( SELECT age FROM patient WHERE uniquepid = '006-104411' ), LastVisitPatients AS ( SELECT patientunitstayid FROM patient WHERE age = (SELECT age FROM AgePatient) AND hospitaldischargetime IS NOT NULL AND patientunitstayid IN ( SELECT patientunitstayid FROM patient ORDER BY hospitaladmittime DESC ) ), MCHValues AS ( SELECT lab.labresult AS mch_value FROM lab WHERE lab.labname LIKE '%mch%' AND lab.patientunitstayid IN (SELECT patientunitstayid FROM LastVisitPatients) ), RankedMCH AS ( SELECT mch_value, NTILE(100) OVER(ORDER BY mch_value) AS percentile FROM MCHValues ) SELECT percentile FROM RankedMCH WHERE mch_value = 30.1;",
            "gold_answer": "[['0.504']]",
            "pred_answer": "[['23.0'], ['23.0'], ['23.0'], ['23.0'], ['24.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates fundamentally from the intended logic in multiple ways. First, it uses NTILE(100) instead of PERCENT_RANK(), which completely changes how the percentile is calculated (NTILE buckets results into integer groups rather than computing a 0\u20131 rank). Second, its CTE for \u2018LastVisitPatients\u2019 is wrong: it filters on hospitaldischargetime IS NOT NULL but then uses \u201cIN (SELECT patientunitstayid FROM patient ORDER BY hospitaladmittime DESC)\u201d without limiting to the most recent visit per patient, so it ends up including all visits rather than each patient\u2019s last one. Third, it matches labname with LIKE '%mch%' instead of exactly 'mch', potentially pulling unrelated tests. These issues span multiple clauses and alter the overall structure and semantics of the query, requiring a rewrite rather than a simple fix in one clause.",
            "error_type": "Global: incorrect ranking and visit-selection logic"
        }
    },
    "macsql": {
        "82f6f02a554527d1b7e3eb21": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What does it cost to have darbepoetin alfa?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'treatment' AND cost.eventid IN ( SELECT treatment.treatmentid FROM treatment WHERE treatment.treatmentname = 'darbepoetin alfa' )",
            "pred_sql": "SELECT DISTINCT C.`cost` FROM medication AS M INNER JOIN cost AS C ON M.`patientunitstayid` = C.`patientunitstayid` WHERE M.`drugname` LIKE '%darbepoetin alfa%' AND C.`eventtype` = 'medication'",
            "gold_answer": "[['7.76']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and joins cost on patientunitstayid with eventtype='medication', whereas the correct query must use the treatment table and join cost.eventid to treatment.treatmentid with eventtype='treatment'. This is not a simple fix within one clause but requires changing the table, join key, and event type, altering the overall logic of the query.",
            "error_type": "Global: join error"
        }
    },
    "deepseek": {
        "b3a0ff53392263e54edf05b0": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "When was patient 005-10974's first antidepressant - trazodone (desyrel) treatment on the first hospital visit?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10974' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND treatment.treatmentname = 'antidepressant - trazodone (desyrel)' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(m.drugstarttime) AS first_trazodone_time FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '005-10974' AND (m.drugname = 'trazodone' OR m.drugname = 'Desyrel') AND p.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '005-10974' );",
            "gold_answer": "[['2100-09-19 01:14:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query uses the medication table and drugstarttime to find the first trazodone event, whereas the question and ground truth require the treatment table and treatmenttime for 'antidepressant - trazodone (desyrel)' specifically on the first completed hospital visit. This mistake of choosing the wrong table and column and misapplying the hospital admission logic affects the overall structure and intended semantics of the query, not just a localized condition or syntax.",
            "error_type": "Global: incorrect table usage"
        },
        "8d42b976f508ae3b52c0c22f": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Share the five most frequently performed procedures since 2100.",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment WHERE strftime('%Y',treatment.treatmenttime) >= '2100' GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "WITH procedures AS ( SELECT 'diagnosis' AS type, diagnosisname AS procedure_name, cost.chargetime FROM cost JOIN diagnosis ON cost.eventid = diagnosis.diagnosisid AND cost.patientunitstayid = diagnosis.patientunitstayid WHERE cost.event_type = 'diagnosis' AND chargetime >= '2100-01-01' UNION ALL SELECT 'treatment' AS type, treatmentname AS procedure_name, cost.chargetime FROM cost JOIN treatment ON cost.eventid = treatment.treatmentid AND cost.patientunitstayid = treatment.patientunitstayid WHERE cost.event_type = 'treatment' AND chargetime >= '2100-01-01' UNION ALL SELECT 'lab' AS type, labname AS procedure_name, cost.chargetime FROM cost JOIN lab ON cost.eventid = lab.labid AND cost.patientunitstayid = lab.patientunitstayid WHERE cost.event_type = 'lab' AND chargetime >= '2100-01-01' UNION ALL SELECT 'medication' AS type, drugname AS procedure_name, cost.chargetime FROM cost JOIN medication ON cost.eventid = medication.medicationid AND cost.patientunitstayid = medication.patientunitstayid WHERE cost.event_type = 'medication' AND chargetime >= '2100-01-01' ) SELECT procedure_name, COUNT(*) AS frequency FROM procedures GROUP BY procedure_name ORDER BY frequency DESC LIMIT 5;",
            "gold_answer": "[['antiemetic - serotonin antagonist'], ['chest x-ray'], ['mechanical ventilation'], ['normal saline administration'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "no such column: cost.event_type",
            "is_correct": false,
            "reasoning": "The predicted SQL refers to cost.event_type, but the actual column is named cost.eventtype. This is a simple column reference error and does not require restructuring the query\u2019s overall logic or tables.",
            "error_type": "Local: column reference error"
        }
    },
    "codes": {
        "a0cf8ef52f1f759a0bad1de7": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Since 1 year ago, what are the top three most frequent drugs prescribed to patients within 2 months after the prescription of ondansetron 4mg/2ml inj?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.drugstarttime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.drugstarttime) AND datetime(T1.drugstarttime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugstarttime >= ( SELECT medication.drugstarttime FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' ) AND medication.drugstarttime < ( SELECT medication.drugstarttime FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' ) + 2 * 30 * 24 * 60 * 60 GROUP BY medication.drugname ORDER BY count(medication.drugname) DESC LIMIT 3",
            "gold_answer": "[['dextrose 50% vial'], ['ondansetron 4mg/2ml inj'], ['sodium chloride 0.9% 1000 ml']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to implement the core logic of the question: it does not restrict to the past year, it does not correlate each patient\u2019s ondansetron prescription to their subsequent prescriptions, and it uses uncorrelated subqueries for the ondansetron drugstarttime rather than a per-patient join/window. These issues span multiple clauses (WHERE, JOIN, subqueries) and require a complete restructure of the query logic, not just a minor fix in a single clause.",
            "error_type": "Global: incorrect join logic"
        },
        "cd9635be7ce342f3e0c3219b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the cost of sodium phosphate 30 mmol/250ml ns?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'medication' AND cost.eventid IN ( SELECT medication.medicationid FROM medication WHERE medication.drugname = 'sodium phosphate 30 mmol/250ml ns' )",
            "pred_sql": "SELECT cost.cost FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.eventtype = 'medication' AND cost.costid = 13",
            "gold_answer": "[['12.63']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL does not filter costs by the medication event ID nor reference the medication table to identify the correct event. Instead, it hardcodes cost.costid = 13 and introduces an unnecessary join to patient, altering the core logic of linking cost entries to the specified drug. This misjoins tables and changes the intended filtering, requiring restructuring of the query beyond a simple clause fix.",
            "error_type": "Global: join error"
        },
        "4808850ccfbd9313e08bc1e3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "On the first hospital visit, what is the age of patient 006-100663?",
            "gold_sql": "SELECT patient.age FROM patient WHERE patient.uniquepid = '006-100663' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.age FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.patientunitstayid = 143870",
            "gold_answer": "[['74.0']]",
            "pred_answer": "[['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by joining the vitalperiodic table and filtering on a specific patientunitstayid rather than selecting the first hospital visit for uniquepid '006-100663' with hospitaldischargetime IS NOT NULL. It ignores the required ORDER BY and LIMIT, uses the wrong table and key, and returns repeated values. This is not a localized syntax or column mistake but a structural error that alters the intended meaning of the query.",
            "error_type": "Global: incorrect join"
        },
        "2d95eaed3db09e820ba3514d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the yearly average respiratory rate for patient 031-10598 since 164 days ago?",
            "gold_sql": "SELECT AVG(vitalperiodic.respiration) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10598' ) ) AND vitalperiodic.respiration IS NOT NULL AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31 23:59:00','-164 day') GROUP BY strftime('%Y',vitalperiodic.observationtime)",
            "pred_sql": "SELECT avg(vitalperiodic.respiration) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '031-10598' AND vitalperiodic.observationtime > (CURRENT_TIMESTAMP - INTERVAL '164' DAY)",
            "gold_answer": "[['17.138']]",
            "pred_answer": "near \"'164'\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to a syntax error in the WHERE clause when using \u201cCURRENT_TIMESTAMP - INTERVAL \u2018164\u2019 DAY\u201d, which is invalid in SQLite. This misuse of a temporal expression is localized to the date calculation and does not require restructuring the overall query logic. The rest of the query (JOIN, filters) remains intact, so it\u2019s a specific temporal syntax/local error.",
            "error_type": "Local: other-temporal error"
        },
        "f26a89e87c532d575cf44788": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much is a ethanol lab test?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'lab' AND cost.eventid IN ( SELECT lab.labid FROM lab WHERE lab.labname = 'ethanol' )",
            "pred_sql": "SELECT labresult FROM lab WHERE labname = 'ethanol'",
            "gold_answer": "[['8.3']]",
            "pred_answer": "[['0.0'], ['0.027'], ['1.0'], ['108.0'], ['114.0'], ['126.0'], ['138.0'], ['141.0'], ['145.0'], ['148.0'], ['15.0'], ['155.0'], ['168.0'], ['183.0'], ['184.0'], ['188.0'], ['193.0'], ['197.4'], ['198.0'], ['209.0'], ['22.0'], ['222.5'], ['223.0'], ['228.0'], ['231.0'], ['234.0'], ['244.0'], ['246.0'], ['247.0'], ['248.0'], ['250.0'], ['264.0'], ['266.0'], ['271.0'], ['284.0'], ['30.0'], ['309.0'], ['313.0'], ['316.3'], ['324.0'], ['338.0'], ['349.0'], ['35.0'], ['353.0'], ['355.0'], ['372.0'], ['383.0'], ['39.0'], ['41.0'], ['422.0'], ['447.0'], ['55.0'], ['60.0'], ['67.0'], ['68.0'], ['72.0'], ['75.0'], ['86.0'], ['89.0'], ['97.0'], ['98.0'], ['99.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries lab.labresult instead of retrieving the cost from the cost table. It ignores the cost.eventtype = 'lab' filter and the cost.eventid join, selecting the wrong column and table. Fixing this requires changing the SELECT source to cost.cost and adding the appropriate WHERE conditions, without altering the overall query structure.",
            "error_type": "Local: column reference error"
        },
        "926163a5316b8d10e3e66e0d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the total stool output in patient 006-106828 yesterday?",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106828' ) ) AND intakeoutput.celllabel = 'stool' AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT sum(CASE WHEN intakeoutput.intakeoutputtime = ( SELECT max(intakeoutput.intakeoutputtime) FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '006-106828' ) THEN intakeoutput.cellvaluenumeric ELSE 0 END) FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '006-106828' AND intakeoutput.cellpath = 'Cumulative output (ml)'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the intended logic: instead of summing stool outputs from yesterday, it sums only the latest cumulative output value regardless of date and uses the wrong cellpath. It omits the date filter and the stool label filter, and restructures the query to use a max timestamp subquery. These are not isolated syntax or reference mistakes but a fundamental misinterpretation of the requirement, requiring a major rewrite of the query logic.",
            "error_type": "Global: incorrect overall logic"
        },
        "8b553152e14bffb35726fff3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 022-100769 have their first urine catheter output on 10/21/this year?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-100769' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine catheter' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '10-21' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '022-100769' AND strftime('%Y %m %d', intakeoutput.intakeoutputtime) = '2100 10 21'",
            "gold_answer": "[['2100-10-21 00:00:00']]",
            "pred_answer": "[['2100-10-21 00:00:00'], ['2100-10-21 01:08:00'], ['2100-10-21 01:58:00'], ['2100-10-21 03:03:00'], ['2100-10-21 04:53:00'], ['2100-10-21 06:58:00'], ['2100-10-21 09:00:00'], ['2100-10-21 11:00:00'], ['2100-10-21 12:04:00'], ['2100-10-21 13:00:00'], ['2100-10-21 14:00:00'], ['2100-10-21 15:00:00'], ['2100-10-21 16:00:00'], ['2100-10-21 17:00:00'], ['2100-10-21 18:00:00'], ['2100-10-21 19:00:00'], ['2100-10-21 20:00:00'], ['2100-10-21 21:30:00'], ['2100-10-21 22:00:00'], ['2100-10-21 23:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the required filters for intakeoutput.cellpath LIKE '%output%' and intakeoutput.celllabel = 'urine catheter', and it omits the ORDER BY ... LIMIT 1 to return only the first event. Instead it returns all intakeoutput events for that patient on the given date. These are errors confined to the WHERE clause and result-ranking clause, and can be fixed by adding the missing filter conditions and ordering/limit without altering the overall query structure.",
            "error_type": "Local: missing filter and limit conditions"
        }
    },
    "qwen3": {
        "05ba864d3e4a7ee0d0933a8d": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "When did patient 017-100600 come for the last time to the hospital?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '017-100600' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(hospitaldischargetime) AS last_visit FROM patient WHERE uniquepid = '017-100600' AND hospitaldischargetime IS NOT NULL;",
            "gold_answer": "[['2100-08-09 22:05:00']]",
            "pred_answer": "[['2100-08-13 19:27:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses MAX(hospitaldischargetime) instead of retrieving the last hospitaladmittime. This is a simple column reference mistake (using the discharge time rather than the admit time) and can be fixed by selecting MAX(hospitaladmittime) or by ordering and limiting on hospitaladmittime. It does not require restructuring the query\u2019s joins or logic beyond correcting the column name.",
            "error_type": "Local: column reference error"
        }
    },
    "dinsql": {
        "ac1820fc6650cabcf6d961c7": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "When did patient 003-10464 get his/her last prescription of albuterol/ipratropium neb 3ml on the first hospital visit?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10464' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND medication.drugname = 'albuterol/ipratropium neb 3ml' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(T2.drugstoptime) FROM patient AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '003-10464' AND T2.drugname = 'albuterol/ipratropium neb 3ml' AND T1.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '003-10464' AND hospitaldischargetime IS NOT NULL )",
            "gold_answer": "[['2100-11-11 18:35:00']]",
            "pred_answer": "[['2100-11-13 17:22:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in the SELECT clause: it aggregates MAX(drugstoptime) instead of ordering by and selecting the latest drugstarttime. The join logic, patient filtering, and first-visit restriction are structurally correct. This is a localized mistake in column selection, not a change to the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "9e616b0295d51d1aa25f7b71": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Count the number of patients for whom dexmedetomidine 200 mcg in 50 ml ns was prescribed within the same hospital visit post their diagnosis of acute coronary syndrome - acute myocardial infarction (no st elevation) this year.",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'dexmedetomidine 200 mcg in 50 ml ns' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T1.uniquepid) FROM patient AS T1 JOIN diagnosis AS T2 ON T1.patientunitstayid = T2.patientunitstayid JOIN medication AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE T2.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND T3.drugname = 'dexmedetomidine 200 mcg in 50 ml ns' AND strftime('%Y', T2.diagnosistime) = '2100' AND T1.patienthealthsystemstayid = T3.patienthealthsystemstayid AND datetime(T3.drugstarttime) > datetime(T2.diagnosistime)",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: T3.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL references T3.patienthealthsystemstayid, but the medication table does not have a patienthealthsystemstayid column (it only has patientunitstayid). This is a column reference error localized to the WHERE clause, and can be fixed by using the correct column (patientunitstayid) or joining on the correct key without altering the overall query structure.",
            "error_type": "Local: table/column reference error"
        },
        "fd736d3c511756e9cf8ead74": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Can you give me patient 031-10598's yearly average respiratory rate since 164 days ago?",
            "gold_sql": "SELECT AVG(vitalperiodic.respiration) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10598' ) ) AND vitalperiodic.respiration IS NOT NULL AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31 23:59:00','-164 day') GROUP BY strftime('%Y',vitalperiodic.observationtime)",
            "pred_sql": "SELECT AVG(respiration) AS average_respiratory_rate FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '031-10598' ) AND datetime(observationtime) >= datetime('2100-12-31 23:59:00', '-164 days') GROUP BY strftime('%Y', observationtime)",
            "gold_answer": "[['17.138']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a single equality filter on patientunitstayid directly from the patient table (SELECT patientunitstayid FROM patient WHERE uniquepid='031-10598'), whereas the correct query must first map uniquepid to a patienthealthsystemstayid and then find all related patientunitstayid values. This is not a minor syntax or column error but a fundamental flaw in how the patient and vitalperiodic tables are related, altering the intended logic and resulting in empty results.",
            "error_type": "Global: incorrect join/filter logic"
        }
    }
}