{
    "dinsql": {
        "bb8a3797c26badc2dc4e226f": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "How many days have passed from the time when patient 012-10585 was admitted to the icu?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '012-10585' AND patient.unitdischargetime IS NULL",
            "pred_sql": "julianday('2100-12-31') - julianday(patient.unitadmittime) AS days_passed FROM patient WHERE patient.uniquepid = '012-10585'",
            "gold_answer": "[['4.351']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword and does not apply the required filter on unitdischargetime IS NULL. The mistake is localized to the SELECT/WHERE clause syntax and does not alter the overall query structure or relationships between tables. Therefore, it is a local error.",
            "error_type": "Local: syntax error"
        },
        "0b64c8b521777103368b8d1f": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the number of times that patient 030-11672 visited the hospital in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.patienthealthsystemstayid ) FROM patient WHERE patient.uniquepid = '030-11672' AND strftime('%Y',patient.hospitaladmittime) = '2100'",
            "pred_sql": "COUNT(DISTINCT patienthealthsystemstayid) FROM patient WHERE uniquepid = '030-11672' AND strftime('%Y', hospitaladmittime) = '2100'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the SELECT keyword and the proper SELECT clause, making it a syntax/local error rather than a logical mistake in joining tables or query structure. The overall intention\u2014counting distinct hospital visits for the given patient in 2100\u2014is intact, but the missing SELECT renders the query invalid.",
            "error_type": "Local: syntax error"
        },
        "1c04274596c99433482a7a85": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the minimum total cost of hospitalization that includes the lactate laboratory test in 2100?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'lactate' ) ) AND strftime('%Y',cost.chargetime) = '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MIN(total_cost) AS min_total_cost FROM ( SELECT SUM(DISTINCT C.cost) AS total_cost FROM cost AS C JOIN lab AS L ON C.patienthealthsystemstayid = L.patientunitstayid WHERE L.labname = 'lactate' AND strftime('%Y', L.labresulttime) = '2100' AND C.eventtype IN ('diagnosis', 'treatment', 'lab', 'medication') GROUP BY C.patienthealthsystemstayid )",
            "gold_answer": "[['270.99']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": [
                "The predicted query attempts to link cost and lab tables directly by matching cost.patienthealthsystemstayid to lab.patientunitstayid, but these are different keys and should not be joined directly.",
                "This join error fundamentally alters the relationships between tables and returns no matching rows.",
                "Additionally, the predicted query filters lab events by labresulttime instead of summing costs by the charge time (cost.chargetime), deviating from the intended cost aggregation logic.",
                "These mistakes are not isolated to a single clause but affect the overall data associations and logic of the query."
            ],
            "error_type": "Global: incorrect join keys and filtering"
        },
        "d446acea3c3db0da8b178a5e": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Which drug was patient 029-10096 allergic to since 09/2100?",
            "gold_sql": "SELECT allergy.drugname FROM allergy WHERE allergy.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '029-10096' ) ) AND strftime('%Y-%m',allergy.allergytime) >= '2100-09'",
            "pred_sql": "SELECT DISTINCT drugname FROM allergy WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '029-10096' ) AND strftime('%Y-%m', allergytime) >= '2100-09'",
            "gold_answer": "[['lasix'], ['lasix'], ['sulfacetamide sod monohydrate'], ['sulfacetamide sod monohydrate']]",
            "pred_answer": "[['lasix'], ['sulfacetamide sod monohydrate']]",
            "is_correct": false,
            "reasoning": "The predicted query uses a single-level direct equality on patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '029-10096'), whereas the ground truth correctly links uniquepid \u2192 patienthealthsystemstayid \u2192 all patientunitstayid values to capture every ICU stay for that patient. The predicted SQL also uses '=' instead of 'IN', so it only returns allergies from one stay rather than all relevant stays. This misjoins the tables and breaks the intended patient\u2010to\u2010allergy relationship, requiring restructuring of the join logic rather than a simple fix in one clause.",
            "error_type": "Global: join error"
        }
    },
    "codes": {
        "d36a003d44b40986f4c9f773": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What does a procedure under the name bronchodilator - ipratropium cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'treatment' AND cost.eventid IN ( SELECT treatment.treatmentid FROM treatment WHERE treatment.treatmentname = 'bronchodilator - ipratropium' )",
            "pred_sql": "SELECT sum(cost.cost) FROM treatment INNER JOIN cost ON treatment.treatmentid = cost.eventid WHERE treatment.treatmentname = 'bronchodilator - ipratropium'",
            "gold_answer": "[['7.82']]",
            "pred_answer": "[['3804.96']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses SUM(cost.cost) and omits the WHERE cost.eventtype = 'treatment' filter, whereas the ground truth selects the distinct cost for that treatment. The mistake is localized to the SELECT aggregation and missing eventtype condition; the overall query structure (joining treatment to cost) is correct. Thus, this is a local error in aggregation and filtering, not a structural or multi-clause logic error.",
            "error_type": "Local: aggregation/filter error"
        },
        "222b30c626c9d40e3e5ba330": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the input that patient 016-10105 had first had on the first icu visit?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10105' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.cellpath FROM intakeoutput INNER JOIN patient ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '016-10105' ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "gold_answer": "[['p.o.']]",
            "pred_answer": "[['flowsheet|flowsheet cell labels|i&o|output (ml)|urine']]",
            "is_correct": false,
            "reasoning": "The predicted query completely alters the intended logic: it does not restrict to the patient\u2019s first ICU visit (no filtering on unitadmittime/unitdischargetime), it fails to filter for input events (no cellpath LIKE '%intake%'), orders by hospitaladmittime instead of intakeoutput time, and even selects the wrong column (cellpath vs. celllabel). These errors span multiple clauses and require a full restructure of the query, not just a minor fix in one clause.",
            "error_type": "Global: join-logic error"
        },
        "adf3b75d45df166e7546b701": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many days have there been since patient 002-10122's admission to the hospital?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.hospitaladmittime) ) FROM patient WHERE patient.uniquepid = '002-10122' AND patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT strftime('%J', hospitaladmittime) - strftime('%J', admissiontime) AS daysadmitted FROM patient WHERE uniquepid = '002-10122'",
            "gold_answer": "[['2.263']]",
            "pred_answer": "no such column: admissiontime",
            "is_correct": false,
            "reasoning": "The predicted query references a non-existent column admissiontime instead of the correct hospitaladmittime, leading to a column reference error. This is a localized mistake in the SELECT clause and WHERE clause rather than a flaw in the overall query logic or structure.",
            "error_type": "Local: table/column reference error"
        },
        "53c37ca3610c5c63ad42caa5": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Give me the details of the time patient 021-102127 was admitted to the hospital in 2100.",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '021-102127' AND strftime('%Y',patient.hospitaladmittime) = '2100'",
            "pred_sql": "SELECT patient.hospitaladmittime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '021-102127' AND strftime('%Y', patient.hospitaladmittime) = '2100'",
            "gold_answer": "[['2100-03-15 17:09:00']]",
            "pred_answer": "[['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00']]",
            "is_correct": false,
            "reasoning": "The predicted query adds an INNER JOIN to the vitalperiodic table on patientunitstayid, which is not requested by the question. This join is unnecessary and unrelated to admission time, and it causes the admission time to be duplicated once for each matching vitalperiodic record. Fixing this would require removing the join entirely rather than a simple tweak within a single clause, as it fundamentally changes the query logic and structure.",
            "error_type": "Global: incorrect-join error"
        },
        "f82872c399e9c56e24060fd1": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the procedure that was performed two or more times last month on patient 010-10275?",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, COUNT( treatment.treatmenttime ) AS C1 FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10275' ) ) AND datetime(treatment.treatmenttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 >= 2",
            "pred_sql": "SELECT DISTINCT vitalperiodic.vitalname FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.unitdischargeoffset = '02' AND patient.uniquepid = '010-10275' AND vitalperiodic.vitalname LIKE '%procedure%' GROUP BY vitalperiodic.vitalname HAVING count(vitalperiodic.patientunitstayid) > 2",
            "gold_answer": "[['non-invasive ventilation']]",
            "pred_answer": "no such column: vitalperiodic.vitalname",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column \"vitalperiodic.vitalname\", causing a column reference error. This is a localized mistake in the SELECT clause rather than a flaw in the overall query structure or logic. The fix would involve correcting the column and table references, but the rest of the query framework (SELECT, JOIN, GROUP BY, HAVING) remains intact.",
            "error_type": "Local: table/column reference error"
        },
        "cf12388db91329bf2b7bd2cf": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times since 1 year ago did patient 030-11483 receive a hct test?",
            "gold_sql": "SELECT COUNT(*) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-11483' ) ) AND lab.labname = 'hct' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(vitalperiodic.observationtime) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '030-11483' AND vitalperiodic.observationtime >= datetime('2100-01-01 00:00:00', 'start of year', '-1 year')",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['508.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts rows from the vitalperiodic table (vital sign observations) instead of the lab table, and thus uses an entirely different table and join logic than intended. This mistake affects the core logic of the query, not just a localized clause or alias. Therefore, it is a global error in the query structure and table relationships.",
            "error_type": "Global: incorrect table join"
        },
        "6dd0c27259db780596544f5f": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much did patient 031-10188 weigh the first time it was measured in 09/2100?",
            "gold_sql": "SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10188' ) AND patient.admissionweight IS NOT NULL AND strftime('%Y-%m',patient.unitadmittime) = '2100-09' ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.admissionweight FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '031-10188' AND strftime('%Y-%m-%d', vitalperiodic.observationtime) = '2100-09-01'",
            "gold_answer": "[['94.8']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the patient table to vitalperiodic and filters on vitalperiodic.observationtime when the question is specifically asking for the admission weight recorded in the patient table (patient.admissionweight) at the first unit admission in September 2100. This is a fundamental logic error: it uses the wrong table for weight data and the wrong time filter, altering the intended query structure and meaning. Fixing it requires removing the join, changing the date criteria to unitadmittime, and ordering by that field\u2014i.e., a global restructuring of the query.",
            "error_type": "Global: join-logic error"
        },
        "8a40ba404a60b00e4b158864": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "This year, what are the top five most commonly taken specimens for patients within the same month after the diagnosis of prostate ca?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'prostate ca' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.culturetakentime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.culturetakentime,'start of month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT diagnosis.icd9code FROM diagnosis INNER JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y %m', diagnosis.diagnosistime) = '2100 12' AND diagnosis.icd9code LIKE '585.4%' GROUP BY diagnosis.icd9code ORDER BY count(diagnosis.icd9code) DESC LIMIT 5",
            "gold_answer": "[['sputum, expectorated']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL entirely abandons the intended logic of retrieving the most common microlab.culturesite within the same month after a 'prostate ca' diagnosis this year. Instead, it selects diagnosis.icd9code, filters on a year\u2010month string and an unrelated ICD9 pattern, and groups by diagnoses rather than specimens. It fails to join diagnosis to microlab, omits the same\u2010month and post\u2010diagnosis conditions, and uses the wrong column and table. Fixing this would require rewriting major parts of the query, not just a localized tweak.",
            "error_type": "Global: incorrect table and logic"
        },
        "3c14c5beb79448ccd421c493": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first time that patient 021-10001 had the maximum value of sao2 yesterday?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '021-10001' ) ) AND vitalperiodic.sao2 IS NOT NULL AND datetime(vitalperiodic.observationtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') ORDER BY vitalperiodic.sao2 DESC, vitalperiodic.observationtime ASC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '021-10001' AND vitalperiodic.observationtime >= datetime('2100 12 31 23:59:00',' 1 day') AND vitalperiodic.sao2 = ( SELECT max(sao2) FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '021-10001' AND vitalperiodic.observationtime >= datetime('2100 12 31 23:59:00',' 1 day') )",
            "gold_answer": "[['2100-12-30 19:59:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses an incorrect datetime function call and filter for \"yesterday\". It writes datetime('2100 12 31 23:59:00',' 1 day') instead of the prescribed datetime('2100-12-31 23:59:00','start of day','-1 day'). As a result, no rows match the date condition and the max(sao2) subquery also uses the same wrong filter. This is a localized error in the WHERE clause\u2019s date handling rather than a flaw in the overall join strategy or query structure.",
            "error_type": "Local: other-temporal error"
        },
        "12a07e53370dee4c45959cd3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Which are the top three most frequent output events since 2 year ago?",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime) >= datetime('2100-12-31 23:59:00','-2 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT intakeoutput.cellpath FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE intakeoutput.cellpath IS NOT NULL AND intakeoutput.cellpath LIKE '%output%' AND strftime('%Y', intakeoutput.intakeoutputtime) < strftime('%Y', 'now') - 2 ORDER BY intakeoutput.cellpath DESC LIMIT 3",
            "gold_answer": "[['stool'], ['urine'], ['urine catheter']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally deviates from the intended structure and logic. Instead of aggregating by celllabel and ranking the counts to find the top three frequent output events since two years ago, it selects cellpath (not celllabel), adds an unnecessary JOIN to the patient table, applies an incorrect time filter using strftime('%Y') < strftime('%Y','now') - 2, and simply orders by cellpath descending with a LIMIT 3. These changes alter the overall query purpose\u2014there is no grouping, counting, or proper time window check\u2014so this is not a localized fix but a structural logic error.",
            "error_type": "Global: flawed aggregation and filtering logic"
        },
        "38ed40195f70eb4a952a2a53": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times was morphine 5 mg/ml injection : 1 ml vial medication prescribed?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.drugname = 'morphine 5 mg/ml injection : 1 ml vial'",
            "pred_sql": "SELECT count(DISTINCT medication.patientunitstayid) FROM medication INNER JOIN treatment ON medication.patientunitstayid = treatment.patientunitstayid WHERE medication.drugname = 'morphine 5 mg/ml'",
            "gold_answer": "[['12.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query not only mismatches the drug name filter ('morphine 5 mg/ml' vs the exact 'morphine 5 mg/ml injection : 1 ml vial') but also introduces an unnecessary INNER JOIN to the treatment table and changes the aggregation from COUNT(*) of medication rows to COUNT(DISTINCT patientunitstayid). This alters the overall query logic and structure, affecting the intended result.",
            "error_type": "Global: incorrect join and aggregation"
        },
        "f10a334eb28950674d5eac2e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the minimum total cost of the hospital visits that involve a procedure called insertion of venous catheter for hemodialysis since 1 year ago?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'insertion of venous catheter for hemodialysis' ) ) AND datetime(cost.chargetime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT sum(CASE WHEN cost.eventtype = 'Procedure' AND cost.description = 'insertion of venous catheter for hemodialysis' THEN cost.cost ELSE 0 END) FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.eventdate >= datetime(patient.hospitaladmittime, '-1 year') AND cost.eventdate <= datetime(patient.hospitaladmittime)",
            "gold_answer": "[['1640.7']]",
            "pred_answer": "no such column: cost.description",
            "is_correct": false,
            "reasoning": "The predicted SQL not only references a non-existent column (cost.description) but also completely changes the intended logic\u2014joining cost directly to patient, using the wrong date filters, failing to group by visit and take the minimum across sums, and ignoring the treatment table. Fixing these issues would require a major restructuring of the query, not just a local tweak.",
            "error_type": "Global: join and aggregation logic error"
        }
    },
    "deepseek": {
        "9aa241d49a094b71909dfa84": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the total continuous infusion meds amount given for patient 011-13921 on the first icu visit?",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '011-13921' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.celllabel = 'continuous infusion meds' AND intakeoutput.cellpath LIKE '%intake%'",
            "pred_sql": "SELECT SUM(CAST(SUBSTR(m.dosage, 1, INSTR(m.dosage, ' ') - 1) AS REAL)) AS total_continuous_infusion_meds_amount FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '011-13921' AND m.routeadmin = 'iv' AND m.drugstarttime >= (SELECT p.unitadmittime FROM patient p WHERE p.uniquepid = '011-13921' ORDER BY p.unitadmittime ASC LIMIT 1) AND m.drugstarttime <= (SELECT p.unitdischargetime FROM patient p WHERE p.uniquepid = '011-13921' ORDER BY p.unitadmittime ASC LIMIT 1);",
            "gold_answer": "[['2254.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the data source and logic: it uses the medication table and parses the dosage field with an IV route filter, whereas the ground truth uses the intakeoutput table with celllabel 'continuous infusion meds' and cellpath LIKE '%intake%' restricted to the first ICU visit. This is not a minor syntax fix but a fundamentally different query structure and table selection, thus a global error.",
            "error_type": "Global: incorrect table usage"
        },
        "b0aec40fac3a41abe889d377": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the daily average of patient 005-10384's weight this year?",
            "gold_sql": "SELECT AVG(patient.admissionweight) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10384' ) AND patient.admissionweight IS NOT NULL AND datetime(patient.unitadmittime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY strftime('%Y-%m-%d',patient.unitadmittime)",
            "pred_sql": "SELECT AVG(weight) AS daily_average_weight FROM vitalperiodic JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '005-10384' AND datetime(vitalperiodic.observationtime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year');",
            "gold_answer": "[['65.5']]",
            "pred_answer": "no such column: weight",
            "is_correct": false,
            "reasoning": "The predicted query references a column \"weight\" in the vitalperiodic table, but no such column exists in that table (it has temperature, sao2, heartrate, etc.). This is a straightforward column reference error and does not require restructuring the query\u2019s logic or joins.",
            "error_type": "Local: column reference error"
        }
    },
    "o4-mini": {
        "4f6b31be61ebcdb2cc215e06": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the top four most frequent medications prescribed within 2 months to patients in their 30s after they are diagnosed with pre-eclampsia/ eclampsia?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'pre-eclampsia/ eclampsia' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 30 AND 39 ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH first_diag AS ( SELECT patientunitstayid, MIN(diagnosistime) AS diag_time FROM diagnosis WHERE LOWER(diagnosisname) LIKE '%pre-eclampsia%' OR LOWER(diagnosisname) LIKE '%eclampsia%' GROUP BY patientunitstayid ) SELECT m.drugname FROM first_diag fd JOIN patient p ON p.patientunitstayid = fd.patientunitstayid JOIN medication m ON m.patientunitstayid = fd.patientunitstayid WHERE p.age BETWEEN 30 AND 39 AND m.drugstarttime >= fd.diag_time AND m.drugstarttime <= DATETIME(fd.diag_time, '+2 months') GROUP BY m.drugname ORDER BY COUNT(*) DESC LIMIT 4;",
            "gold_answer": "[['1000 ml : lactated ringers iv soln'], ['alprazolam 0.5 mg po tabs'], ['diphenhydramine hcl 25 mg po caps'], ['diphenhydramine hcl 50 mg/ml ij soln'], ['metoclopramide hcl 5 mg/ml ij soln'], ['naloxone hcl 0.4 mg/ml ij soln'], ['ondansetron hcl 4 mg po tabs'], ['ondansetron hcl 4 mg/2ml ij soln'], ['oxycodone-acetaminophen 5-325 mg po tabs'], ['sennosides-docusate sodium 8.6-50 mg po tabs'], ['sodium chloride 0.9 % ij soln'], ['zolpidem tartrate 5 mg po tabs']]",
            "pred_answer": "[['diphenhydramine hcl 25 mg po caps'], ['diphenhydramine hcl 50 mg/ml ij soln'], ['ondansetron hcl 4 mg/2ml ij soln'], ['sennosides-docusate sodium 8.6-50 mg po tabs']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how the top medications are selected: it uses LIMIT 4 rather than a DENSE_RANK() window to include ties, and it groups by patientunitstayid rather than uniquepid. These are not simple syntax fixes but alter the overall logic and result set. Therefore, this is a structural, global error in the query\u2019s ranking and grouping logic.",
            "error_type": "Global: incorrect ranking logic"
        },
        "fd64d6670cf4d3da09d342f3": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many times did patient 004-1262 have clonidine?",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-1262' ) ) AND treatment.treatmentname = 'clonidine'",
            "pred_sql": "SELECT COUNT(*) AS clonidine_count FROM medication m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '004-1262' AND m.drugname LIKE '%clonidine%';",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and joins on patientuniquepid, but the intent is to count treatment events (treatment table) for clonidine. This is not a simple column or syntax mistake\u2014it fundamentally changes the query logic by querying the wrong table and association. Fixing it would require rewriting the entire FROM/JOIN clause to use the treatment table instead of medication, so it is a global error.",
            "error_type": "Global: incorrect join"
        }
    }
}