{
    "codes": {
        "7c89f2615c9df69c34bbec67": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 031-10578 receive a urine, voided specimen microbiology test for the last time since 10/2100?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10578' ) ) AND microlab.culturesite = 'urine, voided specimen' AND strftime('%Y-%m',microlab.culturetakentime) >= '2100-10' ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "pred_sql": "SELECT lab.labresulttime FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '031-10578' AND lab.labname = 'Urine, void specimen' AND strftime('%Y',lab.labresulttime) = '2100' AND strftime('%m',lab.labresulttime) = '10' ORDER BY lab.labresulttime DESC LIMIT 1",
            "gold_answer": "[['2100-12-05 03:15:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the lab table and uses lab.labname instead of querying microlab.culturesite on the microlab table. The question explicitly asks for a microbiology test result (\u201curine, voided specimen microbiology test\u201d), which is stored in microlab, not lab. By using the wrong table and field, it completely changes the query\u2019s logic and returns no results. This is not a simple typo in a column name but a fundamental structural error requiring a different table and join, so it is a global error.",
            "error_type": "Global: wrong table usage"
        },
        "efb670084c99628cf9947e3b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Retrieve the top three most common input events since 2 year ago.",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime) >= datetime('2100-12-31 23:59:00','-2 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT intakeoutput.cellpath FROM vitalperiodic INNER JOIN intakeoutput ON vitalperiodic.patientunitstayid = intakeoutput.patientunitstayid WHERE intakeoutput.cellpath LIKE '%input%' AND vitalperiodic.observationtime > datetime('now', '-2 years') GROUP BY intakeoutput.cellpath ORDER BY count(intakeoutput.cellpath) DESC LIMIT 3",
            "gold_answer": "[['continuous infusion meds'], ['ns ivf'], ['p.o.']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a JOIN with the vitalperiodic table, which is not required by the question and fundamentally changes the scope of the query by restricting intake events to those with matching vital records. It also selects cellpath instead of celllabel and uses the wrong time reference ('now' instead of the fixed '2100-12-31 23:59:00'), altering the intended logic. These issues span multiple clauses and require restructuring the query logic to fix, so it is a Global error.",
            "error_type": "Global: incorrect join"
        },
        "1f0a42220dea53233554b8ab": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Show me the difference between patient 002-1185's total input and output yesterday.",
            "gold_sql": "SELECT ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') ) - ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') )",
            "pred_sql": "SELECT sum(CASE WHEN intakeoutput.cellpath LIKE '%intake%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) - sum(CASE WHEN intakeoutput.cellpath LIKE '%output%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '002-1185' AND intakeoutput.intakeoutputtime LIKE '2100-12-31%'",
            "gold_answer": "[['2826.0']]",
            "pred_answer": "[['936.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL has a localized mistake in the WHERE clause: it filters intakeoutput.intakeoutputtime LIKE '2100-12-31%' (today) instead of filtering for yesterday using the required datetime(...) = datetime('2100-12-31 23:59:00','start of day','-1 day'). This temporal filter error is confined to a specific condition and does not require restructuring joins or the overall logic.",
            "error_type": "Local: other-temporal error"
        },
        "22bb11305202941a2417c8ab": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times was milk of magnesia ud liq 30 ml prescribed for patient 006-102963 on the first hospital visit?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-102963' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND medication.drugname = 'milk of magnesia ud liq 30 ml'",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid = 61880 AND medication.drugname = 'milk of magnesia ud liq 30 ml'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL hard-codes a single patientunitstayid (61880) rather than using the subquery logic to identify the patient\u2019s first hospital visit by patienthealthsystemstayid and hospitaladmittime as required. By replacing the multi-step filter with a fixed unitstayid, it fundamentally changes the query\u2019s intent and yields the wrong result. This is not a minor syntax or column reference mistake but a structural flaw in how the first hospital visit is determined.",
            "error_type": "Global: incorrect filtering logic"
        },
        "fbe51bdcf93df9fe52db2682": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Present the count of icu visits for patient 027-100293 in 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.patientunitstayid ) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100293' ) AND strftime('%Y',patient.unitadmittime) = '2100'",
            "pred_sql": "SELECT count(patienthealthsystemstayid) FROM patient WHERE uniquepid = '027-100293' AND unitdischargeoffset >= 2100000000",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: unitdischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column 'unitdischargeoffset' in the patient table, causing the error 'no such column: unitdischargeoffset'. This is a localized column reference issue in the WHERE clause and does not affect the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "919f039cb4f4fe92f49e7c86": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many current patients belong to the 30s age category?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL AND patient.age BETWEEN 30 AND 39",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE age >= 30 AND age < 40 AND hospitaldischargeoffset IS NULL",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column hospitaldischargeoffset instead of the correct hospitaldischargetime. This is purely a column reference error localized to the WHERE clause and does not alter the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "23bd0f2e14627cd02d82be60": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the name of the lab test that patient 004-11678 received first on the current hospital visit?",
            "gold_sql": "SELECT lab.labname FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-11678' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT lab.labname FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid = 11678 ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "gold_answer": "[['sodium']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins lab to patient but then filters on patient.patientunitstayid = 11678 (erroneously treating the unique PID as the unit stay ID) and omits the WHERE patient.hospitaldischargetime IS NULL condition entirely. This is not a simple typo or local clause mistake\u2014it fundamentally alters which records are selected and ignores the \"current hospital visit\" requirement. Correcting this requires restructuring the filter logic (using patient.uniquepid and checking hospitaldischargetime IS NULL), so it is a global error.",
            "error_type": "Global: incorrect filter and join logic"
        },
        "a18e5a51354eb5e0974771b6": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Among patients who received non-invasive ventilation this year, what are the top four most frequent medications that followed within the same month?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'non-invasive ventilation' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugstarttime LIKE '2100-11%' AND patient.unittype LIKE 'VENT' GROUP BY medication.drugname ORDER BY count(patient.patientunitstayid) DESC LIMIT 4",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['potassium chloride 20 meq in 50 ml ivpb **locked dose'], ['potassium chloride crys er 20 meq po tbcr']]",
            "pred_answer": "no such column: patient.unittype",
            "is_correct": false,
            "reasoning": "The predicted SQL references patient.unittype, which does not exist in the provided schema, causing a column reference error. This is a localized mistake in the WHERE clause that does not require restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "e3634a5a873426f73dde721b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What drugs are being added to patient 002-1185's prescription today, as compared to yesterday?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '002-1185' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') EXCEPT SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '002-1185' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT DISTINCT CASE WHEN datetime(medication.drugstarttime) = datetime('2100-12-31 23:59:59') THEN 'today' ELSE 'yesterday' END AS date FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-1185'",
            "gold_answer": "[['acetaminophen 325 mg po tabs']]",
            "pred_answer": "[['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday']]",
            "is_correct": false,
            "reasoning": "The predicted SQL does not follow the overall intended logic of finding drug names added today compared to yesterday. Instead of selecting and comparing medication.drugname sets for today and yesterday (using EXCEPT), it simply returns a CASE expression of 'today' or 'yesterday' labels without any drug names or set difference. This is a fundamental structural and logical error that affects the entire query rather than a localized clause.",
            "error_type": "Global: incorrect query logic"
        },
        "c18b36446697d1dd00ce17f4": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the maximum overall hospital cost that includes ipratropium bromide 0.02 % in soln this year?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = 'ipratropium bromide 0.02 % in soln' ) ) AND datetime(cost.chargetime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT max(cost.cost) FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.cost = 'ipratropium bromide 0.02 % in soln this year'",
            "gold_answer": "[['3713.41']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely fails to capture the intended logic: it never sums costs per hospital stay, never filters by the medication or by the year, and even compares the numeric cost column to a string that includes the drug name and 'this year'. It only joins cost to patient and then applies a nonsensical WHERE clause on cost.cost. Fixing this would require rewriting the core structure of the query (adding subqueries or GROUP BY, proper joins to medication, date filtering, and summing), not just tweaking a single clause. Therefore, this is a Global error.",
            "error_type": "Global: join/logical error"
        }
    },
    "deepseek": {
        "a63f998370bbc0b3359e838b": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "List the top four most frequent diagnoses that patients are diagnosed with within the same hospital visit after receiving inotropic agent - epinephrine > 0.1 micrograms/kg/min this year.",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'inotropic agent - epinephrine > 0.1 micrograms/kg/min' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.diagnosistime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT diagnosisname FROM diagnosis WHERE patientunitstayid IN ( SELECT m.patientunitstayid FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE m.drugname = 'inotropic agent - epinephrine' AND (CAST(SUBSTR(m.dosage, 1, INSTR(m.dosage, ' ') - 1) AS REAL) / p.admissionweight) > 0.1 AND STRFTIME('%Y', p.hospitaladmittime) = '2100' AND m.drugstarttime < diagnosistime ) GROUP BY diagnosisname ORDER BY COUNT(diagnosisname) DESC LIMIT 4;",
            "gold_answer": "[['s/p cabg < 7 days'], ['valve replacement < 7days - aortic']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic by using the medication table instead of the treatment table, miscomputing the dosage condition, filtering by hospital admission year rather than treatment/diagnosis times, and failing to join on the same patienthealthsystemstayid to ensure diagnoses occur within the same visit. These errors span multiple clauses and alter the intended data relationships, requiring a complete restructuring of the query logic rather than a localized fix.",
            "error_type": "Global: incorrect table usage and join logic"
        },
        "fb0def8c2f5978a67d16803e": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "When was the last time that patient 007-10459 was prescribed nacl 0.9% adv and vancomycin in 05/2100 at the same time?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10459' ) AND medication.drugname = 'vancomycin' AND strftime('%Y-%m',medication.drugstarttime) = '2100-05' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10459' ) AND medication.drugname = 'nacl 0.9% adv' AND strftime('%Y-%m',medication.drugstarttime) = '2100-05' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(m1.drugstarttime) AS last_prescription_time FROM patient JOIN medication m1 ON patient.patientunitstayid = m1.patientunitstayid JOIN medication m2 ON m1.patientunitstayid = m2.patientunitstayid WHERE patient.patientidentifier = '007-10459' AND m1.drugname = 'nacl 0.9% adv' AND m2.drugname = 'vancomycin' AND m1.drugstarttime < m2.drugstoptime AND m2.drugstarttime < m1.drugstoptime AND strftime('%Y-%m', m1.drugstarttime) = '2100-05' AND strftime('%Y-%m', m2.drugstarttime) = '2100-05';",
            "gold_answer": "[['2100-05-22 05:44:00']]",
            "pred_answer": "no such column: patient.patientidentifier",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references patient.patientidentifier, which does not exist in the schema (the correct column is patient.uniquepid). This is a simple column naming mistake localized to the WHERE clause and can be fixed without altering the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        }
    },
    "llm2sql": {
        "9850b09854dcbb18771ddd9c": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What were the number of patients who received a ptt ratio test since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'ptt ratio' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) FROM lab WHERE labname = 'ptt ratio' AND datetime(labresulttime) >= datetime('2100-12-31 23:59:00', '-1 year')",
            "gold_answer": "[['20.0']]",
            "pred_answer": "[['22.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts DISTINCT patientunitstayid directly from the lab table, effectively counting distinct ICU stays rather than distinct patients. The ground truth SQL first identifies patientunitstayid values from the lab table and then counts DISTINCT patient.uniquepid in the patient table, ensuring that the result is the number of unique patients. By omitting the patient table join and using the wrong field for counting, the predicted query fundamentally alters the query\u2019s intended meaning\u2014counting stays instead of patients.",
            "error_type": "Global: join error"
        },
        "017a9b0a55f8e7958d82ef86": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the number of days since patient 002-10122 was first diagnosed with acute respiratory failure on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) ) FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10122' AND patient.hospitaldischargetime IS NULL ) ) AND diagnosis.diagnosisname = 'acute respiratory failure' ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT ROUND((julianday('2100-12-31 23:59:00') - julianday(D1.diagnosistime)), 0) AS days_since_diagnosis FROM patient AS P INNER JOIN diagnosis AS D1 ON P.patientunitstayid = D1.patientunitstayid WHERE P.uniquepid = '002-10122' AND D1.diagnosisname = 'acute respiratory failure' AND P.hospitaldischargetime IS NULL ORDER BY D1.diagnosistime ASC LIMIT 1",
            "gold_answer": "[['2.255']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates only in the SELECT clause by using ROUND(..., 0) on the day difference, producing an integer value with one decimal (\u20182.0\u2019) instead of the more precise float rounded to three decimals (\u20182.255\u2019) as required. The join logic, table references, and WHERE filters correctly identify the current hospital visit and diagnosis, so the structural and logical flow remains intact. The only mistake is the local rounding of the numerical result.",
            "error_type": "Local: rounding error"
        }
    },
    "dinsql": {
        "f9fcc93b5505cb3b35d9dfdc": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "List the top three most common diagnoses for patients in their 30s.",
            "gold_sql": "SELECT T1.diagnosisname FROM ( SELECT diagnosis.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 30 AND 39 ) GROUP BY diagnosis.diagnosisname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT diagnosisname FROM diagnosis WHERE patientunitstayid IN ( SELECT patientunitstayid FROM patient WHERE CAST(age AS INTEGER) BETWEEN 30 AND 39 ) GROUP BY diagnosisname ORDER BY COUNT(diagnosisname) DESC LIMIT 3",
            "gold_answer": "[['acute respiratory failure'], ['diabetes mellitus'], ['esrd (end stage renal disease)'], ['septic shock']]",
            "pred_answer": "[['acute respiratory failure'], ['diabetes mellitus'], ['esrd (end stage renal disease)']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a simple GROUP BY with ORDER BY COUNT and LIMIT 3, whereas the ground truth uses DENSE_RANK to include all diagnoses tied for the third most common. By using LIMIT 3, the predicted query omits any tied entries beyond the first three rows, thus changing the intended logic of returning all top-three-ranked diagnoses (including ties). This is not a minor column typo or syntax fix but a fundamental flaw in the ranking strategy that spans the overall query structure. Therefore, it is a Global error.",
            "error_type": "Global: incorrect ranking method"
        },
        "2d0d2460ff714b2ed38ef17a": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What are the five most frequently prescribed medications for patients diagnosed with hypertension - hypertensive emergency/urgency previously within the same month, since 1 year ago?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypertension - hypertensive emergency/urgency' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT T2.drugname FROM diagnosis AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'hypertension - hypertensive emergency/urgency' AND datetime(T1.diagnosistime, 'start of month') = datetime(T2.drugstarttime, 'start of month') AND datetime(T1.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY T2.drugname ORDER BY COUNT(T2.drugname) DESC LIMIT 5",
            "gold_answer": "[['10 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['albuterol sulfate (2.5 mg/3ml) 0.083% in nebu'], ['alteplase 2 mg ij solr'], ['vancomycin hcl 1000 mg iv solr']]",
            "pred_answer": "[['10 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['2 ml : ondansetron hcl 4 mg/2ml iv soln'], ['amlodipine besylate 10 mg po tabs'], ['carvedilol 6.25 mg po tabs']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the critical condition ensuring that each medication\u2019s start time occurs after the diagnosis time (T1.diagnosistime < T2.drugstarttime). This missing temporal filter causes medications prescribed earlier in the same month to be incorrectly counted. The overall query structure (JOIN, GROUP BY, ORDER BY and LIMIT) remains intact; only a localized WHERE\u2010clause condition is missing.",
            "error_type": "Local: other-temporal error"
        },
        "47fc7d3548e30d33d281d558": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Please tell me the total number of patients who had a cl flush: introducer sheath ij r input since 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT intakeoutput.patientunitstayid FROM intakeoutput WHERE intakeoutput.celllabel = 'cl flush: introducer sheath ij r' AND intakeoutput.cellpath LIKE '%input%' AND strftime('%Y',intakeoutput.intakeoutputtime) >= '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT P.patientunitstayid) FROM patient AS P INNER JOIN intakeoutput AS IO ON P.patientunitstayid = IO.patientunitstayid WHERE IO.cellpath LIKE '%cl flush: introducer sheath ij r%' AND datetime(IO.intakeoutputtime) >= datetime('2100-01-01 00:00:00')",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted query makes localized mistakes in the SELECT and WHERE clauses without altering the overall query structure. Specifically: (1) It uses IO.cellpath LIKE '%cl flush\u2026%' instead of filtering on the correct column (celllabel) and misses the required input filter (cellpath LIKE '%input%'). (2) It counts DISTINCT patientunitstayid instead of DISTINCT patient.uniquepid. These are column/reference and filter errors confined to individual clauses, not a change in the join logic or overall query design.",
            "error_type": "Local: column/filter reference error"
        }
    },
    "macsql": {
        "ca898dcba71dbcfe723e83b0": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many patients had a skin test administered?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT microlab.patientunitstayid FROM microlab WHERE microlab.culturesite = 'skin' )",
            "pred_sql": "SELECT COUNT(DISTINCT `patientunitstayid`) AS num_patients_with_skin_test FROM lab WHERE `labname` LIKE '%skin%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table and filters on labname LIKE '%skin%', whereas the correct logic requires querying the microlab table and filtering on culturesite = 'skin'. This is not a simple typo or local clause mistake but a fundamental misuse of the wrong table, altering the query\u2019s overall logic.",
            "error_type": "Global: incorrect table selection"
        },
        "d9e859cc9f043fddabe6d778": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many days have elapsed since the first time a procedure was performed on patient 027-100843 on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100843' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT JULIANDAY('2100-12-31 23:59:00') - JULIANDAY( (SELECT MIN(`treatmenttime`) FROM treatment WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '027-100843' AND `hospitaldischargetime` IS NULL )) ) AS days_elapsed",
            "gold_answer": "[['34.919']]",
            "pred_answer": "[['7.621']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how the patient\u2019s current admission is identified and how the first procedure time is retrieved. The ground truth SQL first finds the patient\u2019s current hospital admission (via patienthealthsystemstayid) and then filters all treatment records for any ICU stay (patientunitstayid) within that admission, ordering by treatment time to get the very first procedure. The predicted SQL, however, simply selects a single patientunitstayid row (without considering the patienthealthsystemstayid join) and then takes MIN(treatmenttime) for that one unitstay. This alters the intended relationship between hospital admissions and ICU stays and thus the resulting treatment time. Correcting this isn\u2019t a small tweak in one clause but requires restoring the proper sub-query structure (or join) to bind to the correct admission, so it\u2019s a global logic/structure error.",
            "error_type": "Global: incorrect join error"
        }
    },
    "qwen3": {
        "5e88f3adc2224af386b15188": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients underwent cardiology consultation within the same hospital visit after normal saline solution?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'normal saline solution' ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'cardiology consultation' ) AS T2 WHERE T1.treatmenttime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM treatment t JOIN patient p ON t.patientunitstayid = p.patientunitstayid WHERE t.treatmentname = 'normal saline administration' AND EXISTS ( SELECT 1 FROM diagnosis d JOIN patient p2 ON d.patientunitstayid = p2.patientunitstayid WHERE p2.patienthealthsystemstayid = p.patienthealthsystemstayid AND d.diagnosisname = 'cardiology consultation' AND d.diagnosistime > t.treatmenttime );",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic by querying the diagnosis table for 'cardiology consultation' instead of the treatment table and even uses the wrong treatment name 'normal saline administration'. This is not a localized typo or minor syntax issue but a structural error that alters which tables and relationships are used, thus requiring a significant rewrite of the query logic.",
            "error_type": "Global: incorrect table/join usage"
        }
    }
}