{
    "codes": {
        "7e59c5d99907c76cf6b5598a": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the minimum monthly number of patients who had bacteremia - gram negative rod?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnosis.patientunitstayid ) AS C1 FROM diagnosis WHERE diagnosis.diagnosisname = 'bacteremia - gram negative rod' GROUP BY strftime('%Y-%m',diagnosis.diagnosistime) ) AS T1",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.diagnosisname LIKE '%bacteremia - gram negative rod%' AND diagnosis.diagnosisname LIKE '%colitis%' AND vitalperiodic.observationtime > patient.hospitaladmittime AND vitalperiodic.observationtime < date(patient.hospitaladmittime, '+1 MONTH')",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the logic by joining unrelated tables (vitalperiodic), adding extra filters on diagnosisname (including an irrelevant 'colitis' condition), and applying a time window on observationtime\u2014none of which align with the intended monthly aggregation of distinct diagnosis records. This is not a fixable syntax or single-clause mistake but a fundamental restructuring error that alters the query\u2019s purpose.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "b2647d82e56896db485d4407": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the prescription drug that patient 030-12393 was prescribed within the same hospital visit after being diagnosed with hyperglycemia in 11/this year?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-12393' ) AND diagnosis.diagnosisname = 'hyperglycemia' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',diagnosis.diagnosistime) = '11' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-12393' ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '11' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid INNER JOIN diagnosis ON diagnosis.patientunitstayid = patient.patientunitstayid INNER JOIN vitalperiodic ON vitalperiodic.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.icd9code = '401.9' AND strftime('%m',vitalperiodic.observationtime) = '11' AND patient.uniquepid = '030-12393'",
            "gold_answer": "[['aspirin'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diphenhydramine hcl'], ['furosemide'], ['furosemide'], ['insulin lispro'], ['lisinopril'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['pantoprazole'], ['simvastatin']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the query logic by:\n1. Joining an unrelated vitalperiodic table, which is not part of the question about prescriptions after a hyperglycemia diagnosis.\n2. Filtering diagnosis by icd9code = '401.9' (hypertension) instead of diagnosisname = 'hyperglycemia'.\n3. Filtering on vitalperiodic.observationtime rather than medication.drugstarttime.\n4. Failing to enforce the temporal condition (diagnosis before prescription) and restricting to the same hospital visit.\nThese errors span multiple joins and clauses and fundamentally alter the query\u2019s intended structure and meaning. This is a Global error.",
            "error_type": "Global: join-error"
        },
        "57e889bf3fe08a0c30249fce": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 006-1016 experience the first instance where their heart rate was greater than 135.0?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-1016' ) ) AND vitalperiodic.heartrate > 135.0 AND vitalperiodic.heartrate IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1",
            "pred_sql": "SELECT observationtime FROM vitalperiodic WHERE patientunitstayid = 241360 AND heartrate > 135 ORDER BY observationtime LIMIT 1",
            "gold_answer": "[['2100-01-16 02:20:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query hard-codes patientunitstayid = 241360 instead of deriving the correct patientunitstayid(s) for uniquepid '006-1016' via the patient table joins. This is not a simple syntax or column-name mistake but a flawed filtering strategy that breaks the intended relationship between patient and vitalperiodic. It alters which records are considered and thus the overall logic of fetching the first high heart rate event for the specified patient.",
            "error_type": "Global: incorrect join/filter relationship"
        },
        "91fbea49b336f86cd67dbbda": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many days have elapsed since the last time patient 006-106259 got a platelets x 1000 lab test on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',lab.labresulttime) ) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106259' AND patient.hospitaldischargetime IS NULL ) ) AND lab.labname = 'platelets x 1000' ORDER BY lab.labresulttime DESC LIMIT 1",
            "pred_sql": "SELECT 2100 - strftime('%Y', lab.labresulttime) - strftime('%m', lab.labresulttime) + strftime('%d', lab.labresulttime) AS num FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '006-106259' AND lab.labname = 'platelets x 1000'",
            "gold_answer": "[['1.52']]",
            "pred_answer": "[['15.0'], ['16.0'], ['17.0'], ['18.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict the lab results to the current hospital visit (no filter on hospitaldischargetime) and does not pick the most recent lab (no ORDER BY/LIMIT). It also uses an incorrect formula for date difference (2100 - year - month + day), rather than computing the Julian day difference relative to the fixed current time. These issues span multiple clauses (JOIN, WHERE, SELECT) and alter the overall logic, making the query fundamentally unable to answer the intended question.",
            "error_type": "Global: flawed structure and date calculation"
        },
        "ea593b30374a160e1a7febd4": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Is patient 002-12056's alt (sgpt) last measured on the first hospital visit greater than the first value measured on the first hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'alt (sgpt)' ORDER BY lab.labresulttime DESC LIMIT 1 ) > ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'alt (sgpt)' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "SELECT DISTINCT CASE WHEN iif(sum(CASE WHEN vitalperiodic.observationlabel = 'ALT (SGPT)' THEN 1 ELSE 0 END) - sum(CASE WHEN vitalperiodic.observationlabel = 'ALT (SGPT)' THEN 0 ELSE 1 END) > 0, 1, 0) THEN 'YES' ELSE 'NO' END FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargeoffset = 0",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: vitalperiodic.observationlabel",
            "is_correct": false,
            "reasoning": "The predicted SQL references vitalperiodic.observationlabel, but the vitalperiodic table does not have an observationlabel column. This is a straightforward column reference error and does not require restructuring the entire query logic.",
            "error_type": "Local: table/column reference error"
        },
        "fd36b7748e8aadbcb2963358": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What's the respiratory rate change of patient 027-101654 second measured on the first icu visit compared to the first value measured on the first icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101654' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 OFFSET 1 ) - ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101654' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 )",
            "pred_sql": "SELECT vitalperiodic.respiration - ( SELECT vitalperiodic.respiration FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-101654' ORDER BY vitalperiodic.observationtime ASC LIMIT 1 ) AS resp_change FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid ORDER BY vitalperiodic.observationtime ASC LIMIT 1",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to the first ICU visit and does not correctly select the second respiration measurement. Instead, it joins all vitalperiodic records for the patient, uses ORDER BY and LIMIT 1 in the outer query (which yields the first measurement, not the second), and lacks the subquery logic to identify the first ICU stay. These mistakes alter the overall query structure and logic rather than a single clause, so this is a global error.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "cd490e6dc2219e3ae3f771d1": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Could you tell me the name of the drug that was prescribed two times to patient 006-101311?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, COUNT( medication.drugstarttime ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-101311' ) ) GROUP BY medication.drugname ) AS T1 WHERE T1.C1 = 2",
            "pred_sql": "SELECT medication.drugname FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.uniquepid = '006-101311' GROUP BY medication.drugname ORDER BY count(patient.patientunitstayid) = 2 LIMIT 1",
            "gold_answer": "[['magnesium sulfate 2 gm/50 ml ivpb']]",
            "pred_answer": "[['aspirin 325mg tab']]",
            "is_correct": false,
            "reasoning": "The predicted query correctly joins patient to medication and groups by drugname but mistakenly uses ORDER BY count(...) = 2 and LIMIT 1 instead of filtering with a WHERE or HAVING count = 2. This misuse of ORDER BY is confined to a specific clause and does not require restructuring the joins or overall query logic. It can be fixed locally by replacing the ORDER BY/ LIMIT logic with a HAVING count = 2 filter.",
            "error_type": "Local: incorrect filtering in ORDER BY clause"
        },
        "09866a4f032da7b5f0cf5fef": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What's the cost of a drug known as buffered lidocaine 1%?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'medication' AND cost.eventid IN ( SELECT medication.medicationid FROM medication WHERE medication.drugname = 'buffered lidocaine 1%' )",
            "pred_sql": "SELECT DISTINCT cost.cost FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patientunitstayid WHERE medication.drugname = 'buffered lidocaine 1%'",
            "gold_answer": "[['14.04']]",
            "pred_answer": "[['10.03'], ['10.04'], ['10.06'], ['10.19'], ['10.42'], ['10.5'], ['10.57'], ['10.61'], ['10.62'], ['10.79'], ['10.82'], ['10.98'], ['11.14'], ['11.5'], ['11.62'], ['11.66'], ['12.14'], ['12.33'], ['12.35'], ['12.68'], ['12.75'], ['12.76'], ['12.78'], ['12.9'], ['12.99'], ['13.17'], ['13.21'], ['13.31'], ['13.42'], ['13.46'], ['13.47'], ['13.5'], ['13.52'], ['13.6'], ['13.65'], ['13.68'], ['13.69'], ['13.79'], ['13.86'], ['13.88'], ['13.91'], ['13.94'], ['13.95'], ['13.97'], ['13.99'], ['14.04'], ['14.05'], ['14.13'], ['14.2'], ['14.27'], ['14.33'], ['14.35'], ['14.39'], ['14.41'], ['14.44'], ['14.62'], ['14.67'], ['14.74'], ['14.83'], ['14.94'], ['14.96'], ['15.0'], ['15.18'], ['15.26'], ['15.3'], ['15.4'], ['15.53'], ['15.74'], ['15.77'], ['15.79'], ['15.85'], ['16.66'], ['6.15'], ['6.23'], ['6.61'], ['6.81'], ['6.91'], ['7.07'], ['7.2'], ['7.51'], ['7.7'], ['7.77'], ['7.82'], ['7.9'], ['7.98'], ['8.13'], ['8.25'], ['8.46'], ['8.52'], ['8.59'], ['8.61'], ['8.63'], ['8.65'], ['8.75'], ['8.78'], ['8.86'], ['8.97'], ['9.01'], ['9.11'], ['9.22']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins medication to cost on patientunitstayid rather than linking cost.eventid to medication.medicationid and filtering cost.eventtype = 'medication'. This incorrect join key pulls in all cost records for patients who received the drug, rather than the cost of that specific drug event. Fixing it requires restructuring the JOIN and WHERE clauses (using cost.eventid and eventtype), which is a change to the overall query logic rather than a minor local fix.",
            "error_type": "Global: incorrect join key"
        }
    },
    "macsql": {
        "7f8b7f9548aac71092377027": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Count the number of times that patient 028-10451 had oral on this month/14.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '028-10451' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND intakeoutput.celllabel = 'oral' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '14'",
            "pred_sql": "SELECT COUNT(*) FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '028-10451' ) AND `cellpath` LIKE '%intake%' AND `celllabel` = 'p.o.' AND datetime(`intakeoutputtime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', `intakeoutputtime`) = '14'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the WHERE clause: it uses the wrong intake label ('p.o.' instead of 'oral') and oversimplifies the patient lookup, but the overall query structure (COUNT, date filtering, table relationships) remains intact. This is a localized error in the data filtering, not a fundamental logic or join structure issue.",
            "error_type": "Local: value parsing error"
        },
        "0815c33a58055c1981683dbf": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the last medication that patient 030-10753 was prescribed in 02/this year?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-10753' ) ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '02' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT T2.`drugname` FROM patient AS T1 INNER JOIN medication AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` WHERE T1.`uniquepid` = '030-10753' AND datetime(T2.`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', T2.`drugstarttime`) = '02' ORDER BY T2.`drugstarttime` DESC LIMIT 1",
            "gold_answer": "[['lorazepam']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s JOIN and table references are correct, but its WHERE clause incorrectly filters for records on the 2nd day of the current month (using start-of-month plus day = '02') instead of filtering for the month '02' of this year. This is an error confined to the temporal filtering logic in the WHERE clause and does not change the overall structure or joins of the query.",
            "error_type": "Local: other-temporal error"
        },
        "c3c29c659b13a485cb286bdd": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When was the last time since 05/2100 that patient 025-11138 was prescribed with potassium chloride er 10 meq tablet,extended release and 15 ml cup : potassium chloride 10 % oral liqd at the same time?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-11138' ) AND medication.drugname = 'potassium chloride er 10 meq tablet,extended release' AND strftime('%Y-%m',medication.drugstarttime) >= '2100-05' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-11138' ) AND medication.drugname = '15 ml cup : potassium chloride 10 % oral liqd' AND strftime('%Y-%m',medication.drugstarttime) >= '2100-05' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(datetime(`drugstarttime`)) FROM ( SELECT `patientunitstayid`, `drugstarttime` FROM medication WHERE `patientunitstayid` IN ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '025-11138' ) AND `drugname` = 'potassium chloride er 10 meq tablet, extended release' AND datetime(`drugstarttime`) >= datetime('2100-05-01 00:00:00') ) AS T1 JOIN ( SELECT `patientunitstayid`, `drugstarttime` FROM medication WHERE `patientunitstayid` IN ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '025-11138' ) AND `drugname` = '15 ml cup : potassium chloride 10 % oral liqd' AND datetime(`drugstarttime`) >= datetime('2100-05-01 00:00:00') ) AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` AND datetime(T1.`drugstarttime`, 'start of day') = datetime(T2.`drugstarttime`, 'start of day')",
            "gold_answer": "[['2100-08-02 07:47:00']]",
            "pred_answer": "ambiguous column name: drugstarttime",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to an ambiguous column reference: in the outer SELECT MAX(datetime(`drugstarttime`)), the column `drugstarttime` is not qualified with a table alias, and both subqueries T1 and T2 define that column. This is a simple column reference error and can be fixed by prefixing the column with the correct alias (e.g., T1.drugstarttime). It does not require reworking the query\u2019s logic or structure.",
            "error_type": "Local: column reference error"
        }
    },
    "dinsql": {
        "019a52f54e374bbedbe7d39e": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Get me the top four most frequent lab tests that patients had within the same hospital visit after receiving antihypertensive drug - nicardipine.",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antihypertensive drug - nicardipine' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH NicardipinePatients AS ( SELECT DISTINCT patientunitstayid, patienthealthsystemstayid FROM medication WHERE drugname LIKE '%nicardipine%' ), LabTestsAfterNicardipine AS ( SELECT lab.labname FROM lab INNER JOIN NicardipinePatients ON lab.patientunitstayid = NicardipinePatients.patientunitstayid INNER JOIN medication ON lab.patientunitstayid = medication.patientunitstayid WHERE medication.drugname LIKE '%nicardipine%' AND datetime(lab.labresulttime) > datetime(medication.drugstarttime) AND lab.patientunitstayid = medication.patientunitstayid AND lab.patientunitstayid IN ( SELECT patientunitstayid FROM patient WHERE patienthealthsystemstayid = NicardipinePatients.patienthealthsystemstayid ) ), RankedLabTests AS ( SELECT labname, COUNT(*) AS frequency FROM LabTestsAfterNicardipine GROUP BY labname ORDER BY frequency DESC LIMIT 4 ) SELECT labname FROM RankedLabTests",
            "gold_answer": "[['bedside glucose'], ['bicarbonate'], ['chloride'], ['creatinine'], ['potassium'], ['sodium']]",
            "pred_answer": "no such column: patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL fails with \u201cno such column: patienthealthsystemstayid\u201d because the subquery references NicardipinePatients.patienthealthsystemstayid without bringing that CTE into scope or qualifying the column properly. This is a localized column reference error in the WHERE clause and does not reflect a deeper logical or structural misunderstanding of the overall query.",
            "error_type": "Local: table/column reference error"
        },
        "6a23b38247953991624db3b6": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "How much does patient 013-10117 change in anion gap second measured on the last hospital visit compared to the first value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10117' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'anion gap' ORDER BY lab.labresulttime ASC LIMIT 1 OFFSET 1 ) - ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10117' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'anion gap' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "WITH LastHospitalVisit AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '013-10117' AND hospitaldischargetime IS NOT NULL ORDER BY hospitaladmittime DESC LIMIT 1 ), AnionGapMeasurements AS ( SELECT labresult FROM lab WHERE patientunitstayid = (SELECT patientunitstayid FROM LastHospitalVisit) AND labname = 'anion gap' ORDER BY labresulttime LIMIT 2 ) SELECT MAX(labresult) - MIN(labresult) AS anion_gap_change FROM AnionGapMeasurements",
            "gold_answer": "[['-1.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly identifies the last hospital visit and retrieves the first two anion gap measurements, but then uses MAX(labresult) \u2013 MIN(labresult), which calculates an absolute difference rather than the directed change (second minus first). This mistake is confined to the arithmetic expression in the SELECT clause and does not require restructuring joins or subqueries. Therefore, it is a localized calculation error.",
            "error_type": "Local: wrong-aggregation error"
        }
    },
    "deepseek": {
        "969495ca8e36a6df510d7273": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Please list the daily minimum volume of urine that was output by patient 022-10471 on the last hospital visit.",
            "gold_sql": "SELECT MIN(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-10471' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND intakeoutput.celllabel = 'urine' AND intakeoutput.cellpath LIKE '%output%' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT p.uniquepid, MIN(io.cellvaluenumeric) AS daily_min_urine_volume FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '022-10471' AND io.cellpath LIKE '%output (ml)|urine' AND p.hospitaldischargetime IS NOT NULL GROUP BY DATE(io.intakeoutputtime) ORDER BY DATE(io.intakeoutputtime) DESC LIMIT 1;",
            "gold_answer": "[['100.0'], ['200.0'], ['400.0']]",
            "pred_answer": "[['022-10471', '200.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the intended logic in multiple ways: it applies ORDER BY \u2026 DESC LIMIT 1, returning only the last day's minimum instead of all daily minima; it uses an incorrect LIKE pattern for urine output; and it fails to restrict to the patient\u2019s most recent hospital stay properly. These issues span multiple clauses (FROM/WHERE, GROUP BY, ORDER BY/LIMIT) and require restructuring the query beyond a single clause fix. Therefore, this is a global error.",
            "error_type": "Global: flawed query structure"
        }
    },
    "o4-mini": {
        "c86225eed349bcb717e7dc8e": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Among patients diagnosed with agitation - moderate, what are the top four most common lab tests that followed within the same hospital visit?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'agitation - moderate' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH agitation AS ( SELECT p.patienthealthsystemstayid, d.diagnosistime FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'agitation - moderate' ) SELECT l.labname, COUNT(*) AS freq FROM lab l JOIN patient p_l ON l.patientunitstayid = p_l.patientunitstayid JOIN agitation a ON p_l.patienthealthsystemstayid = a.patienthealthsystemstayid AND l.labresulttime > a.diagnosistime GROUP BY l.labname ORDER BY freq DESC LIMIT 4;",
            "gold_answer": "[['anion gap'], ['bedside glucose'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['glucose'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose', '133.0'], ['glucose', '47.0'], ['potassium', '70.0'], ['sodium', '40.0']]",
            "is_correct": false,
            "reasoning": "We compare the ground\u2010truth and predicted SQL. Both queries correctly restrict to \"agitation \u2013 moderate\" diagnoses, join on the same hospital visit (patienthealthsystemstayid), filter labs after the diagnosis time, group by labname, and order by count. The predicted SQL\u2019s overall structure and join logic are sound \u2013 the error lies only in the SELECT/ORDER BY/LIMIT clause. The question and assumptions require returning only the lab names (and using DENSE_RANK to include any ties), but the predicted SQL (1) returns an extra COUNT(*) column (freq) and (2) uses LIMIT 4 instead of a dense\u2010rank filter, thus omitting tied items and exposing the counts in the output. These are localized mistakes in the projection and ranking clause, not fundamental joins or logic flaws. Thus the error is Local.",
            "error_type": "Local: SELECT/projection error"
        },
        "dbb80bce2d56d862effb3fb3": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days has it been since patient 021-10001's hospital admission?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.hospitaladmittime) ) FROM patient WHERE patient.uniquepid = '021-10001' AND patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT CAST(julianday('2100-12-31 23:59:00') - julianday(hospitaladmittime) AS INTEGER) AS days_since_admission FROM patient WHERE uniquepid = '021-10001';",
            "gold_answer": "[['4.513']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the filter patient.hospitaldischargetime IS NULL, so it computes days since the date of any admission rather than the current one. It also casts the difference to an integer, truncating the fractional days. Omitting the discharge-time condition changes the fundamental logic of the query (we no longer restrict to the current admission), which requires restructuring the WHERE clause. This is not a simple syntactic fix but alters the intended semantics across clauses.",
            "error_type": "Global: incorrect WHERE clause"
        }
    },
    "llm2sql": {
        "a46876eb34d469b9a1e86ad1": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "How many patients were prescribed the medicine fentanyl (pf) 50 mcg/1 ml 2 ml syr within 2 months after a diagnosis of acute respiratory distress since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory distress' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'fentanyl (pf) 50 mcg/1 ml 2 ml syr' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT medication.patientunitstayid) FROM diagnosis JOIN medication ON diagnosis.patientunitstayid = medication.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory distress' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') AND medication.drugname = 'fentanyl (pf) 50 mcg/1 ml 2 ml syr' AND datetime(medication.drugstarttime) > diagnosis.diagnosistime AND datetime(medication.drugstarttime) <= datetime(diagnosis.diagnosistime, '+2 months');",
            "gold_answer": "[['42.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL makes several localized mistakes that do not require a full rewrite of the query structure: 1) It counts DISTINCT medication.patientunitstayid instead of DISTINCT patient.uniquepid, so it\u2019s counting stays rather than patients. 2) It never restricts medication.drugstarttime to within one year ago, omitting the datetime(...) >= datetime('2100-12-31 23:59:00','-1 year') filter on the medication side. 3) It joins diagnosis and medication directly on patientunitstayid without involving the patient table, rather than using the two subqueries that separately filter by time. Each of these is a local reference or filter error in a specific clause, not a structural or multi-clause logical flaw.",
            "error_type": "Local: column reference/filter error"
        },
        "a590830e328017841d0ab99c": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Count the number of medicines that patient 017-100989 was prescribed last month.",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100989' ) ) AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT COUNT(DISTINCT drugname) FROM medication WHERE patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '017-100989') AND strftime('%Y-%m', drugstarttime) = '2100-11';",
            "gold_answer": "[['13.0']]",
            "pred_answer": "[['10.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the meaning of the original request. It only looks at a single patientunitstayid instead of all stays for that patient (missing multiple admissions), and it counts DISTINCT drugname rather than counting all prescriptions. These are not minor syntax mistakes but alter the core logic of which records are counted and how, so this is a global error.",
            "error_type": "Global: incorrect aggregation and join logic"
        },
        "274ba7a0a86a8577f1f612d2": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Since 1 year ago, how many patients received drug levels - serum drug levels within 2 months after being diagnosed with drug overdose- general?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'drug overdose- general' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'drug levels - serum drug levels' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.diagnosistime < T2.treatmenttime AND datetime(T2.treatmenttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT diagnosis.patientunitstayid) FROM diagnosis JOIN lab ON diagnosis.patientunitstayid = lab.patientunitstayid WHERE diagnosis.diagnosisname = 'drug overdose- general' AND diagnosis.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') AND lab.labname = 'drug levels - serum' AND lab.labresulttime BETWEEN diagnosis.diagnosistime AND datetime(diagnosis.diagnosistime, '+2 months');",
            "gold_answer": "[['21.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table and lab.labname to capture 'drug levels - serum' events, but the question and ground truth specify using the treatment table for 'drug levels - serum drug levels'. This mismatch in table selection and joins changes the overall logic\u2014lab and treatment are different event sources, resulting in incorrect data associations. Correcting this requires replacing the entire source and join logic, not just fixing a column or alias. Hence, it is a global error.",
            "error_type": "Global: join/table selection error"
        },
        "a81f17dbf22eeeeb8037c6b5": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "When was the first occasion that patient 004-10029 underwent a enteral feeds - oral feeds procedure?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10029' ) ) AND treatment.treatmentname = 'enteral feeds - oral feeds' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '004-10029' AND intakeoutput.cellpath LIKE '%enteral feeds - oral feeds%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1;",
            "gold_answer": "[['2100-09-19 12:57:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the intakeoutput table and filters on intakeoutput.cellpath, whereas the correct query should use the treatment table and filter on treatment.treatmentname. This is not a minor typo or single-clause fix\u2014it fundamentally alters the source of data and the logic of the query, requiring a complete restructuring to reference the proper table and column.",
            "error_type": "Global: incorrect table reference"
        }
    }
}